Description: A good crawler framework for the Java language. Programming with it is simple and convenient, and it is easy to use even for programmers without a strong foundation.
To Search:
File list (Check if you may need any files):
crawler4j-e14a29640939\.project
crawler4j-e14a29640939\pom.xml
crawler4j-e14a29640939\.gitignore
crawler4j-e14a29640939\.classpath
crawler4j-e14a29640939\src\main\resources\tld-names.txt
crawler4j-e14a29640939\src\main\resources\log4j.properties
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\crawler\WebCrawler.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\crawler\CrawlConfig.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\crawler\Configurable.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\crawler\Page.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\crawler\CrawlController.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\fetcher\CustomFetchStatus.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\fetcher\IdleConnectionMonitorThread.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\fetcher\PageFetchResult.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\fetcher\PageFetcher.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\frontier\DocIDServer.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\frontier\InProcessPagesDB.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\frontier\WebURLTupleBinding.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\frontier\Frontier.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\frontier\Counters.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\frontier\WorkQueues.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\ParseData.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\ExtractedUrlAnchorPair.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\HtmlContentHandler.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\BinaryParseData.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\HtmlParseData.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\Parser.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\TextParseData.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\robotstxt\HostDirectives.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\robotstxt\RobotstxtParser.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\robotstxt\RobotstxtConfig.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\robotstxt\RobotstxtServer.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\robotstxt\RuleSet.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\url\URLCanonicalizer.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\url\UrlResolver.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\url\TLDList.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\url\WebURL.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\util\IO.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\util\Util.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\tests\URLCanonicalizerTest.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\tests\TLDListTest.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\basic\BasicCrawlController.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\basic\BasicCrawler.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\imagecrawler\ImageCrawlController.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\imagecrawler\Cryptography.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\imagecrawler\ImageCrawler.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\localdata\Downloader.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\localdata\CrawlStat.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\localdata\LocalDataCollectorController.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\localdata\LocalDataCollectorCrawler.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\multiple\MultipleCrawlerController.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\multiple\BasicCrawler.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\shutdown\BasicCrawler.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\shutdown\ControllerWithShutdown.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\statushandler\StatusHandlerCrawlController.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\statushandler\StatusHandlerCrawler.java