文件名称:crawler4j-3.5-src
- 所属分类:
- JSP源码/Java
- 资源属性:
- [Java] [源码]
- 上传时间:
- 2017-07-21
- 文件大小:
- 109kb
- 下载次数:
- 0次
- 提 供 者:
- 记不住***
- 相关链接:
- 无
- 下载说明:
- 别用迅雷下载,失败请重下,重下不扣分!
介绍说明--下载内容均来自于网络,请自行研究使用
一款不错的用于Java语言的爬虫框架,编程简单方便,编程人员不需具备较好的功底也能轻松使用(A good crawler framework for the Java language; programming with it is simple and convenient, and it is easy to use even for programmers without a strong foundation)
(系统自动生成,下载前可以参看下载内容)
下载文件列表
crawler4j-e14a29640939\.project
crawler4j-e14a29640939\pom.xml
crawler4j-e14a29640939\.gitignore
crawler4j-e14a29640939\.classpath
crawler4j-e14a29640939\src\main\resources\tld-names.txt
crawler4j-e14a29640939\src\main\resources\log4j.properties
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\crawler\WebCrawler.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\crawler\CrawlConfig.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\crawler\Configurable.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\crawler\Page.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\crawler\CrawlController.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\fetcher\CustomFetchStatus.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\fetcher\IdleConnectionMonitorThread.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\fetcher\PageFetchResult.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\fetcher\PageFetcher.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\frontier\DocIDServer.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\frontier\InProcessPagesDB.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\frontier\WebURLTupleBinding.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\frontier\Frontier.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\frontier\Counters.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\frontier\WorkQueues.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\ParseData.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\ExtractedUrlAnchorPair.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\HtmlContentHandler.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\BinaryParseData.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\HtmlParseData.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\Parser.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\TextParseData.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\robotstxt\HostDirectives.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\robotstxt\RobotstxtParser.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\robotstxt\RobotstxtConfig.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\robotstxt\RobotstxtServer.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\robotstxt\RuleSet.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\url\URLCanonicalizer.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\url\UrlResolver.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\url\TLDList.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\url\WebURL.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\util\IO.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\util\Util.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\tests\URLCanonicalizerTest.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\tests\TLDListTest.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\basic\BasicCrawlController.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\basic\BasicCrawler.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\imagecrawler\ImageCrawlController.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\imagecrawler\Cryptography.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\imagecrawler\ImageCrawler.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\localdata\Downloader.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\localdata\CrawlStat.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\localdata\LocalDataCollectorController.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\localdata\LocalDataCollectorCrawler.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\multiple\MultipleCrawlerController.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\multiple\BasicCrawler.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\shutdown\BasicCrawler.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\shutdown\ControllerWithShutdown.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\statushandler\StatusHandlerCrawlController.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\statushandler\StatusHandlerCrawler.java
crawler4j-e14a29640939\pom.xml
crawler4j-e14a29640939\.gitignore
crawler4j-e14a29640939\.classpath
crawler4j-e14a29640939\src\main\resources\tld-names.txt
crawler4j-e14a29640939\src\main\resources\log4j.properties
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\crawler\WebCrawler.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\crawler\CrawlConfig.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\crawler\Configurable.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\crawler\Page.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\crawler\CrawlController.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\fetcher\CustomFetchStatus.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\fetcher\IdleConnectionMonitorThread.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\fetcher\PageFetchResult.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\fetcher\PageFetcher.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\frontier\DocIDServer.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\frontier\InProcessPagesDB.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\frontier\WebURLTupleBinding.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\frontier\Frontier.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\frontier\Counters.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\frontier\WorkQueues.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\ParseData.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\ExtractedUrlAnchorPair.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\HtmlContentHandler.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\BinaryParseData.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\HtmlParseData.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\Parser.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\parser\TextParseData.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\robotstxt\HostDirectives.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\robotstxt\RobotstxtParser.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\robotstxt\RobotstxtConfig.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\robotstxt\RobotstxtServer.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\robotstxt\RuleSet.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\url\URLCanonicalizer.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\url\UrlResolver.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\url\TLDList.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\url\WebURL.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\util\IO.java
crawler4j-e14a29640939\src\main\java\edu\uci\ics\crawler4j\util\Util.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\tests\URLCanonicalizerTest.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\tests\TLDListTest.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\basic\BasicCrawlController.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\basic\BasicCrawler.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\imagecrawler\ImageCrawlController.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\imagecrawler\Cryptography.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\imagecrawler\ImageCrawler.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\localdata\Downloader.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\localdata\CrawlStat.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\localdata\LocalDataCollectorController.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\localdata\LocalDataCollectorCrawler.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\multiple\MultipleCrawlerController.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\multiple\BasicCrawler.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\shutdown\BasicCrawler.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\shutdown\ControllerWithShutdown.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\statushandler\StatusHandlerCrawlController.java
crawler4j-e14a29640939\src\test\java\edu\uci\ics\crawler4j\examples\statushandler\StatusHandlerCrawler.java