crawler4j-master
code 

Directory: Windows Develop
Platform: Unix_Linux
Size: 194KB
Downloads: 1
Upload time: 2018-03-12 17:39:34
Uploader: Elkalash
Description: Basic crawler controller

File list:
crawler4j-master, 0 , 2017-04-18
crawler4j-master\.gitignore, 1824 , 2017-04-18
crawler4j-master\.idea, 0 , 2017-04-18
crawler4j-master\.idea\.name, 9 , 2017-04-18
crawler4j-master\.idea\codeStyleSettings.xml, 4400 , 2017-04-18
crawler4j-master\.idea\compiler.xml, 643 , 2017-04-18
crawler4j-master\.idea\copyright, 0 , 2017-04-18
crawler4j-master\.idea\copyright\profiles_settings.xml, 74 , 2017-04-18
crawler4j-master\.idea\encodings.xml, 172 , 2017-04-18
crawler4j-master\.idea\inspectionProfiles, 0 , 2017-04-18
crawler4j-master\.idea\inspectionProfiles\Project_Default.xml, 99720 , 2017-04-18
crawler4j-master\.idea\inspectionProfiles\profiles_settings.xml, 235 , 2017-04-18
crawler4j-master\.idea\misc.xml, 10660 , 2017-04-18
crawler4j-master\.idea\modules.xml, 258 , 2017-04-18
crawler4j-master\.idea\sqldialects.xml, 174 , 2017-04-18
crawler4j-master\.idea\vcs.xml, 167 , 2017-04-18
crawler4j-master\.travis.yml, 35 , 2017-04-18
crawler4j-master\CHANGES.txt, 5920 , 2017-04-18
crawler4j-master\LICENSE, 527 , 2017-04-18
crawler4j-master\README.md, 11436 , 2017-04-18
crawler4j-master\checkstyle.xml, 5552 , 2017-04-18
crawler4j-master\pom.xml, 10470 , 2017-04-18
crawler4j-master\src, 0 , 2017-04-18
crawler4j-master\src\main, 0 , 2017-04-18
crawler4j-master\src\main\java, 0 , 2017-04-18
crawler4j-master\src\main\java\edu, 0 , 2017-04-18
crawler4j-master\src\main\java\edu\uci, 0 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics, 0 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j, 0 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\crawler, 0 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\crawler\Configurable.java, 1199 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\crawler\CrawlConfig.java, 18645 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\crawler\CrawlController.java, 20831 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\crawler\Page.java, 7976 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\crawler\WebCrawler.java, 22722 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\crawler\authentication, 0 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\crawler\authentication\AuthInfo.java, 4711 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\crawler\authentication\BasicAuthInfo.java, 1175 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\crawler\authentication\FormAuthInfo.java, 2161 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\crawler\authentication\NtAuthInfo.java, 698 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\crawler\exceptions, 0 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\crawler\exceptions\ContentFetchException.java, 247 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\crawler\exceptions\PageBiggerThanMaxSizeException.java, 537 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\crawler\exceptions\ParseException.java, 246 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\fetcher, 0 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\fetcher\IdleConnectionMonitorThread.java, 1946 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\fetcher\PageFetchResult.java, 3271 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\fetcher\PageFetcher.java, 15547 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\fetcher\SniPoolingHttpClientConnectionManager.java, 2492 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\fetcher\SniSSLConnectionSocketFactory.java, 1831 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\frontier, 0 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\frontier\Counters.java, 4868 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\frontier\DocIDServer.java, 5255 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\frontier\Frontier.java, 7043 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\frontier\InProcessPagesDB.java, 2551 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\frontier\WebURLTupleBinding.java, 1973 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\frontier\WorkQueues.java, 5257 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\parser, 0 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\parser\AllTagMapper.java, 1393 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\parser\BinaryParseData.java, 4691 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\parser\ExtractedUrlAnchorPair.java, 1056 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\parser\HtmlContentHandler.java, 7375 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\parser\HtmlParseData.java, 2114 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\parser\NotAllowedContentException.java, 452 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\parser\ParseData.java, 1065 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\parser\Parser.java, 7141 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\parser\TextParseData.java, 1542 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\robotstxt, 0 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\robotstxt\HostDirectives.java, 5444 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\robotstxt\PathRule.java, 4923 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\robotstxt\RobotstxtConfig.java, 2623 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\robotstxt\RobotstxtParser.java, 4100 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\robotstxt\RobotstxtServer.java, 8096 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\robotstxt\UserAgentDirectives.java, 7619 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\url, 0 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\url\TLDList.java, 3880 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\url\URLCanonicalizer.java, 6587 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\url\UrlResolver.java, 19322 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\url\WebURL.java, 5988 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\util, 0 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\util\IO.java, 1683 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\util\Net.java, 1806 , 2017-04-18
crawler4j-master\src\main\java\edu\uci\ics\crawler4j\util\Util.java, 2681 , 2017-04-18
crawler4j-master\src\main\resources, 0 , 2017-04-18
crawler4j-master\src\main\resources\tld-names.txt, 133718 , 2017-04-18
crawler4j-master\src\test, 0 , 2017-04-18
crawler4j-master\src\test\groovy, 0 , 2017-04-18
crawler4j-master\src\test\groovy\edu, 0 , 2017-04-18
crawler4j-master\src\test\groovy\edu\uci, 0 , 2017-04-18
crawler4j-master\src\test\groovy\edu\uci\ics, 0 , 2017-04-18
crawler4j-master\src\test\groovy\edu\uci\ics\crawler4j, 0 , 2017-04-18
crawler4j-master\src\test\groovy\edu\uci\ics\crawler4j\crawler, 0 , 2017-04-18
crawler4j-master\src\test\groovy\edu\uci\ics\crawler4j\crawler\CrawlerWithJSTest.groovy, 5283 , 2017-04-18
crawler4j-master\src\test\groovy\edu\uci\ics\crawler4j\crawler\NoFollowTest.groovy, 3533 , 2017-04-18
crawler4j-master\src\test\groovy\edu\uci\ics\crawler4j\crawler\NoIndexTest.groovy, 3914 , 2017-04-18
crawler4j-master\src\test\groovy\edu\uci\ics\crawler4j\crawler\RedirectHandlerTest.groovy, 4001 , 2017-04-18
crawler4j-master\src\test\groovy\edu\uci\ics\crawler4j\crawler\WebCrawlerTest.groovy, 4021 , 2017-04-18
crawler4j-master\src\test\java, 0 , 2017-04-18
crawler4j-master\src\test\java\edu, 0 , 2017-04-18
crawler4j-master\src\test\java\edu\uci, 0 , 2017-04-18

Download users:

Related files:

Comment: Add Comment

Favorite users: