Download crawler - Free Java Code
Description
A simple Java web crawler.
Source Files
The download file crawler-master.zip has the following entries.
.gitignore
.travis.yml
CHANGELOG
LICENSE
README.md
pom.xml
src/main/java/com/soulgalore/crawler/core/Crawler.java
src/main/java/com/soulgalore/crawler/core/CrawlerConfiguration.java
src/main/java/com/soulgalore/crawler/core/CrawlerResult.java
src/main/java/com/soulgalore/crawler/core/HTMLPageResponse.java
src/main/java/com/soulgalore/crawler/core/HTMLPageResponseCallable.java
src/main/java/com/soulgalore/crawler/core/HTMLPageResponseFetcher.java
src/main/java/com/soulgalore/crawler/core/PageURL.java
src/main/java/com/soulgalore/crawler/core/PageURLParser.java
src/main/java/com/soulgalore/crawler/core/assets/AssetFetcher.java
src/main/java/com/soulgalore/crawler/core/assets/AssetResponse.java
src/main/java/com/soulgalore/crawler/core/assets/AssetResponseCallable.java
src/main/java/com/soulgalore/crawler/core/assets/AssetsParser.java
src/main/java/com/soulgalore/crawler/core/assets/AssetsVerificationResult.java
src/main/java/com/soulgalore/crawler/core/assets/AssetsVerifier.java
src/main/java/com/soulgalore/crawler/core/assets/impl/DefaultAssetsParser.java
src/main/java/com/soulgalore/crawler/core/assets/impl/DefaultAssetsVerifier.java
src/main/java/com/soulgalore/crawler/core/assets/impl/HTTPClientAssetFetcher.java
src/main/java/com/soulgalore/crawler/core/impl/AhrefPageURLParser.java
src/main/java/com/soulgalore/crawler/core/impl/DefaultCrawler.java
src/main/java/com/soulgalore/crawler/core/impl/HTTPClientResponseFetcher.java
src/main/java/com/soulgalore/crawler/guice/AbstractPropertiesModule.java
src/main/java/com/soulgalore/crawler/guice/CrawlModule.java
src/main/java/com/soulgalore/crawler/guice/ExecutorServiceProvider.java
src/main/java/com/soulgalore/crawler/guice/HttpClientProvider.java
src/main/java/com/soulgalore/crawler/run/AbstractCrawl.java
src/main/java/com/soulgalore/crawler/run/AbstractRunner.java
src/main/java/com/soulgalore/crawler/run/CrawlAndVerifyAssets.java
src/main/java/com/soulgalore/crawler/run/CrawlToCsv.java
src/main/java/com/soulgalore/crawler/run/CrawlToFile.java
src/main/java/com/soulgalore/crawler/run/CrawlToPlainTxtOnlyMatching.java
src/main/java/com/soulgalore/crawler/run/CrawlToSystemOut.java
src/main/java/com/soulgalore/crawler/util/Auth.java
src/main/java/com/soulgalore/crawler/util/AuthUtil.java
src/main/java/com/soulgalore/crawler/util/HTTPSFaker.java
src/main/java/com/soulgalore/crawler/util/HeaderUtil.java
src/main/java/com/soulgalore/crawler/util/StatusCode.java
src/main/resources/crawler.properties
src/test/java/com/soulgalore/crawler/WhenACrawlerResultIsCreated.java
src/test/java/com/soulgalore/crawler/WhenAPageURLIsCreated.java
src/test/java/com/soulgalore/crawler/WhenAStatusCodeIsChecked.java
src/test/java/com/soulgalore/crawler/core/impl/WhenACrawlIsDone.java
src/test/java/com/soulgalore/crawler/core/impl/WhenAhrefsIsParsedFromResponse.java
src/test/java/com/soulgalore/crawler/run/AbstractRun.java
src/test/java/com/soulgalore/crawler/run/WhenCrawlToPlainTxtRun.java
src/test/java/com/soulgalore/crawler/test/TestFileHelper.java
src/test/java/com/soulgalore/crawler/util/WhenAHeaderIsParsed.java
src/test/java/com/soulgalore/crawler/util/WhenAnAuthObjectIsCreated.java
src/test/resources/crawler/crawler1.html
src/test/resources/crawler/crawler2.html
src/test/resources/crawler/crawler3.html
src/test/resources/crawler/crawler4.html
src/test/resources/crawler/crawler5.html
src/test/resources/crawler/pageToParse.html
src/test/resources/crawler/pageWithMailToLinks.html
Download
Click the following link to download crawler-master.zip.
crawler-master.zip