Download scraper Free Java Code
Description
A simple Java HTML scraper.
Source Files
The downloaded file scraper-master.zip contains the following entries.
.gitignore
pom.xml
src/docs/010-scraper.afc
src/docs/020-project.afc
src/docs/030-tutorial.afc
src/docs/040-templates.afc
src/docs/050-matching.afc
src/docs/060-converting.afc
src/docs/070-examples.afc
src/main/java/br/com/adaptideas/scraper/Html.java
src/main/java/br/com/adaptideas/scraper/MultipleMatchTemplate.java
src/main/java/br/com/adaptideas/scraper/SingleTemplate.java
src/main/java/br/com/adaptideas/scraper/SplitTemplate.java
src/main/java/br/com/adaptideas/scraper/Template.java
src/main/java/br/com/adaptideas/scraper/cleaner/Cleaner.java
src/main/java/br/com/adaptideas/scraper/cleaner/IrrelevantContentTagCleaner.java
src/main/java/br/com/adaptideas/scraper/cleaner/IrrelevantTagCleaner.java
src/main/java/br/com/adaptideas/scraper/cleaner/TagCleaner.java
src/main/java/br/com/adaptideas/scraper/converter/Converter.java
src/main/java/br/com/adaptideas/scraper/converter/DataConverter.java
src/main/java/br/com/adaptideas/scraper/converter/NoOpConverter.java
src/main/java/br/com/adaptideas/scraper/exception/ScraperException.java
src/main/java/br/com/adaptideas/scraper/infra/InputStreamToStringReader.java
src/main/java/br/com/adaptideas/scraper/infra/Tuple2.java
src/main/java/br/com/adaptideas/scraper/matcher/ContentCleaner.java
src/main/java/br/com/adaptideas/scraper/matcher/PatternCreator.java
src/main/java/br/com/adaptideas/scraper/matcher/TemplateMatcher.java
src/main/java/br/com/adaptideas/scraper/matcher/TemplateTag.java
src/main/java/br/com/adaptideas/scraper/matcher/regex/CaptureGroupsRegexCreator.java
src/main/java/br/com/adaptideas/scraper/matcher/regex/EllipsisRegexCreator.java
src/main/java/br/com/adaptideas/scraper/matcher/regex/OrdinaryWordRegexCreator.java
src/main/java/br/com/adaptideas/scraper/matcher/regex/RegexCreator.java
src/main/java/br/com/adaptideas/scraper/tag/Attribute.java
src/main/java/br/com/adaptideas/scraper/tag/BangTag.java
src/main/java/br/com/adaptideas/scraper/tag/CloseTag.java
src/main/java/br/com/adaptideas/scraper/tag/DefaultTagMatcher.java
src/main/java/br/com/adaptideas/scraper/tag/OpenTag.java
src/main/java/br/com/adaptideas/scraper/tag/PatternAttribute.java
src/main/java/br/com/adaptideas/scraper/tag/StringAttribute.java
src/main/java/br/com/adaptideas/scraper/tag/Tag.java
src/main/java/br/com/adaptideas/scraper/tag/TagListMatcher.java
src/main/java/br/com/adaptideas/scraper/tag/TagMatcher.java
src/main/java/br/com/adaptideas/scraper/tag/TagParser.java
src/main/java/br/com/adaptideas/scraper/tag/TagReader.java
src/main/java/br/com/adaptideas/scraper/tag/TagSanitizer.java
src/main/java/br/com/adaptideas/scraper/tag/TagType.java
src/test/java/br/com/adaptideas/scraper/BangTagTest.java
src/test/java/br/com/adaptideas/scraper/CloseTagTest.java
src/test/java/br/com/adaptideas/scraper/HtmlTest.java
src/test/java/br/com/adaptideas/scraper/Item.java
src/test/java/br/com/adaptideas/scraper/MultipleMatchTemplateTest.java
src/test/java/br/com/adaptideas/scraper/OpenTagTest.java
src/test/java/br/com/adaptideas/scraper/ScraperSpecificationTest.java
src/test/java/br/com/adaptideas/scraper/SingleTemplateTest.java
src/test/java/br/com/adaptideas/scraper/SplitTemplateTest.java
src/test/java/br/com/adaptideas/scraper/TagParserTest.java
src/test/java/br/com/adaptideas/scraper/cleaner/IrrelevantContentTagCleanerTest.java
src/test/java/br/com/adaptideas/scraper/cleaner/IrrelevantTagCleanerTest.java
src/test/java/br/com/adaptideas/scraper/converter/DataConverterTest.java
src/test/java/br/com/adaptideas/scraper/infra/InputStreamToStringReaderTest.java
src/test/java/br/com/adaptideas/scraper/matcher/TemplateTagTest.java
src/test/java/br/com/adaptideas/scraper/matcher/regex/CaptureGroupsRegexCreatorTest.java
src/test/java/br/com/adaptideas/scraper/matcher/regex/EllipsisRegexCreatorTest.java
src/test/java/br/com/adaptideas/scraper/matcher/regex/OrdinaryWordRegexCreatorTest.java
src/test/java/br/com/adaptideas/scraper/tag/AttributeTest.java
src/test/java/br/com/adaptideas/scraper/tag/DefaultTagMatcherTest.java
src/test/java/br/com/adaptideas/scraper/tag/PatternAttributeTest.java
src/test/java/br/com/adaptideas/scraper/tag/StringAttributeTest.java
src/test/java/br/com/adaptideas/scraper/tag/TagListMatcherTest.java
src/test/java/br/com/adaptideas/scraper/tag/TagReaderTest.java
src/test/java/br/com/adaptideas/scraper/tag/TagSanitizerTest.java
src/test/java/br/com/adaptideas/scraper/tag/TagTypeTest.java
src/test/resources/log4j.xml
src/tubainaTemplates/html/chapter.ftl
src/tubainaTemplates/html/footer.ftl
src/tubainaTemplates/html/header.ftl
src/tubainaTemplates/html/includes/css/java.css
src/tubainaTemplates/html/includes/css/style.css
src/tubainaTemplates/html/includes/images/body.png
src/tubainaTemplates/html/includes/images/menu.png
src/tubainaTemplates/html/index.ftl
src/tubainaTemplates/html/menu.ftl
src/tubainaTemplates/html/section.ftl
src/tubainaTemplates/html/sectionContent.ftl
src/tubainaTemplates/html/toc.ftl
src/util/index.html
src/util/site-deploy.sh
Download
Click the following link to download scraper-master.zip.
scraper-master.zip