org.sonatype.oss oss-parent 7 us.codecraft 0.5.0-SNAPSHOT 4.0.0 pom UTF-8 UTF-8 4.0.0.RELEASE webmagic-parent webmagic-parent A crawler framework. It covers the whole lifecycle of a crawler: downloading, URL management, content extraction and persistence. It can simplify the development of a specific crawler. https://github.com/code4craft/webmagic/ code4craft Yihua huang code4crafer@gmail.com yuany Ligang Yao ligang.yao@answers.com scm:git:git@github.com:code4craft/webmagic.git scm:git:git@github.com:code4craft/webmagic.git git@github.com:code4craft/webmagic.git HEAD Apache License, Version 2.0 http://www.apache.org/licenses/LICENSE-2.0 webmagic-core webmagic-extension/ webmagic-scripts/ webmagic-selenium webmagic-saxon webmagic-samples webmagic-avalon junit junit 4.11 test org.apache.httpcomponents httpclient 4.3.3 com.google.guava guava 15.0 org.slf4j slf4j-api 1.7.6 org.slf4j slf4j-log4j12 1.7.6 us.codecraft xsoup 0.2.2 com.alibaba fastjson 1.1.37 log4j log4j 1.2.17 org.assertj assertj-core 1.5.0 org.apache.commons commons-lang3 3.1 commons-collections commons-collections 3.2.1 org.apache.commons commons-io 1.3.2 org.jsoup jsoup 1.7.2 org.mockito mockito-all 1.9.5 test org.apache.maven.plugins maven-surefire-plugin pertest -Xms1024m -Xmx1024m -Xss1m org.apache.maven.plugins maven-compiler-plugin 3.1 1.6 1.6 UTF-8 org.apache.maven.plugins maven-dependency-plugin 2.8 copy-dependencies package copy-dependencies ${project.build.directory}/lib false false true org.apache.maven.plugins maven-resources-plugin 2.6 UTF-8 org.apache.maven.plugins maven-jar-plugin log4j.xml org.apache.maven.plugins maven-source-plugin 2.2.1 attach-sources jar org.apache.maven.plugins maven-javadoc-plugin 2.9.1 UTF-8 attach-javadocs jar org.apache.maven.plugins maven-release-plugin 2.4.1 release-sign-artifacts performRelease true org.apache.maven.plugins maven-gpg-plugin 1.1 sign-artifacts verify sign