|
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
|
|
<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
|
|
|
|
<!-- POM model version followed by the coordinates of this parent project
     (the artifactId is declared separately in this file). -->
<modelVersion>4.0.0</modelVersion>
<groupId>us.codecraft</groupId>
<version>0.7.4</version>
<!-- "pom" packaging: this project aggregates modules and builds no jar of its own. -->
<packaging>pom</packaging>
|
|
|
|
<properties>
    <!-- Java language level handed to the compiler plugin. -->
    <maven.compiler.source>1.8</maven.compiler.source>
    <maven.compiler.target>1.8</maven.compiler.target>

    <!-- Character encoding for sources and for generated reports. -->
    <project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
    <project.reporting.outputEncoding>UTF-8</project.reporting.outputEncoding>

    <!-- Not referenced anywhere in this file; presumably consumed by child modules (TODO confirm). -->
    <spring-version>4.0.0.RELEASE</spring-version>
</properties>
|
|
|
|
<!-- Artifact identity and the human-readable metadata published with the POM. -->
<artifactId>webmagic-parent</artifactId>
<name>webmagic-parent</name>
<description>
    A crawler framework. It covers the whole lifecycle of a crawler: downloading, URL management, content
    extraction and persistence. It simplifies the development of a specific crawler.
</description>
<url>https://github.com/code4craft/webmagic/</url>
|
|
|
|
<!-- People listed as developers of the project. -->
<developers>
    <developer>
        <id>code4craft</id>
        <name>Yihua huang</name>
        <email>code4crafer@gmail.com</email>
    </developer>
    <developer>
        <id>yuany</id>
        <name>Ligang Yao</name>
        <email>ligang.yao@answers.com</email>
    </developer>
</developers>
|
|
|
|
<!-- Source-control coordinates. -->
<scm>
    <!-- Checkout addresses (SSH), kept exactly as before. -->
    <connection>scm:git:git@github.com:code4craft/webmagic.git</connection>
    <developerConnection>scm:git:git@github.com:code4craft/webmagic.git</developerConnection>
    <!-- scm/url is meant to be a browsable web address, not a clone address,
         so it points at the GitHub project page instead of the SSH remote. -->
    <url>https://github.com/code4craft/webmagic</url>
    <!-- Tag name pattern, expanded with the project version. -->
    <tag>WebMagic-${project.version}</tag>
</scm>
|
|
|
|
<!-- License under which the project is distributed. -->
<licenses>
    <license>
        <name>Apache License, Version 2.0</name>
        <url>http://www.apache.org/licenses/LICENSE-2.0</url>
    </license>
</licenses>
|
|
|
|
|
|
|
|
<!-- Sub-projects built by this aggregator. Each entry is a directory relative to this POM;
     all entries are written without a trailing slash for consistency. -->
<modules>
    <module>webmagic-core</module>
    <module>webmagic-extension</module>
    <module>webmagic-scripts</module>
    <module>webmagic-selenium</module>
    <module>webmagic-saxon</module>
    <module>webmagic-samples</module>
</modules>
|
|
|
|
|
|
|
|
<!-- Managed dependency versions (and scopes/exclusions) for the modules of this build.
     Entries are grouped by purpose; the grouping is for readers only. -->
<dependencyManagement>
    <dependencies>

        <!-- Testing -->
        <dependency>
            <groupId>junit</groupId>
            <artifactId>junit</artifactId>
            <version>4.13.1</version>
            <scope>test</scope>
        </dependency>
        <dependency>
            <groupId>org.mockito</groupId>
            <artifactId>mockito-all</artifactId>
            <version>1.10.19</version>
            <scope>test</scope>
        </dependency>
        <dependency>
            <groupId>org.assertj</groupId>
            <artifactId>assertj-core</artifactId>
            <version>3.18.1</version>
            <scope>test</scope>
        </dependency>
        <dependency>
            <groupId>com.github.dreamhead</groupId>
            <artifactId>moco-core</artifactId>
            <version>1.1.0</version>
            <scope>test</scope>
            <!-- slf4j-simple is excluded from moco-core's transitive dependencies. -->
            <exclusions>
                <exclusion>
                    <groupId>org.slf4j</groupId>
                    <artifactId>slf4j-simple</artifactId>
                </exclusion>
            </exclusions>
        </dependency>

        <!-- HTTP client -->
        <dependency>
            <groupId>org.apache.httpcomponents</groupId>
            <artifactId>httpclient</artifactId>
            <version>4.5.13</version>
        </dependency>
        <dependency>
            <groupId>org.apache.httpcomponents</groupId>
            <artifactId>httpcore</artifactId>
            <version>4.4.14</version>
        </dependency>

        <!-- Logging -->
        <dependency>
            <groupId>org.slf4j</groupId>
            <artifactId>slf4j-api</artifactId>
            <version>1.7.30</version>
        </dependency>
        <dependency>
            <groupId>org.slf4j</groupId>
            <artifactId>slf4j-log4j12</artifactId>
            <version>1.7.30</version>
        </dependency>
        <dependency>
            <groupId>log4j</groupId>
            <artifactId>log4j</artifactId>
            <version>1.2.17</version>
        </dependency>

        <!-- Content parsing and extraction -->
        <dependency>
            <groupId>us.codecraft</groupId>
            <artifactId>xsoup</artifactId>
            <version>0.3.2</version>
        </dependency>
        <dependency>
            <groupId>com.jayway.jsonpath</groupId>
            <artifactId>json-path</artifactId>
            <version>2.5.0</version>
        </dependency>
        <dependency>
            <groupId>com.alibaba</groupId>
            <artifactId>fastjson</artifactId>
            <version>1.2.75</version>
        </dependency>
        <dependency>
            <groupId>net.sf.saxon</groupId>
            <artifactId>Saxon-HE</artifactId>
            <version>10.3</version>
        </dependency>
        <dependency>
            <groupId>net.sourceforge.htmlcleaner</groupId>
            <artifactId>htmlcleaner</artifactId>
            <version>2.9</version>
        </dependency>

        <!-- General-purpose utilities -->
        <dependency>
            <groupId>com.google.guava</groupId>
            <artifactId>guava</artifactId>
            <version>30.1-jre</version>
        </dependency>
        <dependency>
            <groupId>org.apache.commons</groupId>
            <artifactId>commons-lang3</artifactId>
            <version>3.11</version>
        </dependency>
        <dependency>
            <groupId>commons-collections</groupId>
            <artifactId>commons-collections</artifactId>
            <version>3.2.2</version>
        </dependency>
        <dependency>
            <groupId>commons-io</groupId>
            <artifactId>commons-io</artifactId>
            <version>2.8.0</version>
        </dependency>
        <dependency>
            <groupId>commons-cli</groupId>
            <artifactId>commons-cli</artifactId>
            <version>1.4</version>
        </dependency>

        <!-- Scripting language runtimes -->
        <!-- NOTE(review): recent groovy-all releases appear to be published with POM packaging;
             confirm that the consuming module resolves this entry as intended. -->
        <dependency>
            <groupId>org.codehaus.groovy</groupId>
            <artifactId>groovy-all</artifactId>
            <version>3.0.7</version>
        </dependency>
        <dependency>
            <groupId>org.jruby</groupId>
            <artifactId>jruby</artifactId>
            <version>9.2.14.0</version>
        </dependency>
        <dependency>
            <groupId>org.python</groupId>
            <artifactId>jython</artifactId>
            <version>2.7.2</version>
        </dependency>

        <!-- Browser automation -->
        <dependency>
            <groupId>org.seleniumhq.selenium</groupId>
            <artifactId>selenium-java</artifactId>
            <version>3.141.59</version>
        </dependency>
        <dependency>
            <groupId>com.github.detro</groupId>
            <artifactId>phantomjsdriver</artifactId>
            <version>1.2.0</version>
        </dependency>

        <!-- Redis client -->
        <dependency>
            <groupId>redis.clients</groupId>
            <artifactId>jedis</artifactId>
            <version>3.6.0</version>
        </dependency>

    </dependencies>
</dependencyManagement>
|
|
|
|
|
|
|
|
<build>
|
|
|
|
<!-- Plugins bound into the build of this project. Plugins declared here without a
     <version> have one listed in the <pluginManagement> section of this file. -->
<plugins>
    <!-- Require Maven 3.0.5 as the minimum version for running this build. -->
    <plugin>
        <groupId>org.apache.maven.plugins</groupId>
        <artifactId>maven-enforcer-plugin</artifactId>
        <version>3.0.0-M3</version>
        <executions>
            <execution>
                <id>enforce-maven</id>
                <goals>
                    <goal>enforce</goal>
                </goals>
                <configuration>
                    <rules>
                        <requireMavenVersion>
                            <version>3.0.5</version>
                        </requireMavenVersion>
                    </rules>
                </configuration>
            </execution>
        </executions>
    </plugin>

    <!-- forkCount 0: tests run without forking a separate JVM. -->
    <plugin>
        <groupId>org.apache.maven.plugins</groupId>
        <artifactId>maven-surefire-plugin</artifactId>
        <configuration>
            <forkCount>0</forkCount>
        </configuration>
    </plugin>

    <plugin>
        <groupId>org.apache.maven.plugins</groupId>
        <artifactId>maven-compiler-plugin</artifactId>
    </plugin>

    <!-- Disabled: copies dependencies into ${project.build.directory}/lib at package time.
    <plugin>
        <groupId>org.apache.maven.plugins</groupId>
        <artifactId>maven-dependency-plugin</artifactId>
        <version>2.8</version>
        <executions>
            <execution>
                <id>copy-dependencies</id>
                <phase>package</phase>
                <goals>
                    <goal>copy-dependencies</goal>
                </goals>
                <configuration>
                    <outputDirectory>${project.build.directory}/lib</outputDirectory>
                    <overWriteReleases>false</overWriteReleases>
                    <overWriteSnapshots>false</overWriteSnapshots>
                    <overWriteIfNewer>true</overWriteIfNewer>
                </configuration>
            </execution>
        </executions>
    </plugin>
    -->

    <plugin>
        <groupId>org.apache.maven.plugins</groupId>
        <artifactId>maven-resources-plugin</artifactId>
    </plugin>

    <!-- log4j.xml is left out of the packaged jar. -->
    <plugin>
        <groupId>org.apache.maven.plugins</groupId>
        <artifactId>maven-jar-plugin</artifactId>
        <configuration>
            <excludes>
                <exclude>log4j.xml</exclude>
            </excludes>
        </configuration>
    </plugin>

    <!-- Build a sources jar alongside the main artifact. -->
    <plugin>
        <groupId>org.apache.maven.plugins</groupId>
        <artifactId>maven-source-plugin</artifactId>
        <version>3.2.1</version>
        <executions>
            <execution>
                <id>attach-sources</id>
                <goals>
                    <goal>jar</goal>
                </goals>
            </execution>
        </executions>
    </plugin>

    <!-- Javadoc: an aggregate run bound to the site phase, plus a javadoc jar. -->
    <plugin>
        <groupId>org.apache.maven.plugins</groupId>
        <artifactId>maven-javadoc-plugin</artifactId>
        <version>3.2.0</version>
        <configuration>
            <encoding>UTF-8</encoding>
            <!-- Title follows the project version instead of repeating it as a literal. -->
            <doctitle>WebMagic ${project.version}</doctitle>
            <locale>en_US</locale>

            <!-- avoid the issue: https://bugs.openjdk.java.net/browse/JDK-8212233 -->
            <detectJavaApiLink>false</detectJavaApiLink>
        </configuration>
        <executions>
            <execution>
                <id>aggregate</id>
                <goals>
                    <goal>aggregate</goal>
                </goals>
                <phase>site</phase>
            </execution>
            <execution>
                <id>attach-javadocs</id>
                <goals>
                    <goal>jar</goal>
                </goals>
            </execution>
        </executions>
    </plugin>

    <plugin>
        <groupId>org.apache.maven.plugins</groupId>
        <artifactId>maven-release-plugin</artifactId>
        <version>3.0.0-M1</version>
    </plugin>

    <plugin>
        <groupId>com.amashchenko.maven.plugin</groupId>
        <artifactId>gitflow-maven-plugin</artifactId>
    </plugin>
</plugins>
|
|
|
|
<!-- Managed plugin versions. Nothing is executed from this section; it supplies the
     version for plugin declarations that omit one. -->
<pluginManagement>
    <plugins>
        <!-- Standard Apache Maven plugins -->
        <plugin>
            <groupId>org.apache.maven.plugins</groupId>
            <artifactId>maven-clean-plugin</artifactId>
            <version>3.1.0</version>
        </plugin>
        <plugin>
            <groupId>org.apache.maven.plugins</groupId>
            <artifactId>maven-resources-plugin</artifactId>
            <version>3.1.0</version>
        </plugin>
        <plugin>
            <groupId>org.apache.maven.plugins</groupId>
            <artifactId>maven-compiler-plugin</artifactId>
            <version>3.8.1</version>
        </plugin>
        <plugin>
            <groupId>org.apache.maven.plugins</groupId>
            <artifactId>maven-surefire-plugin</artifactId>
            <version>3.0.0-M5</version>
        </plugin>
        <plugin>
            <groupId>org.apache.maven.plugins</groupId>
            <artifactId>maven-jar-plugin</artifactId>
            <version>3.2.0</version>
        </plugin>
        <plugin>
            <groupId>org.apache.maven.plugins</groupId>
            <artifactId>maven-install-plugin</artifactId>
            <version>3.0.0-M1</version>
        </plugin>
        <plugin>
            <groupId>org.apache.maven.plugins</groupId>
            <artifactId>maven-deploy-plugin</artifactId>
            <version>3.0.0-M1</version>
        </plugin>
        <plugin>
            <groupId>org.apache.maven.plugins</groupId>
            <artifactId>maven-site-plugin</artifactId>
            <version>3.9.0</version>
        </plugin>

        <!-- Third-party plugin -->
        <plugin>
            <groupId>com.amashchenko.maven.plugin</groupId>
            <artifactId>gitflow-maven-plugin</artifactId>
            <version>1.15.0</version>
        </plugin>
    </plugins>
</pluginManagement>
|
|
|
|
</build>
|
|
|
|
|
|
|
|
<profiles>
    <!-- "release" profile: adds source/javadoc jars, GPG signing and Sonatype staging. -->
    <profile>
        <id>release</id>
        <build>
            <plugins>
                <!-- Source -->
                <!-- No <version> here: the profile previously pinned 2.2.1, which disagreed
                     with the 3.2.1 declared for this plugin in the main <build>. Omitting it
                     keeps release builds on the same plugin version as regular builds. -->
                <plugin>
                    <groupId>org.apache.maven.plugins</groupId>
                    <artifactId>maven-source-plugin</artifactId>
                    <executions>
                        <execution>
                            <phase>package</phase>
                            <goals>
                                <goal>jar-no-fork</goal>
                            </goals>
                        </execution>
                    </executions>
                </plugin>

                <!-- Javadoc -->
                <!-- No <version> here either: the previous pin of 2.9.1 disagreed with the
                     3.2.0 declared for this plugin in the main <build>. -->
                <plugin>
                    <groupId>org.apache.maven.plugins</groupId>
                    <artifactId>maven-javadoc-plugin</artifactId>
                    <executions>
                        <execution>
                            <phase>package</phase>
                            <goals>
                                <goal>jar</goal>
                            </goals>
                        </execution>
                    </executions>
                </plugin>

                <!-- GPG -->
                <plugin>
                    <groupId>org.apache.maven.plugins</groupId>
                    <artifactId>maven-gpg-plugin</artifactId>
                    <version>1.6</version>
                    <executions>
                        <execution>
                            <phase>verify</phase>
                            <goals>
                                <goal>sign</goal>
                            </goals>
                        </execution>
                    </executions>
                </plugin>

                <!-- Sonatype Nexus staging; serverId matches the <repository> id below. -->
                <plugin>
                    <groupId>org.sonatype.plugins</groupId>
                    <artifactId>nexus-staging-maven-plugin</artifactId>
                    <version>1.6.8</version>
                    <extensions>true</extensions>
                    <configuration>
                        <serverId>sonatype-nexus-staging</serverId>
                        <nexusUrl>https://oss.sonatype.org/</nexusUrl>
                        <autoReleaseAfterClose>true</autoReleaseAfterClose>
                    </configuration>
                </plugin>
            </plugins>
        </build>

        <!-- Deployment targets for snapshot and release artifacts. -->
        <distributionManagement>
            <snapshotRepository>
                <id>sonatype-nexus-snapshots</id>
                <url>https://oss.sonatype.org/content/repositories/snapshots/</url>
            </snapshotRepository>
            <repository>
                <id>sonatype-nexus-staging</id>
                <url>https://oss.sonatype.org/service/local/staging/deploy/maven2/</url>
            </repository>
        </distributionManagement>
    </profile>
</profiles>
|
|
|
|
</project>
|