pull/17/head
yihua.huang 12 years ago
parent fd9ae6d93e
commit 5cb45af3a4

@ -8,7 +8,7 @@ import java.util.ArrayList;
import java.util.List; import java.util.List;
/** /**
* <pre> * <pre class="zh">
* Page * Page
* *
* *
@ -19,6 +19,17 @@ import java.util.List;
* {@link #addTargetRequests(java.util.List)} {@link #addTargetRequest(String)} * {@link #addTargetRequests(java.util.List)} {@link #addTargetRequest(String)}
* *
* </pre> * </pre>
* <pre class="en">
* Stores the extracted results and the urls to be crawled.
*
* Main methods:
* {@link #getUrl()} get the url of the current page
* {@link #getHtml()} get the content of the current page
* {@link #putField(String, Object)} save an extracted result
* {@link #getResultItems()} get the extracted results to be used in {@link us.codecraft.webmagic.pipeline.Pipeline}
* {@link #addTargetRequests(java.util.List)} {@link #addTargetRequest(String)} add urls to crawl
*
* </pre>
* *
* @author code4crafter@gmail.com <br> * @author code4crafter@gmail.com <br>
*/ */
@ -44,7 +55,7 @@ public class Page {
} }
/** /**
* *
* *
* @param key key * @param key key
* @param field value * @param field value

@ -5,6 +5,7 @@ import java.util.HashMap;
import java.util.Map; import java.util.Map;
/** /**
* <div class="zh">
* Requesturl<br/> * Requesturl<br/>
* PageProcessorRequest{@link us.codecraft.webmagic.Page#getRequest()} <br/> * PageProcessorRequest{@link us.codecraft.webmagic.Page#getRequest()} <br/>
* <br/> * <br/>
@ -22,6 +23,7 @@ import java.util.Map;
* String linktext = (String)page.getRequest().getExtra()[0]; * String linktext = (String)page.getRequest().getExtra()[0];
* } * }
* </pre> * </pre>
* </div>
* *
* @author code4crafter@gmail.com <br> * @author code4crafter@gmail.com <br>
* Date: 13-4-21 * Date: 13-4-21

@ -1,5 +1,10 @@
<html> <html>
<body> <body>
<div class="en">
Contains the webmagic entry class "Spider" and the entity classes used to pass data around.
</div>
<div class="zh">
包括webmagic入口类Spider和一些数据传递的实体类。 包括webmagic入口类Spider和一些数据传递的实体类。
</div>
</body> </body>
</html> </html>

@ -0,0 +1,18 @@
package us.codecraft.webmagic.model.annotation;
import java.lang.annotation.ElementType;
import java.lang.annotation.Retention;
import java.lang.annotation.Target;
/**
 * Marker annotation with no elements.
 * <p>
 * It is retained at runtime, so it can be read reflectively, and it may be
 * placed on fields and on type declarations.
 * NOTE(review): the extraction semantics attached to this marker are defined
 * by whatever code consumes it, which is not visible here - confirm before relying on it.
 *
 * @author code4crafter@gmail.com <br>
 * Date: 13-8-16 <br>
 * Time: 11:09 <br>
 */
@Target(value = {ElementType.FIELD, ElementType.TYPE})
@Retention(value = java.lang.annotation.RetentionPolicy.RUNTIME)
public @interface ComboExtract {
    // Intentionally empty: presence of the annotation is the only information it carries.
}
Loading…
Cancel
Save