add core
parent
619a12b303
commit
971e7b6ce2
|
@ -5,6 +5,7 @@ import java.lang.annotation.Retention;
|
|||
import java.lang.annotation.Target;
|
||||
|
||||
/**
|
||||
* 定义类或者字段的抽取规则。<br>
|
||||
* @author code4crafter@gmail.com <br>
|
||||
* @date: 13-8-1 <br>
|
||||
* Time: 下午8:40 <br>
|
||||
|
|
|
@ -5,6 +5,7 @@ import java.lang.annotation.Retention;
|
|||
import java.lang.annotation.Target;
|
||||
|
||||
/**
|
||||
* 定义类或者字段的抽取规则(从url中抽取,只支持正则表达式)。<br>
|
||||
* @author code4crafter@gmail.com <br>
|
||||
* @date: 13-8-1 <br>
|
||||
* Time: 下午8:40 <br>
|
||||
|
|
|
@ -5,6 +5,7 @@ import java.lang.annotation.Retention;
|
|||
import java.lang.annotation.Target;
|
||||
|
||||
/**
|
||||
* 定义辅助爬取的url。<br>
|
||||
* @author code4crafter@gmail.com <br>
|
||||
* @date: 13-8-1 <br>
|
||||
* Time: 下午8:40 <br>
|
||||
|
|
|
@ -5,6 +5,7 @@ import java.lang.annotation.Retention;
|
|||
import java.lang.annotation.Target;
|
||||
|
||||
/**
|
||||
* 定义某个类抽取的范围和来源,sourceRegion可以用xpath语法限定抽取区域。<br>
|
||||
* @author code4crafter@gmail.com <br>
|
||||
* @date: 13-8-1 <br>
|
||||
* Time: 下午8:40 <br>
|
||||
|
|
|
@ -3,7 +3,7 @@ package us.codecraft.webmagic.utils;
|
|||
import java.util.Map;
|
||||
|
||||
/**
|
||||
- * @author yihua.huang@dianping.com
|
||||
+ * @author code4crafter@gmail.com
|
||||
* @date Dec 14, 2012
|
||||
*/
|
||||
public class DoubleKeyMap<K1, K2, V> extends MultiKeyMapBase {
|
||||
|
|
|
@ -1,7 +1,7 @@
|
|||
package us.codecraft.webmagic.utils;
|
||||
|
||||
/**
|
||||
- * @author yihua.huang@dianping.com
|
||||
+ * @author code4crafter@gmail.com
|
||||
* @date Dec 14, 2012
|
||||
*/
|
||||
|
||||
|
|
|
@ -46,7 +46,7 @@ public class News163 implements PagedModel, AfterExtractor {
|
|||
@Override
|
||||
public String getPage() {
|
||||
if (page == null) {
|
||||
- return "0";
|
||||
+ return "1";
|
||||
}
|
||||
return page;
|
||||
}
|
||||
|
|
Loading…
Reference in New Issue