update
parent
cc18d863f3
commit
461cd31718
|
@ -9,6 +9,8 @@ import us.codecraft.webmagic.scheduler.RedisScheduler;
|
||||||
import us.codecraft.webmagic.selenium.downloader.SeleniumDownloader;
|
import us.codecraft.webmagic.selenium.downloader.SeleniumDownloader;
|
||||||
|
|
||||||
/**
|
/**
|
||||||
|
* 花瓣网抽取器。<br>
|
||||||
|
* 使用Selenium做页面动态渲染。<br>
|
||||||
* @author yihua.huang@dianping.com <br>
|
* @author yihua.huang@dianping.com <br>
|
||||||
* @date: 13-7-26 <br>
|
* @date: 13-7-26 <br>
|
||||||
* Time: 下午4:08 <br>
|
* Time: 下午4:08 <br>
|
||||||
|
@ -30,7 +32,7 @@ public class HuabanProcessor implements PageProcessor {
|
||||||
@Override
|
@Override
|
||||||
public Site getSite() {
|
public Site getSite() {
|
||||||
if (site == null) {
|
if (site == null) {
|
||||||
site = Site.me().setDomain("huaban.com").addStartUrl("http://huaban.com/").setSleepTime(1000);
|
site = Site.me().setDomain("huaban.com").addStartUrl("http://huaban.com/").setSleepTime(0);
|
||||||
}
|
}
|
||||||
return site;
|
return site;
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in New Issue