add scripts

master
yihua.huang 2013-11-12 11:42:42 +08:00
parent 4cd3e1d871
commit f1d5e297bf
2 changed files with 16 additions and 3 deletions

View File

@ -1,6 +1,7 @@
package us.codecraft.webmagic.scripts;
import org.apache.commons.io.IOUtils;
import sun.org.mozilla.javascript.internal.NativeObject;
import us.codecraft.webmagic.Page;
import us.codecraft.webmagic.Site;
import us.codecraft.webmagic.processor.PageProcessor;
@ -11,6 +12,7 @@ import javax.script.ScriptEngineManager;
import javax.script.ScriptException;
import java.io.IOException;
import java.io.InputStream;
import java.util.Map;
/**
* @author code4crafter@gmail.com
@ -51,6 +53,19 @@ public class ScriptProcessor implements PageProcessor {
context.setAttribute("config", site, ScriptContext.ENGINE_SCOPE);
try {
engine.eval(defines + "\n" + script, context);
switch (language) {
case JavaScript:
NativeObject o = (NativeObject) engine.get("result");
if (o != null) {
for (Map.Entry<Object, Object> objectObjectEntry : o.entrySet()) {
page.getResultItems().put(objectObjectEntry.getKey().toString(), objectObjectEntry.getValue());
}
}
break;
case JRuby:
Object o1 = engine.get("result");
break;
}
} catch (ScriptException e) {
e.printStackTrace();
}

View File

@ -1,5 +1,3 @@
title = css "div.BlogTitle h1"
content = css "div.BlogContent"
urls "http://my\\.oschina\\.net/flashsword/blog/\\d+"
puts title
puts content