From fb0797b65c2e78b1cfe072685cdee873ff931746 Mon Sep 17 00:00:00 2001 From: "yihua.huang" Date: Tue, 18 Jun 2013 22:13:40 +0800 Subject: [PATCH] update docs --- .../main/java/us/codecraft/webmagic/Page.java | 18 ++++++++++++++---- .../java/us/codecraft/webmagic/Request.java | 2 +- .../main/java/us/codecraft/webmagic/Site.java | 2 +- .../java/us/codecraft/webmagic/Spider.java | 2 +- .../main/java/us/codecraft/webmagic/Task.java | 2 +- .../webmagic/downloader/Downloader.java | 4 ++-- .../downloader/HttpClientDownloader.java | 2 +- .../webmagic/downloader/HttpClientPool.java | 2 +- .../webmagic/pipeline/ConsolePipeline.java | 2 +- .../webmagic/pipeline/FilePipeline.java | 2 +- .../codecraft/webmagic/pipeline/Pipeline.java | 2 +- .../webmagic/processor/PageProcessor.java | 2 +- .../processor/SimplePageProcessor.java | 2 +- .../schedular/FileCacheQueueSchedular.java | 2 +- .../webmagic/schedular/QueueSchedular.java | 2 +- .../webmagic/schedular/Schedular.java | 2 +- .../us/codecraft/webmagic/selector/Html.java | 2 +- .../codecraft/webmagic/selector/PlainText.java | 2 +- .../webmagic/selector/RegexResult.java | 2 +- .../webmagic/selector/RegexSelector.java | 2 +- .../webmagic/selector/ReplaceSelector.java | 2 +- .../webmagic/selector/Selectable.java | 2 +- .../codecraft/webmagic/selector/Selector.java | 2 +- .../webmagic/selector/SelectorFactory.java | 2 +- .../selector/SmartContentSelector.java | 2 +- .../webmagic/selector/XpathSelector.java | 2 +- .../us/codecraft/webmagic/utils/UrlUtils.java | 2 +- .../java/us/codecraft/webmagic/HtmlTest.java | 2 +- .../webmagic/selector/RegexSelectorTest.java | 2 +- .../webmagic/selector/XpathSelectorTest.java | 2 +- .../codecraft/webmagic/utils/UrlUtilsTest.java | 2 +- .../webmagic/pipeline/FreemarkerPipeline.java | 2 +- .../webmagic/FreemarkerPipelineTest.java | 2 +- .../samples/DiandianBlogProcessor.java | 2 +- .../webmagic/samples/DianpingProcessor.java | 2 +- .../webmagic/samples/DiaoyuwengProcessor.java | 2 +- 
.../webmagic/samples/F58PageProcesser.java | 2 +- .../webmagic/samples/HuxiuProcessor.java | 2 +- .../webmagic/samples/KaichibaProcessor.java | 2 +- .../webmagic/samples/MeicanProcessor.java | 2 +- .../webmagic/samples/NjuBBSProcessor.java | 2 +- .../samples/OschinaBlogPageProcesser.java | 2 +- .../webmagic/samples/OschinaPageProcesser.java | 2 +- .../webmagic/samples/QzoneBlogProcessor.java | 2 +- .../webmagic/samples/SinaBlogProcesser.java | 2 +- .../webmagic/samples/TianyaPageProcesser.java | 2 +- .../java/us/codecraft/webmagic/SpiderTest.java | 2 +- .../processor/DiandianProcessorTest.java | 2 +- .../processor/DiaoyuwengProcessorTest.java | 2 +- .../processor/SinablogProcessorTest.java | 2 +- 50 files changed, 64 insertions(+), 54 deletions(-) diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/Page.java b/webmagic-core/src/main/java/us/codecraft/webmagic/Page.java index eee1a8a..ec9f959 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/Page.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/Page.java @@ -10,10 +10,16 @@ import java.util.Map; import java.util.concurrent.ConcurrentHashMap; /** - * Page保存了抓取的结果,并可定义下一次抓取的链接内容。 - * Author: code4crafter@gmail.com - * Date: 13-4-21 - * Time: 上午11:22 + *
+ *<pre>Page保存了上一次抓取的结果,并可定义待抓取的链接内容。
+ *
+ *     主要方法:
+ *     {@link #getUrl()} 获取页面的Url
+ *     {@link #getHtml()}  获取页面的html内容
+ *     {@link #addTargetRequests(java.util.List)} {@link #addTargetRequest(String)} 添加待抓取的链接
+ *
+ * </pre>
+ * @author code4crafter@gmail.com
*/ public class Page { @@ -34,6 +40,10 @@ public class Page { public Page() { } + /** + * + * @return fields + */ public Map getFields() { return fields; } diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/Request.java b/webmagic-core/src/main/java/us/codecraft/webmagic/Request.java index ecb8b4e..37ede0d 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/Request.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/Request.java @@ -17,7 +17,7 @@ package us.codecraft.webmagic; * String linktext = (String)page.getRequest().getExtra()[0]; * } * - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 上午11:37 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/Site.java b/webmagic-core/src/main/java/us/codecraft/webmagic/Site.java index a4d88d8..5c208dd 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/Site.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/Site.java @@ -4,7 +4,7 @@ import java.util.*; /** * Site定义一个待抓取的站点的各种信息。 - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午12:13 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/Spider.java b/webmagic-core/src/main/java/us/codecraft/webmagic/Spider.java index 6464d61..67e9c94 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/Spider.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/Spider.java @@ -14,7 +14,7 @@ import java.util.ArrayList; import java.util.List; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 上午6:53 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/Task.java b/webmagic-core/src/main/java/us/codecraft/webmagic/Task.java index 0eaf6c9..2aab74a 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/Task.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/Task.java @@ -1,7 +1,7 @@ package us.codecraft.webmagic; /** - * Author: code4crafer@gmail.com + * @author code4crafter@gmail.com
* Date: 13-6-18 * Time: 下午2:57 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/downloader/Downloader.java b/webmagic-core/src/main/java/us/codecraft/webmagic/downloader/Downloader.java index f276fde..e3ecff8 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/downloader/Downloader.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/downloader/Downloader.java @@ -6,7 +6,7 @@ import us.codecraft.webmagic.Site; /** * Downloader是webmagic下载页面的接口。webmagic默认使用了HttpComponent作为下载器,一般情况,你无需自己实现这个接口。 - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午12:14 */ @@ -17,7 +17,7 @@ public interface Downloader { * * @param request * @param site - * @return + * @return page */ public Page download(Request request, Site site); } diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/downloader/HttpClientDownloader.java b/webmagic-core/src/main/java/us/codecraft/webmagic/downloader/HttpClientDownloader.java index 2eb55c0..4332fa3 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/downloader/HttpClientDownloader.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/downloader/HttpClientDownloader.java @@ -14,7 +14,7 @@ import us.codecraft.webmagic.utils.UrlUtils; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午12:15 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/downloader/HttpClientPool.java b/webmagic-core/src/main/java/us/codecraft/webmagic/downloader/HttpClientPool.java index 891ff18..4e57e16 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/downloader/HttpClientPool.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/downloader/HttpClientPool.java @@ -18,7 +18,7 @@ import us.codecraft.webmagic.Site; import java.util.Map; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午12:29 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/pipeline/ConsolePipeline.java b/webmagic-core/src/main/java/us/codecraft/webmagic/pipeline/ConsolePipeline.java index 7b93876..866db92 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/pipeline/ConsolePipeline.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/pipeline/ConsolePipeline.java @@ -7,7 +7,7 @@ import us.codecraft.webmagic.selector.Selectable; import java.util.Map; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午1:45 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/pipeline/FilePipeline.java b/webmagic-core/src/main/java/us/codecraft/webmagic/pipeline/FilePipeline.java index 2311a75..c7cd9c5 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/pipeline/FilePipeline.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/pipeline/FilePipeline.java @@ -12,7 +12,7 @@ import java.io.PrintWriter; import java.util.Map; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午6:28 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/pipeline/Pipeline.java b/webmagic-core/src/main/java/us/codecraft/webmagic/pipeline/Pipeline.java index b2b51e0..1be447c 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/pipeline/Pipeline.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/pipeline/Pipeline.java @@ -4,7 +4,7 @@ import us.codecraft.webmagic.Page; import us.codecraft.webmagic.Task; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午1:39 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/processor/PageProcessor.java b/webmagic-core/src/main/java/us/codecraft/webmagic/processor/PageProcessor.java index 9820059..c36ae98 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/processor/PageProcessor.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/processor/PageProcessor.java @@ -4,7 +4,7 @@ import us.codecraft.webmagic.Page; import us.codecraft.webmagic.Site; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 上午11:42 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/processor/SimplePageProcessor.java b/webmagic-core/src/main/java/us/codecraft/webmagic/processor/SimplePageProcessor.java index 9f4eed3..3ffc9a3 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/processor/SimplePageProcessor.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/processor/SimplePageProcessor.java @@ -7,7 +7,7 @@ import us.codecraft.webmagic.utils.UrlUtils; import java.util.List; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-22 * Time: 下午9:15 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/schedular/FileCacheQueueSchedular.java b/webmagic-core/src/main/java/us/codecraft/webmagic/schedular/FileCacheQueueSchedular.java index 882f498..0a93e52 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/schedular/FileCacheQueueSchedular.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/schedular/FileCacheQueueSchedular.java @@ -16,7 +16,7 @@ import java.util.concurrent.atomic.AtomicBoolean; import java.util.concurrent.atomic.AtomicInteger; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午1:13 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/schedular/QueueSchedular.java b/webmagic-core/src/main/java/us/codecraft/webmagic/schedular/QueueSchedular.java index 8c3da3b..20576fc 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/schedular/QueueSchedular.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/schedular/QueueSchedular.java @@ -10,7 +10,7 @@ import java.util.concurrent.BlockingQueue; import java.util.concurrent.LinkedBlockingQueue; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午1:13 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/schedular/Schedular.java b/webmagic-core/src/main/java/us/codecraft/webmagic/schedular/Schedular.java index 8e4edb4..8df7760 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/schedular/Schedular.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/schedular/Schedular.java @@ -4,7 +4,7 @@ import us.codecraft.webmagic.Request; import us.codecraft.webmagic.Task; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午1:12 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/Html.java b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/Html.java index 22bf73d..3b3c80a 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/Html.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/Html.java @@ -4,7 +4,7 @@ import java.util.ArrayList; import java.util.List; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 上午7:54 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/PlainText.java b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/PlainText.java index 1d7a41e..a11c9a2 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/PlainText.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/PlainText.java @@ -6,7 +6,7 @@ import java.util.ArrayList; import java.util.List; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 上午7:54 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/RegexResult.java b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/RegexResult.java index 06c00dd..9f4e2f0 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/RegexResult.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/RegexResult.java @@ -1,7 +1,7 @@ package us.codecraft.webmagic.selector; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 上午7:39 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/RegexSelector.java b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/RegexSelector.java index 3b98718..49fbffd 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/RegexSelector.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/RegexSelector.java @@ -9,7 +9,7 @@ import java.util.regex.Pattern; import java.util.regex.PatternSyntaxException; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 上午7:09 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/ReplaceSelector.java b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/ReplaceSelector.java index e240f08..1ce7c4d 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/ReplaceSelector.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/ReplaceSelector.java @@ -6,7 +6,7 @@ import java.util.regex.Pattern; import java.util.regex.PatternSyntaxException; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 上午7:09 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/Selectable.java b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/Selectable.java index f02cbc4..921e6c3 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/Selectable.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/Selectable.java @@ -3,7 +3,7 @@ package us.codecraft.webmagic.selector; import java.util.List; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-20 * Time: 下午7:51 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/Selector.java b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/Selector.java index 3e1b056..35632b3 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/Selector.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/Selector.java @@ -3,7 +3,7 @@ package us.codecraft.webmagic.selector; import java.util.List; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-20 * Time: 下午8:02 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/SelectorFactory.java b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/SelectorFactory.java index 633cb4a..3c87ac9 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/SelectorFactory.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/SelectorFactory.java @@ -7,7 +7,7 @@ import java.util.Map; import java.util.concurrent.ConcurrentHashMap; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 上午7:56 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/SmartContentSelector.java b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/SmartContentSelector.java index 919a795..8974897 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/SmartContentSelector.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/SmartContentSelector.java @@ -10,7 +10,7 @@ import java.util.concurrent.atomic.AtomicInteger; /** * readability算法,基础是找到所有p标签的父节点 * 写的比较乱,最终效果还在尝试中 - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午4:42 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/XpathSelector.java b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/XpathSelector.java index 991f926..c2b408e 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/selector/XpathSelector.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/selector/XpathSelector.java @@ -6,7 +6,7 @@ import java.util.ArrayList; import java.util.List; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 上午9:39 */ diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/utils/UrlUtils.java b/webmagic-core/src/main/java/us/codecraft/webmagic/utils/UrlUtils.java index fd26499..74e486c 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/utils/UrlUtils.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/utils/UrlUtils.java @@ -6,7 +6,7 @@ import java.util.regex.Matcher; import java.util.regex.Pattern; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午1:52 */ diff --git a/webmagic-core/src/test/java/us/codecraft/webmagic/HtmlTest.java b/webmagic-core/src/test/java/us/codecraft/webmagic/HtmlTest.java index 0f8c061..6dacc98 100644 --- a/webmagic-core/src/test/java/us/codecraft/webmagic/HtmlTest.java +++ b/webmagic-core/src/test/java/us/codecraft/webmagic/HtmlTest.java @@ -5,7 +5,7 @@ import org.junit.Test; import us.codecraft.webmagic.selector.Html; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 上午8:42 */ diff --git a/webmagic-core/src/test/java/us/codecraft/webmagic/selector/RegexSelectorTest.java b/webmagic-core/src/test/java/us/codecraft/webmagic/selector/RegexSelectorTest.java index 3b80f92..849a4d6 100644 --- a/webmagic-core/src/test/java/us/codecraft/webmagic/selector/RegexSelectorTest.java +++ b/webmagic-core/src/test/java/us/codecraft/webmagic/selector/RegexSelectorTest.java @@ -4,7 +4,7 @@ import junit.framework.Assert; import org.junit.Test; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 上午7:13 */ diff --git a/webmagic-core/src/test/java/us/codecraft/webmagic/selector/XpathSelectorTest.java b/webmagic-core/src/test/java/us/codecraft/webmagic/selector/XpathSelectorTest.java index 239630a..8ee8885 100644 --- a/webmagic-core/src/test/java/us/codecraft/webmagic/selector/XpathSelectorTest.java +++ b/webmagic-core/src/test/java/us/codecraft/webmagic/selector/XpathSelectorTest.java @@ -4,7 +4,7 @@ import org.junit.Assert; import org.junit.Test; /** - * Author: code4crafter@gmail.com Date: 13-4-21 Time: 上午10:06 + * @author code4crafter@gmail.com
Date: 13-4-21 Time: 上午10:06 */ public class XpathSelectorTest { diff --git a/webmagic-core/src/test/java/us/codecraft/webmagic/utils/UrlUtilsTest.java b/webmagic-core/src/test/java/us/codecraft/webmagic/utils/UrlUtilsTest.java index 36361bf..4cfdc04 100644 --- a/webmagic-core/src/test/java/us/codecraft/webmagic/utils/UrlUtilsTest.java +++ b/webmagic-core/src/test/java/us/codecraft/webmagic/utils/UrlUtilsTest.java @@ -4,7 +4,7 @@ import org.junit.Assert; import org.junit.Test; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午2:22 */ diff --git a/webmagic-plugin/src/main/java/us/codecraft/webmagic/pipeline/FreemarkerPipeline.java b/webmagic-plugin/src/main/java/us/codecraft/webmagic/pipeline/FreemarkerPipeline.java index 218276d..f512f26 100644 --- a/webmagic-plugin/src/main/java/us/codecraft/webmagic/pipeline/FreemarkerPipeline.java +++ b/webmagic-plugin/src/main/java/us/codecraft/webmagic/pipeline/FreemarkerPipeline.java @@ -13,7 +13,7 @@ import java.io.IOException; import java.io.PrintWriter; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-6-8 * Time: 下午9:00 */ diff --git a/webmagic-plugin/src/test/java/us/codecraft/webmagic/FreemarkerPipelineTest.java b/webmagic-plugin/src/test/java/us/codecraft/webmagic/FreemarkerPipelineTest.java index 9e6b995..68ff904 100644 --- a/webmagic-plugin/src/test/java/us/codecraft/webmagic/FreemarkerPipelineTest.java +++ b/webmagic-plugin/src/test/java/us/codecraft/webmagic/FreemarkerPipelineTest.java @@ -6,7 +6,7 @@ import us.codecraft.webmagic.pipeline.FreemarkerPipeline; import java.io.IOException; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-6-9 * Time: 上午7:14 */ diff --git a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/DiandianBlogProcessor.java b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/DiandianBlogProcessor.java index a9351a1..a5b355c 100644 --- a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/DiandianBlogProcessor.java +++ b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/DiandianBlogProcessor.java @@ -7,7 +7,7 @@ import us.codecraft.webmagic.processor.PageProcessor; import java.util.List; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午8:08 */ diff --git a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/DianpingProcessor.java b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/DianpingProcessor.java index 63aa0f0..2f28e6a 100644 --- a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/DianpingProcessor.java +++ b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/DianpingProcessor.java @@ -8,7 +8,7 @@ import us.codecraft.webmagic.processor.PageProcessor; import java.util.List; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午8:08 */ diff --git a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/DiaoyuwengProcessor.java b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/DiaoyuwengProcessor.java index 8d64bbc..f5032ff 100644 --- a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/DiaoyuwengProcessor.java +++ b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/DiaoyuwengProcessor.java @@ -8,7 +8,7 @@ import us.codecraft.webmagic.selector.PlainText; import java.util.List; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午8:08 */ diff --git a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/F58PageProcesser.java b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/F58PageProcesser.java index 82db2dd..385e3f2 100644 --- a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/F58PageProcesser.java +++ b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/F58PageProcesser.java @@ -7,7 +7,7 @@ import us.codecraft.webmagic.processor.PageProcessor; import java.util.List; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午1:48 */ diff --git a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/HuxiuProcessor.java b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/HuxiuProcessor.java index 36f6946..1fa0b7b 100644 --- a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/HuxiuProcessor.java +++ b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/HuxiuProcessor.java @@ -7,7 +7,7 @@ import us.codecraft.webmagic.processor.PageProcessor; import java.util.List; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午8:08 */ diff --git a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/KaichibaProcessor.java b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/KaichibaProcessor.java index 11f0462..8ea4afe 100644 --- a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/KaichibaProcessor.java +++ b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/KaichibaProcessor.java @@ -5,7 +5,7 @@ import us.codecraft.webmagic.Site; import us.codecraft.webmagic.processor.PageProcessor; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-5-20 * Time: 下午5:31 */ diff --git a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/MeicanProcessor.java b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/MeicanProcessor.java index aaeca8f..98fe8de 100644 --- a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/MeicanProcessor.java +++ b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/MeicanProcessor.java @@ -7,7 +7,7 @@ import us.codecraft.webmagic.processor.PageProcessor; import java.util.List; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-5-20 * Time: 下午5:31 */ diff --git a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/NjuBBSProcessor.java b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/NjuBBSProcessor.java index 58e19c4..e4cc33c 100644 --- a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/NjuBBSProcessor.java +++ b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/NjuBBSProcessor.java @@ -7,7 +7,7 @@ import us.codecraft.webmagic.processor.PageProcessor; import java.util.List; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午8:08 */ diff --git a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/OschinaBlogPageProcesser.java b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/OschinaBlogPageProcesser.java index bcc2d6e..0d6354d 100644 --- a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/OschinaBlogPageProcesser.java +++ b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/OschinaBlogPageProcesser.java @@ -7,7 +7,7 @@ import us.codecraft.webmagic.processor.PageProcessor; import java.util.List; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午1:48 */ diff --git a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/OschinaPageProcesser.java b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/OschinaPageProcesser.java index d85ca81..b708ec5 100644 --- a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/OschinaPageProcesser.java +++ b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/OschinaPageProcesser.java @@ -7,7 +7,7 @@ import us.codecraft.webmagic.processor.PageProcessor; import java.util.List; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午1:48 */ diff --git a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/QzoneBlogProcessor.java b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/QzoneBlogProcessor.java index fac491d..400ebd5 100644 --- a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/QzoneBlogProcessor.java +++ b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/QzoneBlogProcessor.java @@ -7,7 +7,7 @@ import us.codecraft.webmagic.processor.PageProcessor; import java.util.List; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午8:08 */ diff --git a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/SinaBlogProcesser.java b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/SinaBlogProcesser.java index 37c6864..5bc2fc6 100644 --- a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/SinaBlogProcesser.java +++ b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/SinaBlogProcesser.java @@ -5,7 +5,7 @@ import us.codecraft.webmagic.Page; import us.codecraft.webmagic.processor.PageProcessor; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午1:48 */ diff --git a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/TianyaPageProcesser.java b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/TianyaPageProcesser.java index db5f9ff..a15ef74 100644 --- a/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/TianyaPageProcesser.java +++ b/webmagic-samples/src/main/java/us/codecraft/webmagic/samples/TianyaPageProcesser.java @@ -7,7 +7,7 @@ import us.codecraft.webmagic.processor.PageProcessor; import java.util.List; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-21 * Time: 下午1:48 */ diff --git a/webmagic-samples/src/test/java/us/codecraft/webmagic/SpiderTest.java b/webmagic-samples/src/test/java/us/codecraft/webmagic/SpiderTest.java index b67ffc4..6293884 100644 --- a/webmagic-samples/src/test/java/us/codecraft/webmagic/SpiderTest.java +++ b/webmagic-samples/src/test/java/us/codecraft/webmagic/SpiderTest.java @@ -8,7 +8,7 @@ import us.codecraft.webmagic.samples.HuxiuProcessor; import us.codecraft.webmagic.schedular.FileCacheQueueSchedular; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-4-20 * Time: 下午7:46 */ diff --git a/webmagic-samples/src/test/java/us/codecraft/webmagic/processor/DiandianProcessorTest.java b/webmagic-samples/src/test/java/us/codecraft/webmagic/processor/DiandianProcessorTest.java index 721a5eb..b87815c 100644 --- a/webmagic-samples/src/test/java/us/codecraft/webmagic/processor/DiandianProcessorTest.java +++ b/webmagic-samples/src/test/java/us/codecraft/webmagic/processor/DiandianProcessorTest.java @@ -11,7 +11,7 @@ import us.codecraft.webmagic.schedular.FileCacheQueueSchedular; import java.io.IOException; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-6-9 * Time: 上午8:02 */ diff --git a/webmagic-samples/src/test/java/us/codecraft/webmagic/processor/DiaoyuwengProcessorTest.java b/webmagic-samples/src/test/java/us/codecraft/webmagic/processor/DiaoyuwengProcessorTest.java index 8f03b6a..2b2caac 100644 --- a/webmagic-samples/src/test/java/us/codecraft/webmagic/processor/DiaoyuwengProcessorTest.java +++ b/webmagic-samples/src/test/java/us/codecraft/webmagic/processor/DiaoyuwengProcessorTest.java @@ -11,7 +11,7 @@ import us.codecraft.webmagic.schedular.FileCacheQueueSchedular; import java.io.IOException; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-6-9 * Time: 上午8:02 */ diff --git a/webmagic-samples/src/test/java/us/codecraft/webmagic/processor/SinablogProcessorTest.java b/webmagic-samples/src/test/java/us/codecraft/webmagic/processor/SinablogProcessorTest.java index 8fb2583..9613c9e 100644 --- a/webmagic-samples/src/test/java/us/codecraft/webmagic/processor/SinablogProcessorTest.java +++ b/webmagic-samples/src/test/java/us/codecraft/webmagic/processor/SinablogProcessorTest.java @@ -11,7 +11,7 @@ import us.codecraft.webmagic.schedular.FileCacheQueueSchedular; import java.io.IOException; /** - * Author: code4crafter@gmail.com + * @author code4crafter@gmail.com
* Date: 13-6-9 * Time: 上午8:02 */