yihua.huang
|
b51fb2696b
|
update ut for cookie
|
2013-12-06 00:30:01 +08:00 |
yihua.huang
|
ff2f588c41
|
#48 nullpointer exception
|
2013-12-04 22:11:20 +08:00 |
yihua.huang
|
d274310cb2
|
[maven-release-plugin] prepare for next development iteration
|
2013-12-03 23:35:06 +08:00 |
yihua.huang
|
e8c32a32dc
|
[maven-release-plugin] prepare release webmagic-0.4.2
|
2013-12-03 23:34:57 +08:00 |
yihua.huang
|
6a828e923c
|
#46 Downloader thread hang up when timeout
|
2013-12-03 09:59:54 +08:00 |
shijinping
|
9a524aa364
|
double-check 中再取次httpClient的内容
|
2013-11-28 14:38:30 +08:00 |
yihua.huang
|
e7083dc39d
|
[maven-release-plugin] prepare for next development iteration
|
2013-11-28 13:04:32 +08:00 |
yihua.huang
|
ae623567b3
|
[maven-release-plugin] prepare release webmagic-0.4.1
|
2013-11-28 13:04:22 +08:00 |
yihua.huang
|
59ad4cad27
|
#42 Add jsonpath in annotation mode for json result
|
2013-11-28 08:25:16 +08:00 |
yihua.huang
|
c2d6d495b3
|
#41 add getThreadAlive(),getStatus,getPageCount() to spider
|
2013-11-28 07:59:24 +08:00 |
yihua.huang
|
cf62d707e0
|
#36 Spider does not exit when success
|
2013-11-27 23:33:18 +08:00 |
yihua.huang
|
a01312930a
|
#39 Parsing html after page.getHtml()
|
2013-11-27 22:01:34 +08:00 |
yihua.huang
|
f63d33b457
|
update some comments
|
2013-11-27 21:06:53 +08:00 |
yihua.huang
|
04fcf3193f
|
#38 Change algorithm of SmartContentSelector
|
2013-11-23 13:56:55 +08:00 |
yihua.huang
|
296a68920e
|
fix javadoc and add setPipelines() for spider
|
2013-11-14 13:23:29 +08:00 |
yihua.huang
|
47a0360783
|
#35 add status code to page
|
2013-11-12 11:51:34 +08:00 |
yihua.huang
|
bc5c30de17
|
update scripts
|
2013-11-12 08:20:59 +08:00 |
yihua.huang
|
f9daae39cf
|
[maven-release-plugin] prepare for next development iteration
|
2013-11-11 14:33:11 +08:00 |
yihua.huang
|
fdb9441519
|
[maven-release-plugin] prepare release webmagic-0.4.0
|
2013-11-11 14:33:01 +08:00 |
yihua.huang
|
1d75ae7f5b
|
rollback version to 0.4.0 because not deploy success
|
2013-11-11 11:52:56 +08:00 |
yihua.huang
|
df8ca8ad09
|
add scripts
|
2013-11-10 22:30:48 +08:00 |
yihua.huang
|
775eb9732f
|
[maven-release-plugin] prepare for next development iteration
|
2013-11-06 22:17:58 +08:00 |
yihua.huang
|
0b4fadc24d
|
[maven-release-plugin] prepare release webmagic-0.4.0
|
2013-11-06 22:17:47 +08:00 |
yihua.huang
|
fe6d9bb2e2
|
get keep-alive rework
|
2013-11-06 21:53:39 +08:00 |
yihua.huang
|
fd6d2fd6f8
|
try to keepalive TCP connection
|
2013-11-06 21:19:14 +08:00 |
yihua.huang
|
425df08523
|
update version to 0.4.0
|
2013-11-06 12:50:45 +08:00 |
yihua.huang
|
e046bb0723
|
remove useless code
|
2013-11-06 12:48:14 +08:00 |
yihua.huang
|
6e32a19f80
|
update api for direct download
|
2013-11-06 12:46:50 +08:00 |
yihua.huang
|
807aefe9df
|
change EntityUtil to IOUtil because some encoding error
|
2013-11-06 07:37:34 +08:00 |
yihua.huang
|
00b0a751b4
|
#33 ignore 'content-encoding' when redirect
|
2013-11-06 06:57:58 +08:00 |
yihua.huang
|
8f774afc84
|
add direct download
|
2013-11-06 06:41:04 +08:00 |
yihua.huang
|
c18b603399
|
optimize long compare
|
2013-11-04 07:09:44 +08:00 |
yihua.huang
|
ed3f3583cc
|
downloader refactor
|
2013-11-04 01:03:23 +08:00 |
yihua.huang
|
a37f40e6e6
|
add cookie supoort
|
2013-11-04 00:59:48 +08:00 |
yihua.huang
|
3c6fced48e
|
update connection client
|
2013-11-04 00:53:01 +08:00 |
yihua.huang
|
09153ff715
|
#22 http proxy support #32 update httpclient to 4.3.1
|
2013-11-04 00:47:09 +08:00 |
yihua.huang
|
edfc319c45
|
update httpclient to 4.3.1
|
2013-11-04 00:06:30 +08:00 |
yihua.huang
|
160a149b05
|
todo bugfix
|
2013-11-03 23:10:09 +08:00 |
yihua.huang
|
583a0eba8c
|
#29 refactor some method name
|
2013-11-03 20:24:26 +08:00 |
yihua.huang
|
6fa82a418b
|
#29 seed urls with more information
|
2013-11-03 20:20:50 +08:00 |
yihua.huang
|
1446ada732
|
some refactor
|
2013-10-31 22:50:22 +08:00 |
yihua.huang
|
84976c81ec
|
remove useless code
|
2013-10-31 22:48:18 +08:00 |
yihua.huang
|
b4fcf41168
|
add exit when comlete option
|
2013-10-31 22:41:02 +08:00 |
yihua.huang
|
352887870c
|
remove shutdown call
|
2013-10-31 22:22:14 +08:00 |
yihua.huang
|
a3f9ad198f
|
refactor multi thread code in Spider
|
2013-10-31 21:52:43 +08:00 |
yihua.huang
|
7fb44d2eec
|
#30 reuse PoolingClientConnectionManager for HttpClientDownloader
|
2013-10-14 23:22:04 +08:00 |
yihua.huang
|
5a226387e0
|
#27 nullpointer fix
|
2013-10-11 11:32:44 +08:00 |
yihua.huang
|
16e12e3bc9
|
#27 customize http header for downloader
|
2013-10-11 08:37:21 +08:00 |
yihua.huang
|
1a2c84ea78
|
#27 add timeout config to site
|
2013-10-11 07:36:16 +08:00 |
yihua.huang
|
4acbc19cee
|
[maven-release-plugin] prepare for next development iteration
|
2013-09-23 13:12:32 +08:00 |