yihua.huang
|
a37f40e6e6
|
add cookie supoort
|
2013-11-04 00:59:48 +08:00 |
yihua.huang
|
3c6fced48e
|
update connection client
|
2013-11-04 00:53:01 +08:00 |
yihua.huang
|
09153ff715
|
#22 http proxy support #32 update httpclient to 4.3.1
|
2013-11-04 00:47:09 +08:00 |
yihua.huang
|
edfc319c45
|
update httpclient to 4.3.1
|
2013-11-04 00:06:30 +08:00 |
yihua.huang
|
160a149b05
|
todo bugfix
|
2013-11-03 23:10:09 +08:00 |
yihua.huang
|
583a0eba8c
|
#29 refactor some method name
|
2013-11-03 20:24:26 +08:00 |
yihua.huang
|
6fa82a418b
|
#29 seed urls with more information
|
2013-11-03 20:20:50 +08:00 |
yihua.huang
|
1446ada732
|
some refactor
|
2013-10-31 22:50:22 +08:00 |
yihua.huang
|
84976c81ec
|
remove useless code
|
2013-10-31 22:48:18 +08:00 |
yihua.huang
|
b4fcf41168
|
add exit when comlete option
|
2013-10-31 22:41:02 +08:00 |
yihua.huang
|
352887870c
|
remove shutdown call
|
2013-10-31 22:22:14 +08:00 |
yihua.huang
|
a3f9ad198f
|
refactor multi thread code in Spider
|
2013-10-31 21:52:43 +08:00 |
yihua.huang
|
7fb44d2eec
|
#30 reuse PoolingClientConnectionManager for HttpClientDownloader
|
2013-10-14 23:22:04 +08:00 |
yihua.huang
|
5a226387e0
|
#27 nullpointer fix
|
2013-10-11 11:32:44 +08:00 |
yihua.huang
|
16e12e3bc9
|
#27 customize http header for downloader
|
2013-10-11 08:37:21 +08:00 |
yihua.huang
|
1a2c84ea78
|
#27 add timeout config to site
|
2013-10-11 07:36:16 +08:00 |
yihua.huang
|
4acbc19cee
|
[maven-release-plugin] prepare for next development iteration
|
2013-09-23 13:12:32 +08:00 |
yihua.huang
|
cc3b787991
|
[maven-release-plugin] prepare release webmagic-0.3.2
|
2013-09-23 13:12:19 +08:00 |
yihua.huang
|
b131878123
|
add example
|
2013-09-23 13:01:28 +08:00 |
yihua.huang
|
95ab4edec3
|
some bugfix
|
2013-09-23 08:38:54 +08:00 |
yihua.huang
|
fba330872b
|
fix a thread pool exception
|
2013-09-22 23:57:15 +08:00 |
yihua.huang
|
3c79d031bd
|
fix thread pool
|
2013-09-22 22:52:52 +08:00 |
yihua.huang
|
fb693a4ac4
|
[maven-release-plugin] prepare for next development iteration
|
2013-09-08 22:25:07 +08:00 |
yihua.huang
|
bfaaa042b9
|
[maven-release-plugin] prepare release webmagic-parent-0.3.1
|
2013-09-08 22:24:48 +08:00 |
yihua.huang
|
c17a31a21d
|
fix null pointe exception #26
|
2013-09-08 21:09:49 +08:00 |
yihua.huang
|
d2e0f0cd33
|
#25 use URL api in UrlUtils.canonicalizeUrl()
|
2013-09-06 21:35:23 +08:00 |
yihua.huang
|
ef4cf49fee
|
add stop method to spider #24
|
2013-09-06 21:17:36 +08:00 |
yihua.huang
|
692de76f86
|
fix issue #21 charset detect error
|
2013-09-04 15:27:51 +08:00 |
yihua.huang
|
e7bf425df4
|
[maven-release-plugin] prepare for next development iteration
|
2013-09-04 10:51:01 +08:00 |
yihua.huang
|
77ff252316
|
[maven-release-plugin] prepare release webmagic-0.3.0
|
2013-09-04 10:50:50 +08:00 |
yihua.huang
|
1fc8e104ab
|
add cycle retry
|
2013-09-04 10:32:13 +08:00 |
yihua.huang
|
d141541ef3
|
add retry
|
2013-09-04 09:57:19 +08:00 |
yihua.huang
|
a1ef2523cc
|
update xsoup version
|
2013-09-04 09:38:40 +08:00 |
yihua.huang
|
aefd0569a5
|
update version
|
2013-09-04 09:36:56 +08:00 |
yihua.huang
|
194518fd82
|
add switch
|
2013-09-04 08:21:34 +08:00 |
yihua.huang
|
326b97c65a
|
update
|
2013-09-04 00:15:54 +08:00 |
yihua.huang
|
2c3574537a
|
refactor in selectors
|
2013-09-02 14:14:24 +08:00 |
yihua.huang
|
85b7cf1563
|
complete test
|
2013-09-02 13:52:41 +08:00 |
yihua.huang
|
d7cd9e5747
|
update pom
|
2013-09-02 11:56:01 +08:00 |
yihua.huang
|
55d4a76ab7
|
newselectors
|
2013-09-02 08:21:32 +08:00 |
yihua.huang
|
d7abbd0e4b
|
fix compile error
|
2013-08-25 16:31:00 +08:00 |
yihua.huang
|
5e9e8b2541
|
add TextContentSelector
|
2013-08-25 16:30:38 +08:00 |
yihua.huang
|
0cc0ccee35
|
add charset specific for easy call of HttpClientDownloader
|
2013-08-25 15:41:43 +08:00 |
yihua.huang
|
91dcccf7b5
|
add a sample
|
2013-08-21 21:55:15 +08:00 |
yihua.huang
|
ad66d33f38
|
[maven-release-plugin] prepare for next development iteration
|
2013-08-20 23:39:59 +08:00 |
yihua.huang
|
9dc6b11954
|
[maven-release-plugin] prepare release webmagic-parent-0.2.1
|
2013-08-20 23:37:55 +08:00 |
yihua.huang
|
4f62dfc8a4
|
release
|
2013-08-20 23:37:20 +08:00 |
yihua.huang
|
74c940c758
|
[maven-release-plugin] prepare for next development iteration
|
2013-08-20 23:19:58 +08:00 |
yihua.huang
|
a4bb4e3429
|
[maven-release-plugin] prepare release webmagic-parent-0.2.1
|
2013-08-20 23:19:27 +08:00 |
yihua.huang
|
194f16aa75
|
update
|
2013-08-20 23:16:43 +08:00 |
yihua.huang
|
0f0f1a9bcd
|
release notes
|
2013-08-20 22:51:30 +08:00 |
yihua.huang
|
c1471718df
|
extractors
|
2013-08-20 22:44:53 +08:00 |
yihua.huang
|
20705b34ac
|
add more option to extractors
|
2013-08-20 22:13:30 +08:00 |
yihua.huang
|
c70ed57025
|
remove PriorityScheduler to core
|
2013-08-20 21:55:58 +08:00 |
yihua.huang
|
7003426898
|
update pom
|
2013-08-20 21:52:39 +08:00 |
yihua.huang
|
606417fdc7
|
update pom
|
2013-08-19 09:55:49 +08:00 |
yihua.huang
|
d460e136ef
|
update version
|
2013-08-19 09:52:15 +08:00 |
yihua.huang
|
c79d6ecf09
|
complete all comments
|
2013-08-17 23:30:49 +08:00 |
yihua.huang
|
90bbe9b951
|
webmagic-core
|
2013-08-17 23:24:04 +08:00 |
yihua.huang
|
17f8ead28f
|
update comments for selector
|
2013-08-17 21:33:54 +08:00 |
yihua.huang
|
77e6ca2945
|
update comments
|
2013-08-17 21:26:44 +08:00 |
yihua.huang
|
5073258237
|
closable
|
2013-08-17 21:19:24 +08:00 |
yihua.huang
|
d01c0eb8ce
|
update comments of spider
|
2013-08-17 21:15:36 +08:00 |
yihua.huang
|
5f1f4cbc46
|
update comments
|
2013-08-17 20:41:29 +08:00 |
yihua.huang
|
1148450ff9
|
update filecache to more useful
|
2013-08-17 18:12:47 +08:00 |
yihua.huang
|
3ba7a76f44
|
add combo extract to replace Extract2 Extract3...
|
2013-08-17 17:23:11 +08:00 |
yihua.huang
|
5cb45af3a4
|
+doc
|
2013-08-17 12:10:34 +08:00 |
yihua.huang
|
ef673b985e
|
add a method for httpclientdownloader
|
2013-08-14 13:32:23 +08:00 |
yihua.huang
|
067f3ea0cb
|
add some null pointer check for httpclientdownloader
|
2013-08-14 13:30:09 +08:00 |
yihua.huang
|
9e82256ce3
|
update docs
|
2013-08-12 10:08:20 +08:00 |
yihua.huang
|
0a902b441c
|
update docs
|
2013-08-12 09:55:17 +08:00 |
yihua.huang
|
0f2c5b5723
|
update redisscheduler
|
2013-08-11 18:28:12 +08:00 |
yihua.huang
|
787b952932
|
release notes and docs
|
2013-08-11 10:21:26 +08:00 |
yihua.huang
|
8b15f3c63d
|
add test
|
2013-08-10 20:33:47 +08:00 |
yihua.huang
|
ade5714d50
|
add https support
|
2013-08-10 18:52:27 +08:00 |
yihua.huang
|
21eca688e9
|
complete docs
|
2013-08-09 20:56:33 +08:00 |
yihua.huang
|
17d2d98cec
|
remove invalid @date
|
2013-08-09 20:43:06 +08:00 |
yihua.huang
|
268bd8d0c4
|
remove saxon to extension
|
2013-08-07 23:04:10 +08:00 |
yihua.huang
|
cff943f698
|
fix path format error
|
2013-08-07 13:05:12 +08:00 |
yihua.huang
|
5ef231a768
|
update version
|
2013-08-07 12:48:32 +08:00 |
yihua.huang
|
570533cce5
|
update readme
|
2013-08-07 09:45:38 +08:00 |
yihua.huang
|
36494bcfa5
|
add xpath2.0 api
|
2013-08-06 23:01:43 +08:00 |
yihua.huang
|
5c96407a3d
|
fix a null domain error
|
2013-08-06 22:43:31 +08:00 |
yihua.huang
|
c7005a0227
|
json fix
|
2013-08-06 22:36:37 +08:00 |
yihua.huang
|
e5f4b3916f
|
change file dir
|
2013-08-06 22:26:39 +08:00 |
yihua.huang
|
7d277e84d4
|
update lucene pipeline
|
2013-08-06 21:47:44 +08:00 |
yihua.huang
|
b40cca1122
|
move model package to plugin
|
2013-08-06 20:41:35 +08:00 |
yihua.huang
|
4eb3d60083
|
fix nullpointer exception
|
2013-08-05 22:06:39 +08:00 |
yihua.huang
|
b0af45f4bb
|
complete redis support
|
2013-08-05 21:44:29 +08:00 |
yihua.huang
|
f3a29d9315
|
fix pagedmodel bug
|
2013-08-05 21:03:47 +08:00 |
yihua.huang
|
629f8ac2d1
|
add extractors chain
|
2013-08-05 20:45:34 +08:00 |
yihua.huang
|
27ce3fc176
|
lazy init
|
2013-08-05 19:36:49 +08:00 |
yihua.huang
|
dc9f574e27
|
update request
|
2013-08-05 18:17:52 +08:00 |
yihua.huang
|
d56c681be1
|
add priority to request
|
2013-08-05 18:08:28 +08:00 |
yihua.huang
|
971e7b6ce2
|
add core
|
2013-08-05 13:53:13 +08:00 |
yihua.huang
|
619a12b303
|
add paged support
|
2013-08-04 21:22:15 +08:00 |
yihua.huang
|
a5c85c3c8b
|
add annotation ExtractByRaw
|
2013-08-04 15:12:06 +08:00 |
yihua.huang
|
1a50c64e33
|
update name
|
2013-08-04 10:05:03 +08:00 |
yihua.huang
|
a3a868f584
|
rename
|
2013-08-04 09:55:50 +08:00 |
yihua.huang
|
04a7fa037a
|
update pipeline
|
2013-08-04 09:53:01 +08:00 |
yihua.huang
|
21cae2ff2e
|
update package
|
2013-08-04 07:53:28 +08:00 |
yihua.huang
|
cfb8990453
|
update author
|
2013-08-04 03:04:30 +08:00 |
yihua.huang
|
b393e38320
|
add multi entity extract
|
2013-08-03 20:42:29 +08:00 |
yihua.huang
|
bfadac756a
|
fix an attribute bug
|
2013-08-03 18:36:03 +08:00 |
yihua.huang
|
145628557d
|
update afterextract api
|
2013-08-03 18:01:17 +08:00 |
yihua.huang
|
aca165b132
|
add and or selector
|
2013-08-03 17:38:36 +08:00 |
yihua.huang
|
69245e8c03
|
fix Class.assinable bug
|
2013-08-03 17:17:59 +08:00 |
yihua.huang
|
65518f7672
|
add list support
|
2013-08-03 17:01:25 +08:00 |
yihua.huang
|
d4de60a562
|
skip test
|
2013-08-03 16:35:12 +08:00 |
yihua.huang
|
d26cd82d59
|
rename package
|
2013-08-03 16:29:50 +08:00 |
yihua.huang
|
f84b53514f
|
complete objectpipeline
|
2013-08-03 15:55:54 +08:00 |
yihua.huang
|
866ab0a056
|
update email
|
2013-08-03 14:01:18 +08:00 |
yihua.huang
|
7c9e9ce869
|
xpath2.0
|
2013-08-03 07:28:46 +08:00 |
yihua.huang
|
7f27c28d4c
|
simplify api
|
2013-08-02 23:45:13 +08:00 |
yihua.huang
|
d7899e94ae
|
test saxon and invite XPath2.0 support
|
2013-08-02 23:39:34 +08:00 |
yihua.huang
|
3fe3d8f044
|
update
|
2013-08-02 13:51:42 +08:00 |
yihua.huang
|
516ff3310d
|
add failfast
|
2013-08-02 08:20:55 +08:00 |
yihua.huang
|
7a4dbb1f15
|
invite notnull
|
2013-08-02 08:09:37 +08:00 |
yihua.huang
|
06a39af0f3
|
add setter support
|
2013-08-02 07:32:37 +08:00 |
yihua.huang
|
abba3b7bff
|
add extract by url
|
2013-08-02 06:59:25 +08:00 |
yihua.huang
|
f08ffc34fd
|
rename
|
2013-08-02 06:33:48 +08:00 |
yihua.huang
|
c5cf05640a
|
processor
|
2013-08-01 22:53:44 +08:00 |
yihua.huang
|
50edd22ef6
|
add annotation
|
2013-08-01 22:40:57 +08:00 |
yihua.huang
|
7020b8648d
|
fix a thread problem
|
2013-07-30 21:39:43 +08:00 |
yihua.huang
|
52fd5cfc1c
|
fix encoding
|
2013-07-30 15:24:59 +08:00 |
yihua.huang
|
e87aabf8fd
|
为downloader增加了一个新方法,可设置线程数
|
2013-07-29 20:01:44 +08:00 |
yihua.huang
|
18fefa0c0a
|
fix a spider init problem
|
2013-07-29 10:59:23 +08:00 |
yihua.huang
|
54904851ea
|
add list output support
|
2013-07-26 21:22:57 +08:00 |
yihua.huang
|
42508af041
|
add huaban processor
|
2013-07-26 16:32:51 +08:00 |
yihua.huang
|
fe224cbf66
|
release resource
|
2013-07-26 15:27:47 +08:00 |
yihua.huang
|
86a20eabd9
|
fix a httpclient pool size bug
|
2013-07-26 14:41:30 +08:00 |
yihua.huang
|
fed3c0c98a
|
update readme
|
2013-07-26 11:55:40 +08:00 |
yihua.huang
|
d3e527fd6b
|
try invite selenium
|
2013-07-26 11:52:23 +08:00 |
yihua.huang
|
c2142f872b
|
add iteye sample
|
2013-07-26 08:24:08 +08:00 |
yihua.huang
|
65dc372152
|
update pipeline api
|
2013-07-25 13:32:39 +08:00 |
yihua.huang
|
cea866520d
|
update version
|
2013-07-24 20:45:45 +08:00 |
yihua.huang
|
de006333c8
|
update java docs
|
2013-07-24 20:38:49 +08:00 |
yihua.huang
|
827972d80f
|
update java docs
|
2013-07-24 19:49:00 +08:00 |
yihua.huang
|
96454fd74c
|
update java doc
|
2013-07-24 18:26:54 +08:00 |
yihua.huang
|
81e7f7982e
|
invite jsoup and cssselector
|
2013-07-20 08:34:18 +08:00 |
yihua.huang
|
c733046045
|
+sina blog
|
2013-07-19 12:36:55 +08:00 |
yihua.huang
|
2b34dc9d3f
|
add retry
|
2013-07-18 17:22:26 +08:00 |
yihua.huang
|
5c79550fd9
|
add offline cache and process
|
2013-06-24 14:42:49 +08:00 |
yihua.huang
|
a7316a1f57
|
add runasync
|
2013-06-23 22:16:04 +08:00 |
yihua.huang
|
cad2594a08
|
add multithread support
|
2013-06-23 21:09:26 +08:00 |
yihua.huang
|
5a6a68a318
|
add gzip support
|
2013-06-23 18:56:31 +08:00 |
yihua.huang
|
adeed3bcaf
|
add extra
|
2013-06-23 17:06:43 +08:00 |
yihua.huang
|
a0bcfb8567
|
add extra for page
|
2013-06-23 17:05:10 +08:00 |
yihua.huang
|
7e17c71c3e
|
add page skip
|
2013-06-23 16:57:01 +08:00 |
yihua.huang
|
9b1ba6e8bc
|
ignore unstable test
|
2013-06-20 17:57:31 +08:00 |