list_spider 2.0.1 → 2.0.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 9ef1d9cd5edd321718137a9b9055b6e223fb870f1209271df4142930c35dd6f5
4
- data.tar.gz: 983055db2e6714337f4f76ec3d279a83f46d48e689be0334c9a944bce197599c
3
+ metadata.gz: 4a69a63919c971b077855f236631b5b91895e11836338c8970dec65214f92a4c
4
+ data.tar.gz: 6e0fefdd9a9eba8bfbead303bfbe2e27a0d98171bd60cdae89864f026289c987
5
5
  SHA512:
6
- metadata.gz: dcccc6c7761931c93bd729e58a844e127d9ac7a63075f8163c92083f7749df2e978cc745071a2c319bcc48825d2dd53a2e043e97a02329884168cc50d21f7975
7
- data.tar.gz: 33cd0806b64df7e88296a9ff8ce0a3b233f6702df9cdb4c87938c7cc0b64cde2d096970903a3242c228c308d7fc2d8a35f4eff85d2262e5034de83bf7d009e85
6
+ metadata.gz: 11a2591f94021e7bb3d06bb7a712f98cf8329142150cf09979d44cc65f1803c809e9077d85ad5d41c83457b20c2bf9694a3a65692898145eb7738e18460e40ba
7
+ data.tar.gz: 3e393c808733042ba3b13a950fcc63f7498641a55d16a5ccae11f3bf1100ca04558e32873bd9063602abd6c72194e8d90492b9b292e47cbd08bfc44476f5417f
data/Gemfile.lock CHANGED
@@ -1,7 +1,7 @@
1
1
  PATH
2
2
  remote: .
3
3
  specs:
4
- list_spider (2.0.0)
4
+ list_spider (2.0.1)
5
5
  em-http-request (~> 1.1, >= 1.1.3)
6
6
  nokogiri (~> 1.6, >= 1.6.7)
7
7
  rchardet (~> 1.6, >= 1.6.1)
data/lib/list_spider.rb CHANGED
@@ -126,7 +126,7 @@ module ListSpider
126
126
 
127
127
  http_req.callback do
128
128
  s = http_req.response_header.status
129
- puts s
129
+ puts "#{Time.now}, http status code: #{s}"
130
130
 
131
131
  if s == 200
132
132
  local_dir = File.dirname(task_struct.local_path)
@@ -149,27 +149,9 @@ module ListSpider
149
149
  end
150
150
 
151
151
  http_req.errback do
152
- puts "errback:#{http_req.response_header},retry..."
153
- puts task_struct.href
154
- puts http_req.response_header.status
155
-
156
- if task_struct.errback
157
- task_struct.errback.call(task_struct, http_req)
158
- # else
159
- # ret = false
160
- # if task_struct.http_method == :get
161
- # ret = SpiderHelper.direct_http_get(task_struct.href, task_struct.local_path, convert_to_utf8: @convert_to_utf8)
162
- # elsif task_struct.http_method == :post
163
- # ret = SpiderHelper.direct_http_post(task_struct.href, task_struct.local_path, task_struct.params, convert_to_utf8: @convert_to_utf8)
164
- # end
152
+ puts "#{Time.now}, #{task_struct.href}, error: #{http_req.error}"
165
153
 
166
- # if ret
167
- # call_parse_method(task_struct)
168
- # succeed_list << task_struct
169
- # else
170
- # failed_list << task_struct
171
- # end
172
- end
154
+ task_struct.errback.call(task_struct, http_req) if task_struct.errback
173
155
  end
174
156
 
175
157
  begin
@@ -1,3 +1,3 @@
1
1
  module ListSpider
2
- VERSION = '2.0.1'.freeze
2
+ VERSION = '2.0.2'.freeze
3
3
  end
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: list_spider
3
3
  version: !ruby/object:Gem::Version
4
- version: 2.0.1
4
+ version: 2.0.2
5
5
  platform: ruby
6
6
  authors:
7
7
  - Charles Zhang
8
8
  autorequire:
9
9
  bindir: exe
10
10
  cert_chain: []
11
- date: 2018-02-23 00:00:00.000000000 Z
11
+ date: 2018-02-28 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: bundler