rubyretriever 0.1.2 → 0.1.3
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/lib/retriever/fetch.rb +2 -3
- data/lib/retriever/version.rb +1 -1
- data/readme.md +1 -1
- metadata +1 -1
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: f27793b1294bd489c3338aa5bc739dc6058d479a
|
4
|
+
data.tar.gz: e48491765a741087ba7bf708d62a8bbf8aa3cf80
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 60c017cf5dda8c659b12c3146f565df743dc4f6cf0e8436889bebb86cdccd5b128cca233d76b1413f526c21d1d99478c8149e6c43772e5dd0db1067f8dea5263
|
7
|
+
data.tar.gz: ec8142f3a8cbd75861c74322dd0358da51ee45388376ca0118d0998b81cf302b182eef93c39d88ef17dd35ef80a6253bf7a058e2e2052ea60ea3266d401892ab
|
data/lib/retriever/fetch.rb
CHANGED
@@ -155,7 +155,7 @@ module Retriever
|
|
155
155
|
@linkStack.concat(new_links_arr)
|
156
156
|
@sitemap.concat(new_links_arr) if @s
|
157
157
|
end
|
158
|
-
@progressbar.finish
|
158
|
+
@progressbar.finish if @prgrss
|
159
159
|
end
|
160
160
|
def asyncGetWave() #send a new wave of GET requests, using current @linkStack
|
161
161
|
new_stuff = []
|
@@ -167,11 +167,10 @@ module Retriever
|
|
167
167
|
if @already_crawled.include?(url)
|
168
168
|
@linkStack.delete(url)
|
169
169
|
next
|
170
|
-
else
|
171
|
-
@already_crawled.insert(url)
|
172
170
|
end
|
173
171
|
resp = EventMachine::HttpRequest.new(url).get
|
174
172
|
lg("URL Crawled: #{url}")
|
173
|
+
@already_crawled.insert(url)
|
175
174
|
if @prgrss
|
176
175
|
@progressbar.increment if @already_crawled.size < @maxPages
|
177
176
|
end
|
data/lib/retriever/version.rb
CHANGED
data/readme.md
CHANGED