Dynamised 0.2.0 → 0.2.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/bin/dynamised +0 -1
- data/lib/dynamised/helpers.rb +10 -0
- data/lib/dynamised/meta.rb +1 -1
- data/lib/dynamised/scraper.rb +8 -7
- metadata +2 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: c5635a9d0b97dcc25da301b5a176de94ea7afc42
|
4
|
+
data.tar.gz: 4eb55543e0be23dd36cd840a4198ce719f85e381
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: e1eea295b1d0852072bfdfa8464ad6de008288d419831b042b74df827faa5f28478725faeb2127bfbfc6bf44b6bde82ee91e36fc168677f33f4578db00edce7a
|
7
|
+
data.tar.gz: 797fbcb4b2b9ecd58531a59c11d5ca65813315c09b2e1c593f09ad6794c1ddf6482c47a9cfec148cdb58e865a4951f7615f2e9ee8cb55a224bfa2711808604c4
|
data/bin/dynamised
CHANGED
data/lib/dynamised/helpers.rb
CHANGED
data/lib/dynamised/meta.rb
CHANGED
data/lib/dynamised/scraper.rb
CHANGED
@@ -101,7 +101,7 @@ module Dynamised
|
|
101
101
|
scrape(doc,tree,&block)
|
102
102
|
end
|
103
103
|
if pagination?(doc,tree)
|
104
|
-
paginate(tree) do |item|
|
104
|
+
paginate(doc,tree) do |item|
|
105
105
|
pull(item,tree,&block)
|
106
106
|
end
|
107
107
|
else
|
@@ -117,10 +117,10 @@ module Dynamised
|
|
117
117
|
|
118
118
|
def paginate(doc,tree)
|
119
119
|
current_page = doc
|
120
|
-
max = scrape_tag(current_page,tree[:paginate][:max],{r_type: :to_i})
|
120
|
+
max = scrape_tag(current_page,tree.data[:paginate][:max],{r_type: :to_i})
|
121
121
|
raise "No paginate max tag found" unless max
|
122
122
|
(1..max).each do
|
123
|
-
(current_page.xpath(tree[:paginate][:item])).each do |node|
|
123
|
+
(current_page.xpath(tree.data[:paginate][:item])).each do |node|
|
124
124
|
yield(item)
|
125
125
|
end
|
126
126
|
current_page = get_doc(current_page.xpath(tree[:paginate][:next]).attr('href'))
|
@@ -128,7 +128,7 @@ module Dynamised
|
|
128
128
|
end
|
129
129
|
|
130
130
|
def pagination?(doc,tree)
|
131
|
-
search_for_tag(doc,tree[:paginate][:if])
|
131
|
+
search_for_tag(doc,tree.data[:paginate][:if])
|
132
132
|
end
|
133
133
|
|
134
134
|
|
@@ -152,12 +152,13 @@ module Dynamised
|
|
152
152
|
fields =
|
153
153
|
tree.data[:fields].each_with_object({}) do |(field,data),res_hash|
|
154
154
|
target = execute_method(data[:meta][:before],remove_style_tags(doc),res_hash)
|
155
|
-
value = scrape_tag(target,data[:xpath],data[:meta])
|
155
|
+
value = data[:xpath].empty? ? target : scrape_tag(target,data[:xpath],data[:meta])
|
156
156
|
res_hash[field] =
|
157
157
|
if value
|
158
|
-
[*data[:meta][:after]].
|
158
|
+
res = [*data[:meta][:after]].map do |method|
|
159
159
|
execute_method(method,value,res_hash)
|
160
160
|
end
|
161
|
+
res.length > 1 ? res : res.first
|
161
162
|
else
|
162
163
|
data[:meta].fetch(:default,nil)
|
163
164
|
end
|
@@ -230,7 +231,7 @@ module Dynamised
|
|
230
231
|
end
|
231
232
|
|
232
233
|
def search_for_tag(doc,xpath)
|
233
|
-
doc.at_xpath(XPATH_Anchor % xpath)
|
234
|
+
xpath ? doc.at_xpath(XPATH_Anchor % xpath) : false
|
234
235
|
end
|
235
236
|
|
236
237
|
def scrape_tag(doc,xpath,meta={})
|
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: Dynamised
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.2.0
|
4
|
+
version: 0.2.1
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Martin Becker
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2017-
|
11
|
+
date: 2017-05-06 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: tty-spinner
|