refract 0.0.1 → 0.0.2
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/lib/refract.rb +19 -15
- metadata +1 -1
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 4b85603db75df917843a9a472adc0be6c4d70c82
|
4
|
+
data.tar.gz: 4e6fd2bc73965689460ba68a7abe19fc22ad883c
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 9a3081a106e86c3d643966fea33bf8bd5b0a4028baa1943da033d197a488bd64594a9c85380ac6f47563fdac630c470eaddb226ab19e44cdadbeec8b7e69d8ab
|
7
|
+
data.tar.gz: 18220738bdb8f0d26a8b114e5fec5d2ea311437e20fbd19ea59c71c2079ff8586da2a415510de2a42fc96cc973021dc46c1fb7a9045a268bfec863fdddcb5543
|
data/lib/refract.rb
CHANGED
@@ -7,23 +7,27 @@ class Refract
|
|
7
7
|
Spidr.site(homePage) do |spider|
|
8
8
|
spider.every_html_page do |page|
|
9
9
|
if page.title
|
10
|
-
|
10
|
+
pageTitle = page.title.downcase.gsub(' ', "_").delete('|')
|
11
11
|
else
|
12
|
-
|
12
|
+
pageTitle = "unknown_page_#{Time.now.to_f.to_s.sub('.', '_')}"
|
13
13
|
end
|
14
|
-
|
15
|
-
|
16
|
-
|
17
|
-
|
18
|
-
|
19
|
-
|
20
|
-
|
21
|
-
|
22
|
-
|
23
|
-
|
24
|
-
|
25
|
-
|
26
|
-
File.
|
14
|
+
fileName = pageTitle
|
15
|
+
className = pageTitle.gsub(' ', '').delete('|')
|
16
|
+
begin
|
17
|
+
body = page.doc.to_s
|
18
|
+
idElements=body.scan(/\id="(.*?)"/).flatten
|
19
|
+
nameElements=body.scan(/\name="(.*?)"/).flatten
|
20
|
+
dataTestElements=body.scan(/\data-test="(.*?)"/).flatten
|
21
|
+
url = page.url.to_s.partition('.com').last
|
22
|
+
elements = element_formatter('id', idElements)
|
23
|
+
elements += element_formatter('name', nameElements)
|
24
|
+
elements += element_formatter('data-test', dataTestElements)
|
25
|
+
path = File.join(Dir.pwd, 'page_objects', "#{fileName}.rb")
|
26
|
+
unless File.exists?(path)
|
27
|
+
File.open(path, 'w') {|file| file.write(base_page_object_content(url, className, elements)) }
|
28
|
+
end
|
29
|
+
rescue
|
30
|
+
puts "page object not created for #{page.url}"
|
27
31
|
end
|
28
32
|
end
|
29
33
|
end
|