tspider 0.0.2 → 0.0.3
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/lib/tspider/page.rb +14 -11
- data/lib/tspider/version.rb +1 -1
- metadata +1 -1
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: e407e0ef33ba799382dd43ce3772f18fe76656b5
|
4
|
+
data.tar.gz: 33f0ecf9e8fd1797dfd8f2e34dd3fd7bfc02dd47
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 94242783d24aaf9b55c44df8d57ac601514aca916c039614b88e6be207f984f388eebff49eecde56c4790e2089e526c222f37c32e25f1a44246d0f3172532f19
|
7
|
+
data.tar.gz: fb0b64edbdb382f975033799b7f5760150e67ec38759fccd27361159863a8657e4b10b6397c9a79049f8e3ed7f6fa1bae3f3c8ef83bf892a910b6d9daa12ae5e
|
data/lib/tspider/page.rb
CHANGED
@@ -46,19 +46,19 @@ module Tspider
|
|
46
46
|
end
|
47
47
|
|
48
48
|
def title
|
49
|
-
safe_search('title',[0,
|
49
|
+
safe_search('title', [0], true)
|
50
50
|
end
|
51
51
|
|
52
52
|
def meta_description
|
53
|
-
safe_search('meta[@name="description"]',[0,'content'])
|
53
|
+
safe_search('meta[@name="description"]', [0, 'content'])
|
54
54
|
end
|
55
55
|
|
56
56
|
def meta_keywords
|
57
|
-
safe_search('meta[@name="keywords"]',[0,'content'])
|
57
|
+
safe_search('meta[@name="keywords"]', [0, 'content'])
|
58
58
|
end
|
59
59
|
|
60
60
|
def meta_robots
|
61
|
-
safe_search('meta[@name="robots"]',[0,'content'])
|
61
|
+
safe_search('meta[@name="robots"]', [0, 'content'])
|
62
62
|
end
|
63
63
|
|
64
64
|
def links
|
@@ -81,7 +81,7 @@ module Tspider
|
|
81
81
|
end
|
82
82
|
|
83
83
|
def canonical
|
84
|
-
safe_search('link[@rel="canonical"]',[0,'href'])
|
84
|
+
safe_search('link[@rel="canonical"]', [0, 'href'])
|
85
85
|
end
|
86
86
|
|
87
87
|
(1..6).each do |i|
|
@@ -94,10 +94,8 @@ module Tspider
|
|
94
94
|
end
|
95
95
|
end
|
96
96
|
|
97
|
-
|
98
|
-
|
99
|
-
def safe_search(search_value,select_path=[])
|
100
|
-
value = @doc.search(search_value)
|
97
|
+
def safe_search(search_value, select_path=[], return_content=false)
|
98
|
+
value = @doc.search(search_value).dup
|
101
99
|
select_path.each do |key|
|
102
100
|
begin
|
103
101
|
value = value[key]
|
@@ -105,8 +103,13 @@ module Tspider
|
|
105
103
|
return nil
|
106
104
|
end
|
107
105
|
end
|
108
|
-
value
|
109
|
-
end
|
110
106
|
|
107
|
+
return nil if value.nil?
|
108
|
+
if return_content
|
109
|
+
value.content
|
110
|
+
else
|
111
|
+
value
|
112
|
+
end
|
113
|
+
end
|
111
114
|
end
|
112
115
|
end
|
data/lib/tspider/version.rb
CHANGED