tspider 0.0.2 → 0.0.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/lib/tspider/page.rb +14 -11
- data/lib/tspider/version.rb +1 -1
- metadata +1 -1
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: e407e0ef33ba799382dd43ce3772f18fe76656b5
|
4
|
+
data.tar.gz: 33f0ecf9e8fd1797dfd8f2e34dd3fd7bfc02dd47
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 94242783d24aaf9b55c44df8d57ac601514aca916c039614b88e6be207f984f388eebff49eecde56c4790e2089e526c222f37c32e25f1a44246d0f3172532f19
|
7
|
+
data.tar.gz: fb0b64edbdb382f975033799b7f5760150e67ec38759fccd27361159863a8657e4b10b6397c9a79049f8e3ed7f6fa1bae3f3c8ef83bf892a910b6d9daa12ae5e
|
data/lib/tspider/page.rb
CHANGED
@@ -46,19 +46,19 @@ module Tspider
|
|
46
46
|
end
|
47
47
|
|
48
48
|
def title
|
49
|
-
safe_search('title',[0,
|
49
|
+
safe_search('title', [0], true)
|
50
50
|
end
|
51
51
|
|
52
52
|
def meta_description
|
53
|
-
safe_search('meta[@name="description"]',[0,'content'])
|
53
|
+
safe_search('meta[@name="description"]', [0, 'content'])
|
54
54
|
end
|
55
55
|
|
56
56
|
def meta_keywords
|
57
|
-
safe_search('meta[@name="keywords"]',[0,'content'])
|
57
|
+
safe_search('meta[@name="keywords"]', [0, 'content'])
|
58
58
|
end
|
59
59
|
|
60
60
|
def meta_robots
|
61
|
-
safe_search('meta[@name="robots"]',[0,'content'])
|
61
|
+
safe_search('meta[@name="robots"]', [0, 'content'])
|
62
62
|
end
|
63
63
|
|
64
64
|
def links
|
@@ -81,7 +81,7 @@ module Tspider
|
|
81
81
|
end
|
82
82
|
|
83
83
|
def canonical
|
84
|
-
safe_search('link[@rel="canonical"]',[0,'href'])
|
84
|
+
safe_search('link[@rel="canonical"]', [0, 'href'])
|
85
85
|
end
|
86
86
|
|
87
87
|
(1..6).each do |i|
|
@@ -94,10 +94,8 @@ module Tspider
|
|
94
94
|
end
|
95
95
|
end
|
96
96
|
|
97
|
-
|
98
|
-
|
99
|
-
def safe_search(search_value,select_path=[])
|
100
|
-
value = @doc.search(search_value)
|
97
|
+
def safe_search(search_value, select_path=[], return_content=false)
|
98
|
+
value = @doc.search(search_value).dup
|
101
99
|
select_path.each do |key|
|
102
100
|
begin
|
103
101
|
value = value[key]
|
@@ -105,8 +103,13 @@ module Tspider
|
|
105
103
|
return nil
|
106
104
|
end
|
107
105
|
end
|
108
|
-
value
|
109
|
-
end
|
110
106
|
|
107
|
+
return nil if value.nil?
|
108
|
+
if return_content
|
109
|
+
value.content
|
110
|
+
else
|
111
|
+
value
|
112
|
+
end
|
113
|
+
end
|
111
114
|
end
|
112
115
|
end
|
data/lib/tspider/version.rb
CHANGED