tspider 0.0.1 → 0.0.2
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/lib/tspider/page.rb +17 -16
- data/lib/tspider/version.rb +1 -1
- metadata +1 -1
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 937326af40049679a7372ee0b0ee78b01f01083c
|
4
|
+
data.tar.gz: e5dc5058e8e1e9f5f740470aa14fef0260480de8
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: d9016aed3de2ac470617cb0f19760e0f23949c3b437768f2c006e7d75ae6f4ea4bffb805d3067734b7943bde2e1d73a301afeefb6946d349a108fcd9c7af3813
|
7
|
+
data.tar.gz: b9c8d326fb1ea24065393d7b34b8b121e1beeb4c3bc76b993c1a6697cc915e68d88f264e132d0b20707cf842918736c076baf1bfd8b6aefb2469924ee8cb4430
|
data/lib/tspider/page.rb
CHANGED
@@ -5,7 +5,7 @@ require 'webrobots'
|
|
5
5
|
|
6
6
|
module Tspider
|
7
7
|
class Page
|
8
|
-
attr_reader :
|
8
|
+
attr_reader :html, :doc, :url, :status, :location, :response_time, :response
|
9
9
|
|
10
10
|
def initialize(attrs)
|
11
11
|
@url = attrs[:url]
|
@@ -25,23 +25,24 @@ module Tspider
|
|
25
25
|
@doc = Nokogiri::HTML(@html)
|
26
26
|
@location = r.headers['location']
|
27
27
|
@headers = r.headers.to_hash
|
28
|
+
end
|
28
29
|
|
29
|
-
|
30
|
-
|
31
|
-
|
32
|
-
|
33
|
-
|
34
|
-
|
35
|
-
|
36
|
-
|
37
|
-
|
38
|
-
|
39
|
-
|
40
|
-
|
41
|
-
|
42
|
-
|
30
|
+
# Collects the page's fetch metadata and extracted fields into a single Hash.
#
# The :url, :status, :location, :response_time and :headers entries are read
# from instance variables; the remaining entries are the return values of
# same-named methods on this object (canonical, title, meta_keywords,
# meta_description, meta_robots, h1, h2, h3, links).
# NOTE(review): those helper methods are defined outside this block --
# confirm their return types against the rest of the class.
#
# @return [Hash{Symbol => Object}] one entry per field, in the order below
def opf
  {
    :url              => @url,
    :status           => @status,
    # Instance variable names are case-sensitive: the value is stored in
    # @location, so reading @Location always produced nil here.
    :location         => @location,
    :response_time    => @response_time,
    :canonical        => canonical,
    :title            => title,
    :meta_keywords    => meta_keywords,
    :meta_description => meta_description,
    :meta_robots      => meta_robots,
    :h1               => h1,
    :h2               => h2,
    :h3               => h3,
    :links            => links,
    :headers          => @headers
  }
end
|
46
47
|
|
47
48
|
def title
|
data/lib/tspider/version.rb
CHANGED