spidr 0.4.0 → 0.4.1
This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
- data/.gitignore +10 -0
- data/ChangeLog.md +4 -0
- data/Gemfile +4 -0
- data/README.md +1 -1
- data/gemspec.yml +2 -2
- data/lib/spidr/agent.rb +4 -2
- data/lib/spidr/version.rb +1 -1
- data/spidr.gemspec +1 -1
- metadata +22 -21
data/.gitignore
ADDED
data/ChangeLog.md
CHANGED
data/Gemfile
CHANGED
data/README.md
CHANGED
@@ -4,7 +4,7 @@
|
|
4
4
|
* [Source](http://github.com/postmodern/spidr)
|
5
5
|
* [Issues](http://github.com/postmodern/spidr/issues)
|
6
6
|
* [Mailing List](http://groups.google.com/group/spidr)
|
7
|
-
*
|
7
|
+
* [IRC](http://webchat.freenode.net/?channels=spidr&uio=d4)
|
8
8
|
|
9
9
|
## Description
|
10
10
|
|
data/gemspec.yml
CHANGED
data/lib/spidr/agent.rb
CHANGED
@@ -8,6 +8,7 @@ require 'spidr/cookie_jar'
|
|
8
8
|
require 'spidr/auth_store'
|
9
9
|
require 'spidr/spidr'
|
10
10
|
|
11
|
+
require 'openssl'
|
11
12
|
require 'net/http'
|
12
13
|
require 'set'
|
13
14
|
|
@@ -684,8 +685,9 @@ module Spidr
|
|
684
685
|
rescue SystemCallError,
|
685
686
|
Timeout::Error,
|
686
687
|
SocketError,
|
687
|
-
|
688
|
-
|
688
|
+
IOError,
|
689
|
+
OpenSSL::SSL::SSLError,
|
690
|
+
Net::HTTPBadResponse
|
689
691
|
|
690
692
|
@sessions.kill!(url)
|
691
693
|
|
data/lib/spidr/version.rb
CHANGED
data/spidr.gemspec
CHANGED
@@ -99,7 +99,7 @@ Gem::Specification.new do |gemspec|
|
|
99
99
|
end
|
100
100
|
|
101
101
|
if gemspec.respond_to?(:required_rubygems_version=)
|
102
|
-
gemspec.required_rubygems_version = metadata['
|
102
|
+
gemspec.required_rubygems_version = metadata['required_rubygems_version']
|
103
103
|
end
|
104
104
|
|
105
105
|
parse_versions = lambda { |versions|
|
metadata
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: spidr
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.4.
|
4
|
+
version: 0.4.1
|
5
5
|
prerelease:
|
6
6
|
platform: ruby
|
7
7
|
authors:
|
@@ -9,12 +9,11 @@ authors:
|
|
9
9
|
autorequire:
|
10
10
|
bindir: bin
|
11
11
|
cert_chain: []
|
12
|
-
date: 2011-
|
13
|
-
default_executable:
|
12
|
+
date: 2011-12-09 00:00:00.000000000 Z
|
14
13
|
dependencies:
|
15
14
|
- !ruby/object:Gem::Dependency
|
16
15
|
name: nokogiri
|
17
|
-
requirement: &
|
16
|
+
requirement: &19474920 !ruby/object:Gem::Requirement
|
18
17
|
none: false
|
19
18
|
requirements:
|
20
19
|
- - ~>
|
@@ -22,39 +21,41 @@ dependencies:
|
|
22
21
|
version: '1.3'
|
23
22
|
type: :runtime
|
24
23
|
prerelease: false
|
25
|
-
version_requirements: *
|
24
|
+
version_requirements: *19474920
|
26
25
|
- !ruby/object:Gem::Dependency
|
27
26
|
name: bundler
|
28
|
-
requirement: &
|
27
|
+
requirement: &19474320 !ruby/object:Gem::Requirement
|
29
28
|
none: false
|
30
29
|
requirements:
|
31
30
|
- - ~>
|
32
31
|
- !ruby/object:Gem::Version
|
33
|
-
version: 1.0
|
32
|
+
version: '1.0'
|
34
33
|
type: :development
|
35
34
|
prerelease: false
|
36
|
-
version_requirements: *
|
35
|
+
version_requirements: *19474320
|
37
36
|
- !ruby/object:Gem::Dependency
|
38
37
|
name: yard
|
39
|
-
requirement: &
|
38
|
+
requirement: &19473820 !ruby/object:Gem::Requirement
|
40
39
|
none: false
|
41
40
|
requirements:
|
42
41
|
- - ~>
|
43
42
|
- !ruby/object:Gem::Version
|
44
|
-
version: 0.
|
43
|
+
version: '0.7'
|
45
44
|
type: :development
|
46
45
|
prerelease: false
|
47
|
-
version_requirements: *
|
46
|
+
version_requirements: *19473820
|
48
47
|
description: Spidr is a versatile Ruby web spidering library that can spider a site,
|
49
48
|
multiple domains, certain links or infinitely. Spidr is designed to be fast and
|
50
49
|
easy to use.
|
51
|
-
email:
|
52
|
-
- postmodern.mod3@gmail.com
|
50
|
+
email: postmodern.mod3@gmail.com
|
53
51
|
executables: []
|
54
52
|
extensions: []
|
55
53
|
extra_rdoc_files:
|
54
|
+
- ChangeLog.md
|
55
|
+
- LICENSE.txt
|
56
56
|
- README.md
|
57
57
|
files:
|
58
|
+
- .gitignore
|
58
59
|
- .rspec
|
59
60
|
- .yardopts
|
60
61
|
- ChangeLog.md
|
@@ -105,7 +106,6 @@ files:
|
|
105
106
|
- spec/spec_helper.rb
|
106
107
|
- spec/spidr_spec.rb
|
107
108
|
- spidr.gemspec
|
108
|
-
has_rdoc: yard
|
109
109
|
homepage: http://github.com/postmodern/spidr
|
110
110
|
licenses:
|
111
111
|
- MIT
|
@@ -124,21 +124,22 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
124
124
|
requirements:
|
125
125
|
- - ! '>='
|
126
126
|
- !ruby/object:Gem::Version
|
127
|
-
version:
|
127
|
+
version: '0'
|
128
128
|
requirements: []
|
129
|
-
rubyforge_project:
|
130
|
-
rubygems_version: 1.
|
129
|
+
rubyforge_project:
|
130
|
+
rubygems_version: 1.8.10
|
131
131
|
signing_key:
|
132
132
|
specification_version: 3
|
133
133
|
summary: A versatile Ruby web spidering library
|
134
134
|
test_files:
|
135
|
-
- spec/agent_spec.rb
|
136
135
|
- spec/actions_spec.rb
|
137
|
-
- spec/
|
138
|
-
- spec/extensions/uri_spec.rb
|
136
|
+
- spec/agent_spec.rb
|
139
137
|
- spec/auth_store_spec.rb
|
140
138
|
- spec/cookie_jar_spec.rb
|
139
|
+
- spec/extensions/uri_spec.rb
|
141
140
|
- spec/filters_spec.rb
|
141
|
+
- spec/page_spec.rb
|
142
|
+
- spec/rules_spec.rb
|
142
143
|
- spec/sanitizers_spec.rb
|
143
144
|
- spec/spidr_spec.rb
|
144
|
-
|
145
|
+
has_rdoc:
|