tarantula 0.4.1 → 0.4.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/.gitignore +1 -0
- data/.travis.yml +3 -0
- data/CHANGELOG +4 -0
- data/README.rdoc +2 -8
- data/lib/relevance/core_extensions/response.rb +5 -3
- data/lib/relevance/tarantula.rb +0 -8
- data/lib/relevance/tarantula/invalid_html_handler.rb +4 -1
- data/lib/relevance/tarantula/tidy_handler.rb +2 -4
- data/lib/relevance/tarantula/version.rb +1 -1
- data/spec/relevance/core_extensions/file_spec.rb +0 -1
- data/spec/relevance/core_extensions/response_spec.rb +32 -13
- data/spec/relevance/core_extensions/test_case_spec.rb +1 -2
- data/spec/relevance/tarantula/rails_integration_proxy_spec.rb +2 -2
- data/spec/spec_helper.rb +2 -4
- metadata +24 -23
- data/Gemfile.lock +0 -108
data/.gitignore
CHANGED
data/.travis.yml
ADDED
data/CHANGELOG
CHANGED
data/README.rdoc
CHANGED
@@ -11,7 +11,7 @@ Tarantula is a big fuzzy spider. It crawls your Rails 3 application, fuzzing dat
|
|
11
11
|
The latest and greatest version is always available on GitHub. (See the rakefile for dependencies, or
|
12
12
|
just let RubyGems handle it). Add it to your Gemfile as normal:
|
13
13
|
|
14
|
-
gem "tarantula"
|
14
|
+
gem "tarantula"
|
15
15
|
|
16
16
|
=== Crawling Your App
|
17
17
|
|
@@ -124,13 +124,7 @@ The above will crawl your app twice, and each specific crawl will timeout if it
|
|
124
124
|
|
125
125
|
== Bugs/Requests
|
126
126
|
|
127
|
-
Please submit your bug reports, patches, or feature requests
|
128
|
-
|
129
|
-
http://relevance.lighthouseapp.com/projects/17868-tarantula/overview
|
130
|
-
|
131
|
-
You can view the continuous integration results for Tarantula, including results against all supported versions of Rails, on RunCodeRun here:
|
132
|
-
|
133
|
-
http://runcoderun.com/relevance/tarantula
|
127
|
+
Please submit your bug reports, patches, or feature requests in Github Issues.
|
134
128
|
|
135
129
|
== License
|
136
130
|
|
@@ -1,11 +1,13 @@
|
|
1
1
|
# dynamically mixed in to response objects
|
2
2
|
module Relevance
|
3
3
|
module CoreExtensions
|
4
|
-
module Response
|
5
|
-
def html?
|
4
|
+
module Response
|
5
|
+
def html?
|
6
6
|
# some versions of Rails integration tests don't set content type
|
7
7
|
# so we are treating nil as html. A better fix would be welcome here.
|
8
|
-
((
|
8
|
+
(content_type.respond_to?(:html?) ?
|
9
|
+
content_type.html? : content_type =~ %r{^text/html}) ||
|
10
|
+
content_type.nil?
|
9
11
|
end
|
10
12
|
end
|
11
13
|
end
|
data/lib/relevance/tarantula.rb
CHANGED
@@ -1,15 +1,7 @@
|
|
1
|
-
TARANTULA_ROOT = File.expand_path(File.join(File.dirname(__FILE__), "../.."))
|
2
|
-
|
3
1
|
require 'forwardable'
|
4
2
|
require 'erb'
|
5
3
|
require 'active_support'
|
6
4
|
require 'action_controller'
|
7
|
-
# bringing in xss-shield requires a bunch of other dependencies
|
8
|
-
# still not certain about this, if it ruins your world please let me know
|
9
|
-
#xss_shield_path = File.join(TARANTULA_ROOT, %w{vendor xss-shield})
|
10
|
-
#$: << File.join(xss_shield_path, "lib")
|
11
|
-
#require File.join(xss_shield_path, "init")
|
12
|
-
|
13
5
|
require 'htmlentities'
|
14
6
|
|
15
7
|
module Relevance; end
|
@@ -5,7 +5,10 @@ module Relevance
|
|
5
5
|
include Relevance::Tarantula
|
6
6
|
def handle(result)
|
7
7
|
response = result.response
|
8
|
-
|
8
|
+
unless response.html?
|
9
|
+
log "Skipping #{self.class} on url: #{result.url} because response is not html."
|
10
|
+
return
|
11
|
+
end
|
9
12
|
begin
|
10
13
|
body = HTML::Document.new(response.body, true)
|
11
14
|
rescue Exception => e
|
@@ -1,8 +1,6 @@
|
|
1
|
-
require 'rubygems'
|
2
1
|
begin
|
3
|
-
gem 'tidy'
|
4
2
|
require 'tidy'
|
5
|
-
rescue
|
3
|
+
rescue LoadError
|
6
4
|
puts "Tidy gem not available -- 'gem install tidy' to get it."
|
7
5
|
end
|
8
6
|
|
@@ -12,7 +10,7 @@ if defined? Tidy
|
|
12
10
|
module Relevance
|
13
11
|
module Tarantula
|
14
12
|
|
15
|
-
class TidyHandler
|
13
|
+
class TidyHandler
|
16
14
|
include Relevance::Tarantula
|
17
15
|
def initialize(options = {})
|
18
16
|
@options = {:show_warnings=>true}.merge(options)
|
@@ -1,29 +1,48 @@
|
|
1
1
|
require "spec_helper"
|
2
|
-
require 'relevance/core_extensions/file'
|
3
2
|
|
4
3
|
describe "Relevance::CoreExtensions::Response#html?" do
|
5
4
|
before do
|
6
5
|
@response = OpenStruct.new
|
7
6
|
@response.extend(Relevance::CoreExtensions::Response)
|
8
|
-
end
|
9
|
-
|
10
|
-
it "should be html if the content-type is 'text/html'" do
|
11
|
-
@response.content_type = "text/html"
|
12
|
-
@response.should be_html
|
13
|
-
@response.content_type = "text/html;charset=iso-8859-2"
|
14
|
-
@response.should be_html
|
15
7
|
end
|
16
8
|
|
17
|
-
|
18
|
-
|
19
|
-
|
9
|
+
context 'when content_type is a String (Rails 2)' do
|
10
|
+
it "should be html if the content-type is 'text/html'" do
|
11
|
+
@response.content_type = "text/html"
|
12
|
+
@response.should be_html
|
13
|
+
@response.content_type = "text/html;charset=iso-8859-2"
|
14
|
+
@response.should be_html
|
15
|
+
end
|
16
|
+
|
17
|
+
it "should not be html if the content-type isn't an html type" do
|
18
|
+
@response.content_type = "text/plain"
|
19
|
+
@response.should_not be_html
|
20
|
+
@response.content_type = "application/pdf"
|
21
|
+
@response.should_not be_html
|
22
|
+
end
|
20
23
|
end
|
21
24
|
|
22
|
-
|
25
|
+
context 'when content_type is a Mime::Type (Rails 3)' do
|
26
|
+
it "should be html if the content-type is 'text/html'" do
|
27
|
+
@response.content_type = Mime::Type.new("text/html")
|
28
|
+
@response.should be_html
|
29
|
+
@response.content_type = Mime::Type.new("text/html;charset=iso-8859-2")
|
30
|
+
@response.should be_html
|
31
|
+
end
|
32
|
+
|
33
|
+
it "should not be html if the content-type isn't an html type" do
|
34
|
+
@response.content_type = Mime::Type.new("text/plain")
|
35
|
+
@response.should_not be_html
|
36
|
+
@response.content_type = Mime::Type.new("application/pdf")
|
37
|
+
@response.should_not be_html
|
38
|
+
end
|
39
|
+
end
|
40
|
+
|
41
|
+
# better ideas welcome, but be careful not to
|
23
42
|
# castrate tarantula for proxies that don't set the content-type
|
24
43
|
it "should pretend we have html if the content-type is nil" do
|
25
44
|
@response.content_type = nil
|
26
45
|
@response.should be_html
|
27
46
|
end
|
28
|
-
|
47
|
+
|
29
48
|
end
|
@@ -1,5 +1,4 @@
|
|
1
1
|
require "spec_helper"
|
2
|
-
require 'relevance/core_extensions/test_case'
|
3
2
|
|
4
3
|
describe "TestCase extensions" do
|
5
4
|
pending "can create the crawler" do
|
@@ -13,7 +12,7 @@ describe "TestCase extensions" do
|
|
13
12
|
expects(:tarantula_crawler).returns(crawler)
|
14
13
|
tarantula_crawl(:integration_test_stub, :url => "/foo")
|
15
14
|
end
|
16
|
-
|
15
|
+
|
17
16
|
it "should get mixed into ActionController::IntegrationTest" do
|
18
17
|
ActionController::IntegrationTest.ancestors.should include(Relevance::CoreExtensions::TestCaseExtensions)
|
19
18
|
end
|
@@ -57,11 +57,11 @@ describe "Relevance::Tarantula::RailsIntegrationProxy patching" do
|
|
57
57
|
it "patches in Relevance::CoreExtensions::Response" do
|
58
58
|
@rip = Relevance::Tarantula::RailsIntegrationProxy.new(stub)
|
59
59
|
@rip.stubs(:rails_root).returns("faux_rails_root")
|
60
|
-
@response = stub_everything({:code => "404", :headers => {}, :content_type => "text/html"})
|
60
|
+
@response = stub_everything({:code => "404", :headers => {}, :content_type => Mime::Type.new("text/html")})
|
61
61
|
@response.meta.ancestors.should_not include(Relevance::CoreExtensions::Response)
|
62
62
|
@rip.patch_response("/url", @response)
|
63
63
|
@response.meta.ancestors.should include(Relevance::CoreExtensions::Response)
|
64
|
-
@response.
|
64
|
+
@response.should be_html
|
65
65
|
end
|
66
66
|
|
67
67
|
it "replaces 404s with 200s, pulling content from public, for known text types" do
|
data/spec/spec_helper.rb
CHANGED
@@ -1,8 +1,5 @@
|
|
1
|
-
require 'rubygems'
|
2
|
-
lib_path = File.expand_path(File.dirname(__FILE__) + "/../lib")
|
3
|
-
$LOAD_PATH.unshift lib_path unless $LOAD_PATH.include?(lib_path)
|
4
|
-
|
5
1
|
if rails_version = ENV['RAILS_VERSION']
|
2
|
+
require 'rubygems'
|
6
3
|
gem "rails", rails_version
|
7
4
|
end
|
8
5
|
|
@@ -13,6 +10,7 @@ if Rails::VERSION::STRING < "2.3.1" && RUBY_VERSION >= "1.9.1"
|
|
13
10
|
end
|
14
11
|
puts "==== Testing with Rails #{Rails::VERSION::STRING} ===="
|
15
12
|
|
13
|
+
require 'relevance/tarantula'
|
16
14
|
require 'bundler'
|
17
15
|
Bundler.require
|
18
16
|
require 'ostruct'
|
metadata
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: tarantula
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.4.
|
4
|
+
version: 0.4.2
|
5
5
|
prerelease:
|
6
6
|
platform: ruby
|
7
7
|
authors:
|
@@ -9,11 +9,11 @@ authors:
|
|
9
9
|
autorequire:
|
10
10
|
bindir: bin
|
11
11
|
cert_chain: []
|
12
|
-
date:
|
12
|
+
date: 2012-02-20 00:00:00.000000000Z
|
13
13
|
dependencies:
|
14
14
|
- !ruby/object:Gem::Dependency
|
15
15
|
name: htmlentities
|
16
|
-
requirement: &
|
16
|
+
requirement: &70348248358760 !ruby/object:Gem::Requirement
|
17
17
|
none: false
|
18
18
|
requirements:
|
19
19
|
- - ~>
|
@@ -21,10 +21,10 @@ dependencies:
|
|
21
21
|
version: 4.3.0
|
22
22
|
type: :runtime
|
23
23
|
prerelease: false
|
24
|
-
version_requirements: *
|
24
|
+
version_requirements: *70348248358760
|
25
25
|
- !ruby/object:Gem::Dependency
|
26
26
|
name: hpricot
|
27
|
-
requirement: &
|
27
|
+
requirement: &70348248358220 !ruby/object:Gem::Requirement
|
28
28
|
none: false
|
29
29
|
requirements:
|
30
30
|
- - ~>
|
@@ -32,10 +32,10 @@ dependencies:
|
|
32
32
|
version: 0.8.4
|
33
33
|
type: :runtime
|
34
34
|
prerelease: false
|
35
|
-
version_requirements: *
|
35
|
+
version_requirements: *70348248358220
|
36
36
|
- !ruby/object:Gem::Dependency
|
37
37
|
name: rspec
|
38
|
-
requirement: &
|
38
|
+
requirement: &70348248357700 !ruby/object:Gem::Requirement
|
39
39
|
none: false
|
40
40
|
requirements:
|
41
41
|
- - ~>
|
@@ -43,10 +43,10 @@ dependencies:
|
|
43
43
|
version: 2.6.0
|
44
44
|
type: :development
|
45
45
|
prerelease: false
|
46
|
-
version_requirements: *
|
46
|
+
version_requirements: *70348248357700
|
47
47
|
- !ruby/object:Gem::Dependency
|
48
48
|
name: sdoc
|
49
|
-
requirement: &
|
49
|
+
requirement: &70348248357240 !ruby/object:Gem::Requirement
|
50
50
|
none: false
|
51
51
|
requirements:
|
52
52
|
- - ~>
|
@@ -54,10 +54,10 @@ dependencies:
|
|
54
54
|
version: 0.3.0
|
55
55
|
type: :development
|
56
56
|
prerelease: false
|
57
|
-
version_requirements: *
|
57
|
+
version_requirements: *70348248357240
|
58
58
|
- !ruby/object:Gem::Dependency
|
59
59
|
name: sdoc-helpers
|
60
|
-
requirement: &
|
60
|
+
requirement: &70348248356660 !ruby/object:Gem::Requirement
|
61
61
|
none: false
|
62
62
|
requirements:
|
63
63
|
- - ~>
|
@@ -65,10 +65,10 @@ dependencies:
|
|
65
65
|
version: 0.1.4
|
66
66
|
type: :development
|
67
67
|
prerelease: false
|
68
|
-
version_requirements: *
|
68
|
+
version_requirements: *70348248356660
|
69
69
|
- !ruby/object:Gem::Dependency
|
70
70
|
name: rdiscount
|
71
|
-
requirement: &
|
71
|
+
requirement: &70348248356080 !ruby/object:Gem::Requirement
|
72
72
|
none: false
|
73
73
|
requirements:
|
74
74
|
- - ~>
|
@@ -76,10 +76,10 @@ dependencies:
|
|
76
76
|
version: 1.6.8
|
77
77
|
type: :development
|
78
78
|
prerelease: false
|
79
|
-
version_requirements: *
|
79
|
+
version_requirements: *70348248356080
|
80
80
|
- !ruby/object:Gem::Dependency
|
81
81
|
name: log_buddy
|
82
|
-
requirement: &
|
82
|
+
requirement: &70348248339640 !ruby/object:Gem::Requirement
|
83
83
|
none: false
|
84
84
|
requirements:
|
85
85
|
- - ~>
|
@@ -87,10 +87,10 @@ dependencies:
|
|
87
87
|
version: 0.6.0
|
88
88
|
type: :development
|
89
89
|
prerelease: false
|
90
|
-
version_requirements: *
|
90
|
+
version_requirements: *70348248339640
|
91
91
|
- !ruby/object:Gem::Dependency
|
92
92
|
name: mocha
|
93
|
-
requirement: &
|
93
|
+
requirement: &70348248339060 !ruby/object:Gem::Requirement
|
94
94
|
none: false
|
95
95
|
requirements:
|
96
96
|
- - ~>
|
@@ -98,10 +98,10 @@ dependencies:
|
|
98
98
|
version: 0.9.12
|
99
99
|
type: :development
|
100
100
|
prerelease: false
|
101
|
-
version_requirements: *
|
101
|
+
version_requirements: *70348248339060
|
102
102
|
- !ruby/object:Gem::Dependency
|
103
103
|
name: rails
|
104
|
-
requirement: &
|
104
|
+
requirement: &70348248338480 !ruby/object:Gem::Requirement
|
105
105
|
none: false
|
106
106
|
requirements:
|
107
107
|
- - ~>
|
@@ -109,7 +109,7 @@ dependencies:
|
|
109
109
|
version: 3.0.9
|
110
110
|
type: :development
|
111
111
|
prerelease: false
|
112
|
-
version_requirements: *
|
112
|
+
version_requirements: *70348248338480
|
113
113
|
description: A big hairy fuzzy spider that crawls your site, wreaking havoc
|
114
114
|
email:
|
115
115
|
- opensource@thinkrelevance.com
|
@@ -120,10 +120,10 @@ files:
|
|
120
120
|
- .autotest
|
121
121
|
- .gitignore
|
122
122
|
- .rvmrc
|
123
|
+
- .travis.yml
|
123
124
|
- CHANGELOG
|
124
125
|
- DSL_EXAMPLES.md
|
125
126
|
- Gemfile
|
126
|
-
- Gemfile.lock
|
127
127
|
- LICENSE
|
128
128
|
- README.rdoc
|
129
129
|
- Rakefile
|
@@ -224,8 +224,9 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
224
224
|
version: '0'
|
225
225
|
requirements: []
|
226
226
|
rubyforge_project: tarantula
|
227
|
-
rubygems_version: 1.8.
|
227
|
+
rubygems_version: 1.8.15
|
228
228
|
signing_key:
|
229
229
|
specification_version: 3
|
230
230
|
summary: A big hairy fuzzy spider that crawls your site, wreaking havoc
|
231
|
-
test_files:
|
231
|
+
test_files:
|
232
|
+
- template/tarantula_test.rb
|
data/Gemfile.lock
DELETED
@@ -1,108 +0,0 @@
|
|
1
|
-
PATH
|
2
|
-
remote: .
|
3
|
-
specs:
|
4
|
-
relevance/tarantula (0.4.0)
|
5
|
-
hpricot (~> 0.8.4)
|
6
|
-
htmlentities (~> 4.3.0)
|
7
|
-
|
8
|
-
GEM
|
9
|
-
remote: https://rubygems.org/
|
10
|
-
specs:
|
11
|
-
abstract (1.0.0)
|
12
|
-
actionmailer (3.0.10)
|
13
|
-
actionpack (= 3.0.10)
|
14
|
-
mail (~> 2.2.19)
|
15
|
-
actionpack (3.0.10)
|
16
|
-
activemodel (= 3.0.10)
|
17
|
-
activesupport (= 3.0.10)
|
18
|
-
builder (~> 2.1.2)
|
19
|
-
erubis (~> 2.6.6)
|
20
|
-
i18n (~> 0.5.0)
|
21
|
-
rack (~> 1.2.1)
|
22
|
-
rack-mount (~> 0.6.14)
|
23
|
-
rack-test (~> 0.5.7)
|
24
|
-
tzinfo (~> 0.3.23)
|
25
|
-
activemodel (3.0.10)
|
26
|
-
activesupport (= 3.0.10)
|
27
|
-
builder (~> 2.1.2)
|
28
|
-
i18n (~> 0.5.0)
|
29
|
-
activerecord (3.0.10)
|
30
|
-
activemodel (= 3.0.10)
|
31
|
-
activesupport (= 3.0.10)
|
32
|
-
arel (~> 2.0.10)
|
33
|
-
tzinfo (~> 0.3.23)
|
34
|
-
activeresource (3.0.10)
|
35
|
-
activemodel (= 3.0.10)
|
36
|
-
activesupport (= 3.0.10)
|
37
|
-
activesupport (3.0.10)
|
38
|
-
arel (2.0.10)
|
39
|
-
builder (2.1.2)
|
40
|
-
diff-lcs (1.1.2)
|
41
|
-
erubis (2.6.6)
|
42
|
-
abstract (>= 1.0.0)
|
43
|
-
hpricot (0.8.4)
|
44
|
-
htmlentities (4.3.0)
|
45
|
-
i18n (0.5.0)
|
46
|
-
json (1.5.3)
|
47
|
-
log_buddy (0.6.0)
|
48
|
-
mail (2.2.19)
|
49
|
-
activesupport (>= 2.3.6)
|
50
|
-
i18n (>= 0.4.0)
|
51
|
-
mime-types (~> 1.16)
|
52
|
-
treetop (~> 1.4.8)
|
53
|
-
mime-types (1.16)
|
54
|
-
mocha (0.9.12)
|
55
|
-
polyglot (0.3.2)
|
56
|
-
rack (1.2.3)
|
57
|
-
rack-mount (0.6.14)
|
58
|
-
rack (>= 1.0.0)
|
59
|
-
rack-test (0.5.7)
|
60
|
-
rack (>= 1.0)
|
61
|
-
rails (3.0.10)
|
62
|
-
actionmailer (= 3.0.10)
|
63
|
-
actionpack (= 3.0.10)
|
64
|
-
activerecord (= 3.0.10)
|
65
|
-
activeresource (= 3.0.10)
|
66
|
-
activesupport (= 3.0.10)
|
67
|
-
bundler (~> 1.0)
|
68
|
-
railties (= 3.0.10)
|
69
|
-
railties (3.0.10)
|
70
|
-
actionpack (= 3.0.10)
|
71
|
-
activesupport (= 3.0.10)
|
72
|
-
rake (>= 0.8.7)
|
73
|
-
rdoc (~> 3.4)
|
74
|
-
thor (~> 0.14.4)
|
75
|
-
rake (0.9.2)
|
76
|
-
rdiscount (1.6.8)
|
77
|
-
rdoc (3.9.2)
|
78
|
-
rspec (2.6.0)
|
79
|
-
rspec-core (~> 2.6.0)
|
80
|
-
rspec-expectations (~> 2.6.0)
|
81
|
-
rspec-mocks (~> 2.6.0)
|
82
|
-
rspec-core (2.6.4)
|
83
|
-
rspec-expectations (2.6.0)
|
84
|
-
diff-lcs (~> 1.1.2)
|
85
|
-
rspec-mocks (2.6.0)
|
86
|
-
sdoc (0.3.0)
|
87
|
-
json (>= 1.1.3)
|
88
|
-
rdoc (~> 3)
|
89
|
-
sdoc-helpers (0.1.4)
|
90
|
-
sdoc (~> 0.2)
|
91
|
-
thor (0.14.6)
|
92
|
-
treetop (1.4.10)
|
93
|
-
polyglot
|
94
|
-
polyglot (>= 0.3.1)
|
95
|
-
tzinfo (0.3.29)
|
96
|
-
|
97
|
-
PLATFORMS
|
98
|
-
ruby
|
99
|
-
|
100
|
-
DEPENDENCIES
|
101
|
-
log_buddy (~> 0.6.0)
|
102
|
-
mocha (~> 0.9.12)
|
103
|
-
rails (~> 3.0.9)
|
104
|
-
rdiscount (~> 1.6.8)
|
105
|
-
relevance/tarantula!
|
106
|
-
rspec (~> 2.6.0)
|
107
|
-
sdoc (~> 0.3.0)
|
108
|
-
sdoc-helpers (~> 0.1.4)
|