metainspector 1.9.7 → 1.9.8

Sign up to get free protection for your applications and to get access to all the features.
@@ -170,11 +170,7 @@ module MetaInspector
170
170
  if url =~ /^\w*\:/i
171
171
  url
172
172
  else
173
- if url[0] == "/"
174
- File.join(@root_url, url)
175
- else
176
- File.join(@url, url)
177
- end
173
+ URI.parse(@root_url).merge(url).to_s
178
174
  end
179
175
  end
180
176
 
@@ -1,5 +1,5 @@
1
1
  # -*- encoding: utf-8 -*-
2
2
 
3
3
  module MetaInspector
4
- VERSION = "1.9.7"
4
+ VERSION = "1.9.8"
5
5
  end
@@ -0,0 +1,23 @@
1
+ HTTP/1.1 200 OK
2
+ Date: Mon, 30 May 2011 09:58:20 GMT
3
+ Server: Microsoft-IIS/6.0
4
+ X-Powered-By: PleskWin
5
+ X-Powered-By: ASP.NET
6
+ Cache-Control: private
7
+ Content-Length: 25902
8
+ Content-Type: text/html
9
+ Expires: Sun, 29 May 2011 09:58:18 GMT
10
+ Set-Cookie: ASPSESSIONIDCSBSQADC=AHENHHKBGGDIFJLHHCCJBHMP; path=/
11
+ Cache-control: private
12
+
13
+
14
+
15
+ <html>
16
+ <head>
17
+ <title>Diseño paginas web</title>
18
+ </head>
19
+ <body>
20
+ <a href="index.asp">Index</a>
21
+ <a href="faqs.asp">Faqs</a>
22
+ </body>
23
+ </html>
@@ -5,6 +5,7 @@ require File.join(File.dirname(__FILE__), "/spec_helper")
5
5
  describe MetaInspector do
6
6
  FakeWeb.register_uri(:get, "http://pagerankalert.com", :response => fixture_file("pagerankalert.com.response"))
7
7
  FakeWeb.register_uri(:get, "http://www.alazan.com", :response => fixture_file("alazan.com.response"))
8
+ FakeWeb.register_uri(:get, "http://alazan.com/websolution.asp", :response => fixture_file("alazan_websolution.response"))
8
9
  FakeWeb.register_uri(:get, "http://www.theonion.com/articles/apple-claims-new-iphone-only-visible-to-most-loyal,2772/", :response => fixture_file("theonion.com.response"))
9
10
  FakeWeb.register_uri(:get, "http://theonion-no-description.com", :response => fixture_file("theonion-no-description.com.response"))
10
11
  FakeWeb.register_uri(:get, "http://www.iteh.at", :response => fixture_file("iteh.at.response"))
@@ -141,7 +142,7 @@ describe MetaInspector do
141
142
 
142
143
  it "should get correct absolute links for internal pages" do
143
144
  m = MetaInspector.new('http://w3clove.com/faqs')
144
- m.links.should == [ "http://w3clove.com/faqs/#",
145
+ m.links.should == [ "http://w3clove.com/#",
145
146
  "http://w3clove.com/",
146
147
  "http://w3clove.com/faqs",
147
148
  "http://w3clove.com/plans-and-pricing",
@@ -166,6 +167,12 @@ describe MetaInspector do
166
167
  "http://us4.campaign-archive1.com/home/?u=6af3ab69c286561d0f0f25671&id=04a0dab609" ]
167
168
  end
168
169
 
170
+ it "should get correct absolute links, correcting relative links from URL not ending with slash" do
171
+ m = MetaInspector.new('http://alazan.com/websolution.asp')
172
+ m.links.should == [ "http://alazan.com/index.asp",
173
+ "http://alazan.com/faqs.asp" ]
174
+ end
175
+
169
176
  it "should return empty array if no links found" do
170
177
  m = MetaInspector.new('http://example.com/empty')
171
178
  m.links.should == []
metadata CHANGED
@@ -1,13 +1,13 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: metainspector
3
3
  version: !ruby/object:Gem::Version
4
- hash: 61
4
+ hash: 35
5
5
  prerelease:
6
6
  segments:
7
7
  - 1
8
8
  - 9
9
- - 7
10
- version: 1.9.7
9
+ - 8
10
+ version: 1.9.8
11
11
  platform: ruby
12
12
  authors:
13
13
  - Jaime Iniesta
@@ -154,6 +154,7 @@ files:
154
154
  - samples/basic_scraping.rb
155
155
  - samples/spider.rb
156
156
  - spec/fixtures/alazan.com.response
157
+ - spec/fixtures/alazan_websolution.response
157
158
  - spec/fixtures/empty_page.response
158
159
  - spec/fixtures/guardian.co.uk.response
159
160
  - spec/fixtures/iteh.at.response