simplecrawler 0.1.3 → 0.1.4

Sign up to get free protection for your applications and to get access to all the features.
data/lib/simplecrawler.rb CHANGED
@@ -23,7 +23,7 @@ module SimpleCrawler
23
23
  require File.dirname(__FILE__) + '/document'
24
24
 
25
25
  MARKUP_MIME_TYPES = ["text/html", "text/xml", "application/xml", "application/xhtml+xml"]
26
- VERSION = "0.1.3"
26
+ VERSION = "0.1.4"
27
27
 
28
28
  class Crawler
29
29
 
@@ -103,7 +103,7 @@ module SimpleCrawler
103
103
  doc = Document.new
104
104
  begin
105
105
  uri = @site_uri.clone
106
- uri.path = uri.path + path if path != "/"
106
+ uri.path = path if path != "/"
107
107
  doc.uri = uri
108
108
 
109
109
  log("Trying #{uri}")
@@ -12,8 +12,14 @@ class SimpleCrawlerTest < Test::Unit::TestCase
12
12
  def test_initialize_crawler
13
13
  @crawler = SimpleCrawler::Crawler.new("http://www.example.com/")
14
14
  assert @crawler.queue.length == 1
15
+ assert_equal "/", @crawler.queue[0]
15
16
  end
16
17
 
18
+ def test_initialize_crawler_with_path
19
+ @crawler = SimpleCrawler::Crawler.new("http://www.example.com/deep/down/in/hierarchy/")
20
+ assert @crawler.queue.length == 1
21
+ assert_equal "/deep/down/in/hierarchy/", @crawler.queue[0]
22
+ end
17
23
 
18
24
  def test_initialize_crawler_without_uri_path
19
25
  @crawler = SimpleCrawler::Crawler.new("http://www.example.com")
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: simplecrawler
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.1.3
4
+ version: 0.1.4
5
5
  platform: ruby
6
6
  authors:
7
7
  - Peter Krantz
@@ -9,7 +9,7 @@ autorequire: simplecrawler
9
9
  bindir: bin
10
10
  cert_chain: []
11
11
 
12
- date: 2008-01-26 00:00:00 +01:00
12
+ date: 2008-09-17 00:00:00 +02:00
13
13
  default_executable:
14
14
  dependencies:
15
15
  - !ruby/object:Gem::Dependency