rcrawl 0.4.5 → 0.4.6

Sign up to get free protection for your applications and to get access to all the features.
data/Rakefile CHANGED
@@ -18,7 +18,7 @@ end
18
18
 
19
19
  spec = Gem::Specification.new do |s|
20
20
  s.name = "rcrawl"
21
- s.version = "0.4.5"
21
+ s.version = "0.4.6"
22
22
  s.author = "Digital Duckies"
23
23
  s.email = "rcrawl@digitalduckies.net"
24
24
  s.homepage = "http://digitalduckies.net"
@@ -27,6 +27,10 @@ module Rcrawl
27
27
  # Get link
28
28
  url_server
29
29
  next unless robot_safe? @url
30
+ if @url.include? '#'
31
+ print "... Anchor link found, skipping..."
32
+ next
33
+ end
30
34
  # Parse robots.txt, then download document if robot_safe
31
35
  fetch_http(@url)
32
36
  # Store raw HTML in variable to read/reread as needed
@@ -1,5 +1,5 @@
1
1
  module Rcrawl
2
2
  class Crawler
3
- VERSION = "0.4.5"
3
+ VERSION = "0.4.6"
4
4
  end
5
5
  end
metadata CHANGED
@@ -3,7 +3,7 @@ rubygems_version: 0.9.0
3
3
  specification_version: 1
4
4
  name: rcrawl
5
5
  version: !ruby/object:Gem::Version
6
- version: 0.4.5
6
+ version: 0.4.6
7
7
  date: 2006-09-26 00:00:00 -05:00
8
8
  summary: A web crawler written in ruby
9
9
  require_paths: