flyerhzm-regexp_crawler 0.7.0 → 0.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
data/VERSION CHANGED
@@ -1 +1 @@
1
- 0.7.0
1
+ 0.8.0
@@ -51,7 +51,7 @@ module RegexpCrawler
51
51
  if response.is_a? Net::HTTPSuccess
52
52
  if continue_regexp
53
53
  response_body.scan(continue_regexp).each do |page|
54
- page = page.first if page.is_a? Array
54
+ page = page.compact.first if page.is_a? Array
55
55
  continue_uri = continue_uri(uri, page)
56
56
  @pages << continue_uri unless @captured_pages.include?(continue_uri) or @pages.include?(continue_uri)
57
57
  end
@@ -1,6 +1,8 @@
1
1
  require 'net/http'
2
2
  require 'uri'
3
+ require 'iconv'
3
4
  require 'regexp_crawler/http'
5
+ require 'regexp_crawler/crawler'
4
6
 
5
7
  module RegexpCrawler
6
8
 
@@ -5,11 +5,11 @@
5
5
 
6
6
  Gem::Specification.new do |s|
7
7
  s.name = %q{regexp_crawler}
8
- s.version = "0.7.0"
8
+ s.version = "0.8.0"
9
9
 
10
10
  s.required_rubygems_version = Gem::Requirement.new(">= 0") if s.respond_to? :required_rubygems_version=
11
11
  s.authors = ["Richard Huang"]
12
- s.date = %q{2009-08-30}
12
+ s.date = %q{2009-09-01}
13
13
  s.description = %q{RegexpCrawler is a Ruby library for crawl data from website using regular expression.}
14
14
  s.email = %q{flyerhzm@gmail.com}
15
15
  s.extra_rdoc_files = [
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: flyerhzm-regexp_crawler
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.7.0
4
+ version: 0.8.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Richard Huang
@@ -9,7 +9,7 @@ autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
11
 
12
- date: 2009-08-30 00:00:00 -07:00
12
+ date: 2009-09-01 00:00:00 -07:00
13
13
  default_executable:
14
14
  dependencies: []
15
15