spider_rails 4.0.1 → 4.0.2

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA1:
3
- metadata.gz: 45eb0723b5f87fe4d47fe672b0731b2b023a6c9c
4
- data.tar.gz: 7c08ae9a4ba6499bcda5b4c01038a0695e378d39
3
+ metadata.gz: 5e182b6084575d3b2ac7e4cc9dcaf9c07b7018fc
4
+ data.tar.gz: 060df4f018e1bf486c0ac03d923fde72f5cd3f96
5
5
  SHA512:
6
- metadata.gz: 61551419495a9dd7cd11cdb81a81e8a79fc5d0dd8e840ac7dbc3eb292979911e5f626e933c1a9f704cba42cd14933a3e5f756aab4f1c40ddb9cbeb96dc435f61
7
- data.tar.gz: aa82ef9627e5661cdb32e4face134711249599dcde520238982469aa089cbbfb6d0fcecf13a3bf7f02556f905244b20e34b9f96836eed55dda31f15304e0b2b8
6
+ metadata.gz: 386ffce6067639a68a264d4fe73d9d2eb398874d4c68f7290fbbf1bfd4163206e3c1e9754f7891b43b390dea38fefcd0674cbac92b7c3fb6bae55ea3fc94544e
7
+ data.tar.gz: 463612cd49d92066f7c349f4188a9cff34e3e31a69ebeb9ce1ce874e006e1aae8586b3d41a21a323138bcee6fa69a7c706d08105d5762c21a80a86bca1653436
@@ -41,9 +41,9 @@ module Spider
41
41
  end
42
42
 
43
43
  class << self
44
- def open_browser url
45
- @browser = Watir::Browser.new :chrome, switches: %w( --user-data-dir=/home/zxr/.config/google-chrome)
46
- #@browser = Watir::Browser.new :chrome
44
+ def open_browser driver, url
45
+ #@browser = Watir::Browser.new :chrome, switches: %w( --user-data-dir=/home/zxr/.config/google-chrome)
46
+ @browser = Watir::Browser.new driver
47
47
  @browser.goto url
48
48
  @browser
49
49
  end
@@ -6,9 +6,8 @@ module Spider
6
6
  @ani = Hash.new
7
7
  @anis = Array.new
8
8
  @page = page
9
- @base_url = page.url.gsub!(/\b\d(.html)?/, '')
10
-
11
- if @base_url.include?('search')
9
+ @base_url = page.url.sub(/\d.html$/, '')
10
+ if @base_url && @base_url.include?('search')
12
11
  @mode = 'search'
13
12
  else
14
13
  @mode = 'normal'
@@ -22,8 +21,16 @@ module Spider
22
21
  (1..fp).each do |page_num|
23
22
  full_page page_num
24
23
  end
25
- #rescue Exception
26
- # raise %Q(page isn't not exist)
24
+ rescue Exception
25
+ raise %Q(page isn't not exist)
26
+ end
27
+ end
28
+
29
+ def multi_pages final_page_num
30
+ begin
31
+ (1..final_page_num).each do |page_num|
32
+ full_page page_num
33
+ end
27
34
  end
28
35
  end
29
36
 
@@ -40,16 +47,18 @@ module Spider
40
47
  case @mode
41
48
  when 'search'
42
49
  @page.goto "#{@base_url}#{page_num}"
43
- html = Nokogiri::HTML.parse @page.html
44
- html.css('.ltext').each do |td|
45
- sing le(td)
46
- end
50
+
47
51
  when 'normal'
48
52
  @page.goto "#{@base_url}#{page_num}.html"
49
53
  end
54
+ html = Nokogiri::HTML.parse @page.html
55
+
56
+ html.css('.ltext').each do |td|
57
+ single(td)
58
+ end
50
59
  end
51
60
 
52
- def single element, &block
61
+ def single element
53
62
  get(element)
54
63
  @anis
55
64
  end
@@ -59,9 +68,13 @@ module Spider
59
68
  @ani[:torrent] = 'http://bt.ktxp.com' + a['href']
60
69
  end
61
70
  @ani[:title],
62
- @ani[:size],
63
- @ani[:finish] = get_content(element, 'a.quick-down+a', 'td.ltext+td', 'td.ltext+td+td+td+td')
64
- @ani
71
+ @ani[:size],
72
+ @ani[:finish] = get_content(element, 'a.quick-down+a', 'td.ltext+td', 'td.ltext+td+td+td+td')
73
+ @anis << @ani
74
+ end
75
+
76
+ def count
77
+ self.anis.count
65
78
  end
66
79
 
67
80
  def get_content(element, *selectors)
@@ -1,3 +1,3 @@
1
1
  module SpiderRails
2
- VERSION = "4.0.1"
2
+ VERSION = "4.0.2"
3
3
  end
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: spider_rails
3
3
  version: !ruby/object:Gem::Version
4
- version: 4.0.1
4
+ version: 4.0.2
5
5
  platform: ruby
6
6
  authors:
7
7
  - zhuxingruo
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2013-07-18 00:00:00.000000000 Z
11
+ date: 2013-07-20 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: rails