spider_rails 4.0.1 → 4.0.2
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/lib/spider_rails/common.rb +3 -3
- data/lib/spider_rails/ji_ying.rb +26 -13
- data/lib/spider_rails/version.rb +1 -1
- metadata +2 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 5e182b6084575d3b2ac7e4cc9dcaf9c07b7018fc
|
4
|
+
data.tar.gz: 060df4f018e1bf486c0ac03d923fde72f5cd3f96
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 386ffce6067639a68a264d4fe73d9d2eb398874d4c68f7290fbbf1bfd4163206e3c1e9754f7891b43b390dea38fefcd0674cbac92b7c3fb6bae55ea3fc94544e
|
7
|
+
data.tar.gz: 463612cd49d92066f7c349f4188a9cff34e3e31a69ebeb9ce1ce874e006e1aae8586b3d41a21a323138bcee6fa69a7c706d08105d5762c21a80a86bca1653436
|
data/lib/spider_rails/common.rb
CHANGED
@@ -41,9 +41,9 @@ module Spider
|
|
41
41
|
end
|
42
42
|
|
43
43
|
class << self
|
44
|
-
def open_browser url
|
45
|
-
|
46
|
-
|
44
|
+
def open_browser driver, url
|
45
|
+
#@browser = Watir::Browser.new :chrome, switches: %w( --user-data-dir=/home/zxr/.config/google-chrome)
|
46
|
+
@browser = Watir::Browser.new driver
|
47
47
|
@browser.goto url
|
48
48
|
@browser
|
49
49
|
end
|
data/lib/spider_rails/ji_ying.rb
CHANGED
@@ -6,9 +6,8 @@ module Spider
|
|
6
6
|
@ani = Hash.new
|
7
7
|
@anis = Array.new
|
8
8
|
@page = page
|
9
|
-
@base_url = page.url.
|
10
|
-
|
11
|
-
if @base_url.include?('search')
|
9
|
+
@base_url = page.url.sub(/\d.html$/, '')
|
10
|
+
if @base_url && @base_url.include?('search')
|
12
11
|
@mode = 'search'
|
13
12
|
else
|
14
13
|
@mode = 'normal'
|
@@ -22,8 +21,16 @@ module Spider
|
|
22
21
|
(1..fp).each do |page_num|
|
23
22
|
full_page page_num
|
24
23
|
end
|
25
|
-
|
26
|
-
|
24
|
+
rescue Exception
|
25
|
+
raise %Q(page isn't not exist)
|
26
|
+
end
|
27
|
+
end
|
28
|
+
|
29
|
+
def multi_pages final_page_num
|
30
|
+
begin
|
31
|
+
(1..final_page_num).each do |page_num|
|
32
|
+
full_page page_num
|
33
|
+
end
|
27
34
|
end
|
28
35
|
end
|
29
36
|
|
@@ -40,16 +47,18 @@ module Spider
|
|
40
47
|
case @mode
|
41
48
|
when 'search'
|
42
49
|
@page.goto "#{@base_url}#{page_num}"
|
43
|
-
|
44
|
-
html.css('.ltext').each do |td|
|
45
|
-
sing le(td)
|
46
|
-
end
|
50
|
+
|
47
51
|
when 'normal'
|
48
52
|
@page.goto "#{@base_url}#{page_num}.html"
|
49
53
|
end
|
54
|
+
html = Nokogiri::HTML.parse @page.html
|
55
|
+
|
56
|
+
html.css('.ltext').each do |td|
|
57
|
+
single(td)
|
58
|
+
end
|
50
59
|
end
|
51
60
|
|
52
|
-
def single element
|
61
|
+
def single element
|
53
62
|
get(element)
|
54
63
|
@anis
|
55
64
|
end
|
@@ -59,9 +68,13 @@ module Spider
|
|
59
68
|
@ani[:torrent] = 'http://bt.ktxp.com' + a['href']
|
60
69
|
end
|
61
70
|
@ani[:title],
|
62
|
-
|
63
|
-
|
64
|
-
@ani
|
71
|
+
@ani[:size],
|
72
|
+
@ani[:finish] = get_content(element, 'a.quick-down+a', 'td.ltext+td', 'td.ltext+td+td+td+td')
|
73
|
+
@anis << @ani
|
74
|
+
end
|
75
|
+
|
76
|
+
def count
|
77
|
+
self.anis.count
|
65
78
|
end
|
66
79
|
|
67
80
|
def get_content(element, *selectors)
|
data/lib/spider_rails/version.rb
CHANGED
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: spider_rails
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 4.0.1
|
4
|
+
version: 4.0.2
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- zhuxingruo
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2013-07-
|
11
|
+
date: 2013-07-20 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: rails
|