spider_rails 4.0.1 → 4.0.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/lib/spider_rails/common.rb +3 -3
- data/lib/spider_rails/ji_ying.rb +26 -13
- data/lib/spider_rails/version.rb +1 -1
- metadata +2 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 5e182b6084575d3b2ac7e4cc9dcaf9c07b7018fc
|
4
|
+
data.tar.gz: 060df4f018e1bf486c0ac03d923fde72f5cd3f96
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 386ffce6067639a68a264d4fe73d9d2eb398874d4c68f7290fbbf1bfd4163206e3c1e9754f7891b43b390dea38fefcd0674cbac92b7c3fb6bae55ea3fc94544e
|
7
|
+
data.tar.gz: 463612cd49d92066f7c349f4188a9cff34e3e31a69ebeb9ce1ce874e006e1aae8586b3d41a21a323138bcee6fa69a7c706d08105d5762c21a80a86bca1653436
|
data/lib/spider_rails/common.rb
CHANGED
@@ -41,9 +41,9 @@ module Spider
|
|
41
41
|
end
|
42
42
|
|
43
43
|
class << self
|
44
|
-
def open_browser url
|
45
|
-
|
46
|
-
|
44
|
+
def open_browser driver, url
|
45
|
+
#@browser = Watir::Browser.new :chrome, switches: %w( --user-data-dir=/home/zxr/.config/google-chrome)
|
46
|
+
@browser = Watir::Browser.new driver
|
47
47
|
@browser.goto url
|
48
48
|
@browser
|
49
49
|
end
|
data/lib/spider_rails/ji_ying.rb
CHANGED
@@ -6,9 +6,8 @@ module Spider
|
|
6
6
|
@ani = Hash.new
|
7
7
|
@anis = Array.new
|
8
8
|
@page = page
|
9
|
-
@base_url = page.url.
|
10
|
-
|
11
|
-
if @base_url.include?('search')
|
9
|
+
@base_url = page.url.sub(/\d.html$/, '')
|
10
|
+
if @base_url && @base_url.include?('search')
|
12
11
|
@mode = 'search'
|
13
12
|
else
|
14
13
|
@mode = 'normal'
|
@@ -22,8 +21,16 @@ module Spider
|
|
22
21
|
(1..fp).each do |page_num|
|
23
22
|
full_page page_num
|
24
23
|
end
|
25
|
-
|
26
|
-
|
24
|
+
rescue Exception
|
25
|
+
raise %Q(page isn't not exist)
|
26
|
+
end
|
27
|
+
end
|
28
|
+
|
29
|
+
def multi_pages final_page_num
|
30
|
+
begin
|
31
|
+
(1..final_page_num).each do |page_num|
|
32
|
+
full_page page_num
|
33
|
+
end
|
27
34
|
end
|
28
35
|
end
|
29
36
|
|
@@ -40,16 +47,18 @@ module Spider
|
|
40
47
|
case @mode
|
41
48
|
when 'search'
|
42
49
|
@page.goto "#{@base_url}#{page_num}"
|
43
|
-
|
44
|
-
html.css('.ltext').each do |td|
|
45
|
-
single(td)
|
46
|
-
end
|
50
|
+
|
47
51
|
when 'normal'
|
48
52
|
@page.goto "#{@base_url}#{page_num}.html"
|
49
53
|
end
|
54
|
+
html = Nokogiri::HTML.parse @page.html
|
55
|
+
|
56
|
+
html.css('.ltext').each do |td|
|
57
|
+
single(td)
|
58
|
+
end
|
50
59
|
end
|
51
60
|
|
52
|
-
def single element
|
61
|
+
def single element
|
53
62
|
get(element)
|
54
63
|
@anis
|
55
64
|
end
|
@@ -59,9 +68,13 @@ module Spider
|
|
59
68
|
@ani[:torrent] = 'http://bt.ktxp.com' + a['href']
|
60
69
|
end
|
61
70
|
@ani[:title],
|
62
|
-
|
63
|
-
|
64
|
-
@ani
|
71
|
+
@ani[:size],
|
72
|
+
@ani[:finish] = get_content(element, 'a.quick-down+a', 'td.ltext+td', 'td.ltext+td+td+td+td')
|
73
|
+
@anis << @ani
|
74
|
+
end
|
75
|
+
|
76
|
+
def count
|
77
|
+
self.anis.count
|
65
78
|
end
|
66
79
|
|
67
80
|
def get_content(element, *selectors)
|
data/lib/spider_rails/version.rb
CHANGED
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: spider_rails
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 4.0.1
|
4
|
+
version: 4.0.2
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- zhuxingruo
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2013-07-
|
11
|
+
date: 2013-07-20 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: rails
|