get_proxy_list 0.0.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml ADDED
@@ -0,0 +1,15 @@
1
+ ---
2
+ !binary "U0hBMQ==":
3
+ metadata.gz: !binary |-
4
+ NjZiNTkyNWI3NjJmMTE4MjEwYjU0YzY2ZDllMWVlOTA0N2E5ZTQ2MA==
5
+ data.tar.gz: !binary |-
6
+ ODliZWIwYzhhYWNmOGRiOWQwZmY2MGI4ODhhNTY3ZWJlNmZkOTA3NQ==
7
+ !binary "U0hBNTEy":
8
+ metadata.gz: !binary |-
9
+ YzczYWY5NTM2ODQyYTUwZGFlOTRkZjg5YjNiYTc2ODJlNTFjMWI4YTVhZjY1
10
+ MjAwZjJhOTg3MGZkOWE2YmYyMWYzZTQzMmQxMTc5ODlmZDFiM2FlM2QyODdl
11
+ NTlhMGFlODJkZTU1ZjQ5YjczMmZiMzg4OWQwNzBhYTQwN2VlNmI=
12
+ data.tar.gz: !binary |-
13
+ OGQ0MTczZjIwODAzZjY4ZDBmYTlkMGFhY2VhNmFjM2YzOGMzNjYxZDdlMGU5
14
+ ZDljM2EyN2YxMDFlMjE4ZWY0MDUyNGQxMjQ5ZDQwNWVjYWM2MWQ1MTVjZmZi
15
+ ZTlkNzY3ZWZhMzM0YzMzMTEyNDU2MzU0ZDlhMWUwZTkzNTU2YzA=
data/.gitignore ADDED
@@ -0,0 +1,17 @@
1
+ *.gem
2
+ *.rbc
3
+ .bundle
4
+ .config
5
+ .yardoc
6
+ Gemfile.lock
7
+ InstalledFiles
8
+ _yardoc
9
+ coverage
10
+ doc/
11
+ lib/bundler/man
12
+ pkg
13
+ rdoc
14
+ spec/reports
15
+ test/tmp
16
+ test/version_tmp
17
+ tmp
data/Gemfile ADDED
@@ -0,0 +1,6 @@
1
+ source 'https://rubygems.org'
2
+
3
+ # Specify your gem's dependencies in get_proxy_list.gemspec
4
+ gem 'nokogiri'
5
+ gemspec
6
+
data/LICENSE.txt ADDED
@@ -0,0 +1,22 @@
1
+ Copyright (c) 2013 hahazql
2
+
3
+ MIT License
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining
6
+ a copy of this software and associated documentation files (the
7
+ "Software"), to deal in the Software without restriction, including
8
+ without limitation the rights to use, copy, modify, merge, publish,
9
+ distribute, sublicense, and/or sell copies of the Software, and to
10
+ permit persons to whom the Software is furnished to do so, subject to
11
+ the following conditions:
12
+
13
+ The above copyright notice and this permission notice shall be
14
+ included in all copies or substantial portions of the Software.
15
+
16
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
17
+ EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
18
+ MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
19
+ NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
20
+ LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
21
+ OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
22
+ WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
data/README.md ADDED
@@ -0,0 +1,29 @@
1
+ # GetProxyList
2
+
3
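+ Collects HTTP proxy addresses from the listing pages of cnproxy.com and keeps only the proxies that respond within a given time limit.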
4
+
5
+ ## Installation
6
+
7
+ Add this line to your application's Gemfile:
8
+
9
+ gem 'get_proxy_list'
10
+
11
+ And then execute:
12
+
13
+ $ bundle
14
+
15
+ Or install it yourself as:
16
+
17
+ $ gem install get_proxy_list
18
+
19
+ ## Usage
20
+
21
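+ Call `GetProxyList.get_list(limit, page)`, where `limit` is the maximum response time in seconds and `page` is the number of listing pages to scan; it returns an array of proxy URLs such as `http://1.2.3.4:8080`.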
22
+
23
+ ## Contributing
24
+
25
+ 1. Fork it
26
+ 2. Create your feature branch (`git checkout -b my-new-feature`)
27
+ 3. Commit your changes (`git commit -am 'Add some feature'`)
28
+ 4. Push to the branch (`git push origin my-new-feature`)
29
+ 5. Create new Pull Request
data/Rakefile ADDED
@@ -0,0 +1 @@
1
+ require "bundler/gem_tasks"
@@ -0,0 +1,23 @@
1
+ # coding: utf-8
2
+ lib = File.expand_path('../lib', __FILE__)
3
+ $LOAD_PATH.unshift(lib) unless $LOAD_PATH.include?(lib)
4
+ require 'get_proxy_list/version'
5
+
6
# Gem specification for get_proxy_list.
Gem::Specification.new do |spec|
  spec.name          = "get_proxy_list"
  spec.version       = GetProxyList::VERSION
  spec.authors       = ["hahazql"]
  spec.email         = ["hahazhouqunli@gmail.com"]
  spec.description   = %q{use for get a proxy list}
  spec.summary       = %q{use for get a proxy list}
  spec.homepage      = ""
  spec.license       = "MIT"

  # Package every file tracked by git; executables and test files are
  # derived from that list by path prefix.
  spec.files         = `git ls-files`.split($/)
  spec.executables   = spec.files.grep(%r{^bin/}) { |f| File.basename(f) }
  spec.test_files    = spec.files.grep(%r{^(test|spec|features)/})
  spec.require_paths = ["lib"]

  # The library files `require 'nokogiri'` when they are loaded, so it has to
  # be a runtime dependency; otherwise installing the gem alone leaves it
  # unable to load.
  spec.add_dependency "nokogiri"

  spec.add_development_dependency "bundler", "~> 1.3"
  spec.add_development_dependency "rake"
end
@@ -0,0 +1,55 @@
1
+ require 'nokogiri'
2
+
3
require 'open-uri'
require 'timeout'

module GetProxyList
  # Filters candidate proxies by how quickly a known page can be fetched
  # through each of them.
  class Base
    # Page requested through every proxy in order to time it.
    PROBE_URL = "http://www.baidu.com"

    attr_writer :save_path

    # @param save_path [String, nil] path stored on the instance; when omitted
    #   it defaults to "proxylist" resolved relative to this file.
    def initialize(save_path = nil)
      @save_path = save_path || File.expand_path("../proxylist", __FILE__)
    end

    # Returns the proxies that answer within the time limit.
    #
    # @param limit [Numeric] time limit in seconds
    # @param proxylist [Array<Hash>] proxies to filter; each entry carries an
    #   ip and a port under either symbol (:ip/:port) or string ("ip"/"port")
    #   keys
    # @return [Array<String>] "http://ip:port" URLs of the proxies whose probe
    #   succeeded in less than +limit+ seconds
    def get_proxy_in_time_limit(limit, proxylist)
      proxylist.each_with_object([]) do |proxy, limit_list|
        url = proxy_url(proxy)
        time_use = measure_fetch(url, limit)
        limit_list << url if time_use && time_use < limit
      end
    end

    private

    # Builds the proxy URL from an entry, accepting symbol or string keys
    # (the scraper in this gem produces symbol keys).
    def proxy_url(proxy)
      ip = proxy[:ip] || proxy["ip"]
      port = proxy[:port] || proxy["port"]
      "http://#{ip}:#{port}"
    end

    # Times one probe through +url+. Returns the elapsed seconds as a Float,
    # or nil when the probe failed or timed out.
    def measure_fetch(url, limit)
      started = Time.now
      # The hard cut-off is one second above the limit, as in the original
      # code; anything slower than the limit is rejected by the caller anyway.
      Timeout.timeout(limit + 1) { fetch_through(url) }
      time_use = Time.now - started
      p "#{url} use_time:#{time_use}"
      time_use
    rescue Errno::ETIMEDOUT, Timeout::Error
      p "Use #{url} timeout"
      nil
    rescue Errno::ECONNREFUSED
      p "Use #{url} Error connection"
      nil
    rescue StandardError => e
      # StandardError rather than Exception, so Interrupt/SystemExit still
      # stop the run instead of being logged as a bad proxy.
      p "Use #{url} Error:#{e.to_s}"
      nil
    end

    # Fetches and parses the probe page through the given proxy. The block
    # form closes the downloaded stream as soon as parsing is done.
    def fetch_through(url)
      URI.parse(PROBE_URL).open(:proxy => url) { |page| Nokogiri::HTML(page) }
    end
  end
end
@@ -0,0 +1,61 @@
1
+ require 'nokogiri'
2
+
3
+
4
require 'open-uri'

module GetProxyList
  # Collects proxy addresses from the numbered listing pages of cnproxy.com.
  class FromProxyCn
    include GetProxyList

    # Text of the header cell of the address column; such rows are skipped.
    HEADER_CELL = "IP:Port"

    attr_reader :site

    def initialize
      @site = "http://www.cnproxy.com"
    end

    # Gets the proxy list from one listing page.
    #
    # @param url [String] address of the listing page
    # @return [Array<Hash>] one { ip: String, port: String } hash per table
    #   row whose first cell contains an "ip:port" address
    # @raise [RuntimeError] wrapping any StandardError raised while the page
    #   is fetched or parsed
    def _getproxylist(url)
      proxylist = first_cell_texts(url).map { |text| parse_proxy_cell(text) }.compact
      p "ProxyList: #{proxylist}"
      proxylist
    rescue => err
      raise "Get Proxy list Error! Class:'FromProxyCn' Gem:'get_proxy_list' Error:'#{err.to_s}'"
    end

    # Builds the list of listing-page URLs for the requested number of pages.
    #
    # @param page [#to_i] number of pages to fetch
    # @return [Array<String>] "<site>/proxy1.html" .. "<site>/proxyN.html"
    def get_url_list(page)
      (1..page.to_i).map { |number| "#{@site}/proxy#{number}.html" }
    end

    # Gets the proxies from the first +page+ listing pages, without duplicates.
    #
    # @param page [#to_i] number of pages to fetch
    # @return [Array<Hash>] union of the per-page results
    def get_proxylist(page)
      get_url_list(page).inject([]) { |proxylist, url| proxylist | _getproxylist(url) }
    end

    private

    # Downloads +url+ and returns the text of the first <td> of every table
    # row that has one. The block form closes the download stream.
    def first_cell_texts(url)
      doc = URI.parse(url).open { |page| Nokogiri::HTML(page) }
      doc.css('table tr').map { |row| row.css('td').first }.compact.map(&:text)
    end

    # Turns the text of an address cell into { ip:, port: }; returns nil for
    # the header row, blank cells, and cells without both parts.
    #
    # NOTE(review): anything from "document.write" onwards is discarded, as the
    # original code attempted. If the site emits the port only through that
    # script call, such rows have no port here and are dropped -- confirm
    # against the live markup.
    def parse_proxy_cell(text)
      address = text.split("document.write").first.to_s.strip
      return if address.empty? || address == HEADER_CELL

      ip, port = address.split(":", 2)
      return if ip.to_s.empty? || port.to_s.empty?

      p "Proxy: #{address}"
      { ip: ip, port: port }
    end
  end
end
@@ -0,0 +1,7 @@
1
+
2
+
3
module GetProxyList
  # Empty placeholder class; it defines no methods of its own.
  # NOTE(review): the name differs from FromProxyCn only in letter case and
  # looks like a leftover file -- confirm before relying on it.
  class FromProxycn; end
end
@@ -0,0 +1,3 @@
1
module GetProxyList
  # Gem version string. Frozen so the constant cannot be mutated in place.
  VERSION = "0.0.2".freeze
end
@@ -0,0 +1,14 @@
1
+ require 'get_proxy_list'
2
+ require "get_proxy_list/version"
3
+ require "get_proxy_list/from_proxy_cn"
4
+ require "get_proxy_list/base"
5
+
6
module GetProxyList
  # Scrapes candidate proxies and keeps those that pass the timing check.
  #
  # @param limit passed to Base#get_proxy_in_time_limit as the time limit
  # @param page passed to FromProxyCn#get_proxylist as the number of pages
  # @return whatever Base#get_proxy_in_time_limit returns for the scraped list
  def self.get_list(limit, page)
    source = FromProxyCn.new
    checker = Base.new
    checker.get_proxy_in_time_limit(limit, source.get_proxylist(page))
  end
end
metadata ADDED
@@ -0,0 +1,84 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: get_proxy_list
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.0.2
5
+ platform: ruby
6
+ authors:
7
+ - hahazql
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+ date: 2013-05-30 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ name: bundler
15
+ requirement: !ruby/object:Gem::Requirement
16
+ requirements:
17
+ - - ~>
18
+ - !ruby/object:Gem::Version
19
+ version: '1.3'
20
+ type: :development
21
+ prerelease: false
22
+ version_requirements: !ruby/object:Gem::Requirement
23
+ requirements:
24
+ - - ~>
25
+ - !ruby/object:Gem::Version
26
+ version: '1.3'
27
+ - !ruby/object:Gem::Dependency
28
+ name: rake
29
+ requirement: !ruby/object:Gem::Requirement
30
+ requirements:
31
+ - - ! '>='
32
+ - !ruby/object:Gem::Version
33
+ version: '0'
34
+ type: :development
35
+ prerelease: false
36
+ version_requirements: !ruby/object:Gem::Requirement
37
+ requirements:
38
+ - - ! '>='
39
+ - !ruby/object:Gem::Version
40
+ version: '0'
41
+ description: use for get a proxy list
42
+ email:
43
+ - hahazhouqunli@gmail.com
44
+ executables: []
45
+ extensions: []
46
+ extra_rdoc_files: []
47
+ files:
48
+ - .gitignore
49
+ - Gemfile
50
+ - LICENSE.txt
51
+ - README.md
52
+ - Rakefile
53
+ - get_proxy_list.gemspec
54
+ - lib/get_proxy_list.rb
55
+ - lib/get_proxy_list/base.rb
56
+ - lib/get_proxy_list/from_proxy_cn.rb
57
+ - lib/get_proxy_list/from_proxycn.rb
58
+ - lib/get_proxy_list/version.rb
59
+ homepage: ''
60
+ licenses:
61
+ - MIT
62
+ metadata: {}
63
+ post_install_message:
64
+ rdoc_options: []
65
+ require_paths:
66
+ - lib
67
+ required_ruby_version: !ruby/object:Gem::Requirement
68
+ requirements:
69
+ - - ! '>='
70
+ - !ruby/object:Gem::Version
71
+ version: '0'
72
+ required_rubygems_version: !ruby/object:Gem::Requirement
73
+ requirements:
74
+ - - ! '>='
75
+ - !ruby/object:Gem::Version
76
+ version: '0'
77
+ requirements: []
78
+ rubyforge_project:
79
+ rubygems_version: 2.0.0
80
+ signing_key:
81
+ specification_version: 4
82
+ summary: use for get a proxy list
83
+ test_files: []
84
+ has_rdoc: