proxy_fetcher 0.11.0 → 0.15.1

Sign up to get free protection for your applications and to get access to all the features.
Files changed (39) hide show
  1. checksums.yaml +4 -4
  2. data/CHANGELOG.md +32 -1
  3. data/Gemfile +4 -2
  4. data/Rakefile +3 -1
  5. data/gemfiles/nokogiri.gemfile +1 -1
  6. data/gemfiles/oga.gemfile +2 -2
  7. data/lib/proxy_fetcher.rb +42 -31
  8. data/lib/proxy_fetcher/client/request.rb +3 -3
  9. data/lib/proxy_fetcher/configuration.rb +13 -9
  10. data/lib/proxy_fetcher/document/node.rb +1 -1
  11. data/lib/proxy_fetcher/manager.rb +40 -7
  12. data/lib/proxy_fetcher/providers/base.rb +2 -1
  13. data/lib/proxy_fetcher/providers/free_proxy_list.rb +0 -21
  14. data/lib/proxy_fetcher/providers/free_proxy_list_socks.rb +58 -0
  15. data/lib/proxy_fetcher/providers/free_proxy_list_ssl.rb +1 -0
  16. data/lib/proxy_fetcher/providers/free_proxy_list_us.rb +54 -0
  17. data/lib/proxy_fetcher/providers/mtpro.rb +43 -0
  18. data/lib/proxy_fetcher/providers/proxypedia.rb +48 -0
  19. data/lib/proxy_fetcher/providers/proxyscrape_http.rb +65 -0
  20. data/lib/proxy_fetcher/providers/proxyscrape_socks4.rb +65 -0
  21. data/lib/proxy_fetcher/providers/proxyscrape_socks5.rb +65 -0
  22. data/lib/proxy_fetcher/providers/xroxy.rb +2 -2
  23. data/lib/proxy_fetcher/proxy.rb +12 -0
  24. data/lib/proxy_fetcher/utils/http_client.rb +25 -21
  25. data/lib/proxy_fetcher/utils/proxy_validator.rb +20 -8
  26. data/lib/proxy_fetcher/version.rb +2 -2
  27. data/proxy_fetcher.gemspec +6 -4
  28. data/spec/fixtures/proxies.txt +14 -0
  29. data/spec/proxy_fetcher/client/client_spec.rb +10 -5
  30. data/spec/proxy_fetcher/manager_spec.rb +18 -0
  31. data/spec/proxy_fetcher/providers/proxy_classes_spec.rb +28 -0
  32. metadata +15 -12
  33. data/lib/proxy_fetcher/providers/gather_proxy.rb +0 -50
  34. data/spec/proxy_fetcher/providers/free_proxy_list_spec.rb +0 -13
  35. data/spec/proxy_fetcher/providers/free_proxy_list_ssl_spec.rb +0 -11
  36. data/spec/proxy_fetcher/providers/gather_proxy_spec.rb +0 -11
  37. data/spec/proxy_fetcher/providers/http_tunnel_spec.rb +0 -11
  38. data/spec/proxy_fetcher/providers/proxy_list_spec.rb +0 -11
  39. data/spec/proxy_fetcher/providers/xroxy_spec.rb +0 -11
@@ -10,27 +10,39 @@ module ProxyFetcher
10
10
 
11
11
  # Short variant to validate proxy.
12
12
  #
13
- # @param proxy_addr [String] proxy address or IP
14
- # @param proxy_port [String, Integer] proxy port
13
+ # @param address [String] proxy address or IP
14
+ # @param port [String, Integer] proxy port
15
15
  #
16
16
  # @return [Boolean]
17
17
  # true if connection to the server using proxy established, otherwise false
18
18
  #
19
- def self.connectable?(proxy_addr, proxy_port)
20
- new(proxy_addr, proxy_port).connectable?
19
+ def self.connectable?(address, port)
20
+ new(address, port).connectable?
21
21
  end
22
22
 
23
23
  # Initialize new ProxyValidator instance
24
24
  #
25
- # @param proxy_addr [String] proxy address or IP
26
- # @param proxy_port [String, Integer] proxy port
25
+ # @param address [String] Proxy address or IP
26
+ # @param port [String, Integer] Proxy port
27
+ # @param options [Hash] proxy options
28
+ # @option username [String] Proxy authentication username
29
+ # @option password [String] Proxy authentication password
30
+ # @option headers [Hash] Proxy headers
27
31
  #
28
32
  # @return [ProxyValidator]
29
33
  #
30
- def initialize(proxy_addr, proxy_port)
34
+ def initialize(address, port, options: {})
31
35
  timeout = ProxyFetcher.config.proxy_validation_timeout
36
+ proxy = [address, port.to_i]
32
37
 
33
- @http = HTTP.follow.via(proxy_addr, proxy_port.to_i).timeout(connect: timeout, read: timeout)
38
+ if options[:username] && options[:password]
39
+ proxy << options[:username]
40
+ proxy << options[:password]
41
+ end
42
+
43
+ proxy << options[:headers].to_h if options[:headers]
44
+
45
+ @http = HTTP.follow.via(*proxy).timeout(connect: timeout, read: timeout)
34
46
  end
35
47
 
36
48
  # Checks if proxy is connectable (can be used to connect
@@ -13,9 +13,9 @@ module ProxyFetcher
13
13
  # Major version number
14
14
  MAJOR = 0
15
15
  # Minor version number
16
- MINOR = 11
16
+ MINOR = 15
17
17
  # Smallest version number
18
- TINY = 0
18
+ TINY = 1
19
19
 
20
20
  # Full version number
21
21
  STRING = [MAJOR, MINOR, TINY].compact.join(".")
@@ -8,9 +8,11 @@ Gem::Specification.new do |gem|
8
8
  gem.name = "proxy_fetcher"
9
9
  gem.version = ProxyFetcher.gem_version
10
10
  gem.summary = "Ruby gem for dealing with proxy lists from different providers"
11
- gem.description = "This gem can help your Ruby application to make HTTP(S) requests " \
12
- "using proxies by fetching and validating proxy lists from " \
13
- "the different providers."
11
+ gem.description = <<-TEXT.strip.gsub(/[\s\n]+/, " ")
12
+ This gem can help your Ruby application to make HTTP(S) requests
13
+ using proxies by fetching and validating proxy lists from
14
+ the different providers.
15
+ TEXT
14
16
  gem.authors = ["Nikita Bulai"]
15
17
  gem.email = "bulajnikita@gmail.com"
16
18
  gem.require_paths = ["lib"]
@@ -24,5 +26,5 @@ Gem::Specification.new do |gem|
24
26
  gem.add_runtime_dependency "http", ">= 3", "< 5"
25
27
 
26
28
  gem.add_development_dependency "rake", ">= 12.0"
27
- gem.add_development_dependency "rspec", "~> 3.5"
29
+ gem.add_development_dependency "rspec", "~> 3.9"
28
30
  end
@@ -0,0 +1,14 @@
1
+ 139.162.59.9:3128
2
+ 176.62.187.158:56351
3
+ 144.217.22.142:8080
4
+ 176.55.108.21:3128
5
+ 157.225.214.251:3128
6
+ 202.51.49.52:48298
7
+ 104.244.75.26:8080
8
+ 163.172.28.20:80
9
+ 187.56.191.12:3128
10
+ 129.194.12.26:80
11
+ 178.128.39.39:8080
12
+ 181.30.28.15:8080
13
+ 51.181.96.185:8080
14
+ 148.134.10.13
@@ -3,6 +3,11 @@
3
3
  require "spec_helper"
4
4
  require "json"
5
5
 
6
+ begin
7
+ require "webrick"
8
+ rescue LoadError
9
+ # nop
10
+ end
6
11
  require "evil-proxy"
7
12
  require "evil-proxy/async"
8
13
 
@@ -118,15 +123,15 @@ describe ProxyFetcher::Client do
118
123
  end
119
124
  end
120
125
 
121
- xcontext "retries" do
126
+ context "retries" do
122
127
  it "raises an error when reaches max retries limit" do
123
128
  allow(ProxyFetcher::Client::Request).to receive(:execute).and_raise(StandardError)
124
129
 
125
- expect { ProxyFetcher::Client.get("http://httpbin.org") }
130
+ expect { ProxyFetcher::Client.get("http://httpbin.org", options: { max_retries: 10 }) }
126
131
  .to raise_error(ProxyFetcher::Exceptions::MaximumRetriesReached)
127
132
  end
128
133
 
129
- it "raises an error when http request returns an error" do
134
+ xit "raises an error when http request returns an error" do
130
135
  allow_any_instance_of(HTTP::Client).to receive(:get).and_return(StandardError.new)
131
136
 
132
137
  expect { ProxyFetcher::Client.get("http://httpbin.org") }
@@ -134,14 +139,14 @@ describe ProxyFetcher::Client do
134
139
  end
135
140
 
136
141
  it "refreshes proxy lists if no proxy found" do
137
- ProxyFetcher::Client::ProxiesRegistry.manager.instance_variable_set(:"@proxies", [])
142
+ allow(ProxyFetcher::Manager.new).to receive(:proxies).and_return([])
138
143
 
139
144
  expect { ProxyFetcher::Client.get("http://httpbin.org") }
140
145
  .not_to raise_error
141
146
  end
142
147
  end
143
148
 
144
- context "redirects" do
149
+ xcontext "redirects" do
145
150
  it "follows redirect when present" do
146
151
  content = ProxyFetcher::Client.get("http://httpbin.org/absolute-redirect/2")
147
152
 
@@ -0,0 +1,18 @@
1
+ # frozen_string_literal: true
2
+
3
+ require "spec_helper"
4
+
5
+ describe ProxyFetcher::Manager do
6
+ it "can initialize with a proxies from file(s)" do
7
+ manager = described_class.new(refresh: false, file: "spec/fixtures/proxies.txt")
8
+
9
+ expect(manager.proxies.size).to be(14)
10
+
11
+ manager = described_class.new(
12
+ refresh: false,
13
+ file: ["spec/fixtures/proxies.txt", "spec/fixtures/proxies.txt"]
14
+ )
15
+
16
+ expect(manager.proxies.size).to be(14)
17
+ end
18
+ end
@@ -0,0 +1,28 @@
1
+ # frozen_string_literal: true
2
+
3
+ require "spec_helper"
4
+
5
+ describe "Proxy classes" do
6
+ [
7
+ [:free_proxy_list, "FreeProxyList"],
8
+ [:free_proxy_list_socks, "FreeProxyListSocks"],
9
+ [:free_proxy_list_ssl, "FreeProxyListSSL"],
10
+ [:free_proxy_list_us, "FreeProxyListUS"],
11
+ [:http_tunnel, "HTTPTunnel"],
12
+ [:mtpro, "MTPro"],
13
+ [:proxy_list, "ProxyList"],
14
+ [:proxypedia, "Proxypedia"],
15
+ [:proxyscrape_http, "ProxyscrapeHTTP"],
16
+ [:proxyscrape_socks4, "ProxyscrapeSOCKS4"],
17
+ [:proxyscrape_socks5, "ProxyscrapeSOCKS5"],
18
+ [:xroxy, "XRoxy"]
19
+ ].each do |(provider_name, provider_klass)|
20
+ describe Object.const_get("ProxyFetcher::Providers::#{provider_klass}") do
21
+ before :all do
22
+ ProxyFetcher.config.provider = provider_name
23
+ end
24
+
25
+ it_behaves_like "a manager"
26
+ end
27
+ end
28
+ end
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: proxy_fetcher
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.11.0
4
+ version: 0.15.1
5
5
  platform: ruby
6
6
  authors:
7
7
  - Nikita Bulai
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2019-10-24 00:00:00.000000000 Z
11
+ date: 2021-02-17 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: http
@@ -50,14 +50,14 @@ dependencies:
50
50
  requirements:
51
51
  - - "~>"
52
52
  - !ruby/object:Gem::Version
53
- version: '3.5'
53
+ version: '3.9'
54
54
  type: :development
55
55
  prerelease: false
56
56
  version_requirements: !ruby/object:Gem::Requirement
57
57
  requirements:
58
58
  - - "~>"
59
59
  - !ruby/object:Gem::Version
60
- version: '3.5'
60
+ version: '3.9'
61
61
  description: This gem can help your Ruby application to make HTTP(S) requests using
62
62
  proxies by fetching and validating proxy lists from the different providers.
63
63
  email: bulajnikita@gmail.com
@@ -94,10 +94,16 @@ files:
94
94
  - lib/proxy_fetcher/null_logger.rb
95
95
  - lib/proxy_fetcher/providers/base.rb
96
96
  - lib/proxy_fetcher/providers/free_proxy_list.rb
97
+ - lib/proxy_fetcher/providers/free_proxy_list_socks.rb
97
98
  - lib/proxy_fetcher/providers/free_proxy_list_ssl.rb
98
- - lib/proxy_fetcher/providers/gather_proxy.rb
99
+ - lib/proxy_fetcher/providers/free_proxy_list_us.rb
99
100
  - lib/proxy_fetcher/providers/http_tunnel.rb
101
+ - lib/proxy_fetcher/providers/mtpro.rb
100
102
  - lib/proxy_fetcher/providers/proxy_list.rb
103
+ - lib/proxy_fetcher/providers/proxypedia.rb
104
+ - lib/proxy_fetcher/providers/proxyscrape_http.rb
105
+ - lib/proxy_fetcher/providers/proxyscrape_socks4.rb
106
+ - lib/proxy_fetcher/providers/proxyscrape_socks5.rb
101
107
  - lib/proxy_fetcher/providers/xroxy.rb
102
108
  - lib/proxy_fetcher/proxy.rb
103
109
  - lib/proxy_fetcher/utils/http_client.rb
@@ -105,18 +111,15 @@ files:
105
111
  - lib/proxy_fetcher/utils/proxy_validator.rb
106
112
  - lib/proxy_fetcher/version.rb
107
113
  - proxy_fetcher.gemspec
114
+ - spec/fixtures/proxies.txt
108
115
  - spec/proxy_fetcher/client/client_spec.rb
109
116
  - spec/proxy_fetcher/configuration_spec.rb
110
117
  - spec/proxy_fetcher/document/adapters_spec.rb
111
118
  - spec/proxy_fetcher/document/node_spec.rb
119
+ - spec/proxy_fetcher/manager_spec.rb
112
120
  - spec/proxy_fetcher/providers/base_spec.rb
113
- - spec/proxy_fetcher/providers/free_proxy_list_spec.rb
114
- - spec/proxy_fetcher/providers/free_proxy_list_ssl_spec.rb
115
- - spec/proxy_fetcher/providers/gather_proxy_spec.rb
116
- - spec/proxy_fetcher/providers/http_tunnel_spec.rb
117
121
  - spec/proxy_fetcher/providers/multiple_providers_spec.rb
118
- - spec/proxy_fetcher/providers/proxy_list_spec.rb
119
- - spec/proxy_fetcher/providers/xroxy_spec.rb
122
+ - spec/proxy_fetcher/providers/proxy_classes_spec.rb
120
123
  - spec/proxy_fetcher/proxy_spec.rb
121
124
  - spec/proxy_fetcher/version_spec.rb
122
125
  - spec/spec_helper.rb
@@ -140,7 +143,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
140
143
  - !ruby/object:Gem::Version
141
144
  version: '0'
142
145
  requirements: []
143
- rubygems_version: 3.0.3
146
+ rubygems_version: 3.1.2
144
147
  signing_key:
145
148
  specification_version: 4
146
149
  summary: Ruby gem for dealing with proxy lists from different providers
@@ -1,50 +0,0 @@
1
- # frozen_string_literal: true
2
-
3
- require "json"
4
-
5
- module ProxyFetcher
6
- module Providers
7
- # GatherProxy provider class.
8
- class GatherProxy < Base
9
- # Provider URL to fetch proxy list
10
- def provider_url
11
- "http://www.gatherproxy.com/"
12
- end
13
-
14
- def xpath
15
- '//div[@class="proxy-list"]/table/script'
16
- end
17
-
18
- # Converts HTML node (entry of N tags) to <code>ProxyFetcher::Proxy</code>
19
- # object.
20
- #
21
- # @param html_node [Object]
22
- # HTML node from the <code>ProxyFetcher::Document</code> DOM model.
23
- #
24
- # @return [ProxyFetcher::Proxy]
25
- # Proxy object
26
- #
27
- def to_proxy(html_node)
28
- json = parse_json(html_node)
29
-
30
- ProxyFetcher::Proxy.new.tap do |proxy|
31
- proxy.addr = json["PROXY_IP"]
32
- proxy.port = json["PROXY_PORT"].to_i(16)
33
- proxy.anonymity = json["PROXY_TYPE"]
34
- proxy.country = json["PROXY_COUNTRY"]
35
- proxy.response_time = json["PROXY_TIME"].to_i
36
- proxy.type = ProxyFetcher::Proxy::HTTP
37
- end
38
- end
39
-
40
- private
41
-
42
- def parse_json(html_node)
43
- javascript = html_node.content[/{.+}/im]
44
- JSON.parse(javascript)
45
- end
46
- end
47
-
48
- ProxyFetcher::Configuration.register_provider(:gather_proxy, GatherProxy)
49
- end
50
- end
@@ -1,13 +0,0 @@
1
- # frozen_string_literal: true
2
-
3
- require "spec_helper"
4
-
5
- describe ProxyFetcher::Providers::FreeProxyList do
6
- before :all do
7
- ProxyFetcher.configure do |config|
8
- config.provider = :free_proxy_list
9
- end
10
- end
11
-
12
- it_behaves_like "a manager"
13
- end
@@ -1,11 +0,0 @@
1
- # frozen_string_literal: true
2
-
3
- require "spec_helper"
4
-
5
- describe ProxyFetcher::Providers::FreeProxyListSSL do
6
- before :all do
7
- ProxyFetcher.config.provider = :free_proxy_list_ssl
8
- end
9
-
10
- it_behaves_like "a manager"
11
- end
@@ -1,11 +0,0 @@
1
- # frozen_string_literal: true
2
-
3
- require "spec_helper"
4
-
5
- describe ProxyFetcher::Providers::GatherProxy do
6
- before :all do
7
- ProxyFetcher.config.provider = :gather_proxy
8
- end
9
-
10
- it_behaves_like "a manager"
11
- end
@@ -1,11 +0,0 @@
1
- # frozen_string_literal: true
2
-
3
- require "spec_helper"
4
-
5
- describe ProxyFetcher::Providers::HTTPTunnel do
6
- before :all do
7
- ProxyFetcher.config.provider = :http_tunnel
8
- end
9
-
10
- it_behaves_like "a manager"
11
- end
@@ -1,11 +0,0 @@
1
- # frozen_string_literal: true
2
-
3
- require "spec_helper"
4
-
5
- describe ProxyFetcher::Providers::ProxyList do
6
- before :all do
7
- ProxyFetcher.config.provider = :proxy_list
8
- end
9
-
10
- it_behaves_like "a manager"
11
- end
@@ -1,11 +0,0 @@
1
- # frozen_string_literal: true
2
-
3
- require "spec_helper"
4
-
5
- describe ProxyFetcher::Providers::XRoxy do
6
- before :all do
7
- ProxyFetcher.config.provider = :xroxy
8
- end
9
-
10
- it_behaves_like "a manager"
11
- end