web_stat 0.3.7 → 0.3.8
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/Gemfile.lock +2 -2
- data/lib/web_stat/fetch.rb +16 -8
- data/lib/web_stat/version.rb +1 -1
- metadata +2 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: bbf065f5482ee7bf68e14e41af1e48b855f4219b9f44a7e16440834c92f404d5
|
4
|
+
data.tar.gz: a16fc8b8a66cb534bb8ce61c6da28212faff44f2df6324772261f9b6847cfc7f
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 83b8b7d71a1047ec2614a9bfbc3c6305806cf7a616ba6b2568382b72ef91f5b0947e7aefb3d926b33c4970d291d2a34c99a86ba0f0e320a3e7fde9dd2b5bc154
|
7
|
+
data.tar.gz: aa4af6063d7dd81c7c78c0100ff5354d7c54f28d7b2fac7393656cb5bde932b7260c95d1fe08fc560784e85ead7bbf49134c4d56cb108cef522cef753e477032
|
data/Gemfile.lock
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
PATH
|
2
2
|
remote: .
|
3
3
|
specs:
|
4
|
-
web_stat (0.3.
|
4
|
+
web_stat (0.3.7)
|
5
5
|
bundler (>= 2.0.2)
|
6
6
|
cld (>= 0.8.0)
|
7
7
|
mechanize (>= 2.7)
|
@@ -83,7 +83,7 @@ GEM
|
|
83
83
|
nokogiri (>= 1.6.0)
|
84
84
|
rubyzip (2.3.0)
|
85
85
|
safe_yaml (1.0.5)
|
86
|
-
sanitize (5.2.
|
86
|
+
sanitize (5.2.1)
|
87
87
|
crass (~> 1.0.2)
|
88
88
|
nokogiri (>= 1.8.0)
|
89
89
|
nokogumbo (~> 2.0)
|
data/lib/web_stat/fetch.rb
CHANGED
@@ -47,7 +47,7 @@ module WebStat
|
|
47
47
|
break
|
48
48
|
end
|
49
49
|
end
|
50
|
-
if path.nil? || path.empty?
|
50
|
+
if path.nil? || path.empty? || @nokogiri.at('body').xpath('//img').first
|
51
51
|
path = @nokogiri.at('body').xpath('//img').first.attr('src')
|
52
52
|
end
|
53
53
|
if ! path.nil? && path.match(/^\//)
|
@@ -78,17 +78,25 @@ module WebStat
|
|
78
78
|
# @param [String] url
|
79
79
|
# @param [String] body
|
80
80
|
def get_url(url)
|
81
|
-
|
81
|
+
mech = Mechanize.new { |_mech| _mech.user_agent = WebStat::Configure.get["user_agent"] }
|
82
82
|
# Enable to read Robots.txt
|
83
|
-
|
83
|
+
mech.robots = true
|
84
84
|
begin
|
85
|
-
|
86
|
-
|
87
|
-
|
85
|
+
if mech.agent.robots_disallowed?(url)
|
86
|
+
raise Mechanize::RobotsDisallowedError.new(url)
|
87
|
+
end
|
88
|
+
if WebStat::Configure.get["use_chromedirver"]
|
89
|
+
document = WebStat::WebDriverHelper.get_last_url(url)
|
90
|
+
@status = 200
|
88
91
|
else
|
89
|
-
|
92
|
+
document = mech.get(url, [], nil, { 'Accept-Language' => 'ja'})
|
93
|
+
if document.class == Mechanize::File
|
94
|
+
body = document.body
|
95
|
+
else
|
96
|
+
body = document.body.encode('UTF-8', document.encoding)
|
97
|
+
end
|
98
|
+
@status = document.code
|
90
99
|
end
|
91
|
-
@status = document.code
|
92
100
|
rescue Mechanize::ResponseCodeError => e
|
93
101
|
body = e.page.body
|
94
102
|
@status = e.page.code
|
data/lib/web_stat/version.rb
CHANGED
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: web_stat
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.3.7
|
4
|
+
version: 0.3.8
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- yusuke abe
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2020-06-
|
11
|
+
date: 2020-06-17 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: bundler
|