vore 0.2.4-x86_64-darwin → 0.2.6-x86_64-darwin

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 2d48f8e0f2bd479af664769d0c0781f04746a2367f2d3dcf0d9f8845020c6f17
4
- data.tar.gz: 154f154fcc46dbb6df0ffe9da4af15b13ce78f33711157bb1cdd90f5d3363467
3
+ metadata.gz: 2ede3f51d145b7ddb4dd0c042013f51b46d7b99268aec6d7fe013c0be027687f
4
+ data.tar.gz: 4bdeb20c4621e9611fec13d30c19f2c06ce71267867e5ff484b579b786ea113f
5
5
  SHA512:
6
- metadata.gz: ca6d066f2162526c37480f539481fa4c02c4d3ea009368b937d600a90170cf7aad2da99e01403c365810036c412a179f3ffaaae1872ea528fab31363e29e52a9
7
- data.tar.gz: 91326f86dbd7af495039aeb08d057b965c4db8d79614863c1f58be0bab471cc047388f7b60aa3e0703fd4287dd706ab4f60735130960712040c8d75f032f421f
6
+ metadata.gz: 1be22361d6e06dce9c3e37494688f228f4bff053a75f974c0970601c87af6f184a2a1090a775ad61aa67eb284ee5bd14b4299991b63c030e607ee79c9470b60f
7
+ data.tar.gz: cb8e2cb3032554570ad0a3e94fda35deadfbe8ba81caa92d19018ca462e4e8226c27a155846a86fc701056548acff45cb160d6e49e286a4c0009ddc1df334778
data/exe/vore-spider CHANGED
Binary file
data/lib/vore/crawler.rb CHANGED
@@ -31,7 +31,7 @@ module Vore
31
31
 
32
32
  output = %x(#{@executable} \
33
33
  --user-agent #{user_agent} \
34
- --delay 3000 \
34
+ --delay 3500 \
35
35
  --url #{website} \
36
36
  download \
37
37
  -t \
@@ -48,16 +48,26 @@ module Vore
48
48
  Dir.glob(File.join(output_dir, "**", "*")).each do |path|
49
49
  next unless File.file?(path)
50
50
 
51
+ results[:pages_visited] += 1
52
+
51
53
  html_file = File.read(path).force_encoding("UTF-8")
52
- rewritten_html_file = @selma.rewrite(html_file)
54
+ rewritten_html_file = ""
53
55
 
54
- results[:pages_visited] += 1
55
- if rewritten_html_file.empty?
56
+ if html_file.empty?
57
+ Vore.logger.warn("HTML file empty: #{path}")
56
58
  results[:pages_unprocessed] += 1
57
59
  results[:unprocessed_pages] << path
58
60
  next
59
61
  end
60
62
 
63
+ begin
64
+ rewritten_html_file = @selma.rewrite(html_file)
65
+ rescue StandardError => e
66
+ Vore.logger.warn("Error rewriting #{path}: #{e}")
67
+ results[:pages_unprocessed] += 1
68
+ next
69
+ end
70
+
61
71
  # drops the first 3 parts of the path, which are "tmp", "vore", and the site name
62
72
  url_path = path.split(FILE_SEPERATOR)[3..].join("/")
63
73
 
data/lib/vore/version.rb CHANGED
@@ -1,5 +1,5 @@
1
1
  # frozen_string_literal: true
2
2
 
3
3
  module Vore
4
- VERSION = "0.2.4"
4
+ VERSION = "0.2.6"
5
5
  end
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: vore
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.2.4
4
+ version: 0.2.6
5
5
  platform: x86_64-darwin
6
6
  authors:
7
7
  - Garen J. Torikian