vore 0.2.4-x86_64-linux → 0.2.6-x86_64-linux

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: f079e19db98ba57bd8aa0a69471244231ed09a9c706c817af6470a0ed42b4e7c
4
- data.tar.gz: 3697e1361fbd4326fed8f78449729879bceb6dd9846f7c965b6f0263738347dc
3
+ metadata.gz: 53cb93bee6f3736369589c1eaaf7b739ca6f898e814d33d4ff747f4daa2077fc
4
+ data.tar.gz: 100cf434502ce236ce6f31aa24c110ed43274043f1ea7a678f4cad9905079e7a
5
5
  SHA512:
6
- metadata.gz: 83e15d4f005f2df953fd83082a0b05987e89de048b6a685f5ab070dd39d2fe04503758caccdb5eb0e9899e6448214c45a5f9ff850119ded82fee37385c6e0db3
7
- data.tar.gz: 0fcf835ebf8992d4cd9a764107727ce9f41437369d428f6fe73d272865079963f90193f4a99c4842882c0980f97c0ffe448f173dd297769634e2a79f0db75d4e
6
+ metadata.gz: b66ad8d522524716bc1f5a904b428934ef5006916cad623893301569afcfd7b255c021d1bc3f1205cd757365a165b6b88dfe278e9979aba4d900fc913f074d73
7
+ data.tar.gz: 9e176c95395e40503fc8a5af9f014a5befc37a63d04b71a0d64549be100700b92abbb439f57be4ab4699a3543ad2ca32203095b83e402774b35e70ae58d6cde2
data/exe/vore-spider CHANGED
Binary file
data/lib/vore/crawler.rb CHANGED
@@ -31,7 +31,7 @@ module Vore
31
31
 
32
32
  output = %x(#{@executable} \
33
33
  --user-agent #{user_agent} \
34
- --delay 3000 \
34
+ --delay 3500 \
35
35
  --url #{website} \
36
36
  download \
37
37
  -t \
@@ -48,16 +48,26 @@ module Vore
48
48
  Dir.glob(File.join(output_dir, "**", "*")).each do |path|
49
49
  next unless File.file?(path)
50
50
 
51
+ results[:pages_visited] += 1
52
+
51
53
  html_file = File.read(path).force_encoding("UTF-8")
52
- rewritten_html_file = @selma.rewrite(html_file)
54
+ rewritten_html_file = ""
53
55
 
54
- results[:pages_visited] += 1
55
- if rewritten_html_file.empty?
56
+ if html_file.empty?
57
+ Vore.logger.warn("HTML file empty: #{path}")
56
58
  results[:pages_unprocessed] += 1
57
59
  results[:unprocessed_pages] << path
58
60
  next
59
61
  end
60
62
 
63
+ begin
64
+ rewritten_html_file = @selma.rewrite(html_file)
65
+ rescue StandardError => e
66
+ Vore.logger.warn("Error rewriting #{path}: #{e}")
67
+ results[:pages_unprocessed] += 1
68
+ next
69
+ end
70
+
61
71
  # drops the first 3 parts of the path, which are "tmp", "vore", and the site name
62
72
  url_path = path.split(FILE_SEPERATOR)[3..].join("/")
63
73
 
data/lib/vore/version.rb CHANGED
@@ -1,5 +1,5 @@
1
1
  # frozen_string_literal: true
2
2
 
3
3
  module Vore
4
- VERSION = "0.2.4"
4
+ VERSION = "0.2.6"
5
5
  end
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: vore
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.2.4
4
+ version: 0.2.6
5
5
  platform: x86_64-linux
6
6
  authors:
7
7
  - Garen J. Torikian