vore 0.2.8-x86_64-darwin → 0.3.0-x86_64-darwin

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the differences between those package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: a4f96c051f27e8fd481213db0cf06e2c5bc02a61c159b820f0753796a378335a
4
- data.tar.gz: 17219abae1846d6c2b48b8ceb92d3bdb7a3510c4a1d49b85eecdc1a81457c735
3
+ metadata.gz: 30fdc42af4a7181231ba9325a2f6803054d8d7cc801906a789df183fe106292c
4
+ data.tar.gz: 4d89ee0d331471992743b372cf7f64d8e30d7d166290fc8cf48b11246c41f5da
5
5
  SHA512:
6
- metadata.gz: f73a3769ad439820018ced158e109871efcf74537c142240e6bb991dbd04cb32286d78393f3194f68ad4cb3f3f49b8a3962e27bc9f9cded1ec5ca5880d9d3573
7
- data.tar.gz: 969e0c30ecce701f23ab32207a84599d18d986b82862cd2910069a6ec6a330ad5b62baf53c5483ae2c7ec7d11860cb3746841fd74216a4029b9dbcd4169ade69
6
+ metadata.gz: 8ba4d1f1cce56648d71155fd937af2e649d583169f44e07e529223166433dbb4b427d3f8b381a99c27e2958124af338b23e8f00dc6dc12ab037e0121b016d9ef
7
+ data.tar.gz: 9666321603fb722d77b8495e9b6b34515e29fd3636f7a420780359e778cc232dfe0dbaede172259ba523226fcde44cf93095b26268351f66f2d37da9d2acf0fb
data/exe/vore-spider CHANGED
Binary file
@@ -5,5 +5,9 @@ module Vole
5
5
  DEFAULT_SANITIZATION_CONFIG = Selma::Sanitizer::Config::RELAXED.dup.merge({
6
6
  allow_doctype: false,
7
7
  })
8
+
9
+ DEFAULT_OPTIONS = {
10
+ delay: 3500,
11
+ }
8
12
  end
9
13
  end
data/lib/vore/crawler.rb CHANGED
@@ -12,7 +12,7 @@ module Vore
12
12
 
13
13
  # Creates a crawler
14
14
  # denylist: Sets a denylist filter, allows a regexp, string or array of either to be matched.
15
- def initialize(denylist: /a^/, sanitization_config: Vole::Configuration::DEFAULT_SANITIZATION_CONFIG)
15
+ def initialize(denylist: /a^/, sanitization_config: Vole::Configuration::DEFAULT_SANITIZATION_CONFIG, options: Vole::Configuration::DEFAULT_OPTIONS)
16
16
  @denylist_regexp = Regexp.union(denylist)
17
17
 
18
18
  @content_extractor = Vole::Handlers::ContentExtractor.new
@@ -20,6 +20,7 @@ module Vore
20
20
  ext = PLATFORM.include?("windows") ? ".exe" : ""
21
21
  @executable = File.expand_path([__FILE__, "..", "..", "..", "exe", "vore-spider#{ext}"].join(FILE_SEPERATOR))
22
22
  @parent_output_dir = "tmp/vore"
23
+ @options = options
23
24
 
24
25
  return if File.exist?(@executable)
25
26
 
@@ -31,7 +32,7 @@ module Vore
31
32
  @output_dir = "#{@parent_output_dir}/#{website.gsub(/[^a-zA-Z0-9]/, "_").squeeze("_")}"
32
33
  Vore.logger.info("Vore started crawling #{website}, outputting to #{output_dir}")
33
34
 
34
- output = run_command(website, @output_dir)
35
+ output = run_command(website, delay: @options[:delay])
35
36
 
36
37
  Vore.logger.info("Vore finished crawling #{website}: #{output}")
37
38
 
@@ -86,14 +87,14 @@ module Vore
86
87
  # crawl_site(site)
87
88
  # end
88
89
 
89
- def run_command(website, output_dir)
90
+ def run_command(website, delay: 3500)
90
91
  %x(#{@executable} \
91
92
  --user-agent #{user_agent} \
92
- --delay 3500 \
93
+ --delay #{delay} \
93
94
  --url #{website} \
94
95
  download \
95
96
  -t \
96
- #{output_dir})
97
+ #{@output_dir})
97
98
  end
98
99
 
99
100
  def user_agent
data/lib/vore/version.rb CHANGED
@@ -1,5 +1,5 @@
1
1
  # frozen_string_literal: true
2
2
 
3
3
  module Vore
4
- VERSION = "0.2.8"
4
+ VERSION = "0.3.0"
5
5
  end
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: vore
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.2.8
4
+ version: 0.3.0
5
5
  platform: x86_64-darwin
6
6
  authors:
7
7
  - Garen J. Torikian