vore 0.2.8-x86_64-windows → 0.3.0-x86_64-windows

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 85a50437d0557e28ff3eeb155a8e527163aeb5f90fd98f0e5cb8e09e3d81bb6e
4
- data.tar.gz: 61d1255a042db43b6e50bc749fccceb452080afd07e1eac04461ef4894fb8027
3
+ metadata.gz: d9c0a3b54d7618f058010a7b420d8085bb26614a2a25a2d13574694d73639faf
4
+ data.tar.gz: 3b13cf4124744f822c0d3cb969c960d811cb76d39b542531dde19cfe4bc53c25
5
5
  SHA512:
6
- metadata.gz: d5c8a45adf9b4402d3600ae26728afb89b5e4d24953ad905462ad6b7c2d682a2806ed452673c486000621e5bf0373de6dd85a28ba592cb2e5eb1e86d83eb973f
7
- data.tar.gz: 0077fcc1c2173c46be332da7727f6560a1cf8b2351491bc147b0d1111cefc82dc8bf8081e0f2370e2f7432d1905b2419e8bc168294dfef8a4387d609d512dae8
6
+ metadata.gz: 870cc3ea8b2ba8ae56ac0a4435f08baa0504d7f4cb809b06bc052598f0837ea46ab10f4b93b73c859f58be7378a88942d4861ebe5f9ab126de5273ac919c160e
7
+ data.tar.gz: a6c10f0f3233aec66f9f68c25aba29a87f69fab17070c5aad040b2e08a04e652a289ff6a4143e86dd160f2b411da4d4c9dda9458789144602424ee565a83cc50
data/exe/vore-spider.exe CHANGED
Binary file
@@ -5,5 +5,9 @@ module Vole
5
5
  DEFAULT_SANITIZATION_CONFIG = Selma::Sanitizer::Config::RELAXED.dup.merge({
6
6
  allow_doctype: false,
7
7
  })
8
+
9
+ DEFAULT_OPTIONS = {
10
+ delay: 3500,
11
+ }
8
12
  end
9
13
  end
data/lib/vore/crawler.rb CHANGED
@@ -12,7 +12,7 @@ module Vore
12
12
 
13
13
  # Creates a crawler
14
14
  # denylist: Sets a denylist filter, allows a regexp, string or array of either to be matched.
15
- def initialize(denylist: /a^/, sanitization_config: Vole::Configuration::DEFAULT_SANITIZATION_CONFIG)
15
+ def initialize(denylist: /a^/, sanitization_config: Vole::Configuration::DEFAULT_SANITIZATION_CONFIG, options: Vole::Configuration::DEFAULT_OPTIONS)
16
16
  @denylist_regexp = Regexp.union(denylist)
17
17
 
18
18
  @content_extractor = Vole::Handlers::ContentExtractor.new
@@ -20,6 +20,7 @@ module Vore
20
20
  ext = PLATFORM.include?("windows") ? ".exe" : ""
21
21
  @executable = File.expand_path([__FILE__, "..", "..", "..", "exe", "vore-spider#{ext}"].join(FILE_SEPERATOR))
22
22
  @parent_output_dir = "tmp/vore"
23
+ @options = options
23
24
 
24
25
  return if File.exist?(@executable)
25
26
 
@@ -31,7 +32,7 @@ module Vore
31
32
  @output_dir = "#{@parent_output_dir}/#{website.gsub(/[^a-zA-Z0-9]/, "_").squeeze("_")}"
32
33
  Vore.logger.info("Vore started crawling #{website}, outputting to #{output_dir}")
33
34
 
34
- output = run_command(website, @output_dir)
35
+ output = run_command(website, delay: @options[:delay])
35
36
 
36
37
  Vore.logger.info("Vore finished crawling #{website}: #{output}")
37
38
 
@@ -86,14 +87,14 @@ module Vore
86
87
  # crawl_site(site)
87
88
  # end
88
89
 
89
- def run_command(website, output_dir)
90
+ def run_command(website, delay: 3500)
90
91
  %x(#{@executable} \
91
92
  --user-agent #{user_agent} \
92
- --delay 3500 \
93
+ --delay #{delay} \
93
94
  --url #{website} \
94
95
  download \
95
96
  -t \
96
- #{output_dir})
97
+ #{@output_dir})
97
98
  end
98
99
 
99
100
  def user_agent
data/lib/vore/version.rb CHANGED
@@ -1,5 +1,5 @@
1
1
  # frozen_string_literal: true
2
2
 
3
3
  module Vore
4
- VERSION = "0.2.8"
4
+ VERSION = "0.3.0"
5
5
  end
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: vore
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.2.8
4
+ version: 0.3.0
5
5
  platform: x86_64-windows
6
6
  authors:
7
7
  - Garen J. Torikian