datahen 0.14.18 → 0.14.19
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/lib/datahen/cli/scraper_page.rb +8 -6
- data/lib/datahen/version.rb +1 -1
- metadata +5 -5
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: b483263384d6a00e51fd345499ad020d69c9d07c1a77e3521e6b55a4528195de
|
4
|
+
data.tar.gz: 167c0a417c402198f13151daf29bddb0f8429cac3876c8a84d6b7ba396b1ac90
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 344168b7a8a4cb746347aba1640d7b4e75a901cd5a1e2ab7acd00f6e8eee3d8c297795812259f84a21757b444e653331e44dd9e1efbec372472b6aeb98c56619
|
7
|
+
data.tar.gz: 1ef00c32694830740ea477fb4291de9234957ee4b7f7ad02642aa9d5cb91d1b3b1cd6a56542db4cbf84d92d42039546f2e9bfb8a40cf22d103256e8d53b0ac28
|
@@ -99,16 +99,17 @@ module Datahen
|
|
99
99
|
|
100
100
|
desc "refetch <scraper_name>", "Refetch Pages on a scraper's current job"
|
101
101
|
long_desc <<-LONGDESC
|
102
|
-
Refetch pages in a scraper's current job. You need to specify either a --gid or --fetch-fail or --parse-fail or --status.\x5
|
102
|
+
Refetch pages in a scraper's current job. You need to specify either a --gid or --fetch-fail or --parse-fail or --status or --page-type.\x5
|
103
103
|
LONGDESC
|
104
104
|
option :gid, :aliases => :g, type: :string, desc: 'Refetch a specific GID'
|
105
105
|
option :fetch_fail, type: :boolean, desc: 'Refetches only pages that fails fetching.'
|
106
106
|
option :parse_fail, type: :boolean, desc: 'Refetches only pages that fails parsing.'
|
107
107
|
option :status, type: :string, desc: 'Refetches only pages with a specific status.'
|
108
|
+
option :page_type, type: :string, desc: 'Refetches only pages with a specific page type.'
|
108
109
|
option :job, :aliases => :j, type: :numeric, desc: 'Set a specific job ID'
|
109
110
|
def refetch(scraper_name)
|
110
|
-
if !options.key?(:gid) && !options.key?(:fetch_fail) && !options.key?(:parse_fail) && !options.key?(:status)
|
111
|
-
puts "Must specify either a --gid, --fetch-fail, --parse-fail or --status"
|
111
|
+
if !options.key?(:gid) && !options.key?(:fetch_fail) && !options.key?(:parse_fail) && !options.key?(:status) && !options.key?(:page_type)
|
112
|
+
puts "Must specify either a --gid, --fetch-fail, --parse-fail, --status or --page-type"
|
112
113
|
return
|
113
114
|
end
|
114
115
|
|
@@ -123,15 +124,16 @@ module Datahen
|
|
123
124
|
|
124
125
|
desc "reparse <scraper_name>", "Reparse Pages on a scraper's current job"
|
125
126
|
long_desc <<-LONGDESC
|
126
|
-
Reparse pages in a scraper's current job. You need to specify either a --gid or --parse-fail or --status.\x5
|
127
|
+
Reparse pages in a scraper's current job. You need to specify either a --gid or --parse-fail or --status or --page-type.\x5
|
127
128
|
LONGDESC
|
128
129
|
option :gid, :aliases => :g, type: :string, desc: 'Reparse a specific GID'
|
129
130
|
option :parse_fail, type: :boolean, desc: 'Reparse only pages that fails parsing.'
|
130
131
|
option :status, type: :string, desc: 'Reparse only pages with a specific status.'
|
132
|
+
option :page_type, type: :string, desc: 'Refetches only pages with a specific page type.'
|
131
133
|
option :job, :aliases => :j, type: :numeric, desc: 'Set a specific job ID'
|
132
134
|
def reparse(scraper_name)
|
133
|
-
if !options.key?(:gid) && !options.key?(:parse_fail) && !options.key?(:status)
|
134
|
-
puts "Must specify either a --gid, --parse-fail or --status"
|
135
|
+
if !options.key?(:gid) && !options.key?(:parse_fail) && !options.key?(:status) && !options.key?(:page_type)
|
136
|
+
puts "Must specify either a --gid, --parse-fail, --status or --page-type"
|
135
137
|
return
|
136
138
|
end
|
137
139
|
|
data/lib/datahen/version.rb
CHANGED
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: datahen
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.14.18
|
4
|
+
version: 0.14.19
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Parama Danoesubroto
|
8
|
-
autorequire:
|
8
|
+
autorequire:
|
9
9
|
bindir: exe
|
10
10
|
cert_chain: []
|
11
|
-
date: 2020-10-
|
11
|
+
date: 2020-10-27 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: thor
|
@@ -253,7 +253,7 @@ metadata:
|
|
253
253
|
allowed_push_host: https://rubygems.org
|
254
254
|
homepage_uri: https://datahen.com
|
255
255
|
source_code_uri: https://github.com/DataHenOfficial/datahen-ruby
|
256
|
-
post_install_message:
|
256
|
+
post_install_message:
|
257
257
|
rdoc_options: []
|
258
258
|
require_paths:
|
259
259
|
- lib
|
@@ -269,7 +269,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
269
269
|
version: '0'
|
270
270
|
requirements: []
|
271
271
|
rubygems_version: 3.0.3
|
272
|
-
signing_key:
|
272
|
+
signing_key:
|
273
273
|
specification_version: 4
|
274
274
|
summary: DataHen toolbelt for developers
|
275
275
|
test_files: []
|