datahen 0.14.18 → 0.14.19
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/lib/datahen/cli/scraper_page.rb +8 -6
- data/lib/datahen/version.rb +1 -1
- metadata +5 -5
checksums.yaml
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
---
|
|
2
2
|
SHA256:
|
|
3
|
-
metadata.gz:
|
|
4
|
-
data.tar.gz:
|
|
3
|
+
metadata.gz: b483263384d6a00e51fd345499ad020d69c9d07c1a77e3521e6b55a4528195de
|
|
4
|
+
data.tar.gz: 167c0a417c402198f13151daf29bddb0f8429cac3876c8a84d6b7ba396b1ac90
|
|
5
5
|
SHA512:
|
|
6
|
-
metadata.gz:
|
|
7
|
-
data.tar.gz:
|
|
6
|
+
metadata.gz: 344168b7a8a4cb746347aba1640d7b4e75a901cd5a1e2ab7acd00f6e8eee3d8c297795812259f84a21757b444e653331e44dd9e1efbec372472b6aeb98c56619
|
|
7
|
+
data.tar.gz: 1ef00c32694830740ea477fb4291de9234957ee4b7f7ad02642aa9d5cb91d1b3b1cd6a56542db4cbf84d92d42039546f2e9bfb8a40cf22d103256e8d53b0ac28
|
|
@@ -99,16 +99,17 @@ module Datahen
|
|
|
99
99
|
|
|
100
100
|
desc "refetch <scraper_name>", "Refetch Pages on a scraper's current job"
|
|
101
101
|
long_desc <<-LONGDESC
|
|
102
|
-
Refetch pages in a scraper's current job. You need to specify either a --gid or --fetch-fail or --parse-fail or --status.\x5
|
|
102
|
+
Refetch pages in a scraper's current job. You need to specify either a --gid or --fetch-fail or --parse-fail or --status or --page-type.\x5
|
|
103
103
|
LONGDESC
|
|
104
104
|
option :gid, :aliases => :g, type: :string, desc: 'Refetch a specific GID'
|
|
105
105
|
option :fetch_fail, type: :boolean, desc: 'Refetches only pages that fails fetching.'
|
|
106
106
|
option :parse_fail, type: :boolean, desc: 'Refetches only pages that fails parsing.'
|
|
107
107
|
option :status, type: :string, desc: 'Refetches only pages with a specific status.'
|
|
108
|
+
option :page_type, type: :string, desc: 'Refetches only pages with a specific page type.'
|
|
108
109
|
option :job, :aliases => :j, type: :numeric, desc: 'Set a specific job ID'
|
|
109
110
|
def refetch(scraper_name)
|
|
110
|
-
if !options.key?(:gid) && !options.key?(:fetch_fail) && !options.key?(:parse_fail) && !options.key?(:status)
|
|
111
|
-
puts "Must specify either a --gid, --fetch-fail, --parse-fail or --status"
|
|
111
|
+
if !options.key?(:gid) && !options.key?(:fetch_fail) && !options.key?(:parse_fail) && !options.key?(:status) && !options.key?(:page_type)
|
|
112
|
+
puts "Must specify either a --gid, --fetch-fail, --parse-fail, --status or --page-type"
|
|
112
113
|
return
|
|
113
114
|
end
|
|
114
115
|
|
|
@@ -123,15 +124,16 @@ module Datahen
|
|
|
123
124
|
|
|
124
125
|
desc "reparse <scraper_name>", "Reparse Pages on a scraper's current job"
|
|
125
126
|
long_desc <<-LONGDESC
|
|
126
|
-
Reparse pages in a scraper's current job. You need to specify either a --gid or --parse-fail or --status.\x5
|
|
127
|
+
Reparse pages in a scraper's current job. You need to specify either a --gid or --parse-fail or --status or --page-type.\x5
|
|
127
128
|
LONGDESC
|
|
128
129
|
option :gid, :aliases => :g, type: :string, desc: 'Reparse a specific GID'
|
|
129
130
|
option :parse_fail, type: :boolean, desc: 'Reparse only pages that fails parsing.'
|
|
130
131
|
option :status, type: :string, desc: 'Reparse only pages with a specific status.'
|
|
132
|
+
option :page_type, type: :string, desc: 'Refetches only pages with a specific page type.'
|
|
131
133
|
option :job, :aliases => :j, type: :numeric, desc: 'Set a specific job ID'
|
|
132
134
|
def reparse(scraper_name)
|
|
133
|
-
if !options.key?(:gid) && !options.key?(:parse_fail) && !options.key?(:status)
|
|
134
|
-
puts "Must specify either a --gid, --parse-fail or --status"
|
|
135
|
+
if !options.key?(:gid) && !options.key?(:parse_fail) && !options.key?(:status) && !options.key?(:page_type)
|
|
136
|
+
puts "Must specify either a --gid, --parse-fail, --status or --page-type"
|
|
135
137
|
return
|
|
136
138
|
end
|
|
137
139
|
|
data/lib/datahen/version.rb
CHANGED
metadata
CHANGED
|
@@ -1,14 +1,14 @@
|
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
|
2
2
|
name: datahen
|
|
3
3
|
version: !ruby/object:Gem::Version
|
|
4
|
-
version: 0.14.18
|
|
4
|
+
version: 0.14.19
|
|
5
5
|
platform: ruby
|
|
6
6
|
authors:
|
|
7
7
|
- Parama Danoesubroto
|
|
8
|
-
autorequire:
|
|
8
|
+
autorequire:
|
|
9
9
|
bindir: exe
|
|
10
10
|
cert_chain: []
|
|
11
|
-
date: 2020-10-
|
|
11
|
+
date: 2020-10-27 00:00:00.000000000 Z
|
|
12
12
|
dependencies:
|
|
13
13
|
- !ruby/object:Gem::Dependency
|
|
14
14
|
name: thor
|
|
@@ -253,7 +253,7 @@ metadata:
|
|
|
253
253
|
allowed_push_host: https://rubygems.org
|
|
254
254
|
homepage_uri: https://datahen.com
|
|
255
255
|
source_code_uri: https://github.com/DataHenOfficial/datahen-ruby
|
|
256
|
-
post_install_message:
|
|
256
|
+
post_install_message:
|
|
257
257
|
rdoc_options: []
|
|
258
258
|
require_paths:
|
|
259
259
|
- lib
|
|
@@ -269,7 +269,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
|
269
269
|
version: '0'
|
|
270
270
|
requirements: []
|
|
271
271
|
rubygems_version: 3.0.3
|
|
272
|
-
signing_key:
|
|
272
|
+
signing_key:
|
|
273
273
|
specification_version: 4
|
|
274
274
|
summary: DataHen toolbelt for developers
|
|
275
275
|
test_files: []
|