scrapework 0.1.1 → 0.1.2
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/CHANGELOG.md +4 -0
- data/Gemfile.lock +2 -2
- data/examples/manga.rb +31 -0
- data/lib/scrapework/object.rb +5 -1
- data/lib/scrapework/version.rb +1 -1
- data/lib/scrapework.rb +2 -0
- metadata +2 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 4d05be6e525594f8a297ad5bae0abaeeb366a198bd4acb450f837449c7c19e93
|
4
|
+
data.tar.gz: 0e74bd49022f11e5712e363ef9ddaf9710c37456324cee058596eb00340b2308
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 486ebab03674cae60200091d0983c766e61e177a15eb897de4951adf7de46cd2b22614e4d8ea981a5574b70f9388a58212a1e7c35e2a87e7f9f6a3973c552652
|
7
|
+
data.tar.gz: db1b96744ebbe5d9833ac20591aa7ba6dc6ad6634ff957c473e6482037f0efe3862d48f2db16c8e42e34822959be4dbd29e36867906895255a2d2cacf11c0ea4
|
data/CHANGELOG.md
CHANGED
data/Gemfile.lock
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
PATH
|
2
2
|
remote: .
|
3
3
|
specs:
|
4
|
-
scrapework (0.1.1)
|
4
|
+
scrapework (0.1.2)
|
5
5
|
active_attr
|
6
6
|
activesupport
|
7
7
|
nokogiri
|
@@ -27,7 +27,7 @@ GEM
|
|
27
27
|
jaro_winkler (1.5.2)
|
28
28
|
mini_portile2 (2.4.0)
|
29
29
|
minitest (5.11.3)
|
30
|
-
nokogiri (1.10.
|
30
|
+
nokogiri (1.10.3)
|
31
31
|
mini_portile2 (~> 2.4.0)
|
32
32
|
parallel (1.17.0)
|
33
33
|
parser (2.6.2.1)
|
data/examples/manga.rb
CHANGED
@@ -5,6 +5,37 @@ require 'scrapework'
|
|
5
5
|
# This example sets up several data types and uses them
|
6
6
|
# to download every chapter of a manga.
|
7
7
|
|
8
|
+
# A manga list web page
|
9
|
+
class MangaList < Scrapework::Object
|
10
|
+
has_many :manga, class: 'Manga'
|
11
|
+
|
12
|
+
# Will not return the array of full collection
|
13
|
+
def each(*args, &block)
|
14
|
+
manga.each(*args, &block)
|
15
|
+
|
16
|
+
next_page&.each(*args, &block)
|
17
|
+
end
|
18
|
+
|
19
|
+
map 'manga' do |html|
|
20
|
+
html.css('.update_item h3 a').map do |a|
|
21
|
+
{ uri: a['href'], title: a.text.strip }
|
22
|
+
end
|
23
|
+
end
|
24
|
+
|
25
|
+
paginate do |html|
|
26
|
+
pages = html.css('.group-page a').to_a[1..-2]
|
27
|
+
current = pages.find_index { |p| p['class'] == 'pageselect' }
|
28
|
+
|
29
|
+
prev_page_link = pages[current - 1] if current
|
30
|
+
next_page_link = pages[current + 1] if current
|
31
|
+
|
32
|
+
prev_page = { url: prev_page_link['href'] } if prev_page_link
|
33
|
+
next_page = { url: next_page_link['href'] } if next_page_link
|
34
|
+
|
35
|
+
[prev_page, next_page]
|
36
|
+
end
|
37
|
+
end
|
38
|
+
|
8
39
|
# A manga web page
|
9
40
|
class Manga < Scrapework::Object
|
10
41
|
attribute :title
|
data/lib/scrapework/object.rb
CHANGED
@@ -123,7 +123,11 @@ module Scrapework
|
|
123
123
|
mapped_method = :"_mapped_#{name}"
|
124
124
|
|
125
125
|
define_method(mapped_method) do
|
126
|
-
value = instance_exec(_document, &block)
|
126
|
+
value = begin
|
127
|
+
instance_exec(_document, &block)
|
128
|
+
rescue StandardError => e
|
129
|
+
raise MappingError, e.message
|
130
|
+
end
|
127
131
|
|
128
132
|
public_send("#{name}=", value)
|
129
133
|
end
|
data/lib/scrapework/version.rb
CHANGED
data/lib/scrapework.rb
CHANGED
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: scrapework
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.1.1
|
4
|
+
version: 0.1.2
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- jphager2
|
8
8
|
autorequire:
|
9
9
|
bindir: exe
|
10
10
|
cert_chain: []
|
11
|
-
date: 2019-04-
|
11
|
+
date: 2019-04-23 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: active_attr
|