oai_schedules 0.2.0 → 0.3.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +5 -0
- data/README.md +3 -2
- data/examples/example_01.rb +1 -1
- data/examples/example_02.rb +1 -1
- data/lib/oai_schedules/manager.rb +7 -3
- data/lib/oai_schedules/version.rb +1 -1
- metadata +1 -1
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 3e87f0fab9a90cc32bb6c3892a9ad72e6dae77c8b7efbc4ab3198c39b7d2a660
|
4
|
+
data.tar.gz: b59ddf59dd77df9dc1365a279dbe7ac3a9fb7b8d5f1bb7a33a8951f3d4ce1f48
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: d384485639a44d848f35eb3bc0a25a44fe2357cd84aeb37530a683a153aaba6f4b9bb24b7a316caf424e8f0c57b77b775b45f168c06339b3a6b6e35b1b2ee8d9
|
7
|
+
data.tar.gz: 84117dbd3b7f6757290fdee7a9f3388623330d8d293961946b6ee2058b2be8a7898b60822598bd8e8ac6bf2340d3cbabcba05124d1aa087e876b2a83192ea948
|
data/CHANGELOG.md
CHANGED
data/README.md
CHANGED
@@ -22,7 +22,7 @@ gem install oai_schedules
|
|
22
22
|
```ruby
|
23
23
|
require 'oai_schedules/manager'
|
24
24
|
|
25
|
-
f_show = lambda do |records, done|
|
25
|
+
f_show = lambda do |name, content, records, done|
|
26
26
|
# ... do your stuff with records ...
|
27
27
|
if done
|
28
28
|
puts "done full harvesting"
|
@@ -58,7 +58,8 @@ At every iteration, every 2 seconds, it will get the *partial* records by using
|
|
58
58
|
The code will do this by querying `https://eudml.org/oai/OAIHandler?verb=ListRecords&...` and adding the necessary
|
59
59
|
query parameters.
|
60
60
|
The custom function provided as `f_digest` will then be called at each iteration.
|
61
|
-
This will be provided the partial list of `records` as a hash,
|
61
|
+
This will be provided schedule `name` and `content`, the partial list of `records` as a hash,
|
62
|
+
and a `done` flag (full harvesting complete).
|
62
63
|
and it will write the new one to the state file, until no token is provided (end of the harvesting).
|
63
64
|
As soon as the schedule is added, it is executed.
|
64
65
|
It is possible to add all schedules in advance, then call `sleep` for infinite event loop.
|
data/examples/example_01.rb
CHANGED
data/examples/example_02.rb
CHANGED
@@ -4,7 +4,7 @@ require 'oai_schedules/manager'
|
|
4
4
|
|
5
5
|
# usage with programmatic schedules addition / modify / remove
|
6
6
|
|
7
|
-
f_show = lambda do |records, done|
|
7
|
+
f_show = lambda do |name, content, records, done|
|
8
8
|
# ... do your stuff with records ...
|
9
9
|
if done
|
10
10
|
puts "done full harvesting"
|
@@ -194,7 +194,7 @@ module OAISchedules
|
|
194
194
|
task.add_observer(TaskObserver.new(@logger, name))
|
195
195
|
# add item to schedules
|
196
196
|
@schedules[name] = {
|
197
|
-
content: content,
|
197
|
+
content: deep_copy(content),
|
198
198
|
task: task,
|
199
199
|
state_machine: StateMachineHarvesting.new,
|
200
200
|
state: state
|
@@ -213,7 +213,7 @@ module OAISchedules
|
|
213
213
|
|
214
214
|
|
215
215
|
def modify_schedule(name, content)
|
216
|
-
@schedules[name][:content] = content
|
216
|
+
@schedules[name][:content] = deep_copy(content)
|
217
217
|
handle_schedule_task(name)
|
218
218
|
end
|
219
219
|
|
@@ -222,6 +222,10 @@ module OAISchedules
|
|
222
222
|
|
223
223
|
private
|
224
224
|
|
225
|
+
def deep_copy(o)
|
226
|
+
Marshal.load(Marshal.dump(o))
|
227
|
+
end
|
228
|
+
|
225
229
|
|
226
230
|
def handle_schedule_task(name)
|
227
231
|
task = @schedules[name][:task]
|
@@ -360,7 +364,7 @@ module OAISchedules
|
|
360
364
|
state_machine.add_event(EventHarvesting::DONE_FULL_HARVEST)
|
361
365
|
done = true
|
362
366
|
end
|
363
|
-
@f_digest&.call(data, done)
|
367
|
+
@f_digest&.call(name, content, data, done)
|
364
368
|
break
|
365
369
|
when StateHarvesting::COMPLETE
|
366
370
|
@logger.warn("#{name}: full harvesting complete")
|