oai_schedules 0.2.0 → 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 6b67e6f8703a12140e9f0ddb981a30a5311e80d27e5146bd9848601d27272db9
4
- data.tar.gz: '09864239d4e38142c63a503a1535296f0a504bd4e9c0c84bfb87b024e640d104'
3
+ metadata.gz: 3e87f0fab9a90cc32bb6c3892a9ad72e6dae77c8b7efbc4ab3198c39b7d2a660
4
+ data.tar.gz: b59ddf59dd77df9dc1365a279dbe7ac3a9fb7b8d5f1bb7a33a8951f3d4ce1f48
5
5
  SHA512:
6
- metadata.gz: cbe2109c9a0b04a3e743ef6c577a38320bc84d411bff334b9b5e5e6bfc536aa9946c536b4a4dd3f56f320977b734de16e183247ac64edbb8d5d0051c7690ae91
7
- data.tar.gz: e747187b4375075a4e7f06831c67b6f59e7e2062578255732330884ea60bd4607b360054b2db504fcee7ec853d09b89ed8adf7f34d7f2f0a3d8ba49822a24b88
6
+ metadata.gz: d384485639a44d848f35eb3bc0a25a44fe2357cd84aeb37530a683a153aaba6f4b9bb24b7a316caf424e8f0c57b77b775b45f168c06339b3a6b6e35b1b2ee8d9
7
+ data.tar.gz: 84117dbd3b7f6757290fdee7a9f3388623330d8d293961946b6ee2058b2be8a7898b60822598bd8e8ac6bf2340d3cbabcba05124d1aa087e876b2a83192ea948
data/CHANGELOG.md CHANGED
@@ -1,3 +1,8 @@
1
+ ## [0.3.0] - 2025-03-26
2
+
3
+ - Added schedule name and content to digestion function
4
+ - Schedule content is deep-copied to internal state
5
+
1
6
  ## [0.2.0] - 2025-03-26
2
7
 
3
8
  - Added custom records digestions function
data/README.md CHANGED
@@ -22,7 +22,7 @@ gem install oai_schedules
22
22
  ```ruby
23
23
  require 'oai_schedules/manager'
24
24
 
25
- f_show = lambda do |records, done|
25
+ f_show = lambda do |name, content, records, done|
26
26
  # ... do your stuff with records ...
27
27
  if done
28
28
  puts "done full harvesting"
@@ -58,7 +58,8 @@ At every iteration, every 2 seconds, it will get the *partial* records by using
58
58
  The code will do this by querying `https://eudml.org/oai/OAIHandler?verb=ListRecords&...` and adding the necessary
59
59
  query parameters.
60
60
  The custom function provided as `f_digest` will then be called at each iteration.
61
- This will be provided the partial list of `records` as a hash, and a `done` flag (full harvesting complete).
61
+ This will be provided schedule `name` and `content`, the partial list of `records` as a hash,
62
+ and a `done` flag (full harvesting complete).
62
63
  and it will write the new one to the state file, until no token is provided (end of the harvesting).
63
64
  As soon as the schedule is added, it is executed.
64
65
  It is possible to add all schedules in advance, then call `sleep` for infinite event loop.
@@ -4,7 +4,7 @@ require 'oai_schedules/manager'
4
4
 
5
5
  # usage with folder listener
6
6
 
7
- f_show = lambda do |records, done|
7
+ f_show = lambda do |name, content, records, done|
8
8
  # ... do your stuff with records ...
9
9
  if done
10
10
  puts "done full harvesting"
@@ -4,7 +4,7 @@ require 'oai_schedules/manager'
4
4
 
5
5
  # usage with programmatic schedules addition / modify / remove
6
6
 
7
- f_show = lambda do |records, done|
7
+ f_show = lambda do |name, content, records, done|
8
8
  # ... do your stuff with records ...
9
9
  if done
10
10
  puts "done full harvesting"
@@ -194,7 +194,7 @@ module OAISchedules
194
194
  task.add_observer(TaskObserver.new(@logger, name))
195
195
  # add item to schedules
196
196
  @schedules[name] = {
197
- content: content,
197
+ content: deep_copy(content),
198
198
  task: task,
199
199
  state_machine: StateMachineHarvesting.new,
200
200
  state: state
@@ -213,7 +213,7 @@ module OAISchedules
213
213
 
214
214
 
215
215
  def modify_schedule(name, content)
216
- @schedules[name][:content] = content
216
+ @schedules[name][:content] = deep_copy(content)
217
217
  handle_schedule_task(name)
218
218
  end
219
219
 
@@ -222,6 +222,10 @@ module OAISchedules
222
222
 
223
223
  private
224
224
 
225
+ def deep_copy(o)
226
+ Marshal.load(Marshal.dump(o))
227
+ end
228
+
225
229
 
226
230
  def handle_schedule_task(name)
227
231
  task = @schedules[name][:task]
@@ -360,7 +364,7 @@ module OAISchedules
360
364
  state_machine.add_event(EventHarvesting::DONE_FULL_HARVEST)
361
365
  done = true
362
366
  end
363
- @f_digest&.call(data, done)
367
+ @f_digest&.call(name, content, data, done)
364
368
  break
365
369
  when StateHarvesting::COMPLETE
366
370
  @logger.warn("#{name}: full harvesting complete")
@@ -1,5 +1,5 @@
1
1
  # frozen_string_literal: true
2
2
 
3
3
  module OaiSchedules
4
- VERSION = "0.2.0"
4
+ VERSION = "0.3.0"
5
5
  end
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: oai_schedules
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.2.0
4
+ version: 0.3.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Davide Monari