canvas_sync 0.16.5 → 0.17.0.beta1
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +5 -5
- data/README.md +49 -137
- data/app/models/canvas_sync/sync_batch.rb +5 -0
- data/db/migrate/20201018210836_create_canvas_sync_sync_batches.rb +11 -0
- data/lib/canvas_sync/importers/bulk_importer.rb +4 -7
- data/lib/canvas_sync/job.rb +4 -10
- data/lib/canvas_sync/job_batches/batch.rb +399 -0
- data/lib/canvas_sync/job_batches/batch_aware_job.rb +62 -0
- data/lib/canvas_sync/job_batches/callback.rb +153 -0
- data/lib/canvas_sync/job_batches/chain_builder.rb +203 -0
- data/lib/canvas_sync/job_batches/context_hash.rb +147 -0
- data/lib/canvas_sync/job_batches/jobs/base_job.rb +7 -0
- data/lib/canvas_sync/job_batches/jobs/concurrent_batch_job.rb +18 -0
- data/lib/canvas_sync/job_batches/jobs/serial_batch_job.rb +73 -0
- data/lib/canvas_sync/job_batches/sidekiq.rb +91 -0
- data/lib/canvas_sync/job_batches/status.rb +63 -0
- data/lib/canvas_sync/jobs/begin_sync_chain_job.rb +34 -0
- data/lib/canvas_sync/jobs/report_checker.rb +3 -6
- data/lib/canvas_sync/jobs/report_processor_job.rb +2 -5
- data/lib/canvas_sync/jobs/report_starter.rb +28 -20
- data/lib/canvas_sync/jobs/sync_accounts_job.rb +3 -5
- data/lib/canvas_sync/jobs/sync_admins_job.rb +2 -4
- data/lib/canvas_sync/jobs/sync_assignment_groups_job.rb +2 -4
- data/lib/canvas_sync/jobs/sync_assignments_job.rb +2 -4
- data/lib/canvas_sync/jobs/sync_context_module_items_job.rb +2 -4
- data/lib/canvas_sync/jobs/sync_context_modules_job.rb +2 -4
- data/lib/canvas_sync/jobs/sync_provisioning_report_job.rb +4 -31
- data/lib/canvas_sync/jobs/sync_roles_job.rb +2 -5
- data/lib/canvas_sync/jobs/sync_simple_table_job.rb +11 -32
- data/lib/canvas_sync/jobs/sync_submissions_job.rb +2 -4
- data/lib/canvas_sync/jobs/sync_terms_job.rb +22 -7
- data/lib/canvas_sync/processors/assignment_groups_processor.rb +2 -3
- data/lib/canvas_sync/processors/assignments_processor.rb +2 -3
- data/lib/canvas_sync/processors/context_module_items_processor.rb +2 -3
- data/lib/canvas_sync/processors/context_modules_processor.rb +2 -3
- data/lib/canvas_sync/processors/normal_processor.rb +1 -2
- data/lib/canvas_sync/processors/provisioning_report_processor.rb +2 -10
- data/lib/canvas_sync/processors/submissions_processor.rb +2 -3
- data/lib/canvas_sync/version.rb +1 -1
- data/lib/canvas_sync.rb +34 -97
- data/spec/canvas_sync/canvas_sync_spec.rb +126 -153
- data/spec/canvas_sync/jobs/job_spec.rb +9 -17
- data/spec/canvas_sync/jobs/report_checker_spec.rb +1 -3
- data/spec/canvas_sync/jobs/report_processor_job_spec.rb +0 -3
- data/spec/canvas_sync/jobs/report_starter_spec.rb +19 -28
- data/spec/canvas_sync/jobs/sync_admins_job_spec.rb +1 -4
- data/spec/canvas_sync/jobs/sync_assignment_groups_job_spec.rb +2 -1
- data/spec/canvas_sync/jobs/sync_assignments_job_spec.rb +3 -2
- data/spec/canvas_sync/jobs/sync_context_module_items_job_spec.rb +3 -2
- data/spec/canvas_sync/jobs/sync_context_modules_job_spec.rb +3 -2
- data/spec/canvas_sync/jobs/sync_provisioning_report_job_spec.rb +3 -35
- data/spec/canvas_sync/jobs/sync_roles_job_spec.rb +1 -4
- data/spec/canvas_sync/jobs/sync_simple_table_job_spec.rb +5 -12
- data/spec/canvas_sync/jobs/sync_submissions_job_spec.rb +2 -1
- data/spec/canvas_sync/jobs/sync_terms_job_spec.rb +1 -4
- data/spec/dummy/config/environments/test.rb +2 -0
- data/spec/dummy/db/schema.rb +9 -1
- data/spec/job_batching/batch_aware_job_spec.rb +100 -0
- data/spec/job_batching/batch_spec.rb +363 -0
- data/spec/job_batching/callback_spec.rb +38 -0
- data/spec/job_batching/flow_spec.rb +91 -0
- data/spec/job_batching/integration/integration.rb +57 -0
- data/spec/job_batching/integration/nested.rb +88 -0
- data/spec/job_batching/integration/simple.rb +47 -0
- data/spec/job_batching/integration/workflow.rb +134 -0
- data/spec/job_batching/integration_helper.rb +48 -0
- data/spec/job_batching/sidekiq_spec.rb +124 -0
- data/spec/job_batching/status_spec.rb +92 -0
- data/spec/job_batching/support/base_job.rb +14 -0
- data/spec/job_batching/support/sample_callback.rb +2 -0
- data/spec/spec_helper.rb +10 -0
- metadata +91 -23
- data/lib/canvas_sync/job_chain.rb +0 -102
- data/lib/canvas_sync/jobs/fork_gather.rb +0 -74
- data/spec/canvas_sync/jobs/fork_gather_spec.rb +0 -73
- data/spec/dummy/db/test.sqlite3 +0 -0
- data/spec/dummy/log/development.log +0 -1248
- data/spec/dummy/log/test.log +0 -43258
- data/spec/support/fixtures/reports/provisioning_csv_unzipped/courses.csv +0 -3
- data/spec/support/fixtures/reports/provisioning_csv_unzipped/users.csv +0 -4
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
|
-
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
2
|
+
SHA1:
|
3
|
+
metadata.gz: b4ffe8d3a42b647f8c30f1d831c4a86998bc7c1b
|
4
|
+
data.tar.gz: 2ba762a479d2df35e22a69b7930d051a2e43bd30
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 6702f6754b217edfe2c7e4ff51c586940e7073993b5e3a79464e49308edd274af9bc8165f38aa919ef3c288ec86f1623065a91f42121f68c4da1389f27a57cb2
|
7
|
+
data.tar.gz: 71365002bcf14b762b00b73ae805862d8691a2b78ecd0254c0ef7fcf56eea6caeae838652e7ca4a685834eb380a08e782cf78e591b5af2c8950b4d4fd763e704
|
data/README.md
CHANGED
@@ -91,27 +91,45 @@ This gem also helps with syncing and processing other reports if needed. In orde
|
|
91
91
|
- Integrate your reports with the `ReportStarter`
|
92
92
|
- Tell the gem what jobs to run
|
93
93
|
|
94
|
+
### `updated_after`
|
95
|
+
An `updated_after` param may be passed when triggering a provision or making a chain:
|
96
|
+
```ruby
|
97
|
+
CanvasSync.default_provisioning_report_chain(
|
98
|
+
%i[list of models to sync], updated_after: false
|
99
|
+
)
|
100
|
+
```
|
101
|
+
It may be one of the following values:
|
102
|
+
* `false` - Will not apply any `updated_after` filtering to the requested reports
|
103
|
+
* An ISO-8601 Date - Will pass the supplied date as the `updated_after` param for the requested reports
|
104
|
+
* `true` (Default) - Will use the start date of the last successful sync
|
105
|
+
|
94
106
|
### Extensible chain
|
95
107
|
It is sometimes desired to extend or customize the chain of jobs that are run with CanvasSync.
|
96
108
|
This can be achieved with the following pattern:
|
97
109
|
|
98
110
|
```ruby
|
99
|
-
|
111
|
+
chain = CanvasSync.default_provisioning_report_chain(
|
100
112
|
%i[list of models to sync]
|
101
113
|
)
|
102
114
|
|
103
|
-
#
|
104
|
-
|
105
|
-
|
106
|
-
|
107
|
-
|
108
|
-
# Jobs placed before SyncProvisioningReportJob or after ForkGather will run once per Sync
|
109
|
-
job_chain[:jobs] << { job: CanvasSync::Jobs::ForkGather, options: {} }
|
115
|
+
# Add a custom job to the end of the chain.
|
116
|
+
chain << { job: CanvasSyncCompleteWorker, parameters: [{ job_id: job.id }] }
|
117
|
+
chain << { job: CanvasSyncCompleteWorker, options: { job_id: job.id } } # If an options key is provided, it will be automatically appended to the end of the :parameters array
|
118
|
+
|
119
|
+
chain.process!
|
110
120
|
|
111
|
-
#
|
112
|
-
|
121
|
+
# The chain object provides a fairly extensive API:
|
122
|
+
chain.insert({ job: SomeOtherJob }) # Adds the job to the end of the chain
|
123
|
+
chain.insert_at(0, { job: SomeOtherJob }) # Adds the job to the beginning of the chain
|
124
|
+
chain.insert({ job: SomeOtherJob }, after: 'CanvasSync::Jobs::SyncTermsJob') # Adds the job right after the SyncTermsJob
|
125
|
+
chain.insert({ job: SomeOtherJob }, before: 'CanvasSync::Jobs::SyncTermsJob') # Adds the job right before the SyncTermsJob
|
126
|
+
chain.insert({ job: SomeOtherJob }, with: 'CanvasSync::Jobs::SyncTermsJob') # Adds the job to be performed concurrently with the SyncTermsJob
|
113
127
|
|
114
|
-
|
128
|
+
# Some Jobs (such as the SyncTermsJob) have a sub-chain for, eg, Courses.
|
129
|
+
# chain.insert is aware of these sub-chains and will recurse into them when looking for a before:/after:/with: reference
|
130
|
+
chain.insert({ job: SomeOtherJob }, after: 'CanvasSync::Jobs::SyncCoursesJob') # Adds the job to be performed after SyncCoursesJob (which is a sub-job of the terms job and is duplicated for each term in the term_scope:)
|
131
|
+
# You can also retrieve the sub-chain like so:
|
132
|
+
chain.get_sub_chain('CanvasSync::Jobs::SyncTermsJob')
|
115
133
|
```
|
116
134
|
|
117
135
|
### Processor
|
@@ -134,9 +152,8 @@ Let's say we have a custom Canvas report called "my_really_cool_report_csv". Fir
|
|
134
152
|
|
135
153
|
```ruby
|
136
154
|
class MyReallyCoolReportJob < CanvasSync::Jobs::ReportStarter
|
137
|
-
def perform(
|
155
|
+
def perform(options)
|
138
156
|
super(
|
139
|
-
job_chain,
|
140
157
|
'my_really_cool_report_csv', # Report name
|
141
158
|
{ "parameters[param1]" => true }, # Report parameters
|
142
159
|
MyCoolProcessor.to_s, # Your processor class as a string
|
@@ -148,57 +165,6 @@ end
|
|
148
165
|
|
149
166
|
You can also see examples in `lib/canvas_sync/jobs/sync_users_job.rb` and `lib/canvas_sync/jobs/sync_provisioning_report_job.rb`.
|
150
167
|
|
151
|
-
### Start the jobs
|
152
|
-
|
153
|
-
The `CanvasSync.process_jobs` method allows you to pass in a chain of jobs to run. The job chain must be formatted like:
|
154
|
-
|
155
|
-
```ruby
|
156
|
-
{
|
157
|
-
jobs: [
|
158
|
-
{ job: JobClass, options: {} },
|
159
|
-
{ job: JobClass2, options: {} }
|
160
|
-
],
|
161
|
-
global_options: {}
|
162
|
-
}
|
163
|
-
```
|
164
|
-
|
165
|
-
Here is an example that runs our new report job first followed by the builtin provisioning job:
|
166
|
-
|
167
|
-
```ruby
|
168
|
-
job_chain = {
|
169
|
-
jobs: [
|
170
|
-
{ job: MyReallyCoolReportJob, options: {} },
|
171
|
-
{ job: CanvasSync::Jobs::SyncProvisioningReportJob, options: { models: ['users', 'courses'] } }
|
172
|
-
],
|
173
|
-
global_options: {}
|
174
|
-
}
|
175
|
-
|
176
|
-
CanvasSync.process_jobs(job_chain)
|
177
|
-
```
|
178
|
-
|
179
|
-
What if you've got some other job that you want run that doesn't deal with a report? No problem! Just make sure you call `CanvasSync.invoke_next` at the end of your job. Example:
|
180
|
-
|
181
|
-
|
182
|
-
```ruby
|
183
|
-
class SomeRandomJob < CanvasSync::Job
|
184
|
-
def perform(job_chain, options)
|
185
|
-
i_dunno_do_something!
|
186
|
-
|
187
|
-
CanvasSync.invoke_next(job_chain)
|
188
|
-
end
|
189
|
-
end
|
190
|
-
|
191
|
-
job_chain = {
|
192
|
-
jobs: [
|
193
|
-
{ job: SomeRandomJob, options: {} },
|
194
|
-
{ job: CanvasSync::Jobs::SyncProvisioningReportJob, options: { models: ['users', 'courses'] } }
|
195
|
-
],
|
196
|
-
global_options: {}
|
197
|
-
}
|
198
|
-
|
199
|
-
CanvasSync.process_jobs(job_chain)
|
200
|
-
```
|
201
|
-
|
202
168
|
### Batching
|
203
169
|
|
204
170
|
The provisioning report uses the `CanvasSync::Importers::BulkImporter` class to bulk import rows with the activerecord-import gem. It inserts rows in batches of 10,000 by default. This can be customized by setting the `BULK_IMPORTER_BATCH_SIZE` environment variable.
|
@@ -257,6 +223,14 @@ class CanvasSyncModel < ApplicationRecord
|
|
257
223
|
end
|
258
224
|
```
|
259
225
|
|
226
|
+
### Job Batching
|
227
|
+
CanvasSync adds a `CanvasSync::JobBatches` module. It adds Sidekiq/sidekiq-batch like support for Job Batches.
|
228
|
+
It integrates automatically with both Sidekiq and ActiveJob. The API is highly similar to the Sidekiq-batch implementation,
|
229
|
+
documentation for which can be found at https://github.com/mperham/sidekiq/wiki/Batches
|
230
|
+
|
231
|
+
A batch can be created using `Sidekiq::Batch` or `CanvasSync::JobBatches::Batch`.
|
232
|
+
|
233
|
+
Also see `canvas_sync/jobs/begin_sync_chain_job`, `canvas_sync/job_batches/jobs/serial_batch_job`, or `canvas_sync/job_batches/jobs/concurrent_batch_job` for example usage.
|
260
234
|
|
261
235
|
## Legacy Support
|
262
236
|
|
@@ -308,80 +282,19 @@ end
|
|
308
282
|
## Synchronize different reports
|
309
283
|
CanvasSync provides the functionality to import data from other reports into a specific table.
|
310
284
|
|
311
|
-
This can be
|
312
|
-
|
313
|
-
```ruby
|
314
|
-
CanvasSync.provisioning_sync(<array of models to sync>, term_scope: <optional term scope>)
|
315
|
-
CanvasSync
|
316
|
-
.simple_report_sync(
|
317
|
-
[
|
318
|
-
{
|
319
|
-
report_name: <report name>,
|
320
|
-
model: <model to sync>,
|
321
|
-
params: <hash with the require parameters the report needs to sync>
|
322
|
-
},
|
323
|
-
{
|
324
|
-
report_name: <report name>,
|
325
|
-
model: <model to sync>,
|
326
|
-
params: <hash with the require parameters the report needs to sync>
|
327
|
-
},
|
328
|
-
...
|
329
|
-
],
|
330
|
-
term_scope: <optional term scope>
|
331
|
-
)
|
332
|
-
```
|
333
|
-
|
334
|
-
Example:
|
285
|
+
This can be achieved by using the following method
|
335
286
|
|
336
287
|
```ruby
|
337
|
-
CanvasSync
|
338
|
-
|
339
|
-
|
340
|
-
|
341
|
-
|
342
|
-
|
343
|
-
|
344
|
-
|
345
|
-
|
346
|
-
|
347
|
-
},
|
348
|
-
{
|
349
|
-
report_name: 'proservices_provisioning_csv',
|
350
|
-
model: 'accounts',
|
351
|
-
params: {
|
352
|
-
"parameters[include_deleted]" => true,
|
353
|
-
"parameters[accounts]" => true
|
354
|
-
}
|
355
|
-
}
|
356
|
-
]
|
357
|
-
)
|
358
|
-
```
|
359
|
-
|
360
|
-
Example with the term_scope active:
|
361
|
-
|
362
|
-
```ruby
|
363
|
-
CanvasSync
|
364
|
-
.simple_report_sync(
|
365
|
-
[
|
366
|
-
{
|
367
|
-
report_name: 'proservices_provisioning_csv',
|
368
|
-
model: 'sections',
|
369
|
-
params: {
|
370
|
-
"parameters[include_deleted]" => true,
|
371
|
-
"parameters[sections]" => true
|
372
|
-
}
|
373
|
-
},
|
374
|
-
{
|
375
|
-
report_name: 'proservices_provisioning_csv',
|
376
|
-
model: 'courses',
|
377
|
-
params: {
|
378
|
-
"parameters[include_deleted]" => true,
|
379
|
-
"parameters[courses]" => true
|
380
|
-
}
|
381
|
-
}
|
382
|
-
],
|
383
|
-
term_scope: 'active'
|
384
|
-
)
|
288
|
+
chain = CanvasSync.default_provisioning_report_chain
|
289
|
+
chain << {
|
290
|
+
job: CanvasSync::Jobs::SyncSimpleTableJob,
|
291
|
+
options: {
|
292
|
+
report_name: <report name>,
|
293
|
+
model: <model to sync>,
|
294
|
+
params: <hash with the required parameters the report needs to sync>
|
295
|
+
},
|
296
|
+
}
|
297
|
+
chain.process!
|
385
298
|
```
|
386
299
|
|
387
300
|
## Configuration
|
@@ -421,7 +334,6 @@ class CanvasSyncStarterWorker
|
|
421
334
|
}
|
422
335
|
}
|
423
336
|
)
|
424
|
-
CanvasSync.invoke_next(job_chain)
|
425
337
|
end
|
426
338
|
|
427
339
|
def self.handle_canvas_sync_error(error, **options)
|
@@ -64,12 +64,13 @@ module CanvasSync
|
|
64
64
|
columns = columns.dup
|
65
65
|
|
66
66
|
update_conditions = {
|
67
|
-
condition: condition_sql(klass, columns
|
67
|
+
condition: condition_sql(klass, columns),
|
68
68
|
columns: columns
|
69
69
|
}
|
70
70
|
update_conditions[:conflict_target] = conflict_target if conflict_target
|
71
71
|
|
72
72
|
options = { validate: false, on_duplicate_key_update: update_conditions }.merge(import_args)
|
73
|
+
|
73
74
|
options.delete(:on_duplicate_key_update) if options.key?(:on_duplicate_key_ignore)
|
74
75
|
klass.import(columns, rows, options)
|
75
76
|
end
|
@@ -84,14 +85,10 @@ module CanvasSync
|
|
84
85
|
# started_at = Time.now
|
85
86
|
# run_the_users_sync!
|
86
87
|
# changed = User.where("updated_at >= ?", started_at)
|
87
|
-
def self.condition_sql(klass, columns
|
88
|
+
def self.condition_sql(klass, columns)
|
88
89
|
columns_str = columns.map { |c| "#{klass.quoted_table_name}.#{c}" }.join(", ")
|
89
90
|
excluded_str = columns.map { |c| "EXCLUDED.#{c}" }.join(", ")
|
90
|
-
|
91
|
-
if klass.column_names.include?("updated_at") && report_start
|
92
|
-
condition_sql += " AND #{klass.quoted_table_name}.updated_at < '#{report_start}'"
|
93
|
-
end
|
94
|
-
condition_sql
|
91
|
+
"(#{columns_str}) IS DISTINCT FROM (#{excluded_str})"
|
95
92
|
end
|
96
93
|
|
97
94
|
def self.batch_size
|
data/lib/canvas_sync/job.rb
CHANGED
@@ -3,7 +3,7 @@ require "active_job"
|
|
3
3
|
module CanvasSync
|
4
4
|
# Inherit from this class to build a Job that will log to the canvas_sync_job_logs table
|
5
5
|
class Job < ActiveJob::Base
|
6
|
-
attr_reader :
|
6
|
+
attr_reader :job_log
|
7
7
|
|
8
8
|
before_enqueue do |job|
|
9
9
|
create_job_log(job)
|
@@ -15,12 +15,6 @@ module CanvasSync
|
|
15
15
|
@job_log.started_at = Time.now
|
16
16
|
@job_log.save
|
17
17
|
|
18
|
-
if job.arguments[0].is_a?(Hash) && job.arguments[0].include?(:jobs)
|
19
|
-
# @job_chain = JobChain.new(job.arguments[0])
|
20
|
-
@job_chain = job.arguments[0]
|
21
|
-
job.arguments[0] = @job_chain
|
22
|
-
end
|
23
|
-
|
24
18
|
begin
|
25
19
|
block.call
|
26
20
|
@job_log.status = JobLog::SUCCESS_STATUS
|
@@ -28,11 +22,11 @@ module CanvasSync
|
|
28
22
|
@job_log.exception = "#{e.class}: #{e.message}"
|
29
23
|
@job_log.backtrace = e.backtrace.join('\n')
|
30
24
|
@job_log.status = JobLog::ERROR_STATUS
|
31
|
-
if
|
25
|
+
if batch_context&.[](:on_failure)&.present?
|
32
26
|
begin
|
33
|
-
class_name, method =
|
27
|
+
class_name, method = batch_context[:on_failure].split('.')
|
34
28
|
klass = class_name.constantize
|
35
|
-
klass.send(method.to_sym, e,
|
29
|
+
klass.send(method.to_sym, e, batch_context: batch_context, job_log: @job_log)
|
36
30
|
rescue => e2
|
37
31
|
@job_log.backtrace += "\n\nError Occurred while handling an Error: #{e2.class}: #{e2.message}"
|
38
32
|
@job_log.backtrace += "\n" + e2.backtrace.join('\n')
|