switchman-inst-jobs 3.0.5 → 3.1.2
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/lib/switchman_inst_jobs/delayed/backend/base.rb +1 -2
- data/lib/switchman_inst_jobs/delayed/settings.rb +9 -0
- data/lib/switchman_inst_jobs/delayed/worker/health_check.rb +15 -14
- data/lib/switchman_inst_jobs/jobs_migrator.rb +49 -34
- data/lib/switchman_inst_jobs/switchman/shard.rb +8 -1
- data/lib/switchman_inst_jobs/version.rb +1 -1
- data/lib/switchman_inst_jobs.rb +1 -0
- metadata +14 -13
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 4efbe05e879c9162df06f945af688c64876b9c56cc870509687160549359fd39
|
4
|
+
data.tar.gz: e32c8a6dfecd0b6c760d07a4d45eeaf6651d6cc7e70e7b6418d82c5a112f70cd
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 4fe0103d1b4bc305f0c85ba2135366968eb7c33bb6482b6d302dde9b9532db1d3d09fac64d90dad16fe6c6a438236ede5732d16a22d8538053d814010c9d2c87
|
7
|
+
data.tar.gz: feb2e546ee06bc38f964f58e63cfb59fdc25757952762ef8f8faf0521050d264e9f018ea8e6bb0131b277997d63035f68562cf45a7af13886fbfd80f481f5515
|
@@ -43,8 +43,7 @@ module SwitchmanInstJobs
|
|
43
43
|
end
|
44
44
|
|
45
45
|
def configured_shard_ids
|
46
|
-
|
47
|
-
map { |w| w['shard'] }.compact.uniq
|
46
|
+
::SwitchmanInstJobs::Delayed::Settings.configured_shard_ids
|
48
47
|
end
|
49
48
|
|
50
49
|
def processes_locked_locally
|
@@ -18,22 +18,23 @@ module SwitchmanInstJobs
|
|
18
18
|
::Delayed::Settings.worker_health_check_config['service_name'] = original_service_name
|
19
19
|
end
|
20
20
|
|
21
|
-
def reschedule_abandoned_jobs
|
22
|
-
|
23
|
-
|
24
|
-
|
25
|
-
|
26
|
-
|
21
|
+
def reschedule_abandoned_jobs
|
22
|
+
shard_ids = ::SwitchmanInstJobs::Delayed::Settings.configured_shard_ids
|
23
|
+
shards = shard_ids.map { |shard_id| ::Delayed::Worker.shard(shard_id) }
|
24
|
+
::Switchman::Shard.with_each_shard(shards, [:delayed_jobs]) do
|
25
|
+
dj_shard = ::Switchman::Shard.current(:delayed_jobs)
|
26
|
+
dj_shard.activate do
|
27
|
+
munge_service_name(dj_shard) do
|
28
|
+
# because this rescheduling process is running on every host, we need
|
29
|
+
# to make sure that it's functioning for each shard the current
|
30
|
+
# host is programmed to interact with, but ONLY for those shards.
|
31
|
+
# reading the config lets us iterate over any shards this host should
|
32
|
+
# work with and lets us pick the correct service name to identify which
|
33
|
+
# hosts are currently alive and valid via the health checks
|
34
|
+
super()
|
35
|
+
end
|
27
36
|
end
|
28
37
|
end
|
29
|
-
|
30
|
-
::Switchman::Shard.with_each_shard(shards, [:delayed_jobs], exception: :ignore) do
|
31
|
-
shard = ::Switchman::Shard.current(:delayed_jobs)
|
32
|
-
singleton = <<~SINGLETON
|
33
|
-
periodic: Delayed::Worker::HealthCheck.reschedule_abandoned_jobs:#{shard.id}
|
34
|
-
SINGLETON
|
35
|
-
delay(singleton: singleton).reschedule_abandoned_jobs(call_super: shard)
|
36
|
-
end
|
37
38
|
end
|
38
39
|
end
|
39
40
|
end
|
@@ -39,16 +39,12 @@ module SwitchmanInstJobs
|
|
39
39
|
|
40
40
|
# Do the updates in batches and then just clear redis instead of clearing them one at a time
|
41
41
|
target_shards.each do |target_shard, shards|
|
42
|
-
|
42
|
+
updates = { delayed_jobs_shard_id: target_shard, block_stranded: true }
|
43
|
+
updates[:updated_at] = Time.zone.now if ::Switchman::Shard.column_names.include?('updated_at')
|
44
|
+
::Switchman::Shard.where(id: shards).update_all(updates)
|
43
45
|
end
|
44
46
|
clear_shard_cache
|
45
47
|
|
46
|
-
# Wait a little over the 60 second in-process shard cache clearing
|
47
|
-
# threshold to ensure that all new stranded jobs are now being
|
48
|
-
# enqueued with next_in_strand: false
|
49
|
-
Rails.logger.debug('Waiting for caches to clear')
|
50
|
-
sleep(65) unless @skip_cache_wait
|
51
|
-
|
52
48
|
::Switchman::Shard.clear_cache
|
53
49
|
# rubocop:disable Style/CombinableLoops
|
54
50
|
# We first migrate strands so that we can stop blocking strands before we migrate unstranded jobs
|
@@ -59,11 +55,33 @@ module SwitchmanInstJobs
|
|
59
55
|
source_shards.each do |s|
|
60
56
|
::Switchman::Shard.lookup(s).activate(:delayed_jobs) { migrate_everything }
|
61
57
|
end
|
58
|
+
ensure_unblock_stranded_for(shard_map.map(&:first))
|
62
59
|
# rubocop:enable Style/CombinableLoops
|
63
60
|
end
|
64
61
|
|
65
|
-
|
62
|
+
# if :migrate_strands ran on any shards that fell into scenario 1, then
|
63
|
+
# block_stranded never got flipped, so do that now.
|
64
|
+
def ensure_unblock_stranded_for(shards)
|
65
|
+
shards = ::Switchman::Shard.where(id: shards, block_stranded: true).to_a
|
66
|
+
return unless shards.any?
|
67
|
+
|
68
|
+
::Switchman::Shard.where(id: shards).update_all(block_stranded: false)
|
69
|
+
clear_shard_cache
|
70
|
+
|
71
|
+
# shards is an array of shard objects that is now stale cause block_stranded has been updated.
|
72
|
+
shards.map(&:delayed_jobs_shard).uniq.each do |dj_shard|
|
73
|
+
unblock_strands(dj_shard)
|
74
|
+
end
|
75
|
+
end
|
76
|
+
|
77
|
+
def clear_shard_cache(debug_message = nil)
|
66
78
|
::Switchman.cache.clear
|
79
|
+
Rails.logger.debug("Waiting for caches to clear #{debug_message}")
|
80
|
+
# Wait a little over the 60 second in-process shard cache clearing
|
81
|
+
# threshold to ensure that all new stranded jobs are now being
|
82
|
+
# enqueued with next_in_strand: false
|
83
|
+
# @skip_cache_wait is for spec usage only
|
84
|
+
sleep(65) unless @skip_cache_wait
|
67
85
|
end
|
68
86
|
|
69
87
|
# This method expects that all relevant shards already have block_stranded: true
|
@@ -125,7 +143,7 @@ module SwitchmanInstJobs
|
|
125
143
|
update_all(next_in_strand: false)
|
126
144
|
end
|
127
145
|
|
128
|
-
# 4) is taken care of here, by
|
146
|
+
# 4) is taken care of here, by leaving next_in_strand alone and
|
129
147
|
# it should execute on the new shard
|
130
148
|
batch_move_jobs(
|
131
149
|
target_shard: target_shard,
|
@@ -141,35 +159,32 @@ module SwitchmanInstJobs
|
|
141
159
|
updated = ::Switchman::Shard.where(id: source_shard_ids, block_stranded: true).
|
142
160
|
update_all(block_stranded: false)
|
143
161
|
# If this is being manually re-run for some reason to clean something up, don't wait for nothing to happen
|
144
|
-
unless updated.zero?
|
145
|
-
|
146
|
-
# Wait a little over the 60 second in-process shard cache clearing
|
147
|
-
# threshold to ensure that all new stranded jobs are now being
|
148
|
-
# enqueued with next_in_strand: false
|
149
|
-
Rails.logger.debug("Waiting for caches to clear (#{source_shard.id} -> #{target_shard.id})")
|
150
|
-
# for spec usage only
|
151
|
-
sleep(65) unless @skip_cache_wait
|
152
|
-
end
|
162
|
+
clear_shard_cache("(#{source_shard.id} -> #{target_shard.id})") unless updated.zero?
|
163
|
+
|
153
164
|
::Switchman::Shard.clear_cache
|
154
165
|
# At this time, let's unblock all the strands on the target shard that aren't being held by a blocker
|
155
166
|
# but actually could have run and we just didn't know it because we didn't know if they had jobs
|
156
167
|
# on the source shard
|
157
|
-
target_shard
|
158
|
-
|
159
|
-
|
160
|
-
|
161
|
-
|
162
|
-
|
163
|
-
|
164
|
-
|
165
|
-
|
166
|
-
|
167
|
-
|
168
|
-
|
169
|
-
|
170
|
-
|
171
|
-
|
172
|
-
|
168
|
+
unblock_strands(target_shard)
|
169
|
+
end
|
170
|
+
end
|
171
|
+
end
|
172
|
+
|
173
|
+
def unblock_strands(target_shard)
|
174
|
+
target_shard.activate(:delayed_jobs) do
|
175
|
+
loop do
|
176
|
+
# We only want to unlock stranded jobs where they don't belong to a blocked shard (if they *do* belong)
|
177
|
+
# to a blocked shard, they must be part of a concurrent jobs migration from a different source shard to
|
178
|
+
# this target shard, so we shouldn't unlock them yet. We only ever unlock one job here to keep the
|
179
|
+
# logic cleaner; if the job is n-stranded, after the first one runs, the trigger will unlock larger
|
180
|
+
# batches
|
181
|
+
break if ::Delayed::Job.where(id: ::Delayed::Job.select('DISTINCT ON (strand) id').
|
182
|
+
where.not(strand: nil).
|
183
|
+
where.not(shard_id: ::Switchman::Shard.where(block_stranded: true).pluck(:id)).where(
|
184
|
+
::Delayed::Job.select(1).from("#{::Delayed::Job.quoted_table_name} dj2").
|
185
|
+
where("dj2.next_in_strand = true OR dj2.source = 'JobsMigrator::StrandBlocker'").
|
186
|
+
where('dj2.strand = delayed_jobs.strand').arel.exists.not
|
187
|
+
).order(:strand, :strand_order_override, :id)).limit(500).update_all(next_in_strand: true).zero?
|
173
188
|
end
|
174
189
|
end
|
175
190
|
end
|
@@ -39,7 +39,14 @@ module SwitchmanInstJobs
|
|
39
39
|
|
40
40
|
def unhold_jobs!
|
41
41
|
self.jobs_held = false
|
42
|
-
|
42
|
+
if changed?
|
43
|
+
save!
|
44
|
+
# Wait a little over the 60 second in-process shard cache clearing
|
45
|
+
# threshold to ensure that all new jobs are now being enqueued
|
46
|
+
# unlocked
|
47
|
+
Rails.logger.debug('Waiting for caches to clear')
|
48
|
+
sleep(65)
|
49
|
+
end
|
43
50
|
delayed_jobs_shard.activate(:delayed_jobs) do
|
44
51
|
::Delayed::Job.where(locked_by: ::Delayed::Backend::Base::ON_HOLD_LOCKED_BY, shard_id: id).
|
45
52
|
in_batches(of: 10_000).
|
data/lib/switchman_inst_jobs.rb
CHANGED
@@ -38,6 +38,7 @@ end
|
|
38
38
|
|
39
39
|
require 'switchman_inst_jobs/active_record/connection_adapters/postgresql_adapter'
|
40
40
|
require 'switchman_inst_jobs/active_record/migration'
|
41
|
+
require 'switchman_inst_jobs/delayed/settings'
|
41
42
|
require 'switchman_inst_jobs/delayed/backend/base'
|
42
43
|
require 'switchman_inst_jobs/delayed/message_sending'
|
43
44
|
require 'switchman_inst_jobs/delayed/pool'
|
metadata
CHANGED
@@ -1,35 +1,35 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: switchman-inst-jobs
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 3.
|
4
|
+
version: 3.1.2
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Bryan Petty
|
8
|
-
autorequire:
|
8
|
+
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date:
|
11
|
+
date: 2021-01-26 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: inst-jobs
|
15
15
|
requirement: !ruby/object:Gem::Requirement
|
16
16
|
requirements:
|
17
|
-
- - "~>"
|
18
|
-
- !ruby/object:Gem::Version
|
19
|
-
version: '1.0'
|
20
17
|
- - ">="
|
21
18
|
- !ruby/object:Gem::Version
|
22
19
|
version: 1.0.3
|
20
|
+
- - "<"
|
21
|
+
- !ruby/object:Gem::Version
|
22
|
+
version: '3.0'
|
23
23
|
type: :runtime
|
24
24
|
prerelease: false
|
25
25
|
version_requirements: !ruby/object:Gem::Requirement
|
26
26
|
requirements:
|
27
|
-
- - "~>"
|
28
|
-
- !ruby/object:Gem::Version
|
29
|
-
version: '1.0'
|
30
27
|
- - ">="
|
31
28
|
- !ruby/object:Gem::Version
|
32
29
|
version: 1.0.3
|
30
|
+
- - "<"
|
31
|
+
- !ruby/object:Gem::Version
|
32
|
+
version: '3.0'
|
33
33
|
- !ruby/object:Gem::Dependency
|
34
34
|
name: parallel
|
35
35
|
requirement: !ruby/object:Gem::Requirement
|
@@ -260,7 +260,7 @@ dependencies:
|
|
260
260
|
- - "~>"
|
261
261
|
- !ruby/object:Gem::Version
|
262
262
|
version: '1.4'
|
263
|
-
description:
|
263
|
+
description:
|
264
264
|
email:
|
265
265
|
- bpetty@instructure.com
|
266
266
|
executables: []
|
@@ -303,6 +303,7 @@ files:
|
|
303
303
|
- lib/switchman_inst_jobs/delayed/backend/base.rb
|
304
304
|
- lib/switchman_inst_jobs/delayed/message_sending.rb
|
305
305
|
- lib/switchman_inst_jobs/delayed/pool.rb
|
306
|
+
- lib/switchman_inst_jobs/delayed/settings.rb
|
306
307
|
- lib/switchman_inst_jobs/delayed/worker.rb
|
307
308
|
- lib/switchman_inst_jobs/delayed/worker/health_check.rb
|
308
309
|
- lib/switchman_inst_jobs/engine.rb
|
@@ -319,7 +320,7 @@ homepage: https://github.com/instructure/switchman-inst-jobs
|
|
319
320
|
licenses:
|
320
321
|
- MIT
|
321
322
|
metadata: {}
|
322
|
-
post_install_message:
|
323
|
+
post_install_message:
|
323
324
|
rdoc_options: []
|
324
325
|
require_paths:
|
325
326
|
- lib
|
@@ -334,8 +335,8 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
334
335
|
- !ruby/object:Gem::Version
|
335
336
|
version: '0'
|
336
337
|
requirements: []
|
337
|
-
rubygems_version: 3.
|
338
|
-
signing_key:
|
338
|
+
rubygems_version: 3.0.3
|
339
|
+
signing_key:
|
339
340
|
specification_version: 4
|
340
341
|
summary: Switchman and Instructure Jobs compatibility gem.
|
341
342
|
test_files: []
|