inst-jobs 1.0.4 → 2.1.3
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/lib/delayed/backend/base.rb +9 -1
- data/lib/delayed/lifecycle.rb +1 -0
- data/lib/delayed/periodic.rb +17 -4
- data/lib/delayed/version.rb +1 -1
- data/lib/delayed/worker.rb +46 -25
- data/lib/delayed/worker/health_check.rb +34 -19
- data/spec/delayed/periodic_spec.rb +41 -0
- data/spec/delayed/worker/health_check_spec.rb +9 -0
- data/spec/delayed/worker_spec.rb +23 -3
- metadata +5 -3
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 4c31ed6d846425c9bf022bb8c744681019cbf0f0192d4e0ee7f0a5d7dc44a65c
|
4
|
+
data.tar.gz: 4a5b940ba8bd6770209d93e20ccc217d4ab5915bcd1a5791de70b076e7cecf97
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 07377763c26979774add4b3445aa72ebc2cbff6aabe595e1157c883a90dea48407bc8ecb87f5532265178a96b27548caaf5ce13a0789c469272980bc864a2882
|
7
|
+
data.tar.gz: 7ddd291e18be337ae1d858d016af92cc255c111e5141eafca8cee598fcdae9563a74983ba6b98daeb50c1fe599490dd9c962e1c722d5dcea5083bf16a619641d
|
data/lib/delayed/backend/base.rb
CHANGED
@@ -87,6 +87,10 @@ module Delayed
|
|
87
87
|
batches[batch_enqueue_args] << kwargs
|
88
88
|
return true
|
89
89
|
else
|
90
|
+
if kwargs[:on_conflict].present?
|
91
|
+
Delayed::Logging.logger.warn("[DELAYED_JOB] WARNING: providing 'on_conflict' as an option to a non-singleton job will have no effect. Discarding.")
|
92
|
+
kwargs.delete(:on_conflict)
|
93
|
+
end
|
90
94
|
job = self.create(**kwargs)
|
91
95
|
end
|
92
96
|
|
@@ -178,6 +182,10 @@ module Delayed
|
|
178
182
|
expires_at && (self.class.db_time_now >= expires_at)
|
179
183
|
end
|
180
184
|
|
185
|
+
def inferred_max_attempts
|
186
|
+
self.max_attempts || Delayed::Settings.max_attempts
|
187
|
+
end
|
188
|
+
|
181
189
|
# Reschedule the job in the future (when a job fails).
|
182
190
|
# Uses an exponential scale depending on the number of failed attempts.
|
183
191
|
def reschedule(error = nil, time = nil)
|
@@ -190,7 +198,7 @@ module Delayed
|
|
190
198
|
|
191
199
|
self.attempts += 1 unless return_code == :unlock
|
192
200
|
|
193
|
-
if self.attempts >=
|
201
|
+
if self.attempts >= self.inferred_max_attempts
|
194
202
|
permanent_failure error || "max attempts reached"
|
195
203
|
elsif expired?
|
196
204
|
permanent_failure error || "job has expired"
|
data/lib/delayed/lifecycle.rb
CHANGED
data/lib/delayed/periodic.rb
CHANGED
@@ -49,10 +49,23 @@ class Periodic
|
|
49
49
|
end
|
50
50
|
|
51
51
|
def enqueue
|
52
|
-
Delayed::Job.enqueue(self,
|
53
|
-
|
54
|
-
|
55
|
-
|
52
|
+
Delayed::Job.enqueue(self, **enqueue_args)
|
53
|
+
end
|
54
|
+
|
55
|
+
def enqueue_args
|
56
|
+
# yes, checking for whether it is actually the boolean literal false,
|
57
|
+
# which means the consuming code really does not want this job to be
|
58
|
+
# a singleton at all.
|
59
|
+
non_singleton_periodic_job = @job_args[:singleton] == false
|
60
|
+
inferred_args = {
|
61
|
+
max_attempts: 1,
|
62
|
+
run_at: @cron.next_time(Delayed::Periodic.now).utc.to_time,
|
63
|
+
singleton: (non_singleton_periodic_job ? nil : tag)
|
64
|
+
}
|
65
|
+
unless non_singleton_periodic_job
|
66
|
+
inferred_args[:on_conflict] = :patient
|
67
|
+
end
|
68
|
+
@job_args.merge(inferred_args)
|
56
69
|
end
|
57
70
|
|
58
71
|
def perform
|
data/lib/delayed/version.rb
CHANGED
data/lib/delayed/worker.rb
CHANGED
@@ -3,6 +3,17 @@
|
|
3
3
|
module Delayed
|
4
4
|
|
5
5
|
class TimeoutError < RuntimeError; end
|
6
|
+
class RetriableError < RuntimeError
|
7
|
+
# this error is a special case. You _should_ raise
|
8
|
+
# it from inside the rescue block for another error,
|
9
|
+
# because it indicates: "something made this job fail
|
10
|
+
# but we're pretty sure it's transient and it's safe to try again".
|
11
|
+
# the workflow is still the same (retry will happen unless
|
12
|
+
# retries are exhausted), but it won't call the :error
|
13
|
+
# callback unless it can't retry anymore. It WILL call the
|
14
|
+
# separate ":retry" callback, which is ONLY activated
|
15
|
+
# for this kind of error.
|
16
|
+
end
|
6
17
|
|
7
18
|
require 'tmpdir'
|
8
19
|
require 'set'
|
@@ -94,7 +105,11 @@ class Worker
|
|
94
105
|
end
|
95
106
|
|
96
107
|
def exit?
|
97
|
-
|
108
|
+
!!@exit || parent_exited?
|
109
|
+
end
|
110
|
+
|
111
|
+
def parent_exited?
|
112
|
+
@parent_pid && @parent_pid != Process.ppid
|
98
113
|
end
|
99
114
|
|
100
115
|
def wake_up
|
@@ -198,32 +213,38 @@ class Worker
|
|
198
213
|
end
|
199
214
|
|
200
215
|
def perform(job)
|
201
|
-
|
202
|
-
|
203
|
-
|
204
|
-
|
205
|
-
|
206
|
-
|
207
|
-
|
208
|
-
|
209
|
-
|
210
|
-
|
211
|
-
|
212
|
-
|
216
|
+
begin
|
217
|
+
count = 1
|
218
|
+
raise Delayed::Backend::JobExpired, "job expired at #{job.expires_at}" if job.expired?
|
219
|
+
self.class.lifecycle.run_callbacks(:perform, self, job) do
|
220
|
+
set_process_name("run:#{Settings.worker_procname_prefix}#{job.id}:#{job.name}")
|
221
|
+
logger.info("Processing #{log_job(job, :long)}")
|
222
|
+
runtime = Benchmark.realtime do
|
223
|
+
if job.batch?
|
224
|
+
# each job in the batch will have perform called on it, so we don't
|
225
|
+
# need a timeout around this
|
226
|
+
count = perform_batch(job)
|
227
|
+
else
|
228
|
+
job.invoke_job
|
229
|
+
end
|
230
|
+
job.destroy
|
213
231
|
end
|
214
|
-
job
|
232
|
+
logger.info("Completed #{log_job(job)} #{"%.0fms" % (runtime * 1000)}")
|
233
|
+
end
|
234
|
+
rescue ::Delayed::RetriableError => re
|
235
|
+
can_retry = job.attempts + 1 < job.inferred_max_attempts
|
236
|
+
callback_type = can_retry ? :retry : :error
|
237
|
+
self.class.lifecycle.run_callbacks(callback_type, self, job, re) do
|
238
|
+
handle_failed_job(job, re)
|
239
|
+
end
|
240
|
+
rescue SystemExit => se
|
241
|
+
# There wasn't really a failure here so no callbacks and whatnot needed,
|
242
|
+
# still reschedule the job though.
|
243
|
+
job.reschedule(se)
|
244
|
+
rescue Exception => e
|
245
|
+
self.class.lifecycle.run_callbacks(:error, self, job, e) do
|
246
|
+
handle_failed_job(job, e)
|
215
247
|
end
|
216
|
-
logger.info("Completed #{log_job(job)} #{"%.0fms" % (runtime * 1000)}")
|
217
|
-
end
|
218
|
-
count
|
219
|
-
rescue SystemExit => se
|
220
|
-
# There wasn't really a failure here so no callbacks and whatnot needed,
|
221
|
-
# still reschedule the job though.
|
222
|
-
job.reschedule(se)
|
223
|
-
count
|
224
|
-
rescue Exception => e
|
225
|
-
self.class.lifecycle.run_callbacks(:error, self, job, e) do
|
226
|
-
handle_failed_job(job, e)
|
227
248
|
end
|
228
249
|
count
|
229
250
|
end
|
@@ -22,31 +22,46 @@ module Delayed
|
|
22
22
|
|
23
23
|
def reschedule_abandoned_jobs
|
24
24
|
return if Settings.worker_health_check_type == :none
|
25
|
+
Delayed::Job.transaction do
|
26
|
+
# this job is a special case, and is not a singleton
|
27
|
+
# because if it gets wiped out suddenly during execution
|
28
|
+
# it can't go clean up it's abandoned self. Therefore,
|
29
|
+
# we try to get an advisory lock when it runs. If we succeed,
|
30
|
+
# no other job is trying to do this right now (and if we abandon the
|
31
|
+
# job, the transaction will end, releasing the advisory lock).
|
32
|
+
result = attempt_advisory_lock
|
33
|
+
return unless result
|
34
|
+
checker = Worker::HealthCheck.build(
|
35
|
+
type: Settings.worker_health_check_type,
|
36
|
+
config: Settings.worker_health_check_config,
|
37
|
+
worker_name: 'cleanup-crew'
|
38
|
+
)
|
39
|
+
live_workers = checker.live_workers
|
25
40
|
|
26
|
-
|
27
|
-
|
28
|
-
|
29
|
-
|
30
|
-
|
31
|
-
|
32
|
-
|
33
|
-
|
34
|
-
|
35
|
-
|
36
|
-
|
37
|
-
|
38
|
-
|
39
|
-
# double check that the job is still there. locked_by will immediately be reset
|
40
|
-
# to nil in this transaction by Job#reschedule
|
41
|
-
next unless Delayed::Job.where(id: job, locked_by: job.locked_by).update_all(locked_by: "abandoned job cleanup") == 1
|
42
|
-
job.reschedule
|
41
|
+
Delayed::Job.running_jobs.each do |job|
|
42
|
+
# prefetched jobs have their own way of automatically unlocking themselves
|
43
|
+
next if job.locked_by.start_with?("prefetch:")
|
44
|
+
unless live_workers.include?(job.locked_by)
|
45
|
+
begin
|
46
|
+
Delayed::Job.transaction do
|
47
|
+
# double check that the job is still there. locked_by will immediately be reset
|
48
|
+
# to nil in this transaction by Job#reschedule
|
49
|
+
next unless Delayed::Job.where(id: job, locked_by: job.locked_by).update_all(locked_by: "abandoned job cleanup") == 1
|
50
|
+
job.reschedule
|
51
|
+
end
|
52
|
+
rescue
|
53
|
+
::Rails.logger.error "Failure rescheduling abandoned job #{job.id} #{$!.inspect}"
|
43
54
|
end
|
44
|
-
rescue
|
45
|
-
::Rails.logger.error "Failure rescheduling abandoned job #{job.id} #{$!.inspect}"
|
46
55
|
end
|
47
56
|
end
|
48
57
|
end
|
49
58
|
end
|
59
|
+
|
60
|
+
def attempt_advisory_lock
|
61
|
+
lock_name = "Delayed::Worker::HealthCheck#reschedule_abandoned_jobs"
|
62
|
+
conn = ActiveRecord::Base.connection
|
63
|
+
conn.select_value("SELECT pg_try_advisory_xact_lock(#{conn.quote_table_name('half_md5_as_bigint')}('#{lock_name}'));")
|
64
|
+
end
|
50
65
|
end
|
51
66
|
|
52
67
|
attr_accessor :config, :worker_name
|
@@ -0,0 +1,41 @@
|
|
1
|
+
# frozen_string_literal: true
|
2
|
+
|
3
|
+
require 'spec_helper'
|
4
|
+
|
5
|
+
RSpec.describe Delayed::Periodic do
|
6
|
+
around(:each) do |block|
|
7
|
+
# make sure we can use ".cron" and
|
8
|
+
# such safely without leaking global state
|
9
|
+
prev_sched = Delayed::Periodic.scheduled
|
10
|
+
prev_ovr = Delayed::Periodic.overrides
|
11
|
+
Delayed::Periodic.scheduled = {}
|
12
|
+
Delayed::Periodic.overrides = {}
|
13
|
+
block.call
|
14
|
+
ensure
|
15
|
+
Delayed::Periodic.scheduled = prev_sched
|
16
|
+
Delayed::Periodic.overrides = prev_ovr
|
17
|
+
Delayed::Job.delete_all
|
18
|
+
end
|
19
|
+
|
20
|
+
describe ".cron" do
|
21
|
+
let(:job_name){ 'just a test'}
|
22
|
+
it "provides a tag by default for periodic jobs" do
|
23
|
+
Delayed::Periodic.cron job_name, '*/10 * * * *' do
|
24
|
+
# no-op
|
25
|
+
end
|
26
|
+
instance = Delayed::Periodic.scheduled[job_name]
|
27
|
+
expect(instance).to_not be_nil
|
28
|
+
expect(instance.enqueue_args[:singleton]).to eq("periodic: just a test")
|
29
|
+
end
|
30
|
+
|
31
|
+
it "uses no singleton if told to skip" do
|
32
|
+
Delayed::Periodic.cron job_name, '*/10 * * * *', {singleton: false} do
|
33
|
+
# no-op
|
34
|
+
end
|
35
|
+
instance = Delayed::Periodic.scheduled[job_name]
|
36
|
+
expect(instance).to_not be_nil
|
37
|
+
expect(instance.enqueue_args[:singleton]).to be_nil
|
38
|
+
Delayed::Periodic.perform_audit!
|
39
|
+
end
|
40
|
+
end
|
41
|
+
end
|
@@ -107,6 +107,15 @@ RSpec.describe Delayed::Worker::HealthCheck do
|
|
107
107
|
@dead_job.reload
|
108
108
|
expect(@dead_job.locked_by).to eq 'prefetch:some_node'
|
109
109
|
end
|
110
|
+
|
111
|
+
it "bails immediately if advisory lock already taken" do
|
112
|
+
allow(Delayed::Worker::HealthCheck).to receive(:attempt_advisory_lock).and_return(false)
|
113
|
+
Delayed::Worker::HealthCheck.reschedule_abandoned_jobs
|
114
|
+
@dead_job.reload
|
115
|
+
expect(@dead_job.run_at.to_i).to eq(initial_run_at.to_i)
|
116
|
+
expect(@dead_job.locked_at).to_not be_nil
|
117
|
+
expect(@dead_job.locked_by).to_not be_nil
|
118
|
+
end
|
110
119
|
end
|
111
120
|
|
112
121
|
describe '#initialize' do
|
data/spec/delayed/worker_spec.rb
CHANGED
@@ -6,6 +6,11 @@ describe Delayed::Worker do
|
|
6
6
|
let(:worker_config) { {
|
7
7
|
queue: "test", min_priority: 1, max_priority: 2, stuff: "stuff",
|
8
8
|
}.freeze }
|
9
|
+
let(:job_attrs) { {
|
10
|
+
id: 42, name: "testjob", full_name: "testfullname", :last_error= => nil,
|
11
|
+
attempts: 1, reschedule: nil, :expired? => false,
|
12
|
+
payload_object: {}, priority: 25
|
13
|
+
}.freeze }
|
9
14
|
subject { described_class.new(worker_config.dup) }
|
10
15
|
|
11
16
|
after { Delayed::Worker.lifecycle.reset! }
|
@@ -14,9 +19,24 @@ describe Delayed::Worker do
|
|
14
19
|
it "fires off an error callback when a job raises an exception" do
|
15
20
|
fired = false
|
16
21
|
Delayed::Worker.lifecycle.before(:error) {|worker, exception| fired = true}
|
17
|
-
job = double(
|
18
|
-
subject.perform(job)
|
22
|
+
job = double(job_attrs)
|
23
|
+
output_count = subject.perform(job)
|
19
24
|
expect(fired).to be_truthy
|
25
|
+
expect(output_count).to eq(1)
|
26
|
+
end
|
27
|
+
|
28
|
+
it "uses the retry callback for a retriable exception" do
|
29
|
+
error_fired = retry_fired = false
|
30
|
+
Delayed::Worker.lifecycle.before(:error) {|worker, exception| error_fired = true }
|
31
|
+
Delayed::Worker.lifecycle.before(:retry) {|worker, exception| retry_fired = true}
|
32
|
+
job = Delayed::Job.new(payload_object: {}, priority: 25, strand: "test_jobs", max_attempts: 3)
|
33
|
+
expect(job).to receive(:invoke_job) do
|
34
|
+
raise Delayed::RetriableError, "that's all this job does"
|
35
|
+
end
|
36
|
+
output_count = subject.perform(job)
|
37
|
+
expect(error_fired).to be_falsey
|
38
|
+
expect(retry_fired).to be_truthy
|
39
|
+
expect(output_count).to eq(1)
|
20
40
|
end
|
21
41
|
|
22
42
|
it "reloads" do
|
@@ -35,7 +55,7 @@ describe Delayed::Worker do
|
|
35
55
|
expect(ActionDispatch::Reloader).to receive(:prepare!).once
|
36
56
|
expect(ActionDispatch::Reloader).to receive(:cleanup!).once
|
37
57
|
end
|
38
|
-
job = double(
|
58
|
+
job = double(job_attrs)
|
39
59
|
subject.perform(job)
|
40
60
|
end
|
41
61
|
end
|
metadata
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: inst-jobs
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 1.
|
4
|
+
version: 2.1.3
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Tobias Luetke
|
@@ -9,7 +9,7 @@ authors:
|
|
9
9
|
autorequire:
|
10
10
|
bindir: exe
|
11
11
|
cert_chain: []
|
12
|
-
date: 2020-
|
12
|
+
date: 2020-12-22 00:00:00.000000000 Z
|
13
13
|
dependencies:
|
14
14
|
- !ruby/object:Gem::Dependency
|
15
15
|
name: activerecord
|
@@ -412,6 +412,7 @@ files:
|
|
412
412
|
- spec/delayed/cli_spec.rb
|
413
413
|
- spec/delayed/daemon_spec.rb
|
414
414
|
- spec/delayed/message_sending_spec.rb
|
415
|
+
- spec/delayed/periodic_spec.rb
|
415
416
|
- spec/delayed/server_spec.rb
|
416
417
|
- spec/delayed/settings_spec.rb
|
417
418
|
- spec/delayed/work_queue/in_process_spec.rb
|
@@ -448,7 +449,7 @@ required_ruby_version: !ruby/object:Gem::Requirement
|
|
448
449
|
requirements:
|
449
450
|
- - ">="
|
450
451
|
- !ruby/object:Gem::Version
|
451
|
-
version: '2.
|
452
|
+
version: '2.6'
|
452
453
|
required_rubygems_version: !ruby/object:Gem::Requirement
|
453
454
|
requirements:
|
454
455
|
- - ">="
|
@@ -480,6 +481,7 @@ test_files:
|
|
480
481
|
- spec/delayed/cli_spec.rb
|
481
482
|
- spec/delayed/daemon_spec.rb
|
482
483
|
- spec/delayed/worker_spec.rb
|
484
|
+
- spec/delayed/periodic_spec.rb
|
483
485
|
- spec/delayed/message_sending_spec.rb
|
484
486
|
- spec/delayed/settings_spec.rb
|
485
487
|
- spec/delayed/work_queue/in_process_spec.rb
|