sidekiq 3.5.4 → 5.2.7
Sign up to get free protection for your applications and to get access to all the features.
Potentially problematic release.
This version of sidekiq might be problematic. Click here for more details.
- checksums.yaml +5 -5
- data/.circleci/config.yml +61 -0
- data/{Contributing.md → .github/contributing.md} +0 -0
- data/.github/issue_template.md +11 -0
- data/.gitignore +3 -0
- data/.travis.yml +5 -10
- data/4.0-Upgrade.md +53 -0
- data/5.0-Upgrade.md +56 -0
- data/COMM-LICENSE +13 -11
- data/Changes.md +376 -1
- data/Ent-Changes.md +201 -2
- data/Gemfile +14 -18
- data/LICENSE +1 -1
- data/Pro-3.0-Upgrade.md +44 -0
- data/Pro-4.0-Upgrade.md +35 -0
- data/Pro-Changes.md +307 -2
- data/README.md +34 -22
- data/Rakefile +3 -3
- data/bin/sidekiq +0 -1
- data/bin/sidekiqctl +13 -86
- data/bin/sidekiqload +23 -27
- data/code_of_conduct.md +50 -0
- data/lib/generators/sidekiq/templates/worker_spec.rb.erb +3 -3
- data/lib/generators/sidekiq/templates/worker_test.rb.erb +6 -6
- data/lib/sidekiq.rb +72 -25
- data/lib/sidekiq/api.rb +206 -73
- data/lib/sidekiq/cli.rb +145 -101
- data/lib/sidekiq/client.rb +42 -36
- data/lib/sidekiq/core_ext.rb +1 -105
- data/lib/sidekiq/ctl.rb +221 -0
- data/lib/sidekiq/delay.rb +42 -0
- data/lib/sidekiq/exception_handler.rb +4 -5
- data/lib/sidekiq/extensions/action_mailer.rb +1 -0
- data/lib/sidekiq/extensions/active_record.rb +1 -0
- data/lib/sidekiq/extensions/class_methods.rb +1 -0
- data/lib/sidekiq/extensions/generic_proxy.rb +8 -1
- data/lib/sidekiq/fetch.rb +36 -111
- data/lib/sidekiq/job_logger.rb +25 -0
- data/lib/sidekiq/job_retry.rb +262 -0
- data/lib/sidekiq/launcher.rb +129 -55
- data/lib/sidekiq/logging.rb +21 -3
- data/lib/sidekiq/manager.rb +83 -182
- data/lib/sidekiq/middleware/chain.rb +1 -0
- data/lib/sidekiq/middleware/i18n.rb +1 -0
- data/lib/sidekiq/middleware/server/active_record.rb +10 -0
- data/lib/sidekiq/paginator.rb +1 -0
- data/lib/sidekiq/processor.rb +221 -103
- data/lib/sidekiq/rails.rb +47 -27
- data/lib/sidekiq/redis_connection.rb +74 -7
- data/lib/sidekiq/scheduled.rb +87 -28
- data/lib/sidekiq/testing.rb +150 -19
- data/lib/sidekiq/testing/inline.rb +1 -0
- data/lib/sidekiq/util.rb +15 -17
- data/lib/sidekiq/version.rb +2 -1
- data/lib/sidekiq/web.rb +120 -184
- data/lib/sidekiq/web/action.rb +89 -0
- data/lib/sidekiq/web/application.rb +353 -0
- data/lib/sidekiq/{web_helpers.rb → web/helpers.rb} +123 -47
- data/lib/sidekiq/web/router.rb +100 -0
- data/lib/sidekiq/worker.rb +135 -18
- data/sidekiq.gemspec +8 -14
- data/web/assets/images/{status-sd8051fd480.png → status.png} +0 -0
- data/web/assets/javascripts/application.js +24 -20
- data/web/assets/javascripts/dashboard.js +33 -18
- data/web/assets/stylesheets/application-rtl.css +246 -0
- data/web/assets/stylesheets/application.css +401 -7
- data/web/assets/stylesheets/bootstrap-rtl.min.css +9 -0
- data/web/assets/stylesheets/bootstrap.css +4 -8
- data/web/locales/ar.yml +81 -0
- data/web/locales/cs.yml +11 -1
- data/web/locales/de.yml +1 -1
- data/web/locales/en.yml +4 -0
- data/web/locales/es.yml +4 -3
- data/web/locales/fa.yml +80 -0
- data/web/locales/fr.yml +21 -12
- data/web/locales/he.yml +79 -0
- data/web/locales/ja.yml +24 -13
- data/web/locales/ru.yml +3 -0
- data/web/locales/ur.yml +80 -0
- data/web/views/_footer.erb +7 -9
- data/web/views/_job_info.erb +5 -1
- data/web/views/_nav.erb +5 -19
- data/web/views/_paging.erb +1 -1
- data/web/views/busy.erb +18 -9
- data/web/views/dashboard.erb +5 -5
- data/web/views/dead.erb +1 -1
- data/web/views/layout.erb +13 -5
- data/web/views/morgue.erb +16 -12
- data/web/views/queue.erb +12 -11
- data/web/views/queues.erb +5 -3
- data/web/views/retries.erb +19 -13
- data/web/views/retry.erb +2 -2
- data/web/views/scheduled.erb +4 -4
- data/web/views/scheduled_job_info.erb +1 -1
- metadata +45 -227
- data/lib/sidekiq/actor.rb +0 -39
- data/lib/sidekiq/middleware/server/logging.rb +0 -40
- data/lib/sidekiq/middleware/server/retry_jobs.rb +0 -206
- data/test/config.yml +0 -9
- data/test/env_based_config.yml +0 -11
- data/test/fake_env.rb +0 -0
- data/test/fixtures/en.yml +0 -2
- data/test/helper.rb +0 -49
- data/test/test_api.rb +0 -493
- data/test/test_cli.rb +0 -335
- data/test/test_client.rb +0 -194
- data/test/test_exception_handler.rb +0 -55
- data/test/test_extensions.rb +0 -126
- data/test/test_fetch.rb +0 -104
- data/test/test_logging.rb +0 -34
- data/test/test_manager.rb +0 -168
- data/test/test_middleware.rb +0 -159
- data/test/test_processor.rb +0 -237
- data/test/test_rails.rb +0 -21
- data/test/test_redis_connection.rb +0 -126
- data/test/test_retry.rb +0 -325
- data/test/test_scheduled.rb +0 -114
- data/test/test_scheduling.rb +0 -49
- data/test/test_sidekiq.rb +0 -99
- data/test/test_testing.rb +0 -142
- data/test/test_testing_fake.rb +0 -268
- data/test/test_testing_inline.rb +0 -93
- data/test/test_util.rb +0 -16
- data/test/test_web.rb +0 -608
- data/test/test_web_helpers.rb +0 -53
- data/web/assets/images/bootstrap/glyphicons-halflings-white.png +0 -0
- data/web/assets/images/bootstrap/glyphicons-halflings.png +0 -0
- data/web/assets/images/status/active.png +0 -0
- data/web/assets/images/status/idle.png +0 -0
- data/web/assets/javascripts/locales/README.md +0 -27
- data/web/assets/javascripts/locales/jquery.timeago.ar.js +0 -96
- data/web/assets/javascripts/locales/jquery.timeago.bg.js +0 -18
- data/web/assets/javascripts/locales/jquery.timeago.bs.js +0 -49
- data/web/assets/javascripts/locales/jquery.timeago.ca.js +0 -18
- data/web/assets/javascripts/locales/jquery.timeago.cs.js +0 -18
- data/web/assets/javascripts/locales/jquery.timeago.cy.js +0 -20
- data/web/assets/javascripts/locales/jquery.timeago.da.js +0 -18
- data/web/assets/javascripts/locales/jquery.timeago.de.js +0 -18
- data/web/assets/javascripts/locales/jquery.timeago.el.js +0 -18
- data/web/assets/javascripts/locales/jquery.timeago.en-short.js +0 -20
- data/web/assets/javascripts/locales/jquery.timeago.en.js +0 -20
- data/web/assets/javascripts/locales/jquery.timeago.es.js +0 -18
- data/web/assets/javascripts/locales/jquery.timeago.et.js +0 -18
- data/web/assets/javascripts/locales/jquery.timeago.fa.js +0 -22
- data/web/assets/javascripts/locales/jquery.timeago.fi.js +0 -28
- data/web/assets/javascripts/locales/jquery.timeago.fr-short.js +0 -16
- data/web/assets/javascripts/locales/jquery.timeago.fr.js +0 -17
- data/web/assets/javascripts/locales/jquery.timeago.he.js +0 -18
- data/web/assets/javascripts/locales/jquery.timeago.hr.js +0 -49
- data/web/assets/javascripts/locales/jquery.timeago.hu.js +0 -18
- data/web/assets/javascripts/locales/jquery.timeago.hy.js +0 -18
- data/web/assets/javascripts/locales/jquery.timeago.id.js +0 -18
- data/web/assets/javascripts/locales/jquery.timeago.it.js +0 -16
- data/web/assets/javascripts/locales/jquery.timeago.ja.js +0 -19
- data/web/assets/javascripts/locales/jquery.timeago.ko.js +0 -17
- data/web/assets/javascripts/locales/jquery.timeago.lt.js +0 -20
- data/web/assets/javascripts/locales/jquery.timeago.mk.js +0 -20
- data/web/assets/javascripts/locales/jquery.timeago.nl.js +0 -20
- data/web/assets/javascripts/locales/jquery.timeago.no.js +0 -18
- data/web/assets/javascripts/locales/jquery.timeago.pl.js +0 -31
- data/web/assets/javascripts/locales/jquery.timeago.pt-br.js +0 -16
- data/web/assets/javascripts/locales/jquery.timeago.pt.js +0 -16
- data/web/assets/javascripts/locales/jquery.timeago.ro.js +0 -18
- data/web/assets/javascripts/locales/jquery.timeago.rs.js +0 -49
- data/web/assets/javascripts/locales/jquery.timeago.ru.js +0 -34
- data/web/assets/javascripts/locales/jquery.timeago.sk.js +0 -18
- data/web/assets/javascripts/locales/jquery.timeago.sl.js +0 -44
- data/web/assets/javascripts/locales/jquery.timeago.sv.js +0 -18
- data/web/assets/javascripts/locales/jquery.timeago.th.js +0 -20
- data/web/assets/javascripts/locales/jquery.timeago.tr.js +0 -16
- data/web/assets/javascripts/locales/jquery.timeago.uk.js +0 -34
- data/web/assets/javascripts/locales/jquery.timeago.uz.js +0 -19
- data/web/assets/javascripts/locales/jquery.timeago.zh-cn.js +0 -20
- data/web/assets/javascripts/locales/jquery.timeago.zh-tw.js +0 -20
- data/web/views/_poll_js.erb +0 -5
@@ -0,0 +1,25 @@
|
|
1
|
+
# frozen_string_literal: true
|
2
|
+
module Sidekiq
|
3
|
+
class JobLogger
|
4
|
+
|
5
|
+
def call(item, queue)
|
6
|
+
start = ::Process.clock_gettime(::Process::CLOCK_MONOTONIC)
|
7
|
+
logger.info("start")
|
8
|
+
yield
|
9
|
+
logger.info("done: #{elapsed(start)} sec")
|
10
|
+
rescue Exception
|
11
|
+
logger.info("fail: #{elapsed(start)} sec")
|
12
|
+
raise
|
13
|
+
end
|
14
|
+
|
15
|
+
private
|
16
|
+
|
17
|
+
def elapsed(start)
|
18
|
+
(::Process.clock_gettime(::Process::CLOCK_MONOTONIC) - start).round(3)
|
19
|
+
end
|
20
|
+
|
21
|
+
def logger
|
22
|
+
Sidekiq.logger
|
23
|
+
end
|
24
|
+
end
|
25
|
+
end
|
@@ -0,0 +1,262 @@
|
|
1
|
+
# frozen_string_literal: true
|
2
|
+
require 'sidekiq/scheduled'
|
3
|
+
require 'sidekiq/api'
|
4
|
+
|
5
|
+
module Sidekiq
|
6
|
+
##
|
7
|
+
# Automatically retry jobs that fail in Sidekiq.
|
8
|
+
# Sidekiq's retry support assumes a typical development lifecycle:
|
9
|
+
#
|
10
|
+
# 0. Push some code changes with a bug in it.
|
11
|
+
# 1. Bug causes job processing to fail, Sidekiq's middleware captures
|
12
|
+
# the job and pushes it onto a retry queue.
|
13
|
+
# 2. Sidekiq retries jobs in the retry queue multiple times with
|
14
|
+
# an exponential delay, the job continues to fail.
|
15
|
+
# 3. After a few days, a developer deploys a fix. The job is
|
16
|
+
# reprocessed successfully.
|
17
|
+
# 4. Once retries are exhausted, Sidekiq will give up and move the
|
18
|
+
# job to the Dead Job Queue (aka morgue) where it must be dealt with
|
19
|
+
# manually in the Web UI.
|
20
|
+
# 5. After 6 months on the DJQ, Sidekiq will discard the job.
|
21
|
+
#
|
22
|
+
# A job looks like:
|
23
|
+
#
|
24
|
+
# { 'class' => 'HardWorker', 'args' => [1, 2, 'foo'], 'retry' => true }
|
25
|
+
#
|
26
|
+
# The 'retry' option also accepts a number (in place of 'true'):
|
27
|
+
#
|
28
|
+
# { 'class' => 'HardWorker', 'args' => [1, 2, 'foo'], 'retry' => 5 }
|
29
|
+
#
|
30
|
+
# The job will be retried this number of times before giving up. (If simply
|
31
|
+
# 'true', Sidekiq retries 25 times)
|
32
|
+
#
|
33
|
+
# We'll add a bit more data to the job to support retries:
|
34
|
+
#
|
35
|
+
# * 'queue' - the queue to use
|
36
|
+
# * 'retry_count' - number of times we've retried so far.
|
37
|
+
# * 'error_message' - the message from the exception
|
38
|
+
# * 'error_class' - the exception class
|
39
|
+
# * 'failed_at' - the first time it failed
|
40
|
+
# * 'retried_at' - the last time it was retried
|
41
|
+
# * 'backtrace' - the number of lines of error backtrace to store
|
42
|
+
#
|
43
|
+
# We don't store the backtrace by default as that can add a lot of overhead
|
44
|
+
# to the job and everyone is using an error service, right?
|
45
|
+
#
|
46
|
+
# The default number of retries is 25 which works out to about 3 weeks
|
47
|
+
# You can change the default maximum number of retries in your initializer:
|
48
|
+
#
|
49
|
+
# Sidekiq.options[:max_retries] = 7
|
50
|
+
#
|
51
|
+
# or limit the number of retries for a particular worker with:
|
52
|
+
#
|
53
|
+
# class MyWorker
|
54
|
+
# include Sidekiq::Worker
|
55
|
+
# sidekiq_options :retry => 10
|
56
|
+
# end
|
57
|
+
#
|
58
|
+
class JobRetry
|
59
|
+
class Handled < ::RuntimeError; end
|
60
|
+
class Skip < Handled; end
|
61
|
+
|
62
|
+
include Sidekiq::Util
|
63
|
+
|
64
|
+
DEFAULT_MAX_RETRY_ATTEMPTS = 25
|
65
|
+
|
66
|
+
def initialize(options = {})
|
67
|
+
@max_retries = Sidekiq.options.merge(options).fetch(:max_retries, DEFAULT_MAX_RETRY_ATTEMPTS)
|
68
|
+
end
|
69
|
+
|
70
|
+
# The global retry handler requires only the barest of data.
|
71
|
+
# We want to be able to retry as much as possible so we don't
|
72
|
+
# require the worker to be instantiated.
|
73
|
+
def global(msg, queue)
|
74
|
+
yield
|
75
|
+
rescue Handled => ex
|
76
|
+
raise ex
|
77
|
+
rescue Sidekiq::Shutdown => ey
|
78
|
+
# ignore, will be pushed back onto queue during hard_shutdown
|
79
|
+
raise ey
|
80
|
+
rescue Exception => e
|
81
|
+
# ignore, will be pushed back onto queue during hard_shutdown
|
82
|
+
raise Sidekiq::Shutdown if exception_caused_by_shutdown?(e)
|
83
|
+
|
84
|
+
if msg['retry']
|
85
|
+
attempt_retry(nil, msg, queue, e)
|
86
|
+
else
|
87
|
+
Sidekiq.death_handlers.each do |handler|
|
88
|
+
begin
|
89
|
+
handler.call(msg, e)
|
90
|
+
rescue => handler_ex
|
91
|
+
handle_exception(handler_ex, { context: "Error calling death handler", job: msg })
|
92
|
+
end
|
93
|
+
end
|
94
|
+
end
|
95
|
+
|
96
|
+
raise Handled
|
97
|
+
end
|
98
|
+
|
99
|
+
|
100
|
+
# The local retry support means that any errors that occur within
|
101
|
+
# this block can be associated with the given worker instance.
|
102
|
+
# This is required to support the `sidekiq_retries_exhausted` block.
|
103
|
+
#
|
104
|
+
# Note that any exception from the block is wrapped in the Skip
|
105
|
+
# exception so the global block does not reprocess the error. The
|
106
|
+
# Skip exception is unwrapped within Sidekiq::Processor#process before
|
107
|
+
# calling the handle_exception handlers.
|
108
|
+
def local(worker, msg, queue)
|
109
|
+
yield
|
110
|
+
rescue Handled => ex
|
111
|
+
raise ex
|
112
|
+
rescue Sidekiq::Shutdown => ey
|
113
|
+
# ignore, will be pushed back onto queue during hard_shutdown
|
114
|
+
raise ey
|
115
|
+
rescue Exception => e
|
116
|
+
# ignore, will be pushed back onto queue during hard_shutdown
|
117
|
+
raise Sidekiq::Shutdown if exception_caused_by_shutdown?(e)
|
118
|
+
|
119
|
+
if msg['retry'] == nil
|
120
|
+
msg['retry'] = worker.class.get_sidekiq_options['retry']
|
121
|
+
end
|
122
|
+
|
123
|
+
raise e unless msg['retry']
|
124
|
+
attempt_retry(worker, msg, queue, e)
|
125
|
+
# We've handled this error associated with this job, don't
|
126
|
+
# need to handle it at the global level
|
127
|
+
raise Skip
|
128
|
+
end
|
129
|
+
|
130
|
+
private
|
131
|
+
|
132
|
+
# Note that +worker+ can be nil here if an error is raised before we can
|
133
|
+
# instantiate the worker instance. All access must be guarded and
|
134
|
+
# best effort.
|
135
|
+
def attempt_retry(worker, msg, queue, exception)
|
136
|
+
max_retry_attempts = retry_attempts_from(msg['retry'], @max_retries)
|
137
|
+
|
138
|
+
msg['queue'] = if msg['retry_queue']
|
139
|
+
msg['retry_queue']
|
140
|
+
else
|
141
|
+
queue
|
142
|
+
end
|
143
|
+
|
144
|
+
m = exception_message(exception)
|
145
|
+
if m.respond_to?(:scrub!)
|
146
|
+
m.force_encoding("utf-8")
|
147
|
+
m.scrub!
|
148
|
+
end
|
149
|
+
|
150
|
+
msg['error_message'] = m
|
151
|
+
msg['error_class'] = exception.class.name
|
152
|
+
count = if msg['retry_count']
|
153
|
+
msg['retried_at'] = Time.now.to_f
|
154
|
+
msg['retry_count'] += 1
|
155
|
+
else
|
156
|
+
msg['failed_at'] = Time.now.to_f
|
157
|
+
msg['retry_count'] = 0
|
158
|
+
end
|
159
|
+
|
160
|
+
if msg['backtrace'] == true
|
161
|
+
msg['error_backtrace'] = exception.backtrace
|
162
|
+
elsif !msg['backtrace']
|
163
|
+
# do nothing
|
164
|
+
elsif msg['backtrace'].to_i != 0
|
165
|
+
msg['error_backtrace'] = exception.backtrace[0...msg['backtrace'].to_i]
|
166
|
+
end
|
167
|
+
|
168
|
+
if count < max_retry_attempts
|
169
|
+
delay = delay_for(worker, count, exception)
|
170
|
+
# Logging here can break retries if the logging device raises ENOSPC #3979
|
171
|
+
#logger.debug { "Failure! Retry #{count} in #{delay} seconds" }
|
172
|
+
retry_at = Time.now.to_f + delay
|
173
|
+
payload = Sidekiq.dump_json(msg)
|
174
|
+
Sidekiq.redis do |conn|
|
175
|
+
conn.zadd('retry', retry_at.to_s, payload)
|
176
|
+
end
|
177
|
+
else
|
178
|
+
# Goodbye dear message, you (re)tried your best I'm sure.
|
179
|
+
retries_exhausted(worker, msg, exception)
|
180
|
+
end
|
181
|
+
end
|
182
|
+
|
183
|
+
def retries_exhausted(worker, msg, exception)
|
184
|
+
begin
|
185
|
+
block = worker && worker.sidekiq_retries_exhausted_block
|
186
|
+
block.call(msg, exception) if block
|
187
|
+
rescue => e
|
188
|
+
handle_exception(e, { context: "Error calling retries_exhausted", job: msg })
|
189
|
+
end
|
190
|
+
|
191
|
+
Sidekiq.death_handlers.each do |handler|
|
192
|
+
begin
|
193
|
+
handler.call(msg, exception)
|
194
|
+
rescue => e
|
195
|
+
handle_exception(e, { context: "Error calling death handler", job: msg })
|
196
|
+
end
|
197
|
+
end
|
198
|
+
|
199
|
+
send_to_morgue(msg) unless msg['dead'] == false
|
200
|
+
end
|
201
|
+
|
202
|
+
def send_to_morgue(msg)
|
203
|
+
logger.info { "Adding dead #{msg['class']} job #{msg['jid']}" }
|
204
|
+
payload = Sidekiq.dump_json(msg)
|
205
|
+
DeadSet.new.kill(payload, notify_failure: false)
|
206
|
+
end
|
207
|
+
|
208
|
+
def retry_attempts_from(msg_retry, default)
|
209
|
+
if msg_retry.is_a?(Integer)
|
210
|
+
msg_retry
|
211
|
+
else
|
212
|
+
default
|
213
|
+
end
|
214
|
+
end
|
215
|
+
|
216
|
+
def delay_for(worker, count, exception)
|
217
|
+
if worker && worker.sidekiq_retry_in_block
|
218
|
+
custom_retry_in = retry_in(worker, count, exception).to_i
|
219
|
+
return custom_retry_in if custom_retry_in > 0
|
220
|
+
end
|
221
|
+
seconds_to_delay(count)
|
222
|
+
end
|
223
|
+
|
224
|
+
# delayed_job uses the same basic formula
|
225
|
+
def seconds_to_delay(count)
|
226
|
+
(count ** 4) + 15 + (rand(30)*(count+1))
|
227
|
+
end
|
228
|
+
|
229
|
+
def retry_in(worker, count, exception)
|
230
|
+
begin
|
231
|
+
worker.sidekiq_retry_in_block.call(count, exception)
|
232
|
+
rescue Exception => e
|
233
|
+
handle_exception(e, { context: "Failure scheduling retry using the defined `sidekiq_retry_in` in #{worker.class.name}, falling back to default" })
|
234
|
+
nil
|
235
|
+
end
|
236
|
+
end
|
237
|
+
|
238
|
+
def exception_caused_by_shutdown?(e, checked_causes = [])
|
239
|
+
return false unless e.cause
|
240
|
+
|
241
|
+
# Handle circular causes
|
242
|
+
checked_causes << e.object_id
|
243
|
+
return false if checked_causes.include?(e.cause.object_id)
|
244
|
+
|
245
|
+
e.cause.instance_of?(Sidekiq::Shutdown) ||
|
246
|
+
exception_caused_by_shutdown?(e.cause, checked_causes)
|
247
|
+
end
|
248
|
+
|
249
|
+
# Extract message from exception.
|
250
|
+
# Set a default if the message raises an error
|
251
|
+
def exception_message(exception)
|
252
|
+
begin
|
253
|
+
# App code can stuff all sorts of crazy binary data into the error message
|
254
|
+
# that won't convert to JSON.
|
255
|
+
exception.message.to_s[0, 10_000]
|
256
|
+
rescue
|
257
|
+
"!!! ERROR MESSAGE THREW AN ERROR !!!".dup
|
258
|
+
end
|
259
|
+
end
|
260
|
+
|
261
|
+
end
|
262
|
+
end
|
data/lib/sidekiq/launcher.rb
CHANGED
@@ -1,4 +1,4 @@
|
|
1
|
-
|
1
|
+
# frozen_string_literal: true
|
2
2
|
require 'sidekiq/manager'
|
3
3
|
require 'sidekiq/fetch'
|
4
4
|
require 'sidekiq/scheduled'
|
@@ -9,82 +9,156 @@ module Sidekiq
|
|
9
9
|
# If any of these actors die, the Sidekiq process exits
|
10
10
|
# immediately.
|
11
11
|
class Launcher
|
12
|
-
include Actor
|
13
12
|
include Util
|
14
13
|
|
15
|
-
|
14
|
+
attr_accessor :manager, :poller, :fetcher
|
16
15
|
|
17
|
-
|
16
|
+
STATS_TTL = 5*365*24*60*60
|
18
17
|
|
19
18
|
def initialize(options)
|
20
|
-
@
|
21
|
-
@
|
22
|
-
@poller = Sidekiq::Scheduled::Poller.new_link
|
23
|
-
@fetcher = Sidekiq::Fetcher.new_link(@manager, options)
|
24
|
-
@manager.fetcher = @fetcher
|
19
|
+
@manager = Sidekiq::Manager.new(options)
|
20
|
+
@poller = Sidekiq::Scheduled::Poller.new
|
25
21
|
@done = false
|
26
22
|
@options = options
|
27
23
|
end
|
28
24
|
|
29
|
-
def
|
30
|
-
|
31
|
-
|
25
|
+
def run
|
26
|
+
@thread = safe_thread("heartbeat", &method(:start_heartbeat))
|
27
|
+
@poller.start
|
28
|
+
@manager.start
|
29
|
+
end
|
32
30
|
|
33
|
-
|
34
|
-
|
35
|
-
|
31
|
+
# Stops this instance from processing any more jobs,
|
32
|
+
#
|
33
|
+
def quiet
|
34
|
+
@done = true
|
35
|
+
@manager.quiet
|
36
|
+
@poller.terminate
|
36
37
|
end
|
37
38
|
|
38
|
-
|
39
|
-
|
40
|
-
|
41
|
-
|
39
|
+
# Shuts down the process. This method does not
|
40
|
+
# return until all work is complete and cleaned up.
|
41
|
+
# It can take up to the timeout to complete.
|
42
|
+
def stop
|
43
|
+
deadline = ::Process.clock_gettime(::Process::CLOCK_MONOTONIC) + @options[:timeout]
|
44
|
+
|
45
|
+
@done = true
|
46
|
+
@manager.quiet
|
47
|
+
@poller.terminate
|
48
|
+
|
49
|
+
@manager.stop(deadline)
|
50
|
+
|
51
|
+
# Requeue everything in case there was a worker who grabbed work while stopped
|
52
|
+
# This call is a no-op in Sidekiq but necessary for Sidekiq Pro.
|
53
|
+
strategy = (@options[:fetch] || Sidekiq::BasicFetch)
|
54
|
+
strategy.bulk_requeue([], @options)
|
55
|
+
|
56
|
+
clear_heartbeat
|
57
|
+
end
|
58
|
+
|
59
|
+
def stopping?
|
60
|
+
@done
|
61
|
+
end
|
62
|
+
|
63
|
+
private unless $TESTING
|
64
|
+
|
65
|
+
def heartbeat
|
66
|
+
results = Sidekiq::CLI::PROCTITLES.map {|x| x.(self, to_data) }
|
67
|
+
results.compact!
|
68
|
+
$0 = results.join(' ')
|
69
|
+
|
70
|
+
❤
|
71
|
+
end
|
72
|
+
|
73
|
+
def ❤
|
74
|
+
key = identity
|
75
|
+
fails = procd = 0
|
76
|
+
begin
|
77
|
+
fails = Processor::FAILURE.reset
|
78
|
+
procd = Processor::PROCESSED.reset
|
79
|
+
curstate = Processor::WORKER_STATE.dup
|
80
|
+
|
81
|
+
workers_key = "#{key}:workers"
|
82
|
+
nowdate = Time.now.utc.strftime("%Y-%m-%d")
|
83
|
+
Sidekiq.redis do |conn|
|
84
|
+
conn.multi do
|
85
|
+
conn.incrby("stat:processed", procd)
|
86
|
+
conn.incrby("stat:processed:#{nowdate}", procd)
|
87
|
+
conn.expire("stat:processed:#{nowdate}", STATS_TTL)
|
88
|
+
|
89
|
+
conn.incrby("stat:failed", fails)
|
90
|
+
conn.incrby("stat:failed:#{nowdate}", fails)
|
91
|
+
conn.expire("stat:failed:#{nowdate}", STATS_TTL)
|
92
|
+
|
93
|
+
conn.del(workers_key)
|
94
|
+
curstate.each_pair do |tid, hash|
|
95
|
+
conn.hset(workers_key, tid, Sidekiq.dump_json(hash))
|
96
|
+
end
|
97
|
+
conn.expire(workers_key, 60)
|
98
|
+
end
|
99
|
+
end
|
100
|
+
fails = procd = 0
|
101
|
+
|
102
|
+
_, exists, _, _, msg = Sidekiq.redis do |conn|
|
103
|
+
conn.multi do
|
104
|
+
conn.sadd('processes', key)
|
105
|
+
conn.exists(key)
|
106
|
+
conn.hmset(key, 'info', to_json, 'busy', curstate.size, 'beat', Time.now.to_f, 'quiet', @done)
|
107
|
+
conn.expire(key, 60)
|
108
|
+
conn.rpop("#{key}-signals")
|
109
|
+
end
|
110
|
+
end
|
111
|
+
|
112
|
+
# first heartbeat or recovering from an outage and need to reestablish our heartbeat
|
113
|
+
fire_event(:heartbeat) if !exists
|
114
|
+
|
115
|
+
return unless msg
|
42
116
|
|
43
|
-
|
117
|
+
::Process.kill(msg, $$)
|
118
|
+
rescue => e
|
119
|
+
# ignore all redis/network issues
|
120
|
+
logger.error("heartbeat: #{e.message}")
|
121
|
+
# don't lose the counts if there was a network issue
|
122
|
+
Processor::PROCESSED.incr(procd)
|
123
|
+
Processor::FAILURE.incr(fails)
|
44
124
|
end
|
45
125
|
end
|
46
126
|
|
47
|
-
def
|
48
|
-
|
49
|
-
|
50
|
-
|
51
|
-
fetcher.terminate if fetcher.alive?
|
52
|
-
poller.terminate if poller.alive?
|
53
|
-
|
54
|
-
manager.async.stop(:shutdown => true, :timeout => @options[:timeout])
|
55
|
-
fire_event(:shutdown, true)
|
56
|
-
@condvar.wait
|
57
|
-
manager.terminate
|
58
|
-
|
59
|
-
# Requeue everything in case there was a worker who grabbed work while stopped
|
60
|
-
# This call is a no-op in Sidekiq but necessary for Sidekiq Pro.
|
61
|
-
Sidekiq::Fetcher.strategy.bulk_requeue([], @options)
|
62
|
-
|
63
|
-
stop_heartbeat
|
127
|
+
def start_heartbeat
|
128
|
+
while true
|
129
|
+
heartbeat
|
130
|
+
sleep 5
|
64
131
|
end
|
132
|
+
Sidekiq.logger.info("Heartbeat stopping...")
|
65
133
|
end
|
66
134
|
|
67
|
-
|
135
|
+
def to_data
|
136
|
+
@data ||= begin
|
137
|
+
{
|
138
|
+
'hostname' => hostname,
|
139
|
+
'started_at' => Time.now.to_f,
|
140
|
+
'pid' => $$,
|
141
|
+
'tag' => @options[:tag] || '',
|
142
|
+
'concurrency' => @options[:concurrency],
|
143
|
+
'queues' => @options[:queues].uniq,
|
144
|
+
'labels' => @options[:labels],
|
145
|
+
'identity' => identity,
|
146
|
+
}
|
147
|
+
end
|
148
|
+
end
|
68
149
|
|
69
|
-
def
|
70
|
-
|
71
|
-
|
72
|
-
'
|
73
|
-
|
74
|
-
|
75
|
-
'tag' => @options[:tag] || '',
|
76
|
-
'concurrency' => @options[:concurrency],
|
77
|
-
'queues' => @options[:queues].uniq,
|
78
|
-
'labels' => Sidekiq.options[:labels],
|
79
|
-
'identity' => identity,
|
80
|
-
}
|
81
|
-
# this data doesn't change so dump it to a string
|
82
|
-
# now so we don't need to dump it every heartbeat.
|
83
|
-
json = Sidekiq.dump_json(data)
|
84
|
-
manager.heartbeat(key, data, json)
|
150
|
+
def to_json
|
151
|
+
@json ||= begin
|
152
|
+
# this data changes infrequently so dump it to a string
|
153
|
+
# now so we don't need to dump it every heartbeat.
|
154
|
+
Sidekiq.dump_json(to_data)
|
155
|
+
end
|
85
156
|
end
|
86
157
|
|
87
|
-
def
|
158
|
+
def clear_heartbeat
|
159
|
+
# Remove record from Redis since we are shutting down.
|
160
|
+
# Note we don't stop the heartbeat thread; if the process
|
161
|
+
# doesn't actually exit, it'll reappear in the Web UI.
|
88
162
|
Sidekiq.redis do |conn|
|
89
163
|
conn.pipelined do
|
90
164
|
conn.srem('processes', identity)
|