RubyGems - sidekiq - Versions diffs - 6.4.0 → 7.0.8 - Mend

sidekiq 6.4.0 → 7.0.8

Potentially problematic release.

This version of sidekiq might be problematic. Click here for more details.

Files changed (113) hide show

checksums.yaml +4 -4
data/Changes.md +187 -12
data/README.md +44 -31
data/bin/sidekiq +4 -9
data/bin/sidekiqload +189 -117
data/bin/sidekiqmon +4 -1
data/lib/sidekiq/api.rb +304 -186
data/lib/sidekiq/capsule.rb +127 -0
data/lib/sidekiq/cli.rb +83 -80
data/lib/sidekiq/client.rb +71 -44
data/lib/sidekiq/component.rb +68 -0
data/lib/sidekiq/config.rb +270 -0
data/lib/sidekiq/deploy.rb +62 -0
data/lib/sidekiq/embedded.rb +61 -0
data/lib/sidekiq/fetch.rb +23 -24
data/lib/sidekiq/job.rb +375 -10
data/lib/sidekiq/job_logger.rb +16 -28
data/lib/sidekiq/job_retry.rb +76 -54
data/lib/sidekiq/job_util.rb +59 -19
data/lib/sidekiq/launcher.rb +103 -95
data/lib/sidekiq/logger.rb +9 -44
data/lib/sidekiq/manager.rb +33 -32
data/lib/sidekiq/metrics/query.rb +153 -0
data/lib/sidekiq/metrics/shared.rb +95 -0
data/lib/sidekiq/metrics/tracking.rb +136 -0
data/lib/sidekiq/middleware/chain.rb +96 -51
data/lib/sidekiq/middleware/current_attributes.rb +16 -17
data/lib/sidekiq/middleware/i18n.rb +6 -4
data/lib/sidekiq/middleware/modules.rb +21 -0
data/lib/sidekiq/monitor.rb +17 -4
data/lib/sidekiq/paginator.rb +17 -9
data/lib/sidekiq/processor.rb +60 -60
data/lib/sidekiq/rails.rb +12 -10
data/lib/sidekiq/redis_client_adapter.rb +115 -0
data/lib/sidekiq/redis_connection.rb +13 -82
data/lib/sidekiq/ring_buffer.rb +29 -0
data/lib/sidekiq/scheduled.rb +65 -37
data/lib/sidekiq/testing/inline.rb +4 -4
data/lib/sidekiq/testing.rb +41 -68
data/lib/sidekiq/transaction_aware_client.rb +44 -0
data/lib/sidekiq/version.rb +2 -1
data/lib/sidekiq/web/action.rb +3 -3
data/lib/sidekiq/web/application.rb +40 -9
data/lib/sidekiq/web/csrf_protection.rb +3 -3
data/lib/sidekiq/web/helpers.rb +35 -21
data/lib/sidekiq/web.rb +10 -17
data/lib/sidekiq/worker_compatibility_alias.rb +13 -0
data/lib/sidekiq.rb +84 -206
data/sidekiq.gemspec +21 -10
data/web/assets/javascripts/application.js +76 -26
data/web/assets/javascripts/base-charts.js +106 -0
data/web/assets/javascripts/chart.min.js +13 -0
data/web/assets/javascripts/chartjs-plugin-annotation.min.js +7 -0
data/web/assets/javascripts/dashboard-charts.js +166 -0
data/web/assets/javascripts/dashboard.js +3 -240
data/web/assets/javascripts/metrics.js +264 -0
data/web/assets/stylesheets/application-dark.css +4 -0
data/web/assets/stylesheets/application-rtl.css +2 -91
data/web/assets/stylesheets/application.css +66 -297
data/web/locales/ar.yml +70 -70
data/web/locales/cs.yml +62 -62
data/web/locales/da.yml +60 -53
data/web/locales/de.yml +65 -65
data/web/locales/el.yml +43 -24
data/web/locales/en.yml +82 -69
data/web/locales/es.yml +68 -68
data/web/locales/fa.yml +65 -65
data/web/locales/fr.yml +67 -67
data/web/locales/he.yml +65 -64
data/web/locales/hi.yml +59 -59
data/web/locales/it.yml +53 -53
data/web/locales/ja.yml +73 -68
data/web/locales/ko.yml +52 -52
data/web/locales/lt.yml +66 -66
data/web/locales/nb.yml +61 -61
data/web/locales/nl.yml +52 -52
data/web/locales/pl.yml +45 -45
data/web/locales/pt-br.yml +63 -55
data/web/locales/pt.yml +51 -51
data/web/locales/ru.yml +67 -66
data/web/locales/sv.yml +53 -53
data/web/locales/ta.yml +60 -60
data/web/locales/uk.yml +62 -61
data/web/locales/ur.yml +64 -64
data/web/locales/vi.yml +67 -67
data/web/locales/zh-cn.yml +43 -16
data/web/locales/zh-tw.yml +42 -8
data/web/views/_footer.erb +5 -2
data/web/views/_job_info.erb +18 -2
data/web/views/_metrics_period_select.erb +12 -0
data/web/views/_nav.erb +1 -1
data/web/views/_paging.erb +2 -0
data/web/views/_poll_link.erb +1 -1
data/web/views/_summary.erb +1 -1
data/web/views/busy.erb +42 -26
data/web/views/dashboard.erb +36 -4
data/web/views/metrics.erb +82 -0
data/web/views/metrics_for_job.erb +71 -0
data/web/views/morgue.erb +5 -9
data/web/views/queue.erb +15 -15
data/web/views/queues.erb +3 -1
data/web/views/retries.erb +5 -9
data/web/views/scheduled.erb +12 -13
metadata +64 -28
data/lib/sidekiq/delay.rb +0 -43
data/lib/sidekiq/exception_handler.rb +0 -27
data/lib/sidekiq/extensions/action_mailer.rb +0 -48
data/lib/sidekiq/extensions/active_record.rb +0 -43
data/lib/sidekiq/extensions/class_methods.rb +0 -43
data/lib/sidekiq/extensions/generic_proxy.rb +0 -33
data/lib/sidekiq/util.rb +0 -108
data/lib/sidekiq/worker.rb +0 -364
/data/{LICENSE → LICENSE.txt} +0 -0

data/lib/sidekiq/logger.rb CHANGED Viewed

@@ -16,6 +16,10 @@ module Sidekiq
     def self.current
       Thread.current[:sidekiq_context] ||= {}
     end
+    def self.add(k, v)
+      current[k] = v
+    end
   end
   module LoggingUtils
@@ -27,28 +31,14 @@ module Sidekiq
       "fatal" => 4
     }
     LEVELS.default_proc = proc do |_, level|
-      Sidekiq.logger.warn("Invalid log level: #{level.inspect}")
+      puts("Invalid log level: #{level.inspect}")
       nil
     end
-    def debug?
-      level <= 0
-    end
-    def info?
-      level <= 1
-    end
-    def warn?
-      level <= 2
-    end
-    def error?
-      level <= 3
-    end
-    def fatal?
-      level <= 4
+    LEVELS.each do |level, numeric_level|
+      define_method("#{level}?") do
+        local_level.nil? ? super() : local_level <= numeric_level
+      end
     end
     def local_level
@@ -80,36 +70,11 @@ module Sidekiq
     ensure
       self.local_level = old_local_level
     end
-    # Redefined to check severity against #level, and thus the thread-local level, rather than +@level+.
-    # FIXME: Remove when the minimum Ruby version supports overriding Logger#level.
-    def add(severity, message = nil, progname = nil, &block)
-      severity ||= ::Logger::UNKNOWN
-      progname ||= @progname
-      return true if @logdev.nil? || severity < level
-      if message.nil?
-        if block
-          message = yield
-        else
-          message = progname
-          progname = @progname
-        end
-      end
-      @logdev.write format_message(format_severity(severity), Time.now, progname, message)
-    end
   end
   class Logger < ::Logger
     include LoggingUtils
-    def initialize(*args, **kwargs)
-      super
-      self.formatter = Sidekiq.log_formatter
-    end
     module Formatters
       class Base < ::Logger::Formatter
         def tid

data/lib/sidekiq/manager.rb CHANGED Viewed

@@ -1,8 +1,6 @@
 # frozen_string_literal: true
-require "sidekiq/util"
 require "sidekiq/processor"
-require "sidekiq/fetch"
 require "set"
 module Sidekiq
@@ -21,43 +19,38 @@ module Sidekiq
   # the shutdown process.  The other tasks are performed by other threads.
   #
   class Manager
-    include Util
+    include Sidekiq::Component
     attr_reader :workers
-    attr_reader :options
+    attr_reader :capsule
-    def initialize(options = {})
-      logger.debug { options.inspect }
-      @options = options
-      @count = options[:concurrency] || 10
+    def initialize(capsule)
+      @config = @capsule = capsule
+      @count = capsule.concurrency
       raise ArgumentError, "Concurrency of #{@count} is not supported" if @count < 1
       @done = false
       @workers = Set.new
+      @plock = Mutex.new
       @count.times do
-        @workers << Processor.new(self, options)
+        @workers << Processor.new(@config, &method(:processor_result))
       end
-      @plock = Mutex.new
     end
     def start
-      @workers.each do |x|
-        x.start
-      end
+      @workers.each(&:start)
     end
     def quiet
       return if @done
       @done = true
-      logger.info { "Terminating quiet workers" }
-      @workers.each { |x| x.terminate }
-      fire_event(:quiet, reverse: true)
+      logger.info { "Terminating quiet threads for #{capsule.name} capsule" }
+      @workers.each(&:terminate)
     end
     def stop(deadline)
       quiet
-      fire_event(:shutdown, reverse: true)
       # some of the shutdown events can be async,
       # we don't have any way to know when they're done but
@@ -65,24 +58,20 @@ module Sidekiq
       sleep PAUSE_TIME
       return if @workers.empty?
-      logger.info { "Pausing to allow workers to finish..." }
+      logger.info { "Pausing to allow jobs to finish..." }
       wait_for(deadline) { @workers.empty? }
       return if @workers.empty?
       hard_shutdown
+    ensure
+      capsule.stop
     end
-    def processor_stopped(processor)
-      @plock.synchronize do
-        @workers.delete(processor)
-      end
-    end
-    def processor_died(processor, reason)
+    def processor_result(processor, reason = nil)
       @plock.synchronize do
         @workers.delete(processor)
         unless @done
-          p = Processor.new(self, options)
+          p = Processor.new(@config, &method(:processor_result))
           @workers << p
           p.start
         end
@@ -96,7 +85,7 @@ module Sidekiq
     private
     def hard_shutdown
-      # We've reached the timeout and we still have busy workers.
+      # We've reached the timeout and we still have busy threads.
       # They must die but their jobs shall live on.
       cleanup = nil
       @plock.synchronize do
@@ -106,17 +95,16 @@ module Sidekiq
       if cleanup.size > 0
         jobs = cleanup.map { |p| p.job }.compact
-        logger.warn { "Terminating #{cleanup.size} busy worker threads" }
-        logger.warn { "Work still in progress #{jobs.inspect}" }
+        logger.warn { "Terminating #{cleanup.size} busy threads" }
+        logger.debug { "Jobs still in progress #{jobs.inspect}" }
         # Re-enqueue unfinished jobs
         # NOTE: You may notice that we may push a job back to redis before
-        # the worker thread is terminated. This is ok because Sidekiq's
+        # the thread is terminated. This is ok because Sidekiq's
         # contract says that jobs are run AT LEAST once. Process termination
         # is delayed until we're certain the jobs are back in Redis because
         # it is worse to lose a job than to run it twice.
-        strategy = @options[:fetch]
-        strategy.bulk_requeue(jobs, @options)
+        capsule.fetcher.bulk_requeue(jobs)
       end
       cleanup.each do |processor|
@@ -129,5 +117,18 @@ module Sidekiq
       deadline = ::Process.clock_gettime(::Process::CLOCK_MONOTONIC) + 3
       wait_for(deadline) { @workers.empty? }
     end
+    # hack for quicker development / testing environment #2774
+    PAUSE_TIME = $stdout.tty? ? 0.1 : 0.5
+    # Wait until condblock returns true or the deadline passes.
+    def wait_for(deadline, &condblock)
+      remaining = deadline - ::Process.clock_gettime(::Process::CLOCK_MONOTONIC)
+      while remaining > PAUSE_TIME
+        return if condblock.call
+        sleep PAUSE_TIME
+        remaining = deadline - ::Process.clock_gettime(::Process::CLOCK_MONOTONIC)
+      end
+    end
   end
 end

data/lib/sidekiq/metrics/query.rb ADDED Viewed

@@ -0,0 +1,153 @@
+require "sidekiq"
+require "date"
+require "set"
+require "sidekiq/metrics/shared"
+module Sidekiq
+  module Metrics
+    # Allows caller to query for Sidekiq execution metrics within Redis.
+    # Caller sets a set of attributes to act as filters. {#fetch} will call
+    # Redis and return a Hash of results.
+    #
+    # NB: all metrics and times/dates are UTC only. We specifically do not
+    # support timezones.
+    class Query
+      # @param pool [#with, nil] connection pool that yields a Redis connection;
+      #   when nil, Sidekiq.default_configuration.redis_pool is used
+      # @param now [Time] newest minute of every query window (converted to UTC)
+      def initialize(pool: nil, now: Time.now)
+        @time = now.utc
+        @pool = pool || Sidekiq.default_configuration.redis_pool
+        @klass = nil
+      end
+      # Get metric data for all jobs over the trailing window (the last hour by default).
+      #
+      # Sends one pipelined HGETALL per minute for the "j|YYYYMMDD|H:M" hashes,
+      # walking backwards from the query time.
+      #
+      # @param minutes [Integer] number of one-minute buckets to read
+      # @return [Result] bucket labels, per-job series/totals and marks for the window
+      def top_jobs(minutes: 60)
+        result = Result.new
+        time = @time
+        redis_results = @pool.with do |conn|
+          conn.pipelined do |pipe|
+            minutes.times do
+              key = "j|#{time.strftime("%Y%m%d")}|#{time.hour}:#{time.min}"
+              pipe.hgetall key
+              result.prepend_bucket time
+              time -= 60
+            end
+          end
+        end
+        # The replay below assumes replies arrive in the order they were requested,
+        # so it repeats the same newest-to-oldest walk.
+        time = @time
+        redis_results.each do |hash|
+          hash.each do |k, v|
+            # Hash fields look like "<job class>|<metric>".
+            kls, metric = k.split("|")
+            result.job_results[kls].add_metric metric, time, v.to_i
+          end
+          time -= 60
+        end
+        result.marks = fetch_marks(result.starts_at..result.ends_at)
+        result
+      end
+      # Get metric data and per-minute histograms for a single job class.
+      #
+      # @param klass [String] job class name as used in the "<klass>|ms", "<klass>|p"
+      #   and "<klass>|f" hash fields
+      # @param minutes [Integer] number of one-minute buckets to read
+      # @return [Result] same shape as #top_jobs, with only +klass+ in job_results
+      def for_job(klass, minutes: 60)
+        result = Result.new
+        time = @time
+        redis_results = @pool.with do |conn|
+          conn.pipelined do |pipe|
+            minutes.times do
+              key = "j|#{time.strftime("%Y%m%d")}|#{time.hour}:#{time.min}"
+              pipe.hmget key, "#{klass}|ms", "#{klass}|p", "#{klass}|f"
+              result.prepend_bucket time
+              time -= 60
+            end
+          end
+        end
+        time = @time
+        @pool.with do |conn|
+          redis_results.each do |(ms, p, f)|
+            # Missing fields come back as nil and are skipped.
+            result.job_results[klass].add_metric "ms", time, ms.to_i if ms
+            result.job_results[klass].add_metric "p", time, p.to_i if p
+            result.job_results[klass].add_metric "f", time, f.to_i if f
+            # One histogram read per minute, issued outside the pipeline above.
+            result.job_results[klass].add_hist time, Histogram.new(klass).fetch(conn, time)
+            time -= 60
+          end
+        end
+        result.marks = fetch_marks(result.starts_at..result.ends_at)
+        result
+      end
+      # Container for one query window. +buckets+ holds "HH:MM" labels, oldest
+      # first; +job_results+ maps a job class name to its JobResult; +marks+ holds
+      # MarkResult entries. +size+ is declared but never assigned in this file.
+      class Result < Struct.new(:starts_at, :ends_at, :size, :buckets, :job_results, :marks)
+        def initialize
+          super
+          self.buckets = []
+          self.marks = []
+          self.job_results = Hash.new { |h, k| h[k] = JobResult.new }
+        end
+        # Callers walk from newest to oldest, so the first time seen becomes
+        # +ends_at+ and every later call moves +starts_at+ further back.
+        def prepend_bucket(time)
+          buckets.unshift time.strftime("%H:%M")
+          self.ends_at ||= time
+          self.starts_at = time
+        end
+      end
+      # Metrics for one job class: +series+ is metric => {"HH:MM" => value},
+      # +hist+ is "HH:MM" => histogram data, +totals+ is metric => sum over the window.
+      class JobResult < Struct.new(:series, :hist, :totals)
+        def initialize
+          super
+          self.series = Hash.new { |h, k| h[k] = Hash.new(0) }
+          self.hist = Hash.new { |h, k| h[k] = [] }
+          self.totals = Hash.new(0)
+        end
+        # Adds +value+ to both the window total and the minute bucket of +metric+.
+        def add_metric(metric, time, value)
+          totals[metric] += value
+          series[metric][time.strftime("%H:%M")] += value
+          # Include timing measurements in seconds for convenience
+          add_metric("s", time, value / 1000.0) if metric == "ms"
+        end
+        def add_hist(time, hist_result)
+          hist[time.strftime("%H:%M")] = hist_result
+        end
+        # Average of +metric+ per completed job (processed minus failed) over the
+        # whole window.
+        #
+        # @return [Numeric] 0 when no job completed, matching #series_avg, instead
+        #   of the NaN/Infinity a division by zero would produce
+        def total_avg(metric = "ms")
+          completed = totals["p"] - totals["f"]
+          return 0 if completed.zero?
+          totals[metric].to_f / completed
+        end
+        # Per-bucket version of #total_avg.
+        #
+        # @return [Hash{String => Numeric}] "HH:MM" => average, 0 for buckets
+        #   in which no job completed
+        def series_avg(metric = "ms")
+          series[metric].each_with_object(Hash.new(0)) do |(bucket, value), result|
+            completed = series.dig("p", bucket) - series.dig("f", bucket)
+            result[bucket] = (completed == 0) ? 0 : value.to_f / completed
+          end
+        end
+      end
+      # A labelled point in time; +bucket+ is the "HH:MM" label it falls into.
+      class MarkResult < Struct.new(:time, :label)
+        def bucket
+          time.strftime("%H:%M")
+        end
+      end
+      private
+      # Reads the "<YYYYMMDD>-marks" hash (timestamp => label) and keeps the
+      # entries whose parsed timestamp lies inside +time_range+.
+      #
+      # NOTE(review): only the hash for the query time's UTC date is read, so a
+      # window that spans midnight would not see marks stored under the previous
+      # date - confirm whether that is intended.
+      #
+      # @param time_range [Range<Time>]
+      # @return [Array<MarkResult>]
+      def fetch_marks(time_range)
+        [].tap do |result|
+          marks = @pool.with { |c| c.hgetall("#{@time.strftime("%Y%m%d")}-marks") }
+          marks.each do |timestamp, label|
+            time = Time.parse(timestamp)
+            if time_range.cover? time
+              result << MarkResult.new(time, label)
+            end
+          end
+        end
+      end
+    end
+  end
+end

data/lib/sidekiq/metrics/shared.rb ADDED Viewed

@@ -0,0 +1,95 @@
+require "concurrent"
+module Sidekiq
+  module Metrics
+    # This is the only dependency on concurrent-ruby in Sidekiq but it's
+    # mandatory for thread-safety until MRI supports atomic operations on values.
+    Counter = ::Concurrent::AtomicFixnum
+    # Implements space-efficient but statistically useful histogram storage.
+    # A precise time histogram stores every time. Instead we break times into a set of
+    # known buckets and increment counts of the associated time bucket. Even if we call
+    # the histogram a million times, we'll still only store 26 buckets.
+    # NB: needs to be thread-safe or resilient to races.
+    #
+    # To store this data, we use Redis' BITFIELD command to store unsigned 16-bit counters
+    # per bucket per klass per minute. It's unlikely that most people will be executing more
+    # than 1000 job/sec for a full minute of a specific type.
+    class Histogram
+      include Enumerable
+      # Upper bound, in milliseconds, of each bucket. A measurement lands in the
+      # first bucket whose bound is greater than it, e.g. 280ms is counted in
+      # bucket[7] (225 <= 280 < 335). The last finite bound is 335000ms, about
+      # 5.5 minutes; anything slower falls into the final catch-all bucket.
+      BUCKET_INTERVALS = [
+        20, 30, 45, 65, 100, 150, 225, 335, 500, 750,
+        1_100, 1_700, 2_500, 3_800, 5_750, 8_500, 13_000, 20_000, 30_000, 45_000,
+        65_000, 100_000, 150_000, 225_000, 335_000,
+        Float::INFINITY # the "maybe your job is too long" bucket
+      ]
+      # Display label for each entry of BUCKET_INTERVALS, index for index.
+      LABELS = %w[
+        20ms 30ms 45ms 65ms 100ms 150ms 225ms 335ms 500ms 750ms
+        1.1s 1.7s 2.5s 3.8s 5.75s 8.5s 13s 20s 30s 45s
+        65s 100s 150s 225s 335s
+        Slow
+      ]
+      # BITFIELD arguments reading every bucket: "GET u16 #0" ... "GET u16 #25".
+      FETCH = BUCKET_INTERVALS.each_index.flat_map { |idx| ["GET", "u16", "##{idx}"] }
+      # Expiry, in seconds, applied to a persisted histogram key (8 hours).
+      HISTOGRAM_TTL = 8 * 60 * 60
+      attr_reader :buckets
+      # @param klass [String] job class name; becomes the prefix of the Redis key
+      def initialize(klass)
+        @klass = klass
+        @buckets = Array.new(BUCKET_INTERVALS.size) { Counter.new }
+      end
+      # Yields the current count of every bucket, in bucket order.
+      def each
+        buckets.each do |counter|
+          yield counter.value
+        end
+      end
+      # @param idx [Integer] bucket index
+      # @return [String, nil] the display label for that bucket
+      def label(idx)
+        LABELS[idx]
+      end
+      # Increments the counter of the first bucket whose bound exceeds +ms+.
+      def record_time(ms)
+        slot = BUCKET_INTERVALS.index { |ceiling| ms < ceiling }
+        @buckets[slot].increment
+      end
+      # Reads all bucket counters for the minute containing +now+ (UTC) from the
+      # "<klass>-DD-HH:M" key.
+      def fetch(conn, now = Time.now)
+        conn.bitfield("#{@klass}-#{now.utc.strftime("%d-%H:%-M")}", *FETCH)
+      end
+      # Adds the non-zero in-memory counts to the Redis bitfield for the minute
+      # containing +now+ (saturating u16 increments), refreshes the key's expiry
+      # and returns the key. The in-memory bucket list is emptied first, so this
+      # instance holds no counters afterwards.
+      def persist(conn, now = Time.now)
+        counters = @buckets
+        @buckets = []
+        key = "#{@klass}-#{now.utc.strftime("%d-%H:%-M")}"
+        increments = counters.each_with_index.flat_map do |counter, idx|
+          count = counter.value
+          (count > 0) ? ["INCRBY", "u16", "##{idx}", count.to_s] : []
+        end
+        conn.bitfield(key, "OVERFLOW", "SAT", *increments) unless increments.empty?
+        conn.expire(key, HISTOGRAM_TTL)
+        key
+      end
+    end
+  end
+end

data/lib/sidekiq/metrics/tracking.rb ADDED Viewed

@@ -0,0 +1,136 @@
+# frozen_string_literal: true
+require "time"
+require "sidekiq"
+require "sidekiq/metrics/shared"
+# This file contains the components which track execution metrics within Sidekiq.
+module Sidekiq
+  module Metrics
+    # Accumulates per-job-class execution counts, timings and histograms in
+    # memory (guarded by a Mutex) and writes them to Redis when #flush is called.
+    class ExecutionTracker
+      include Sidekiq::Component
+      # @param config the object stored in @config; presumably what the
+      #   Sidekiq::Component helpers (logger, redis) read - confirm against Component
+      def initialize(config)
+        @config = config
+        # "<klass>|<metric>" => running sum since the last flush
+        @jobs = Hash.new(0)
+        # "<metric>" => running sum across all job classes since the last flush
+        @totals = Hash.new(0)
+        # klass => Histogram, created on first use
+        @grams = Hash.new { |hash, key| hash[key] = Histogram.new(key) }
+        @lock = Mutex.new
+      end
+      # Runs the given block and records its outcome under +klass+.
+      #
+      # Metrics written: "p" is incremented for every call (outer ensure), "f"
+      # when the block raises, and "ms" plus the histogram only when the block
+      # returns normally. Any exception is re-raised after being counted.
+      #
+      # @param queue not used by this method
+      # @param klass [String] job class name used as the metric key prefix
+      def track(queue, klass)
+        start = ::Process.clock_gettime(::Process::CLOCK_MONOTONIC, :millisecond)
+        time_ms = 0
+        begin
+          begin
+            yield
+          ensure
+            finish = ::Process.clock_gettime(::Process::CLOCK_MONOTONIC, :millisecond)
+            time_ms = finish - start
+          end
+          # We don't track time for failed jobs as they can have very unpredictable
+          # execution times. more important to know average time for successful jobs so we
+          # can better recognize when a perf regression is introduced.
+          @lock.synchronize {
+            @grams[klass].record_time(time_ms)
+            @jobs["#{klass}|ms"] += time_ms
+            @totals["ms"] += time_ms
+          }
+        rescue Exception
+          # Deliberately broad: every failure is counted, then re-raised unchanged.
+          @lock.synchronize {
+            @jobs["#{klass}|f"] += 1
+            @totals["f"] += 1
+          }
+          raise
+        ensure
+          @lock.synchronize {
+            @jobs["#{klass}|p"] += 1
+            @totals["p"] += 1
+          }
+        end
+      end
+      # LONG_TERM = 90 * 24 * 60 * 60
+      # MID_TERM = 7 * 24 * 60 * 60
+      # Expiry, in seconds, of the per-minute stats hash (8 hours).
+      SHORT_TERM = 8 * 60 * 60
+      # Swaps out the accumulated state and writes it to Redis: each histogram
+      # is persisted, then every "<klass>|<metric>" sum is HINCRBY'd into the
+      # "j|YYYYMMDD|H:M" hash for the minute containing +time+ (UTC).
+      #
+      # @param time [Time] timestamp that selects the minute bucket
+      # @return [Integer, nil] nil when nothing was tracked since the last flush;
+      #   otherwise presumably the number of HINCRBY commands queued, assuming
+      #   the +redis+ helper returns its block's value - TODO confirm
+      def flush(time = Time.now)
+        totals, jobs, grams = reset
+        procd = totals["p"]
+        fails = totals["f"]
+        return if procd == 0 && fails == 0
+        now = time.utc
+        # nowdate = now.strftime("%Y%m%d")
+        # nowhour = now.strftime("%Y%m%d|%-H")
+        nowmin = now.strftime("%Y%m%d|%-H:%-M")
+        count = 0
+        redis do |conn|
+          # persist fine-grained histogram data
+          if grams.size > 0
+            conn.pipelined do |pipe|
+              grams.each do |_, gram|
+                gram.persist(pipe, now)
+              end
+            end
+          end
+          # persist coarse grained execution count + execution millis.
+          # note as of today we don't use or do anything with the
+          # daily or hourly rollups.
+          [
+            # ["j", jobs, nowdate, LONG_TERM],
+            # ["j", jobs, nowhour, MID_TERM],
+            ["j", jobs, nowmin, SHORT_TERM]
+          ].each do |prefix, data, bucket, ttl|
+            conn.pipelined do |xa|
+              stats = "#{prefix}|#{bucket}"
+              data.each_pair do |key, value|
+                xa.hincrby stats, key, value
+                count += 1
+              end
+              xa.expire(stats, ttl)
+            end
+          end
+          logger.debug "Flushed #{count} metrics"
+          count
+        end
+      end
+      private
+      # Replaces the three accumulators with fresh ones under the lock and
+      # returns the previous [totals, jobs, grams].
+      def reset
+        @lock.synchronize {
+          array = [@totals, @jobs, @grams]
+          @totals = Hash.new(0)
+          @jobs = Hash.new(0)
+          @grams = Hash.new { |hash, key| hash[key] = Histogram.new(key) }
+          array
+        }
+      end
+    end
+    # Server middleware that hands every job execution to the tracker it was
+    # constructed with.
+    class Middleware
+      include Sidekiq::ServerMiddleware
+      # @param options [#track] the tracker object that receives each execution
+      def initialize(options)
+        @exec = options
+      end
+      # Tracks the job under its "wrapped" class name when present, otherwise
+      # under "class", and runs the rest of the chain inside the tracker.
+      def call(_instance, hash, queue, &block)
+        job_class = hash["wrapped"] || hash["class"]
+        @exec.track(queue, job_class, &block)
+      end
+    end
+  end
+end
+# Server-side wiring: one tracker per configuration, fed by the metrics
+# middleware and flushed on every :beat event.
+Sidekiq.configure_server do |config|
+  tracker = Sidekiq::Metrics::ExecutionTracker.new(config)
+  config.server_middleware { |chain| chain.add(Sidekiq::Metrics::Middleware, tracker) }
+  config.on(:beat) { tracker.flush }
+end