RubyGems - rocketjob - Versions diffs - 2.1.3 → 3.0.0.alpha - Mend

rocketjob 2.1.3 → 3.0.0.alpha

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (47) hide show

checksums.yaml +4 -4
data/README.md +36 -0
data/lib/rocket_job/active_server.rb +48 -0
data/lib/rocket_job/cli.rb +29 -17
data/lib/rocket_job/config.rb +19 -31
data/lib/rocket_job/dirmon_entry.rb +15 -45
data/lib/rocket_job/extensions/mongo/logging.rb +26 -0
data/lib/rocket_job/extensions/rocket_job_adapter.rb +3 -5
data/lib/rocket_job/heartbeat.rb +18 -23
data/lib/rocket_job/job.rb +0 -1
data/lib/rocket_job/job_exception.rb +11 -13
data/lib/rocket_job/jobs/dirmon_job.rb +8 -8
data/lib/rocket_job/jobs/housekeeping_job.rb +13 -15
data/lib/rocket_job/performance.rb +5 -5
data/lib/rocket_job/plugins/cron.rb +3 -10
data/lib/rocket_job/plugins/document.rb +58 -33
data/lib/rocket_job/plugins/job/model.rb +43 -71
data/lib/rocket_job/plugins/job/persistence.rb +7 -63
data/lib/rocket_job/plugins/job/worker.rb +24 -26
data/lib/rocket_job/plugins/processing_window.rb +6 -9
data/lib/rocket_job/plugins/retry.rb +3 -8
data/lib/rocket_job/plugins/singleton.rb +1 -1
data/lib/rocket_job/plugins/state_machine.rb +1 -7
data/lib/rocket_job/server.rb +352 -0
data/lib/rocket_job/version.rb +1 -1
data/lib/rocket_job/worker.rb +46 -336
data/lib/rocketjob.rb +5 -4
data/test/config/mongoid.yml +88 -0
data/test/config_test.rb +1 -1
data/test/dirmon_entry_test.rb +15 -79
data/test/dirmon_job_test.rb +6 -6
data/test/job_test.rb +2 -2
data/test/plugins/job/callbacks_test.rb +40 -32
data/test/plugins/job/defaults_test.rb +10 -8
data/test/plugins/job/model_test.rb +1 -3
data/test/plugins/job/persistence_test.rb +11 -13
data/test/plugins/job/worker_test.rb +45 -26
data/test/plugins/processing_window_test.rb +4 -4
data/test/plugins/restart_test.rb +11 -12
data/test/plugins/state_machine_event_callbacks_test.rb +20 -18
data/test/plugins/state_machine_test.rb +5 -5
data/test/test_helper.rb +4 -1
metadata +15 -29
data/lib/rocket_job/extensions/mongo.rb +0 -23
data/lib/rocket_job/extensions/mongo_mapper.rb +0 -30
data/lib/rocket_job/plugins/job/defaults.rb +0 -40
data/test/config/mongo.yml +0 -46

data/lib/rocket_job/version.rb CHANGED Viewed

@@ -1,4 +1,4 @@
 # encoding: UTF-8
 module RocketJob #:nodoc
-  VERSION = '2.1.3'
+  VERSION = '3.0.0.alpha'
 end

data/lib/rocket_job/worker.rb CHANGED Viewed

@@ -1,354 +1,93 @@
 # encoding: UTF-8
 require 'concurrent'
+require 'forwardable'
 module RocketJob
   # Worker
   #
-  # On startup a worker instance will automatically register itself
-  # if not already present
-  #
-  # Starting a worker in the foreground:
-  #   - Using a Rails runner:
-  #     bin/rocketjob
-  #
-  # Starting a worker in the background:
-  #   - Using a Rails runner:
-  #     nohup bin/rocketjob --quiet 2>&1 1>output.log &
-  #
-  # Stopping a worker:
-  #   - Stop the worker via the Web UI
-  #   - Send a regular kill signal to make it shutdown once all active work is complete
-  #       kill <pid>
-  #   - Or, use the following Ruby code:
-  #     worker = RocketJob::Worker.where(name: 'worker name').first
-  #     worker.stop!
-  #
-  #   Sending the kill signal locally will result in starting the shutdown process
-  #   immediately. Via the UI or Ruby code the worker can take up to 15 seconds
-  #   (the heartbeat interval) to start shutting down.
+  # A worker runs on a single operating system thread.
+  # It is usually started under a RocketJob server process.
   class Worker
-    include Plugins::Document
-    include Plugins::StateMachine
     include SemanticLogger::Loggable
+    include ActiveSupport::Callbacks
+    extend Forwardable
-    # @formatter:off
-    # Unique Name of this worker instance
-    #   Default: `host name:PID`
-    # The unique name is used on re-start to re-queue any jobs that were being processed
-    # at the time the worker or host unexpectedly terminated, if any
-    key :name,               String, default: -> { "#{SemanticLogger.host}:#{$$}" }
-    # The maximum number of threads that this worker should use
-    #   If set, it will override the default value in RocketJob::Config
-    key :max_threads,        Integer, default: -> { Config.instance.max_worker_threads }
-    # When this worker process was started
-    key :started_at,         Time
-    # The heartbeat information for this worker
-    has_one :heartbeat,      class_name: 'RocketJob::Heartbeat'
-    # Current state
-    #   Internal use only. Do not set this field directly
-    key :state,              Symbol, default: :starting
-    validates_presence_of :state, :name, :max_threads
-    # States
-    #   :starting -> :running -> :paused
-    #                         -> :stopping
-    aasm column: :state do
-      state :starting, initial: true
-      state :running
-      state :paused
-      state :stopping
-      event :started do
-        transitions from: :starting, to: :running
-        before do
-          self.started_at = Time.now
-        end
-      end
-      event :pause do
-        transitions from: :running, to: :paused
-      end
-      event :resume do
-        transitions from: :paused, to: :running
-      end
-      event :stop do
-        transitions from: :running,  to: :stopping
-        transitions from: :paused,   to: :stopping
-        transitions from: :starting, to: :stopping
-      end
-    end
-    # @formatter:on
-    # Requeue any jobs being worked by this worker when it is destroyed
-    before_destroy :requeue_jobs
-    # Run the worker process
-    # Attributes supplied are passed to #new
-    def self.run(attrs={})
-      Thread.current.name = 'rocketjob main'
-      create_indexes
-      register_signal_handlers
-      if defined?(RocketJobPro) && (RocketJob::Job.database.name != RocketJob::Jobs::PerformanceJob.database.name)
-        raise 'The RocketJob configuration is being applied after the system has been initialized'
-      end
-      worker = create!(attrs)
-      if worker.max_threads == 0
-        # Does not start any additional threads and runs the worker in the current thread.
-        # No heartbeats are performed. So this worker will appear as a zombie in RJMC.
-        # Designed for profiling purposes where a single thread is much simpler to profile.
-        worker.started!
-        worker.send(:worker, 0)
-      else
-        worker.send(:run)
-      end
-    ensure
-      worker.destroy if worker
-    end
+    def_delegator :@thread, :alive?
+    def_delegator :@thread, :backtrace
+    def_delegator :@thread, :join
-    # Create indexes
-    def self.create_indexes
-      ensure_index [[:name, 1]], background: true, unique: true
-      # Also create indexes for the jobs collection
-      Job.create_indexes
-    end
+    define_callbacks :running
-    # Destroy's all instances of zombie workers and requeues any jobs still "running"
-    # on those workers
-    def self.destroy_zombies
-      count = 0
-      each do |worker|
-        next unless worker.zombie?
-        logger.warn "Destroying zombie worker #{worker.name}, and requeueing its jobs"
-        worker.destroy
-        count += 1
-      end
-      count
-    end
+    attr_accessor :id, :worker_name, :inline
+    attr_reader :thread, :name
-    # Stop all running, paused, or starting workers
-    def self.stop_all
-      where(state: [:running, :paused, :starting]).each(&:stop!)
+    def self.before_running(*filters, &blk)
+      set_callback(:running, :before, *filters, &blk)
     end
-    # Pause all running workers
-    def self.pause_all
-      running.each(&:pause!)
+    def self.after_running(*filters, &blk)
+      set_callback(:running, :after, *filters, &blk)
     end
-    # Resume all paused workers
-    def self.resume_all
-      paused.each(&:resume!)
+    def self.around_running(*filters, &blk)
+      set_callback(:running, :around, *filters, &blk)
     end
-    # Returns [Hash<String:Integer>] of the number of workers in each state.
-    # Note: If there are no workers in that particular state then the hash will not have a value for it.
-    #
-    # Example workers in every state:
-    #   RocketJob::Worker.counts_by_state
-    #   # => {
-    #          :aborted => 1,
-    #          :completed => 37,
-    #          :failed => 1,
-    #          :paused => 3,
-    #          :queued => 4,
-    #          :running => 1,
-    #          :queued_now => 1,
-    #          :scheduled => 3
-    #        }
-    #
-    # Example no workers active:
-    #   RocketJob::Worker.counts_by_state
-    #   # => {}
-    def self.counts_by_state
-      counts = {}
-      collection.aggregate([
-        {
-          '$group' => {
-            _id:   '$state',
-            count: {'$sum' => 1}
-          }
-        }
-      ]
-      ).each do |result|
-        counts[result['_id'].to_sym] = result['count']
+    def initialize(id: 0, server_name: 'inline', inline: false)
+      @id          = id
+      @server_name = server_name
+      if defined?(Concurrent::JavaAtomicBoolean) || defined?(Concurrent::CAtomicBoolean)
+        @shutdown = Concurrent::AtomicBoolean.new(false)
+      else
+        @shutdown = false
       end
-      counts
-    end
-    # Returns [Boolean] whether the worker is shutting down
-    def shutting_down?
-      self.class.shutdown? || !running?
-    end
-    # Returns [true|false] if this worker has missed at least the last 4 heartbeats
-    #
-    # Possible causes for a worker to miss its heartbeats:
-    # - The worker process has died
-    # - The worker process is "hanging"
-    # - The worker is no longer able to communicate with the MongoDB Server
-    def zombie?(missed = 4)
-      return false unless running? || stopping?
-      return true if heartbeat.nil? || heartbeat.updated_at.nil?
-      dead_seconds = Config.instance.heartbeat_seconds * missed
-      (Time.now - heartbeat.updated_at) >= dead_seconds
+      @name   = "#{server_name}:#{id}"
+      @thread = Thread.new { run } unless inline
     end
-    # On MRI the 'concurrent-ruby-ext' gem may not be loaded
     if defined?(Concurrent::JavaAtomicBoolean) || defined?(Concurrent::CAtomicBoolean)
-      # Returns [true|false] whether the shutdown indicator has been set for this worker process
-      def self.shutdown?
-        @@shutdown.value
+      # Tells this worker to shut down as soon as the current job/slice is complete
+      def shutdown!
+        @shutdown.make_true
       end
-      # Set shutdown indicator for this worker process
-      def self.shutdown!
-        @@shutdown.make_true
+      def shutdown?
+        @shutdown.value
       end
-      @@shutdown = Concurrent::AtomicBoolean.new(false)
     else
-      # Returns [true|false] whether the shutdown indicator has been set for this worker process
-      def self.shutdown?
-        @@shutdown
+      def shutdown!
+        @shutdown = true
       end
-      # Set shutdown indicator for this worker process
-      def self.shutdown!
-        @@shutdown = true
+      def shutdown?
+        @shutdown
       end
-      @@shutdown = false
     end
     private
-    attr_reader :worker_threads
-    # Returns [Array<Thread>] collection of created worker threads
-    def worker_threads
-      @worker_threads ||= []
-    end
-    # Management Thread
+    # Process jobs until it shuts down
+    #
+    # Takes no arguments:
+    #   id [Integer] is read from this worker instance
+    #     The number of this worker for logging purposes
     def run
-      logger.info "Using MongoDB Database: #{RocketJob::Job.database.name}"
-      build_heartbeat(updated_at: Time.now, current_threads: 0)
-      started!
-      adjust_worker_threads(true)
-      logger.info "RocketJob Worker started with #{max_threads} workers running"
-      count = 0
-      while running? || paused?
-        sleep Config.instance.heartbeat_seconds
-        update_attributes_and_reload(
-          'heartbeat.updated_at'      => Time.now,
-          'heartbeat.current_threads' => worker_count
-        )
-        # In case number of threads has been modified
-        adjust_worker_threads
-        # Stop worker if shutdown indicator was set
-        stop! if self.class.shutdown? && may_stop?
-      end
-      logger.info 'Waiting for worker threads to stop'
-      while thread = worker_threads.first
-        if thread.join(5)
-          # Worker thread is dead
-          worker_threads.shift
-        else
-          # Timeout waiting for thread to stop
-          begin
-            update_attributes_and_reload(
-              'heartbeat.updated_at'      => Time.now,
-              'heartbeat.current_threads' => worker_count
-            )
-          rescue MongoMapper::DocumentNotFound
-            logger.warn('Worker has been destroyed. Going down hard!')
-            break
-          end
-        end
-      end
-      logger.info 'Shutdown'
-    rescue Exception => exc
-      logger.error('RocketJob::Worker is stopping due to an exception', exc)
-    end
-    # Returns [Fixnum] number of workers (threads) that are alive
-    def worker_count
-      worker_threads.count { |i| i.alive? }
-    end
-    def next_worker_id
-      @worker_id ||= 0
-      @worker_id += 1
-    end
-    # Re-adjust the number of running threads to get it up to the
-    # required number of threads
-    #   Parameters
-    #     stagger_threads
-    #       Whether to stagger when the threads poll for work the first time
-    #       It spreads out the queue polling over the max_poll_seconds so
-    #       that not all workers poll at the same time
-    #       The worker also respond faster than max_poll_seconds when a new
-    #       job is added.
-    def adjust_worker_threads(stagger_threads=false)
-      count = worker_count
-      # Cleanup threads that have stopped
-      if count != worker_threads.count
-        logger.info "Cleaning up #{worker_threads.count - count} threads that went away"
-        worker_threads.delete_if { |t| !t.alive? }
-      end
-      return if shutting_down?
-      # Need to add more threads?
-      if count < max_threads
-        thread_count = max_threads - count
-        logger.info "Starting #{thread_count} threads"
-        thread_count.times.each do
-          # Start worker thread
-          worker_threads << Thread.new(next_worker_id) do |id|
-            begin
-              sleep (Config.instance.max_poll_seconds.to_f / max_threads) * (id - 1) if stagger_threads
-              worker(id)
-            rescue Exception => exc
-              logger.fatal('Cannot start worker thread', exc)
-            end
-          end
-        end
-      end
-    end
-    # Keep processing jobs until worker stops running
-    def worker(worker_id)
-      Thread.current.name = 'rocketjob %03i' % worker_id
+      Thread.current.name = 'rocketjob %03i' % id
       logger.info 'Started'
-      while !shutting_down?
+      while !shutdown?
         if process_available_jobs
           # Keeps workers staggered across the poll interval so that
           # all workers don't poll at the same time
           sleep rand(RocketJob::Config.instance.max_poll_seconds * 1000) / 1000
         else
-          break if shutting_down?
+          break if shutdown?
           sleep RocketJob::Config.instance.max_poll_seconds
         end
       end
-      logger.info "Stopping. Worker state: #{state.inspect}"
+      logger.info 'Stopping'
     rescue Exception => exc
       logger.fatal('Unhandled exception in job processing thread', exc)
     ensure
+      # TODO: Move to after_running callback
       ActiveRecord::Base.clear_active_connections! if defined?(ActiveRecord::Base)
     end
@@ -357,7 +96,7 @@ module RocketJob
     def process_available_jobs
       skip_job_ids = []
       processed    = false
-      while (job = Job.rocket_job_next_job(name, skip_job_ids)) && !shutting_down?
+      while (job = Job.rocket_job_next_job(worker_name, skip_job_ids)) && !shutdown?
         logger.fast_tag("job:#{job.id}") do
           if job.rocket_job_work(self)
             # Need to skip the specified job due to throttling or no work available
@@ -370,35 +109,6 @@ module RocketJob
       processed
     end
-    # Register handlers for the various signals
-    # Term:
-    #   Perform clean shutdown
-    #
-    def self.register_signal_handlers
-      begin
-        Signal.trap 'SIGTERM' do
-          shutdown!
-          message = 'Shutdown signal (SIGTERM) received. Will shutdown as soon as active jobs/slices have completed.'
-          # Logging uses a mutex to access Queue on MRI/CRuby
-          defined?(JRuby) ? logger.warn(message) : puts(message)
-        end
-        Signal.trap 'INT' do
-          shutdown!
-          message = 'Shutdown signal (INT) received. Will shutdown as soon as active jobs/slices have completed.'
-          # Logging uses a mutex to access Queue on MRI/CRuby
-          defined?(JRuby) ? logger.warn(message) : puts(message)
-        end
-      rescue StandardError
-        logger.warn 'SIGTERM handler not installed. Not able to shutdown gracefully'
-      end
-    end
-    # Requeue any jobs assigned to this worker when it is destroyed
-    def requeue_jobs
-      RocketJob::Job.requeue_dead_worker(name)
-    end
   end
 end

data/lib/rocketjob.rb CHANGED Viewed

@@ -1,13 +1,12 @@
 # encoding: UTF-8
 require 'semantic_logger'
-require 'rocket_job/extensions/mongo'
-require 'mongo_ha'
-require 'mongo_mapper'
-require 'rocket_job/extensions/mongo_mapper'
+require 'mongoid'
+require 'rocket_job/extensions/mongo/logging'
 require 'rocket_job/version'
 # @formatter:off
 module RocketJob
+  autoload :ActiveServer,       'rocket_job/active_server'
   autoload :CLI,                'rocket_job/cli'
   autoload :Config,             'rocket_job/config'
   autoload :DirmonEntry,        'rocket_job/dirmon_entry'
@@ -15,6 +14,8 @@ module RocketJob
   autoload :Job,                'rocket_job/job'
   autoload :JobException,       'rocket_job/job_exception'
   autoload :Worker,             'rocket_job/worker'
+  autoload :Performance,        'rocket_job/performance'
+  autoload :Server,             'rocket_job/server'
   module Plugins
     module Job