backburner-allq 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (63)
  1. checksums.yaml +7 -0
  2. data/.gitignore +17 -0
  3. data/.travis.yml +29 -0
  4. data/CHANGELOG.md +133 -0
  5. data/CONTRIBUTING.md +37 -0
  6. data/Gemfile +4 -0
  7. data/HOOKS.md +99 -0
  8. data/LICENSE +22 -0
  9. data/README.md +658 -0
  10. data/Rakefile +17 -0
  11. data/TODO +4 -0
  12. data/backburner-allq.gemspec +26 -0
  13. data/bin/backburner +7 -0
  14. data/circle.yml +3 -0
  15. data/deploy.sh +3 -0
  16. data/examples/custom.rb +25 -0
  17. data/examples/demo.rb +60 -0
  18. data/examples/god.rb +46 -0
  19. data/examples/hooked.rb +87 -0
  20. data/examples/retried.rb +31 -0
  21. data/examples/simple.rb +43 -0
  22. data/examples/stress.rb +31 -0
  23. data/lib/backburner.rb +75 -0
  24. data/lib/backburner/allq_wrapper.rb +317 -0
  25. data/lib/backburner/async_proxy.rb +25 -0
  26. data/lib/backburner/cli.rb +53 -0
  27. data/lib/backburner/configuration.rb +48 -0
  28. data/lib/backburner/connection.rb +157 -0
  29. data/lib/backburner/helpers.rb +193 -0
  30. data/lib/backburner/hooks.rb +53 -0
  31. data/lib/backburner/job.rb +118 -0
  32. data/lib/backburner/logger.rb +53 -0
  33. data/lib/backburner/performable.rb +95 -0
  34. data/lib/backburner/queue.rb +145 -0
  35. data/lib/backburner/tasks.rb +54 -0
  36. data/lib/backburner/version.rb +3 -0
  37. data/lib/backburner/worker.rb +221 -0
  38. data/lib/backburner/workers/forking.rb +52 -0
  39. data/lib/backburner/workers/simple.rb +29 -0
  40. data/lib/backburner/workers/threading.rb +163 -0
  41. data/lib/backburner/workers/threads_on_fork.rb +263 -0
  42. data/test/async_proxy_test.rb +36 -0
  43. data/test/back_burner_test.rb +88 -0
  44. data/test/connection_test.rb +179 -0
  45. data/test/fixtures/hooked.rb +122 -0
  46. data/test/fixtures/test_fork_jobs.rb +72 -0
  47. data/test/fixtures/test_forking_jobs.rb +56 -0
  48. data/test/fixtures/test_jobs.rb +87 -0
  49. data/test/fixtures/test_queue_settings.rb +14 -0
  50. data/test/helpers/templogger.rb +22 -0
  51. data/test/helpers_test.rb +278 -0
  52. data/test/hooks_test.rb +112 -0
  53. data/test/job_test.rb +185 -0
  54. data/test/logger_test.rb +44 -0
  55. data/test/performable_test.rb +88 -0
  56. data/test/queue_test.rb +69 -0
  57. data/test/test_helper.rb +128 -0
  58. data/test/worker_test.rb +157 -0
  59. data/test/workers/forking_worker_test.rb +181 -0
  60. data/test/workers/simple_worker_test.rb +350 -0
  61. data/test/workers/threading_worker_test.rb +104 -0
  62. data/test/workers/threads_on_fork_worker_test.rb +484 -0
  63. metadata +217 -0
data/lib/backburner/workers/simple.rb
@@ -0,0 +1,29 @@
+ module Backburner
+   module Workers
+     class Simple < Worker
+       # Used to prepare job queues before processing jobs.
+       # Set up beanstalk tube_names and watch all specified tubes for jobs.
+       #
+       # @raise [Beaneater::NotConnected] If beanstalk fails to connect.
+       # @example
+       #   @worker.prepare
+       #
+       def prepare
+         self.tube_names.map! { |name| expand_tube_name(name) }.uniq!
+         log_info "Working #{tube_names.size} queues: [ #{tube_names.join(', ')} ]"
+         self.connection.tubes.watch!(*self.tube_names)
+       end
+
+       # Starts processing new jobs indefinitely.
+       # Primary way to consume and process jobs in specified tubes.
+       #
+       # @example
+       #   @worker.start
+       #
+       def start
+         prepare
+         loop { work_one_job }
+       end
+     end # Simple
+   end # Workers
+ end # Backburner
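
The Simple worker above is the gem's most direct consumption path: `prepare` expands and watches the configured tubes, then `start` blocks forever in `loop { work_one_job }`. A minimal usage sketch, assuming this fork keeps upstream backburner's `Backburner::Queue` / `enqueue` API (the job class and tube name are invented for illustration):

```ruby
require 'backburner'

# Hypothetical job class; 'demo.addition' is an illustrative tube name.
class AdditionJob
  include Backburner::Queue
  queue 'demo.addition'

  def self.perform(a, b)
    puts "#{a} + #{b} = #{a + b}"
  end
end

Backburner.enqueue(AdditionJob, 1, 2)

# Watch the tube and process jobs until the process is killed.
Backburner::Workers::Simple.new(['demo.addition']).start
```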
data/lib/backburner/workers/threading.rb
@@ -0,0 +1,163 @@
+ require 'concurrent'
+
+ module Backburner
+   module Workers
+     class Threading < Worker
+       attr_accessor :self_read, :self_write, :exit_on_shutdown
+
+       @shutdown_timeout = 10
+
+       class << self
+         attr_accessor :threads_number
+         attr_accessor :shutdown_timeout
+       end
+
+       # Custom initializer just to set @tubes_data
+       def initialize(*args)
+         @tubes_data = {}
+         super
+         self.process_tube_options
+         @exit_on_shutdown = true
+       end
+
+       # Used to prepare job queues before processing jobs.
+       # Set up beanstalk tube_names and watch all specified tubes for jobs.
+       #
+       # @raise [Beaneater::NotConnected] If beanstalk fails to connect.
+       # @example
+       #   @worker.prepare
+       #
+       def prepare
+         self.tube_names.map! { |name| expand_tube_name(name) }.uniq!
+         log_info "Working #{tube_names.size} queues: [ #{tube_names.join(', ')} ]"
+         @thread_pools = {}
+         @tubes_data.each do |name, config|
+           max_threads = (config[:threads] || self.class.threads_number || ::Concurrent.processor_count).to_i
+           @thread_pools[name] = ::Concurrent::ThreadPoolExecutor.new(min_threads: 1, max_threads: max_threads)
+         end
+       end
+
+       # Starts processing new jobs indefinitely.
+       # Primary way to consume and process jobs in specified tubes.
+       #
+       # @example
+       #   @worker.start
+       #
+       def start(wait=true)
+         prepare
+
+         @thread_pools.each do |tube_name, pool|
+           pool.max_length.times do
+             # Create a new connection and set it up to listen on this tube name
+             connection = new_connection.tap { |conn| conn.tubes.watch!(tube_name) }
+             connection.on_reconnect = lambda { |conn| conn.tubes.watch!(tube_name) }
+
+             # Make it work jobs using its own connection per thread
+             pool.post(connection) do |memo_connection|
+               # TODO: use read-write lock?
+               loop do
+                 begin
+                   break if @in_shutdown
+                   work_one_job(memo_connection)
+                 rescue => e
+                   log_error("Exception caught in thread pool loop. Continuing. -> #{e.message}\nBacktrace: #{e.backtrace}")
+                 end
+               end
+
+               connection.close
+             end
+           end
+         end
+
+         wait_for_shutdown! if wait
+       end
+
+       # FIXME: We can't use this on_reconnect method since we don't know which thread
+       # pool the connection belongs to (and therefore we can't re-watch the right tubes).
+       # However, we set the individual connections' on_reconnect method in #start
+       # def on_reconnect(conn)
+       #   watch_tube(@watching_tube, conn) if @watching_tube
+       # end
+
+       # Process the special tube_names of the Threading worker:
+       # The format is tube_name:custom_threads_limit
+       #
+       # @example
+       #   process_tube_names(['foo:10', 'lol'])
+       #   => ['foo', 'lol']
+       def process_tube_names(tube_names)
+         names = compact_tube_names(tube_names)
+         if names.nil?
+           nil
+         else
+           names.map do |name|
+             data = name.split(":")
+             tube_name = data.first
+             threads_number = data[1].empty? ? nil : data[1].to_i rescue nil
+             @tubes_data[expand_tube_name(tube_name)] = {
+               :threads => threads_number
+             }
+             tube_name
+           end
+         end
+       end
+
+       # Process the tube settings.
+       # This overrides @tubes_data set by the process_tube_names method. So if a tube is named 'super_job:5'
+       # and the tube class has the setting queue_jobs_limit 10, the resulting limit will be 10.
+       # If the tube is known to the existing beanstalkd queue, but not to a class, skip it.
+       #
+       def process_tube_options
+         Backburner::Worker.known_queue_classes.each do |queue|
+           next if @tubes_data[expand_tube_name(queue)].nil?
+           queue_settings = {
+             :threads => queue.queue_jobs_limit
+           }
+           @tubes_data[expand_tube_name(queue)].merge!(queue_settings) { |k, v1, v2| v2.nil? ? v1 : v2 }
+         end
+       end
+
+       # Wait for the shutdown signal
+       def wait_for_shutdown!
+         raise Interrupt while IO.select([self_read])
+       rescue Interrupt
+         shutdown
+       end
+
+       def shutdown_threadpools
+         @thread_pools.each { |_name, pool| pool.shutdown }
+         shutdown_time = Time.now
+         @in_shutdown = true
+         all_shutdown = @thread_pools.all? do |_name, pool|
+           time_to_wait = self.class.shutdown_timeout - (Time.now - shutdown_time).to_i
+           pool.wait_for_termination(time_to_wait) if time_to_wait > 0
+         end
+       rescue Interrupt
+         log_info "graceful shutdown aborted, shutting down immediately"
+       ensure
+         kill unless all_shutdown
+       end
+
+       def kill
+         @thread_pools.each { |_name, pool| pool.kill unless pool.shutdown? }
+       end
+
+       def shutdown
+         log_info "beginning graceful worker shutdown"
+         shutdown_threadpools
+         super if @exit_on_shutdown
+       end
+
+       # Registers signal handlers for TERM and INT to trigger graceful shutdown
+       def register_signal_handlers!
+         @self_read, @self_write = IO.pipe
+         %w[TERM INT].each do |sig|
+           trap(sig) do
+             raise Interrupt if @in_shutdown
+             self_write.puts(sig)
+           end
+         end
+       end
+     end # Threading
+   end # Workers
+ end # Backburner
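
The only per-tube knob the Threading worker parses is the `tube_name:threads` suffix; each tube gets its own `Concurrent::ThreadPoolExecutor`, and every pool thread works jobs over its own connection until TERM or INT lands on the self-pipe. A sketch of driving it, with invented tube names, assuming the worker is constructed directly as in the Simple example above:

```ruby
require 'backburner'

# Fallback thread count for tubes without an explicit :N suffix; if this is
# also unset, prepare falls back to Concurrent.processor_count.
Backburner::Workers::Threading.threads_number = 2
# Seconds shutdown_threadpools waits for pools to drain before kill.
Backburner::Workers::Threading.shutdown_timeout = 15

# 'reports:4' caps the reports tube at 4 threads; 'mailers' uses the fallback.
worker = Backburner::Workers::Threading.new(%w[reports:4 mailers])
worker.start # blocks in wait_for_shutdown! until TERM or INT arrives
```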
data/lib/backburner/workers/threads_on_fork.rb
@@ -0,0 +1,263 @@
+ module Backburner
+   module Workers
+     class ThreadsOnFork < Worker
+       class << self
+         attr_accessor :shutdown
+         attr_accessor :threads_number
+         attr_accessor :garbage_after
+         attr_accessor :is_child
+
+         # Return the pids of all alive children/forks
+         def child_pids
+           return [] if is_child
+           @child_pids ||= []
+           tmp_ids = []
+           for id in @child_pids
+             next if id.to_i == Process.pid
+             begin
+               Process.kill(0, id)
+               tmp_ids << id
+             rescue Errno::ESRCH
+             end
+           end
+           @child_pids = tmp_ids if @child_pids != tmp_ids
+           @child_pids
+         end
+
+         # Send a SIGTERM signal to all children.
+         # This is the same as a normal exit:
+         # we are simply asking the children to exit.
+         def stop_forks
+           for id in child_pids
+             begin
+               Process.kill("SIGTERM", id)
+             rescue Errno::ESRCH
+             end
+           end
+         end
+
+         # Send a SIGKILL signal to all children.
+         # This is the same as assassination:
+         # we are KILLING those folks that don't obey us.
+         def kill_forks
+           for id in child_pids
+             begin
+               Process.kill("SIGKILL", id)
+             rescue Errno::ESRCH
+             end
+           end
+         end
+
+         def finish_forks
+           return if is_child
+
+           ids = child_pids
+           if ids.length > 0
+             puts "[ThreadsOnFork workers] Stopping forks: #{ids.join(", ")}"
+             stop_forks
+             Kernel.sleep 1
+             ids = child_pids
+             if ids.length > 0
+               puts "[ThreadsOnFork workers] Killing remaining forks: #{ids.join(", ")}"
+               kill_forks
+               Process.waitall
+             end
+           end
+         end
+       end
+
+       # Custom initializer just to set @tubes_data
+       def initialize(*args)
+         @tubes_data = {}
+         super
+         self.process_tube_options
+       end
+
+       # Process the special tube_names of the ThreadsOnFork worker.
+       # The format is tube_name:custom_threads_limit:custom_garbage_limit:custom_retries
+       # Any custom value can be omitted. So if you want to set just the custom_retries,
+       # you will need to write it as 'tube_name:::10'
+       #
+       # @example
+       #   process_tube_names(['foo:10:5:1', 'bar:2::3', 'lol'])
+       #   => ['foo', 'bar', 'lol']
+       def process_tube_names(tube_names)
+         names = compact_tube_names(tube_names)
+         if names.nil?
+           nil
+         else
+           names.map do |name|
+             data = name.split(":")
+             tube_name = data.first
+             threads_number = data[1].empty? ? nil : data[1].to_i rescue nil
+             garbage_number = data[2].empty? ? nil : data[2].to_i rescue nil
+             retries_number = data[3].empty? ? nil : data[3].to_i rescue nil
+             @tubes_data[expand_tube_name(tube_name)] = {
+               :threads => threads_number,
+               :garbage => garbage_number,
+               :retries => retries_number
+             }
+             tube_name
+           end
+         end
+       end
+
+       # Process the tube settings.
+       # This overrides @tubes_data set by the process_tube_names method. So if a tube is named 'super_job:5:20:10'
+       # and the tube class has the setting queue_jobs_limit 10, the resulting limit will be 10.
+       # If the tube is known to the existing beanstalkd queue, but not to a class, skip it.
+       #
+       def process_tube_options
+         Backburner::Worker.known_queue_classes.each do |queue|
+           next if @tubes_data[expand_tube_name(queue)].nil?
+           queue_settings = {
+             :threads => queue.queue_jobs_limit,
+             :garbage => queue.queue_garbage_limit,
+             :retries => queue.queue_retry_limit
+           }
+           @tubes_data[expand_tube_name(queue)].merge!(queue_settings) { |k, v1, v2| v2.nil? ? v1 : v2 }
+         end
+       end
+
+       def prepare
+         self.tube_names ||= Backburner.default_queues.any? ? Backburner.default_queues : all_existing_queues
+         self.tube_names = Array(self.tube_names)
+         tube_names.map! { |name| expand_tube_name(name) }.uniq!
+         tube_display_names = tube_names.map { |name| "#{name}:#{@tubes_data[name].values}" }
+         log_info "Working #{tube_names.size} queues: [ #{tube_display_names.join(', ')} ]"
+       end
+
+       # For each tube we will call fork_and_watch to create the fork.
+       # The lock argument defines whether this method should block or not.
+       def start(lock=true)
+         prepare
+         tube_names.each do |name|
+           fork_and_watch(name)
+         end
+
+         if lock
+           sleep 0.1 while true
+         end
+       end
+
+       # Make the fork and create a thread to watch the child process.
+       # The exit code '99' means that the fork exited because of the garbage limit.
+       # Any other code is an error.
+       def fork_and_watch(name)
+         create_thread(name) do |tube_name|
+           until self.class.shutdown
+             pid = fork_tube(tube_name)
+             _, status = wait_for_process(pid)
+
+             # 99 = garbaged
+             if status.exitstatus != 99
+               log_error("Catastrophic failure: tube #{tube_name} exited with code #{status.exitstatus}.")
+             end
+           end
+         end
+       end
+
+       # This makes it easy to test
+       def fork_tube(name)
+         fork_it do
+           fork_inner(name)
+         end
+       end
+
+       # Here we are already in the forked child.
+       # We will watch just the selected tube and change the configuration of
+       # queue_config.max_job_retries if needed.
+       #
+       # If we limit the number of threads to 1 it will just run in a loop without
+       # creating any extra thread.
+       def fork_inner(name)
+         if @tubes_data[name]
+           queue_config.max_job_retries = @tubes_data[name][:retries] if @tubes_data[name][:retries]
+         else
+           @tubes_data[name] = {}
+         end
+         @garbage_after = @tubes_data[name][:garbage] || self.class.garbage_after
+         @threads_number = (@tubes_data[name][:threads] || self.class.threads_number || 1).to_i
+
+         @runs = 0
+
+         if @threads_number == 1
+           watch_tube(name)
+           run_while_can
+         else
+           threads_count = Thread.list.count
+           @threads_number.times do
+             create_thread do
+               begin
+                 conn = new_connection
+                 watch_tube(name, conn)
+                 run_while_can(conn)
+               ensure
+                 conn.close if conn
+               end
+             end
+           end
+           sleep 0.1 while Thread.list.count > threads_count
+         end
+
+         coolest_exit
+       end
+
+       # Run work_one_job while we can
+       def run_while_can(conn = connection)
+         while @garbage_after.nil? or @garbage_after > @runs
+           @runs += 1 # FIXME: Likely race condition
+           work_one_job(conn)
+         end
+       end
+
+       # Shortcut for watching a tube on our beanstalk connection
+       def watch_tube(name, conn = connection)
+         # No-op for allq
+       end
+
+       def on_reconnect(conn)
+         watch_tube(@watching_tube, conn) if @watching_tube
+       end
+
+       # Exit with Kernel.exit! to avoid at_exit callbacks that belong to the
+       # parent process.
+       # We will use exit code 99, which means the fork reached the garbage limit.
+       def coolest_exit
+         Kernel.exit! 99
+       end
+
+       # Create a thread. Easy to test
+       def create_thread(*args, &block)
+         Thread.new(*args, &block)
+       end
+
+       # Wait for a specific process. Easy to test
+       def wait_for_process(pid)
+         out = Process.wait2(pid)
+         self.class.child_pids.delete(pid)
+         out
+       end
+
+       # Forks the specified block and adds the process to the child process pool.
+       # FIXME: If blk.call breaks then the pid isn't added to child_pids and is
+       # never shut down
+       def fork_it(&blk)
+         pid = Kernel.fork do
+           self.class.is_child = true
+           $0 = "[ThreadsOnFork worker] parent: #{Process.ppid}"
+           blk.call
+         end
+         self.class.child_pids << pid
+         pid
+       end
+     end
+   end
+ end
+
+ at_exit do
+   unless Backburner::Workers::ThreadsOnFork.is_child
+     Backburner::Workers::ThreadsOnFork.shutdown = true
+   end
+   Backburner::Workers::ThreadsOnFork.finish_forks
+ end
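
As with the Threading worker, all per-tube behaviour here is encoded in the tube-name suffix, `tube:threads:garbage:retries`: one forked child per tube, recycled (exit code 99) once it has worked `garbage` jobs. A hedged sketch from the caller's side, with invented tube names:

```ruby
require 'backburner'

# One fork per tube. 'images:2:100' runs 2 threads in its fork and recycles
# the fork after 100 jobs; 'emails:::5' only overrides max_job_retries to 5.
worker = Backburner::Workers::ThreadsOnFork.new(%w[images:2:100 emails:::5])
worker.start # parent blocks in a sleep loop; the at_exit hook above reaps the forks
```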
+ end