RubyGems - spbtv_redis_failover - Versions diffs - 1.0.2.1 - Mend

spbtv_redis_failover 1.0.2.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (53) hide show

checksums.yaml +7 -0
data/.gitignore +19 -0
data/.travis.yml +7 -0
data/.yardopts +6 -0
data/Changes.md +191 -0
data/Gemfile +2 -0
data/LICENSE +22 -0
data/README.md +240 -0
data/Rakefile +9 -0
data/bin/redis_node_manager +7 -0
data/examples/config.yml +17 -0
data/examples/multiple_environments_config.yml +15 -0
data/lib/redis_failover.rb +25 -0
data/lib/redis_failover/cli.rb +142 -0
data/lib/redis_failover/client.rb +517 -0
data/lib/redis_failover/errors.rb +54 -0
data/lib/redis_failover/failover_strategy.rb +25 -0
data/lib/redis_failover/failover_strategy/latency.rb +21 -0
data/lib/redis_failover/manual_failover.rb +52 -0
data/lib/redis_failover/node.rb +190 -0
data/lib/redis_failover/node_manager.rb +741 -0
data/lib/redis_failover/node_snapshot.rb +81 -0
data/lib/redis_failover/node_strategy.rb +34 -0
data/lib/redis_failover/node_strategy/consensus.rb +18 -0
data/lib/redis_failover/node_strategy/majority.rb +18 -0
data/lib/redis_failover/node_strategy/single.rb +17 -0
data/lib/redis_failover/node_watcher.rb +83 -0
data/lib/redis_failover/runner.rb +27 -0
data/lib/redis_failover/util.rb +137 -0
data/lib/redis_failover/version.rb +3 -0
data/misc/redis_failover.png +0 -0
data/spbtv_redis_failover.gemspec +26 -0
data/spec/cli_spec.rb +75 -0
data/spec/client_spec.rb +153 -0
data/spec/failover_strategy/latency_spec.rb +41 -0
data/spec/failover_strategy_spec.rb +17 -0
data/spec/node_manager_spec.rb +136 -0
data/spec/node_snapshot_spec.rb +30 -0
data/spec/node_spec.rb +84 -0
data/spec/node_strategy/consensus_spec.rb +30 -0
data/spec/node_strategy/majority_spec.rb +22 -0
data/spec/node_strategy/single_spec.rb +22 -0
data/spec/node_strategy_spec.rb +22 -0
data/spec/node_watcher_spec.rb +58 -0
data/spec/spec_helper.rb +21 -0
data/spec/support/config/multiple_environments.yml +15 -0
data/spec/support/config/multiple_environments_with_chroot.yml +17 -0
data/spec/support/config/single_environment.yml +7 -0
data/spec/support/config/single_environment_with_chroot.yml +8 -0
data/spec/support/node_manager_stub.rb +87 -0
data/spec/support/redis_stub.rb +105 -0
data/spec/util_spec.rb +21 -0
metadata +207 -0

data/lib/redis_failover/errors.rb ADDED Viewed

@@ -0,0 +1,54 @@
+module RedisFailover
+  # Base class for all RedisFailover errors.
+  class Error < StandardError
+  end
+  # Raised when a node is specified incorrectly.
+  class InvalidNodeError < Error
+  end
+  # Raised when a node changes to an invalid/unknown state.
+  class InvalidNodeStateError < Error
+    def initialize(node, state)
+      super("Invalid state change `#{state}` for node #{node}")
+    end
+  end
+  # Raised when a node is unavailable (i.e., unreachable via network).
+  class NodeUnavailableError < Error
+    def initialize(node)
+      super("Node: #{node}")
+    end
+  end
+  # Raised when no master is currently available.
+  class NoMasterError < Error
+  end
+  # Raised when more than one master is found on startup.
+  class MultipleMastersError < Error
+    def initialize(nodes)
+      super("Multiple nodes with master role: #{nodes.map(&:to_s)}")
+    end
+  end
+  # Raised when no slave is currently available.
+  class NoSlaveError < Error
+  end
+  # Raised when a redis server is no longer using the same role
+  # as previously assumed.
+  class InvalidNodeRoleError < Error
+    def initialize(node, assumed, actual)
+      super("Invalid role detected for node #{node}, client thought " +
+        "it was a #{assumed}, but it's now a #{actual}")
+    end
+  end
+  # Raised when an unsupported redis operation is performed.
+  class UnsupportedOperationError < Error
+    def initialize(operation)
+      super("Operation `#{operation}` is currently unsupported")
+    end
+  end
+end

data/lib/redis_failover/failover_strategy.rb ADDED Viewed

@@ -0,0 +1,25 @@
+module RedisFailover
+  # Base class for strategies that determine which node is used during failover.
+  class FailoverStrategy
+    include Util
+    # Loads a strategy based on the given name.
+    #
+    # @param [String, Symbol] name the strategy name
+    # @return [Object] a new strategy instance
+    def self.for(name)
+      require "redis_failover/failover_strategy/#{name.downcase}"
+      const_get(name.capitalize).new
+    rescue LoadError, NameError
+      raise "Failed to find failover strategy: #{name}"
+    end
+    # Returns a candidate node as determined by this strategy.
+    #
+    # @param [Hash<Node, NodeSnapshot>] snapshots the node snapshots
+    # @return [Node] the candidate node or nil if one couldn't be found
+    def find_candidate(snapshots)
+      raise NotImplementedError
+    end
+  end
+end

data/lib/redis_failover/failover_strategy/latency.rb ADDED Viewed

@@ -0,0 +1,21 @@
+module RedisFailover
+  class FailoverStrategy
+    # Failover strategy that selects an available node that is both seen by all
+    # node managers and has the lowest reported health check latency.
+    class Latency < FailoverStrategy
+      # @see RedisFailover::FailoverStrategy#find_candidate
+      def find_candidate(snapshots)
+        candidates = {}
+        snapshots.each do |node, snapshot|
+          if snapshot.all_available?
+            candidates[node] = snapshot.avg_latency
+          end
+        end
+        if candidate = candidates.min_by(&:last)
+          candidate.first
+        end
+      end
+    end
+  end
+end

data/lib/redis_failover/manual_failover.rb ADDED Viewed

@@ -0,0 +1,52 @@
+module RedisFailover
+  # Provides manual failover support to a new master.
+  class ManualFailover
+    # Path for manual failover communication.
+    ZNODE_PATH = 'manual_failover'.freeze
+    # Denotes that any slave can be used as a candidate for promotion.
+    ANY_SLAVE = "ANY_SLAVE".freeze
+    def self.path(root_znode)
+      "#{root_znode}/#{ZNODE_PATH}"
+    end
+    # Creates a new instance.
+    #
+    # @param [ZK] zk the ZooKeeper client
+    # @param [ZNode] root_znode the root ZK node
+    # @param [Hash] options the options used for manual failover
+    # @option options [String] :host the host of the failover candidate
+    # @option options [String] :port the port of the failover candidate
+    # @note
+    #   If options is empty, a random slave will be used
+    #   as a failover candidate.
+    def initialize(zk, root_znode, options = {})
+      @zk = zk
+      @root_znode = root_znode
+      @options = options
+      unless @options.empty?
+        port = Integer(@options[:port]) rescue nil
+        raise ArgumentError, ':host not properly specified' if @options[:host].to_s.empty?
+        raise ArgumentError, ':port not properly specified' if port.nil?
+      end
+    end
+    # Performs a manual failover.
+    def perform
+      create_path
+      node = @options.empty? ? ANY_SLAVE : "#{@options[:host]}:#{@options[:port]}"
+      @zk.set(self.class.path(@root_znode), node)
+    end
+    private
+    # Creates the znode path used for coordinating manual failovers.
+    def create_path
+      @zk.create(self.class.path(@root_znode))
+    rescue ZK::Exceptions::NodeExists
+      # best effort
+    end
+  end
+end

data/lib/redis_failover/node.rb ADDED Viewed

@@ -0,0 +1,190 @@
+module RedisFailover
+  # Represents a redis node (master or slave). Instances of this class
+  # are used by the NodeManager and NodeWatcher to manipulate real redis
+  # servers.
+  class Node
+    include Util
+    # Maximum amount of time given for any redis operation to complete.
+    # If a redis operation doesn't complete in the allotted time, a
+    # NodeUnavailableError will be raised.
+    MAX_OP_WAIT_TIME = 5
+    # @return [String] the redis server host
+    attr_reader :host
+    # @return [Integer] the redis server port
+    attr_reader :port
+    # Creates a new instance.
+    #
+    # @param [Hash] options the options used to create the node
+    # @option options [String] :host the host of the redis server
+    # @option options [String] :port the port of the redis server
+    #   (defaults to 6379)
+    # @option options [String] :password the password passed to the redis client
+    # @raise [InvalidNodeError] if :host is missing or blank
+    def initialize(options = {})
+      @host = options[:host]
+      raise InvalidNodeError, 'missing host' if @host.to_s.empty?
+      @port = Integer(options[:port] || 6379)
+      @password = options[:password]
+    end
+    # @return [Boolean] true if this node is a master, false otherwise
+    def master?
+      role == 'master'
+    end
+    # @return [Boolean] true if this node is a slave, false otherwise
+    def slave?
+      !master?
+    end
+    # Determines if this node is a slave of the given master.
+    #
+    # @param [Node] master the master to check
+    # @return [Boolean] true if slave of master, false otherwise
+    def slave_of?(master)
+      current_master == master
+    end
+    # Determines current master of this slave.
+    #
+    # @return [Node] the node representing the master of this slave, or
+    #   nil if this node does not report the slave role
+    def current_master
+      info = fetch_info
+      return unless info[:role] == 'slave'
+      Node.new(:host => info[:master_host], :port => info[:master_port].to_i)
+    end
+    # Waits until something interesting happens. If the connection
+    # with this node dies, the blpop call will raise an error. If
+    # the blpop call returns without error, then this will be due to
+    # a graceful shutdown signaled by #wakeup or a timeout.
+    def wait
+      perform_operation do |redis|
+        # the blpop timeout stays below MAX_OP_WAIT_TIME, which bounds the
+        # whole operation in #perform_operation
+        redis.blpop(wait_key, MAX_OP_WAIT_TIME - 3)
+        redis.del(wait_key)
+      end
+    end
+    # Wakes up this node by pushing a value to its internal
+    # queue used by #wait.
+    def wakeup
+      perform_operation do |redis|
+        redis.lpush(wait_key, '1')
+      end
+    end
+    # Makes this node a slave of the given node.
+    #
+    # @param [Node] node the node of which to become a slave
+    def make_slave!(node)
+      perform_operation do |redis|
+        unless slave_of?(node)
+          redis.slaveof(node.host, node.port)
+          logger.info("#{self} is now a slave of #{node}")
+          wakeup
+        end
+      end
+    end
+    # Makes this node a master node.
+    def make_master!
+      perform_operation do |redis|
+        unless master?
+          redis.slaveof('no', 'one')
+          logger.info("#{self} is now master")
+          wakeup
+        end
+      end
+    end
+    # @return [String] an inspect string for this node
+    def inspect
+      "<RedisFailover::Node #{to_s}>"
+    end
+    # @return [String] a friendly string for this node
+    def to_s
+      "#{@host}:#{@port}"
+    end
+    # Determines if this node is equal to another node.
+    #
+    # @param [Node] other the other node to compare
+    # @return [Boolean] true if equal, false otherwise
+    def ==(other)
+      return false unless Node === other
+      return true if self.equal?(other)
+      [host, port] == [other.host, other.port]
+    end
+    alias_method :eql?, :==
+    # @return [Integer] a hash value for this node
+    def hash
+      to_s.hash
+    end
+    # Fetches information/stats for this node.
+    #
+    # @return [Hash] the info for this node
+    def fetch_info
+      perform_operation do |redis|
+        symbolize_keys(redis.info)
+      end
+    end
+    alias_method :ping, :fetch_info
+    # @return [Boolean] determines if this node prohibits stale reads
+    def prohibits_stale_reads?
+      perform_operation do |redis|
+        redis.config('get', 'slave-serve-stale-data').last == 'no'
+      end
+    end
+    # @return [Boolean] determines if this node is syncing with its master
+    def syncing_with_master?
+      # fetch_info already runs inside its own #perform_operation; wrapping
+      # it in a second one only opened an extra, unused redis connection
+      fetch_info[:master_sync_in_progress] == '1'
+    end
+    private
+    # @return [String] the current role for this node
+    def role
+      fetch_info[:role]
+    end
+    # @return [String] the name of the wait queue for this node
+    def wait_key
+      @wait_key ||= "_redis_failover_#{SecureRandom.hex(32)}"
+    end
+    # @return [Redis] a new redis client instance for this node
+    def new_client
+      Redis.new(:host => @host, :password => @password, :port => @port)
+    end
+    # Safely performs a redis operation within a given timeout window.
+    # A new client is created for the operation and disconnected afterwards.
+    #
+    # @yield [Redis] the redis client to use for the operation
+    # @return [Object] the value returned by the block
+    # @raise [NodeUnavailableError] if node is currently unreachable
+    def perform_operation
+      redis = nil
+      Timeout.timeout(MAX_OP_WAIT_TIME) do
+        redis = new_client
+        yield redis
+      end
+    rescue NodeUnavailableError
+      # raised by a nested #perform_operation; pass it through unchanged
+      # instead of wrapping the message a second time
+      raise
+    rescue StandardError, Timeout::Error => ex
+      # Deliberately not `rescue Exception`: SystemExit, Interrupt and other
+      # signals must propagate instead of being reported as a dead node.
+      raise NodeUnavailableError, "#{ex.class}: #{ex.message}", ex.backtrace
+    ensure
+      if redis
+        begin
+          redis.client.disconnect
+        rescue StandardError, Timeout::Error => ex
+          raise NodeUnavailableError, "#{ex.class}: #{ex.message}", ex.backtrace
+        end
+      end
+    end
+  end
+end

data/lib/redis_failover/node_manager.rb ADDED Viewed

@@ -0,0 +1,741 @@
+module RedisFailover
+  # NodeManager manages a list of redis nodes. Upon startup, the NodeManager
+  # will discover the current redis master and slaves. Each redis node is
+  # monitored by a NodeWatcher instance. The NodeWatchers periodically
+  # report the current state of the redis node it's watching to the
+  # NodeManager. The NodeManager processes the state reports and reacts
+  # appropriately by handling stale/dead nodes, and promoting a new redis master
+  # if it sees fit to do so.
+  class NodeManager
+    include Util
+    # Number of seconds to wait before retrying bootstrap process.
+    TIMEOUT = 5
+    # Number of seconds for checking node snapshots.
+    CHECK_INTERVAL = 5
+    # Number of max attempts to promote a master before releasing master lock.
+    MAX_PROMOTION_ATTEMPTS = 3
+    # Latency threshold for recording node state.
+    LATENCY_THRESHOLD = 0.5
+    # Errors that can happen during the node discovery process.
+    NODE_DISCOVERY_ERRORS = [
+      InvalidNodeRoleError,
+      NodeUnavailableError,
+      NoMasterError,
+      MultipleMastersError
+    ].freeze
+    # Creates a new instance.
+    #
+    # @param [Hash] options the options used to initialize the manager
+    # @option options [String] :zkservers comma-separated ZK host:port pairs
+    # @option options [String] :znode_path znode path override for redis nodes
+    # @option options [String] :password password for redis nodes
+    # @option options [Array<String>] :nodes the nodes to manage
+    # @option options [String] :max_failures the max failures for a node
+    def initialize(options)
+      logger.info("Redis Node Manager v#{VERSION} starting (#{RUBY_DESCRIPTION})")
+      @options = options
+      @required_node_managers = options.fetch(:required_node_managers, 1)
+      @root_znode = options.fetch(:znode_path, Util::DEFAULT_ROOT_ZNODE_PATH)
+      @node_strategy = NodeStrategy.for(options.fetch(:node_strategy, :majority))
+      @failover_strategy = FailoverStrategy.for(options.fetch(:failover_strategy, :latency))
+      @nodes = Array(@options[:nodes]).map { |opts| Node.new(opts) }.uniq
+      @master_manager = false
+      @master_promotion_attempts = 0
+      @sufficient_node_managers = false
+      @lock = Monitor.new
+      @shutdown = false
+    end
+    # Starts the node manager: sets up ZooKeeper, spawns the node watchers
+    # and then waits to become the master manager.
+    #
+    # On a ZK error or a NoMasterError the manager is reset, sleeps for
+    # TIMEOUT seconds and the whole sequence is retried; there is no upper
+    # bound on the number of retries.
+    #
+    # @note This method does not return until the manager terminates.
+    def start
+      # running? is defined outside this view
+      return unless running?
+      setup_zk
+      spawn_watchers
+      wait_until_master
+    rescue *ZK_ERRORS => ex
+      logger.error("ZK error while attempting to manage nodes: #{ex.inspect}")
+      reset
+      sleep(TIMEOUT)
+      # re-runs the method body from the top
+      retry
+    rescue NoMasterError
+      logger.error("Failed to promote a new master after #{MAX_PROMOTION_ATTEMPTS} attempts.")
+      reset
+      sleep(TIMEOUT)
+      retry
+    end
+    # Records a state report for a node. Used primarily by
+    # {RedisFailover::NodeWatcher} to inform the manager of watched node states.
+    # Reports are ignored when the manager is not running; any StandardError
+    # raised while handling the report is logged and not re-raised.
+    #
+    # @param [Node] node the node
+    # @param [Symbol] state the state
+    # @param [Integer] latency an optional latency
+    def notify_state(node, state, latency = nil)
+      begin
+        @lock.synchronize do
+          update_current_state(node, state, latency) if running?
+        end
+      rescue => ex
+        logger.error("Error handling state report #{[node, state].inspect}: #{ex.inspect}")
+        logger.error(ex.backtrace.join("\n"))
+      end
+    end
+    # Performs a reset of the manager.
+    def reset
+      @master_manager = false
+      @master_promotion_attempts = 0
+      @watchers.each(&:shutdown) if @watchers
+    end
+    # Initiates a graceful shutdown.
+    def shutdown
+      logger.info('Shutting down ...')
+      @lock.synchronize do
+        @shutdown = true
+      end
+      reset
+      exit
+    end
+    private
+    # Configures the ZooKeeper client.
+    #
+    # The client is created only once; on later calls (e.g. after a retry in
+    # #start) only the znode paths and the manual failover watch are
+    # re-established.
+    def setup_zk
+      unless @zk
+        # connection string is the server list followed by an optional chroot
+        @zk = ZK.new("#{@options[:zkservers]}#{@options[:chroot] || ''}")
+        @zk.register(manual_failover_path) do |event|
+          handle_manual_failover_update(event)
+        end
+        # re-arm the manual failover watch whenever the client connects
+        @zk.on_connected { @zk.stat(manual_failover_path, :watch => true) }
+      end
+      create_path(@root_znode)
+      create_path(current_state_root)
+      # arm the watch for this run
+      @zk.stat(manual_failover_path, :watch => true)
+    end
+    # Handles an unavailable node.
+    #
+    # @param [Node] node the unavailable node
+    # @param [Hash<Node, NodeSnapshot>] snapshots the current set of snapshots
+    def handle_unavailable(node, snapshots)
+      # no-op if we already know about this node
+      return if @unavailable.include?(node)
+      logger.info("Handling unavailable node: #{node}")
+      @unavailable << node
+      # find a new master if this node was a master
+      if node == @master
+        logger.info("Demoting currently unavailable master #{node}.")
+        promote_new_master(snapshots)
+      else
+        @slaves.delete(node)
+      end
+    end
+    # Handles an available node.
+    #
+    # @param [Node] node the available node
+    # @param [Hash<Node, NodeSnapshot>] snapshots the current set of snapshots
+    def handle_available(node, snapshots)
+      reconcile(node)
+      # no-op if we already know about this node
+      return if @master == node || (@master && @slaves.include?(node))
+      logger.info("Handling available node: #{node}")
+      if @master
+        # master already exists, make a slave
+        node.make_slave!(@master)
+        @slaves << node
+      else
+        # no master exists, make this the new master
+        promote_new_master(snapshots, node)
+      end
+      @unavailable.delete(node)
+    end
+    # Handles a node that is currently syncing.
+    #
+    # @param [Node] node the syncing node
+    # @param [Hash<Node, NodeSnapshot>] snapshots the current set of snapshots
+    def handle_syncing(node, snapshots)
+      reconcile(node)
+      if node.syncing_with_master? && node.prohibits_stale_reads?
+        logger.info("Node #{node} not ready yet, still syncing with master.")
+        force_unavailable_slave(node)
+      else
+        # otherwise, we can use this node
+        handle_available(node, snapshots)
+      end
+    end
+    # Handles a manual failover request to the given node.
+    #
+    # @param [Node] node the candidate node for failover
+    # @param [Hash<Node, NodeSnapshot>] snapshots the current set of snapshots
+    def handle_manual_failover(node, snapshots)
+      # no-op if node to be failed over is already master
+      return if @master == node
+      logger.info("Handling manual failover")
+      # ensure we can talk to the node
+      node.ping
+      # make current master a slave, and promote new master
+      @slaves << @master if @master
+      @slaves.delete(node)
+      promote_new_master(snapshots, node)
+    end
+    # Promotes a new master.
+    #
+    # The redis nodes znode is deleted and @master cleared before a candidate
+    # is chosen, so when no candidate is found the manager is left without a
+    # master and only an error is logged.
+    #
+    # @param [Hash<Node, NodeSnapshot>] snapshots the current set of snapshots
+    # @param [Node] node the optional node to promote
+    def promote_new_master(snapshots, node = nil)
+      delete_path(redis_nodes_path)
+      @master = nil
+      # make a specific node or selected candidate the new master
+      # (failover_strategy_candidate is defined outside this view)
+      candidate = node || failover_strategy_candidate(snapshots)
+      if candidate.nil?
+        logger.error('Failed to promote a new master, no candidate available.')
+      else
+        @slaves.delete(candidate)
+        @unavailable.delete(candidate)
+        # slaves are pointed at the candidate before it is made master
+        redirect_slaves_to(candidate)
+        candidate.make_master!
+        @master = candidate
+        # publish the new master/slave layout to ZooKeeper
+        write_current_redis_nodes
+        @master_promotion_attempts = 0
+        logger.info("Successfully promoted #{candidate} to master.")
+      end
+    end
+    # Discovers the current master and slave nodes.
+    #
+    # The master is taken from the existing znode config when present,
+    # otherwise guessed from the configured nodes. On any of
+    # NODE_DISCOVERY_ERRORS a warning is logged and discovery is retried
+    # after TIMEOUT seconds, without an upper bound on retries.
+    #
+    # NOTE(review): the code has no explicit true/false return; it returns
+    # nil when the manager is not running and otherwise the value of the
+    # final logger.info call.
+    # @return [Object] see note above
+    def discover_nodes
+      @lock.synchronize do
+        return unless running?
+        @slaves, @unavailable = [], []
+        if @master = find_existing_master
+          logger.info("Using master #{@master} from existing znode config.")
+        elsif @master = guess_master(@nodes)
+          logger.info("Guessed master #{@master} from known redis nodes.")
+        end
+        # every configured node other than the master is treated as a slave
+        @slaves = @nodes - [@master]
+        logger.info("Managing master (#{@master}) and slaves #{stringify_nodes(@slaves)}")
+      end
+    rescue *NODE_DISCOVERY_ERRORS => ex
+      # gsub collapses the heredoc's whitespace runs into single spaces
+      msg = <<-MSG.gsub(/\s+/, ' ')
+        Failed to discover master node: #{ex.inspect}
+        In order to ensure a safe startup, redis_failover requires that all redis
+        nodes be accessible, and only a single node indicating that it's the master.
+        In order to fix this, you can perform a manual failover via redis_failover,
+        or manually fix the individual redis servers. This discovery process will
+        retry in #{TIMEOUT}s.
+      MSG
+      logger.warn(msg)
+      sleep(TIMEOUT)
+      retry
+    end
+    # Seeds the initial node master from an existing znode config.
+    #
+    # @return [Node, nil] the master recorded in the redis nodes znode, or
+    #   nil when the znode is missing, has no data, or records no master
+    # @raise [InvalidNodeRoleError] if the recorded master now reports that
+    #   it is not a master
+    def find_existing_master
+      if data = @zk.get(redis_nodes_path).first
+        nodes = symbolize_keys(decode(data))
+        master = node_from(nodes[:master])
+        logger.info("Master from existing znode config: #{master || 'none'}")
+        # Check for case where a node previously thought to be the master was
+        # somehow manually reconfigured to be a slave outside of the node manager's
+        # control.
+        begin
+          if master && master.slave?
+            raise InvalidNodeRoleError.new(master, :master, :slave)
+          end
+        rescue RedisFailover::NodeUnavailableError => ex
+          # an unreachable master is only warned about and still returned
+          logger.warn("Failed to check whether existing master has invalid role: #{ex.inspect}")
+        end
+        master
+      end
+    rescue ZK::Exceptions::NoNode
+      # blank slate, no last known master
+      nil
+    end
+    # Creates a Node instance from a string.
+    #
+    # @param [String] node_string a string representation of a node (e.g., host:port)
+    # @return [Node] the Node representation
+    def node_from(node_string)
+      return if node_string.nil?
+      host, port = node_string.split(':', 2)
+      Node.new(:host => host, :port => port, :password => @options[:password])
+    end
+    # Spawns the {RedisFailover::NodeWatcher} instances for each managed node.
+    def spawn_watchers
+      @zk.delete(current_state_path, :ignore => :no_node)
+      @monitored_available, @monitored_unavailable = {}, []
+      @watchers = @nodes.map do |node|
+        NodeWatcher.new(self, node, @options.fetch(:max_failures, 3))
+      end
+      @watchers.each(&:watch)
+      logger.info("Monitoring redis nodes at #{stringify_nodes(@nodes)}")
+    end
+    # Searches for the master node.
+    #
+    # @param [Array<Node>] nodes the nodes to search
+    # @return [Node] the found master node, nil if not found
+    def guess_master(nodes)
+      master_nodes = nodes.select { |node| node.master? }
+      raise NoMasterError if master_nodes.empty?
+      raise MultipleMastersError.new(master_nodes) if master_nodes.size > 1
+      master_nodes.first
+    end
+    # Redirects all slaves to the specified node.
+    #
+    # @param [Node] node the node to which slaves are redirected
+    def redirect_slaves_to(node)
+      @slaves.dup.each do |slave|
+        begin
+          slave.make_slave!(node)
+        rescue NodeUnavailableError
+          logger.info("Failed to redirect unreachable slave #{slave} to #{node}")
+          force_unavailable_slave(slave)
+        end
+      end
+    end
+    # Forces a slave to be marked as unavailable.
+    #
+    # @param [Node] node the node to force as unavailable
+    def force_unavailable_slave(node)
+      @slaves.delete(node)
+      @unavailable << node unless @unavailable.include?(node)
+    end
+    # It's possible that a newly available node may have been restarted
+    # and completely lost its dynamically set run-time role by the node
+    # manager. This method ensures that the node resumes its role as
+    # determined by the manager.
+    #
+    # @param [Node] node the node to reconcile
+    def reconcile(node)
+      return if @master == node && node.master?
+      return if @master && node.slave_of?(@master)
+      logger.info("Reconciling node #{node}")
+      if @master == node && !node.master?
+        # we think the node is a master, but the node doesn't
+        node.make_master!
+        return
+      end
+      # verify that node is a slave for the current master
+      if @master && !node.slave_of?(@master)
+        node.make_slave!(@master)
+      end
+    end
+    # @return [Hash] the set of current nodes grouped by category
+    def current_nodes
+      {
+        :master => @master ? @master.to_s : nil,
+        :slaves => @slaves.map(&:to_s),
+        :unavailable => @unavailable.map(&:to_s)
+      }
+    end
+    # @return [Hash] the set of currently available/unavailable nodes as
+    # seen by this node manager instance
+    def node_availability_state
+      {
+        :available => Hash[@monitored_available.map { |k, v| [k.to_s, v] }],
+        :unavailable => @monitored_unavailable.map(&:to_s)
+      }
+    end
+    # Deletes the znode path containing the redis nodes.
+    #
+    # @param [String] path the znode path to delete
+    def delete_path(path)
+      @zk.delete(path)
+      logger.info("Deleted ZK node #{path}")
+    rescue ZK::Exceptions::NoNode => ex
+      logger.info("Tried to delete missing znode: #{ex.inspect}")
+    end
+    # Creates a znode path.
+    #
+    # @param [String] path the znode path to create
+    # @param [Hash] options the options used to create the path
+    # @option options [String] :initial_value an initial value for the znode
+    # @option options [Boolean] :ephemeral true if node is ephemeral, false otherwise
+    def create_path(path, options = {})
+      unless @zk.exists?(path)
+        @zk.create(path,
+          options[:initial_value],
+          :ephemeral => options.fetch(:ephemeral, false))
+        logger.info("Created ZK node #{path}")
+      end
+    rescue ZK::Exceptions::NodeExists
+      # best effort
+    end
+    # Writes state to a particular znode path.
+    #
+    # @param [String] path the znode path that should be written to
+    # @param [String] value the value to write to the znode
+    # @param [Hash] options the default options to be used when creating the node
+    # @note the path will be created if it doesn't exist
+    def write_state(path, value, options = {})
+      create_path(path, options.merge(:initial_value => value))
+      @zk.set(path, value)
+    end
+    # Reacts to a change of the manual failover znode. Errors are logged and
+    # the watch on the znode is always re-armed.
+    #
+    # @param [ZK::Event] event the ZK event to handle
+    def handle_manual_failover_update(event)
+      begin
+        perform_manual_failover if event.node_created? || event.node_changed?
+      rescue => ex
+        logger.error("Error scheduling a manual failover: #{ex.inspect}")
+        logger.error(ex.backtrace.join("\n"))
+      ensure
+        @zk.stat(manual_failover_path, :watch => true)
+      end
+    end
+    # Produces a FQDN id for this Node Manager.
+    #
+    # @return [String] the FQDN for this Node Manager
+    def manager_id
+      @manager_id ||= [
+        Socket.gethostbyname(Socket.gethostname)[0],
+        Process.pid
+      ].join('-')
+    end
+    # Writes the current master list of redis nodes. This method is only invoked
+    # if this node manager instance is the master/primary manager.
+    def write_current_redis_nodes
+      write_state(redis_nodes_path, encode(current_nodes))
+    end
+    # Writes the current monitored list of redis nodes. This method is always
+    # invoked by all running node managers.
+    def write_current_monitored_state
+      write_state(current_state_path, encode(node_availability_state), :ephemeral => true)
+    end
+    # @return [String] root path for current node manager state
+    def current_state_root
+      "#{@root_znode}/manager_node_state"
+    end
+    # @return [String] the znode path for this node manager's view
+    # of available nodes
+    def current_state_path
+      "#{current_state_root}/#{manager_id}"
+    end
+    # @return [String] the znode path for the master redis nodes config
+    def redis_nodes_path
+      "#{@root_znode}/nodes"
+    end
+    # @return [String] root path for current node manager lock
+    def current_lock_path
+      "#{@root_znode}/master_redis_node_manager_lock"
+    end
+    # Delegates to ManualFailover.path with this manager's root znode.
+    #
+    # @return [String] the znode path used for performing manual failovers
+    def manual_failover_path
+      ManualFailover.path(@root_znode)
+    end
+    # Reads the @master_manager flag, which #initialize and #reset set to
+    # false.
+    #
+    # @return [Boolean] true if this node manager is the master, false otherwise
+    def master_manager?
+      @master_manager
+    end
+    # Used to update the master node manager state. These states are only handled if
+    # this node manager instance is serving as the master manager.
+    #
+    # The node strategy decides the node's state from the snapshots; the
+    # matching handler is then invoked. ZK errors propagate to the caller,
+    # every other StandardError is logged and swallowed.
+    #
+    # @param [Node] node the node to handle
+    # @param [Hash<Node, NodeSnapshot>] snapshots the current set of snapshots
+    def update_master_state(node, snapshots)
+      state = @node_strategy.determine_state(node, snapshots)
+      case state
+      when :unavailable
+        handle_unavailable(node, snapshots)
+      when :available
+        if node.syncing_with_master?
+          handle_syncing(node, snapshots)
+        else
+          handle_available(node, snapshots)
+        end
+      else
+        raise InvalidNodeStateError.new(node, state)
+      end
+    rescue *ZK_ERRORS
+      # fail hard if this is a ZK connection-related error
+      raise
+    rescue => ex
+      # state is nil here when determine_state itself raised
+      logger.error("Error handling state report for #{[node, state].inspect}: #{ex.inspect}")
+    end
+    # Updates the current view of the world for this particular node
+    # manager instance. All node managers write this state regardless
+    # of whether they are the master manager or not.
+    #
+    # An :available report is only recorded when the node has no recorded
+    # latency yet, or when the new latency exceeds the recorded one by more
+    # than LATENCY_THRESHOLD. A report without a latency for a node that
+    # already has one recorded leaves the recorded value untouched.
+    #
+    # @param [Node] node the node to handle
+    # @param [Symbol] state the node state
+    # @param [Integer] latency an optional latency
+    # @raise [InvalidNodeStateError] if state is neither :available nor
+    #   :unavailable
+    def update_current_state(node, state, latency = nil)
+      old_unavailable = @monitored_unavailable.dup
+      old_available = @monitored_available.dup
+      case state
+      when :unavailable
+        unless @monitored_unavailable.include?(node)
+          @monitored_unavailable << node
+          @monitored_available.delete(node)
+          write_current_monitored_state
+        end
+      when :available
+        last_latency = @monitored_available[node]
+        # latency is optional: guard against nil before subtracting, so a
+        # latency-less report cannot raise NoMethodError
+        if last_latency.nil? || (latency && (latency - last_latency) > LATENCY_THRESHOLD)
+          @monitored_available[node] = latency
+          @monitored_unavailable.delete(node)
+          write_current_monitored_state
+        end
+      else
+        raise InvalidNodeStateError.new(node, state)
+      end
+    rescue
+      # if an error occurs, make sure that we rollback to the old state
+      @monitored_unavailable = old_unavailable
+      @monitored_available = old_available
+      raise
+    end
+    # Fetches each currently running node manager's view of the
+    # world in terms of which nodes they think are available/unavailable.
+    #
+    # @return [Hash<String, Hash>] a hash of node manager to its decoded state (read via the :available and :unavailable keys)
+    def fetch_node_manager_states
+      states = {}
+      @zk.children(current_state_root).each do |child|
+        full_path = "#{current_state_root}/#{child}"
+        begin
+          states[child] = symbolize_keys(decode(@zk.get(full_path).first))
+        rescue ZK::Exceptions::NoNode
+          # ignore, this is an edge case that can happen when a node manager
+          # process dies while fetching its state
+        rescue => ex
+          logger.error("Failed to fetch states for #{full_path}: #{ex.inspect}")
+        end
+      end
+      states
+    end
+    # Builds current snapshots of nodes across all running node managers.
+    #
+    # @return [Hash<Node, NodeSnapshot>] the snapshots for all nodes
+    def current_node_snapshots
+      nodes = {}
+      snapshots = Hash.new { |h, k| h[k] = NodeSnapshot.new(k) }
+      fetch_node_manager_states.each do |node_manager, states|
+        available, unavailable = states.values_at(:available, :unavailable)
+        available.each do |node_string, latency|
+          node = nodes[node_string] ||= node_from(node_string)
+          snapshots[node].viewable_by(node_manager, latency)
+        end
+        unavailable.each do |node_string|
+          node = nodes[node_string] ||= node_from(node_string)
+          snapshots[node].unviewable_by(node_manager)
+        end
+      end
+      snapshots
+    end
+    # Waits until this node manager becomes the master.
+    def wait_until_master
+      logger.info('Waiting to become master Node Manager ...')
+      with_lock do
+        @master_manager = true
+        logger.info('Acquired master Node Manager lock.')
+        logger.info("Configured node strategy #{@node_strategy.class}")
+        logger.info("Configured failover strategy #{@failover_strategy.class}")
+        logger.info("Required Node Managers to make a decision: #{@required_node_managers}")
+        manage_nodes
+      end
+    end
+    # Manages the redis nodes by periodically processing snapshots.
+    def manage_nodes
+      # Re-discover nodes, since the state of the world may have been changed
+      # by the time we've become the primary node manager.
+      discover_nodes
+      # ensure that slaves are correctly pointing to this master
+      redirect_slaves_to(@master)
+      # Periodically update master config state.
+      while running? && master_manager? # loop ends on shutdown or once this instance stops being master
+        @zk_lock.assert! # NOTE(review): presumably raises if the ZK lock is no longer held -- confirm against the ZK locker API
+        sleep(CHECK_INTERVAL) # pause between passes; happens before @lock is taken
+        @lock.synchronize do
+          snapshots = current_node_snapshots
+          if ensure_sufficient_node_managers(snapshots) # the whole pass is skipped when too few node managers report
+            snapshots.each_key do |node|
+              update_master_state(node, snapshots)
+            end
+            # flush current master state
+            write_current_redis_nodes
+            # check if we've exhausted our attempts to promote a master
+            unless @master
+              @master_promotion_attempts += 1 # the counter is not reset anywhere in this method
+              raise NoMasterError if @master_promotion_attempts > MAX_PROMOTION_ATTEMPTS
+            end
+          end
+        end
+      end
+    end
+    # Creates a Node instance from a string.
+    #
+    # @param [String] node_string a string representation of a node (e.g., host:port)
+    # @return [Node] the Node representation
+    def node_from(node_string)
+      return if node_string.nil?
+      host, port = node_string.split(':', 2)
+      Node.new(:host => host, :port => port, :password => @options[:password])
+    end
+    # Executes a block wrapped in a ZK exclusive lock.
+    def with_lock
+      @zk_lock ||= @zk.locker(current_lock_path) # the locker is created once and reused on later calls
+      begin
+        @zk_lock.lock!(true) # NOTE(review): `true` presumably requests a blocking acquire -- confirm against the ZK locker API
+      rescue Exception
+        # handle shutdown case
+        running? ? raise : return # re-raise while still running, otherwise leave quietly; the ensure below runs either way
+      end
+      if running? # the block is not yielded to once shutdown has been requested
+        @zk_lock.assert! # NOTE(review): presumably raises unless the lock is actually held -- confirm
+        yield
+      end
+    ensure
+      if @zk_lock
+        begin
+          @zk_lock.unlock! # attempted on every exit path, including the early return and re-raise above
+        rescue => ex # a failed release is logged as a warning instead of being raised
+          logger.warn("Failed to release lock: #{ex.inspect}")
+        end
+      end
+    end
+    # Perform a manual failover to a redis node.
+    def perform_manual_failover
+      @lock.synchronize do
+        return unless running? && @master_manager && @zk_lock
+        @zk_lock.assert!
+        new_master = @zk.get(manual_failover_path, :watch => true).first
+        return unless new_master && new_master.size > 0
+        logger.info("Received manual failover request for: #{new_master}")
+        logger.info("Current nodes: #{current_nodes.inspect}")
+        snapshots = current_node_snapshots
+        node = if new_master == ManualFailover::ANY_SLAVE
+          failover_strategy_candidate(snapshots)
+        else
+          node_from(new_master)
+        end
+        if node
+          handle_manual_failover(node, snapshots)
+        else
+          logger.error('Failed to perform manual failover, no candidate found.')
+        end
+      end
+    rescue => ex
+      logger.error("Error handling manual failover: #{ex.inspect}")
+      logger.error(ex.backtrace.join("\n"))
+    ensure
+      @zk.stat(manual_failover_path, :watch => true)
+    end
+    # @return [Boolean] true if running, false otherwise
+    def running?
+      @lock.synchronize { !@shutdown }
+    end
+    # @return [String] a stringified version of redis nodes
+    def stringify_nodes(nodes)
+      "(#{nodes.map(&:to_s).join(', ')})"
+    end
+    # Determines if each snapshot has a sufficient number of node managers.
+    #
+    # @param [Hash<Node, NodeSnapshot>] snapshots the current snapshots
+    # @return [Boolean] true if sufficient, false otherwise
+    def ensure_sufficient_node_managers(snapshots)
+      currently_sufficient = true
+      snapshots.each do |node, snapshot|
+        node_managers = snapshot.node_managers
+        if node_managers.size < @required_node_managers
+          logger.error("Not enough Node Managers in snapshot for node #{node}. " +
+            "Required: #{@required_node_managers}, " +
+            "Available: #{node_managers.size} #{node_managers}")
+          currently_sufficient = false
+        end
+      end
+      if currently_sufficient && !@sufficient_node_managers
+        logger.info("Required Node Managers are visible: #{@required_node_managers}")
+      end
+      @sufficient_node_managers = currently_sufficient
+      @sufficient_node_managers
+    end
+    # Invokes the configured failover strategy.
+    #
+    # @param [Hash<Node, NodeSnapshot>] snapshots the node snapshots
+    # @return [Node] a failover candidate
+    def failover_strategy_candidate(snapshots)
+      # only include nodes that this master Node Manager can see
+      filtered_snapshots = snapshots.select do |node, snapshot|
+        snapshot.viewable_by?(manager_id)
+      end
+      logger.info('Attempting to find candidate from snapshots:')
+      logger.info("\n" + filtered_snapshots.values.join("\n"))
+      @failover_strategy.find_candidate(filtered_snapshots)
+    end
+  end
+end