cfn_manage 0.7.1 → 0.8.0

@@ -0,0 +1,90 @@
+ module CfnManage
+
+   # set default options here
+   @asg_wait_state = 'HealthyInASG'
+   @ecs_wait_state = 'Skip'
+
+   class << self
+
+     # readers and writers for the options above
+     attr_accessor :asg_wait_state, :ecs_wait_state
+
+     # converts string-based booleans from AWS tag values to booleans
+     def true?(obj)
+       ["true","1"].include? obj.to_s.downcase
+     end
+
+     # find options set on resource tags
+     def find_tags
+       @find_tags = true
+     end
+
+     def find_tags?
+       @find_tags
+     end
+
+     # don't stop or start resources
+     def dry_run
+       @dry_run = true
+     end
+
+     def dry_run?
+       @dry_run
+     end
+
+     # don't wait for resources to become healthy
+     def skip_wait
+       @skip_wait = true
+     end
+
+     def skip_wait?
+       @skip_wait
+     end
+
+     # wait for resources based upon priority groups
+     def wait_async
+       @wait_async = true
+     end
+
+     def wait_async?
+       @wait_async
+     end
+
+     # workaround: ignore a missing ECS service configuration
+     def ignore_missing_ecs_config
+       @ignore_missing_ecs_config = true
+     end
+
+     def ignore_missing_ecs_config?
+       @ignore_missing_ecs_config
+     end
+
+     # disable termination on the ASG when stopping EC2 instances in an ASG
+     def asg_suspend_termination
+       @asg_suspend_termination = true
+     end
+
+     def asg_suspend_termination?
+       @asg_suspend_termination
+     end
+
+     # continue if a resource fails to stop or start
+     def continue_on_error
+       @continue_on_error = true
+     end
+
+     def continue_on_error?
+       @continue_on_error
+     end
+
+     # Wait for container instances to join an ECS cluster
+     def ecs_wait_container_instances
+       @ecs_wait_container_instances = true
+     end
+
+     def ecs_wait_container_instances?
+       @ecs_wait_container_instances
+     end
+
+   end
+ end
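
For context, the flags above are process-wide switches meant to be set once before the start/stop handlers run. A minimal usage sketch, assuming the gem's usual `require 'cfn_manage'` entry point; everything else only uses the methods defined above:

require 'cfn_manage'

CfnManage.asg_wait_state = 'Running'   # override the 'HealthyInASG' default
CfnManage.skip_wait                    # one-way flag: sets @skip_wait = true
CfnManage.dry_run                      # log what would happen without stopping/starting

CfnManage.skip_wait?      # => true
CfnManage.dry_run?        # => true
CfnManage.true?('True')   # => true (tag-value helper)
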
@@ -0,0 +1,45 @@
+ require 'aws-sdk-cloudwatch'
+ require 'cfn_manage/aws_credentials'
+
+ module CfnManage
+   module StartStopHandler
+     class Alarm
+
+       def initialize(alarm_name, options = {})
+         @alarm_id = alarm_name
+         credentials = CfnManage::AWSCredentials.get_session_credentials("startstopalarm_#{@alarm_id}")
+         @cwclient = Aws::CloudWatch::Client.new(retry_limit: 20)
+         if credentials != nil
+           @cwclient = Aws::CloudWatch::Client.new(credentials: credentials, retry_limit: 20)
+         end
+
+         @cwresource = Aws::CloudWatch::Resource.new(client: @cwclient)
+         @alarm = @cwresource.alarm(alarm_name)
+       end
+
+       def start(configuration)
+         if @alarm.actions_enabled
+           $log.info("Alarm #{@alarm.alarm_arn} actions already enabled")
+           return
+         end
+         $log.info("Enabling actions on alarm #{@alarm.alarm_arn}")
+         @alarm.enable_actions({})
+       end
+
+       def stop
+         unless @alarm.actions_enabled
+           $log.info("Alarm #{@alarm.alarm_arn} actions already disabled")
+           return {}
+         end
+         $log.info("Disabling actions on alarm #{@alarm.alarm_arn}")
+         @alarm.disable_actions({})
+         return {}
+       end
+
+       def wait(wait_states=[])
+         $log.debug("Not waiting for alarm #{@alarm_id}")
+       end
+
+     end
+   end
+ end
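
A minimal sketch of driving the alarm handler directly, assuming the class above is loaded, AWS credentials are resolvable, and the caller provides the global `$log` the handlers write to; the alarm name is a placeholder:

require 'logger'

$log = Logger.new(STDOUT)

alarm = CfnManage::StartStopHandler::Alarm.new('prod-high-cpu')
saved = alarm.stop     # disables alarm actions, returns an empty configuration hash
alarm.start(saved)     # re-enables alarm actions
alarm.wait             # no-op for alarms
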
@@ -0,0 +1,311 @@
+ require 'cfn_manage/aws_credentials'
+
+ require 'aws-sdk-autoscaling'
+ require 'aws-sdk-ec2'
+ require 'aws-sdk-elasticloadbalancingv2'
+
+ module CfnManage
+   module StartStopHandler
+     class Asg
+
+       def initialize(asg_id, options = {})
+         @asg_name = asg_id
+         @wait_state = options.has_key?(:wait_state) ? options[:wait_state] : CfnManage.asg_wait_state
+         @skip_wait = options.has_key?(:skip_wait) ? CfnManage.true?(options[:skip_wait]) : CfnManage.skip_wait?
+         @suspend_termination = options.has_key?(:suspend_termination) ? CfnManage.true?(options[:suspend_termination]) : CfnManage.asg_suspend_termination?
+
+         credentials = CfnManage::AWSCredentials.get_session_credentials("stopasg_#{@asg_name}")
+         @asg_client = Aws::AutoScaling::Client.new(retry_limit: 20)
+         @ec2_client = Aws::EC2::Client.new(retry_limit: 20)
+         @elb_client = Aws::ElasticLoadBalancingV2::Client.new(retry_limit: 20)
+         if credentials != nil
+           @asg_client = Aws::AutoScaling::Client.new(credentials: credentials, retry_limit: 20)
+           @ec2_client = Aws::EC2::Client.new(credentials: credentials, retry_limit: 20)
+           @elb_client = Aws::ElasticLoadBalancingV2::Client.new(credentials: credentials, retry_limit: 20)
+         end
+
+         asg_details = @asg_client.describe_auto_scaling_groups(
+           auto_scaling_group_names: [@asg_name]
+         )
+         if asg_details.auto_scaling_groups.size() == 0
+           raise "Couldn't find ASG #{@asg_name}"
+         end
+         @asg = asg_details.auto_scaling_groups[0]
+       end
+
+       def stop
+         # check if already stopped
+         if @asg.min_size == 0 && @asg.max_size == 0 && @asg.desired_capacity == 0
+           $log.info("ASG #{@asg_name} already stopped")
+           # nil and false configurations are not saved
+           return nil
+         else
+
+           unless @suspend_termination
+             # store asg configuration to S3
+             configuration = {
+               desired_capacity: @asg.desired_capacity,
+               min_size: @asg.min_size,
+               max_size: @asg.max_size
+             }
+
+             $log.info("Setting desired capacity to 0/0/0 for ASG #{@asg.auto_scaling_group_name}")
+
+             @asg_client.update_auto_scaling_group({
+               auto_scaling_group_name: @asg.auto_scaling_group_name,
+               min_size: 0,
+               max_size: 0,
+               desired_capacity: 0
+             })
+             return configuration
+           else
+
+             configuration = {
+               desired_capacity: @asg.desired_capacity,
+               min_size: @asg.min_size,
+               max_size: @asg.max_size,
+               suspended_processes: @asg.suspended_processes
+             }
+
+             $log.info("Suspending processes for ASG #{@asg.auto_scaling_group_name}")
+
+             @asg_client.suspend_processes({
+               auto_scaling_group_name: @asg.auto_scaling_group_name,
+             })
+
+             $log.info("Stopping all instances in ASG #{@asg.auto_scaling_group_name}")
+
+             @asg.instances.each do |instance|
+               @instance_id = instance.instance_id
+               @instance = Aws::EC2::Resource.new(client: @ec2_client, retry_limit: 20).instance(@instance_id)
+
+               if %w(stopped stopping).include?(@instance.state.name)
+                 $log.info("Instance #{@instance_id} already stopping or stopped")
+                 next
+               end
+
+               $log.info("Stopping instance #{@instance_id}")
+               @instance.stop()
+             end
+
+             return configuration
+
+           end
+
+         end
+
+       end
+
+       def start(configuration)
+         if configuration.nil?
+           $log.warn("No configuration found for #{@asg_name}, skipping...")
+           return
+         end
+         $log.info("Starting ASG #{@asg_name} with the following configuration\n#{configuration}")
+
+         unless @suspend_termination
+           # restore asg sizes
+           @asg_client.update_auto_scaling_group({
+             auto_scaling_group_name: @asg_name,
+             min_size: configuration['min_size'],
+             max_size: configuration['max_size'],
+             desired_capacity: configuration['desired_capacity']
+           })
+
+         else
+
+           $log.info("Starting instances for ASG #{@asg_name}...")
+
+           @asg.instances.each do |instance|
+             @instance_id = instance.instance_id
+             @instance = Aws::EC2::Resource.new(client: @ec2_client, retry_limit: 20).instance(@instance_id)
+
+             if %w(running).include?(@instance.state.name)
+               $log.info("Instance #{@instance_id} already running")
+               next
+             end
+             $log.info("Starting instance #{@instance_id}")
+             @instance.start()
+           end
+
+         end
+
+         if configuration['desired_capacity'] == 0
+           # if the ASG desired capacity is deliberately set to 0 and we want to wait for other ASGs
+           # in the stack, then we need to skip the wait for this ASG.
+           $log.info("Desired capacity is 0, skipping wait for asg #{@asg_name}")
+         elsif @skip_wait && @suspend_termination
+           # If wait is skipped we still need to wait until the instances are healthy in the asg
+           # before resuming the processes. This will avoid the asg terminating the instances.
+           wait('HealthyInASG')
+         elsif !@skip_wait
+           # if we are waiting for the instances to reach a desired state
+           $log.info("Waiting for ASG instances to reach wait state #{@wait_state}")
+           wait(@wait_state)
+         end
+
+         if @suspend_termination
+           # resume the asg processes after we've waited for them to become healthy
+           $log.info("Resuming all processes for ASG #{@asg_name}")
+
+           @asg_client.resume_processes({
+             auto_scaling_group_name: @asg.auto_scaling_group_name,
+           })
+
+           if configuration.key?('suspended_processes')
+
+             $log.info("Suspending processes stored in configuration for ASG #{@asg_name}")
+
+             @asg_client.suspend_processes({
+               auto_scaling_group_name: @asg.auto_scaling_group_name,
+               scaling_processes: configuration['suspended_processes'],
+             })
+           end
+
+         end
+
+       end
+
+       def wait(type)
+
+         attempts = 0
+
+         until attempts == (max_attempts = 60 * 6)
+
+           case type
+           when 'HealthyInASG'
+             success = wait_till_healthy_in_asg()
+           when 'Running'
+             success = wait_till_running()
+           when 'HealthyInTargetGroup'
+             success = wait_till_healthy_in_target_group()
+           else
+             $log.warn("Unknown ASG wait type #{type}. Skipping...")
+             break
+           end
+
+           if success
+             break
+           end
+
+           attempts = attempts + 1
+           sleep(15)
+         end
+
+         if attempts == max_attempts
+           $log.error("Failed to wait for asg with wait type #{type}")
+         end
+       end
+
+       def wait_till_healthy_in_asg
+
+         asg_curr_details = @asg_client.describe_auto_scaling_groups(
+           auto_scaling_group_names: [@asg_name]
+         )
+
+         asg_status = asg_curr_details.auto_scaling_groups.first
+         health_status = asg_status.instances.collect { |inst| inst.health_status }
+         $log.info("ASG #{@asg_name} health status is currently #{health_status}")
+
+         if health_status.empty?
+           $log.info("ASG #{@asg_name} has not started any instances yet")
+           return false
+         end
+
+         if health_status.all? { |status| status == "Healthy" }
+           $log.info("All instances healthy in ASG #{@asg_name}")
+           return true
+         end
+
+         unhealthy = asg_status.instances.select {|inst| inst.health_status == "Unhealthy" }.collect {|inst| inst.instance_id }
+         $log.info("waiting for instances #{unhealthy} to become healthy in asg #{@asg_name}")
+         return false
+
+       end
+
+       def wait_till_running
+
+         asg_curr_details = @asg_client.describe_auto_scaling_groups(
+           auto_scaling_group_names: [@asg_name]
+         )
+         asg_status = asg_curr_details.auto_scaling_groups.first
+         instances = asg_status.instances.collect { |inst| inst.instance_id }
+
+         if instances.empty?
+           $log.info("ASG #{@asg_name} has not started any instances yet")
+           return false
+         end
+
+         status = @ec2_client.describe_instance_status({
+           instance_ids: instances
+         })
+
+         state = status.instance_statuses.collect {|inst| inst.instance_state.name}
+
+         if state.all? { |s| s == "running" }
+           $log.info("All instances in ASG #{@asg_name} are in a running state")
+           return true
+         end
+
+         not_running = status.instance_statuses.select {|inst| inst.instance_state.name != "running" }
+         not_running.each do |inst|
+           $log.info("waiting for instance #{inst.instance_id} to be running. Current state is #{inst.instance_state.name}")
+         end
+
+         return false
+
+       end
+
+       def wait_till_healthy_in_target_group
+
+         asg_curr_details = @asg_client.describe_auto_scaling_groups(
+           auto_scaling_group_names: [@asg_name]
+         )
+         asg_status = asg_curr_details.auto_scaling_groups.first
+         asg_instances = asg_status.instances.collect { |inst| inst.instance_id }
+         target_groups = asg_status.target_group_arns
+
+         if asg_instances.empty?
+           $log.info("ASG #{@asg_name} has not started any instances yet")
+           return false
+         end
+
+         if target_groups.empty?
+           # we want to skip here if the asg is not associated with any target groups
+           $log.info("ASG #{@asg_name} is not associated with any target groups")
+           return true
+         end
+
+         target_health = []
+         target_groups.each do |tg|
+           resp = @elb_client.describe_target_health({
+             target_group_arn: tg,
+           })
+           if resp.target_health_descriptions.length != asg_instances.length
+             # we need to wait until all asg instances have been placed into the target group
+             # before we can check they're healthy
+             $log.info("Not all ASG instances have been placed into target group #{tg.split('/')[1]} yet")
+             return false
+           end
+           target_health.push(*resp.target_health_descriptions)
+         end
+
+         state = target_health.collect {|tg| tg.target_health.state}
+
+         if state.all? { |s| s == 'healthy' }
+           $log.info("All instances are in a healthy state in target groups #{target_groups.map {|tg| tg.split('/')[1] }}")
+           return true
+         end
+
+         unhealthy = target_health.select {|tg| tg.target_health.state != 'healthy'}
+         unhealthy.each do |tg|
+           $log.info("waiting for instance #{tg.target.id} to be healthy in target group. Current state is #{tg.target_health.state}")
+         end
+
+         return false
+
+       end
+
+     end
+   end
+ end
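
The stop/start contract above: `stop` returns a sizes hash that the caller is expected to persist (the code's own comment says it is stored in S3, which is why `start` reads string keys), and `start` restores the group and then waits according to the configured wait state. A hedged sketch, with a JSON round trip standing in for the real S3 persistence and a placeholder ASG name:

require 'json'
require 'logger'

$log = Logger.new(STDOUT)   # the handlers write to a global $log provided by the caller

# 'app-asg' is a placeholder; 'HealthyInTargetGroup' is one of the wait types handled in wait()
asg = CfnManage::StartStopHandler::Asg.new('app-asg', wait_state: 'HealthyInTargetGroup')

config = asg.stop                                        # e.g. { desired_capacity: 2, min_size: 1, max_size: 2 }, or nil if already stopped
stored = JSON.parse(config.to_json) unless config.nil?   # mimic the S3 save/load, which stringifies the keys

asg.start(stored)   # restores the sizes, then polls every 15s until targets are healthy (up to 360 attempts)
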
@@ -0,0 +1,97 @@
+ require 'aws-sdk-rds'
+ require 'cfn_manage/aws_credentials'
+
+ module CfnManage
+   module StartStopHandler
+     class AuroraCluster
+
+       def initialize(cluster_id, options = {})
+         @cluster_id = cluster_id
+         credentials = CfnManage::AWSCredentials.get_session_credentials("startstopcluster_#{cluster_id}")
+         @rds_client = Aws::RDS::Client.new(retry_limit: 20)
+         if credentials != nil
+           @rds_client = Aws::RDS::Client.new(credentials: credentials, retry_limit: 20)
+         end
+         rds = Aws::RDS::Resource.new(client: @rds_client)
+         @rds_cluster = rds.db_cluster(cluster_id)
+       end
+
+       def start(configuration)
+         if @rds_cluster.status == 'available'
+           $log.info("Aurora Cluster #{@cluster_id} is already in an available state")
+           return
+         end
+
+         if @rds_cluster.engine_mode != 'provisioned'
+           $log.info("Aurora Cluster #{@cluster_id} is not a provisioned cluster and cannot be started using this method.")
+           return
+         end
+
+         # start rds cluster
+         if @rds_cluster.status == 'stopped'
+           $log.info("Starting Aurora cluster #{@cluster_id}")
+           @rds_client.start_db_cluster({ db_cluster_identifier: @cluster_id })
+           unless CfnManage.skip_wait?
+             # wait for the cluster to become available
+             $log.info("Waiting for Aurora cluster #{@cluster_id} to become available")
+             wait('available')
+           end
+         else
+           $log.info("Aurora Cluster #{@cluster_id} is not in a stopped state. State: #{@rds_cluster.status}")
+         end
+       end
+
+       def stop
+         if @rds_cluster.status == 'stopped'
+           $log.info("Aurora Cluster #{@cluster_id} is already stopped")
+           return {}
+         end
+
+         if @rds_cluster.status != 'available'
+           $log.info("Aurora Cluster #{@cluster_id} is not in an available state. State: #{@rds_cluster.status}")
+           return {}
+         end
+
+         if @rds_cluster.engine_mode != 'provisioned'
+           $log.info("Aurora Cluster #{@cluster_id} is not a provisioned cluster and cannot be stopped using this method.")
+           return {}
+         end
+         # stop rds cluster and wait for it to be fully stopped
+         $log.info("Stopping Aurora cluster #{@cluster_id}")
+         @rds_client.stop_db_cluster({ db_cluster_identifier: @cluster_id })
+         unless CfnManage.skip_wait?
+           $log.info("Waiting for Aurora cluster #{@cluster_id} to be stopped")
+           wait('stopped')
+         end
+         return {}
+       end
+
+       def wait(completed_state)
+         # the reached state must hold steady for at least a minute
+         state_count = 0
+         steady_count = 4
+         attempts = 0
+         rds = Aws::RDS::Resource.new(client: @rds_client)
+         until attempts == (max_attempts = 60 * 6)
+           cluster = rds.db_cluster(@cluster_id)
+           $log.info("Aurora Cluster #{cluster.db_cluster_identifier} state: #{cluster.status}, waiting for #{completed_state}")
+
+           if cluster.status == completed_state
+             state_count = state_count + 1
+             $log.info("#{state_count}/#{steady_count}")
+           else
+             state_count = 0
+           end
+           break if state_count == steady_count
+           attempts = attempts + 1
+           sleep(15)
+         end
+
+         if attempts == max_attempts
+           $log.error("RDS Aurora Cluster #{@cluster_id} did not enter the #{completed_state} state, however continuing operations...")
+         end
+       end
+
+     end
+   end
+ end
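
The Aurora handler only acts on provisioned clusters and polls every 15 seconds until the cluster has held the target state for four consecutive checks (roughly a minute). A minimal sketch of driving it, assuming the class above is loaded and using a placeholder cluster identifier:

require 'logger'

$log = Logger.new(STDOUT)

# optional: skip the polling loop entirely
# CfnManage.skip_wait

cluster = CfnManage::StartStopHandler::AuroraCluster.new('app-aurora-cluster')
cluster.stop        # calls stop_db_cluster and waits until 'stopped' holds steady, returns {}
cluster.start({})   # calls start_db_cluster only when the cluster is currently 'stopped'
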