RubyGems - sisfc - Versions diffs - 0.1.0 → 0.2.0 - Mend

sisfc 0.1.0 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (38) hide show

checksums.yaml +5 -5
data/.projections.json +12 -0
data/.travis.yml +6 -0
data/README.md +37 -19
data/Rakefile +4 -2
data/TODO +5 -0
data/bin/sisfc +29 -6
data/examples/generator.R +3 -1
data/examples/simulator.conf +80 -29
data/lib/sisfc.rb +4 -4
data/lib/sisfc/configuration.rb +73 -6
data/lib/sisfc/data_center.rb +42 -29
data/lib/sisfc/evaluation.rb +23 -15
data/lib/sisfc/event.rb +9 -6
data/lib/sisfc/generator.rb +14 -21
data/lib/sisfc/latency_manager.rb +65 -0
data/lib/sisfc/logger.rb +28 -0
data/lib/sisfc/request.rb +42 -85
data/lib/sisfc/service_type.rb +2 -0
data/lib/sisfc/simulation.rb +234 -47
data/lib/sisfc/sorted_array.rb +2 -0
data/lib/sisfc/statistics.rb +37 -3
data/lib/sisfc/support/dsl_helper.rb +2 -0
data/lib/sisfc/version.rb +3 -1
data/lib/sisfc/vm.rb +46 -27
data/sisfc.gemspec +9 -5
data/spec/minitest_helper.rb +9 -0
data/{test/sisfc/configuration_test.rb → spec/sisfc/configuration_spec.rb} +4 -2
data/spec/sisfc/data_center_spec.rb +19 -0
data/{test/sisfc/evaluation_test.rb → spec/sisfc/evaluation_spec.rb} +5 -3
data/{test/sisfc/generator_test.rb → spec/sisfc/generator_spec.rb} +21 -18
data/spec/sisfc/latency_manager_spec.rb +13 -0
data/spec/sisfc/reference_configuration.rb +534 -0
data/spec/sisfc/request_spec.rb +19 -0
metadata +115 -49
data/test/sisfc/reference_configuration.rb +0 -191
data/test/sisfc/request_test.rb +0 -13
data/test/test_helper.rb +0 -4

data/lib/sisfc/service_type.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 require 'erv'
 module SISFC

data/lib/sisfc/simulation.rb CHANGED Viewed

@@ -1,9 +1,12 @@
-require 'sisfc/data_center'
-require 'sisfc/event'
-require 'sisfc/generator'
-require 'sisfc/sorted_array'
-require 'sisfc/statistics'
-require 'sisfc/vm'
+# frozen_string_literal: true
+require_relative './data_center'
+require_relative './event'
+require_relative './generator'
+require_relative './sorted_array'
+require_relative './statistics'
+require_relative './vm'
+require_relative './latency_manager'
 module SISFC
@@ -15,6 +18,9 @@ module SISFC
     def initialize(opts = {})
       @configuration = opts[:configuration]
       @evaluator     = opts[:evaluator]
+      # create latency manager
+      @latency_manager = LatencyManager.new(@configuration.latency_models)
     end
@@ -33,28 +39,63 @@ module SISFC
       # setup simulation start and current time
       @current_time = @start_time = @configuration.start_time
-      # create data centers
-      data_centers = @configuration.data_centers.map {|k,v| DataCenter.new(k,v) }
+      # create data centers and store them in a repository
+      data_center_repository = Hash[
+        @configuration.data_centers.map do |k,v|
+          [ k, DataCenter.new(id: k, **v) ]
+        end
+      ]
+      customer_repository = @configuration.customers
+      workflow_type_repository = @configuration.workflow_types
       # initialize statistics
-      stats    = Statistics.new
-      dc_stats = data_centers.map {|k,v| Statistics.new }
+      stats = Statistics.new
+      per_workflow_and_customer_stats = Hash[
+        workflow_type_repository.keys.map do |wft_id|
+          [
+            wft_id,
+            Hash[
+              customer_repository.keys.map do |c_id|
+                [ c_id, Statistics.new(@configuration.custom_stats.find{|x| x[:customer_id] == c_id && x[:workflow_type_id] == wft_id } || {}) ]
+              end
+            ]
+          ]
+        end
+      ]
+      reqs_received_per_workflow_and_customer = Hash[
+        workflow_type_repository.keys.map do |wft_id|
+          [ wft_id, Hash[customer_repository.keys.map {|c_id| [ c_id, 0 ]}] ]
+        end
+      ]
       # create VMs
       @vms = []
       vmid = 0
       vm_allocation.each do |opts|
         # setup service_time_distribution
-        opts[:service_time_distribution] = @configuration.service_component_types[opts[:component_type]][:service_time_distribution]
+        stdist = @configuration.service_component_types[opts[:component_type]][:service_time_distribution]
         # allocate the VMs
         opts[:vm_num].times do
           # create VM ...
-          vm = VM.new(vmid, opts) # vm = VM.new(vmid, opts.except(:vm_num))
+          # if [ "Financial Transaction Server", "RDBMS C", "Queue Manager" ].include? opts[:component_type]
+          #   vm = VM.new(vmid, opts[:dc_id], opts[:vm_size], stdist, trace: true, notes: "ct #{opts[:component_type]}")
+          # else
+          #   vm = VM.new(vmid, opts[:dc_id], opts[:vm_size], stdist)
+          # end
+          vm = VM.new(vmid, opts[:dc_id], opts[:vm_size], stdist)
           # ... add it to the vm list ...
           @vms << vm
           # ... and register it in the corresponding data center
-          data_centers[opts[:dc_id]-1].add_vm(vm, opts[:component_type])
+          unless data_center_repository[opts[:dc_id]].add_vm(vm, opts[:component_type])
+            $stderr.puts "====== Unfeasible allocation at data center #{dc_id} ======"
+            $stderr.flush
+            # Here we return Float::MAX instead of, e.g., Float::INFINITY,
+            # because the latter would break optimization tools. Instead, we
+            # want a very high but still comparable value.
+            return Float::MAX
+          end
           # update vm id
           vmid += 1
         end
@@ -67,8 +108,8 @@ module SISFC
       # generate first request
       rg = RequestGenerator.new(@configuration.request_generation)
-      new_req = rg.generate
-      new_event(Event::ET_REQUEST_ARRIVAL, new_req, new_req.arrival_time, nil)
+      req_attrs = rg.generate
+      new_event(Event::ET_REQUEST_GENERATION, req_attrs, req_attrs[:generation_time], nil)
       # schedule end of simulation
       unless @configuration.end_time.nil?
@@ -80,54 +121,115 @@ module SISFC
       warmup_threshold = @configuration.start_time + @configuration.warmup_duration.to_i
       requests_being_worked_on = 0
-      events = 0
+      requests_forwarded_to_other_dcs = 0
+      current_event = 0
       # launch simulation
       until @event_queue.empty?
         e = @event_queue.shift
-        events += 1
+        current_event += 1
         # sanity check on simulation time flow
         if @current_time > e.time
-          raise "Error: simulation time inconsistency for event #{events} " +
+          raise "Error: simulation time inconsistency for event #{current_event} " +
                 "e.type=#{e.type} @current_time=#{@current_time}, e.time=#{e.time}"
         end
         @current_time = e.time
         case e.type
+          when Event::ET_REQUEST_GENERATION
+            req_attrs = e.data
+            # find closest data center
+            customer_location_id = customer_repository.dig(req_attrs[:customer_id], :location_id)
+            dc_at_customer_location = data_center_repository.values.find {|dc| dc.location_id == customer_location_id }
+            raise "No data center found at location id #{customer_location_id}!" unless dc_at_customer_location
+            # find first component name for requested workflow
+            workflow = workflow_type_repository[req_attrs[:workflow_type_id]]
+            first_component_name = workflow[:component_sequence][0][:name]
+            closest_dc = if dc_at_customer_location.has_vms_of_type?(first_component_name)
+              dc_at_customer_location
+            else
+              data_center_repository.values.select{|dc| dc.has_vms_of_type?(first_component_name) }&.sample
+            end
+            raise "Invalid configuration! No VMs of type #{first_component_name} found!" unless closest_dc
+            arrival_time = @current_time + @latency_manager.sample_latency_between(customer_location_id, closest_dc.location_id)
+            new_req = Request.new(req_attrs.merge!(initial_data_center_id: closest_dc.dcid,
+                                                   arrival_time: arrival_time))
+            # schedule arrival of current request
+            new_event(Event::ET_REQUEST_ARRIVAL, new_req, arrival_time, nil)
+            # schedule generation of next request
+            req_attrs = rg.generate
+            new_event(Event::ET_REQUEST_GENERATION, req_attrs, req_attrs[:generation_time], nil)
           when Event::ET_REQUEST_ARRIVAL
             # get request
             req = e.data
             # find data center
-            data_center = data_centers[req.data_center_id-1]
+            data_center = data_center_repository[req.data_center_id]
+            # update reqs_received_per_workflow_and_customer
+            reqs_received_per_workflow_and_customer[req.workflow_type_id][req.customer_id] += 1
             # find next component name
-            workflow = @configuration.workflow_types[req.workflow_type_id]
+            workflow = workflow_type_repository[req.workflow_type_id]
             next_component_name = workflow[:component_sequence][req.next_step][:name]
+            # if [5,6,9].include? req.workflow_type_id
+            #   $stderr.puts "received request for wf #{req.workflow_type_id} at dc #{req.data_center_id}"
+            #   $stderr.puts "next component name is #{next_component_name}"
+            #   $stderr.flush
+            # end
             # get random vm providing next service component type
             vm = data_center.get_random_vm(next_component_name)
+            # if [5,6,9].include? req.workflow_type_id
+            #   $stderr.puts "next vm is #{vm.__id__}"
+            #   $stderr.flush
+            # end
-            # forward request to the vm
-            vm.new_request(self, req, e.time)
+            # schedule request forwarding to vm
+            new_event(Event::ET_REQUEST_FORWARDING, req, e.time, vm)
             # update stats
             if req.arrival_time > warmup_threshold
               # increase the number of requests being worked on
               requests_being_worked_on += 1
-            end
-            # generate next request
-            new_req = rg.generate
-            new_event(Event::ET_REQUEST_ARRIVAL, new_req, new_req.arrival_time, nil)
+              # increase count of received requests
+              stats.request_received
+              # increase count of received requests in per_workflow_and_customer_stats
+              per_workflow_and_customer_stats[req.workflow_type_id][req.customer_id].request_received
+              # if stats.received % 10_000 == 0
+              #   $stderr.puts "#{Thread.current.__id__} sisfc: Received #{stats.received} requests."
+              #   $stderr.puts "#{Thread.current.__id__} sisfc: Working on #{requests_being_worked_on} requests."
+              #   $stderr.flush
+              # end
+            end
           # Leave these events for when we add VM migration support
           # when Event::ET_VM_SUSPEND
           # when Event::ET_VM_RESUME
+          when Event::ET_REQUEST_FORWARDING
+            # get request
+            req  = e.data
+            time = e.time
+            vm   = e.destination
+            vm.new_request(self, req, time)
           when Event::ET_WORKFLOW_STEP_COMPLETED
             # retrieve request and vm
@@ -138,22 +240,103 @@ module SISFC
             vm.request_finished(self, e.time)
             # find data center and workflow
-            data_center = data_centers[req.data_center_id-1]
-            workflow    = @configuration.workflow_types[req.workflow_type_id]
+            data_center = data_center_repository[req.data_center_id]
+            workflow    = workflow_type_repository[req.workflow_type_id]
             # check if there are other steps left to complete the workflow
             if req.next_step < workflow[:component_sequence].size
               # find next component name
               next_component_name = workflow[:component_sequence][req.next_step][:name]
-              # get random vm providing next service component type
+              # get random VM providing next service component type
               new_vm = data_center.get_random_vm(next_component_name)
-              # forward request to the new vm
-              new_vm.new_request(self, req, e.time)
+              # this is the request's time of arrival at the new VM
+              forwarding_time = e.time
+              # there might not be a VM of the type we need in the current data
+              # center, so look in the other data centers
+              unless new_vm
+                # get list of other data centers, randomly picked
+                other_dcs = data_center_repository.values.select{|x| x != data_center && x.has_vms_of_type?(next_component_name) }&.shuffle
+                other_dcs.each do |dc|
+                  new_vm = dc.get_random_vm(next_component_name)
+                  if new_vm
+                    # need to update data_center_id of request
+                    req.data_center_id = dc.dcid
+                    # keep track of transmission time
+                    transmission_time =
+                      @latency_manager.sample_latency_between(data_center.location_id,
+                                                              dc.location_id)
+                    unless transmission_time >= 0.0
+                      raise "Negative transmission time (#{transmission_time})!"
+                    end
+                    # if [5,6,9].include? req.workflow_type_id
+                    #   $stderr.puts "rerouting request for wf #{req.workflow_type_id} from dc #{data_center.dcid} to dc #{dc.dcid}"
+                    #   $stderr.puts "next component name is #{next_component_name}"
+                    #   $stderr.puts "transmission time is #{transmission_time}"
+                    #   $stderr.flush
+                    # end
+                    req.update_transfer_time(transmission_time)
+                    forwarding_time += transmission_time
+                    # update request's current data_center_id
+                    req.data_center_id = dc.dcid
+                    # keep track of number of requests forwarded to other data centers
+                    requests_forwarded_to_other_dcs += 1
+                    # we're done here
+                    break
+                  end
+                end
+              end
+              # make sure we actually found a VM
+              raise "Cannot find VM running a component of type " +
+                    "#{next_component_name} in any data center!" unless new_vm
+              # if [5,6,9].include? req.workflow_type_id
+              #   $stderr.puts "received request for wf #{req.workflow_type_id} at dc #{req.data_center_id}"
+              #   $stderr.puts "next component name is #{next_component_name}"
+              #   $stderr.puts "next vm is #{new_vm.__id__}"
+              #   $stderr.flush
+              # end
+              # schedule request forwarding to vm
+              new_event(Event::ET_REQUEST_FORWARDING, req, forwarding_time, new_vm)
             else # workflow is finished
+              # calculate transmission time
+              transmission_time =
+                @latency_manager.sample_latency_between(
+                  # data center location
+                  data_center_repository[req.data_center_id].location_id,
+                  # customer location
+                  customer_repository.dig(req.customer_id, :location_id)
+                )
+              # if [5,6,9].include? req.workflow_type_id
+              #   $stderr.puts "closing request for wf #{req.workflow_type_id}"
+              #   $stderr.puts "e.time is #{e.time}"
+              #   $stderr.puts "transmission_time is #{transmission_time}"
+              #   $stderr.flush
+              # end
+              unless transmission_time >= 0.0
+                raise "Negative transmission time (#{transmission_time})!"
+              end
+              # keep track of transmission time
+              req.update_transfer_time(transmission_time)
               # schedule request closure
-              new_event(Event::ET_REQUEST_CLOSURE, req, e.time + req.communication_latency, nil)
+              new_event(Event::ET_REQUEST_CLOSURE, req, e.time + transmission_time, nil)
             end
@@ -171,7 +354,9 @@ module SISFC
               # collect request statistics
               stats.record_request(req)
-              dc_stats[req.data_center_id - 1].record_request(req)
+              # collect request statistics in per_workflow_and_customer_stats
+              per_workflow_and_customer_stats[req.workflow_type_id][req.customer_id].record_request(req)
             end
@@ -184,22 +369,24 @@ module SISFC
       # puts "========== Simulation Finished =========="
-      # calculate kpis (for the moment, we only have mttr)
-      kpis = { :mttr            => stats.mean,
-               :served_requests => stats.n,
-               :queued_requests => requests_being_worked_on }
-      dc_kpis = dc_stats.map do |s|
-        { :mttr            => s.mean,
-          :served_requests => s.n, }
-      end
-      fitness = @evaluator.evaluate_business_impact(kpis, dc_kpis, vm_allocation)
+      costs = @evaluator.evaluate_business_impact(stats, per_workflow_and_customer_stats,
+                                                  vm_allocation)
       puts "====== Evaluating new allocation ======\n" +
-        vm_allocation.map{|x| x.except(:service_time_distribution) }.inspect + "\n" +
-        "kpis: #{kpis.to_s}\n" +
-        "dc_kpis: #{dc_kpis.to_s}\n" +
-        "=======================================\n"
-      fitness
+           "costs: #{costs}\n" +
+           "vm_allocation: #{vm_allocation.inspect}\n" +
+           "stats: #{stats.to_s}\n" +
+           "per_workflow_and_customer_stats: #{per_workflow_and_customer_stats.to_s}\n" +
+           "=======================================\n"
+      # we want to minimize the cost, so we define fitness as the negated
+      # sum of all costs incurred
+      fitness = - costs.values.inject(0.0){|s,x| s += x }
     end
+    private
+      def communication_latency_between(loc1, loc2)
+        @latency_manager.sample_latency_between(loc1.to_i, loc2.to_i)
+      end
   end
 end

data/lib/sisfc/sorted_array.rb CHANGED Viewed

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 module SISFC
   # the SortedArray class was taken from the ruby cookbook
   class SortedArray < Array

data/lib/sisfc/statistics.rb CHANGED Viewed

@@ -1,19 +1,35 @@
-require 'sisfc/request'
+# frozen_string_literal: true
+require_relative './request'
 module SISFC
   class Statistics
-    attr_reader :mean, :n
+    attr_reader :mean, :n, :received, :longer_than
+    alias_method :closed, :n
     # see http://en.wikipedia.org/wiki/Algorithms_for_calculating_variance#Online_algorithm
-    def initialize
+    # and https://www.johndcook.com/blog/standard_deviation/
+    def initialize(opts={})
       @n    = 0 # number of requests
       @mean = 0.0
       @m_2  = 0.0
+      @longer_than = init_counters_for_longer_than_stats(opts)
+      @received = 0
+    end
+    def request_received
+      @received += 1
     end
     def record_request(req)
       # get new sample
       x = req.ttr
+      raise "TTR #{x} for request #{req.rid} invalid!" unless x > 0.0
+      @longer_than.each_key do |k|
+        @longer_than[k] += 1 if x > k
+      end
       # update counters
       @n += 1
@@ -25,5 +41,23 @@ module SISFC
     # Returns the sample variance of the recorded values: @m_2 divided by
     # one less than the number of recorded requests (@n).
     # Presumably @m_2 is the running sum of squared deviations maintained by
     # the online algorithm referenced in this class; the update step is not
     # visible here, so verify against record_request.
     # NOTE(review): there is no guard for @n < 2, so the divisor is zero when
     # @n == 1 and negative when @n == 0 -- confirm callers tolerate that.
     def variance
       degrees_of_freedom = @n - 1
       @m_2 / degrees_of_freedom
     end
+    def to_s
+      "received: #{@received}, closed: #{@n}, " +
+      "(mean: #{@mean}, variance: #{variance}, longer_than: #{@longer_than.to_s})"
+    end
+    private
+      def init_counters_for_longer_than_stats(custom_kpis_config)
+        # prepare an infinite length enumerator that always returns zero
+        zeros = Enumerator.new(){|x| loop do x << 0 end }
+        Hash[
+          # wrap the values in custom_kpis_config[:longer_than] in an array
+          Array(custom_kpis_config[:longer_than]).
+            # and interleave the numbers contained in that array with zeroes
+            zip(zeros) ]
+      end
   end
 end