RubyGems - answer-factory - Versions diffs - 0.0.1 - Mend

answer-factory 0.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (38) hide show

data/LICENSE.txt +21 -0
data/Rakefile +29 -0
data/Thorfile +79 -0
data/VERSION +1 -0
data/_spikes/old_vs_new_dominated_by?.rb +45 -0
data/config/database.yml +9 -0
data/lib/answer-factory.rb +14 -0
data/lib/answers/answer.rb +126 -0
data/lib/answers/batch.rb +49 -0
data/lib/factories/factory.rb +53 -0
data/lib/factories/workstation.rb +33 -0
data/lib/operators/basic_operators.rb +240 -0
data/lib/operators/evaluators.rb +113 -0
data/lib/operators/samplers_and_selectors.rb +131 -0
data/pkg/nudgegp-0.0.1.gem +0 -0
data/readme.md +29 -0
data/spec/answer_spec.rb +412 -0
data/spec/batch_spec.rb +98 -0
data/spec/config_spec.rb +94 -0
data/spec/factories/factory_spec.rb +86 -0
data/spec/factories/workstation_spec.rb +139 -0
data/spec/operators/any_one_sampler_spec.rb +39 -0
data/spec/operators/dominated_quantile_spec.rb +111 -0
data/spec/operators/duplicate_genomes_spec.rb +35 -0
data/spec/operators/evaluators/program_point_evaluator_spec.rb +43 -0
data/spec/operators/evaluators/test_case_evaluator_spec.rb +129 -0
data/spec/operators/infrastructure_spec.rb +45 -0
data/spec/operators/most_dominated_subset_spec.rb +47 -0
data/spec/operators/nondominated_subset_spec.rb +103 -0
data/spec/operators/pointCrossover_spec.rb +60 -0
data/spec/operators/pointDeletion_spec.rb +62 -0
data/spec/operators/pointMutation_spec.rb +77 -0
data/spec/operators/random_guess_spec.rb +77 -0
data/spec/operators/resample_and_clone_spec.rb +60 -0
data/spec/operators/resample_values_spec.rb +135 -0
data/spec/operators/uniformBackboneCrossover_spec.rb +67 -0
data/spec/spec_helper.rb +14 -0
metadata +201 -0

data/lib/operators/basic_operators.rb ADDED

@@ -0,0 +1,240 @@
+#encoding: utf-8
+module NudgeGP
+  # Abstract class that from which specific SearchOperator subclasses inherit initialization
+  class SearchOperator
+    attr_accessor :incoming_options
+     def initialize(options={})
+       @incoming_options = options
+     end
+  end
+  class RandomGuessOperator < SearchOperator
+    # returns an Array of random Answers
+    #
+    # the first (optional) parameter specifies how many to make, and defaults to 1
+    # the second (also optional) parameter is a hash that
+    # can temporarily override those set in the initialization
+    #
+    # For example, if
+    # <tt>myRandomGuesser = RandomGuessOperator.new(:randomIntegerLowerBound => -90000)</tt>
+    #
+    # [<tt>myRandomGuesser.generate()</tt>]
+    #   produces a list of 1 Answer, and if it has any IntType samples they will be in [-90000,100]
+    #   (since the default +:randomIntegerLowerBound+ is 100)
+    # [<tt>myRandomGuesser.generate(1,:randomIntegerLowerBound => 0)</tt>]
+    #   makes one Answer whose IntType samples (if any) will be between [0,100]
+    def generate(howMany = 1, overridden_options ={})
+      result = Batch.new
+      howMany.times do
+        newGenome = CodeType.any_value(@incoming_options.merge(overridden_options))
+        newDude = Answer.new(newGenome, progress:0)
+        result << newDude
+      end
+      result
+    end
+  end
+  class ResampleAndCloneOperator < SearchOperator
+    # returns an Array of clones of Answers randomly selected from the crowd passed in
+    #
+    # the first (required) parameter is an Array of Answers
+    # the second (optional) parameter is how many samples to take, and defaults to 1
+    #
+    # For example, if
+    # <tt>@currentPopulation = [a list of 300 Answers]</tt> and
+    # <tt>myRandomSampler = ResampleAndCloneOperator.new(@currentPopulation)</tt>
+    # [<tt>myRandomSampler.generate()</tt>]
+    #   produces a list of 1 Answer, which is a clone of somebody from <tt>@currentPopulation</tt>
+    # [<tt>myRandomGuesser.generate(11)</tt>]
+    #   returns a list of 11 Answers cloned from <tt>@currentPopulation</tt>,
+    #   possibly including repeats
+    def generate(crowd, howMany = 1)
+      result = Batch.new
+      howMany.times do
+        donor = crowd.sample
+        clone = Answer.new(donor.blueprint, progress:donor.progress + 1)
+        result << clone
+      end
+      return result
+    end
+  end
+  class ResampleValuesOperator < SearchOperator
+    def generate(crowd, howManyCopies = 1, overridden_options = {})
+      crowd.each {|dude| raise(ArgumentError) if !dude.kind_of?(Answer) }
+      result = Batch.new
+      regenerating_options = @incoming_options.merge(overridden_options)
+      crowd.each do |dude|
+        howManyCopies.times do
+          wildtype_program = dude.program
+          starting_footnotes = wildtype_program.footnote_section.split( /^(?=«)/ )
+          breaker = /^«([a-zA-Z][a-zA-Z0-9_]*)»\s*(.*)\s*/m
+          type_value_pairs = starting_footnotes.collect {|fn| fn.match(breaker)[1..2]}
+          mutant_blueprint = wildtype_program.code_section
+          type_value_pairs.each do |pair|
+            begin
+              type_name = pair[0]
+              type_class = "#{type_name}_type".camelize.constantize
+              reduced_size = regenerating_options[:target_size_in_points] || rand(dude.points/2)
+              reduced_option = {target_size_in_points:reduced_size}
+              resampled_value = type_class.any_value(regenerating_options.merge(reduced_option)).to_s
+            rescue NameError
+              resampled_value = pair[1]
+            end
+            mutant_blueprint << "\n«#{pair[0].strip}» #{resampled_value.strip}"
+          end
+          mutant = Answer.new(mutant_blueprint, progress:dude.progress + 1)
+          result << mutant
+        end
+      end
+      return result
+    end
+  end
+  class UniformBackboneCrossoverOperator < SearchOperator
+    # Returns a Batch of new Answers whose programs are made by stitching together
+    # the programs of pairs of 'parents'. The incoming Batch is divided into pairs based on
+    # adjacency (modulo the Batch.length), one pair for each 'offspring' to be made. To make
+    # an offspring, the number of backbone program points is determined in each parent; 'backbone'
+    # refers to the number of branches directly within the root of the program, not the entire tree.
+    #
+    # To construct an offspring's program, program points are copied from the first parent with
+    # probability p, or the second parent with probability (1-p), for each point in the first
+    # parent's backbone. So if there are 13 and 6 points, respectively, the first six points are
+    # selected randomly, but the last 7 are copied from the first parent. If there are 8 and 11
+    # respectively, then the last 3 will be ignored from the second parent in any case.
+    #
+    #   the first (required) parameter is an Array of Answers
+    #   the second (optional) parameter is how many crossovers to make,
+    #     which defaults to the number of Answers in the incoming Batch
+    def generate(crowd, howMany = crowd.length, prob = 0.5)
+      result = Batch.new
+      howMany.times do
+        where = rand(crowd.length)
+        mom = crowd[where]
+        dad = crowd[ (where+1) % crowd.length ]
+        mom_backbone_length = mom.program[1].contents.length
+        dad_backbone_length = dad.program[1].contents.length
+        baby_blueprint_parts = ["",""]
+        (0..mom_backbone_length-1).each do |backbone_point|
+          if rand() < prob
+            next_chunks = mom.program[1].contents[backbone_point].blueprint_parts || ["",""]
+          else
+            if backbone_point < dad_backbone_length
+              next_chunks = (dad.program[1].contents[backbone_point].blueprint_parts || ["", ""])
+            else
+              next_chunks = ["",""]
+            end
+          end
+          baby_blueprint_parts[0] << " #{next_chunks[0]}"
+          baby_blueprint_parts[1] << " \n#{next_chunks[1]}"
+        end
+        mom.program.unused_footnotes.each {|fn| baby_blueprint_parts[1] += "\n#{fn}"}
+        baby_blueprint = "block {#{baby_blueprint_parts[0]}} #{baby_blueprint_parts[1]}"
+        baby = Answer.new(baby_blueprint, progress:[mom.progress,dad.progress].max + 1)
+        result << baby
+      end
+      return result
+    end
+  end
+  class PointCrossoverOperator < SearchOperator
+    def generate(crowd, howManyBabies = 1)
+      raise(ArgumentError) if !crowd.kind_of?(Array)
+      raise(ArgumentError) if crowd.empty?
+      crowd.each {|dude| raise(ArgumentError) if !dude.kind_of?(Answer) }
+      result = Batch.new
+      production = crowd.length*howManyBabies
+      production.times do
+        mom = crowd.sample
+        dad = crowd.sample
+        mom_receives = rand(mom.points) + 1
+        dad_donates = rand(dad.points) + 1
+        baby_blueprint = mom.replace_point_or_clone(mom_receives,dad.program[dad_donates])
+        baby = Answer.new(baby_blueprint,
+          progress:[mom.progress,dad.progress].max + 1)
+        result << baby
+      end
+      return result
+    end
+  end
+  class PointDeleteOperator < SearchOperator
+    def generate(crowd, howManyCopies = 1)
+      raise(ArgumentError) if !crowd.kind_of?(Array)
+      crowd.each {|dude| raise(ArgumentError) if !dude.kind_of?(Answer) }
+      result = Batch.new
+      crowd.each do |dude|
+        howManyCopies.times do
+          where = rand(dude.points)+1
+          variant = dude.delete_point_or_clone(where)
+          baby = Answer.new(variant, progress:dude.progress + 1)
+          result << baby
+        end
+      end
+      return result
+    end
+  end
+  class PointMutationOperator < SearchOperator
+    def generate(crowd, howManyCopies = 1, overridden_options ={})
+      raise(ArgumentError) if !crowd.kind_of?(Array)
+      raise(ArgumentError) if crowd.empty?
+      crowd.each {|dude| raise(ArgumentError) if !dude.kind_of?(Answer) }
+      result = Batch.new
+      crowd.each do |dude|
+        howManyCopies.times do
+          where = rand(dude.points)+1
+          newCode = CodeType.any_value(@incoming_options.merge(overridden_options))
+          variant = dude.replace_point_or_clone(where,newCode)
+          baby = Answer.new(variant, progress:dude.progress + 1)
+          result << baby
+        end
+      end
+      return result
+    end
+  end
+end

data/lib/operators/evaluators.rb ADDED

@@ -0,0 +1,113 @@
+module NudgeGP
+  class Evaluator < SearchOperator
+    attr_accessor :name
+    def initialize(params = {})
+      raise(ArgumentError, "Evaluators must be initialized with names") if params[:name] == nil
+      @name = params[:name]
+    end
+  end
+  class ProgramPointEvaluator < Evaluator
+    def evaluate(batch)
+      raise(ArgumentError, "Can only evaluate a Batch of Answers") if !batch.kind_of?(Batch)
+      batch.each do |i|
+        if i.parses?
+          i.scores[@name] = i.program.points
+        else
+          raise(ArgumentError, "Program is not parseable")
+        end
+      end
+    end
+  end
+  class TestCase
+    attr_accessor :bindings, :expectations, :gauges
+    def initialize(args = {})
+      @bindings = args[:bindings] || Hash.new
+      @expectations = args[:expectations] || Hash.new
+      @gauges = args[:gauges] || Hash.new
+      if (@expectations.keys - @gauges.keys).length > 0
+        raise ArgumentError, "One or more expectations have no defined gauge"
+      end
+    end
+  end
+  class TestCaseEvaluator < Evaluator
+    attr_accessor :interpreter_settings
+    def evaluate(batch, cases = [], params = {})
+      raise(ArgumentError, "Can only evaluate a Batch of Answers") if !batch.kind_of?(Batch)
+      instructions = params[:instructions] || Instruction.all_instructions
+      types = params[:types] || [IntType, BoolType, FloatType]
+      variable_names = params[:references] || []
+      batch.each do |dude|
+        if !params[:deterministic] || !dude.scores[@name]
+          score = 0
+          readings = {}
+          cases.each do |example|
+            difference = 0
+            # make an Interpreter
+            workspace = Interpreter.new("",
+              :instruction_names => instructions,
+              :type_names => types,
+              :references => variable_names)
+            # set up the program
+            workspace.reset(dude.blueprint)
+            # set up the bindings
+            example.bindings.each do |key,value|
+              workspace.bind_variable(key, value)
+            end
+            # run it
+            workspace.run
+            # apply the gauge(s) for each expectation
+            example.gauges.each do |variable_name,the_gauge|
+              readings[variable_name] = the_gauge.call(workspace)
+            end
+            # synthesize readings into a single scalar difference
+            # FIXME this should be a settable Proc
+            example.gauges.each do |variable_name,the_gauge|
+              begin
+                difference = (readings[variable_name].value - example.expectations[variable_name])
+              rescue
+                difference = 100000
+              end
+            end
+            score += difference.abs
+          end
+          # aggregate differences
+          dude.scores[@name] = score.to_f / cases.length
+          puts "#{score.to_f / cases.length}" if params[:feedback]
+        else
+          puts dude.scores[@name] if params[:feedback]
+        end
+      end
+    end
+  end
+end

data/lib/operators/samplers_and_selectors.rb ADDED

@@ -0,0 +1,131 @@
+module NudgeGP
+  class Sampler < SearchOperator
+    def initialize (params = {})
+      super
+    end
+    def all_known_criteria(crowd)
+      union = []
+      crowd.each do |dude|
+        union |= dude.known_criteria
+      end
+      return union
+    end
+    def all_shared_scores(crowd)
+      intersection = self.all_known_criteria(crowd)
+      crowd.each do |dude|
+        intersection = intersection & dude.known_criteria
+      end
+      return intersection
+    end
+    def domination_classes(crowd, template = all_shared_scores(crowd))
+      result = Hash.new()
+      crowd.each_index do |i|
+        dominated_by = 0
+        crowd.each_index do |j|
+          dominated_by += 1 if crowd[i].dominated_by?(crowd[j], template)
+        end
+        result[dominated_by] ||= []
+        result[dominated_by].push crowd[i]
+      end
+      return result
+    end
+    def diversity_classes(crowd)
+      result = Hash.new()
+      crowd.each do |dude|
+        result[dude.program.tidy] ||= []
+        result[dude.program.tidy] << dude
+      end
+      return result
+    end
+  end
+  class NondominatedSubsetSelector < Sampler
+    def generate(crowd, template = all_shared_scores(crowd))
+      result = Batch.new
+      crowd.each do |answer|
+        dominated = false
+        crowd.each do |other_answer|
+          dominated ||= answer.dominated_by?(other_answer, template)
+        end
+        result << answer unless dominated
+      end
+      return result
+    end
+  end
+  class DominatedQuantileSampler < Sampler
+    def generate(crowd, proportion = 0.5, template = all_shared_scores(crowd))
+      classified = domination_classes(crowd, template)
+      increasing_grades = classified.keys.sort {|a,b| b <=> a}
+      partial_ordering = []
+      increasing_grades.each {|grade| partial_ordering += classified[grade]}
+      how_many = (crowd.length * proportion).ceil
+      result = Batch.new
+      partial_ordering[0...how_many].each {|dude| result << dude} unless how_many == 0
+      return result
+    end
+  end
+  class MostDominatedSubsetSampler < Sampler
+    def generate(crowd, template = all_shared_scores(crowd))
+      result = Batch.new
+      classified = domination_classes(crowd, template)
+      worst_key = classified.keys.sort[-1]
+      classified[worst_key].each {|bad_dude| result.push bad_dude}
+      return result
+    end
+  end
+  class AnyOneSampler < Sampler
+    def generate(crowd)
+      result = Batch[crowd.sample]
+    end
+  end
+  class AllDuplicatedGenomesSampler < Sampler
+    def generate(crowd)
+      result = Batch.new
+      clustered = diversity_classes(crowd)
+      clustered.each do |blueprint, array|
+        if array.length > 1
+          result.concat array
+        end
+      end
+      return result
+    end
+  end
+end