RubyGems - stamina - Versions diffs - 0.4.0 → 0.5.0 - Mend

stamina 0.4.0 → 0.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (116) hide show

data/CHANGELOG.md +22 -5
data/LICENCE.md +2 -2
data/bin/stamina +1 -7
data/lib/stamina.rb +10 -19
metadata +54 -333
data/.gemtest +0 -0
data/Gemfile +0 -2
data/Gemfile.lock +0 -37
data/Manifest.txt +0 -16
data/README.md +0 -78
data/Rakefile +0 -23
data/example/adl/automaton.adl +0 -49
data/example/adl/sample.adl +0 -53
data/example/basic/characteristic_sample.adl +0 -32
data/example/basic/target.adl +0 -9
data/example/competition/31_test.adl +0 -1500
data/example/competition/31_training.adl +0 -1759
data/lib/stamina/abbadingo.rb +0 -2
data/lib/stamina/abbadingo/random_dfa.rb +0 -48
data/lib/stamina/abbadingo/random_sample.rb +0 -146
data/lib/stamina/adl.rb +0 -298
data/lib/stamina/automaton.rb +0 -1263
data/lib/stamina/automaton/complete.rb +0 -36
data/lib/stamina/automaton/equivalence.rb +0 -55
data/lib/stamina/automaton/metrics.rb +0 -78
data/lib/stamina/automaton/minimize.rb +0 -25
data/lib/stamina/automaton/minimize/hopcroft.rb +0 -116
data/lib/stamina/automaton/minimize/pitchies.rb +0 -64
data/lib/stamina/automaton/strip.rb +0 -16
data/lib/stamina/automaton/walking.rb +0 -363
data/lib/stamina/classifier.rb +0 -52
data/lib/stamina/command.rb +0 -45
data/lib/stamina/command/abbadingo_dfa.rb +0 -81
data/lib/stamina/command/abbadingo_samples.rb +0 -40
data/lib/stamina/command/adl2dot.rb +0 -71
data/lib/stamina/command/classify.rb +0 -48
data/lib/stamina/command/help.rb +0 -27
data/lib/stamina/command/infer.rb +0 -141
data/lib/stamina/command/metrics.rb +0 -51
data/lib/stamina/command/robustness.rb +0 -22
data/lib/stamina/command/score.rb +0 -35
data/lib/stamina/errors.rb +0 -23
data/lib/stamina/ext/math.rb +0 -20
data/lib/stamina/induction/blue_fringe.rb +0 -265
data/lib/stamina/induction/commons.rb +0 -156
data/lib/stamina/induction/rpni.rb +0 -186
data/lib/stamina/induction/union_find.rb +0 -377
data/lib/stamina/input_string.rb +0 -123
data/lib/stamina/loader.rb +0 -1
data/lib/stamina/markable.rb +0 -42
data/lib/stamina/sample.rb +0 -267
data/lib/stamina/scoring.rb +0 -213
data/lib/stamina/utils.rb +0 -1
data/lib/stamina/utils/decorate.rb +0 -81
data/lib/stamina/version.rb +0 -14
data/stamina.gemspec +0 -191
data/stamina.noespec +0 -32
data/tasks/debug_mail.rake +0 -78
data/tasks/debug_mail.txt +0 -13
data/tasks/gem.rake +0 -68
data/tasks/spec_test.rake +0 -79
data/tasks/unit_test.rake +0 -77
data/tasks/yard.rake +0 -51
data/test/stamina/abbadingo/random_dfa_test.rb +0 -16
data/test/stamina/abbadingo/random_sample_test.rb +0 -78
data/test/stamina/adl_test.rb +0 -516
data/test/stamina/automaton/classifier_test.rb +0 -259
data/test/stamina/automaton/complete_test.rb +0 -58
data/test/stamina/automaton/equivalence_test.rb +0 -120
data/test/stamina/automaton/metrics_test.rb +0 -36
data/test/stamina/automaton/minimize/hopcroft_test.rb +0 -15
data/test/stamina/automaton/minimize/minimize_test.rb +0 -55
data/test/stamina/automaton/minimize/pitchies_test.rb +0 -15
data/test/stamina/automaton/minimize/rice_edu_10.adl +0 -16
data/test/stamina/automaton/minimize/rice_edu_10.min.adl +0 -13
data/test/stamina/automaton/minimize/rice_edu_13.adl +0 -13
data/test/stamina/automaton/minimize/rice_edu_13.min.adl +0 -7
data/test/stamina/automaton/minimize/should_strip_1.adl +0 -8
data/test/stamina/automaton/minimize/should_strip_1.min.adl +0 -6
data/test/stamina/automaton/minimize/unknown_1.adl +0 -16
data/test/stamina/automaton/minimize/unknown_1.min.adl +0 -12
data/test/stamina/automaton/strip_test.rb +0 -36
data/test/stamina/automaton/to_dot_test.rb +0 -64
data/test/stamina/automaton/walking/dfa_delta_test.rb +0 -39
data/test/stamina/automaton/walking_test.rb +0 -206
data/test/stamina/automaton_additional_test.rb +0 -190
data/test/stamina/automaton_test.rb +0 -1104
data/test/stamina/exit.rb +0 -3
data/test/stamina/induction/blue_fringe_test.rb +0 -83
data/test/stamina/induction/induction_test.rb +0 -70
data/test/stamina/induction/redblue_mergesamestatebug_expected.adl +0 -19
data/test/stamina/induction/redblue_mergesamestatebug_pta.dot +0 -64
data/test/stamina/induction/redblue_mergesamestatebug_sample.adl +0 -9
data/test/stamina/induction/redblue_universal_expected.adl +0 -4
data/test/stamina/induction/redblue_universal_sample.adl +0 -5
data/test/stamina/induction/rpni_inria_expected.adl +0 -7
data/test/stamina/induction/rpni_inria_sample.adl +0 -9
data/test/stamina/induction/rpni_test.rb +0 -129
data/test/stamina/induction/rpni_test_pta.dot +0 -22
data/test/stamina/induction/rpni_universal_expected.adl +0 -4
data/test/stamina/induction/rpni_universal_sample.adl +0 -4
data/test/stamina/induction/union_find_test.rb +0 -124
data/test/stamina/input_string_test.rb +0 -323
data/test/stamina/markable_test.rb +0 -70
data/test/stamina/randdfa.adl +0 -66
data/test/stamina/sample.adl +0 -4
data/test/stamina/sample_classify_test.rb +0 -149
data/test/stamina/sample_test.rb +0 -290
data/test/stamina/scoring_test.rb +0 -63
data/test/stamina/small_dfa.dot +0 -16
data/test/stamina/small_dfa.gif +0 -0
data/test/stamina/small_nfa.dot +0 -18
data/test/stamina/small_nfa.gif +0 -0
data/test/stamina/stamina_test.rb +0 -80
data/test/stamina/utils/decorate_test.rb +0 -65
data/test/test_all.rb +0 -7

data/lib/stamina/classifier.rb DELETED Viewed

@@ -1,52 +0,0 @@
-module Stamina
-  #
-  # Provides a reusable module for binary classifiers. Classes including this
-  # module are required to provide a label_of(string) method, returning '1' for
-  # strings considered positive, and '0' fr strings considered negative.
-  #
-  # Note that an Automaton being a classifier it already includes this module.
-  #
-  module Classifier
-    #
-    # Computes a signature for a given sample (that is, an ordered set of strings).
-    # The signature is a string containing 1 (considered positive, or accepted)
-    # and 0 (considered negative, or rejected), one for each string.
-    #
-    def signature(sample)
-      signature = ''
-      sample.each do |str|
-        signature << label_of(str)
-      end
-      signature
-    end
-    alias :classification_signature :signature
-    #
-    # Classifies a sample then compute the classification scoring that is obtained
-    # by comparing the signature obtained by classification and the one of the sample
-    # itself. Returns an object responding to methods defined in Scoring module.
-    #
-    # This method is actually a convenient shortcut for:
-    #
-    #    Stamina::Scoring.scoring(signature(sample), sample.signature)
-    #
-    def scoring(sample)
-      Stamina::Scoring.scoring(signature(sample), sample.signature)
-    end
-    alias :classification_scoring :scoring
-    #
-    # Checks if a labeled sample is correctly classified by the classifier.
-    #
-    def correctly_classify?(sample)
-      sample.each do |str|
-        label = label_of(str)
-        expected = (str.positive? ? '1' : '0')
-        return false unless expected==label
-      end
-      true
-    end
-  end # module Classifier
-end # module Stamina

data/lib/stamina/command.rb DELETED Viewed

@@ -1,45 +0,0 @@
-require 'stamina'
-module Stamina
-  #
-  # Stamina - A Ruby Automaton & Induction Toolkit
-  #
-  # SYNOPSIS
-  #   #{program_name} [--version] [--help] COMMAND [cmd opts] ARGS...
-  #
-  # OPTIONS
-  # #{summarized_options}
-  #
-  # COMMANDS
-  # #{summarized_subcommands}
-  #
-  # See '#{program_name} help COMMAND' for more information on a specific command.
-  #
-  class Command < ::Quickl::Delegator(__FILE__, __LINE__)
-    # Install options
-    options do |opt|
-      # Show the help and exit
-      opt.on_tail("--help", "Show help") do
-        raise Quickl::Help
-      end
-      # Show version and exit
-      opt.on_tail("--version", "Show version") do
-        raise Quickl::Exit, "#{program_name} #{VERSION} (c) 2010-2011, Bernard Lambeau"
-      end
-    end
-  end # class Command
-end # module Stamina
-require 'stamina/command/robustness'
-require 'stamina/command/help'
-require 'stamina/command/adl2dot'
-require 'stamina/command/metrics'
-require 'stamina/command/classify'
-require 'stamina/command/score'
-require 'stamina/command/abbadingo_dfa'
-require 'stamina/command/abbadingo_samples'
-require 'stamina/command/infer'

data/lib/stamina/command/abbadingo_dfa.rb DELETED Viewed

@@ -1,81 +0,0 @@
-module Stamina
-  class Command
-    #
-    # Generates a DFA following Abbadingo's protocol
-    #
-    # SYNOPSIS
-    #   #{program_name} #{command_name}
-    #
-    # OPTIONS
-    # #{summarized_options}
-    #
-    class AbbadingoDfa < Quickl::Command(__FILE__, __LINE__)
-      include Robustness
-      # Size of the target automaton
-      attr_accessor :size
-      # Tolerance on the size
-      attr_accessor :size_tolerance
-      # Tolerance on the automaton depth
-      attr_accessor :depth_tolerance
-      # Where to flush the dfa
-      attr_accessor :output_file
-      # Install options
-      options do |opt|
-        @size = 64
-        opt.on("--size=X", Integer, "Sets the size of the automaton to generate") do |x|
-          @size = x
-        end
-        @size_tolerance = nil
-        opt.on("--size-tolerance[=X]", Integer, "Sets the tolerance on automaton size (in number of states)") do |x|
-          @size_tolerance = x
-        end
-        @depth_tolerance = 0
-        opt.on("--depth-tolerance[=X]", Integer, "Sets the tolerance on expected automaton depth (in length, 0 by default)") do |x|
-          @depth_tolerance = x
-        end
-        @output_file = nil
-        opt.on("-o", "--output=OUTPUT",
-               "Flush DFA in output file") do |value|
-          @output_file = assert_writable_file(value)
-        end
-      end # options
-      def accept?(dfa)
-        (size_tolerance.nil?  || (size - dfa.state_count).abs <= size_tolerance) &&
-        (depth_tolerance.nil? || ((2*Math.log2(size)-2) - dfa.depth).abs <= depth_tolerance)
-      end
-      # Command execution
-      def execute(args)
-        require 'stamina/abbadingo'
-        # generate it
-        randomizer = Stamina::Abbadingo::RandomDFA.new(size)
-        begin
-          dfa = randomizer.execute
-        end until accept?(dfa)
-        # flush it
-        if output_file
-          File.open(output_file, 'w') do |file|
-            Stamina::ADL.print_automaton(dfa, file)
-          end
-        else
-          Stamina::ADL.print_automaton(dfa, $stdout)
-        end
-      end
-    end # class AbbadingoDFA
-  end # class Command
-end # module Stamina

data/lib/stamina/command/abbadingo_samples.rb DELETED Viewed

@@ -1,40 +0,0 @@
-module Stamina
-  class Command
-    #
-    # Generates samples following Abbadingo's protocol
-    #
-    # SYNOPSIS
-    #   #{program_name} #{command_name} target.adl
-    #
-    # OPTIONS
-    # #{summarized_options}
-    #
-    class AbbadingoSamples < Quickl::Command(__FILE__, __LINE__)
-      # Install options
-      options do |opt|
-      end # options
-      # Command execution
-      def execute(args)
-        raise Quickl::Help unless args.size == 1
-        # Loads the target automaton
-        target_file = args.first
-        basename = File.basename(target_file, '.adl')
-        dirname = File.dirname(target_file)
-        target = Stamina::ADL::parse_automaton_file(target_file)
-        require 'stamina/abbadingo'
-        training, test = Stamina::Abbadingo::RandomSample.execute(target)
-        # Flush results aside the target automaton file
-        Stamina::ADL::print_sample_in_file(training, File.join(dirname, "#{basename}-training.adl"))
-        Stamina::ADL::print_sample_in_file(test,     File.join(dirname, "#{basename}-test.adl"))
-      end
-    end # class AbbadingoSamples
-  end # class Command
-end # module Stamina

data/lib/stamina/command/adl2dot.rb DELETED Viewed

@@ -1,71 +0,0 @@
-module Stamina
-  class Command
-    #
-    # Prints an automaton expressed in ADL in dot (or gif) format
-    #
-    # SYNOPSIS
-    #   #{program_name} #{command_name} automaton.adl
-    #
-    # OPTIONS
-    # #{summarized_options}
-    #
-    class Adl2dot < Quickl::Command(__FILE__, __LINE__)
-      include Robustness
-      attr_reader :gif_output
-      # Install options
-      options do |opt|
-        @output_file = nil
-        opt.on("-o", "--output=OUTPUT",
-               "Flush result output file") do |value|
-          @output_file = assert_writable_file(value)
-        end
-        opt.on("-g", "--gif",
-               "Generates a gif file instead of a dot one") do
-          @gif_output = true
-        end
-      end # options
-      def output_file(infile)
-        @output_file || "#{File.basename(infile || 'stdin.adl', '.adl')}.#{gif_output ? 'gif' : 'dot'}"
-      end
-      # Command execution
-      def execute(args)
-        raise Quickl::Help unless args.size <= 1
-        # Loads the target automaton
-        input = if args.size == 1
-          File.read assert_readable_file(args.first)
-        else
-          $stdin.readlines.join("\n")
-        end
-        automaton = Stamina::ADL::parse_automaton(input)
-        # create a file for the dot output
-        if gif_output
-          require 'tempfile'
-          dotfile = Tempfile.new("stamina").path
-        else
-          dotfile = output_file(args.first)
-        end
-        # Flush automaton inside it
-        File.open(dotfile, 'w') do |f|
-          f << automaton.to_dot
-        end
-        # if gif output, use dot to convert it
-        if gif_output
-          `dot -Tgif -o #{output_file(args.first)} #{dotfile}`
-        end
-      end
-    end # class Adl2dot
-  end # class Command
-end # module Stamina

data/lib/stamina/command/classify.rb DELETED Viewed

@@ -1,48 +0,0 @@
-module Stamina
-  class Command
-    #
-    # Classifies a sample thanks with an automaton
-    #
-    # SYNOPSIS
-    #   #{program_name} #{command_name} sample.adl automaton.adl
-    #
-    # OPTIONS
-    # #{summarized_options}
-    #
-    class Classify < Quickl::Command(__FILE__, __LINE__)
-      include Robustness
-      # Where to flush the output
-      attr_accessor :output_file
-      # Install options
-      options do |opt|
-        @output_file = nil
-        opt.on("-o", "--output=OUTPUT",
-               "Flush classification signature in output file") do |value|
-          assert_writable_file(value)
-          @output_file = value
-        end
-      end # options
-      # Command execution
-      def execute(args)
-        raise Quickl::Help unless args.size == 2
-        sample    = Stamina::ADL::parse_sample_file assert_readable_file(args.first)
-        automaton = Stamina::ADL::parse_automaton_file assert_readable_file(args.last)
-        if of = output_file
-          File.open(of, 'w'){|io|
-            io << automaton.signature(sample)
-          }
-        else
-          $stdout << automaton.signature(sample)
-        end
-      end
-    end # class Classify
-  end # class Command
-end # module Stamina

data/lib/stamina/command/help.rb DELETED Viewed

@@ -1,27 +0,0 @@
-module Stamina
-  class Command
-    #
-    # Show help about a specific command
-    #
-    # SYNOPSIS
-    #   #{program_name} #{command_name} COMMAND
-    #
-    class Help < Quickl::Command(__FILE__, __LINE__)
-      # Let NoSuchCommandError be passed to higher stage
-      no_react_to Quickl::NoSuchCommand
-      # Command execution
-      def execute(args)
-        if args.size != 1
-          puts super_command.help
-        else
-          cmd = has_command!(args.first, super_command)
-          puts cmd.help
-        end
-      end
-    end # class Help
-  end # class Command
-end # module Stamina

data/lib/stamina/command/infer.rb DELETED Viewed

@@ -1,141 +0,0 @@
-module Stamina
-  class Command
-    #
-    # Grammar inference, induces a DFA from a training sample using an
-    # chosen algorithm.
-    #
-    # SYNOPSIS
-    #   #{program_name} #{command_name} sample.adl
-    #
-    # OPTIONS
-    # #{summarized_options}
-    #
-    class Infer < Quickl::Command(__FILE__, __LINE__)
-      include Robustness
-      attr_accessor :algorithm
-      attr_accessor :take
-      attr_accessor :score
-      attr_accessor :verbose
-      attr_accessor :drop
-      attr_accessor :output_file
-      # Install options
-      options do |opt|
-        @algorithm = :rpni
-        opt.on("--algorithm=X", "Sets the induction algorithm to use (rpni, bluefringe)") do |x|
-          @algorithm = x.to_sym
-        end
-        @take = 1.0
-        opt.on("--take=X", Float, "Take only X% of available strings") do |x|
-          @take = x.to_f
-          unless @take > 0.0 and @take <= 1.0
-            raise Quickl::InvalidOption, "Invalid --take option: #{@take}"
-          end
-        end
-        @score = nil
-        opt.on("--score=test.adl", "Add scoring information to metadata, using test.adl file") do |x|
-          @score = assert_readable_file(x)
-        end
-        @verbose = true
-        opt.on("-v", "--[no-]verbose", "Verbose mode") do |x|
-          @verbose = x
-        end
-        @drop = false
-        opt.on("-d", "--drop", "Drop result") do |x|
-          @drop = x
-        end
-        @output_file = nil
-        opt.on("-o", "--output=OUTPUT",
-               "Flush induced DFA in output file") do |value|
-          @output_file = assert_writable_file(value)
-        end
-      end # options
-      def launch_induction(sample)
-        require 'benchmark'
-        algo_clazz = case algorithm
-          when :rpni
-            Stamina::Induction::RPNI
-          when :bluefringe
-            Stamina::Induction::BlueFringe
-          else
-            raise Quickl::InvalidOption, "Unknown induction algorithm: #{algo}"
-        end
-        dfa, tms = nil, nil
-        tms = Benchmark.measure do
-          dfa = algo_clazz.execute(sample, {:verbose => verbose})
-        end
-        [dfa, tms]
-      end
-      def load_sample(file)
-        sample = Stamina::ADL.parse_sample_file(file)
-        if @take != 1.0
-          sampled = Stamina::Sample.new
-          sample.each_positive{|s| sampled << s if Kernel.rand < @take}
-          sample.each_negative{|s| sampled << s if Kernel.rand < @take}
-          sample = sampled
-        end
-        sample
-      end
-      # Command execution
-      def execute(args)
-        raise Quickl::Help unless args.size == 1
-        # Parses the sample
-        $stderr << "Parsing sample...\n" if verbose
-        sample = load_sample(assert_readable_file(args.first))
-        # Induce the DFA
-        dfa, tms = launch_induction(sample)
-        # Flush result
-        unless drop
-          if output_file
-            File.open(output_file, 'w') do |file|
-              Stamina::ADL.print_automaton(dfa, file)
-            end
-          else
-            Stamina::ADL.print_automaton(dfa, $stdout)
-          end
-        end
-        # build meta information
-        meta = {:algorithm   => algorithm,
-                :sample      => File.basename(args.first),
-                :take        => take,
-                :sample_size => sample.size,
-                :positive_count => sample.positive_count,
-                :negative_count => sample.negative_count,
-                :real_time   => tms.real,
-                :total_time  => tms.total,
-                :user_time   => tms.utime + tms.cutime,
-                :system_time => tms.stime + tms.cstime}
-        if score
-          test = Stamina::ADL::parse_sample_file(score)
-          classified_as = dfa.signature(test)
-          reference = test.signature
-          scoring = Scoring.scoring(classified_as, reference)
-          meta.merge!(scoring.to_h)
-        end
-        # Display information
-        puts meta.inspect
-      end
-    end # class Infer
-  end # class Command
-end # module Stamina