RubyGems - ai4r - Versions diffs - 1.1 → 1.2 - Mend

ai4r 1.1 → 1.2

Files changed (140) hide show

data/README.rdoc +21 -20
data/examples/decision_trees/id3_example.rb +3 -2
data/examples/genetic_algorithm/genetic_algorithm_example.rb +6 -6
data/examples/neural_network/backpropagation_example.rb +2 -2
data/lib/ai4r/classifiers/classifier_helper.rb +54 -0
data/lib/ai4r/classifiers/id3.rb +356 -0
data/lib/ai4r/classifiers/one_r.rb +148 -0
data/lib/ai4r/classifiers/prism.rb +231 -0
data/lib/ai4r/classifiers/zero_r.rb +104 -0
data/lib/ai4r/genetic_algorithm/genetic_algorithm.rb +272 -0
data/lib/ai4r/neural_network/backpropagation.rb +271 -0
data/site/build/tmp/locationmap.xml +14 -14
data/site/build/tmp/output.xmap +23 -23
data/site/build/tmp/pluginlist2fetchbuild.xml +144 -144
data/site/build/tmp/plugins-1.xml +0 -11
data/site/build/tmp/plugins-2.xml +54 -0
data/site/build/tmp/projfilters.properties +41 -41
data/site/build/webapp/WEB-INF/logs/core.log +681 -788
data/site/build/webapp/WEB-INF/logs/error.log +281 -248
data/site/build/webapp/WEB-INF/logs/sitemap.log +1015 -0
data/site/src/documentation/content/xdocs/forum.html +9 -0
data/site/src/documentation/content/xdocs/geneticAlgorithms.xml +82 -68
data/site/src/documentation/content/xdocs/index.xml +47 -18
data/site/src/documentation/content/xdocs/machineLearning.xml +10 -9
data/site/src/documentation/content/xdocs/neuralNetworks.xml +60 -36
data/site/src/documentation/content/xdocs/site.xml +8 -5
data/site/src/documentation/content/xdocs/svn.xml +11 -1
data/site/src/documentation/resources/images/Thumbs.db +0 -0
data/site/src/documentation/resources/images/ai4r-logo.png +0 -0
data/site/src/documentation/resources/images/genetic_algorithms_example.png +0 -0
data/site/src/documentation/resources/images/jadeferret.png +0 -0
data/site/src/documentation/resources/images/neural_network_example.png +0 -0
data/site/src/documentation/resources/images/sub-dir/Thumbs.db +0 -0
data/site/src/documentation/skinconf.xml +18 -18
data/test/classifiers/id3_test.rb +206 -0
data/test/classifiers/one_r_test.rb +62 -0
data/test/classifiers/prism_test.rb +83 -0
data/test/classifiers/zero_r_test.rb +48 -0
data/test/genetic_algorithm/chromosome_test.rb +41 -38
data/test/genetic_algorithm/genetic_algorithm_test.rb +64 -61
data/test/neural_network/backpropagation_test.rb +20 -18
metadata +109 -199
data/lib/decision_tree/id3.rb +0 -354
data/lib/genetic_algorithm/genetic_algorithm.rb +0 -268
data/lib/neural_network/backpropagation.rb +0 -264
data/site/build/site/en/broken-links.xml +0 -2
data/site/build/site/en/downloads.html +0 -187
data/site/build/site/en/downloads.pdf +0 -151
data/site/build/site/en/geneticAlgorithms.html +0 -564
data/site/build/site/en/geneticAlgorithms.pdf +0 -911
data/site/build/site/en/images/ai4r-logo.png +0 -0
data/site/build/site/en/images/built-with-forrest-button.png +0 -0
data/site/build/site/en/images/c.png +0 -0
data/site/build/site/en/images/c_wbn.png +0 -0
data/site/build/site/en/images/c_wn.png +0 -0
data/site/build/site/en/images/ero.gif +0 -0
data/site/build/site/en/images/europe2.png +0 -0
data/site/build/site/en/images/europe3.png +0 -0
data/site/build/site/en/images/fitness.png +0 -0
data/site/build/site/en/images/instruction_arrow.png +0 -0
data/site/build/site/en/images/my_email.png +0 -0
data/site/build/site/en/images/rubyforge.png +0 -0
data/site/build/site/en/images/s.png +0 -0
data/site/build/site/en/images/s_wbn.png +0 -0
data/site/build/site/en/images/s_wn.png +0 -0
data/site/build/site/en/images/sigmoid.png +0 -0
data/site/build/site/en/images/t.png +0 -0
data/site/build/site/en/images/t_wbn.png +0 -0
data/site/build/site/en/images/t_wn.png +0 -0
data/site/build/site/en/index.html +0 -258
data/site/build/site/en/index.pdf +0 -306
data/site/build/site/en/linkmap.html +0 -231
data/site/build/site/en/linkmap.pdf +0 -94
data/site/build/site/en/locationmap.xml +0 -72
data/site/build/site/en/machineLearning.html +0 -325
data/site/build/site/en/machineLearning.pdf +0 -337
data/site/build/site/en/neuralNetworks.html +0 -446
data/site/build/site/en/neuralNetworks.pdf +0 -604
data/site/build/site/en/skin/CommonMessages_de.xml +0 -23
data/site/build/site/en/skin/CommonMessages_en_US.xml +0 -23
data/site/build/site/en/skin/CommonMessages_es.xml +0 -23
data/site/build/site/en/skin/CommonMessages_fr.xml +0 -23
data/site/build/site/en/skin/basic.css +0 -166
data/site/build/site/en/skin/breadcrumbs-optimized.js +0 -90
data/site/build/site/en/skin/breadcrumbs.js +0 -237
data/site/build/site/en/skin/fontsize.js +0 -166
data/site/build/site/en/skin/getBlank.js +0 -40
data/site/build/site/en/skin/getMenu.js +0 -45
data/site/build/site/en/skin/images/README.txt +0 -1
data/site/build/site/en/skin/images/add.jpg +0 -0
data/site/build/site/en/skin/images/built-with-forrest-button.png +0 -0
data/site/build/site/en/skin/images/chapter.gif +0 -0
data/site/build/site/en/skin/images/chapter_open.gif +0 -0
data/site/build/site/en/skin/images/current.gif +0 -0
data/site/build/site/en/skin/images/error.png +0 -0
data/site/build/site/en/skin/images/external-link.gif +0 -0
data/site/build/site/en/skin/images/fix.jpg +0 -0
data/site/build/site/en/skin/images/forrest-credit-logo.png +0 -0
data/site/build/site/en/skin/images/hack.jpg +0 -0
data/site/build/site/en/skin/images/header_white_line.gif +0 -0
data/site/build/site/en/skin/images/info.png +0 -0
data/site/build/site/en/skin/images/instruction_arrow.png +0 -0
data/site/build/site/en/skin/images/label.gif +0 -0
data/site/build/site/en/skin/images/page.gif +0 -0
data/site/build/site/en/skin/images/pdfdoc.gif +0 -0
data/site/build/site/en/skin/images/poddoc.png +0 -0
data/site/build/site/en/skin/images/printer.gif +0 -0
data/site/build/site/en/skin/images/rc-b-l-15-1body-2menu-3menu.png +0 -0
data/site/build/site/en/skin/images/rc-b-r-15-1body-2menu-3menu.png +0 -0
data/site/build/site/en/skin/images/rc-b-r-5-1header-2tab-selected-3tab-selected.png +0 -0
data/site/build/site/en/skin/images/rc-t-l-5-1header-2searchbox-3searchbox.png +0 -0
data/site/build/site/en/skin/images/rc-t-l-5-1header-2tab-selected-3tab-selected.png +0 -0
data/site/build/site/en/skin/images/rc-t-l-5-1header-2tab-unselected-3tab-unselected.png +0 -0
data/site/build/site/en/skin/images/rc-t-r-15-1body-2menu-3menu.png +0 -0
data/site/build/site/en/skin/images/rc-t-r-5-1header-2searchbox-3searchbox.png +0 -0
data/site/build/site/en/skin/images/rc-t-r-5-1header-2tab-selected-3tab-selected.png +0 -0
data/site/build/site/en/skin/images/rc-t-r-5-1header-2tab-unselected-3tab-unselected.png +0 -0
data/site/build/site/en/skin/images/remove.jpg +0 -0
data/site/build/site/en/skin/images/rss.png +0 -0
data/site/build/site/en/skin/images/spacer.gif +0 -0
data/site/build/site/en/skin/images/success.png +0 -0
data/site/build/site/en/skin/images/txtdoc.png +0 -0
data/site/build/site/en/skin/images/update.jpg +0 -0
data/site/build/site/en/skin/images/valid-html401.png +0 -0
data/site/build/site/en/skin/images/vcss.png +0 -0
data/site/build/site/en/skin/images/warning.png +0 -0
data/site/build/site/en/skin/images/xmldoc.gif +0 -0
data/site/build/site/en/skin/menu.js +0 -48
data/site/build/site/en/skin/note.txt +0 -50
data/site/build/site/en/skin/print.css +0 -54
data/site/build/site/en/skin/profile.css +0 -163
data/site/build/site/en/skin/prototype.js +0 -1257
data/site/build/site/en/skin/screen.css +0 -587
data/site/build/site/en/svn.html +0 -223
data/site/build/site/en/svn.pdf +0 -239
data/site/build/site/en/wholesite.pdf +0 -1686
data/site/build/tmp/brokenlinks.xml +0 -2
data/site/build/tmp/cocoon-work/cache-dir/cocoon-ehcache-1.data +0 -0
data/site/build/tmp/cocoon-work/cache-dir/cocoon-ehcache-1.index +0 -0
data/test/decision_tree/id3_test.rb +0 -209

data/lib/ai4r/classifiers/one_r.rb ADDED

@@ -0,0 +1,148 @@
+# Author::    Sergio Fierens (Implementation only)
+# License::   MPL 1.1
+# Project::   ai4r
+# Url::       http://ai4r.rubyforge.org/
+#
+# You can redistribute it and/or modify it under the terms of
+# the Mozilla Public License version 1.1  as published by the
+# Mozilla Foundation at http://www.mozilla.org/MPL/MPL-1.1.txt
+require 'set'
+require File.dirname(__FILE__) + '/classifier_helper'
+require File.dirname(__FILE__) + '/zero_r'
+module Ai4r
+  module Classifiers
+    # = Introduction
+    #
+    # The idea of the OneR algorithm is identify the single
+    # attribute to use to classify data that makes
+    # fewest prediction errors.
+    # It generates rules based on a single attribute.
+    class OneR
+      attr_accessor :data_labels, :rule
+      include ClassifierHelper
+      # Build a new OneR classifier. If your data is classified with N attributed
+      # and M examples, then your data examples must have the following format:
+      #
+      #     [   [ATT1_VAL1, ATT2_VAL1, ATT3_VAL1, ... , ATTN_VAL1,  CLASS_VAL1],
+      #         [ATT1_VAL2, ATT2_VAL2, ATT3_VAL2, ... , ATTN_VAL2,  CLASS_VAL2],
+      #         ...
+      #         [ATTM1_VALM, ATT2_VALM, ATT3_VALM, ... , ATTN_VALM, CLASS_VALM],
+      #     ]
+      #
+      # e.g.
+      #     [   ['New York',  '<30',      'M', 'Y'],
+      #          ['Chicago',     '<30',      'M', 'Y'],
+      #          ['Chicago',     '<30',      'F', 'Y'],
+      #          ['New York',  '<30',      'M', 'Y'],
+      #          ['New York',  '<30',      'M', 'Y'],
+      #          ['Chicago',     '[30-50)',  'M', 'Y'],
+      #          ['New York',  '[30-50)',  'F', 'N'],
+      #          ['Chicago',     '[30-50)',  'F', 'Y'],
+      #          ['New York',  '[30-50)',  'F', 'N'],
+      #          ['Chicago',     '[50-80]', 'M', 'N'],
+      #          ['New York',  '[50-80]', 'F', 'N'],
+      #          ['New York',  '[50-80]', 'M', 'N'],
+      #          ['Chicago',     '[50-80]', 'M', 'N'],
+      #          ['New York',  '[50-80]', 'F', 'N'],
+      #          ['Chicago',     '>80',      'F', 'Y']
+      #        ]
+      #
+      # Data labels must have the following format:
+      #     [ 'city', 'age_range', 'gender', 'marketing_target'  ]
+      #
+      # If you do not provide labels for you data, the following labels will
+      # be created by default:
+      #     [ 'attribute_1', 'attribute_2', 'attribute_3', 'class_value'  ]
+      #
+      def build(data_examples, data_labels = nil)
+        check_data_examples(data_examples)
+        @data_labels = (data_labels) ? data_labels : default_data_labels(data_examples)
+        if (num_attributes(data_examples) == 1)
+          @zero_r = ZeroR.new.build(data_examples, data_labels)
+          return self;
+        else
+          @zero_r = nil;
+        end
+        domains = build_domains(data_examples)
+        @rule = nil
+        domains[1...-1].each_index do |attr_index|
+          rule = build_rule(data_examples, attr_index, domains)
+          @rule = rule if !@rule || rule[:correct] > @rule[:correct]
+        end
+        return self
+      end
+      # You can evaluate new data, predicting its class.
+      # e.g.
+      #   classifier.eval(['New York',  '<30', 'F'])  # => 'Y'
+      def eval(data)
+        return @zero_r.eval(data) if @zero_r
+        attr_value = data[@rule[:attr_index]]
+        return @rule[:rule][attr_value]
+      end
+      # This method returns the generated rules in ruby code.
+      # e.g.
+      #
+      #   classifier.to_s
+      #     # =>  if age_range == '<30' then marketing_target = 'Y'
+      #           elsif age_range == '[30-50)' then marketing_target = 'N'
+      #           elsif age_range == '[50-80]' then marketing_target = 'N'
+      #           end
+      #
+      # It is a nice way to inspect induction results, and also to execute them:
+      #     marketing_target = nil
+      #     eval classifier.to_s
+      #     puts marketing_target
+      #       # =>  'Y'
+      def to_s
+        return @zero_r.to_s if @zero_r
+        sentences = []
+        attr_label = @data_labels[@rule[:attr_index]]
+        class_label = @data_labels.last
+        @rule[:rule].each_pair do |attr_value, class_value|
+          sentences << "#{attr_label} == '#{attr_value}' then #{class_label} = '#{class_value}'"
+        end
+        return "if " + sentences.join("\nelsif ") + "\nend"
+      end
+      protected
+      def build_domains(data_examples)
+        domains = Array.new(num_attributes(data_examples)) { Set.new }
+        data_examples.each do |data|
+          data.each_index {|attr_index| domains[attr_index] << data[attr_index]}
+        end
+        return domains
+      end
+      def build_rule(data_examples, attr_index, domains)
+        domain = domains[attr_index]
+        value_freq = Hash.new
+        domain.each do |attr_value|
+          value_freq[attr_value] = Hash.new { |hash, key| hash[key] = 0 }
+        end
+        data_examples.each do |data|
+          value_freq[data[attr_index]][data.last] = value_freq[data[attr_index]][data.last] + 1
+        end
+        rule = {}
+        correct_instances = 0
+        value_freq.each_pair do |attr, class_freq_hash|
+          max_freq = 0
+          class_freq_hash.each_pair do |class_value, freq|
+            if max_freq < freq
+              rule[attr] = class_value
+              max_freq = freq
+            end
+          end
+          correct_instances += max_freq
+        end
+        return {:attr_index => attr_index, :rule => rule, :correct => correct_instances}
+      end
+    end
+  end
+end

data/lib/ai4r/classifiers/prism.rb ADDED

@@ -0,0 +1,231 @@
+# Author::    Sergio Fierens (Implementation only, Cendrowska is
+# the creator of the algorithm)
+# License::   MPL 1.1
+# Project::   ai4r
+# Url::       http://ai4r.rubyforge.org/
+#
+# You can redistribute it and/or modify it under the terms of
+# the Mozilla Public License version 1.1  as published by the
+# Mozilla Foundation at http://www.mozilla.org/MPL/MPL-1.1.txt
+#
+# J. Cendrowska (1987). PRISM: An algorithm for inducing modular rules.
+# International Journal of Man-Machine Studies. 27(4):349-370.
+require File.dirname(__FILE__) + '/classifier_helper'
+module Ai4r
+  module Classifiers
+    # = Introduction
+    # This is an implementation of the PRISM algorithm (Cendrowska, 1987)
+    # Given a set of preclassified examples, it builds a set of rules
+    # to predict the class of other instaces.
+    #
+    # J. Cendrowska (1987). PRISM: An algorithm for inducing modular rules.
+    # International Journal of Man-Machine Studies. 27(4):349-370.
+    class Prism
+      attr_accessor :data_labels, :rules
+      include ClassifierHelper
+      # Build a new Prism classifier. If your data is classified with N attributed
+      # and M examples, then your data examples must have the following format:
+      #
+      #     [   [ATT1_VAL1, ATT2_VAL1, ATT3_VAL1, ... , ATTN_VAL1,  CLASS_VAL1],
+      #         [ATT1_VAL2, ATT2_VAL2, ATT3_VAL2, ... , ATTN_VAL2,  CLASS_VAL2],
+      #         ...
+      #         [ATTM1_VALM, ATT2_VALM, ATT3_VALM, ... , ATTN_VALM, CLASS_VALM],
+      #     ]
+      #
+      # e.g.
+      #     [   ['New York',  '<30',      'M', 'Y'],
+      #          ['Chicago',     '<30',      'M', 'Y'],
+      #          ['Chicago',     '<30',      'F', 'Y'],
+      #          ['New York',  '<30',      'M', 'Y'],
+      #          ['New York',  '<30',      'M', 'Y'],
+      #          ['Chicago',     '[30-50)',  'M', 'Y'],
+      #          ['New York',  '[30-50)',  'F', 'N'],
+      #          ['Chicago',     '[30-50)',  'F', 'Y'],
+      #          ['New York',  '[30-50)',  'F', 'N'],
+      #          ['Chicago',     '[50-80]', 'M', 'N'],
+      #          ['New York',  '[50-80]', 'F', 'N'],
+      #          ['New York',  '[50-80]', 'M', 'N'],
+      #          ['Chicago',     '[50-80]', 'M', 'N'],
+      #          ['New York',  '[50-80]', 'F', 'N'],
+      #          ['Chicago',     '>80',      'F', 'Y']
+      #        ]
+      #
+      # Data labels must have the following format:
+      #     [ 'city', 'age_range', 'gender', 'marketing_target'  ]
+      #
+      # If you do not provide labels for you data, the following labels will
+      # be created by default:
+      #     [ 'attribute_1', 'attribute_2', 'attribute_3', 'class_value'  ]
+      #
+      def build(data_examples, data_labels=nil)
+        check_data_examples(data_examples)
+        @data_labels = (data_labels) ? data_labels : default_data_labels(data_examples)
+        domains = build_domains(data_examples)
+        instances = data_examples.collect {|data| data }
+        @rules = []
+        domains.last.each do |class_value|
+          while(has_class_value(instances, class_value))
+            rule = build_rule(class_value, instances)
+            @rules << rule
+            instances = instances.select {|data| !matches_conditions(data, rule[:conditions])}
+          end
+        end
+        return self
+      end
+      # You can evaluate new data, predicting its class.
+      # e.g.
+      #   classifier.eval(['New York',  '<30', 'F'])  # => 'Y'
+      def eval(instace)
+        @rules.each do |rule|
+          return rule[:class_value] if matches_conditions(instace, rule[:conditions])
+        end
+        return nil
+      end
+      # This method returns the generated rules in ruby code.
+      # e.g.
+      #
+      #   classifier.to_s
+      #     # => if age_range == '<30' then marketing_target = 'Y'
+      #    elsif age_range == '>80' then marketing_target = 'Y'
+      #    elsif city == 'Chicago' and age_range == '[30-50)' then marketing_target = 'Y'
+      #    else marketing_target = 'N'
+      #    end
+      #
+      # It is a nice way to inspect induction results, and also to execute them:
+      #        age_range = '[30-50)'
+      #        city = 'New York'
+      #        eval(classifier.to_s)
+      #        puts marketing_target
+      #         'Y'
+      def to_s
+        out = "if #{join_terms(@rules.first)} then #{then_clause(@rules.first)}"
+        @rules[1...-1].each do |rule|
+          out += "\nelsif #{join_terms(rule)} then #{then_clause(rule)}"
+        end
+        out += "\nelse #{then_clause(@rules.last)}" if @rules.size > 1
+        out += "\nend"
+        return out
+      end
+      protected
+      def has_class_value(instances, class_value)
+        instances.each { |data| return true if data.last == class_value}
+        return false
+      end
+      def is_perfect(instances, rule)
+        class_value = rule[:class_value]
+        instances.each do |data|
+          return false if data.last != class_value and matches_conditions(data, rule[:conditions])
+        end
+        return true
+      end
+      def matches_conditions(data, conditions)
+        conditions.each_pair do |attr_label, attr_value|
+          return false if data[get_attr_index(attr_label)] != attr_value
+        end
+        return true
+      end
+      def get_attr_index(attr_label)
+        return @data_labels.index(attr_label)
+      end
+      def get_attr_value(data, attr_label)
+        return data[get_attr_index(attr_label)]
+      end
+      def build_rule(class_value, instances)
+        rule = {:class_value => class_value, :conditions => {}}
+        rule_instances = instances.collect {|data| data }
+        attributes = @data_labels[0...-1].collect {|label| label }
+        until(is_perfect(instances, rule) || attributes.empty?)
+          freq_table = build_freq_table(rule_instances, attributes, class_value)
+          condition = get_condition(freq_table)
+          rule[:conditions].merge!(condition)
+          rule_instances = rule_instances.select do |data|
+            matches_conditions(data, condition)
+          end
+        end
+        return rule
+      end
+      # Returns a structure with the folloring format:
+      # => {attr1_label => { :attr1_value1 => [p, t], attr1_value2 => [p, t], ... },
+      #     attr2_label => { :attr2_value1 => [p, t], attr2_value2 => [p, t], ... },
+      #     ...
+      #     }
+      # where p is the number of instances classified as class_value
+      # with that attribute value, and t is the total number of instances with
+      # that attribute value
+      def build_freq_table(rule_instances, attributes, class_value)
+        freq_table = Hash.new()
+        rule_instances.each do |data|
+          attributes.each do |attr_label|
+            attr_freqs = freq_table[attr_label] || Hash.new([0, 0])
+            pt = attr_freqs[get_attr_value(data, attr_label)]
+            pt = [(data.last == class_value) ? pt[0]+1 : pt[0], pt[1]+1]
+            attr_freqs[get_attr_value(data, attr_label)] = pt
+            freq_table[attr_label] = attr_freqs
+          end
+        end
+        return freq_table
+      end
+      # returns a single conditional term: {attrN_label => attrN_valueM}
+      # selecting the attribute with higher pt ratio
+      # (occurrences of attribute value classified as class_value /
+      #  occurrences of attribute value)
+      def get_condition(freq_table)
+        best_pt = [0, 0]
+        condition = nil
+        freq_table.each do |attr_label, attr_freqs|
+          attr_freqs.each do |attr_value, pt|
+            if(better_pt(pt, best_pt))
+              condition = { attr_label => attr_value }
+              best_pt = pt
+            end
+          end
+        end
+        return condition
+      end
+      # pt = [p, t]
+      # p = occurrences of attribute value with instance classified as class_value
+      # t = occurrences of attribute value
+      # a pt is better if:
+      #   1- its ratio is higher
+      #   2- its ratio is equal, and has a higher p
+      def better_pt(pt, best_pt)
+        return false if pt[1] == 0
+        return true if best_pt[1] == 0
+        a = pt[0]*best_pt[1]
+        b = best_pt[0]*pt[1]
+        return true if a>b || (a==b && pt[0]>best_pt[0])
+        return false
+      end
+      def join_terms(rule)
+        terms = []
+        rule[:conditions].each do |attr_label, attr_value|
+            terms << "#{attr_label} == '#{attr_value}'"
+        end
+        "#{terms.join(" and ")}"
+      end
+      def then_clause(rule)
+        "#{@data_labels.last} = '#{rule[:class_value]}'"
+      end
+    end
+  end
+end

data/lib/ai4r/classifiers/zero_r.rb ADDED

@@ -0,0 +1,104 @@
+# Author::    Sergio Fierens (Implementation only)
+# License::   MPL 1.1
+# Project::   ai4r
+# Url::       http://ai4r.rubyforge.org/
+#
+# You can redistribute it and/or modify it under the terms of
+# the Mozilla Public License version 1.1  as published by the
+# Mozilla Foundation at http://www.mozilla.org/MPL/MPL-1.1.txt
+require File.dirname(__FILE__) + '/classifier_helper'
+module Ai4r
+  module Classifiers
+    # = Introduction
+    #
+    # The idea behind the ZeroR classifier is to identify the
+    # the most common class value in the training set.
+    # It always returns that value when evaluating an instance.
+    # It is frequently used as a baseline for evaluating other machine learning
+    # algorithms.
+    class ZeroR
+      attr_accessor :data_labels, :class_value
+      include ClassifierHelper
+      # Build a new ZeroR classifier. If your data is classified with N attributed
+      # and M examples, then your data examples must have the following format:
+      #
+      #     [   [ATT1_VAL1, ATT2_VAL1, ATT3_VAL1, ... , ATTN_VAL1,  CLASS_VAL1],
+      #         [ATT1_VAL2, ATT2_VAL2, ATT3_VAL2, ... , ATTN_VAL2,  CLASS_VAL2],
+      #         ...
+      #         [ATTM1_VALM, ATT2_VALM, ATT3_VALM, ... , ATTN_VALM, CLASS_VALM],
+      #     ]
+      #
+      # e.g.
+      #     [   ['New York',  '<30',      'M', 'Y'],
+      #          ['Chicago',     '<30',      'M', 'Y'],
+      #          ['Chicago',     '<30',      'F', 'Y'],
+      #          ['New York',  '<30',      'M', 'Y'],
+      #          ['New York',  '<30',      'M', 'Y'],
+      #          ['Chicago',     '[30-50)',  'M', 'Y'],
+      #          ['New York',  '[30-50)',  'F', 'N'],
+      #          ['Chicago',     '[30-50)',  'F', 'Y'],
+      #          ['New York',  '[30-50)',  'F', 'N'],
+      #          ['Chicago',     '[50-80]', 'M', 'N'],
+      #          ['New York',  '[50-80]', 'F', 'N'],
+      #          ['New York',  '[50-80]', 'M', 'N'],
+      #          ['Chicago',     '[50-80]', 'M', 'N'],
+      #          ['New York',  '[50-80]', 'F', 'N'],
+      #          ['Chicago',     '>80',      'F', 'Y']
+      #        ]
+      #
+      # Data labels must have the following format:
+      #     [ 'city', 'age_range', 'gender', 'marketing_target'  ]
+      #
+      # If you do not provide labels for you data, the following labels will
+      # be created by default:
+      #     [ 'attribute_1', 'attribute_2', 'attribute_3', 'class_value'  ]
+      #
+      def build(data_examples, data_labels=nil)
+        check_data_examples(data_examples)
+        @data_labels = (data_labels) ? data_labels : default_data_labels(data_examples)
+        frequence = {}
+        max_freq = 0
+        @class_value
+        data_examples.each do |example|
+          class_value = example.last
+          class_frequency = frequence[class_value]
+          class_frequency = (class_frequency) ? class_frequency+1 : 1
+          if max_freq < class_frequency
+            max_freq = class_frequency
+            @class_value = class_value
+          end
+        end
+        return self
+      end
+      # You can evaluate new data, predicting its class.
+      # e.g.
+      #   classifier.eval(['New York',  '<30', 'F'])  # => 'Y'
+      def eval(data)
+        @class_value
+      end
+      # This method returns the generated rules in ruby code.
+      # e.g.
+      #
+      #   classifier.to_s
+      #     # =>  marketing_target='Y'
+      #
+      # It is a nice way to inspect induction results, and also to execute them:
+      #     marketing_target = nil
+      #     eval classifier.to_s
+      #     puts marketing_target
+      #       # =>  'Y'
+      def to_s
+        return "#{@data_labels.last} = '#{@class_value}'"
+      end
+    end
+  end
+end