RubyGems - ai4r - Versions diffs - 1.1 → 1.2 - Mend

ai4r 1.1 → 1.2

Files changed (140) hide show

data/README.rdoc +21 -20
data/examples/decision_trees/id3_example.rb +3 -2
data/examples/genetic_algorithm/genetic_algorithm_example.rb +6 -6
data/examples/neural_network/backpropagation_example.rb +2 -2
data/lib/ai4r/classifiers/classifier_helper.rb +54 -0
data/lib/ai4r/classifiers/id3.rb +356 -0
data/lib/ai4r/classifiers/one_r.rb +148 -0
data/lib/ai4r/classifiers/prism.rb +231 -0
data/lib/ai4r/classifiers/zero_r.rb +104 -0
data/lib/ai4r/genetic_algorithm/genetic_algorithm.rb +272 -0
data/lib/ai4r/neural_network/backpropagation.rb +271 -0
data/site/build/tmp/locationmap.xml +14 -14
data/site/build/tmp/output.xmap +23 -23
data/site/build/tmp/pluginlist2fetchbuild.xml +144 -144
data/site/build/tmp/plugins-1.xml +0 -11
data/site/build/tmp/plugins-2.xml +54 -0
data/site/build/tmp/projfilters.properties +41 -41
data/site/build/webapp/WEB-INF/logs/core.log +681 -788
data/site/build/webapp/WEB-INF/logs/error.log +281 -248
data/site/build/webapp/WEB-INF/logs/sitemap.log +1015 -0
data/site/src/documentation/content/xdocs/forum.html +9 -0
data/site/src/documentation/content/xdocs/geneticAlgorithms.xml +82 -68
data/site/src/documentation/content/xdocs/index.xml +47 -18
data/site/src/documentation/content/xdocs/machineLearning.xml +10 -9
data/site/src/documentation/content/xdocs/neuralNetworks.xml +60 -36
data/site/src/documentation/content/xdocs/site.xml +8 -5
data/site/src/documentation/content/xdocs/svn.xml +11 -1
data/site/src/documentation/resources/images/Thumbs.db +0 -0
data/site/src/documentation/resources/images/ai4r-logo.png +0 -0
data/site/src/documentation/resources/images/genetic_algorithms_example.png +0 -0
data/site/src/documentation/resources/images/jadeferret.png +0 -0
data/site/src/documentation/resources/images/neural_network_example.png +0 -0
data/site/src/documentation/resources/images/sub-dir/Thumbs.db +0 -0
data/site/src/documentation/skinconf.xml +18 -18
data/test/classifiers/id3_test.rb +206 -0
data/test/classifiers/one_r_test.rb +62 -0
data/test/classifiers/prism_test.rb +83 -0
data/test/classifiers/zero_r_test.rb +48 -0
data/test/genetic_algorithm/chromosome_test.rb +41 -38
data/test/genetic_algorithm/genetic_algorithm_test.rb +64 -61
data/test/neural_network/backpropagation_test.rb +20 -18
metadata +109 -199
data/lib/decision_tree/id3.rb +0 -354
data/lib/genetic_algorithm/genetic_algorithm.rb +0 -268
data/lib/neural_network/backpropagation.rb +0 -264
data/site/build/site/en/broken-links.xml +0 -2
data/site/build/site/en/downloads.html +0 -187
data/site/build/site/en/downloads.pdf +0 -151
data/site/build/site/en/geneticAlgorithms.html +0 -564
data/site/build/site/en/geneticAlgorithms.pdf +0 -911
data/site/build/site/en/images/ai4r-logo.png +0 -0
data/site/build/site/en/images/built-with-forrest-button.png +0 -0
data/site/build/site/en/images/c.png +0 -0
data/site/build/site/en/images/c_wbn.png +0 -0
data/site/build/site/en/images/c_wn.png +0 -0
data/site/build/site/en/images/ero.gif +0 -0
data/site/build/site/en/images/europe2.png +0 -0
data/site/build/site/en/images/europe3.png +0 -0
data/site/build/site/en/images/fitness.png +0 -0
data/site/build/site/en/images/instruction_arrow.png +0 -0
data/site/build/site/en/images/my_email.png +0 -0
data/site/build/site/en/images/rubyforge.png +0 -0
data/site/build/site/en/images/s.png +0 -0
data/site/build/site/en/images/s_wbn.png +0 -0
data/site/build/site/en/images/s_wn.png +0 -0
data/site/build/site/en/images/sigmoid.png +0 -0
data/site/build/site/en/images/t.png +0 -0
data/site/build/site/en/images/t_wbn.png +0 -0
data/site/build/site/en/images/t_wn.png +0 -0
data/site/build/site/en/index.html +0 -258
data/site/build/site/en/index.pdf +0 -306
data/site/build/site/en/linkmap.html +0 -231
data/site/build/site/en/linkmap.pdf +0 -94
data/site/build/site/en/locationmap.xml +0 -72
data/site/build/site/en/machineLearning.html +0 -325
data/site/build/site/en/machineLearning.pdf +0 -337
data/site/build/site/en/neuralNetworks.html +0 -446
data/site/build/site/en/neuralNetworks.pdf +0 -604
data/site/build/site/en/skin/CommonMessages_de.xml +0 -23
data/site/build/site/en/skin/CommonMessages_en_US.xml +0 -23
data/site/build/site/en/skin/CommonMessages_es.xml +0 -23
data/site/build/site/en/skin/CommonMessages_fr.xml +0 -23
data/site/build/site/en/skin/basic.css +0 -166
data/site/build/site/en/skin/breadcrumbs-optimized.js +0 -90
data/site/build/site/en/skin/breadcrumbs.js +0 -237
data/site/build/site/en/skin/fontsize.js +0 -166
data/site/build/site/en/skin/getBlank.js +0 -40
data/site/build/site/en/skin/getMenu.js +0 -45
data/site/build/site/en/skin/images/README.txt +0 -1
data/site/build/site/en/skin/images/add.jpg +0 -0
data/site/build/site/en/skin/images/built-with-forrest-button.png +0 -0
data/site/build/site/en/skin/images/chapter.gif +0 -0
data/site/build/site/en/skin/images/chapter_open.gif +0 -0
data/site/build/site/en/skin/images/current.gif +0 -0
data/site/build/site/en/skin/images/error.png +0 -0
data/site/build/site/en/skin/images/external-link.gif +0 -0
data/site/build/site/en/skin/images/fix.jpg +0 -0
data/site/build/site/en/skin/images/forrest-credit-logo.png +0 -0
data/site/build/site/en/skin/images/hack.jpg +0 -0
data/site/build/site/en/skin/images/header_white_line.gif +0 -0
data/site/build/site/en/skin/images/info.png +0 -0
data/site/build/site/en/skin/images/instruction_arrow.png +0 -0
data/site/build/site/en/skin/images/label.gif +0 -0
data/site/build/site/en/skin/images/page.gif +0 -0
data/site/build/site/en/skin/images/pdfdoc.gif +0 -0
data/site/build/site/en/skin/images/poddoc.png +0 -0
data/site/build/site/en/skin/images/printer.gif +0 -0
data/site/build/site/en/skin/images/rc-b-l-15-1body-2menu-3menu.png +0 -0
data/site/build/site/en/skin/images/rc-b-r-15-1body-2menu-3menu.png +0 -0
data/site/build/site/en/skin/images/rc-b-r-5-1header-2tab-selected-3tab-selected.png +0 -0
data/site/build/site/en/skin/images/rc-t-l-5-1header-2searchbox-3searchbox.png +0 -0
data/site/build/site/en/skin/images/rc-t-l-5-1header-2tab-selected-3tab-selected.png +0 -0
data/site/build/site/en/skin/images/rc-t-l-5-1header-2tab-unselected-3tab-unselected.png +0 -0
data/site/build/site/en/skin/images/rc-t-r-15-1body-2menu-3menu.png +0 -0
data/site/build/site/en/skin/images/rc-t-r-5-1header-2searchbox-3searchbox.png +0 -0
data/site/build/site/en/skin/images/rc-t-r-5-1header-2tab-selected-3tab-selected.png +0 -0
data/site/build/site/en/skin/images/rc-t-r-5-1header-2tab-unselected-3tab-unselected.png +0 -0
data/site/build/site/en/skin/images/remove.jpg +0 -0
data/site/build/site/en/skin/images/rss.png +0 -0
data/site/build/site/en/skin/images/spacer.gif +0 -0
data/site/build/site/en/skin/images/success.png +0 -0
data/site/build/site/en/skin/images/txtdoc.png +0 -0
data/site/build/site/en/skin/images/update.jpg +0 -0
data/site/build/site/en/skin/images/valid-html401.png +0 -0
data/site/build/site/en/skin/images/vcss.png +0 -0
data/site/build/site/en/skin/images/warning.png +0 -0
data/site/build/site/en/skin/images/xmldoc.gif +0 -0
data/site/build/site/en/skin/menu.js +0 -48
data/site/build/site/en/skin/note.txt +0 -50
data/site/build/site/en/skin/print.css +0 -54
data/site/build/site/en/skin/profile.css +0 -163
data/site/build/site/en/skin/prototype.js +0 -1257
data/site/build/site/en/skin/screen.css +0 -587
data/site/build/site/en/svn.html +0 -223
data/site/build/site/en/svn.pdf +0 -239
data/site/build/site/en/wholesite.pdf +0 -1686
data/site/build/tmp/brokenlinks.xml +0 -2
data/site/build/tmp/cocoon-work/cache-dir/cocoon-ehcache-1.data +0 -0
data/site/build/tmp/cocoon-work/cache-dir/cocoon-ehcache-1.index +0 -0
data/test/decision_tree/id3_test.rb +0 -209

data/README.rdoc CHANGED

@@ -1,40 +1,41 @@
 = Introduction
-This project aims to produce ruby implementations of
-algorithms covering several Artificial intelligence fields, including:
+ AI4R is a collection of Ruby algorithm implementations covering several artificial intelligence fields,
+ together with simple practical examples that use them. It implements:
-* Machine Learning (DecisionTree::ID3)
-    Decision Trees using an implementation of ID3 algorithm.
-* Genetic algorithms (GeneticAlgorithm::GeneticSearch)
-    Implementation of GeneticSearch and Chromosome classes. The GeneticSearch is a generic class, and can be used to solved any kind of problems. The GeneticSearch class performs a stochastic search of the solution of a given problem.
-* Neural network (NeuralNetwork::Backpropagation)
-    Implementation of neural networks using the Backpropagation supervised learning technique.
+* Genetic algorithms (Ai4r::GeneticAlgorithm::GeneticSearch)
+* Neural networks (Ai4r::NeuralNetwork::Backpropagation)
+* ID3 Decision Trees (Ai4r::Classifiers::ID3)
-* Bayesian networks
+* PRISM (J. Cendrowska, 1987) (Ai4r::Classifiers::Prism)
+* OneR (AKA One Attribute Rule, 1R) (Ai4r::Classifiers::OneR)
-    TODO
+* ZeroR (Ai4r::Classifiers::ZeroR)
 = Where can I find the latest code and info on this project?
 http://ai4r.rubyforge.org
+http://ai4r.jadeferret.com
 = How to install
 1. Install the gem:
-    gem install http://rubyforge.org/frs/download.php/32923/ai4r-1.0.gem
+    gem install ai4r
 2. Include require statements in your code:
-    require "rubygems"
-    require "decision_tree/id3"
-    require "neural_network/backpropagation"
-    require "genetic_algorithm/genetic_algorithm"
+	require "rubygems"
+	require "ai4r/classifiers/id3"
+	require "ai4r/classifiers/prism"
+	require "ai4r/classifiers/one_r"
+	require "ai4r/classifiers/zero_r"
+	require "ai4r/neural_network/backpropagation"
+	require "ai4r/genetic_algorithm/genetic_algorithm"
 = Feedback

data/examples/decision_trees/id3_example.rb CHANGED

@@ -7,7 +7,8 @@
 # the Mozilla Public License version 1.1  as published by the
 # Mozilla Foundation at http://www.mozilla.org/MPL/MPL-1.1.txt
-require File.dirname(__FILE__) + '/../../lib/decision_tree/id3'
+#require File.dirname(__FILE__) + '/../../lib/decision_tree/id3'
+require File.dirname(__FILE__) + '/../../lib/ai4r/classifiers/id3'
 require 'csv'
 # Load data from data_set.csv
@@ -18,7 +19,7 @@ end
 data_labels = data_set.shift
 # Build ID3 tree
-id3 = DecisionTree::ID3.new(data_set, data_labels)
+id3 = Ai4r::Classifiers::ID3.new.build(data_set, data_labels)
 # Show rules
 puts "Discovered rules are:"

data/examples/genetic_algorithm/genetic_algorithm_example.rb CHANGED

@@ -7,7 +7,7 @@
 # the Mozilla Public License version 1.1  as published by the
 # Mozilla Foundation at http://www.mozilla.org/MPL/MPL-1.1.txt
-require File.dirname(__FILE__) + '/../../lib/genetic_algorithm/genetic_algorithm'
+require File.dirname(__FILE__) + '/../../lib/ai4r/genetic_algorithm/genetic_algorithm'
 require 'csv'
 # Load data from data_set.csv
@@ -20,18 +20,18 @@ data_set.collect! do |column|
   column.collect { |element| element.to_f}
 end
-GeneticAlgorithm::Chromosome.set_cost_matrix(data_set)
+Ai4r::GeneticAlgorithm::Chromosome.set_cost_matrix(data_set)
 puts "Some random selected tours costs: "
 3.times do
-  c = GeneticAlgorithm::Chromosome.seed
-  puts "COST #{c.fitness} TOUR: #{c.data.collect{ |c| data_labels[c]} * ', '}"
+  c = Ai4r::GeneticAlgorithm::Chromosome.seed
+  puts "COST #{-1 * c.fitness} TOUR: #{c.data.collect{ |c| data_labels[c]} * ', '}"
 end
 puts "Beginning genetic search, please wait... "
-search = GeneticAlgorithm::GeneticSearch.new(800, 100)
+search = Ai4r::GeneticAlgorithm::GeneticSearch.new(800, 100)
 result = search.run
-puts "BEST COST FOUND #{result.fitness} TOUR: #{result.data.collect{ |c| data_labels[c]} * ', '}"
+puts "BEST COST FOUND #{-1 * result.fitness} TOUR: #{result.data.collect{ |c| data_labels[c]} * ', '}"
  # $7611.99 TOUR: Moscow, Kiev, Warsaw, Hamburg, Berlin, Vienna, Munich, Milan, Rome, Barcelona, Madrid, Paris, Brussels, London, Dublin
  # $7659.81 TOUR: Moscow, Kiev, Warsaw, Vienna, Munich, Berlin, Hamburg, Brussels, Dublin, London, Paris, Milan, Rome, Barcelona, Madrid

data/examples/neural_network/backpropagation_example.rb CHANGED

@@ -10,12 +10,12 @@
 require File.dirname(__FILE__) + '/training_patterns'
 require File.dirname(__FILE__) + '/patterns_with_noise'
 require File.dirname(__FILE__) + '/patterns_with_base_noise'
-require File.dirname(__FILE__) + '/../../lib/neural_network/backpropagation'
+require File.dirname(__FILE__) + '/../../lib/ai4r/neural_network/backpropagation'
 require 'benchmark'
 times = Benchmark.measure do
-    net = NeuralNetwork::Backpropagation.new([256, 3])
+    net = Ai4r::NeuralNetwork::Backpropagation.new([256, 3])
     tr_input = TRIANGLE.flatten.collect { |input| input.to_f / 10}
     sq_input = SQUARE.flatten.collect { |input| input.to_f / 10}

data/lib/ai4r/classifiers/classifier_helper.rb ADDED

@@ -0,0 +1,54 @@
+require 'set'
+module Ai4r
+  module Classifiers
+    NUMERIC_CLASS_TYPE = 1
+    NOMINAL_CLASS_TYPE = 2
+    module ClassifierHelper
+      def default_data_labels(data_examples)
+        data_labels = []
+        data_examples[0][0..-2].each_index do |i|
+          data_labels[i] = "attribute_#{i+1}"
+        end
+        data_labels[data_labels.length]="class_value"
+        return data_labels
+      end
+      def check_data_examples(data_examples)
+        if !data_examples || data_examples.empty?
+          raise ArgumentError,"Examples data set must not be empty."
+        elsif !data_examples.first.is_a?(Array)
+          raise ArgumentError,"Unkown format for example data."
+        end
+      end
+      # Returns the number of attributes, including the class attribute
+      def num_attributes(data_examples)
+        return 0 if !data_examples || data_examples.empty? || !data_examples.first.is_a?(Array)
+        return data_examples.first.size
+      end
+      # Returns an array with the domain of each attribute (Set instance
+      # containing all possible values)
+      # Return example:
+      # => [#<Set: {"New York", "Chicago"}>,
+      #     #<Set: {"<30", "[30-50)", "[50-80]", ">80"}>,
+      #     #<Set: {"M", "F"}>,
+      #     #<Set: {"Y", "N"}>]
+      def build_domains(data_examples)
+        domains = Array.new(num_attributes(data_examples)) { Set.new }
+        data_examples.each do |data|
+          data.each_index {|attr_index| domains[attr_index] << data[attr_index]}
+        end
+        return domains
+      end
+    end
+  end
+end

data/lib/ai4r/classifiers/id3.rb ADDED

@@ -0,0 +1,356 @@
+# Author::    Sergio Fierens (Implementation, Quinlan is
+# the creator of the algorithm)
+# License::   MPL 1.1
+# Project::   ai4r
+# Url::       http://ai4r.rubyforge.org/
+#
+# You can redistribute it and/or modify it under the terms of
+# the Mozilla Public License version 1.1  as published by the
+# Mozilla Foundation at http://www.mozilla.org/MPL/MPL-1.1.txt
+require File.dirname(__FILE__) + '/classifier_helper'
+module Ai4r
+  module Classifiers
+    # = Introduction
+    # This is an implementation of the ID3 algorithm (Quinlan)
+    # Given a set of preclassified examples, it builds a decision tree by
+    # top-down induction, biased by the information gain and
+    # entropy measure.
+    #
+    # * http://en.wikipedia.org/wiki/Decision_tree
+    # * http://en.wikipedia.org/wiki/ID3_algorithm
+    #
+    # = How to use it
+    #
+    #   DATA_LABELS = [ 'city', 'age_range', 'gender', 'marketing_target'  ]
+    #
+    #   DATA_SET = [  ['New York',  '<30',      'M', 'Y'],
+    #            ['Chicago',     '<30',      'M', 'Y'],
+    #            ['Chicago',     '<30',      'F', 'Y'],
+    #            ['New York',  '<30',      'M', 'Y'],
+    #            ['New York',  '<30',      'M', 'Y'],
+    #            ['Chicago',     '[30-50)',  'M', 'Y'],
+    #            ['New York',  '[30-50)',  'F', 'N'],
+    #            ['Chicago',     '[30-50)',  'F', 'Y'],
+    #            ['New York',  '[30-50)',  'F', 'N'],
+    #            ['Chicago',     '[50-80]', 'M', 'N'],
+    #            ['New York',  '[50-80]', 'F', 'N'],
+    #            ['New York',  '[50-80]', 'M', 'N'],
+    #            ['Chicago',     '[50-80]', 'M', 'N'],
+    #            ['New York',  '[50-80]', 'F', 'N'],
+    #            ['Chicago',     '>80',      'F', 'Y']
+    #          ]
+    #
+    #   id3 = Ai4r::Classifiers::ID3.new.build(DATA_SET, DATA_LABELS)
+    #
+    #   id3.to_s
+    #     # =>  if age_range=='<30' then marketing_target='Y'
+    #           elsif age_range=='[30-50)' and city=='Chicago' then marketing_target='Y'
+    #           elsif age_range=='[30-50)' and city=='New York' then marketing_target='N'
+    #           elsif age_range=='[50-80]' then marketing_target='N'
+    #           elsif age_range=='>80' then marketing_target='Y'
+    #           else raise 'There was not enough information during training to do a proper induction for this data element' end
+    #
+    #   id3.eval(['New York', '<30', 'M'])
+    #     # =>  'Y'
+    #
+    # = A better way to load the data
+    #
+    # In real life you will use many more training examples, with more
+    # attributes. Consider moving your data to an external CSV
+    # (comma-separated values) file.
+    #
+    #   data_set = []
+    #   CSV::Reader.parse(File.open("#{File.dirname(__FILE__)}/data_set.csv", 'r')) do |row|
+    #     data_set << row
+    #   end
+    #   data_labels = data_set.shift
+    #
+    #   id3 = Ai4r::Classifiers::ID3.new.build(data_set, data_labels)
+    #
+    # = A nice tip for data evaluation
+    #
+    #   id3 = Ai4r::Classifiers::ID3.new.build(DATA_SET, DATA_LABELS)
+    #     age_range = '<30'
+    #     marketing_target = nil
+    #     eval id3.to_s
+    #     puts marketing_target
+    #       # =>  'Y'
+    # = More about ID3 and decision trees
+    #
+    # * http://en.wikipedia.org/wiki/Decision_tree
+    # * http://en.wikipedia.org/wiki/ID3_algorithm
+    #
+    # = About the project
+    # Author::    Sergio Fierens
+    # License::   MPL 1.1
+    class ID3
+      attr_reader :data_labels
+      include ClassifierHelper
+      # Create a new decision tree. If your data is classified with N attributes
+      # and M examples, then your data examples must have the following format:
+      #
+      #     [   [ATT1_VAL1, ATT2_VAL1, ATT3_VAL1, ... , ATTN_VAL1,  CATEGORY_VAL1],
+      #         [ATT1_VAL2, ATT2_VAL2, ATT3_VAL2, ... , ATTN_VAL2,  CATEGORY_VAL2],
+      #         ...
+      #         [ATT1_VALM, ATT2_VALM, ATT3_VALM, ... , ATTN_VALM,  CATEGORY_VALM],
+      #     ]
+      #
+      # e.g.
+      #     [   ['New York',  '<30',      'M', 'Y'],
+      #          ['Chicago',     '<30',      'M', 'Y'],
+      #          ['Chicago',     '<30',      'F', 'Y'],
+      #          ['New York',  '<30',      'M', 'Y'],
+      #          ['New York',  '<30',      'M', 'Y'],
+      #          ['Chicago',     '[30-50)',  'M', 'Y'],
+      #          ['New York',  '[30-50)',  'F', 'N'],
+      #          ['Chicago',     '[30-50)',  'F', 'Y'],
+      #          ['New York',  '[30-50)',  'F', 'N'],
+      #          ['Chicago',     '[50-80]', 'M', 'N'],
+      #          ['New York',  '[50-80]', 'F', 'N'],
+      #          ['New York',  '[50-80]', 'M', 'N'],
+      #          ['Chicago',     '[50-80]', 'M', 'N'],
+      #          ['New York',  '[50-80]', 'F', 'N'],
+      #          ['Chicago',     '>80',      'F', 'Y']
+      #        ]
+      #
+      # Data labels must have the following format:
+      #     [ 'city', 'age_range', 'gender', 'marketing_target'  ]
+      #
+      # If you do not provide labels for your data, the following labels will
+      # be created by default:
+      #     [ 'attribute_1', 'attribute_2', 'attribute_3', 'class_value'  ]
+      #
+      def build(data_examples, data_labels=nil)
+        check_data_examples(data_examples)
+        @data_labels = (data_labels) ? data_labels : default_data_labels(data_examples)
+        preprocess_data(data_examples)
+        return self
+      end
+      # You can evaluate new data, predicting its category.
+      # e.g.
+      #   id3.eval(['New York',  '<30', 'F'])  # => 'Y'
+      def eval(data)
+        @tree.value(data) if @tree
+      end
+      # This method returns the generated rules in ruby code.
+      # e.g.
+      #
+      #   id3.to_s
+      #     # =>  if age_range=='<30' then marketing_target='Y'
+      #           elsif age_range=='[30-50)' and city=='Chicago' then marketing_target='Y'
+      #           elsif age_range=='[30-50)' and city=='New York' then marketing_target='N'
+      #           elsif age_range=='[50-80]' then marketing_target='N'
+      #           elsif age_range=='>80' then marketing_target='Y'
+      #           else raise 'There was not enough information during training to do a proper induction for this data element' end
+      #
+      # It is a nice way to inspect induction results, and also to execute them:
+      #     age_range = '<30'
+      #     marketing_target = nil
+      #     eval id3.to_s
+      #     puts marketing_target
+      #       # =>  'Y'
+      def to_s
+        rules = @tree.get_rules
+        rules = rules.collect do |rule|
+            "#{rule[0..-2].join(' and ')} then #{rule.last}"
+        end
+        return "if #{rules.join("\nelsif ")}\nelse raise 'There was not enough information during training to do a proper induction for this data element' end"
+      end
+      private
+      def preprocess_data(data_examples)
+        @tree = build_node(data_examples)
+      end
+      private
+      def build_node(data_examples, flag_att = [])
+        return ErrorNode.new if data_examples.length == 0
+        domain = domain(data_examples)
+        return CategoryNode.new(@data_labels.last, domain.last[0]) if domain.last.length == 1
+        min_entropy_index = min_entropy_index(data_examples, domain, flag_att)
+        flag_att << min_entropy_index
+        split_data_examples = split_data_examples(data_examples, domain, min_entropy_index)
+        return CategoryNode.new(@data_labels.last, most_freq(data_examples, domain)) if split_data_examples.length == 1
+        nodes = split_data_examples.collect do |partial_data_examples|
+          build_node(partial_data_examples, flag_att)
+        end
+        return EvaluationNode.new(@data_labels, min_entropy_index, domain[min_entropy_index], nodes)
+      end
+      private
+      def self.sum(values)
+        values.inject( 0 ) { |sum,x| sum+x }
+      end
+      private
+      def self.log2(z)
+        return 0.0 if z == 0
+        Math.log(z)/LOG2
+      end
+      private
+      def most_freq(examples, domain)
+        freqs = []
+        domain.last.length.times { freqs << 0}
+        examples.each do |example|
+          cat_index = domain.last.index(example.last)
+          freq = freqs[cat_index] + 1
+          freqs[cat_index] = freq
+        end
+        max_freq = freqs.max
+        max_freq_index = freqs.index(max_freq)
+        domain.last[max_freq_index]
+      end
+      private
+      def split_data_examples(data_examples, domain, att_index)
+        data_examples_array = []
+        att_value_examples = {}
+        data_examples.each do |example|
+          example_set = att_value_examples[example[att_index]]
+          example_set = [] if !example_set
+          example_set << example
+          att_value_examples.store(example[att_index], example_set)
+        end
+        att_value_examples.each_pair do |att_value, example_set|
+           att_value_index = domain[att_index].index(att_value)
+           data_examples_array[att_value_index] = example_set
+        end
+        return data_examples_array
+      end
+      private
+      def min_entropy_index(data_examples, domain, flag_att=[])
+        min_entropy = nil
+        min_index = 0
+        domain[0..-2].each_index do |index|
+          freq_grid = freq_grid(index, data_examples, domain)
+          entropy = entropy(freq_grid, data_examples.length)
+          if (!min_entropy || entropy < min_entropy) && !flag_att.include?(index)
+            min_entropy = entropy
+            min_index = index
+          end
+        end
+        return min_index
+      end
+      private
+      def domain(data_examples)
+        #return build_domains(data_examples)
+        domain = []
+        @data_labels.length.times { domain << [] }
+        data_examples.each do |data|
+          data.each_index do |i|
+            domain[i] << data[i] if i<domain.length && !domain[i].include?(data[i])
+          end
+        end
+        return domain
+      end
+      private
+      def freq_grid(att_index, data_examples, domain)
+        #Initialize empty grid
+        grid_element = []
+        domain.last.length.times { grid_element << 0}
+        grid = []
+        domain[att_index].length.times { grid << grid_element.clone }
+        #Fill grid with frequencies
+        data_examples.each do |example|
+          att_val = example[att_index]
+          att_val_index = domain[att_index].index(att_val)
+          category = example.last
+          category_index = domain.last.index(category)
+          freq = grid[att_val_index][category_index] + 1
+          grid[att_val_index][category_index] = freq
+        end
+        return grid
+      end
+      private
+      def entropy(freq_grid, total_examples)
+        #Calc entropy of each element
+        entropy = 0
+        freq_grid.each do |att_freq|
+          att_total_freq = ID3.sum(att_freq)
+          partial_entropy = 0
+          if att_total_freq != 0
+            att_freq.each do |freq|
+              prop = freq.to_f/att_total_freq
+              partial_entropy += (-1*prop*ID3.log2(prop))
+            end
+          end
+          entropy += (att_total_freq.to_f/total_examples) * partial_entropy
+        end
+        return entropy
+      end
+      private
+      LOG2 = Math.log(2)
+    end
+    class EvaluationNode
+      attr_reader :index, :values, :nodes
+      def initialize(data_labels, index, values, nodes)
+        @index = index
+        @values = values
+        @nodes = nodes
+        @data_labels = data_labels
+      end
+      def value(data)
+        value = data[@index]
+        return rule_not_found if !@values.include?(value)
+        return nodes[@values.index(value)].value(data)
+      end
+      def get_rules
+        rule_set = []
+        @nodes.each_index do |child_node_index|
+          my_rule = "#{@data_labels[@index]}=='#{@values[child_node_index]}'"
+          child_node = @nodes[child_node_index]
+          child_node_rules = child_node.get_rules
+          child_node_rules.each do |child_rule|
+            child_rule.unshift(my_rule)
+          end
+          rule_set += child_node_rules
+        end
+        return rule_set
+      end
+    end
+    class CategoryNode
+      def initialize(label, value)
+        @label = label
+        @value = value
+      end
+      def value(data)
+        return @value
+      end
+      def get_rules
+        return [["#{@label}='#{@value}'"]]
+      end
+    end
+    class ErrorNode
+      def value(data)
+        raise "There was not enough information during training to do a proper induction for this data element."
+      end
+      def get_rules
+        return []
+      end
+    end
+  end
+end