RubyGems - treat - Versions diffs - 2.0.3 → 2.0.4 - Mend

treat 2.0.3 → 2.0.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (36)

data/lib/treat/config/data/languages/agnostic.rb +6 -3
data/lib/treat/config/data/languages/english.rb +1 -1
data/lib/treat/config/data/workers/extractors.rb +8 -0
data/lib/treat/loaders/stanford.rb +2 -0
data/lib/treat/version.rb +1 -1
data/lib/treat/workers/extractors/distance/levenshtein.rb +35 -0
data/lib/treat/workers/extractors/name_tag/stanford.rb +4 -1
data/lib/treat/workers/extractors/similarity/jaro_winkler.rb +38 -0
data/lib/treat/workers/extractors/similarity/tf_idf.rb +19 -3
data/lib/treat/workers/extractors/time/chronic.rb +6 -41
data/lib/treat/workers/extractors/time/kronic.rb +20 -0
data/lib/treat/workers/extractors/time/nickel.rb +0 -15
data/lib/treat/workers/extractors/time/ruby.rb +2 -33
data/lib/treat/workers/lexicalizers/taggers/stanford.rb +11 -10
data/lib/treat/workers/processors/parsers/stanford.rb +60 -112
data/spec/entities/collection.rb +29 -25
data/spec/entities/document.rb +45 -44
data/spec/entities/entity.rb +295 -294
data/spec/entities/phrase.rb +21 -17
data/spec/entities/token.rb +43 -40
data/spec/entities/word.rb +5 -1
data/spec/entities/zone.rb +26 -22
data/spec/helper.rb +7 -2
data/spec/learning/data_set.rb +145 -141
data/spec/learning/export.rb +46 -42
data/spec/learning/problem.rb +114 -110
data/spec/learning/question.rb +46 -42
data/spec/treat.rb +41 -37
data/spec/workers/agnostic.rb +2 -2
data/spec/workers/english.rb +12 -12
metadata +7 -8
data/files/21552208.html +0 -786
data/files/nethttp-cheat-sheet-2940.html +0 -393
data/lib/treat/workers/extractors/similarity/levenshtein.rb +0 -36
data/spec/sandbox.rb +0 -294
data/spec/workers/examples/english/mathematicians/euler.html +0 -21

data/spec/learning/export.rb CHANGED Viewed

@@ -1,52 +1,56 @@
-describe Treat::Learning::Export do
+module Treat::Specs::Learning
-  describe "#initialize" do
-    context "when supplied with acceptable parameters" do
-      it "should give access to the parameters" do
-        export = Treat::Learning::Export.new(:name, 0, "->(e) { e }")
-        export.name.should eql :name
-        export.default.should eql 0
-        export.proc_string.should eql "->(e) { e }"
-        export.proc.should be_instance_of Proc
-        export.proc.call('x').should eql 'x'
+  describe Treat::Learning::Export do
+    describe "#initialize" do
+      context "when supplied with acceptable parameters" do
+        it "should give access to the parameters" do
+          export = Treat::Learning::Export.new(:name, 0, "->(e) { e }")
+          export.name.should eql :name
+          export.default.should eql 0
+          export.proc_string.should eql "->(e) { e }"
+          export.proc.should be_instance_of Proc
+          export.proc.call('x').should eql 'x'
+        end
       end
-    end
-    context "when supplied with wrong parameters" do
-      it "should raise an exception" do
-        # First argument should be a symbol representing the name of the export.
-        expect { Treat::Learning::Export.new(nil) }.to raise_error
-        # Third argument, if supplied, should be a string that
-        # evaluates to a proc (NOT a proc/lambda).
-        expect { Treat::Learning::Export.new(:name, 0, lambda { x } ) }.to raise_error
-        # Third argument should be proper ruby syntax.
-        expect { Treat::Learning::Export.new(:name, 0, "->(e) { ") }.to raise_error
-        # Third argument should evaluate to a proc.
-        expect { Treat::Learning::Export.new(:name, 0, "2") }.to raise_error
+      context "when supplied with wrong parameters" do
+        it "should raise an exception" do
+          # First argument should be a symbol representing the name of the export.
+          expect { Treat::Learning::Export.new(nil) }.to raise_error
+          # Third argument, if supplied, should be a string that
+          # evaluates to a proc (NOT a proc/lambda).
+          expect { Treat::Learning::Export.new(:name, 0, lambda { x } ) }.to raise_error
+          # Third argument should be proper ruby syntax.
+          expect { Treat::Learning::Export.new(:name, 0, "->(e) { ") }.to raise_error
+          # Third argument should evaluate to a proc.
+          expect { Treat::Learning::Export.new(:name, 0, "2") }.to raise_error
+        end
       end
     end
-  end
-  describe "#==(question)" do
-    context "when supplied with an equal question" do
-      it "should return true" do
-        Treat::Learning::Export.new(:name).
-        should == Treat::Learning::Export.new(:name)
-        Treat::Learning::Export.new(:name, 0).
-        should == Treat::Learning::Export.new(:name, 0)
-        Treat::Learning::Export.new(:name, 0, "->(e) { }").
-        should == Treat::Learning::Export.new(:name, 0, "->(e) { }")
+    describe "#==(question)" do
+      context "when supplied with an equal question" do
+        it "should return true" do
+          Treat::Learning::Export.new(:name).
+          should == Treat::Learning::Export.new(:name)
+          Treat::Learning::Export.new(:name, 0).
+          should == Treat::Learning::Export.new(:name, 0)
+          Treat::Learning::Export.new(:name, 0, "->(e) { }").
+          should == Treat::Learning::Export.new(:name, 0, "->(e) { }")
+        end
       end
-    end
-    context "when supplied with a different question" do
-      it "should return false" do
-        Treat::Learning::Export.new(:name).
-        should_not == Treat::Learning::Export.new(:name2)
-        Treat::Learning::Export.new(:name, 0).
-        should_not == Treat::Learning::Export.new(:name, 1)
-        Treat::Learning::Export.new(:name, 0, "->(e) { }").
-        should_not == Treat::Learning::Export.new(:name, 0, "->(e) { x }")
+      context "when supplied with a different question" do
+        it "should return false" do
+          Treat::Learning::Export.new(:name).
+          should_not == Treat::Learning::Export.new(:name2)
+          Treat::Learning::Export.new(:name, 0).
+          should_not == Treat::Learning::Export.new(:name, 1)
+          Treat::Learning::Export.new(:name, 0, "->(e) { }").
+          should_not == Treat::Learning::Export.new(:name, 0, "->(e) { x }")
+        end
       end
     end
   end
-end
+end

data/spec/learning/problem.rb CHANGED Viewed

@@ -1,144 +1,148 @@
-describe Treat::Learning::Problem do
+module Treat::Specs::Learning
-  before do
-    @question = Treat::Learning::Question.new(:is_key_sentence,
-    :sentence,  0, :continuous)
-    @feature = Treat::Learning::Feature.new(:word_count, 0)
-    @tag = Treat::Learning::Tag.new(:paragraph_length, 0,
-    "->(e) { e.parent_paragraph.word_count }")
-    @paragraph = Treat::Entities::Paragraph.new(
-    "Ranga and I went to the store. Meanwhile, Ryan was sleeping.")
-    @paragraph.do :segment, :tokenize
-    @sentence = @paragraph.sentences[0]
-    @hash = {"question"=>{"name"=>:is_key_sentence, "target"=>:sentence,
-    "type"=>:continuous, "default"=>0}, "features"=>[
-    {"proc_string"=>nil, "default"=>0, "name"=>:word_count, "proc"=>nil}],
-    "tags"=>[{"proc_string"=>"->(e) { e.parent_paragraph.word_count }",
-    "default"=>0, "name"=>:paragraph_length, "proc"=>nil}], "id"=>0}
-  end
+  describe Treat::Learning::Problem do
-  describe "#initialize" do
-    context "when supplied with proper arguments" do
-      it "initializes the problem and gives access to parameters" do
-        problem = Treat::Learning::Problem.new(@question, @feature, @tag)
-        problem.question.should eql @question
-        problem.features.should eql [@feature]
-        problem.tags.should eql [@tag]
-        problem.feature_labels.should eql [@feature.name]
-        problem.tag_labels.should eql [@tag.name]
-        # ID ???      FIXME
-      end
+    before do
+      @question = Treat::Learning::Question.new(:is_key_sentence,
+      :sentence,  0, :continuous)
+      @feature = Treat::Learning::Feature.new(:word_count, 0)
+      @tag = Treat::Learning::Tag.new(:paragraph_length, 0,
+      "->(e) { e.parent_paragraph.word_count }")
+      @paragraph = Treat::Entities::Paragraph.new(
+      "Ranga and I went to the store. Meanwhile, Ryan was sleeping.")
+      @paragraph.apply :segment, :tokenize
+      @sentence = @paragraph.sentences[0]
+      @hash = {"question"=>{"name"=>:is_key_sentence, "target"=>:sentence,
+      "type"=>:continuous, "default"=>0}, "features"=>[
+      {"proc_string"=>nil, "default"=>0, "name"=>:word_count, "proc"=>nil}],
+      "tags"=>[{"proc_string"=>"->(e) { e.parent_paragraph.word_count }",
+      "default"=>0, "name"=>:paragraph_length, "proc"=>nil}], "id"=>0}
     end
-    context "when supplied with unacceptable arguments" do
-      it "raises an error" do
-        # First argument should be instance of Question.
-        expect { Treat::Learning::Problem.new('foo') }.to raise_error
-        # Arguments >= 2 should be instances of Export.
-        expect { Treat::Learning::Problem.new(@question, 'foo') }.to raise_error
-        # Should have at least one Feature in the arguments.
-        expect { Treat::Learning::Problem.new(@question, @tag) }.to raise_error
+    describe "#initialize" do
+      context "when supplied with proper arguments" do
+        it "initializes the problem and gives access to parameters" do
+          problem = Treat::Learning::Problem.new(@question, @feature, @tag)
+          problem.question.should eql @question
+          problem.features.should eql [@feature]
+          problem.tags.should eql [@tag]
+          problem.feature_labels.should eql [@feature.name]
+          problem.tag_labels.should eql [@tag.name]
+          # ID ???      FIXME
+        end
+      end
+      context "when supplied with unacceptable arguments" do
+        it "raises an error" do
+          # First argument should be instance of Question.
+          expect { Treat::Learning::Problem.new('foo') }.to raise_error
+          # Arguments >= 2 should be instances of Export.
+          expect { Treat::Learning::Problem.new(@question, 'foo') }.to raise_error
+          # Should have at least one Feature in the arguments.
+          expect { Treat::Learning::Problem.new(@question, @tag) }.to raise_error
+        end
       end
     end
-  end
-  describe "#==(problem)" do
-    context "when supplied with an equal problem" do
-      it "should return true" do
-        Treat::Learning::Problem.new(@question, @feature).
-        should == Treat::Learning::Problem.new(@question, @feature)
-        Treat::Learning::Problem.new(@question, @feature, @tag).
-        should == Treat::Learning::Problem.new(@question, @feature, @tag)
+    describe "#==(problem)" do
+      context "when supplied with an equal problem" do
+        it "should return true" do
+          Treat::Learning::Problem.new(@question, @feature).
+          should == Treat::Learning::Problem.new(@question, @feature)
+          Treat::Learning::Problem.new(@question, @feature, @tag).
+          should == Treat::Learning::Problem.new(@question, @feature, @tag)
+        end
       end
-    end
-    context "when supplied with a different question" do
-      it "should return false" do
-        question = Treat::Learning::Question.new(:is_key_sentence, :sentence)
-        feature = Treat::Learning::Feature.new(:word_count, 999)
-        tag = Treat::Learning::Tag.new(:paragraph_length, 999)
-        Treat::Learning::Problem.new(@question, @feature).
-        should_not == Treat::Learning::Problem.new(question, @feature)
-        Treat::Learning::Problem.new(@question, @feature).
-        should_not == Treat::Learning::Problem.new(@question, feature)
-        Treat::Learning::Problem.new(@question, @feature, @tag).
-        should_not == Treat::Learning::Problem.new(@question, @feature, tag)
+      context "when supplied with a different question" do
+        it "should return false" do
+          question = Treat::Learning::Question.new(:is_key_sentence, :sentence)
+          feature = Treat::Learning::Feature.new(:word_count, 999)
+          tag = Treat::Learning::Tag.new(:paragraph_length, 999)
+          Treat::Learning::Problem.new(@question, @feature).
+          should_not == Treat::Learning::Problem.new(question, @feature)
+          Treat::Learning::Problem.new(@question, @feature).
+          should_not == Treat::Learning::Problem.new(@question, feature)
+          Treat::Learning::Problem.new(@question, @feature, @tag).
+          should_not == Treat::Learning::Problem.new(@question, @feature, tag)
+        end
       end
     end
-  end
-  describe "#export_tags(entity)" do
-    context "when called on a problem that has tags" do
-      context "and called with an entity of the proper type" do
-        it "returns an array of the tags" do
-          problem = Treat::Learning::Problem.new(@question, @feature, @tag)
-          problem.export_tags(@sentence).should eql [11]
+    describe "#export_tags(entity)" do
+      context "when called on a problem that has tags" do
+        context "and called with an entity of the proper type" do
+          it "returns an array of the tags" do
+            problem = Treat::Learning::Problem.new(@question, @feature, @tag)
+            problem.export_tags(@sentence).should eql [11]
+          end
         end
       end
-    end
-    context "when called on a problem that doesn't have tags" do
-      it "raises an error" do
-        problem = Treat::Learning::Problem.new(@question, @feature)
-        expect { problem.export_tags(@sentence) }.to raise_error
+      context "when called on a problem that doesn't have tags" do
+        it "raises an error" do
+          problem = Treat::Learning::Problem.new(@question, @feature)
+          expect { problem.export_tags(@sentence) }.to raise_error
+        end
       end
     end
-  end
-  describe "#export_features(entity, include_answer = true)" do
+    describe "#export_features(entity, include_answer = true)" do
-    context "when called with an entity of the proper type" do
-      context "and include_answer is set to true" do
-        context "and the answer is already set on the entity" do
-          it "returns an array of the exported features, with the answer" do
-            problem = Treat::Learning::Problem.new(@question, @feature)
-            @sentence.set :is_key_sentence, 1
-            problem.export_features(@sentence).should eql [7, 1]
+      context "when called with an entity of the proper type" do
+        context "and include_answer is set to true" do
+          context "and the answer is already set on the entity" do
+            it "returns an array of the exported features, with the answer" do
+              problem = Treat::Learning::Problem.new(@question, @feature)
+              @sentence.set :is_key_sentence, 1
+              problem.export_features(@sentence).should eql [7, 1]
+            end
+          end
+          context "and the answer is not already set on the entity" do
+            it "returns an array of the exported features, with the question's default answer" do
+              problem = Treat::Learning::Problem.new(@question, @feature)
+              problem.export_features(@sentence).should eql [7, @question.default]
+            end
           end
         end
-        context "and the answer is not already set on the entity" do
-          it "returns an array of the exported features, with the question's default answer" do
+        context "and include_answer is set to false" do
+          it "returns an array of the exported features, without the answer" do
             problem = Treat::Learning::Problem.new(@question, @feature)
-            problem.export_features(@sentence).should eql [7, @question.default]
+            problem.export_features(@sentence, false).should eql [7]
           end
         end
       end
-      context "and include_answer is set to false" do
-        it "returns an array of the exported features, without the answer" do
+      context "when supplied with an entity that is not of the proper type" do
+        it "raises an error" do
           problem = Treat::Learning::Problem.new(@question, @feature)
-          problem.export_features(@sentence, false).should eql [7]
+          word = Treat::Entities::Word.new('test')
+          expect { problem.export_features(word) }.to raise_error
         end
       end
     end
-    context "when supplied with an entity that is not of the proper type" do
-      it "raises an error" do
-        problem = Treat::Learning::Problem.new(@question, @feature)
-        word = Treat::Entities::Word.new('test')
-        expect { problem.export_features(word) }.to raise_error
-      end
-    end
-  end
-  describe "#to_hash" do
-    context "when called on a problem" do
-      it "returns a hash describing the problem" do
-        Treat::Learning::Problem.new(@question, @feature, @tag).
-        to_hash.tap { |e| e['id'] = 0 }.should eql @hash
+    describe "#to_hash" do
+      context "when called on a problem" do
+        it "returns a hash describing the problem" do
+          Treat::Learning::Problem.new(@question, @feature, @tag).
+          to_hash.tap { |e| e['id'] = 0 }.should eql @hash
+        end
       end
     end
-  end
-  describe "#self.from_hash" do
-    context "when called with a hash describing a problem" do
-      it "returns a problem based on the hash" do
-        problem = Treat::Learning::Problem.from_hash(@hash)
-        problem.question.name.should eql :is_key_sentence
-        problem.question.target.should eql :sentence
-        problem.question.type.should eql :continuous
-        problem.question.default.should eql 0
-        problem.features[0].proc_string.should eql nil
-        problem.features[0].default.should eql 0
-        problem.features[0].name.should eql :word_count
-        problem.features[0].proc.should eql nil
+    describe "#self.from_hash" do
+      context "when called with a hash describing a problem" do
+        it "returns a problem based on the hash" do
+          problem = Treat::Learning::Problem.from_hash(@hash)
+          problem.question.name.should eql :is_key_sentence
+          problem.question.target.should eql :sentence
+          problem.question.type.should eql :continuous
+          problem.question.default.should eql 0
+          problem.features[0].proc_string.should eql nil
+          problem.features[0].default.should eql 0
+          problem.features[0].name.should eql :word_count
+          problem.features[0].proc.should eql nil
+        end
       end
     end
   end
-end
+end

data/spec/learning/question.rb CHANGED Viewed

@@ -1,52 +1,56 @@
-describe Treat::Learning::Question do
+module Treat::Specs::Learning
-  describe "#initialize" do
-    context "when supplied with acceptable parameters" do
-      it "should give access to the parameters" do
-        question = Treat::Learning::Question.new(
-        :is_keyword, :word, 0, :continuous)
-        question.name.should eql :is_keyword
-        question.target.should eql :word
-        question.type.should eql :continuous
-        question.default.should eql 0
+  describe Treat::Learning::Question do
+    describe "#initialize" do
+      context "when supplied with acceptable parameters" do
+        it "should give access to the parameters" do
+          question = Treat::Learning::Question.new(
+          :is_keyword, :word, 0, :continuous)
+          question.name.should eql :is_keyword
+          question.target.should eql :word
+          question.type.should eql :continuous
+          question.default.should eql 0
+        end
       end
-    end
-    context "when supplied with wrong parameters" do
-      it "should raise an exception" do
-        # Name should be a symbol
-        expect { Treat::Learning::Question.new(
-        nil, :sentence) }.to raise_error
-        # Target should be an actual entity type
-        expect { Treat::Learning::Question.new(
-        :name, :foo) }.to raise_error
-        # Distribution type should be continuous or discrete
-        expect { Treat::Learning::Question.new(
-        :name, :sentence, 0, :nonsense) }.to raise_error
+      context "when supplied with wrong parameters" do
+        it "should raise an exception" do
+          # Name should be a symbol
+          expect { Treat::Learning::Question.new(
+          nil, :sentence) }.to raise_error
+          # Target should be an actual entity type
+          expect { Treat::Learning::Question.new(
+          :name, :foo) }.to raise_error
+          # Distribution type should be continuous or discrete
+          expect { Treat::Learning::Question.new(
+          :name, :sentence, 0, :nonsense) }.to raise_error
+        end
       end
     end
-  end
-  describe "#==(question)" do
-    context "when supplied with an equal question" do
-      it "should return true" do
-        Treat::Learning::Question.new(
-        :is_keyword, :word).
-        should == Treat::Learning::Question.new(
-        :is_keyword, :word)
+    describe "#==(question)" do
+      context "when supplied with an equal question" do
+        it "should return true" do
+          Treat::Learning::Question.new(
+          :is_keyword, :word).
+          should == Treat::Learning::Question.new(
+          :is_keyword, :word)
+        end
       end
-    end
-    context "when supplied with a different question" do
-      it "should return false" do
-        Treat::Learning::Question.new(
-        :is_keyword, :word).
-        should_not == Treat::Learning::Question.new(
-        :is_keyword, :sentence)
-        Treat::Learning::Question.new(
-        :is_keyword, :word, 0, :continuous).
-        should_not == Treat::Learning::Question.new(
-        :is_keyword, :word, 0, :discrete)
+      context "when supplied with a different question" do
+        it "should return false" do
+          Treat::Learning::Question.new(
+          :is_keyword, :word).
+          should_not == Treat::Learning::Question.new(
+          :is_keyword, :sentence)
+          Treat::Learning::Question.new(
+          :is_keyword, :word, 0, :continuous).
+          should_not == Treat::Learning::Question.new(
+          :is_keyword, :word, 0, :discrete)
+        end
       end
     end
   end
-end
+end