RubyGems - wikipedia-vandalism_detection - Versions diffs - 0.0.1 - Mend

wikipedia-vandalism_detection 0.0.1

Files changed (247) hide show

data/spec/vandalism_detection/diff_spec.rb ADDED

@@ -0,0 +1,40 @@
+require 'spec_helper'
+describe Wikipedia::VandalismDetection::Diff do
+  it "can deal with invalid byte sequences" do
+    text = "text \255".force_encoding('UTF-8')
+    expect { Wikipedia::VandalismDetection::Diff.new("#{text} a", "#{text} b") }.not_to raise_error
+  end
+  before do
+    @old_text =  Wikipedia::VandalismDetection::Text.new "hello\nworld\nmy name is Luke\n"
+    @new_text =  Wikipedia::VandalismDetection::Text.new "world\nhello\nmy name is Mr. Skywalker\n"
+    @diff =  Wikipedia::VandalismDetection::Diff.new(@old_text, @new_text)
+  end
+  describe "getting the inserted and removed words" do
+    it "can return the added words as array" do
+      inserted_words = @diff.inserted_words
+      expect(inserted_words).to be_an Array
+      expect(inserted_words.count).to eq 3
+    end
+    it "can return the removed words as array" do
+      removed_words = @diff.removed_words
+      expect(removed_words).to be_an Array
+      expect(removed_words.count).to eq 2
+    end
+    it "returns the right inserted words" do
+      expect(@diff.inserted_words).to eq ['hello', 'Mr.', 'Skywalker']
+    end
+    it "returns the right removed words" do
+      expect(@diff.removed_words).to eq ['hello', 'Luke']
+    end
+  end
+end

data/spec/vandalism_detection/edit_spec.rb ADDED

@@ -0,0 +1,137 @@
+require 'spec_helper'
+describe Wikipedia::VandalismDetection::Edit do
+  before do
+    @old_revision = build :old_revision
+    @new_revision = build :new_revision
+    @page_id = '1234'
+    @edit = Wikipedia::VandalismDetection::Edit.new(@old_revision, @new_revision)
+  end
+  it "has an old revision" do
+    expect(@edit.old_revision).to eq @old_revision
+  end
+  it "has a new revision" do
+    expect(@edit.new_revision).to eq @new_revision
+  end
+  it "can be build with its parent page referenced" do
+    page = build(:page, id: '1234', title: 'Page Title')
+    edit = Wikipedia::VandalismDetection::Edit.new(@old_revision, @new_revision, page: page)
+    expect(edit.page).to eq page
+  end
+  it "can be build with a page to get the id" do
+    page_id = '1234'
+    page = Wikipedia::VandalismDetection::Page.new
+    page.id = page_id
+    edit = Wikipedia::VandalismDetection::Edit.new(@old_revision, @new_revision, page: page)
+    expect(edit.page.id).to eq page_id
+  end
+  it "can be build with a page to get the title" do
+    page = Wikipedia::VandalismDetection::Page.new
+    page_title = 'Article'
+    page.title = page_title
+    edit = Wikipedia::VandalismDetection::Edit.new(@old_revision, @new_revision, page: page)
+    expect(edit.page.title).to eq page_title
+  end
+  describe "exception handling" do
+    it "does not raise an error if page parameters are called" do
+      edit = Wikipedia::VandalismDetection::Edit.new(@old_revision, @new_revision)
+      expect { edit.page.id }.not_to raise_error
+    end
+    it "raises no error if revisions are not sequent" do
+      expect { Wikipedia::VandalismDetection::Edit.new(@old_revision, @new_revision) }.not_to raise_error
+    end
+    it "raises an error if revisions are not sequent" do
+      expect { Wikipedia::VandalismDetection::Edit.new(@new_revision, @old_revision) }.to raise_exception ArgumentError
+    end
+  end
+  describe "#serialize" do
+    it "serializes the given parameters into a string" do
+      expect(@edit.serialize(:id, :text)).to eq "1,text 1\t2,text 2"
+    end
+  end
+  describe "#inserted_words" do
+    it "returns the inserted words as array" do
+      old_revision = build(:old_revision, text: "")
+      new_revision = build(:new_revision, text: "inserted words")
+      edit = build(:edit, old_revision: old_revision, new_revision: new_revision)
+      expect(edit.inserted_words).to eq ['inserted', 'words']
+    end
+    it "returns the uncleaned text inserted words as array" do
+      old_revision = build(:old_revision, text: "")
+      new_revision = build(:new_revision, text: "[[inserted words]]")
+      edit = build(:edit, old_revision: old_revision, new_revision: new_revision)
+      expect(edit.inserted_words).to eq ['[[inserted', 'words]]']
+    end
+  end
+  describe "#inserted_text" do
+    it "returns the inserted text as Wikipedia::VandalismDetection::Text" do
+      old_revision = build(:old_revision, text: "")
+      new_revision = build(:new_revision, text: "inserted words")
+      edit = build(:edit, old_revision: old_revision, new_revision: new_revision)
+      expect(edit.inserted_text).to eq Wikipedia::VandalismDetection::Text.new('inserted words')
+    end
+    it "returns the uncleaned text inserted text as Wikipedia::VadalismDetection::Text" do
+      old_revision = build(:old_revision, text: "")
+      new_revision = build(:new_revision, text: "[[inserted words]]")
+      edit = build(:edit, old_revision: old_revision, new_revision: new_revision)
+      expect(edit.inserted_text).to eq Wikipedia::VandalismDetection::Text.new('[[inserted words]]')
+    end
+  end
+  describe "#removed_words" do
+    it "returns the removed words as array" do
+      old_revision = build(:old_revision, text: "removed words")
+      new_revision = build(:new_revision, text: "")
+      edit = build(:edit, old_revision: old_revision, new_revision: new_revision)
+      expect(edit.removed_words).to eq ['removed', 'words']
+    end
+    it "returns the uncleaned text rremoved words as array" do
+      old_revision = build(:old_revision, text: "[[removed words]]")
+      new_revision = build(:new_revision, text: "")
+      edit = build(:edit, old_revision: old_revision, new_revision: new_revision)
+      expect(edit.removed_words).to eq ['[[removed', 'words]]']
+    end
+  end
+  describe "#removed_text" do
+    it "returns the removed text as Wikipedia::VandalismDetection::Text" do
+      old_revision = build(:old_revision, text: "removed words")
+      new_revision = build(:new_revision, text: "")
+      edit = build(:edit, old_revision: old_revision, new_revision: new_revision)
+      expect(edit.removed_text).to eq Wikipedia::VandalismDetection::Text.new('removed words')
+    end
+    it "returns the uncleaned text removed text as Wikipedia::VadalismDetection::Text" do
+      old_revision = build(:old_revision, text: "[[removed words]]")
+      new_revision = build(:new_revision, text: "")
+      edit = build(:edit, old_revision: old_revision, new_revision: new_revision)
+      expect(edit.removed_text).to eq Wikipedia::VandalismDetection::Text.new('[[removed words]]')
+    end
+  end
+end

data/spec/vandalism_detection/evaluator_spec.rb ADDED

@@ -0,0 +1,671 @@
+require 'spec_helper'
+describe Wikipedia::VandalismDetection::Evaluator do
+  before do
+    use_test_configuration
+    @config = test_config
+    @training_arff_file = @config.training_output_arff_file
+    @test_arff_file = @config.test_output_arff_file
+    @build_dir = @config.output_base_directory
+    @test_classification_file = @config.test_output_classification_file
+  end
+  after do
+    # remove training arff file
+    if File.exists?(@training_arff_file)
+      File.delete(@training_arff_file)
+      FileUtils.rm_r(File.dirname @training_arff_file)
+    end
+    # remove test arff file
+    if File.exists?(@test_arff_file)
+      File.delete(@test_arff_file)
+      FileUtils.rm_r(File.dirname @test_arff_file)
+    end
+    # remove classification.txt
+    if File.exist?(@test_classification_file)
+      File.delete(@test_classification_file)
+      File.rm_r(File.dirname @test_classification_file)
+    end
+    # remove output base directory
+    if Dir.exists?(@build_dir)
+      FileUtils.rm_r(@build_dir)
+    end
+  end
+  describe "#initialize" do
+    it "raises an ArgumentError if classifier attr is not a Wikipedia::VandalismDetection::Classfier" do
+      expect { Wikipedia::VandalismDetection::Evaluator.new("") }.to raise_error ArgumentError
+    end
+    it "does not raise an error while appropriate initialization" do
+      classifier = Wikipedia::VandalismDetection::Classifier.new
+      expect { Wikipedia::VandalismDetection::Evaluator.new(classifier) }.not_to raise_error
+    end
+  end
+  before do
+    classifier = Wikipedia::VandalismDetection::Classifier.new
+    @evaluator = Wikipedia::VandalismDetection::Evaluator.new(classifier)
+  end
+  describe "#test_performance_curves" do
+    before do
+      @classification = {
+          :"1-2" => {
+              old_revision_id: 1,
+              new_revision_id: 2,
+              class: "R",
+              confidence: 0.0
+          },
+          :"2-3" => {
+              old_revision_id: 2,
+              new_revision_id: 3,
+              class: "R",
+              confidence: 0.3
+          },
+          :"3-4" => {
+              old_revision_id: 3,
+              new_revision_id: 4,
+              class: "V",
+              confidence: 0.8
+          },
+          :"4-5" => {
+              old_revision_id: 4,
+              new_revision_id: 5,
+              class: "V",
+              confidence: 1.0
+          }
+      }
+      # ground truth has one sample more to represent fall-out samples while feature calculation
+      # (e.g. redirects are not considered)
+      @ground_truth = {
+          :"0-1" => { # this is a sample that is not used!
+              old_revision_id: 0,
+              new_revision_id: 1,
+              class: "R"
+          },
+          :"1-2" => {
+              old_revision_id: 1,
+              new_revision_id: 2,
+              class: "R"
+          },
+          :"2-3" => {
+              old_revision_id: 2,
+              new_revision_id: 3,
+              class: "V"
+          },
+          :"3-4" => {
+              old_revision_id: 3,
+              new_revision_id: 4,
+              class: "R"
+          },
+          :"4-5" => {
+              old_revision_id: 4,
+              new_revision_id: 5,
+              class: "V"
+          }
+      }
+      @sample_count = 10
+      @curve_data = @evaluator.test_performance_curves(@ground_truth, @classification, @sample_count)
+    end
+    it "returns a Hash" do
+      expect(@curve_data).to be_a Hash
+    end
+    [:recalls, :precisions,:fp_rates, :tp_rates, :pr_auc, :roc_auc].each do |attribute|
+      it "returns a Hash including #{attribute}" do
+        expect(@curve_data).to have_key(attribute)
+      end
+    end
+    describe "#predictive_values" do
+      before do
+        @threshold = 0.5
+        @predictive_values = @evaluator.predictive_values(@ground_truth, @classification, @threshold)
+      end
+      it "returns a Hash" do
+        expect(@predictive_values).to be_a Hash
+      end
+      [
+          { threshold: 0.0, result: {tp: 2, fp: 2, tn: 0, fn: 0} },
+          { threshold: 0.3, result: {tp: 1, fp: 1, tn: 1, fn: 1} },
+          { threshold: 0.5, result: {tp: 1, fp: 1, tn: 1, fn: 1} },
+          { threshold: 0.8, result: {tp: 1, fp: 1, tn: 1, fn: 1} },
+          { threshold: 0.9, result: {tp: 1, fp: 0, tn: 2, fn: 1} },
+          { threshold: 1.0, result: {tp: 0, fp: 0, tn: 2, fn: 2} }
+      ].each do |values|
+        it "returns the right values for threshold #{values[:threshold]}" do
+          predictive_values = @evaluator.predictive_values(@ground_truth, @classification, values[:threshold])
+          expect(predictive_values).to eq values[:result]
+        end
+      end
+    end
+    describe "#sort_curve_values" do
+      before do
+        @x = [0.7, 0.4, 0.8, 0.4, 0.7]
+        @y = [0.6, 0.8, 0.2, 0.6, 0.6]
+        @x_sorted = [0.4, 0.4, 0.7, 0.8]
+        @y_sorted = [0.8, 0.6, 0.6, 0.2]
+      end
+      it "returns the unique sorted input values" do
+        hash = { x: @x_sorted, y: @y_sorted }
+        sorted = @evaluator.sort_curve_values(@x, @y)
+        expect(sorted).to eq hash
+      end
+      it "adds start values if given" do
+        start_values = { x: -1.0, y: -2.0 }
+        hash = { x: @x_sorted.unshift(start_values[:x]), y: @y_sorted.unshift(start_values[:y])}
+        sorted = @evaluator.sort_curve_values(@x, @y, start_values)
+        expect(sorted).to eq hash
+      end
+      it "adds x start value if only one value given" do
+        start_values = { x: -1.0 }
+        hash = { x: @x_sorted.unshift(start_values[:x]), y: @y_sorted.unshift(@y_sorted.first) }
+        sorted = @evaluator.sort_curve_values(@x, @y, start_values)
+        expect(sorted).to eq hash
+      end
+      it "adds y start value if only one value given" do
+        start_values = { y: -2.0 }
+        hash = { x: @x_sorted.unshift(@x_sorted.first), y: @y_sorted.unshift(start_values[:y]) }
+        sorted = @evaluator.sort_curve_values(@x, @y, start_values)
+        expect(sorted).to eq hash
+      end
+      it "adds end values if given" do
+        end_values = { x: -1.0, y: -2.0 }
+        hash = { x: @x_sorted.push(end_values[:x]), y: @y_sorted.push(end_values[:y]) }
+        sorted = @evaluator.sort_curve_values(@x, @y, nil, end_values)
+        expect(sorted).to eq hash
+      end
+      it "adds y end values if only one value is given" do
+        end_values = {y: -2.0 }
+        hash = { x: @x_sorted.push(@x_sorted.last), y: @y_sorted.push(end_values[:y]) }
+        sorted = @evaluator.sort_curve_values(@x, @y, nil, end_values)
+        expect(sorted).to eq hash
+      end
+      it "adds x end values if only one value is given" do
+        end_values = {x: -1.0 }
+        hash = { x: @x_sorted.push(end_values[:x]), y: @y_sorted.push(@y_sorted.last) }
+        sorted = @evaluator.sort_curve_values(@x, @y, nil, end_values)
+        expect(sorted).to eq hash
+      end
+    end
+    describe "#area_under_curve" do
+      before do
+        @pr_auc = @evaluator.area_under_curve(@curve_data[:precisions], @curve_data[:precisions])
+        @roc_auc = @evaluator.area_under_curve(@curve_data[:fp_rates], @curve_data[:tp_rates])
+      end
+      it "returns a numeric value for pr_auc" do
+        expect(@pr_auc).to be_a Numeric
+      end
+      it "returns a numeric value between 0.0 & 1.0 for pr_auc" do
+        is_between_zero_and_one = (@pr_auc >= 0.0 && @pr_auc <= 1.0)
+        expect(is_between_zero_and_one).to be true
+      end
+      it "returns a numeric value for roc_auc" do
+        expect(@roc_auc).to be_a Numeric
+      end
+      it "returns a numeric value between 0.0 & 1.0 for roc_auc" do
+        is_between_zero_and_one = @roc_auc >= 0.0 && @roc_auc <= 1.0
+        expect(is_between_zero_and_one).to be true
+      end
+      [
+          { x: [0.0, 0.2, 0.4, 0.6, 0.8, 1.0], y: [1.0, 0.8, 0.6, 0.4, 0.2, 0.0], auc: 0.5 }
+      ].each do |data|
+        it "returns the right values" do
+          x = data[:x]
+          y = data[:y]
+          auc = data[:auc]
+          expect(@evaluator.area_under_curve(x, y)).to eq auc
+        end
+      end
+    end
+  end
+  describe "#create_testcorpus_classification_file!" do
+    before do
+      @ground_truth = { # see resources file ground_truth.csv
+          :"0-1" => { # this is a sample that is not used!
+              old_revision_id: 0,
+              new_revision_id: 1,
+              class: "R"
+          },
+          :"307084144-326873205" => {
+              old_revision_id: 307084144,
+              new_revision_id: 326873205,
+              class: "R"
+          },
+          :"326471754-326978767" => {
+              old_revision_id: 326471754,
+              new_revision_id: 326978767,
+              class: "V"
+          },
+          :"328774035-328774110" => {
+              old_revision_id: 328774035,
+              new_revision_id: 328774110,
+              class: "R"
+          }
+      }
+    end
+    it "raises an argument error if ground_truth param is nil" do
+      expect { @evaluator.create_testcorpus_classification_file!(@test_classification_file, nil) }.to raise_error ArgumentError
+    end
+    it "creates a classification file in the base output directory" do
+      expect(File.exists?(@test_classification_file)).to be false
+      @evaluator.create_testcorpus_classification_file!(@test_classification_file, @ground_truth)
+      expect(File.exists?(@test_classification_file)).to be true
+    end
+    it "creates a file with an appropriate header" do
+      @evaluator.create_testcorpus_classification_file!(@test_classification_file, @ground_truth)
+      content = File.open(@test_classification_file, 'r')
+      features = Core::Parser.parse_ARFF(@test_arff_file).enumerate_attributes.to_a.map { |attr| attr.name.upcase }[0...-2]
+      proposed_header = ['OLDREVID', 'NEWREVID', 'C', 'CONF', *features]
+      header = content.lines.first.split(' ')
+      expect(header).to eq proposed_header
+    end
+    it "creates a file with an appropriate number of lines" do
+      @evaluator.create_testcorpus_classification_file!(@test_classification_file, @ground_truth)
+      content = File.open(@test_classification_file, 'r')
+      samples_count = Core::Parser.parse_ARFF(@test_arff_file).n_rows
+      lines = content.lines.to_a
+      lines.shift # remove header
+      expect(lines.count).to eq samples_count
+    end
+    it "has the short class names as class value" do
+      @evaluator.create_testcorpus_classification_file!(@test_classification_file, @ground_truth)
+      content = File.open(@test_classification_file, 'r')
+      lines = content.lines.to_a
+      lines.shift # remove header
+      short_classes = Wikipedia::VandalismDetection::Instances::CLASSES_SHORT
+      vandalism_index = Wikipedia::VandalismDetection::Instances::VANDALISM_CLASS_INDEX
+      regular_index = Wikipedia::VandalismDetection::Instances::REGULAR_CLASS_INDEX
+      missing_index = Wikipedia::VandalismDetection::Instances::NOT_KNOWN_INDEX
+      names = [short_classes[regular_index], short_classes[vandalism_index], short_classes[missing_index]]
+      lines.each do |line|
+        class_name = line.split[2]
+        expect(names).to include class_name
+      end
+    end
+  end
+  describe "#evaluate_testcorpus_classification" do
+    describe "exceptions" do
+      it "raises an GroundTruthFileNotConfiguredError unless a ground thruth file is configured" do
+        config = test_config
+        config.instance_variable_set :@test_corpus_ground_truth_file, nil
+        use_configuration(config)
+        classifier = Wikipedia::VandalismDetection::Classifier.new
+        evaluator = Wikipedia::VandalismDetection::Evaluator.new(classifier)
+        expect { evaluator.evaluate_testcorpus_classification }.to raise_error \
+          Wikipedia::VandalismDetection::GroundTruthFileNotConfiguredError
+      end
+      it "raises an GroundTruthFileNotFoundError unless the ground thruth file can be found" do
+        config = test_config
+        config.instance_variable_set :@test_corpus_ground_truth_file, 'false-file-name.txt'
+        use_configuration(config)
+        classifier = Wikipedia::VandalismDetection::Classifier.new
+        evaluator = Wikipedia::VandalismDetection::Evaluator.new(classifier)
+        expect { evaluator.evaluate_testcorpus_classification }.to raise_error \
+          Wikipedia::VandalismDetection::GroundTruthFileNotFoundError
+      end
+    end
+    it "returns a performance values Hash" do
+      performance_values = @evaluator.evaluate_testcorpus_classification(sample_count: @sample_count)
+      expect(performance_values).to be_a Hash
+    end
+    [ :fp_rates,
+      :tp_rates,
+      :precisions,
+      :recalls,
+      :pr_auc,
+      :roc_auc,
+      :total_precision,
+      :total_recall
+    ].each do |attr|
+      it "returns a performance values Hash with property'#{attr}'" do
+        performance_values = @evaluator.evaluate_testcorpus_classification(sample_count: @sample_count)
+        expect(performance_values[attr]).to_not be_nil
+      end
+    end
+    it "runs the classification file creation" do
+      expect(File.exists?(@test_classification_file)).to be false
+      @evaluator.evaluate_testcorpus_classification
+      expect(File.exists?(@test_classification_file)).to be true
+    end
+    it "overwrites the old classification file" do
+      config = test_config
+      config.instance_variable_set(:@features, ['comment length'])
+      use_configuration(config)
+      classifier = Wikipedia::VandalismDetection::Classifier.new
+      evaluator = Wikipedia::VandalismDetection::Evaluator.new(classifier)
+      evaluator.evaluate_testcorpus_classification
+      content_old = File.read(@test_classification_file)
+      config.instance_variable_set(:@features, ['anonymity'])
+      use_configuration(config)
+      classifier = Wikipedia::VandalismDetection::Classifier.new
+      evaluator = Wikipedia::VandalismDetection::Evaluator.new(classifier)
+      evaluator.evaluate_testcorpus_classification
+      content_new = File.read(@test_classification_file)
+      expect(content_old).to_not eq content_new
+    end
+  end
+  describe "#cross_validate" do
+    it "returns an evaluation object" do
+      evaluation = @evaluator.cross_validate
+      expect(evaluation.class).to eq Java::WekaClassifiers::Evaluation
+    end
+    it "can cross validates the classifier" do
+      expect { @evaluator.cross_validate }.not_to raise_error
+    end
+    it "can cross validates the classifier with equally distributed samples" do
+      expect { @evaluator.cross_validate(equally_distributed: true) }.not_to raise_error
+    end
+  end
+  describe "#curve_data" do
+    describe "all samples" do
+      before do
+        @data = @evaluator.curve_data
+      end
+      it "returns a Hash" do
+        expect(@data).to be_a Hash
+      end
+      it "includes precision curve data" do
+        expect(@data[:precision]).to be_an Array
+      end
+      it "includes recall curve data" do
+        expect(@data[:recall]).to be_an Array
+      end
+      it "includes area_under_prc data" do
+        expect(@data[:area_under_prc]).to be_a Numeric
+      end
+      it "has non-empty :precision Array contents" do
+        expect(@data[:precision]).to_not be_empty
+      end
+      it "has non-empty :recall Array contents" do
+        expect(@data[:recall]).to_not be_empty
+      end
+    end
+    describe "equally distributed samples" do
+      before do
+        @data = @evaluator.curve_data(equally_distributed: true)
+      end
+      it "returns a Hash" do
+        expect(@data).to be_a Hash
+      end
+      it "includes precision curve data" do
+        expect(@data[:precision]).to be_a Array
+      end
+      it "includes recall curve data" do
+        expect(@data[:recall]).to be_a Array
+      end
+      it "includes area_under_prc data" do
+        expect(@data[:area_under_prc]).to be_a Numeric
+      end
+      it "has non-empty :precision Array contents" do
+        expect(@data[:precision]).to_not be_empty
+      end
+      it "has non-empty :recall Array contents" do
+        expect(@data[:recall]).to_not be_empty
+      end
+    end
+  end
+  describe "#feature_analysis" do
+    it "returns a hash" do
+      analysis = @evaluator.feature_analysis(sample_count: 100)
+      expect(analysis).to be_a Hash
+    end
+    it "returns a hash with feature count size" do
+      analysis = @evaluator.feature_analysis(sample_count: 100)
+      expect(analysis.count).to eq @config.features.count
+    end
+    it "returns a hash with sample count number of data hashes" do
+      sample_count = 5
+      analysis = @evaluator.feature_analysis(sample_count: sample_count)
+      analysis.each do |key, threshold_hash|
+        expect(threshold_hash.count).to eq sample_count
+      end
+    end
+    it "returns the four predictive values in each features threshold hash" do
+      analysis = @evaluator.feature_analysis
+      threshold_hash = analysis[@config.features.first][0.0]
+      expect(threshold_hash).to have_key(:fp)
+      expect(threshold_hash).to have_key(:fn)
+      expect(threshold_hash).to have_key(:tp)
+      expect(threshold_hash).to have_key(:tn)
+    end
+  end
+  describe "#full_analysis" do
+    it "returns a hash" do
+      analysis = @evaluator.full_analysis(sample_count: 100)
+      expect(analysis).to be_a Hash
+    end
+    it "returns a hash with smaple count number of threshold hashes" do
+      sample_count = 5
+      analysis = @evaluator.full_analysis(sample_count: sample_count)
+      expect(analysis.count).to eq sample_count
+    end
+    it "returns the four predictive values in each features threshold hash" do
+      analysis = @evaluator.full_analysis
+      threshold_hash = analysis[0.0]
+      expect(threshold_hash).to have_key(:fp)
+      expect(threshold_hash).to have_key(:fn)
+      expect(threshold_hash).to have_key(:tp)
+      expect(threshold_hash).to have_key(:tn)
+    end
+  end
+  describe "#true_positive?" do
+    before do
+      @vandalism = Wikipedia::VandalismDetection::Instances::VANDALISM_SHORT
+      @regular = Wikipedia::VandalismDetection::Instances::REGULAR_SHORT
+      @threshold = 0.7
+    end
+    it "returns true if the given confidence is higher than a threshold regarding the ground truth 'V'" do
+      expect(Wikipedia::VandalismDetection::Evaluator.true_positive?(@vandalism, 0.8, @threshold)).to be true
+    end
+    it "returns false if the given confidence is lower than a threshold regarding the ground truth 'V'" do
+      expect(Wikipedia::VandalismDetection::Evaluator.true_positive?(@vandalism, 0.5, @threshold)).to be false
+    end
+    it "returns false for the same confidence and threshold if ground truth is 'V'" do
+      expect(Wikipedia::VandalismDetection::Evaluator.true_positive?(@vandalism, @threshold, @threshold)).to be false
+    end
+    it "returns false if the given confidence is higher than a threshold regarding the ground truth 'R'" do
+      expect( Wikipedia::VandalismDetection::Evaluator.true_positive?(@regular, 0.8, @threshold)).to be false
+    end
+    it "returns false if the given confidence is lower than a threshold regarding the ground truth 'R'" do
+      expect(Wikipedia::VandalismDetection::Evaluator.true_positive?(@regular, 0.5, @threshold)).to be false
+    end
+  end
+  describe "#true_negative?" do
+    before do
+      @vandalism = Wikipedia::VandalismDetection::Instances::VANDALISM_SHORT
+      @regular = Wikipedia::VandalismDetection::Instances::REGULAR_SHORT
+      @threshold = 0.7
+    end
+    it "returns true if the given confidence is lower than a threshold regarding the ground truth 'R'" do
+      expect(Wikipedia::VandalismDetection::Evaluator.true_negative?(@regular, 0.5, @threshold)).to be true
+    end
+    it "returns false if the given confidence is higher than a threshold regarding the ground truth 'R'" do
+      expect(Wikipedia::VandalismDetection::Evaluator.true_negative?(@regular, 0.8, @threshold)).to be false
+    end
+    it "returns false for the same confidence and threshold if ground truth is 'R'" do
+      expect(Wikipedia::VandalismDetection::Evaluator.true_negative?(@regular, @threshold, @threshold)).to be false
+    end
+    it "returns false if the given confidence is lower than a threshold regarding the ground truth 'V'" do
+      expect(Wikipedia::VandalismDetection::Evaluator.true_negative?(@vandalism, 0.5, @threshold)).to be false
+    end
+    it "returns false if the given confidence is higher than a threshold regarding the ground truth 'V'" do
+      expect(Wikipedia::VandalismDetection::Evaluator.true_negative?(@vandalism, 0.8, @threshold)).to be false
+    end
+  end
+  describe "#false_positive?" do
+    before do
+      @vandalism = Wikipedia::VandalismDetection::Instances::VANDALISM_SHORT
+      @regular = Wikipedia::VandalismDetection::Instances::REGULAR_SHORT
+      @threshold = 0.7
+    end
+    it "returns true if the given confidence is higher than a threshold regarding the ground truth 'R'" do
+      expect(Wikipedia::VandalismDetection::Evaluator.false_positive?(@regular, 0.8, @threshold)).to be true
+    end
+    it "returns false if the given confidence is lower than a threshold regarding the ground truth 'R'" do
+      expect(Wikipedia::VandalismDetection::Evaluator.false_positive?(@regular, 0.5, @threshold)).to be false
+    end
+    it "returns true for the same confidence and threshold if ground truth is 'R'" do
+      expect(Wikipedia::VandalismDetection::Evaluator.false_positive?(@regular, @threshold, @threshold)).to be true
+    end
+    it "returns false if the given confidence is higher than a threshold regarding the ground truth 'V'" do
+      expect(Wikipedia::VandalismDetection::Evaluator.false_positive?(@vandalism, 0.8, @threshold)).to be false
+    end
+    it "returns false if the given confidence is lower than a threshold regarding the ground truth 'V'" do
+      expect(Wikipedia::VandalismDetection::Evaluator.false_positive?(@vandalism, 0.5, @threshold)).to be false
+    end
+  end
+  describe "#false_negative?" do
+    before do
+      @vandalism = Wikipedia::VandalismDetection::Instances::VANDALISM_SHORT
+      @regular = Wikipedia::VandalismDetection::Instances::REGULAR_SHORT
+      @threshold = 0.7
+    end
+    it "returns true if the given confidence is lower than a threshold regarding the ground truth 'V'" do
+      expect(Wikipedia::VandalismDetection::Evaluator.false_negative?(@vandalism, 0.5, @threshold)).to be true
+    end
+    it "returns false if the given confidence is higher than a threshold regarding the ground truth 'V'" do
+      expect(Wikipedia::VandalismDetection::Evaluator.false_negative?(@vandalism, 0.8, @threshold)).to be false
+    end
+    it "returns true for the same confidence and threshold if ground truth is 'V'" do
+      expect(Wikipedia::VandalismDetection::Evaluator.false_negative?(@vandalism, @threshold, @threshold)).to be true
+    end
+    it "returns false if the given confidence is lower than a threshold regarding the ground truth 'R'" do
+      expect(Wikipedia::VandalismDetection::Evaluator.false_negative?(@regular, 0.5, @threshold)).to be false
+    end
+    it "returns false if the given confidence is higher than a threshold regarding the ground truth 'R'" do
+      expect(Wikipedia::VandalismDetection::Evaluator.false_negative?(@regular, 0.8, @threshold)).to be false
+    end
+  end
+end