nlp 0.2.6 → 0.2.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,9 +0,0 @@
1
- require 'rubygems'
2
- require 'test/unit'
3
-
4
- $LOAD_PATH.unshift(File.dirname(__FILE__))
5
- $LOAD_PATH.unshift(File.join(File.dirname(__FILE__), '..', 'lib'))
6
- require 'nlp'
7
-
8
- class Test::Unit::TestCase
9
- end
@@ -1,73 +0,0 @@
1
- require 'helper'
2
- require '../lib/lemmatizer.rb'
3
-
4
- class LemmatizerTest < Test::Unit::TestCase
5
-
6
- include NLP
7
-
8
- def setup
9
- @sample = "Złe czasy już minęły."
10
-
11
-
12
- @zle_word = Word.new('złe','zły','adj:pl:nom:m3:pos')
13
- @czasy_word = Word.new('czasy','czas','subst:pl:nom:m3')
14
- @minely_word = Word.new('minęły','minąć','praet:pl:m3:perf')
15
- @juz_word = Word.new('już','już','qub')
16
- @period = Token.new('.','interp')
17
-
18
- end
19
-
20
-
21
-
22
- def test_takipi_remote_lemmatizer
23
- text = Lemmatizer.lemmatize(@sample,:takipi,:remote)
24
- test_takipi_lemmatizer(text)
25
- end
26
-
27
-
28
- def test_takipi_local_lemmatizer
29
- text = Lemmatizer.lemmatize(@sample,:takipi,:local)
30
- test_takipi_lemmatizer(text)
31
- end
32
-
33
-
34
- def test_morfeusz_leamtizer
35
- text = Lemmatizer.lemmatize(@sample)
36
- assert_equal Text, text.class
37
- assert_equal 1, text.sentences.size
38
- assert_equal 4, text.sentences[0].words_number
39
-
40
- tokens = text.sentences[0].tokens
41
- zle,czasy,juz,minely,period = *tokens
42
- assert_equal 'zły', zle.lemat
43
- assert_equal 'czas', czasy.lemat
44
- assert_equal 'już', juz.lemat
45
- assert_equal 'minąć', minely.lemat
46
-
47
- end
48
-
49
- private
50
- def test_takipi_lemmatizer(text)
51
-
52
- assert_equal Text, text.class
53
- assert_equal 1, text.sentences.size
54
- assert_equal 4, text.sentences[0].words_number
55
-
56
- tokens = text.sentences[0].tokens
57
- zle, czasy, juz, minely, period = *tokens
58
- assert_equal @zle_word.inflection, zle.inflection
59
- assert_equal @czasy_word.inflection, czasy.inflection
60
- assert_equal @juz_word.inflection, juz.inflection
61
- assert_equal @minely_word.inflection, minely.inflection
62
- assert_equal @period.tags, period.tags
63
-
64
- assert_equal 'zły', zle.lemat
65
- assert_equal 'czas', czasy.lemat
66
- assert_equal 'już', juz.lemat
67
- assert_equal 'minąć', minely.lemat
68
-
69
- end
70
-
71
-
72
-
73
- end
@@ -1,28 +0,0 @@
1
- require 'helper'
2
- require '../lib/word.rb'
3
-
4
- class MeaningableTest < Test::Unit::TestCase
5
- include NLP
6
-
7
- def setup
8
-
9
- @word_kochamy = Word.new('kochamy','kochać', 'fin:pl:pri:imperf')
10
- psych_cat = LIWCCategory.new('PROCESY_PSYCHOLOGICZNE')
11
- emotion_cat = LIWCCategory.new('EMOCJE',psych_cat)
12
- pos_emotion_cat = LIWCCategory.new('POZYTYWNE_EMOCJE',emotion_cat)
13
- @word_kochamy.category = pos_emotion_cat
14
-
15
- end
16
-
17
- def test_category_recognition
18
-
19
- assert @word_kochamy.psychological?
20
- assert @word_kochamy.positive_emotion?
21
- assert @word_kochamy.emotion?
22
-
23
- assert !@word_kochamy.negative_emotion?
24
- end
25
-
26
-
27
- end
28
-
@@ -1,11 +0,0 @@
1
- require 'test/unit'
2
- require 'helper'
3
- require "lemmatizer_test"
4
- require "word_test"
5
- require "token_test"
6
- require "text_test"
7
- require "sentence_test"
8
- require "token_scanner_test"
9
- require "meaningable_test"
10
-
11
-
@@ -1,26 +0,0 @@
1
- require 'helper'
2
- require '../lib/token.rb'
3
-
4
- class SentenceTest < Test::Unit::TestCase
5
-
6
- include NLP
7
-
8
- def setup
9
- @sentence = Sentence.new
10
- @comma = Token.new(',','interp')
11
- @integer = Token.new('32','tnum:integer')
12
- @float = Token.new('3,12','tnum:frac')
13
- @symbol = Token.new('nie_istniejace_slowo','tsym')
14
- end
15
-
16
-
17
- def test_sentence_size
18
- assert_equal 0, @sentence.words_number
19
- @sentence << @symbol
20
- assert_equal 1, @sentence.words_number
21
- @sentence << @integer << @comma << @float
22
- assert_equal 3, @sentence.words_number
23
- end
24
-
25
-
26
- end
@@ -1,7 +0,0 @@
1
- require 'helper'
2
-
3
- class TestNlp < Test::Unit::TestCase
4
- def test_something_for_real
5
- assert_nil nil
6
- end
7
- end
@@ -1,29 +0,0 @@
1
- require 'helper'
2
- require '../lib/token.rb'
3
-
4
- class TextTest < Test::Unit::TestCase
5
-
6
- include NLP
7
-
8
- def setup
9
- @s1 = Sentence.new
10
- @s2 = Sentence.new
11
- @comma = Token.new(',','interp')
12
- @integer = Token.new('32','tnum:integer')
13
- @float = Token.new('3,12','tnum:frac')
14
- @symbol = Token.new('nie_istniejace_slowo','tsym')
15
- @s1 << @integer << @comma << @symbol
16
- @s2 << @integer << @symbol
17
- @text = Text.new
18
-
19
- end
20
-
21
-
22
- def test_text
23
- @text << @s1
24
- @text << @s2
25
- assert_equal 2, @text.words_per_sentence
26
- end
27
-
28
-
29
- end
@@ -1,28 +0,0 @@
1
- require 'helper'
2
- require '../lib/token_scanner.rb'
3
-
4
- class TokenScannerTest < Test::Unit::TestCase
5
-
6
- include NLP
7
-
8
- def setup
9
- sentence = "To, jest zdanie."
10
- @text = Lemmatizer.lemmatize(sentence,:takipi,:local)
11
- @scanner = TokenScanner.new(@text)
12
-
13
- end
14
-
15
- def test_scanner
16
- assert_equal "To", @scanner.current.orth
17
- @scanner.next(:word)
18
- assert_equal "jest", @scanner.current.orth
19
- @scanner.next(:interp)
20
- assert_equal ".", @scanner.current.orth
21
- @scanner.next(:word)
22
- assert @scanner.end?
23
- @scanner.rewind
24
- assert_equal 0, @scanner.index
25
- end
26
-
27
- end
28
-
@@ -1,37 +0,0 @@
1
- require 'helper'
2
- require '../lib/token.rb'
3
-
4
- class TokenTest < Test::Unit::TestCase
5
-
6
- include NLP
7
-
8
- def setup
9
- @comma = Token.new(',','interp')
10
- @integer = Token.new('32','tnum:integer')
11
- @float = Token.new('3,12','tnum:frac')
12
- @symbol = Token.new('nie_istniejace_slowo','tsym')
13
- end
14
-
15
-
16
- def test_recognizing_interpunction
17
- assert @comma.interp?
18
- assert !@comma.word?
19
- end
20
-
21
- def test_recognizing_numbers
22
- assert @integer.integer?
23
- assert !@integer.word?
24
-
25
- assert @float.float?
26
- assert @float.number?
27
-
28
- assert !@float.word?
29
- assert !@float.integer?
30
- end
31
-
32
- def test_symbol
33
- assert @symbol.symbol?
34
- end
35
-
36
-
37
- end
@@ -1,45 +0,0 @@
1
- require 'helper'
2
- require '../lib/word.rb'
3
-
4
- class WordTest < Test::Unit::TestCase
5
- include NLP
6
-
7
- def setup
8
- @word_kota = Word.new('kota','kot','subst:sg:gen.acc:m2')
9
- @word_siebie = Word.new('siebie','się','siebie:gen.acc')
10
- end
11
-
12
- def test_word_lematization
13
- assert_equal 'kot', @word_kota.lemat
14
- assert_equal 'się', @word_siebie.lemat
15
- end
16
-
17
- def test_word_orth
18
- assert_equal 'kota', @word_kota.orth
19
- assert_equal 'siebie', @word_siebie.orth
20
- end
21
-
22
- def test_recognizing_part_of_speech
23
- assert @word_kota.rzeczownik?
24
- assert @word_siebie.zaimek?
25
- end
26
-
27
- def test_recognizing_inflection
28
- assert @word_kota.liczba_pojedyncza?
29
- assert @word_kota.dopelniacz?
30
- assert @word_kota.biernik?
31
- assert @word_kota.meski_zwierzecy?
32
-
33
- assert !@word_kota.liczba_mnoga?
34
- assert !@word_kota.mianownik?
35
-
36
- assert @word_siebie.biernik?
37
- assert @word_siebie.dopelniacz?
38
- end
39
-
40
- def test_inflection_string
41
- assert_equal @word_kota.inflection, 'subst:sg:gen.acc:m2'
42
- end
43
-
44
-
45
- end