raingrams 0.0.9 → 0.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/History.txt +9 -0
- data/Manifest.txt +10 -10
- data/README.txt +9 -7
- data/Rakefile +3 -6
- data/TODO.txt +6 -0
- data/lib/raingrams/bigram_model.rb +3 -7
- data/lib/raingrams/extensions/object.rb +4 -1
- data/lib/raingrams/extensions/string.rb +3 -0
- data/lib/raingrams/extensions.rb +0 -5
- data/lib/raingrams/hexagram_model.rb +3 -7
- data/lib/raingrams/model.rb +622 -61
- data/lib/raingrams/ngram.rb +50 -9
- data/lib/raingrams/ngram_set.rb +43 -0
- data/lib/raingrams/open_vocabulary/model.rb +12 -0
- data/lib/raingrams/open_vocabulary/open_model.rb +8 -4
- data/lib/raingrams/open_vocabulary.rb +0 -1
- data/lib/raingrams/pentagram_model.rb +3 -7
- data/lib/raingrams/probability_table.rb +153 -0
- data/lib/raingrams/quadgram_model.rb +3 -7
- data/lib/raingrams/raingrams.rb +10 -20
- data/lib/raingrams/tokens/start_sentence.rb +2 -2
- data/lib/raingrams/tokens/stop_sentence.rb +2 -2
- data/lib/raingrams/tokens/token.rb +49 -5
- data/lib/raingrams/tokens/unknown.rb +2 -2
- data/lib/raingrams/tokens.rb +1 -0
- data/lib/raingrams/trigram_model.rb +3 -7
- data/lib/raingrams/version.rb +1 -1
- data/lib/raingrams.rb +1 -1
- data/spec/ngram_set_spec.rb +54 -0
- data/spec/ngram_spec.rb +29 -0
- data/spec/probability_table_spec.rb +94 -0
- data/spec/raingrams_spec.rb +9 -0
- data/spec/spec_helper.rb +5 -0
- data/tasks/spec.rb +7 -0
- metadata +65 -55
- data/lib/raingrams/extensions/class.rb +0 -7
- data/lib/raingrams/extensions/false_class.rb +0 -7
- data/lib/raingrams/extensions/nil_class.rb +0 -7
- data/lib/raingrams/extensions/symbol.rb +0 -7
- data/lib/raingrams/extensions/true_class.rb +0 -7
- data/lib/raingrams/multigram_model.rb +0 -165
- data/lib/raingrams/open_vocabulary/multigram_model.rb +0 -12
- data/lib/raingrams/open_vocabulary/unigram_model.rb +0 -12
- data/lib/raingrams/unigram_model.rb +0 -70
- data/test/test_raingrams.rb +0 -0
data/History.txt
CHANGED
@@ -1,3 +1,12 @@
|
|
1
|
+
== 0.1.0 / 2008-10-06
|
2
|
+
|
3
|
+
* Various bug fixes.
|
4
|
+
* Added NgramSet and ProbabilityTable classes.
|
5
|
+
* Merged NgramModel with the Model class.
|
6
|
+
* Refactored the Model class.
|
7
|
+
* Added random_gram_sentence, random_sentence, random_paragraph and
|
8
|
+
random_text methods to the Model class.
|
9
|
+
|
1
10
|
== 0.0.9 / 2008-01-09
|
2
11
|
|
3
12
|
* Initial release.
|
data/Manifest.txt
CHANGED
@@ -2,19 +2,15 @@ History.txt
|
|
2
2
|
LICENSE.txt
|
3
3
|
Manifest.txt
|
4
4
|
README.txt
|
5
|
+
TODO.txt
|
5
6
|
Rakefile
|
6
7
|
lib/raingrams.rb
|
7
8
|
lib/raingrams/version.rb
|
8
9
|
lib/raingrams/raingrams.rb
|
9
10
|
lib/raingrams/exceptions/prefix_frequency_missing.rb
|
10
11
|
lib/raingrams/exceptions.rb
|
11
|
-
lib/raingrams/extensions/class.rb
|
12
|
-
lib/raingrams/extensions/false_class.rb
|
13
|
-
lib/raingrams/extensions/nil_class.rb
|
14
12
|
lib/raingrams/extensions/object.rb
|
15
13
|
lib/raingrams/extensions/string.rb
|
16
|
-
lib/raingrams/extensions/symbol.rb
|
17
|
-
lib/raingrams/extensions/true_class.rb
|
18
14
|
lib/raingrams/extensions.rb
|
19
15
|
lib/raingrams/tokens/token.rb
|
20
16
|
lib/raingrams/tokens/start_sentence.rb
|
@@ -22,21 +18,25 @@ lib/raingrams/tokens/stop_sentence.rb
|
|
22
18
|
lib/raingrams/tokens/unknown.rb
|
23
19
|
lib/raingrams/tokens.rb
|
24
20
|
lib/raingrams/ngram.rb
|
21
|
+
lib/raingrams/ngram_set.rb
|
22
|
+
lib/raingrams/probability_table.rb
|
25
23
|
lib/raingrams/model.rb
|
26
|
-
lib/raingrams/unigram_model.rb
|
27
|
-
lib/raingrams/multigram_model.rb
|
28
24
|
lib/raingrams/bigram_model.rb
|
29
25
|
lib/raingrams/trigram_model.rb
|
30
26
|
lib/raingrams/quadgram_model.rb
|
31
27
|
lib/raingrams/pentagram_model.rb
|
32
28
|
lib/raingrams/hexagram_model.rb
|
33
29
|
lib/raingrams/open_vocabulary/open_model.rb
|
34
|
-
lib/raingrams/open_vocabulary/unigram_model.rb
|
35
|
-
lib/raingrams/open_vocabulary/multigram_model.rb
|
30
|
+
lib/raingrams/open_vocabulary/model.rb
|
36
31
|
lib/raingrams/open_vocabulary/bigram_model.rb
|
37
32
|
lib/raingrams/open_vocabulary/trigram_model.rb
|
38
33
|
lib/raingrams/open_vocabulary/quadgram_model.rb
|
39
34
|
lib/raingrams/open_vocabulary/pentagram_model.rb
|
40
35
|
lib/raingrams/open_vocabulary/hexagram_model.rb
|
41
36
|
lib/raingrams/open_vocabulary.rb
|
42
|
-
|
37
|
+
tasks/spec.rb
|
38
|
+
spec/spec_helper.rb
|
39
|
+
spec/ngram_spec.rb
|
40
|
+
spec/ngram_set_spec.rb
|
41
|
+
spec/probability_table_spec.rb
|
42
|
+
spec/raingrams_spec.rb
|
data/README.txt
CHANGED
@@ -1,6 +1,7 @@
|
|
1
|
-
Raingrams
|
2
|
-
|
3
|
-
|
1
|
+
= Raingrams
|
2
|
+
|
3
|
+
* http://raingrams.rubyforge.org/
|
4
|
+
* Postmodern Modulus III (postmodern.mod3@gmail.com)
|
4
5
|
|
5
6
|
== DESCRIPTION:
|
6
7
|
|
@@ -8,13 +9,14 @@ Raingrams is a flexible and general-purpose ngrams library written in Ruby.
|
|
8
9
|
Raingrams supports any non-zero ngram size, text/non-text grams, multiple
|
9
10
|
parsing styles and open/closed vocabulary models.
|
10
11
|
|
11
|
-
== FEATURES
|
12
|
+
== FEATURES:
|
12
13
|
|
13
|
-
* Supports all
|
14
|
+
* Supports all ngram sizes above 1.
|
14
15
|
* Supports text and non-text grams.
|
15
16
|
* Supports Open and Closed vocabulary models.
|
16
|
-
|
17
|
-
|
17
|
+
* Supports calculating the similarity and commonality of sample text against
|
18
|
+
specified models.
|
19
|
+
* Supports generating random text from models.
|
18
20
|
|
19
21
|
== INSTALL:
|
20
22
|
|
data/Rakefile
CHANGED
@@ -2,16 +2,13 @@
|
|
2
2
|
|
3
3
|
require 'rubygems'
|
4
4
|
require 'hoe'
|
5
|
+
require './tasks/spec.rb'
|
5
6
|
require './lib/raingrams/version.rb'
|
6
7
|
|
7
8
|
Hoe.new('raingrams', Raingrams::VERSION) do |p|
|
8
9
|
p.rubyforge_name = 'raingrams'
|
9
|
-
p.
|
10
|
-
p.
|
11
|
-
p.summary = 'Raingrams is a flexible and general-purpose ngrams library written in Ruby'
|
12
|
-
p.description = p.paragraphs_of('README.txt', 2..5).join("\n\n")
|
13
|
-
p.url = p.paragraphs_of('README.txt', 0).first.split(/\n/)[1..-1]
|
14
|
-
p.changes = p.paragraphs_of('History.txt', 0..1).join("\n\n")
|
10
|
+
p.developer('Postmodern Modulus III', 'postmodern.mod3@gmail.com')
|
11
|
+
p.remote_rdoc_dir = 'docs'
|
15
12
|
end
|
16
13
|
|
17
14
|
# vim: syntax=Ruby
|
data/TODO.txt
ADDED
data/lib/raingrams/bigram_model.rb
CHANGED
@@ -1,13 +1,9 @@
|
|
1
|
-
require 'raingrams/
|
1
|
+
require 'raingrams/model'
|
2
2
|
|
3
3
|
module Raingrams
|
4
|
-
class BigramModel <
|
4
|
+
class BigramModel < Model
|
5
5
|
|
6
|
-
|
7
|
-
opts[:ngram_size] = 2
|
8
|
-
|
9
|
-
super(opts,&block)
|
10
|
-
end
|
6
|
+
ngram_size 2
|
11
7
|
|
12
8
|
end
|
13
9
|
end
|
data/lib/raingrams/extensions.rb
CHANGED
@@ -1,7 +1,2 @@
|
|
1
|
-
require 'raingrams/extensions/class'
|
2
|
-
require 'raingrams/extensions/nil_class'
|
3
|
-
require 'raingrams/extensions/true_class'
|
4
|
-
require 'raingrams/extensions/false_class'
|
5
|
-
require 'raingrams/extensions/symbol'
|
6
1
|
require 'raingrams/extensions/string'
|
7
2
|
require 'raingrams/extensions/object'
|
data/lib/raingrams/hexagram_model.rb
CHANGED
@@ -1,13 +1,9 @@
|
|
1
|
-
require 'raingrams/
|
1
|
+
require 'raingrams/model'
|
2
2
|
|
3
3
|
module Raingrams
|
4
|
-
class HexagramModel <
|
4
|
+
class HexagramModel < Model
|
5
5
|
|
6
|
-
|
7
|
-
opts[:ngram_size] = 6
|
8
|
-
|
9
|
-
super(opts,&block)
|
10
|
-
end
|
6
|
+
ngram_size 6
|
11
7
|
|
12
8
|
end
|
13
9
|
end
|