unsupervised-language-detection 0.0.1 → 0.0.2
Sign up to get free protection for your applications and to get access to all the features.
@@ -3,7 +3,7 @@ require File.expand_path('../language-detector', __FILE__)
|
|
3
3
|
TWEETS_FILENAME = "datasets/tweets_5000.txt"
|
4
4
|
|
5
5
|
training_sentences = File.readlines(TWEETS_FILENAME).map{ |tweet| tweet.normalize }
|
6
|
-
detector = LanguageDetector.new(:ngram_size =>
|
6
|
+
detector = LanguageDetector.new(:ngram_size => 3)
|
7
7
|
detector.train(30, training_sentences)
|
8
8
|
detector.yamlize("detector.yaml")
|
9
9
|
|
metadata
CHANGED
@@ -1,13 +1,13 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: unsupervised-language-detection
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
hash:
|
4
|
+
hash: 27
|
5
5
|
prerelease:
|
6
6
|
segments:
|
7
7
|
- 0
|
8
8
|
- 0
|
9
|
-
- 1
|
10
|
-
version: 0.0.1
|
9
|
+
- 2
|
10
|
+
version: 0.0.2
|
11
11
|
platform: ruby
|
12
12
|
authors:
|
13
13
|
- Edwin Chen
|