scylla 1.0.7 → 1.0.8
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/README.rdoc +2 -11
- data/test/classifier_test.rb +1 -1
- data/test/generator_test.rb +1 -1
- data/test/helper.rb +3 -3
- data/test/language_test.rb +1 -1
- data/test/loader_test.rb +1 -1
- data/test/scylla_test.rb +3 -3
- metadata +28 -20
checksums.yaml
ADDED
@@ -0,0 +1,7 @@
|
|
1
|
+
---
|
2
|
+
SHA1:
|
3
|
+
metadata.gz: cc4efa8f7db7f8d6af1db0fb2ce7c204b6238fd7
|
4
|
+
data.tar.gz: 96723ba86150e5612a1b88ae7ef568bf4080c13a
|
5
|
+
SHA512:
|
6
|
+
metadata.gz: e99255de08664a38cc0f155f2d4789f04139dc2277d285aebfa887dcfa4956f9caec90dabfecc1316e6652795f0220c5d5a47decd57f2a4d15da3106c86ad4d1
|
7
|
+
data.tar.gz: b64726df9e01a455e475818e7dd0b9cbe285c056d04a06a7bb576273e8e772444c9c316728c0b0140a400dc2cbfbd7e8cc482065bde720575830ffe8767c3b1f
|
data/README.rdoc
CHANGED
@@ -26,20 +26,11 @@ Multiple results for other possible languages:
|
|
26
26
|
|
27
27
|
== Training
|
28
28
|
|
29
|
-
|
29
|
+
Training is done by fetching data from wikipedia. To fetch latest articles (The country name in the language
|
30
|
+
in question, eg. "England" for English or "日本" for Japanese), run
|
30
31
|
|
31
32
|
rake scylla:train
|
32
33
|
|
33
|
-
If you want to store texts in your own folder, you can specify that to the rake task.
|
34
|
-
WARNING: specifying a different folder deletes all language support for files located in the default directory if they are not copied over.
|
35
|
-
|
36
|
-
rake scylla:train[/Users/hash/mytextdir]
|
37
|
-
"Creating language map for /Users/hash/mytextdir/english.txt"
|
38
|
-
"Creating language map for /Users/hash/mytextdir/kannada.txt"
|
39
|
-
.
|
40
|
-
.
|
41
|
-
etc
|
42
|
-
|
43
34
|
== Contributing to scylla
|
44
35
|
|
45
36
|
* Check out the latest master to make sure the feature hasn't been implemented or the bug hasn't been fixed yet
|
data/test/classifier_test.rb
CHANGED
data/test/generator_test.rb
CHANGED
data/test/helper.rb
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
require 'rubygems'
|
2
|
-
require 'ruby-debug'
|
3
2
|
require 'bundler'
|
4
|
-
require 'test/unit'
|
3
|
+
require "minitest/autorun"
|
4
|
+
# require 'test/unit'
|
5
5
|
require 'shoulda'
|
6
6
|
require 'scylla'
|
7
7
|
require 'sanitize'
|
@@ -18,5 +18,5 @@ end
|
|
18
18
|
$LOAD_PATH.unshift(File.join(File.dirname(__FILE__), '..', 'lib'))
|
19
19
|
$LOAD_PATH.unshift(File.dirname(__FILE__))
|
20
20
|
|
21
|
-
class Test::Unit::TestCase
|
21
|
+
class Minitest::Test
|
22
22
|
end
|
data/test/language_test.rb
CHANGED
data/test/loader_test.rb
CHANGED
data/test/scylla_test.rb
CHANGED
@@ -1,6 +1,6 @@
|
|
1
1
|
require 'helper'
|
2
2
|
|
3
|
-
class ScyllaTest < Test::Unit::TestCase
|
3
|
+
class ScyllaTest < Minitest::Test
|
4
4
|
context "String methods" do
|
5
5
|
setup do
|
6
6
|
Scylla::Loader.set_dir(File.join("test","fixtures","lms"))
|
@@ -12,8 +12,8 @@ class ScyllaTest < Test::Unit::TestCase
|
|
12
12
|
end
|
13
13
|
|
14
14
|
should "load language results for strings" do
|
15
|
-
|
16
|
-
|
15
|
+
assert @language
|
16
|
+
assert @languages
|
17
17
|
assert_equal String, @language.class
|
18
18
|
assert_equal Array, @languages.class
|
19
19
|
assert_equal "english", @language
|
metadata
CHANGED
@@ -1,8 +1,7 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: scylla
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 1.0.7
|
5
|
-
prerelease:
|
4
|
+
version: 1.0.8
|
6
5
|
platform: ruby
|
7
6
|
authors:
|
8
7
|
- Ashwin Hegde
|
@@ -14,35 +13,45 @@ dependencies:
|
|
14
13
|
- !ruby/object:Gem::Dependency
|
15
14
|
name: bundler
|
16
15
|
requirement: !ruby/object:Gem::Requirement
|
17
|
-
none: false
|
18
16
|
requirements:
|
19
|
-
- -
|
17
|
+
- - ">="
|
20
18
|
- !ruby/object:Gem::Version
|
21
19
|
version: '0'
|
22
20
|
type: :development
|
23
21
|
prerelease: false
|
24
22
|
version_requirements: !ruby/object:Gem::Requirement
|
25
|
-
none: false
|
26
23
|
requirements:
|
27
|
-
- -
|
24
|
+
- - ">="
|
28
25
|
- !ruby/object:Gem::Version
|
29
26
|
version: '0'
|
30
27
|
- !ruby/object:Gem::Dependency
|
31
28
|
name: sanitize
|
32
29
|
requirement: !ruby/object:Gem::Requirement
|
33
|
-
none: false
|
34
30
|
requirements:
|
35
|
-
- -
|
31
|
+
- - ">="
|
36
32
|
- !ruby/object:Gem::Version
|
37
33
|
version: '0'
|
38
34
|
type: :runtime
|
39
35
|
prerelease: false
|
40
36
|
version_requirements: !ruby/object:Gem::Requirement
|
41
|
-
none: false
|
42
37
|
requirements:
|
43
|
-
- -
|
38
|
+
- - ">="
|
44
39
|
- !ruby/object:Gem::Version
|
45
40
|
version: '0'
|
41
|
+
- !ruby/object:Gem::Dependency
|
42
|
+
name: unicode
|
43
|
+
requirement: !ruby/object:Gem::Requirement
|
44
|
+
requirements:
|
45
|
+
- - "~>"
|
46
|
+
- !ruby/object:Gem::Version
|
47
|
+
version: 0.4.4
|
48
|
+
type: :runtime
|
49
|
+
prerelease: false
|
50
|
+
version_requirements: !ruby/object:Gem::Requirement
|
51
|
+
requirements:
|
52
|
+
- - "~>"
|
53
|
+
- !ruby/object:Gem::Version
|
54
|
+
version: 0.4.4
|
46
55
|
description: Allows for text categorization by guessing the language of a given text
|
47
56
|
using n-grams
|
48
57
|
email: ahegde@zendesk.com
|
@@ -53,6 +62,10 @@ extra_rdoc_files:
|
|
53
62
|
- LICENSE.txt
|
54
63
|
- README.rdoc
|
55
64
|
files:
|
65
|
+
- LICENSE.txt
|
66
|
+
- README.rdoc
|
67
|
+
- bin/scylla
|
68
|
+
- lib/scylla.rb
|
56
69
|
- lib/scylla/classifier.rb
|
57
70
|
- lib/scylla/generator.rb
|
58
71
|
- lib/scylla/lms/arabic.lm
|
@@ -95,9 +108,6 @@ files:
|
|
95
108
|
- lib/scylla/resources.rb
|
96
109
|
- lib/scylla/string.rb
|
97
110
|
- lib/scylla/tasks.rb
|
98
|
-
- lib/scylla.rb
|
99
|
-
- README.rdoc
|
100
|
-
- LICENSE.txt
|
101
111
|
- test/classifier_test.rb
|
102
112
|
- test/fixtures/lms/arabic.lm
|
103
113
|
- test/fixtures/lms/bulgarian.lm
|
@@ -157,31 +167,29 @@ files:
|
|
157
167
|
- test/language_test.rb
|
158
168
|
- test/loader_test.rb
|
159
169
|
- test/scylla_test.rb
|
160
|
-
- bin/scylla
|
161
170
|
homepage: http://github.com/hashwin/scylla
|
162
171
|
licenses:
|
163
172
|
- MIT
|
173
|
+
metadata: {}
|
164
174
|
post_install_message:
|
165
175
|
rdoc_options: []
|
166
176
|
require_paths:
|
167
177
|
- lib
|
168
178
|
required_ruby_version: !ruby/object:Gem::Requirement
|
169
|
-
none: false
|
170
179
|
requirements:
|
171
|
-
- -
|
180
|
+
- - ">="
|
172
181
|
- !ruby/object:Gem::Version
|
173
182
|
version: '0'
|
174
183
|
required_rubygems_version: !ruby/object:Gem::Requirement
|
175
|
-
none: false
|
176
184
|
requirements:
|
177
|
-
- -
|
185
|
+
- - ">="
|
178
186
|
- !ruby/object:Gem::Version
|
179
187
|
version: '0'
|
180
188
|
requirements: []
|
181
189
|
rubyforge_project:
|
182
|
-
rubygems_version:
|
190
|
+
rubygems_version: 2.5.2
|
183
191
|
signing_key:
|
184
|
-
specification_version:
|
192
|
+
specification_version: 4
|
185
193
|
summary: Ruby port of Textcat language guesser
|
186
194
|
test_files:
|
187
195
|
- test/classifier_test.rb
|