opener-language-identifier 3.0.1 → 3.0.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 7abeb7ee7ac0542e5948cb88b868501825efd4aa
|
4
|
+
data.tar.gz: e1fe36a7e665f42a1ea711f34996224c188c4e58
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 415285de95bd3ac2fd78d39c1e9d189badd4a384b086ae33767f96f1ec8df86bd24340f478f09ffedb04f4dac9d4aa23ad743e7caa0a2b06c6d6f90bf8f572f9
|
7
|
+
data.tar.gz: 3043ab05c774d586dd6f5aa3683313941af375017e6d02e1f6275ffda0f7adaecca0ba9f48a801d4635345488353f3a7750c356e8c83b39176ff9d1418dc065d
|
data/README.md
CHANGED
@@ -13,7 +13,7 @@ analysis of for example sentiments and or entities.
|
|
13
13
|
|
14
14
|
This software is part of a larger collection of natural language processing
|
15
15
|
tools known as "the OpeNER project". You can find more information about the
|
16
|
-
project at
|
16
|
+
project at [the OpeNER portal](http://opener-project.github.io). There you can
|
17
17
|
also find references to terms like KAF (an XML standard to represent linguistic
|
18
18
|
annotations in texts), component, cores, scenario's and pipelines.
|
19
19
|
|
@@ -37,13 +37,12 @@ This aplication reads a text from standard input in order to identify the langua
|
|
37
37
|
|
38
38
|
This will output:
|
39
39
|
|
40
|
-
|
40
|
+
~~~~
|
41
41
|
<?xml version="1.0" encoding="UTF-8" standalone="yes"?>
|
42
42
|
<KAF xml:lang="en" version="2.1">
|
43
|
-
|
44
|
-
</raw>
|
43
|
+
<raw>This is an English text.</raw>
|
45
44
|
</KAF>
|
46
|
-
|
45
|
+
~~~~
|
47
46
|
|
48
47
|
If you just want the language code returned add the ```--no-kaf``` option like
|
49
48
|
this
|
@@ -61,14 +60,14 @@ You can launch a language identification webservice by executing:
|
|
61
60
|
$ language-identifier-server
|
62
61
|
|
63
62
|
This will launch a mini webserver with the webservice. It defaults to port 9292,
|
64
|
-
so you can access it at <http://localhost:9292
|
63
|
+
so you can access it at <http://localhost:9292/>.
|
65
64
|
|
66
65
|
To launch it on a different port provide the `-p [port-number]` option like
|
67
66
|
this:
|
68
67
|
|
69
68
|
language-identifier-server -p 1234
|
70
69
|
|
71
|
-
It then launches at <http://localhost:1234
|
70
|
+
It then launches at <http://localhost:1234/>
|
72
71
|
|
73
72
|
Documentation on the Webservice is provided by surfing to the urls provided
|
74
73
|
above. For more information on how to launch a webservice run the command with
|
@@ -86,10 +85,7 @@ Description of dependencies
|
|
86
85
|
---------------------------
|
87
86
|
|
88
87
|
This component runs best if you run it in an environment suited for OpeNER
|
89
|
-
components. You can find an installation guide and helper tools in the (
|
90
|
-
installer)[https://github.com/opener-project/opener-installer] and (an
|
91
|
-
installation guide on the Opener
|
92
|
-
Website)[http://opener-project.github.io/getting-started/how-to/local-installation.html]
|
88
|
+
components. You can find an installation guide and helper tools in the [OpeNER installer](https://github.com/opener-project/opener-installer) and [an installation guide on the OpenerWebsite](http://opener-project.github.io/getting-started/how-to/local-installation.html)
|
93
89
|
|
94
90
|
At least you need the following system setup:
|
95
91
|
|
@@ -119,19 +115,19 @@ actual working component.
|
|
119
115
|
Where to go from here
|
120
116
|
---------------------
|
121
117
|
|
122
|
-
* Check
|
123
|
-
*
|
118
|
+
* [Check the project website](http://opener-project.github.io)
|
119
|
+
* [Checkout the webservice](http://opener.olery.com/language-identifier)
|
124
120
|
|
125
121
|
Report problem/Get help
|
126
122
|
-----------------------
|
127
123
|
|
128
124
|
If you encounter problems, please email support@opener-project.eu or leave an
|
129
|
-
issue in the
|
125
|
+
issue in the [issue tracker](https://github.com/opener-project/language-identifier/issues).
|
130
126
|
|
131
127
|
Contributing
|
132
128
|
------------
|
133
129
|
|
134
|
-
1. Fork it
|
130
|
+
1. Fork it <http://github.com/opener-project/language-identifier/fork>
|
135
131
|
2. Create your feature branch (`git checkout -b my-new-feature`)
|
136
132
|
3. Commit your changes (`git commit -am 'Add some feature'`)
|
137
133
|
4. Push to the branch (`git push origin my-new-feature`)
|
Binary file
|
Binary file
|
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: opener-language-identifier
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 3.0.
|
4
|
+
version: 3.0.2
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- development@olery.com
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2014-05-
|
11
|
+
date: 2014-05-23 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: builder
|
@@ -168,97 +168,97 @@ description: Language identifier for human readable text.
|
|
168
168
|
email:
|
169
169
|
executables:
|
170
170
|
- language-identifier
|
171
|
-
- language-identifier-daemon
|
172
171
|
- language-identifier-server
|
172
|
+
- language-identifier-daemon
|
173
173
|
extensions: []
|
174
174
|
extra_rdoc_files: []
|
175
175
|
files:
|
176
|
-
- README.md
|
177
|
-
- bin/language-identifier
|
178
|
-
- bin/language-identifier-daemon
|
179
|
-
- bin/language-identifier-server
|
180
|
-
- config.ru
|
181
176
|
- core/target/LanguageDetection-0.0.1.jar
|
182
|
-
- core/target/classes/
|
183
|
-
- core/target/classes/
|
184
|
-
- core/target/classes/com/cybozu/labs/langdetect/DetectorFactory.class
|
177
|
+
- core/target/classes/org/vicomtech/opennlp/LanguageDetection/CybozuDetector.class
|
178
|
+
- core/target/classes/org/vicomtech/opennlp/LanguageDetection/Main.class
|
185
179
|
- core/target/classes/com/cybozu/labs/langdetect/ErrorCode.class
|
186
180
|
- core/target/classes/com/cybozu/labs/langdetect/GenProfile.class
|
181
|
+
- core/target/classes/com/cybozu/labs/langdetect/Command.class
|
187
182
|
- core/target/classes/com/cybozu/labs/langdetect/LangDetectException.class
|
188
183
|
- core/target/classes/com/cybozu/labs/langdetect/Language.class
|
189
|
-
- core/target/classes/com/cybozu/labs/langdetect/
|
184
|
+
- core/target/classes/com/cybozu/labs/langdetect/Detector.class
|
185
|
+
- core/target/classes/com/cybozu/labs/langdetect/DetectorFactory.class
|
186
|
+
- core/target/classes/com/cybozu/labs/langdetect/util/TagExtractor.class
|
187
|
+
- core/target/classes/com/cybozu/labs/langdetect/util/NGram.class
|
190
188
|
- core/target/classes/com/cybozu/labs/langdetect/util/LangProfile.class
|
191
189
|
- core/target/classes/com/cybozu/labs/langdetect/util/Messages.class
|
192
|
-
- core/target/classes/com/cybozu/labs/langdetect/util/NGram.class
|
193
|
-
- core/target/classes/com/cybozu/labs/langdetect/util/TagExtractor.class
|
194
190
|
- core/target/classes/com/cybozu/labs/langdetect/util/messages.properties
|
195
|
-
- core/target/classes/org/vicomtech/opennlp/LanguageDetection/CybozuDetector.class
|
196
|
-
- core/target/classes/org/vicomtech/opennlp/LanguageDetection/Main.class
|
197
|
-
- core/target/classes/profiles/ar
|
198
|
-
- core/target/classes/profiles/bg
|
199
|
-
- core/target/classes/profiles/bn
|
200
|
-
- core/target/classes/profiles/ca
|
201
|
-
- core/target/classes/profiles/cs
|
202
|
-
- core/target/classes/profiles/da
|
203
|
-
- core/target/classes/profiles/de
|
204
|
-
- core/target/classes/profiles/el
|
205
|
-
- core/target/classes/profiles/en
|
206
|
-
- core/target/classes/profiles/es
|
207
|
-
- core/target/classes/profiles/et
|
208
|
-
- core/target/classes/profiles/eu
|
209
|
-
- core/target/classes/profiles/fa
|
210
191
|
- core/target/classes/profiles/fi
|
211
|
-
- core/target/classes/profiles/
|
212
|
-
- core/target/classes/profiles/
|
213
|
-
- core/target/classes/profiles/
|
214
|
-
- core/target/classes/profiles/hi
|
192
|
+
- core/target/classes/profiles/ta
|
193
|
+
- core/target/classes/profiles/mr
|
194
|
+
- core/target/classes/profiles/ml
|
215
195
|
- core/target/classes/profiles/hr
|
216
|
-
- core/target/classes/profiles/hu
|
217
196
|
- core/target/classes/profiles/id
|
218
|
-
- core/target/classes/profiles/
|
219
|
-
- core/target/classes/profiles/ja
|
220
|
-
- core/target/classes/profiles/kn
|
221
|
-
- core/target/classes/profiles/ko
|
222
|
-
- core/target/classes/profiles/lt
|
223
|
-
- core/target/classes/profiles/lv
|
224
|
-
- core/target/classes/profiles/mk
|
225
|
-
- core/target/classes/profiles/ml
|
226
|
-
- core/target/classes/profiles/mr
|
227
|
-
- core/target/classes/profiles/ne
|
228
|
-
- core/target/classes/profiles/nl
|
197
|
+
- core/target/classes/profiles/es
|
229
198
|
- core/target/classes/profiles/no
|
199
|
+
- core/target/classes/profiles/ca
|
200
|
+
- core/target/classes/profiles/en
|
201
|
+
- core/target/classes/profiles/ru
|
202
|
+
- core/target/classes/profiles/te
|
203
|
+
- core/target/classes/profiles/lt
|
230
204
|
- core/target/classes/profiles/pa
|
205
|
+
- core/target/classes/profiles/eu
|
206
|
+
- core/target/classes/profiles/ja
|
207
|
+
- core/target/classes/profiles/he
|
208
|
+
- core/target/classes/profiles/nl
|
209
|
+
- core/target/classes/profiles/sl
|
210
|
+
- core/target/classes/profiles/tr
|
231
211
|
- core/target/classes/profiles/pl
|
232
|
-
- core/target/classes/profiles/pt
|
233
|
-
- core/target/classes/profiles/ro
|
234
|
-
- core/target/classes/profiles/ru
|
235
212
|
- core/target/classes/profiles/sk
|
236
|
-
- core/target/classes/profiles/
|
237
|
-
- core/target/classes/profiles/
|
213
|
+
- core/target/classes/profiles/fa
|
214
|
+
- core/target/classes/profiles/de
|
215
|
+
- core/target/classes/profiles/bg
|
216
|
+
- core/target/classes/profiles/it
|
217
|
+
- core/target/classes/profiles/fr
|
218
|
+
- core/target/classes/profiles/el
|
219
|
+
- core/target/classes/profiles/pt
|
220
|
+
- core/target/classes/profiles/uk
|
221
|
+
- core/target/classes/profiles/da
|
222
|
+
- core/target/classes/profiles/ar
|
223
|
+
- core/target/classes/profiles/zh-tw
|
238
224
|
- core/target/classes/profiles/sq
|
239
|
-
- core/target/classes/profiles/sv
|
240
|
-
- core/target/classes/profiles/sw
|
241
|
-
- core/target/classes/profiles/ta
|
242
|
-
- core/target/classes/profiles/te
|
243
225
|
- core/target/classes/profiles/th
|
244
|
-
- core/target/classes/profiles/
|
245
|
-
- core/target/classes/profiles/
|
246
|
-
- core/target/classes/profiles/
|
247
|
-
- core/target/classes/profiles/
|
226
|
+
- core/target/classes/profiles/kn
|
227
|
+
- core/target/classes/profiles/sw
|
228
|
+
- core/target/classes/profiles/ko
|
229
|
+
- core/target/classes/profiles/ro
|
230
|
+
- core/target/classes/profiles/lv
|
231
|
+
- core/target/classes/profiles/sv
|
232
|
+
- core/target/classes/profiles/so
|
248
233
|
- core/target/classes/profiles/vi
|
234
|
+
- core/target/classes/profiles/et
|
235
|
+
- core/target/classes/profiles/hi
|
236
|
+
- core/target/classes/profiles/gu
|
249
237
|
- core/target/classes/profiles/zh-cn
|
250
|
-
- core/target/classes/profiles/
|
238
|
+
- core/target/classes/profiles/mk
|
239
|
+
- core/target/classes/profiles/ne
|
240
|
+
- core/target/classes/profiles/ur
|
241
|
+
- core/target/classes/profiles/hu
|
242
|
+
- core/target/classes/profiles/cs
|
243
|
+
- core/target/classes/profiles/bn
|
244
|
+
- core/target/classes/profiles/tl
|
245
|
+
- core/target/classes/com/cybozu/labs/langdetect/af
|
251
246
|
- exec/language-identifier.rb
|
252
247
|
- lib/opener/language_identifier.rb
|
253
|
-
- lib/opener/language_identifier/cli.rb
|
254
|
-
- lib/opener/language_identifier/detector.rb
|
255
248
|
- lib/opener/language_identifier/kaf_builder.rb
|
256
|
-
- lib/opener/language_identifier/public/markdown.css
|
257
|
-
- lib/opener/language_identifier/server.rb
|
258
249
|
- lib/opener/language_identifier/version.rb
|
250
|
+
- lib/opener/language_identifier/server.rb
|
251
|
+
- lib/opener/language_identifier/detector.rb
|
252
|
+
- lib/opener/language_identifier/cli.rb
|
253
|
+
- lib/opener/language_identifier/public/markdown.css
|
259
254
|
- lib/opener/language_identifier/views/index.erb
|
260
255
|
- lib/opener/language_identifier/views/result.erb
|
256
|
+
- config.ru
|
261
257
|
- opener-language-identifier.gemspec
|
258
|
+
- README.md
|
259
|
+
- bin/language-identifier
|
260
|
+
- bin/language-identifier-server
|
261
|
+
- bin/language-identifier-daemon
|
262
262
|
homepage: http://opener-project.github.com/
|
263
263
|
licenses: []
|
264
264
|
metadata: {}
|
@@ -278,8 +278,9 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
278
278
|
version: '0'
|
279
279
|
requirements: []
|
280
280
|
rubyforge_project:
|
281
|
-
rubygems_version: 2.
|
281
|
+
rubygems_version: 2.1.9
|
282
282
|
signing_key:
|
283
283
|
specification_version: 4
|
284
284
|
summary: Language identifier for human readable text.
|
285
285
|
test_files: []
|
286
|
+
has_rdoc: yard
|