stanford-core-nlp 0.5.3 → 3.5.0.alpha
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/README.md +174 -14
- data/lib/stanford-core-nlp/version.rb +1 -1
- metadata +8 -7
checksums.yaml
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
---
|
|
2
2
|
SHA1:
|
|
3
|
-
metadata.gz:
|
|
4
|
-
data.tar.gz:
|
|
3
|
+
metadata.gz: c549339529b8f18f52de57a5a01b677adbcca6bd
|
|
4
|
+
data.tar.gz: 9d85922fb49bb22f2964bf813fc5fcdcd7bd7e91
|
|
5
5
|
SHA512:
|
|
6
|
-
metadata.gz:
|
|
7
|
-
data.tar.gz:
|
|
6
|
+
metadata.gz: a5894ff785d811b43f779566c35965baed7ff6314f87f988d77ce456e91c1095667388f95fcf69b4fb4e9277064e6ad0cbf7984dd5f112601c122375817ca1dd
|
|
7
|
+
data.tar.gz: e113b755b626663e41291395359a913908a157481b9237ff65ce760939303ae1f230421eba6de60dc72ddf3c1da5541c32c4e5ebec1638c08c7bc9e04cf11fc0
|
data/README.md
CHANGED
|
@@ -1,23 +1,151 @@
|
|
|
1
|
-
# Stanford CoreNLP [](http://travis-ci.org/louismullie/stanford-core-nlp) [](https://github.com/arbox/nlp-with-ruby)
|
|
1
|
+
# Stanford CoreNLP [](http://travis-ci.org/louismullie/stanford-core-nlp) [](https://github.com/arbox/nlp-with-ruby) [](https://rubygems.org/gems/stanford-core-nlp)
|
|
2
2
|
|
|
3
|
-
> Ruby bindings for the Stanford
|
|
3
|
+
> Ruby bindings for the [Stanford CoreNLP Toolchain](http://stanfordnlp.github.io/CoreNLP/).
|
|
4
4
|
|
|
5
5
|
This gem provides high-level Ruby bindings to the
|
|
6
|
-
[Stanford
|
|
6
|
+
[Stanford CoreNLP](http://stanfordnlp.github.io/CoreNLP/) package,
|
|
7
7
|
a set of natural language processing tools for tokenization, sentence segmentation,
|
|
8
8
|
part-of-speech tagging, lemmatization, and parsing of English, French and German.
|
|
9
|
-
The package also provides named entity recognition and coreference resolution
|
|
10
|
-
|
|
11
|
-
|
|
12
|
-
|
|
13
|
-
|
|
9
|
+
The package also provides named entity recognition and coreference resolution
|
|
10
|
+
for English.
|
|
11
|
+
|
|
12
|
+
This gem is compatible with Ruby `2.3` and `2.4` as well as JRuby `1.7` and `9`.
|
|
13
|
+
Older Ruby versions should work as well.
|
|
14
|
+
|
|
15
|
+
You need Java 8 for the latest CoreNLP version (since 3.5.0, 2014-10-31);
|
|
16
|
+
earlier versions are tested on both Java 6 and Java 7.
|
|
17
|
+
|
|
18
|
+
The version schema has been changed to reflect the development
|
|
19
|
+
of Stanford CoreNLP itself. We'll release a gem for every new version from Stanford.
|
|
20
|
+
|
|
21
|
+
## Supported Human Languages
|
|
22
|
+
|
|
23
|
+
We strive to support all languages Stanford CoreNLP
|
|
24
|
+
[can](http://stanfordnlp.github.io/CoreNLP/human-languages.html) work with.
|
|
25
|
+
|
|
26
|
+
<table>
|
|
27
|
+
<thead>
|
|
28
|
+
<tr>
|
|
29
|
+
<th>Annotator</th>
|
|
30
|
+
<th style="text-align: center">ar</th>
|
|
31
|
+
<th style="text-align: center">zh</th>
|
|
32
|
+
<th style="text-align: center">en</th>
|
|
33
|
+
<th style="text-align: center">fr</th>
|
|
34
|
+
<th style="text-align: center">de</th>
|
|
35
|
+
<th style="text-align: center">es</th>
|
|
36
|
+
</tr>
|
|
37
|
+
</thead>
|
|
38
|
+
<tbody>
|
|
39
|
+
<tr>
|
|
40
|
+
<td>Tokenize / Segment</td>
|
|
41
|
+
<td style="text-align: center">✔</td>
|
|
42
|
+
<td style="text-align: center">✔</td>
|
|
43
|
+
<td style="text-align: center">✔</td>
|
|
44
|
+
<td style="text-align: center">✔</td>
|
|
45
|
+
<td style="text-align: center"> </td>
|
|
46
|
+
<td style="text-align: center">✔</td>
|
|
47
|
+
</tr>
|
|
48
|
+
<tr>
|
|
49
|
+
<td>Sentence Split</td>
|
|
50
|
+
<td style="text-align: center">✔</td>
|
|
51
|
+
<td style="text-align: center">✔</td>
|
|
52
|
+
<td style="text-align: center">✔</td>
|
|
53
|
+
<td style="text-align: center">✔</td>
|
|
54
|
+
<td style="text-align: center">✔</td>
|
|
55
|
+
<td style="text-align: center">✔</td>
|
|
56
|
+
</tr>
|
|
57
|
+
<tr>
|
|
58
|
+
<td>Part of Speech</td>
|
|
59
|
+
<td style="text-align: center">✔</td>
|
|
60
|
+
<td style="text-align: center">✔</td>
|
|
61
|
+
<td style="text-align: center">✔</td>
|
|
62
|
+
<td style="text-align: center">✔</td>
|
|
63
|
+
<td style="text-align: center">✔</td>
|
|
64
|
+
<td style="text-align: center">✔</td>
|
|
65
|
+
</tr>
|
|
66
|
+
<tr>
|
|
67
|
+
<td>Lemma</td>
|
|
68
|
+
<td style="text-align: center"> </td>
|
|
69
|
+
<td style="text-align: center"> </td>
|
|
70
|
+
<td style="text-align: center">✔</td>
|
|
71
|
+
<td style="text-align: center"> </td>
|
|
72
|
+
<td style="text-align: center"> </td>
|
|
73
|
+
<td style="text-align: center"> </td>
|
|
74
|
+
</tr>
|
|
75
|
+
<tr>
|
|
76
|
+
<td>Named Entities</td>
|
|
77
|
+
<td style="text-align: center"> </td>
|
|
78
|
+
<td style="text-align: center">✔</td>
|
|
79
|
+
<td style="text-align: center">✔</td>
|
|
80
|
+
<td style="text-align: center"> </td>
|
|
81
|
+
<td style="text-align: center">✔</td>
|
|
82
|
+
<td style="text-align: center">✔</td>
|
|
83
|
+
</tr>
|
|
84
|
+
<tr>
|
|
85
|
+
<td>Constituency Parsing</td>
|
|
86
|
+
<td style="text-align: center">✔</td>
|
|
87
|
+
<td style="text-align: center">✔</td>
|
|
88
|
+
<td style="text-align: center">✔</td>
|
|
89
|
+
<td style="text-align: center">✔</td>
|
|
90
|
+
<td style="text-align: center">✔</td>
|
|
91
|
+
<td style="text-align: center">✔</td>
|
|
92
|
+
</tr>
|
|
93
|
+
<tr>
|
|
94
|
+
<td>Dependency Parsing</td>
|
|
95
|
+
<td style="text-align: center"> </td>
|
|
96
|
+
<td style="text-align: center">✔</td>
|
|
97
|
+
<td style="text-align: center">✔</td>
|
|
98
|
+
<td style="text-align: center">✔</td>
|
|
99
|
+
<td style="text-align: center">✔</td>
|
|
100
|
+
<td style="text-align: center"> </td>
|
|
101
|
+
</tr>
|
|
102
|
+
<tr>
|
|
103
|
+
<td>Sentiment Analysis</td>
|
|
104
|
+
<td style="text-align: center"> </td>
|
|
105
|
+
<td style="text-align: center"> </td>
|
|
106
|
+
<td style="text-align: center">✔</td>
|
|
107
|
+
<td style="text-align: center"> </td>
|
|
108
|
+
<td style="text-align: center"> </td>
|
|
109
|
+
<td style="text-align: center"> </td>
|
|
110
|
+
</tr>
|
|
111
|
+
<tr>
|
|
112
|
+
<td>Mention Detection</td>
|
|
113
|
+
<td style="text-align: center"> </td>
|
|
114
|
+
<td style="text-align: center">✔</td>
|
|
115
|
+
<td style="text-align: center">✔</td>
|
|
116
|
+
<td style="text-align: center"> </td>
|
|
117
|
+
<td style="text-align: center"> </td>
|
|
118
|
+
<td style="text-align: center"> </td>
|
|
119
|
+
</tr>
|
|
120
|
+
<tr>
|
|
121
|
+
<td>Coreference</td>
|
|
122
|
+
<td style="text-align: center"> </td>
|
|
123
|
+
<td style="text-align: center">✔</td>
|
|
124
|
+
<td style="text-align: center">✔</td>
|
|
125
|
+
<td style="text-align: center"> </td>
|
|
126
|
+
<td style="text-align: center"> </td>
|
|
127
|
+
<td style="text-align: center"> </td>
|
|
128
|
+
</tr>
|
|
129
|
+
<tr>
|
|
130
|
+
<td>Open IE</td>
|
|
131
|
+
<td style="text-align: center"> </td>
|
|
132
|
+
<td style="text-align: center"> </td>
|
|
133
|
+
<td style="text-align: center">✔</td>
|
|
134
|
+
<td style="text-align: center"> </td>
|
|
135
|
+
<td style="text-align: center"> </td>
|
|
136
|
+
<td style="text-align: center"> </td>
|
|
137
|
+
</tr>
|
|
138
|
+
</tbody>
|
|
139
|
+
</table>
|
|
14
140
|
|
|
15
141
|
## Installation
|
|
16
142
|
|
|
17
143
|
First, install the gem: `gem install stanford-core-nlp`.
|
|
18
|
-
Then, download the Stanford Core NLP JAR and model files:
|
|
144
|
+
Then, download the Stanford Core NLP JAR and model files:
|
|
145
|
+
[Stanford CoreNLP](http://nlp.stanford.edu/software/stanford-corenlp-full-2014-10-31.zip)
|
|
19
146
|
|
|
20
|
-
Place the contents of the extracted archive inside the
|
|
147
|
+
Place the contents of the extracted archive inside the `/bin/` folder of
|
|
148
|
+
the stanford-core-nlp gem (e.g. [...]/gems/stanford-core-nlp-x.y.z/bin/).
|
|
21
149
|
|
|
22
150
|
## Configuration
|
|
23
151
|
|
|
@@ -110,7 +238,11 @@ puts StanfordCoreNLP::MaxentTagger.inspect
|
|
|
110
238
|
|
|
111
239
|
## List of annotator classes
|
|
112
240
|
|
|
113
|
-
Here is a full list of annotator classes provided by the Stanford Core NLP package.
|
|
241
|
+
Here is a full list of annotator classes provided by the Stanford Core NLP package.
|
|
242
|
+
You can load these classes individually using `StanfordCoreNLP.load_class`
|
|
243
|
+
(see above). Once this is done, you can use them like you would from
|
|
244
|
+
a Java program. Refer to the Java documentation for a list of functions provided
|
|
245
|
+
by each of these classes.
|
|
114
246
|
|
|
115
247
|
* PTBTokenizerAnnotator - tokenizes the text following Penn Treebank conventions.
|
|
116
248
|
* WordToSentenceAnnotator - splits a sequence of words into a sequence of sentences.
|
|
@@ -213,7 +345,35 @@ end
|
|
|
213
345
|
|
|
214
346
|
## Contributing
|
|
215
347
|
|
|
216
|
-
|
|
348
|
+
We are very glad to see you in this section and highly appreciate any help!
|
|
349
|
+
|
|
350
|
+
If you want to contribute, please agree that your work will be published
|
|
351
|
+
under the terms of the `GPL v.3.0` license.
|
|
352
|
+
|
|
353
|
+
Some of the open tasks for contributors are listed on the
|
|
354
|
+
[issues](https://github.com/louismullie/stanford-core-nlp/issues) page.
|
|
355
|
+
You may want to start there.
|
|
356
|
+
|
|
357
|
+
Then feel free to fork the code and send us a pull request.
|
|
358
|
+
|
|
359
|
+
## License
|
|
360
|
+
|
|
361
|
+
[](http://www.gnu.org/licenses/gpl-3.0) `stanford-core-nlp` by [Louis-Antoine Mullie](https://github.com/louismullie),
|
|
362
|
+
[Andrei Beliankou](https://github.com/arbox) and
|
|
363
|
+
[Contributors](https://github.com/louismullie/stanford-core-nlp/graphs/contributors).
|
|
364
|
+
|
|
365
|
+
> This program is free software: you can redistribute it and/or modify
|
|
366
|
+
> it under the terms of the GNU General Public License as published by
|
|
367
|
+
> the Free Software Foundation, either version 3 of the License, or
|
|
368
|
+
> (at your option) any later version.
|
|
369
|
+
|
|
370
|
+
> This program is distributed in the hope that it will be useful,
|
|
371
|
+
> but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
372
|
+
> MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
373
|
+
> GNU General Public License for more details.
|
|
374
|
+
|
|
375
|
+
> You should have received a copy of the GNU General Public License
|
|
376
|
+
> along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
217
377
|
|
|
218
|
-
|
|
219
|
-
|
|
378
|
+
<!--- Links --->
|
|
379
|
+
[ruby]: https://www.ruby-lang.org/en/
|
metadata
CHANGED
|
@@ -1,14 +1,15 @@
|
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
|
2
2
|
name: stanford-core-nlp
|
|
3
3
|
version: !ruby/object:Gem::Version
|
|
4
|
-
version:
|
|
4
|
+
version: 3.5.0.alpha
|
|
5
5
|
platform: ruby
|
|
6
6
|
authors:
|
|
7
7
|
- Louis Mullie
|
|
8
|
+
- Andrei Beliankou
|
|
8
9
|
autorequire:
|
|
9
10
|
bindir: bin
|
|
10
11
|
cert_chain: []
|
|
11
|
-
date:
|
|
12
|
+
date: 2017-02-16 00:00:00.000000000 Z
|
|
12
13
|
dependencies:
|
|
13
14
|
- !ruby/object:Gem::Dependency
|
|
14
15
|
name: bind-it
|
|
@@ -29,7 +30,7 @@ description: High-level Ruby bindings to the Stanford CoreNLP package, a set nat
|
|
|
29
30
|
parsing for several languages, as well as named entity recognition and coreference
|
|
30
31
|
resolution for English, German, French and other languages.
|
|
31
32
|
email:
|
|
32
|
-
-
|
|
33
|
+
- arbox@yandex.ru
|
|
33
34
|
executables: []
|
|
34
35
|
extensions: []
|
|
35
36
|
extra_rdoc_files: []
|
|
@@ -47,7 +48,7 @@ homepage: https://github.com/louismullie/stanford-core-nlp
|
|
|
47
48
|
licenses:
|
|
48
49
|
- GPL-3.0
|
|
49
50
|
metadata: {}
|
|
50
|
-
post_install_message:
|
|
51
|
+
post_install_message: This is an alpha release. Stay tuned!
|
|
51
52
|
rdoc_options: []
|
|
52
53
|
require_paths:
|
|
53
54
|
- lib
|
|
@@ -58,12 +59,12 @@ required_ruby_version: !ruby/object:Gem::Requirement
|
|
|
58
59
|
version: '0'
|
|
59
60
|
required_rubygems_version: !ruby/object:Gem::Requirement
|
|
60
61
|
requirements:
|
|
61
|
-
- - "
|
|
62
|
+
- - ">"
|
|
62
63
|
- !ruby/object:Gem::Version
|
|
63
|
-
version:
|
|
64
|
+
version: 1.3.1
|
|
64
65
|
requirements: []
|
|
65
66
|
rubyforge_project:
|
|
66
|
-
rubygems_version: 2.
|
|
67
|
+
rubygems_version: 2.6.8
|
|
67
68
|
signing_key:
|
|
68
69
|
specification_version: 4
|
|
69
70
|
summary: Ruby bindings to the Stanford Core NLP tools.
|