name-spotter 0.2.4 → 0.3.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +7 -0
- data/.byebug_history +44 -0
- data/.gitignore +51 -0
- data/.rspec +2 -0
- data/.ruby-version +1 -0
- data/.travis.yml +22 -0
- data/CHANGELOG +2 -0
- data/Gemfile +2 -22
- data/README.md +116 -0
- data/Rakefile +2 -19
- data/lib/name-spotter.rb +3 -1
- data/lib/name-spotter/monkey_patches.rb +4 -2
- data/lib/name-spotter/neti_neti_client.rb +13 -6
- data/lib/name-spotter/scientific_name.rb +3 -3
- data/lib/name-spotter/taxon_finder_client.rb +35 -24
- data/lib/name-spotter/version.rb +8 -0
- data/name-spotter.gemspec +26 -98
- data/spec/name-spotter_spec.rb +334 -131
- data/spec/scientific_name_spec.rb +14 -19
- data/spec/spec_helper.rb +2 -12
- data/tf_logic.txt +3 -3
- metadata +69 -142
- data/.rvmrc +0 -1
- data/Gemfile.lock +0 -84
- data/README.rdoc +0 -95
- data/VERSION +0 -1
- data/features/name-spotter.feature +0 -9
- data/features/step_definitions/name-spotter_steps.rb +0 -0
- data/features/support/env.rb +0 -13
@@ -1,25 +1,20 @@
|
|
1
|
-
# encoding: utf-8
|
2
|
-
require File.expand_path(File.dirname(__FILE__) + '/spec_helper')
|
3
|
-
|
4
1
|
describe NameSpotter::ScientificName do
|
5
|
-
|
6
|
-
describe "
|
7
|
-
|
8
|
-
|
9
|
-
|
10
|
-
|
11
|
-
|
12
|
-
|
13
|
-
@name.end_pos.should eq @name.start_pos + @find_me.length - 1
|
2
|
+
|
3
|
+
describe ".new" do
|
4
|
+
it "calculates end_pos" do
|
5
|
+
find_me = "M. musculus"
|
6
|
+
name = NameSpotter::ScientificName.new(
|
7
|
+
find_me, { start_position: 30, scientific_name: "Mus musculus" }
|
8
|
+
)
|
9
|
+
expect(name.end_pos).to eq(name.start_pos + find_me.length - 1)
|
14
10
|
end
|
15
|
-
|
16
|
-
|
17
|
-
describe "unicode" do
|
18
|
-
it "should handle unicode characters" do
|
11
|
+
|
12
|
+
it "handles unicode characters" do
|
19
13
|
verbatim = "Slovenščina"
|
20
|
-
name = NameSpotter::ScientificName.
|
21
|
-
|
22
|
-
name.
|
14
|
+
name = NameSpotter::ScientificName.
|
15
|
+
new(verbatim, { start_position: 48193 })
|
16
|
+
expect(name.verbatim).to eq verbatim
|
17
|
+
expect(name.end_pos).to eq(name.start_pos + verbatim.length - 1)
|
23
18
|
end
|
24
19
|
end
|
25
20
|
end
|
data/spec/spec_helper.rb
CHANGED
@@ -1,12 +1,2 @@
|
|
1
|
-
|
2
|
-
|
3
|
-
require 'rspec'
|
4
|
-
require 'name-spotter'
|
5
|
-
|
6
|
-
# Requires supporting files with custom matchers and macros, etc,
|
7
|
-
# in ./support/ and its subdirectories.
|
8
|
-
Dir["#{File.dirname(__FILE__)}/support/**/*.rb"].each {|f| require f}
|
9
|
-
|
10
|
-
RSpec.configure do |config|
|
11
|
-
|
12
|
-
end
|
1
|
+
require "rspec"
|
2
|
+
require "name-spotter"
|
data/tf_logic.txt
CHANGED
@@ -23,11 +23,11 @@ for Genus + species
|
|
23
23
|
if genus found and species, but not end of the sentence
|
24
24
|
$currentString $cleanCandidateWord|species|$wordListMatches"."$score||-1||
|
25
25
|
search continues... found species, can be subspecies
|
26
|
-
|
26
|
+
|
27
27
|
for abbreviated Genera (1-2 letters (where '-' can also be the first letter ???):
|
28
28
|
expand Genus if last used genus is known with this letters
|
29
29
|
if abbrev did not make sense (genus is not found):
|
30
|
-
||0||-1||
|
30
|
+
||0||-1||
|
31
31
|
- result is nothing
|
32
32
|
Also means 2 letter genera are not found by NameFinder
|
33
33
|
|
@@ -43,7 +43,7 @@ for Genus + species
|
|
43
43
|
"$currentString ($cleanCandidateWord)|genus|$wordListMatches"."$scoreG||-1||\n"
|
44
44
|
if next word is genus
|
45
45
|
****"$cleanCandidateWord|genus|$scoreG|$currentString|$wordListMatches||\n"
|
46
|
-
|
46
|
+
|
47
47
|
if next word is family
|
48
48
|
if genus was abbreviated make it ""
|
49
49
|
****"||0|$currentString|$wordListMatches"; empty string genus -- should be ignored
|
metadata
CHANGED
@@ -1,254 +1,185 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: name-spotter
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.
|
5
|
-
prerelease:
|
4
|
+
version: 0.3.0
|
6
5
|
platform: ruby
|
7
6
|
authors:
|
8
7
|
- Anthony Goddard
|
9
8
|
- Chuck Ha
|
10
9
|
- Dmitry Mozzherin
|
10
|
+
- David Shorthouse
|
11
11
|
autorequire:
|
12
12
|
bindir: bin
|
13
13
|
cert_chain: []
|
14
|
-
date:
|
14
|
+
date: 2016-02-28 00:00:00.000000000 Z
|
15
15
|
dependencies:
|
16
16
|
- !ruby/object:Gem::Dependency
|
17
17
|
name: rake
|
18
18
|
requirement: !ruby/object:Gem::Requirement
|
19
|
-
none: false
|
20
19
|
requirements:
|
21
|
-
- -
|
20
|
+
- - "~>"
|
22
21
|
- !ruby/object:Gem::Version
|
23
|
-
version: '
|
22
|
+
version: '10.5'
|
24
23
|
type: :runtime
|
25
24
|
prerelease: false
|
26
25
|
version_requirements: !ruby/object:Gem::Requirement
|
27
|
-
none: false
|
28
26
|
requirements:
|
29
|
-
- -
|
27
|
+
- - "~>"
|
30
28
|
- !ruby/object:Gem::Version
|
31
|
-
version: '
|
29
|
+
version: '10.5'
|
32
30
|
- !ruby/object:Gem::Dependency
|
33
31
|
name: rest-client
|
34
32
|
requirement: !ruby/object:Gem::Requirement
|
35
|
-
none: false
|
36
33
|
requirements:
|
37
|
-
- -
|
34
|
+
- - "~>"
|
38
35
|
- !ruby/object:Gem::Version
|
39
|
-
version: '
|
36
|
+
version: '1.8'
|
40
37
|
type: :runtime
|
41
38
|
prerelease: false
|
42
39
|
version_requirements: !ruby/object:Gem::Requirement
|
43
|
-
none: false
|
44
40
|
requirements:
|
45
|
-
- -
|
41
|
+
- - "~>"
|
46
42
|
- !ruby/object:Gem::Version
|
47
|
-
version: '
|
43
|
+
version: '1.8'
|
48
44
|
- !ruby/object:Gem::Dependency
|
49
|
-
name:
|
45
|
+
name: nokogiri
|
50
46
|
requirement: !ruby/object:Gem::Requirement
|
51
|
-
none: false
|
52
47
|
requirements:
|
53
|
-
- -
|
48
|
+
- - "~>"
|
54
49
|
- !ruby/object:Gem::Version
|
55
|
-
version: '
|
50
|
+
version: '1.6'
|
56
51
|
type: :runtime
|
57
52
|
prerelease: false
|
58
53
|
version_requirements: !ruby/object:Gem::Requirement
|
59
|
-
none: false
|
60
54
|
requirements:
|
61
|
-
- -
|
55
|
+
- - "~>"
|
62
56
|
- !ruby/object:Gem::Version
|
63
|
-
version: '
|
57
|
+
version: '1.6'
|
64
58
|
- !ruby/object:Gem::Dependency
|
65
|
-
name:
|
59
|
+
name: builder
|
66
60
|
requirement: !ruby/object:Gem::Requirement
|
67
|
-
none: false
|
68
61
|
requirements:
|
69
|
-
- -
|
62
|
+
- - "~>"
|
70
63
|
- !ruby/object:Gem::Version
|
71
|
-
version: '
|
64
|
+
version: '3.2'
|
72
65
|
type: :runtime
|
73
66
|
prerelease: false
|
74
67
|
version_requirements: !ruby/object:Gem::Requirement
|
75
|
-
none: false
|
76
68
|
requirements:
|
77
|
-
- -
|
69
|
+
- - "~>"
|
78
70
|
- !ruby/object:Gem::Version
|
79
|
-
version: '
|
71
|
+
version: '3.2'
|
80
72
|
- !ruby/object:Gem::Dependency
|
81
|
-
name:
|
73
|
+
name: json
|
82
74
|
requirement: !ruby/object:Gem::Requirement
|
83
|
-
none: false
|
84
75
|
requirements:
|
85
|
-
- -
|
76
|
+
- - "~>"
|
86
77
|
- !ruby/object:Gem::Version
|
87
|
-
version: '
|
78
|
+
version: '1.8'
|
88
79
|
type: :runtime
|
89
80
|
prerelease: false
|
90
81
|
version_requirements: !ruby/object:Gem::Requirement
|
91
|
-
none: false
|
92
82
|
requirements:
|
93
|
-
- -
|
83
|
+
- - "~>"
|
94
84
|
- !ruby/object:Gem::Version
|
95
|
-
version: '
|
85
|
+
version: '1.8'
|
96
86
|
- !ruby/object:Gem::Dependency
|
97
|
-
name:
|
87
|
+
name: unicode_utils
|
98
88
|
requirement: !ruby/object:Gem::Requirement
|
99
|
-
none: false
|
100
89
|
requirements:
|
101
|
-
- -
|
90
|
+
- - "~>"
|
102
91
|
- !ruby/object:Gem::Version
|
103
|
-
version: '
|
92
|
+
version: '1.4'
|
104
93
|
type: :runtime
|
105
94
|
prerelease: false
|
106
95
|
version_requirements: !ruby/object:Gem::Requirement
|
107
|
-
none: false
|
108
|
-
requirements:
|
109
|
-
- - ! '>='
|
110
|
-
- !ruby/object:Gem::Version
|
111
|
-
version: '0'
|
112
|
-
- !ruby/object:Gem::Dependency
|
113
|
-
name: rspec
|
114
|
-
requirement: !ruby/object:Gem::Requirement
|
115
|
-
none: false
|
116
|
-
requirements:
|
117
|
-
- - ! '>='
|
118
|
-
- !ruby/object:Gem::Version
|
119
|
-
version: '0'
|
120
|
-
type: :development
|
121
|
-
prerelease: false
|
122
|
-
version_requirements: !ruby/object:Gem::Requirement
|
123
|
-
none: false
|
124
|
-
requirements:
|
125
|
-
- - ! '>='
|
126
|
-
- !ruby/object:Gem::Version
|
127
|
-
version: '0'
|
128
|
-
- !ruby/object:Gem::Dependency
|
129
|
-
name: rspec-expectations
|
130
|
-
requirement: !ruby/object:Gem::Requirement
|
131
|
-
none: false
|
132
|
-
requirements:
|
133
|
-
- - ! '>='
|
134
|
-
- !ruby/object:Gem::Version
|
135
|
-
version: '0'
|
136
|
-
type: :development
|
137
|
-
prerelease: false
|
138
|
-
version_requirements: !ruby/object:Gem::Requirement
|
139
|
-
none: false
|
140
96
|
requirements:
|
141
|
-
- -
|
97
|
+
- - "~>"
|
142
98
|
- !ruby/object:Gem::Version
|
143
|
-
version: '
|
99
|
+
version: '1.4'
|
144
100
|
- !ruby/object:Gem::Dependency
|
145
|
-
name:
|
101
|
+
name: unsupervised-language-detection
|
146
102
|
requirement: !ruby/object:Gem::Requirement
|
147
|
-
none: false
|
148
103
|
requirements:
|
149
|
-
- -
|
104
|
+
- - "~>"
|
150
105
|
- !ruby/object:Gem::Version
|
151
|
-
version:
|
152
|
-
type: :
|
106
|
+
version: 0.0.6
|
107
|
+
type: :runtime
|
153
108
|
prerelease: false
|
154
109
|
version_requirements: !ruby/object:Gem::Requirement
|
155
|
-
none: false
|
156
110
|
requirements:
|
157
|
-
- -
|
111
|
+
- - "~>"
|
158
112
|
- !ruby/object:Gem::Version
|
159
|
-
version:
|
113
|
+
version: 0.0.6
|
160
114
|
- !ruby/object:Gem::Dependency
|
161
|
-
name:
|
115
|
+
name: rspec
|
162
116
|
requirement: !ruby/object:Gem::Requirement
|
163
|
-
none: false
|
164
117
|
requirements:
|
165
|
-
- -
|
118
|
+
- - "~>"
|
166
119
|
- !ruby/object:Gem::Version
|
167
|
-
version: '
|
120
|
+
version: '3.1'
|
168
121
|
type: :development
|
169
122
|
prerelease: false
|
170
123
|
version_requirements: !ruby/object:Gem::Requirement
|
171
|
-
none: false
|
172
124
|
requirements:
|
173
|
-
- -
|
125
|
+
- - "~>"
|
174
126
|
- !ruby/object:Gem::Version
|
175
|
-
version: '
|
127
|
+
version: '3.1'
|
176
128
|
- !ruby/object:Gem::Dependency
|
177
129
|
name: bundler
|
178
130
|
requirement: !ruby/object:Gem::Requirement
|
179
|
-
none: false
|
180
131
|
requirements:
|
181
|
-
- -
|
132
|
+
- - "~>"
|
182
133
|
- !ruby/object:Gem::Version
|
183
|
-
version: '
|
134
|
+
version: '1.10'
|
184
135
|
type: :development
|
185
136
|
prerelease: false
|
186
137
|
version_requirements: !ruby/object:Gem::Requirement
|
187
|
-
none: false
|
188
138
|
requirements:
|
189
|
-
- -
|
139
|
+
- - "~>"
|
190
140
|
- !ruby/object:Gem::Version
|
191
|
-
version: '
|
141
|
+
version: '1.10'
|
192
142
|
- !ruby/object:Gem::Dependency
|
193
|
-
name:
|
143
|
+
name: byebug
|
194
144
|
requirement: !ruby/object:Gem::Requirement
|
195
|
-
none: false
|
196
145
|
requirements:
|
197
|
-
- - ~>
|
146
|
+
- - "~>"
|
198
147
|
- !ruby/object:Gem::Version
|
199
|
-
version:
|
148
|
+
version: '8.2'
|
200
149
|
type: :development
|
201
150
|
prerelease: false
|
202
151
|
version_requirements: !ruby/object:Gem::Requirement
|
203
|
-
none: false
|
204
152
|
requirements:
|
205
|
-
- - ~>
|
153
|
+
- - "~>"
|
206
154
|
- !ruby/object:Gem::Version
|
207
|
-
version:
|
208
|
-
|
209
|
-
|
210
|
-
|
211
|
-
|
212
|
-
requirements:
|
213
|
-
- - ! '>='
|
214
|
-
- !ruby/object:Gem::Version
|
215
|
-
version: '0'
|
216
|
-
type: :development
|
217
|
-
prerelease: false
|
218
|
-
version_requirements: !ruby/object:Gem::Requirement
|
219
|
-
none: false
|
220
|
-
requirements:
|
221
|
-
- - ! '>='
|
222
|
-
- !ruby/object:Gem::Version
|
223
|
-
version: '0'
|
224
|
-
description: The gem searches for scientific names in texts using socket servers running
|
225
|
-
TaxonFinder (by Patrick Leary) and NetiNeti (by Lakshmi Manohar Akella)
|
155
|
+
version: '8.2'
|
156
|
+
description: |-
|
157
|
+
The gem searches for scientific names in texts using
|
158
|
+
socket servers running TaxonFinder (by Patrick Leary)
|
159
|
+
and NetiNeti (by Lakshmi Manohar Akella)
|
226
160
|
email: dmozzherin@gmail.com
|
227
161
|
executables: []
|
228
162
|
extensions: []
|
229
|
-
extra_rdoc_files:
|
230
|
-
- LICENSE.txt
|
231
|
-
- README.rdoc
|
163
|
+
extra_rdoc_files: []
|
232
164
|
files:
|
233
|
-
- .
|
234
|
-
- .
|
235
|
-
- .
|
165
|
+
- ".byebug_history"
|
166
|
+
- ".document"
|
167
|
+
- ".gitignore"
|
168
|
+
- ".rspec"
|
169
|
+
- ".ruby-version"
|
170
|
+
- ".travis.yml"
|
236
171
|
- CHANGELOG
|
237
172
|
- Gemfile
|
238
|
-
- Gemfile.lock
|
239
173
|
- LICENSE.txt
|
240
|
-
- README.
|
174
|
+
- README.md
|
241
175
|
- Rakefile
|
242
|
-
- VERSION
|
243
|
-
- features/name-spotter.feature
|
244
|
-
- features/step_definitions/name-spotter_steps.rb
|
245
|
-
- features/support/env.rb
|
246
176
|
- lib/name-spotter.rb
|
247
177
|
- lib/name-spotter/client.rb
|
248
178
|
- lib/name-spotter/monkey_patches.rb
|
249
179
|
- lib/name-spotter/neti_neti_client.rb
|
250
180
|
- lib/name-spotter/scientific_name.rb
|
251
181
|
- lib/name-spotter/taxon_finder_client.rb
|
182
|
+
- lib/name-spotter/version.rb
|
252
183
|
- name-spotter.gemspec
|
253
184
|
- spec/files/english.txt
|
254
185
|
- spec/files/journalofentomol13pomo_0018.txt
|
@@ -261,29 +192,25 @@ files:
|
|
261
192
|
homepage: http://github.com/GlobalNamesArchitecture/name-spotter
|
262
193
|
licenses:
|
263
194
|
- MIT
|
195
|
+
metadata: {}
|
264
196
|
post_install_message:
|
265
197
|
rdoc_options: []
|
266
198
|
require_paths:
|
267
199
|
- lib
|
268
200
|
required_ruby_version: !ruby/object:Gem::Requirement
|
269
|
-
none: false
|
270
201
|
requirements:
|
271
|
-
- -
|
202
|
+
- - ">="
|
272
203
|
- !ruby/object:Gem::Version
|
273
204
|
version: '0'
|
274
|
-
segments:
|
275
|
-
- 0
|
276
|
-
hash: -3941125736575369993
|
277
205
|
required_rubygems_version: !ruby/object:Gem::Requirement
|
278
|
-
none: false
|
279
206
|
requirements:
|
280
|
-
- -
|
207
|
+
- - ">="
|
281
208
|
- !ruby/object:Gem::Version
|
282
209
|
version: '0'
|
283
210
|
requirements: []
|
284
211
|
rubyforge_project:
|
285
|
-
rubygems_version:
|
212
|
+
rubygems_version: 2.2.3
|
286
213
|
signing_key:
|
287
|
-
specification_version:
|
214
|
+
specification_version: 4
|
288
215
|
summary: Scientific names finder
|
289
216
|
test_files: []
|
data/.rvmrc
DELETED
@@ -1 +0,0 @@
|
|
1
|
-
rvm use ruby-1.9.3-p194@namespotter --create
|
data/Gemfile.lock
DELETED
@@ -1,84 +0,0 @@
|
|
1
|
-
GEM
|
2
|
-
remote: http://rubygems.org/
|
3
|
-
specs:
|
4
|
-
addressable (2.3.2)
|
5
|
-
builder (3.0.0)
|
6
|
-
capybara (1.1.2)
|
7
|
-
mime-types (>= 1.16)
|
8
|
-
nokogiri (>= 1.3.3)
|
9
|
-
rack (>= 1.0.0)
|
10
|
-
rack-test (>= 0.5.4)
|
11
|
-
selenium-webdriver (~> 2.0)
|
12
|
-
xpath (~> 0.1.4)
|
13
|
-
childprocess (0.3.5)
|
14
|
-
ffi (~> 1.0, >= 1.0.6)
|
15
|
-
columnize (0.3.6)
|
16
|
-
cucumber (1.2.1)
|
17
|
-
builder (>= 2.1.2)
|
18
|
-
diff-lcs (>= 1.1.3)
|
19
|
-
gherkin (~> 2.11.0)
|
20
|
-
json (>= 1.4.6)
|
21
|
-
debugger (1.2.0)
|
22
|
-
columnize (>= 0.3.1)
|
23
|
-
debugger-linecache (~> 1.1.1)
|
24
|
-
debugger-ruby_core_source (~> 1.1.3)
|
25
|
-
debugger-linecache (1.1.2)
|
26
|
-
debugger-ruby_core_source (>= 1.1.1)
|
27
|
-
debugger-ruby_core_source (1.1.3)
|
28
|
-
diff-lcs (1.1.3)
|
29
|
-
ffi (1.1.5)
|
30
|
-
gherkin (2.11.2)
|
31
|
-
json (>= 1.4.6)
|
32
|
-
git (1.2.5)
|
33
|
-
jeweler (1.6.4)
|
34
|
-
bundler (~> 1.0)
|
35
|
-
git (>= 1.2.5)
|
36
|
-
rake
|
37
|
-
json (1.7.5)
|
38
|
-
libwebsocket (0.1.5)
|
39
|
-
addressable
|
40
|
-
mime-types (1.19)
|
41
|
-
multi_json (1.3.6)
|
42
|
-
nokogiri (1.5.5)
|
43
|
-
rack (1.4.1)
|
44
|
-
rack-test (0.6.1)
|
45
|
-
rack (>= 1.0)
|
46
|
-
rake (0.9.2.2)
|
47
|
-
rest-client (1.6.7)
|
48
|
-
mime-types (>= 1.16)
|
49
|
-
rspec (2.11.0)
|
50
|
-
rspec-core (~> 2.11.0)
|
51
|
-
rspec-expectations (~> 2.11.0)
|
52
|
-
rspec-mocks (~> 2.11.0)
|
53
|
-
rspec-core (2.11.1)
|
54
|
-
rspec-expectations (2.11.2)
|
55
|
-
diff-lcs (~> 1.1.3)
|
56
|
-
rspec-mocks (2.11.2)
|
57
|
-
rubyzip (0.9.9)
|
58
|
-
selenium-webdriver (2.25.0)
|
59
|
-
childprocess (>= 0.2.5)
|
60
|
-
libwebsocket (~> 0.1.3)
|
61
|
-
multi_json (~> 1.0)
|
62
|
-
rubyzip
|
63
|
-
unicode_utils (1.3.0)
|
64
|
-
unsupervised-language-detection (0.0.6)
|
65
|
-
xpath (0.1.4)
|
66
|
-
nokogiri (~> 1.3)
|
67
|
-
|
68
|
-
PLATFORMS
|
69
|
-
ruby
|
70
|
-
|
71
|
-
DEPENDENCIES
|
72
|
-
builder
|
73
|
-
bundler
|
74
|
-
capybara
|
75
|
-
cucumber
|
76
|
-
debugger
|
77
|
-
jeweler (~> 1.6.4)
|
78
|
-
json
|
79
|
-
rake
|
80
|
-
rest-client
|
81
|
-
rspec
|
82
|
-
rspec-expectations
|
83
|
-
unicode_utils
|
84
|
-
unsupervised-language-detection
|