dwc_agent 3.0.0.2 → 3.0.0.6
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/lib/dwc_agent/constants.rb +13 -6
- data/lib/dwc_agent/version.rb +1 -1
- metadata +2 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 7e33855504e8b60e240c2ccf1efb192dcbeb9878fb5d2f0172772ec2c2d3e9fa
|
4
|
+
data.tar.gz: 260e2c9304731ad852b0587a22938b31d48aeb1bd7d922eb30755e795ec054fe
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: bb32cd909dd7d824bc7e064316ce3e10ee6cc6b14a12371cc8464f94f2b5d0b2f0b605aeef924e44423f1af8c2af62c001f67511e2dd438086f097b81da29b57
|
7
|
+
data.tar.gz: cf52be5fde1f4c7ebee816fd07ae3903c3f7c55a6a41542fd21cb265a868590a3391c0d17a514c2b40ac7ca7dbfd37d9cb53211aec4a0eb0c1ec9793aa4b7c6d
|
data/lib/dwc_agent/constants.rb
CHANGED
@@ -56,6 +56,9 @@ module DwcAgent
|
|
56
56
|
(?i:autres?\s+de|probab|likely|possibl(e|y)|doubtful)|
|
57
57
|
\b\s*(?i:maybe)\s*\b|
|
58
58
|
\b\s*(?i:prob)\.\s*\b|
|
59
|
+
\b\s*(?i:field\s*number)|
|
60
|
+
\b\s*?(?i:malaise|light|pitfall|pan|suction|lobster|actinic light|cdc)\s*(?i:trap)\s*\b|
|
61
|
+
\|\s*(?i:collector\s*(field\s*)?number).*$|
|
59
62
|
\(?[,]?\s*?(?i:(local)?\s?collectors?|data\s*recorder|netter|(oper|prepar)ator)\(?s?\)?\.?\:?|
|
60
63
|
\b[.-–,;:]?\s*(?i:department|faculty)\s*?(?i:of)?\s*?(?i:entomology|biology|zoology)|
|
61
64
|
(?i:Engº|Agrº|Fcº|Drº|Mº|Profº|Dº|Fº)|
|
@@ -196,11 +199,11 @@ module DwcAgent
|
|
196
199
|
SEPARATORS = {
|
197
200
|
"^(\\S{4,},\\s+(?:\\S\\.\\s*){1,})\\s+(\\S{4,},\\s+(?:\\S\.\\s*){1,})$" => "\\1 | \\2",
|
198
201
|
"(\\S{1}\\.)([[:alpha:]]{2,})" => "\\1 \\2",
|
199
|
-
"(
|
200
|
-
"^([A-Z.\\s]+)\\s+(?:and|&|et|e)\\s+([A-Z.\\s]+)\\s+(
|
201
|
-
"^([A-Z]
|
202
|
-
"^([A-Z]
|
203
|
-
"^([A-Z]
|
202
|
+
"([[:alpha:]]*),?\\s+(.*)\\s+(van|von)$" => "\\3 \\1, \\2",
|
203
|
+
"^([A-Z.\\s]+)\\s+(?:and|&|et|e)\\s+([A-Z.\\s]+)\\s+([[:alpha:]]{2,})(.*)" => "\\1 \\3 | \\2 \\3 | \\4",
|
204
|
+
"^([A-Z][[:alpha:]]{2,}),\\s*?([A-Z][[:alpha:]]{2,})\\s*?[,&]\\s*?([A-Z][[:alpha:]]{2,})$" => "\\1 | \\2 | \\3",
|
205
|
+
"^([A-Z][[:alpha:]]{2,}),\\s*?([A-Z][[:alpha:]]{2,}),\\s*?([A-Z][[:alpha:]]{2,})\\s*?[,&]\\s*?([A-Z][[:alpha:]]{3,})$" => "\\1 | \\2 | \\3 | \\4",
|
206
|
+
"^([A-Z][[:alpha:]]{2,}),\\s*?([A-Z][[:alpha:]]{2,}),\\s*?([A-Z][[:alpha:]]{2,}),\\s*?([A-Z][[:alpha:]]{2,})\\s*?[,&]\\s*?([A-Z][[:alpha:]]{3,})$" => "\\1 | \\2 | \\3 | \\4 | \\5"
|
204
207
|
}
|
205
208
|
|
206
209
|
BLACKLIST = %r{
|
@@ -290,16 +293,20 @@ module DwcAgent
|
|
290
293
|
"von",
|
291
294
|
"the",
|
292
295
|
"of",
|
296
|
+
"new",
|
297
|
+
"no",
|
293
298
|
"adjustment",
|
294
299
|
"annotator",
|
295
300
|
"available",
|
296
301
|
"arachnology",
|
297
302
|
"catalogue",
|
303
|
+
"comments",
|
298
304
|
"curators",
|
299
305
|
"data",
|
300
306
|
"details",
|
301
307
|
"determiner",
|
302
308
|
"determination",
|
309
|
+
"dissected",
|
303
310
|
"dissection",
|
304
311
|
"entered",
|
305
312
|
"erased",
|
@@ -329,7 +336,7 @@ module DwcAgent
|
|
329
336
|
"has not"
|
330
337
|
]
|
331
338
|
|
332
|
-
TITLE = /\s*\b(sir|count(ess)?|colonel|(gen|adm|col|maj|capt|cmdr|lt|sgt|cpl|pvt|proff?|dr|md|ph\.?d|rev|mme|abbé|ptre|bro|esq)\.?|
|
339
|
+
TITLE = /\s*\b(sir|count(ess)?|colonel|(gen|adm|col|maj|capt|cmdr|lt|sgt|cpl|pvt|proff?|dr|md|ph\.?d|rev|mme|abbé|ptre|bro|esq)\.?|doct(eu|o)r|father|cantor|vicar|père|pastor|rabbi|reverend|pere|soeur|sister|professor)(\s+|$)/i
|
333
340
|
|
334
341
|
APPELLATION = /\s*\b((mrs?|ms|fr|hr)\.?|miss|herr|frau)(\s+|$)/i
|
335
342
|
|
data/lib/dwc_agent/version.rb
CHANGED
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: dwc_agent
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 3.0.0.
|
4
|
+
version: 3.0.0.6
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- David P. Shorthouse
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2021-
|
11
|
+
date: 2021-10-11 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: namae
|