dwc_agent 3.0.0.2 → 3.0.0.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 4eef2473cbf2e8ce7d504a4ebce69aa9a3a9da5a6ca92018044a154ced201a9a
4
- data.tar.gz: 4337d9f5441da1e6a1970449ef381e99027aeb1efe22fa0f43270d0f2c122d8b
3
+ metadata.gz: 7e33855504e8b60e240c2ccf1efb192dcbeb9878fb5d2f0172772ec2c2d3e9fa
4
+ data.tar.gz: 260e2c9304731ad852b0587a22938b31d48aeb1bd7d922eb30755e795ec054fe
5
5
  SHA512:
6
- metadata.gz: bf4ad079202f2f5e7550b79e095649416d64d6bd74300127cf2272da0f3a11e77ab00d1b95c2867256c6f98e6247a725f9cf4261fa07db501b8c97f9adc5efaa
7
- data.tar.gz: 52265090309fda51f66b54cc522f20c1f0415b451aea8749b0457360ae4079301ff6fffcca3fa54de60a0da1737158c35d96683ca04c4c2806189503402710d6
6
+ metadata.gz: bb32cd909dd7d824bc7e064316ce3e10ee6cc6b14a12371cc8464f94f2b5d0b2f0b605aeef924e44423f1af8c2af62c001f67511e2dd438086f097b81da29b57
7
+ data.tar.gz: cf52be5fde1f4c7ebee816fd07ae3903c3f7c55a6a41542fd21cb265a868590a3391c0d17a514c2b40ac7ca7dbfd37d9cb53211aec4a0eb0c1ec9793aa4b7c6d
@@ -56,6 +56,9 @@ module DwcAgent
56
56
  (?i:autres?\s+de|probab|likely|possibl(e|y)|doubtful)|
57
57
  \b\s*(?i:maybe)\s*\b|
58
58
  \b\s*(?i:prob)\.\s*\b|
59
+ \b\s*(?i:field\s*number)|
60
+ \b\s*?(?i:malaise|light|pitfall|pan|suction|lobster|actinic light|cdc)\s*(?i:trap)\s*\b|
61
+ \|\s*(?i:collector\s*(field\s*)?number).*$|
59
62
  \(?[,]?\s*?(?i:(local)?\s?collectors?|data\s*recorder|netter|(oper|prepar)ator)\(?s?\)?\.?\:?|
60
63
  \b[.-–,;:]?\s*(?i:department|faculty)\s*?(?i:of)?\s*?(?i:entomology|biology|zoology)|
61
64
  (?i:Engº|Agrº|Fcº|Drº|Mº|Profº|Dº|Fº)|
@@ -196,11 +199,11 @@ module DwcAgent
196
199
  SEPARATORS = {
197
200
  "^(\\S{4,},\\s+(?:\\S\\.\\s*){1,})\\s+(\\S{4,},\\s+(?:\\S\.\\s*){1,})$" => "\\1 | \\2",
198
201
  "(\\S{1}\\.)([[:alpha:]]{2,})" => "\\1 \\2",
199
- "(\\w*),?\\s+(.*)\\s+(van|von)$" => "\\3 \\1, \\2",
200
- "^([A-Z.\\s]+)\\s+(?:and|&|et|e)\\s+([A-Z.\\s]+)\\s+(\\w{2,})(.*)" => "\\1 \\3 | \\2 \\3 | \\4",
201
- "^([A-Z]\\w{2,}),\\s*?([A-Z]\\w{2,})\\s*?[,&]\\s*?([A-Z]\\w{2,})$" => "\\1 | \\2 | \\3",
202
- "^([A-Z]\\w{2,}),\\s*?([A-Z]\\w{2,}),\\s*?([A-Z]\\w{2,})\\s*?[,&]\\s*?([A-Z]\\w{3,})$" => "\\1 | \\2 | \\3 | \\4",
203
- "^([A-Z]\\w{2,}),\\s*?([A-Z]\\w{2,}),\\s*?([A-Z]\\w{2,}),\\s*?([A-Z]\\w{2,})\\s*?[,&]\\s*?([A-Z]\\w{3,})$" => "\\1 | \\2 | \\3 | \\4 | \\5"
202
+ "([[:alpha:]]*),?\\s+(.*)\\s+(van|von)$" => "\\3 \\1, \\2",
203
+ "^([A-Z.\\s]+)\\s+(?:and|&|et|e)\\s+([A-Z.\\s]+)\\s+([[:alpha:]]{2,})(.*)" => "\\1 \\3 | \\2 \\3 | \\4",
204
+ "^([A-Z][[:alpha:]]{2,}),\\s*?([A-Z][[:alpha:]]{2,})\\s*?[,&]\\s*?([A-Z][[:alpha:]]{2,})$" => "\\1 | \\2 | \\3",
205
+ "^([A-Z][[:alpha:]]{2,}),\\s*?([A-Z][[:alpha:]]{2,}),\\s*?([A-Z][[:alpha:]]{2,})\\s*?[,&]\\s*?([A-Z][[:alpha:]]{3,})$" => "\\1 | \\2 | \\3 | \\4",
206
+ "^([A-Z][[:alpha:]]{2,}),\\s*?([A-Z][[:alpha:]]{2,}),\\s*?([A-Z][[:alpha:]]{2,}),\\s*?([A-Z][[:alpha:]]{2,})\\s*?[,&]\\s*?([A-Z][[:alpha:]]{3,})$" => "\\1 | \\2 | \\3 | \\4 | \\5"
204
207
  }
205
208
 
206
209
  BLACKLIST = %r{
@@ -290,16 +293,20 @@ module DwcAgent
290
293
  "von",
291
294
  "the",
292
295
  "of",
296
+ "new",
297
+ "no",
293
298
  "adjustment",
294
299
  "annotator",
295
300
  "available",
296
301
  "arachnology",
297
302
  "catalogue",
303
+ "comments",
298
304
  "curators",
299
305
  "data",
300
306
  "details",
301
307
  "determiner",
302
308
  "determination",
309
+ "dissected",
303
310
  "dissection",
304
311
  "entered",
305
312
  "erased",
@@ -329,7 +336,7 @@ module DwcAgent
329
336
  "has not"
330
337
  ]
331
338
 
332
- TITLE = /\s*\b(sir|count(ess)?|colonel|(gen|adm|col|maj|capt|cmdr|lt|sgt|cpl|pvt|proff?|dr|md|ph\.?d|rev|mme|abbé|ptre|bro|esq)\.?|docteur|father|cantor|vicar|père|pastor|rabbi|reverend|pere|soeur|sister|professor)(\s+|$)/i
339
+ TITLE = /\s*\b(sir|count(ess)?|colonel|(gen|adm|col|maj|capt|cmdr|lt|sgt|cpl|pvt|proff?|dr|md|ph\.?d|rev|mme|abbé|ptre|bro|esq)\.?|doct(eu|o)r|father|cantor|vicar|père|pastor|rabbi|reverend|pere|soeur|sister|professor)(\s+|$)/i
333
340
 
334
341
  APPELLATION = /\s*\b((mrs?|ms|fr|hr)\.?|miss|herr|frau)(\s+|$)/i
335
342
 
@@ -4,7 +4,7 @@ module DwcAgent
4
4
  MAJOR = 3
5
5
  MINOR = 0
6
6
  PATCH = 0
7
- BUILD = 2
7
+ BUILD = 6
8
8
 
9
9
  def self.version
10
10
  [MAJOR, MINOR, PATCH, BUILD].compact.join('.').freeze
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: dwc_agent
3
3
  version: !ruby/object:Gem::Version
4
- version: 3.0.0.2
4
+ version: 3.0.0.6
5
5
  platform: ruby
6
6
  authors:
7
7
  - David P. Shorthouse
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2021-08-16 00:00:00.000000000 Z
11
+ date: 2021-10-11 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: namae