dwc_agent 3.0.17.0 → 3.0.19.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/lib/dwc_agent/cleaner.rb +5 -1
- data/lib/dwc_agent/constants.rb +20 -4
- data/lib/dwc_agent/version.rb +1 -1
- metadata +2 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 232c24dde9ae5ecd8221049ab24283c2480c7d09df539f0eeef6b03729295360
|
4
|
+
data.tar.gz: 3fa7afa2113b78326938849744cf2e6a5a1f4949ba8567c0dac200872a72c62f
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 4a5778f3d32830ff95a2790c320d838df3c2e08937d8ca66cd1d3bf2a84560ce46b286f259bb213b7cf29c298d817c5f33d8ec09f958d65fd255825dc9dc1860
|
7
|
+
data.tar.gz: 8c01720ea2044073e3c850956e74b0a01f723350abb8b6d98183f9f8a6952f17dcbb5f64ab19311d72d57ff191634c783bc2b9e93cd40fd6c1819fa6c8de83fe
|
data/lib/dwc_agent/cleaner.rb
CHANGED
@@ -78,7 +78,6 @@ module DwcAgent
|
|
78
78
|
parsed_namae.family &&
|
79
79
|
parsed_namae.family.length <=3 &&
|
80
80
|
parsed_namae.family == parsed_namae.family.upcase &&
|
81
|
-
#parsed_namae.family != NameCase(parsed_namae.family) &&
|
82
81
|
parsed_namae.given[-1] != "."
|
83
82
|
given = parsed_namae.given
|
84
83
|
family = parsed_namae.family
|
@@ -168,6 +167,11 @@ module DwcAgent
|
|
168
167
|
return default
|
169
168
|
end
|
170
169
|
|
170
|
+
if !family.nil? && family.downcase.count(VOWELS) == 0 &&
|
171
|
+
!FAMILY_GREENLIST.any?{ |s| s.casecmp(family) == 0 }
|
172
|
+
return default
|
173
|
+
end
|
174
|
+
|
171
175
|
name = {
|
172
176
|
title: title,
|
173
177
|
appellation: appellation,
|
data/lib/dwc_agent/constants.rb
CHANGED
@@ -208,7 +208,8 @@ module DwcAgent
|
|
208
208
|
'-Jr' => ' Jr.',
|
209
209
|
'Dr.' => 'Dr. ',
|
210
210
|
'prof.' => 'Prof. ',
|
211
|
-
' .;' => '. ;'
|
211
|
+
' .;' => '. ;',
|
212
|
+
', &' => ' &'
|
212
213
|
}
|
213
214
|
|
214
215
|
SEPARATORS = {
|
@@ -219,9 +220,10 @@ module DwcAgent
|
|
219
220
|
"(\\S{1}\\.)([[:alpha:]]{2,})" => "\\1 \\2",
|
220
221
|
"^([[:alpha:]]{2,})(?:\\s+)((?:\\S{1}\\.\\s?){1,})$" => "\\1, \\2",
|
221
222
|
"([[:alpha:]]*),?\\s*(.*)\\s+(van|von|v\\.|v(a|o)n\\s+der?)$" => "\\3 \\1, \\2",
|
222
|
-
"^([A-Z
|
223
|
-
"^([A-Z
|
224
|
-
"^([A-Z
|
223
|
+
"^((?i:[A-Z]\\.\\s?){1,})\\s?(?:and|&|et|e)\\s+((?i:[A-Z]\\.\\s?){1,})\\s+([[:alpha:]’`'-]{2,})\\s+([[:alpha:]’`'-]{2,})$" => "\\1 \\4 | \\2 \\3 \\4",
|
224
|
+
"^((?i:[A-Z]\\.\\s?){1,})\\s?(?:and|&|et|e)\\s+((?i:[A-Z]\\.\\s?){1,})\\s+([[:alpha:]’`'-]{2,})(.*)$" => "\\1 \\3 | \\2 \\3 | \\4",
|
225
|
+
"^([A-Z]{1,3})\\s+(?:and|&|et|e)\\s+([A-Z]{1,3})\\s+([[:alpha:]’`'-]{2,})(.*)$" => "\\1 \\3 | \\2 \\3 | \\4",
|
226
|
+
"^((?i:[A-Z]\\.\\s?){1,}),\\s+([A-Z.\\s]+)\\s+(?:and|&|et|e)\\s+((?i:[A-Z]\\.\\s?){1,})\\s+([[:alpha:]’`'-]{2,})(.*)$" => "\\1 \\4 | \\2 \\4 | \\3 \\4 | \\5",
|
225
227
|
"^([A-Z][[:alpha:]]{2,}),\\s*?([A-Z][[:alpha:]]{2,})\\s*?(?i:and|&|et|e|,)\\s+([A-Z][[:alpha:]]{2,})$" => "\\1 | \\2 | \\3",
|
226
228
|
"^([A-Z][[:alpha:]]{2,}),\\s*?([A-Z][[:alpha:]]{2,}),\\s*?([A-Z][[:alpha:]]{2,})\\s*?(?i:and|&|et|e|,)\\s+([A-Z][[:alpha:]]{3,})$" => "\\1 | \\2 | \\3 | \\4",
|
227
229
|
"^([A-Z][[:alpha:]]{2,}),\\s*?([A-Z][[:alpha:]]{2,}),\\s*?([A-Z][[:alpha:]]{2,}),\\s*?([A-Z][[:alpha:]]{2,})\\s*?(?i:and|&|et|e|,)\\s+([A-Z][[:alpha:]]{3,})$" => "\\1 | \\2 | \\3 | \\4 | \\5"
|
@@ -300,6 +302,18 @@ module DwcAgent
|
|
300
302
|
^\s*?de\s*?$
|
301
303
|
}x
|
302
304
|
|
305
|
+
FAMILY_GREENLIST = [
|
306
|
+
"Ng",
|
307
|
+
"Srb",
|
308
|
+
"Srp",
|
309
|
+
"Vlk",
|
310
|
+
"Smrz",
|
311
|
+
"Smrž",
|
312
|
+
"Smrt",
|
313
|
+
"Krc",
|
314
|
+
"Krč"
|
315
|
+
]
|
316
|
+
|
303
317
|
FAMILY_BLACKLIST = [
|
304
318
|
"a b",
|
305
319
|
"a e",
|
@@ -402,4 +416,6 @@ module DwcAgent
|
|
402
416
|
"von der"
|
403
417
|
]
|
404
418
|
|
419
|
+
VOWELS = "aeiouäèéêëìíôöü"
|
420
|
+
|
405
421
|
end
|
data/lib/dwc_agent/version.rb
CHANGED
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: dwc_agent
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 3.0.17.0
|
4
|
+
version: 3.0.19.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- David P. Shorthouse
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date:
|
11
|
+
date: 2024-01-05 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: namae
|