dwc_agent 3.0.1.5 → 3.0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 10f552fa73693ac39a23ee515c5943cd47e097679721effe240d8f4b4f495fff
4
- data.tar.gz: 3dde6324c5d09ea3c71c96f485d9c10d9ba9c394ce55a8adbaa1ae3632c42028
3
+ metadata.gz: 4cf15dbefcecdfe7586bb2f71977477a82f7069befa6ab4ec0063db8f1417175
4
+ data.tar.gz: 5eb22a22b08b1d5925f163093460448cc6f2428ce7a70df8da175fe198ca7364
5
5
  SHA512:
6
- metadata.gz: 80ac3371e1132851e17bf6d0755bfb3ea990dcf43a7d68987a654f512b500912e117cf7cfd5d4b97e3c5cab5c6e02c5c66aac80797d43a27f7020b2a92165bd3
7
- data.tar.gz: 1f304b786cf6e6d62ed1763367c081ea4aaf54247aa0cb532995e6d34a25669c1231663b640b81d682a6d9b44376bccdf4493f1148d38b497bc23905fa14b95a
6
+ metadata.gz: 77c083f4b4672bf5381f43df6b0f600760b6ce5756929a9c0255d876ed170d72594be69437e78af43e7b0c671c33373b5b66822b6bc5874603f73b92134919b6
7
+ data.tar.gz: fd394686ecf2a68f3b98a31fd33c3a5abf42e4e453c1582af92d4fb913bfc7edc5cfc2ece996935697b64b3c86da7babaaafbc78566d7d255ce93bab3a511ac2
@@ -26,6 +26,12 @@ module DwcAgent
26
26
  # @return Namae::Name [Object] a new Namae object
27
27
  def clean(parsed_namae)
28
28
 
29
+ if parsed_namae.family &&
30
+ parsed_namae.family == NameCase(parsed_namae.family) &&
31
+ parsed_namae.display_order.split.join == parsed_namae.initials
32
+ return default
33
+ end
34
+
29
35
  if parsed_namae.given &&
30
36
  @given_blacklist.any?{ |s| s.casecmp(parsed_namae.given) == 0 }
31
37
  return
@@ -72,6 +78,7 @@ module DwcAgent
72
78
  parsed_namae.family &&
73
79
  parsed_namae.family.length <=3 &&
74
80
  parsed_namae.family == parsed_namae.family.upcase &&
81
+ #parsed_namae.family != NameCase(parsed_namae.family) &&
75
82
  parsed_namae.given[-1] != "."
76
83
  given = parsed_namae.given
77
84
  family = parsed_namae.family
@@ -137,7 +144,7 @@ module DwcAgent
137
144
  particle = nil
138
145
  end
139
146
 
140
- if !particle.nil? && particle.include?(".")
147
+ if !particle.nil? && particle.include?(".") && !particle.include?("v")
141
148
  particle = nil
142
149
  end
143
150
 
@@ -167,7 +174,9 @@ module DwcAgent
167
174
  given: given,
168
175
  particle: particle,
169
176
  family: family,
170
- suffix: suffix
177
+ suffix: suffix,
178
+ nick: parsed_namae.nick,
179
+ dropping_particle: parsed_namae.dropping_particle
171
180
  }
172
181
  Namae::Name.new(name)
173
182
  end
@@ -13,6 +13,7 @@ module DwcAgent
13
13
  \b[,;]?\s*(?i:and|&)?\s*(?i:others|party)\s*\b|
14
14
  \b[,;]?\s*(?i:etc)\.?|
15
15
  \b[,;]?\s*(?i:exp)\.?\s*(\b|\z)|
16
+ \b[,;]?\s*(?i:aboard)[^$]+|
16
17
  \b[,;]?\s*(?i:on)\b|
17
18
  \b[,;]?\s*(?i:unkn?own)\b|
18
19
  \b[,;]?\s*(?i:n/a)\b|
@@ -52,7 +53,7 @@ module DwcAgent
52
53
  \d+\s+(?i:Nov|Novemb(er|re))\.?\b|
53
54
  \d+\s+(?i:Dec|D(e|é)cemb(er|re))\.?\b|
54
55
  \b[.-–,;:/]?\s*(?i:Alabama|Alaska|Arizona|Arkansas|California|Colorado|Connecticut|Delaware|Evergreen|Florida|Hawaii|Idaho|Illinois|Indiana|Iowa|Kansas|Kentucky|Louisiana|Maine|Maryland|Massachusetts|Michigan|Minnesota|Mississippi|Missouri|Montana|Nebraska|Nevada|New\s+Hampshire|New\s+Jersey|New\s+Mexico|New\s+York|North\s+Carolina|North\s+Dakota|Ohio|Oklahoma|Oregon|Pennsylvania|Portland|Rhode\s+Island|South\s+Carolina|South\s+Dakota|St\s+Petersburg|Tennessee|Texas|Utah|Vermont|Washington|West\s+Virginia|Wisconsin|Wyoming)\s+(?i:State)\s*\b|
55
- \b[.,;:/]?\s*?(?i:Afghanistan|Åland Islands|Albania|Algeria|American Samoa|Andorra|Angola|Anguilla|Antarctica|Antigua and Barbuda|Argentina|Armenia|Aruba|Australia|Azerbaijan|Bahamas|Bahrain|Bangladesh|Barbados|Belarus|Belize|Benin|Bermuda|Bhutan|Bolivia \(Plurinational State of\)|Bonaire, Sint Eustatius and Saba|Bosnia and Herzegovina|Botswana|Bouvet Island|Brazil|British Indian Ocean Territory|Brunei Darussalam|Bulgaria|Burkina Faso|Burundi|Cabo Verde|Cambodia|Cameroon|Canada|Cayman Islands|Central African Republic|Chad|Chile|Christmas Island|Cocos \(Keeling\) Islands|Colombia|Comoros|Congo|Congo \(Democratic Republic of the\)|Cook Islands|Costa Rica|Côte d'Ivoire|Croatia|Cuba|Curaçao|Cyprus|Czechia|Djibouti|Dominica|Dominican Republic|Ecuador|Egypt|El Salvador|Equatorial Guinea|Eritrea|Estonia|Ethiopia|Falkland Islands \(Malvinas\)|Faroe Islands|Fiji|Finland|French Guiana|French Polynesia|French Southern Territories|Gabon|Gambia|Germany|Ghana|Gibraltar|Greece|Greenland|Grenada|Guadeloupe|Guam|Guatemala|Guernsey|Guinea-Bissau|Guyana|Haiti|Heard Island and McDonald Islands|Holy See|Honduras|Hong Kong|Hungary|Iceland|India|Indonesia|Iran \(Islamic Republic of\)|Iraq|Ireland|Isle of Man|Italy|Jamaica|Japan|Jersey|Kazakhstan|Kenya|Kiribati|Korea \(Democratic People\'s Republic of\)|Korea \(Republic of\)|Kuwait|Kyrgyzstan|Lao People\'s Democratic Republic|Latvia|Lebanon|Lesotho|Liberia|Libya|Liechtenstein|Lithuania|Luxembourg|Macao|Macedonia (the former Yugoslav Republic of)|Madagascar|Malawi|Malaysia|Maldives|Malta|Marshall Islands|Martinique|Mauritania|Mauritius|Mayotte|Mexico|Micronesia \(Federated States of\)|Moldova \(Republic of\)|Monaco|Mongolia|Montenegro|Morocco|Mozambique|Myanmar|Namibia|Nauru|Nepal|Netherlands|New Caledonia|New Zealand|Nicaragua|Niger|Nigeria|Niue|Norfolk Island|Northern Mariana Islands|Norway|Oman|Pakistan|Palau|Palestine, State of|Panama|Papua New Guinea|Paraguay|Peru|Philippines|Pitcairn|Poland|Puerto Rico|Qatar|Réunion|Romania|Russian Federation|Rwanda|Saint Barthélemy|Saint Helena, Ascension and Tristan da Cunha|Saint Kitts and Nevis|Saint Lucia|Saint Martin \(French part\)|Saint Pierre and Miquelon|Saint Vincent and the Grenadines|Samoa|San Marino|Sao Tome and Principe|Saudi Arabia|Senegal|Serbia|Seychelles|Sierra Leone|Singapore|Sint Maarten \(Dutch part\)|Slovakia|Slovenia|Solomon Islands|Somalia|South Africa|South Georgia and the South Sandwich Islands|South Sudan|Sri Lanka|Sudan|Suriname|Svalbard and Jan Mayen|Swaziland|Sweden|Switzerland|Syrian Arab Republic|Taiwan|Tajikistan|Tanzania, United Republic of|Thailand|Timor-Leste|Togo|Tokelau|Tonga|Trinidad and Tobago|Tunisia|Turkey|Turkmenistan|Turks and Caicos Islands|Tuvalu|Uganda|Ukraine|United Arab Emirates|United Kingdom of Great Britain and Northern Ireland|United States of America|United States Minor Outlying Islands|Uruguay|Uzbekistan|Vanuatu|Venezuela \(Bolivarian Republic of\)|Viet Nam|Virgin Islands \(British\)|Virgin Islands \(U\.S\.\)|Wallis and Futuna|Western Sahara|Yemen|Zambia|Zimbabwe)\b|
56
+ \b[.,;:/]?\s*?(?i:Afghanistan|Åland Islands|Albania|Algeria|American Samoa|Andorra|Angola|Anguilla|Antarctica|Antigua and Barbuda|Argentina|Armenia|Aruba|Australia|Azerbaijan|Bahamas|Bahrain|Bangladesh|Barbados|Belarus|Belize|Benin|Bermuda|Bhutan|Bolivia \(Plurinational State of\)|Bonaire, Sint Eustatius and Saba|Bosnia and Herzegovina|Botswana|Bouvet Island|Brazil|British Indian Ocean Territory|Brunei Darussalam|Bulgaria|Burkina Faso|Burundi|Cabo Verde|Cambodia|Cameroon|Canada|Cayman Islands|Central African Republic|Chad|Chile|Christmas Island|Cocos \(Keeling\) Islands|Colombia|Comoros|Congo|Congo \(Democratic Republic of the\)|Cook Islands|Costa Rica|Côte d'Ivoire|Croatia|Cuba|Curaçao|Cyprus|Czechia|Djibouti|Dominica|Dominican Republic|Ecuador|Egypt|El Salvador|Equatorial Guinea|Eritrea|Estonia|Ethiopia|Falkland Islands \(Malvinas\)|Faroe Islands|Fiji|Finland|French Guiana|French Polynesia|French Southern Territories|Gabon|Gambia|Germany|Ghana|Gibraltar|Greece|Greenland|Grenada|Guadeloupe|Guam|Guatemala|Guernsey|Guinea-Bissau|Guyana|Haiti|Heard Island and McDonald Islands|Holy See|Honduras|Hong Kong|Hungary|Iceland|India|Indonesia|Iran \(Islamic Republic of\)|Iraq|Ireland|Isle of Man|Italy|Jamaica|Japan|Jersey|Kazakhstan|Kenya|Kiribati|Korea \(Democratic People\'s Republic of\)|Korea \(Republic of\)|Kuwait|Kyrgyzstan|Lao People\'s Democratic Republic|Latvia|Lebanon|Lesotho|Liberia|Libya|Liechtenstein|Lithuania|Luxembourg|Macao|Macedonia (the former Yugoslav Republic of)|Madagascar|Malawi|Malaysia|Maldives|Malta|Marshall Islands|Martinique|Mauritania|Mauritius|Mayotte|Mexico|Micronesia \(Federated States of\)|Moldova \(Republic of\)|Monaco|Mongolia|Montenegro|Morocco|Mozambique|Myanmar|Namibia|Nauru|Nepal|Netherlands|New Caledonia|New Zealand|Nicaragua|Niger|Nigeria|Niue|Norfolk Island|Northern Mariana Islands|Norway|Oman|Pakistan|Palau|Palestine, State of|Panama|Papua New Guinea|Paraguay|Peru|Philippines|Pitcairn|Poland|Puerto Rico|Qatar|Réunion|Romania|Russian Federation|Russia|Rwanda|Saint Barthélemy|Saint Helena, Ascension and Tristan da Cunha|Saint Kitts and Nevis|Saint Lucia|Saint Martin \(French part\)|Saint Pierre and Miquelon|Saint Vincent and the Grenadines|Samoa|San Marino|Sao Tome and Principe|Saudi Arabia|Senegal|Serbia|Seychelles|Sierra Leone|Singapore|Sint Maarten \(Dutch part\)|Slovakia|Slovenia|Solomon Islands|Somalia|South Africa|South Georgia and the South Sandwich Islands|South Sudan|Sri Lanka|Sudan|Suriname|Svalbard and Jan Mayen|Swaziland|Sweden|Switzerland|Syrian Arab Republic|Taiwan|Tajikistan|Tanzania, United Republic of|Thailand|Timor-Leste|Togo|Tokelau|Tonga|Trinidad and Tobago|Tunisia|Turkey|Turkmenistan|Turks and Caicos Islands|Tuvalu|Uganda|Ukraine|United Arab Emirates|United Kingdom of Great Britain and Northern Ireland|United States of America|United States Minor Outlying Islands|Uruguay|Uzbekistan|Vanuatu|Venezuela \(Bolivarian Republic of\)|Viet Nam|Virgin Islands \(British\)|Virgin Islands \(U\.S\.\)|Wallis and Futuna|Western Sahara|Yemen|Zambia|Zimbabwe)\b|
56
57
  (?i:autres?\s+de|probab|likely|possibl(e|y)|doubtful)|
57
58
  \b\s*(?i:maybe)\s*\b|
58
59
  \b\s*(?i:prob)\.\s*\b|
@@ -102,7 +103,7 @@ module DwcAgent
102
103
  (?i:not?)\s+(?i:name|date|details?|specific)?\s*?(?i:given|name|date|noted)|
103
104
  (?i:non?)\s+(?i:specificato)|
104
105
  \b[,;]\s+\d+\z|
105
- ["!@?]|
106
+ [!@?]|
106
107
  [,]?\d+|
107
108
  \s+\d+?(\/|\.)?(?i:i|ii|iii|iv|v|vi|vii|viii|ix|x)(\/|\.)\d+|
108
109
  [,;]\z|
@@ -121,7 +122,8 @@ module DwcAgent
121
122
  ^[-,.\s;*\d]+\s?|
122
123
  \s*?-{2,}\s*?|
123
124
  ^(?i:exc?p?)[:.]\s*|
124
- (?i:ex\.?\s+herb\.?\s*)|
125
+ ^(?:ex\.?|in)\s+(?:he?r?b)\.?\s+|
126
+ (?!^)(?:ex\.?|in)\s+(?:he?r?b)\.?\s+.*$|
125
127
  \:?\s*(?i:exch)(\b|\z)|
126
128
  \s+de\s*$|
127
129
  \.{2,}$|
@@ -132,7 +134,7 @@ module DwcAgent
132
134
  [–|ǀ∣|│&+\/;:]|
133
135
  \s+-\s+|
134
136
  \s+a\.\s+|
135
- \b(con|e|y|i|en|et|or|per|for)\s*\b|
137
+ \b(con|e|y|i|en|et|or|per|for|und)\s*\b|
136
138
  \b(?i:and|with)\s*\b|
137
139
  \b(?i:annotated(\s+by)?)\s*\b|
138
140
  \b(?i:coll\.)\s*\b|
@@ -159,6 +161,7 @@ module DwcAgent
159
161
  }x
160
162
 
161
163
  CHAR_SUBS = {
164
+ '"' => '\'',
162
165
  '|' => ' | ',
163
166
  'ǀ' => ' | ',
164
167
  '∣' => ' | ',
@@ -4,8 +4,8 @@ module DwcAgent
4
4
 
5
5
  MAJOR = 3
6
6
  MINOR = 0
7
- PATCH = 1
8
- BUILD = 5
7
+ PATCH = 3
8
+ BUILD = 0
9
9
 
10
10
  def self.version
11
11
  [MAJOR, MINOR, PATCH, BUILD].compact.join('.').freeze
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: dwc_agent
3
3
  version: !ruby/object:Gem::Version
4
- version: 3.0.1.5
4
+ version: 3.0.3.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - David P. Shorthouse
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2022-10-24 00:00:00.000000000 Z
11
+ date: 2023-06-07 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: namae
@@ -119,7 +119,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
119
119
  - !ruby/object:Gem::Version
120
120
  version: '0'
121
121
  requirements: []
122
- rubygems_version: 3.3.17
122
+ rubygems_version: 3.3.7
123
123
  signing_key:
124
124
  specification_version: 4
125
125
  summary: Parse Darwin Core agent terms such as recordedBy and identifiedBy