dwc_agent 0.1.8 → 0.1.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA1:
3
- metadata.gz: 20ca1d9afefdaaed29ca0133174b2781d412dd7a
4
- data.tar.gz: 5462f4e78954f3b71f3a52620eab958ee10abcff
3
+ metadata.gz: 5e5662fb6ce9768a7e4842123e7d6bd1f3609383
4
+ data.tar.gz: bf361f626333393dc5f68a960d6b9f2ceb3b634d
5
5
  SHA512:
6
- metadata.gz: 432d7daa90ca150304b2a20619c457dacb3d1f8964548402e02fad2a0ed77816a96dbf48b519712a9bd6b0cdf8cb7c888f886adc5cae9e6ccd1a40169c3acbb0
7
- data.tar.gz: 411aba8a997ed6b82a42960e1c943ce2b23f0abc4d3565c6a91c3da084ff41537c38bcae74f03c1debc955f66db93c8a818c107d03e159009c39b0557fe78f24
6
+ metadata.gz: 57cb357cf32164f6c0a50b604e1995626404565888a958842bcc50d32d5a6a9fd24f59d36768e1d5eb18eb8a03b1f9c301df66a174bc1fc93a10e5ae9715bc99
7
+ data.tar.gz: 2719e50b188b8babf83afccf4f3dfabddc5f7ba3a17716df4a2b2b7e9cf33d72d6e9da1dacfe3e8c818b49e5a3261a53a52875b25c24d6087c7da8e9f9f07cff
@@ -53,6 +53,7 @@ module DwcAgent
53
53
  (?i:crossed\s+out)|
54
54
  \(?(?i:source)\(?|
55
55
  (?i:according\s+to)|
56
+ (?i:museum\s+victoria)|
56
57
  (?i:revised|photograph|fruits\s+only)|
57
58
  -?\s*(?i:sight\s+(id|identifi?cation))\.?\s*\b|
58
59
  -?\s*(?i:synonym(y|ie))|
@@ -60,6 +61,7 @@ module DwcAgent
60
61
  \b(?i:to\s+(sub)?spp?)\.?|
61
62
  (?i:nom\.?\s+rev\.?)|
62
63
  FNA|DAO|HUH|FDNMB|\(MT\)|(?i:\(KEW\))|
64
+ (?i:university|museum|exhibits?)|
63
65
  (?i:uqam)|
64
66
  \b[,;]\s+\d+\z|
65
67
  [":!]|
@@ -68,18 +70,19 @@ module DwcAgent
68
70
  [,;]\z|
69
71
  ^\w{0,2}\z|
70
72
  ^[A-Z]{2,}\z|
73
+ (?i:annot\.?)\b|
71
74
  \s+(?i:stet)\s*!?\s*\z|
72
75
  \s+(?i:prep)\.?\s*\z|
73
- \b\s*\([A-Z]{2,}\)
76
+ \b\s*\([A-Z]{2,}\)|
77
+ \b[lL]eg[\.:]\s*\b
74
78
  }x
75
79
 
76
80
  SPLIT_BY = %r{
77
81
  [–|&+/;]|
78
82
  \s+-\s+|
79
83
  \s+a\.\s+|
80
- \b(?i:and|et|with|per)\s+|
81
- \s+y\s*\b|
82
- \be\s*\b|
84
+ \b(e|y|en|et|or|per|for)\s*\b|
85
+ \b(?i:and|with)\s*\b|
83
86
  \b(?i:annotated(\s+by)?)\s*\b|
84
87
  \b(?i:coll\.)\s*\b|
85
88
  \b(?i:communicate?d(\s+to)?)\s*\b|
@@ -90,7 +93,6 @@ module DwcAgent
90
93
  \b(?i:ex\.?(\s+by)?|examined(\s+by)?)\s*\b|
91
94
  \b(?i:in?dentified(\s+by)?)\s*\b|
92
95
  \b(?i:in\s+part(\s+by)?)\s*\b|
93
- \b(?i:or)\s+|
94
96
  \b(?i:prep\.?\s+(?i:by)?)\s*\b|
95
97
  \b(?i:redet\.?(\s+by?)?)\s*\b|
96
98
  \b(?i:reidentified(\s+by)?)\s*\b|
@@ -113,7 +115,11 @@ module DwcAgent
113
115
  '#' => '',
114
116
  '/' => ' / ',
115
117
  '&' => ' & ',
116
- '*' => ''
118
+ '*' => '',
119
+ '>' => '',
120
+ '<' => '',
121
+ '{' => '',
122
+ '}' => ''
117
123
  }
118
124
 
119
125
  COMPLEX_SEPARATORS = %r{
@@ -143,7 +149,7 @@ module DwcAgent
143
149
  (?i:ent(o|y)mology)|
144
150
  (?i:mus(eum|ée)|universit(y|é|e|at)|college|institute?|acad(e|é)m|school|écol(e|iers?)|laboratoi?r|projec?t|polytech|dep(t|art?ment)|research|clinic|hospital|cientifica|sanctuary|safari)|
145
151
  (?i:univ\.)|
146
- (?i:graduate|student|estudantes|storekeep|supervisor|superint|rcmp|coordinator|minority|fishermen|police|taxonomist|consultant|participante?s?|team|(é|e)quipe|memb(er|re)|crew|group|staff|personnel|family|captain|friends|assistant|worker)|
152
+ (?i:graduate|student|estudi?antes?|labo\.|storekeep|supervisor|superint|rcmp|coordinator|minority|fishermen|police|taxonomist|consultant|participante?s?|team|(é|e)quipe|memb(er|re)|crew|group|staff|personnel|family|captain|friends|assistant|worker)|
147
153
  (?i:non\s+pr(é|e)cis(é|e))|
148
154
  (?i:ontario|qu(e|é)bec|saskatchewan|new brunswick|sault|newfoundland|assurance|vancouver|u\.?s\.?s\.?r\.?)|
149
155
  (?i:recreation|culture)|
@@ -160,6 +166,7 @@ module DwcAgent
160
166
  \s*(?i:too)\s+|\s*(?i:the)\s+|
161
167
  (?i:taxiderm(ies|y))|
162
168
  (?i:though)|
169
+ (?:tropical)|
163
170
  (?i:toward|seen at)|
164
171
  (?i:unidentified|unspecified|unk?nown|unnamed|unread|unmistak|no agent)|
165
172
  (?i:urn\:)|
@@ -3,7 +3,7 @@ module DwcAgent
3
3
 
4
4
  MAJOR = 0
5
5
  MINOR = 1
6
- PATCH = 8
6
+ PATCH = 9
7
7
  BUILD = nil
8
8
 
9
9
  def self.version
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: dwc_agent
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.1.8
4
+ version: 0.1.9
5
5
  platform: ruby
6
6
  authors:
7
7
  - David P. Shorthouse
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2018-10-18 00:00:00.000000000 Z
11
+ date: 2018-10-26 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: namae