dwc_agent 0.1.8 → 0.1.9

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA1:
3
- metadata.gz: 20ca1d9afefdaaed29ca0133174b2781d412dd7a
4
- data.tar.gz: 5462f4e78954f3b71f3a52620eab958ee10abcff
3
+ metadata.gz: 5e5662fb6ce9768a7e4842123e7d6bd1f3609383
4
+ data.tar.gz: bf361f626333393dc5f68a960d6b9f2ceb3b634d
5
5
  SHA512:
6
- metadata.gz: 432d7daa90ca150304b2a20619c457dacb3d1f8964548402e02fad2a0ed77816a96dbf48b519712a9bd6b0cdf8cb7c888f886adc5cae9e6ccd1a40169c3acbb0
7
- data.tar.gz: 411aba8a997ed6b82a42960e1c943ce2b23f0abc4d3565c6a91c3da084ff41537c38bcae74f03c1debc955f66db93c8a818c107d03e159009c39b0557fe78f24
6
+ metadata.gz: 57cb357cf32164f6c0a50b604e1995626404565888a958842bcc50d32d5a6a9fd24f59d36768e1d5eb18eb8a03b1f9c301df66a174bc1fc93a10e5ae9715bc99
7
+ data.tar.gz: 2719e50b188b8babf83afccf4f3dfabddc5f7ba3a17716df4a2b2b7e9cf33d72d6e9da1dacfe3e8c818b49e5a3261a53a52875b25c24d6087c7da8e9f9f07cff
@@ -53,6 +53,7 @@ module DwcAgent
53
53
  (?i:crossed\s+out)|
54
54
  \(?(?i:source)\(?|
55
55
  (?i:according\s+to)|
56
+ (?i:museum\s+victoria)|
56
57
  (?i:revised|photograph|fruits\s+only)|
57
58
  -?\s*(?i:sight\s+(id|identifi?cation))\.?\s*\b|
58
59
  -?\s*(?i:synonym(y|ie))|
@@ -60,6 +61,7 @@ module DwcAgent
60
61
  \b(?i:to\s+(sub)?spp?)\.?|
61
62
  (?i:nom\.?\s+rev\.?)|
62
63
  FNA|DAO|HUH|FDNMB|\(MT\)|(?i:\(KEW\))|
64
+ (?i:university|museum|exhibits?)|
63
65
  (?i:uqam)|
64
66
  \b[,;]\s+\d+\z|
65
67
  [":!]|
@@ -68,18 +70,19 @@ module DwcAgent
68
70
  [,;]\z|
69
71
  ^\w{0,2}\z|
70
72
  ^[A-Z]{2,}\z|
73
+ (?i:annot\.?)\b|
71
74
  \s+(?i:stet)\s*!?\s*\z|
72
75
  \s+(?i:prep)\.?\s*\z|
73
- \b\s*\([A-Z]{2,}\)
76
+ \b\s*\([A-Z]{2,}\)|
77
+ \b[lL]eg[\.:]\s*\b
74
78
  }x
75
79
 
76
80
  SPLIT_BY = %r{
77
81
  [–|&+/;]|
78
82
  \s+-\s+|
79
83
  \s+a\.\s+|
80
- \b(?i:and|et|with|per)\s+|
81
- \s+y\s*\b|
82
- \be\s*\b|
84
+ \b(e|y|en|et|or|per|for)\s*\b|
85
+ \b(?i:and|with)\s*\b|
83
86
  \b(?i:annotated(\s+by)?)\s*\b|
84
87
  \b(?i:coll\.)\s*\b|
85
88
  \b(?i:communicate?d(\s+to)?)\s*\b|
@@ -90,7 +93,6 @@ module DwcAgent
90
93
  \b(?i:ex\.?(\s+by)?|examined(\s+by)?)\s*\b|
91
94
  \b(?i:in?dentified(\s+by)?)\s*\b|
92
95
  \b(?i:in\s+part(\s+by)?)\s*\b|
93
- \b(?i:or)\s+|
94
96
  \b(?i:prep\.?\s+(?i:by)?)\s*\b|
95
97
  \b(?i:redet\.?(\s+by?)?)\s*\b|
96
98
  \b(?i:reidentified(\s+by)?)\s*\b|
@@ -113,7 +115,11 @@ module DwcAgent
113
115
  '#' => '',
114
116
  '/' => ' / ',
115
117
  '&' => ' & ',
116
- '*' => ''
118
+ '*' => '',
119
+ '>' => '',
120
+ '<' => '',
121
+ '{' => '',
122
+ '}' => ''
117
123
  }
118
124
 
119
125
  COMPLEX_SEPARATORS = %r{
@@ -143,7 +149,7 @@ module DwcAgent
143
149
  (?i:ent(o|y)mology)|
144
150
  (?i:mus(eum|ée)|universit(y|é|e|at)|college|institute?|acad(e|é)m|school|écol(e|iers?)|laboratoi?r|projec?t|polytech|dep(t|art?ment)|research|clinic|hospital|cientifica|sanctuary|safari)|
145
151
  (?i:univ\.)|
146
- (?i:graduate|student|estudantes|storekeep|supervisor|superint|rcmp|coordinator|minority|fishermen|police|taxonomist|consultant|participante?s?|team|(é|e)quipe|memb(er|re)|crew|group|staff|personnel|family|captain|friends|assistant|worker)|
152
+ (?i:graduate|student|estudi?antes?|labo\.|storekeep|supervisor|superint|rcmp|coordinator|minority|fishermen|police|taxonomist|consultant|participante?s?|team|(é|e)quipe|memb(er|re)|crew|group|staff|personnel|family|captain|friends|assistant|worker)|
147
153
  (?i:non\s+pr(é|e)cis(é|e))|
148
154
  (?i:ontario|qu(e|é)bec|saskatchewan|new brunswick|sault|newfoundland|assurance|vancouver|u\.?s\.?s\.?r\.?)|
149
155
  (?i:recreation|culture)|
@@ -160,6 +166,7 @@ module DwcAgent
160
166
  \s*(?i:too)\s+|\s*(?i:the)\s+|
161
167
  (?i:taxiderm(ies|y))|
162
168
  (?i:though)|
169
+ (?:tropical)|
163
170
  (?i:toward|seen at)|
164
171
  (?i:unidentified|unspecified|unk?nown|unnamed|unread|unmistak|no agent)|
165
172
  (?i:urn\:)|
@@ -3,7 +3,7 @@ module DwcAgent
3
3
 
4
4
  MAJOR = 0
5
5
  MINOR = 1
6
- PATCH = 8
6
+ PATCH = 9
7
7
  BUILD = nil
8
8
 
9
9
  def self.version
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: dwc_agent
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.1.8
4
+ version: 0.1.9
5
5
  platform: ruby
6
6
  authors:
7
7
  - David P. Shorthouse
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2018-10-18 00:00:00.000000000 Z
11
+ date: 2018-10-26 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: namae