pennmarc 1.0.24 → 1.0.25
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/lib/pennmarc/enriched.rb +1 -0
- data/lib/pennmarc/helpers/access.rb +8 -6
- data/lib/pennmarc/helpers/identifier.rb +12 -0
- data/lib/pennmarc/helpers/subject.rb +10 -4
- data/lib/pennmarc/helpers/title.rb +39 -26
- data/lib/pennmarc/version.rb +1 -1
- data/spec/lib/pennmarc/helpers/access_spec.rb +11 -0
- data/spec/lib/pennmarc/helpers/identifer_spec.rb +14 -0
- data/spec/lib/pennmarc/helpers/subject_spec.rb +16 -0
- data/spec/lib/pennmarc/helpers/title_spec.rb +20 -0
- metadata +2 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 8b540ecd84333f097b50a3682732229854b188fcde76921eb0ec184622a690dd
|
4
|
+
data.tar.gz: 9203fadee45b9ad65ec20880a1acbc23356000b748d32d07428ec093590cd55a
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 6770815e8f5f828c15451fc71c04dbef6a131203e8c58d721c063b15f218d5814a71b37fd6c4f088a9c7164d5d989ff6933abc820094068921f218c937a87410
|
7
|
+
data.tar.gz: 94eee63c29ae06151816a532a5afb7db1f27490de798651c909dc07fd0f33de1b4a1ee26057b6e3a8abc5d15c54d09709df8942e6e21ad828c1296fe3191725e
|
data/lib/pennmarc/enriched.rb
CHANGED
@@ -12,6 +12,7 @@ module PennMARC
|
|
12
12
|
PHYS_INVENTORY_TAG = 'hld'
|
13
13
|
ELEC_INVENTORY_TAG = 'prt'
|
14
14
|
ITEM_TAG = 'itm'
|
15
|
+
RELATED_RECORD_TAG = 'rel'
|
15
16
|
|
16
17
|
# Subfields for HLD tags
|
17
18
|
# Follow MARC 852 spec: https://www.loc.gov/marc/holdings/hd852.html, but names are translated into Alma parlance
|
@@ -5,14 +5,13 @@ module PennMARC
|
|
5
5
|
class Access < Helper
|
6
6
|
ONLINE = 'Online'
|
7
7
|
AT_THE_LIBRARY = 'At the library'
|
8
|
+
RESOURCE_LINK_BASE_URL = 'hdl.library.upenn.edu'
|
8
9
|
|
9
10
|
class << self
|
10
11
|
# Based on enhanced metadata fields added by Alma publishing process or API, determine if the record has
|
11
12
|
# electronic access or has physical holdings, and is therefore "Online" or "At the library". If a record is "At
|
12
13
|
# the library", but has a link to a finding aid in the 856 field (matching certain criteria), also add 'Online' as
|
13
14
|
# an access method.
|
14
|
-
# @todo What if none of these criteria match? Should we include "At the library" by default? Records with no value
|
15
|
-
# in this field would be lost if the user selects a facet value.
|
16
15
|
# @param [MARC::Record] record
|
17
16
|
# @return [Array]
|
18
17
|
def facet(record)
|
@@ -24,7 +23,7 @@ module PennMARC
|
|
24
23
|
return values if values.size == 2 # return early if all values are already present
|
25
24
|
|
26
25
|
# only check if ONLINE isn't already there
|
27
|
-
values << ONLINE if values.exclude?(ONLINE) &&
|
26
|
+
values << ONLINE if values.exclude?(ONLINE) && resource_link?(record)
|
28
27
|
values.uniq
|
29
28
|
end
|
30
29
|
|
@@ -44,20 +43,23 @@ module PennMARC
|
|
44
43
|
field.tag.in? [Enriched::Pub::PHYS_INVENTORY_TAG, Enriched::Api::PHYS_INVENTORY_TAG]
|
45
44
|
end
|
46
45
|
|
47
|
-
# Check if a record contains an 856 entry
|
46
|
+
# Check if a record contains an 856 entry with a Penn Handle server link meeting these criteria:
|
48
47
|
# 1. Indicator 1 is 4 (HTTP resource)
|
49
48
|
# 2. Indicator 2 is NOT 2 (indicating the linkage is to a "related" thing)
|
50
49
|
# 3. The URL specified in subfield u (URI) is a Penn Handle link
|
50
|
+
# 4. The subfield z does NOT include the string 'Finding aid'
|
51
51
|
# See: https://www.loc.gov/marc/bibliographic/bd856.html
|
52
|
+
# @note Some electronic records do not have Portfolios in Alma, so we rely upon the Resource Link in the 856 to
|
53
|
+
# get these records included in the Online category.
|
52
54
|
# @param [MARC::Record] record
|
53
55
|
# @return [Boolean]
|
54
|
-
def
|
56
|
+
def resource_link?(record)
|
55
57
|
record.fields('856').filter_map do |field|
|
56
58
|
next if field.indicator2 == '2' || field.indicator1 != '4'
|
57
59
|
|
58
60
|
subz = subfield_values(field, 'z')
|
59
61
|
subfield_values(field, 'u').filter_map do |value|
|
60
|
-
return true if subz.
|
62
|
+
return true if subz.exclude?('Finding aid') && value.include?(RESOURCE_LINK_BASE_URL)
|
61
63
|
end
|
62
64
|
end
|
63
65
|
false
|
@@ -159,6 +159,18 @@ module PennMARC
|
|
159
159
|
}.uniq
|
160
160
|
end
|
161
161
|
|
162
|
+
# Gets any Host record MMS ID values from an Enriched::Pub::RELATED_RECORD_TAG field added during Alma enrichment.
|
163
|
+
# This aids in our handling of "bound with" records.
|
164
|
+
# @param [MARC::Record] record
|
165
|
+
# @return [Array<String>]
|
166
|
+
def host_record_id(record)
|
167
|
+
record.fields(Enriched::Pub::RELATED_RECORD_TAG).filter_map { |field|
|
168
|
+
next unless subfield_value?(field, 'c', /contains/i)
|
169
|
+
|
170
|
+
subfield_values field, :w
|
171
|
+
}.flatten.uniq
|
172
|
+
end
|
173
|
+
|
162
174
|
private
|
163
175
|
|
164
176
|
# Determine if subfield 'a' is an OCLC id.
|
@@ -18,7 +18,7 @@ module PennMARC
|
|
18
18
|
# - 2: MeSH
|
19
19
|
# - 4: Source not specified (local?)
|
20
20
|
# - 7: Source specified in ǂ2
|
21
|
-
|
21
|
+
VALID_SOURCE_INDICATORS = %w[0 1 2 4 7].freeze
|
22
22
|
|
23
23
|
# Tags that serve as sources for Subject facet values
|
24
24
|
DISPLAY_TAGS = %w[600 610 611 630 650 651].freeze
|
@@ -27,7 +27,7 @@ module PennMARC
|
|
27
27
|
LOCAL_TAGS = %w[690 691 697].freeze
|
28
28
|
|
29
29
|
# All Subjects for searching. This includes most subfield content from any field contained in {SEARCH_TAGS} or
|
30
|
-
# 69X, including any linked 880 fields. Fields must have an indicator2 value in {
|
30
|
+
# 69X, including any linked 880 fields. Fields must have an indicator2 value in {VALID_SOURCE_INDICATORS}.
|
31
31
|
# @todo this includes subfields that may not be desired like 1 (uri) and 2 (source code) but this might be OK for
|
32
32
|
# a search (non-display) field?
|
33
33
|
# @param [Hash] relator_map
|
@@ -179,12 +179,18 @@ module PennMARC
|
|
179
179
|
end
|
180
180
|
end
|
181
181
|
|
182
|
-
# Is a field intended for display in a general subject field
|
182
|
+
# Is a field intended for display in a general subject field? To be included, the field tag is in either
|
183
|
+
# {DISPLAY_TAGS} or {LOCAL_TAGS}, and has an indicator 2 value that is in {VALID_SOURCE_INDICATORS}. If
|
184
|
+
# indicator 2 is '7' - indicating "source specified", the specified source must be in our approved source code
|
185
|
+
# list.
|
186
|
+
# @see Util.valid_subject_genre_source_code?
|
183
187
|
# @param [MARC::DataField] field
|
184
188
|
# @return [Boolean] whether a MARC field is intended for display under general "Subjects"
|
185
189
|
def subject_general_display_field?(field)
|
186
190
|
return false unless field.tag.in?(DISPLAY_TAGS + LOCAL_TAGS) && field.respond_to?(:indicator2)
|
187
191
|
|
192
|
+
return false if field.indicator2.present? && !field.indicator2.in?(VALID_SOURCE_INDICATORS)
|
193
|
+
|
188
194
|
return false if field.indicator2 == '7' && !valid_subject_genre_source_code?(field)
|
189
195
|
|
190
196
|
true
|
@@ -278,7 +284,7 @@ module PennMARC
|
|
278
284
|
# @param [MARC::DataField] field
|
279
285
|
# @return [Boolean]
|
280
286
|
def subject_search_field?(field)
|
281
|
-
return false unless field.respond_to?(:indicator2) &&
|
287
|
+
return false unless field.respond_to?(:indicator2) && VALID_SOURCE_INDICATORS.include?(field.indicator2)
|
282
288
|
|
283
289
|
tag = if field.tag == '880'
|
284
290
|
subfield_values(field, '6').first
|
@@ -3,33 +3,36 @@
|
|
3
3
|
module PennMARC
|
4
4
|
# This helper contains logic for parsing out Title and Title-related fields.
|
5
5
|
class Title < Helper
|
6
|
-
|
7
|
-
|
8
|
-
|
9
|
-
|
10
|
-
|
11
|
-
|
12
|
-
|
13
|
-
|
14
|
-
|
15
|
-
|
16
|
-
|
17
|
-
|
18
|
-
|
19
|
-
|
20
|
-
|
21
|
-
|
22
|
-
|
23
|
-
|
24
|
-
|
25
|
-
|
26
|
-
|
27
|
-
|
28
|
-
|
29
|
-
|
30
|
-
|
31
|
-
|
6
|
+
# We use these fields when retrieving auxiliary titles in the *search_aux methods:
|
7
|
+
# {https://www.loc.gov/marc/bibliographic/bd130.html 130},
|
8
|
+
# {https://www.loc.gov/marc/bibliographic/bd210.html 210},
|
9
|
+
# {https://www.loc.gov/marc/bibliographic/bd245.html 245},
|
10
|
+
# {https://www.loc.gov/marc/bibliographic/bd246.html 246},
|
11
|
+
# {https://www.loc.gov/marc/bibliographic/bd247.html 247},
|
12
|
+
# {https://www.loc.gov/marc/bibliographic/bd440.html 440},
|
13
|
+
# {https://www.loc.gov/marc/bibliographic/bd490.html 490},
|
14
|
+
# {https://www.loc.gov/marc/bibliographic/bd730.html 730},
|
15
|
+
# {https://www.loc.gov/marc/bibliographic/bd740.html 740},
|
16
|
+
# {https://www.loc.gov/marc/bibliographic/bd830.html 830},
|
17
|
+
# {https://www.loc.gov/marc/bibliographic/bd773.html 773},
|
18
|
+
# {https://www.loc.gov/marc/bibliographic/bd774.html 774},
|
19
|
+
# {https://www.loc.gov/marc/bibliographic/bd780.html 780},
|
20
|
+
# {https://www.loc.gov/marc/bibliographic/bd785.html 785},
|
21
|
+
# {https://www.loc.gov/marc/bibliographic/bd700.html 700},
|
22
|
+
# {https://www.loc.gov/marc/bibliographic/bd710.html 710},
|
23
|
+
# {https://www.loc.gov/marc/bibliographic/bd711.html 711},
|
24
|
+
# {https://www.loc.gov/marc/bibliographic/bd505.html 505}
|
25
|
+
AUX_TITLE_TAGS = {
|
26
|
+
main: %w[130 210 240 245 246 247 440 490 730 740 830],
|
27
|
+
related: %w[773 774 780 785],
|
28
|
+
entity: %w[700 710 711],
|
29
|
+
note: %w[505]
|
30
|
+
}.freeze
|
31
|
+
|
32
|
+
# This text is used in Alma to indicate a Bib record is a "Host" record for other bibs (bound-withs)
|
33
|
+
HOST_BIB_TITLE = 'Host bibliographic record for boundwith'
|
32
34
|
|
35
|
+
class << self
|
33
36
|
# Main Title Search field. Takes from {https://www.loc.gov/marc/bibliographic/bd245.html 245} and linked 880.
|
34
37
|
# @note Ported from get_title_1_search_values.
|
35
38
|
# @param [MARC::Record] record
|
@@ -217,6 +220,16 @@ module PennMARC
|
|
217
220
|
}.uniq
|
218
221
|
end
|
219
222
|
|
223
|
+
# Determine if the record is a "Host" bibliographic record for other bib records ("bound-withs")
|
224
|
+
# @param [MARC::Record] record
|
225
|
+
# @return [Boolean]
|
226
|
+
def host_bib_record?(record)
|
227
|
+
record.fields('245').any? do |f|
|
228
|
+
title = join_subfields(f, &subfield_in?(%w[a]))
|
229
|
+
title.include?(HOST_BIB_TITLE)
|
230
|
+
end
|
231
|
+
end
|
232
|
+
|
220
233
|
private
|
221
234
|
|
222
235
|
# Create prefix/filing hash for representing a title value with filing characters removed, with special
|
data/lib/pennmarc/version.rb
CHANGED
@@ -69,6 +69,17 @@ describe 'PennMARC::Access' do
|
|
69
69
|
{ z: 'Finding aid', u: 'http://hdl.library.upenn.edu/1017/d/pacscl/UPENN_RBML_MsColl200' }
|
70
70
|
end
|
71
71
|
|
72
|
+
it 'does not include online access' do
|
73
|
+
expect(helper.facet(record)).to contain_exactly(PennMARC::Access::AT_THE_LIBRARY)
|
74
|
+
end
|
75
|
+
end
|
76
|
+
|
77
|
+
context 'with an 856 describing a resource link' do
|
78
|
+
let(:indicators) { { indicator1: '4', indicator2: '1' } }
|
79
|
+
let(:location_and_access_subfields) do
|
80
|
+
{ z: 'Connect to resource', u: 'http://hdl.library.upenn.edu/1234' }
|
81
|
+
end
|
82
|
+
|
72
83
|
it 'includes online access' do
|
73
84
|
expect(helper.facet(record)).to contain_exactly(PennMARC::Access::ONLINE, PennMARC::Access::AT_THE_LIBRARY)
|
74
85
|
end
|
@@ -161,4 +161,18 @@ describe 'PennMARC::Identifier' do
|
|
161
161
|
'10.1038/sdata.2016.18', '10.18574/9781479842865')
|
162
162
|
end
|
163
163
|
end
|
164
|
+
|
165
|
+
describe '.host_record_id' do
|
166
|
+
let(:record) do
|
167
|
+
marc_record fields: [
|
168
|
+
marc_field(tag: PennMARC::Enriched::Pub::RELATED_RECORD_TAG, subfields: { w: '123456789', c: 'Contains',
|
169
|
+
a: 'Title' }),
|
170
|
+
marc_field(tag: PennMARC::Enriched::Pub::RELATED_RECORD_TAG, subfields: { w: '666666666', c: 'Contained In' })
|
171
|
+
]
|
172
|
+
end
|
173
|
+
|
174
|
+
it 'returns only the desired host record MMS ID values' do
|
175
|
+
expect(helper.host_record_id(record)).to contain_exactly '123456789'
|
176
|
+
end
|
177
|
+
end
|
164
178
|
end
|
@@ -288,6 +288,22 @@ describe 'PennMARC::Subject' do
|
|
288
288
|
'Early works to 1950.')
|
289
289
|
end
|
290
290
|
end
|
291
|
+
|
292
|
+
context 'with a mix of allowed and disallowed heading sources' do
|
293
|
+
let(:fields) do
|
294
|
+
[marc_field(tag: '650', indicator2: '7', subfields: {
|
295
|
+
'2': 'fast',
|
296
|
+
a: 'Philosophy in motion pictures.',
|
297
|
+
'0': 'http://id.loc.gov/authorities/subjects/sh92003501'
|
298
|
+
}),
|
299
|
+
marc_field(tag: '650', indicator2: '7', subfields: { '2': 'gnd', a: 'Filmästhetik.' }),
|
300
|
+
marc_field(tag: '650', indicator2: '6', subfields: { a: 'Cinéma et arts.' })]
|
301
|
+
end
|
302
|
+
|
303
|
+
it 'includes only permitted headings from approved ontologies' do
|
304
|
+
expect(values).to contain_exactly 'Philosophy in motion pictures.'
|
305
|
+
end
|
306
|
+
end
|
291
307
|
end
|
292
308
|
|
293
309
|
describe '.childrens_show' do
|
@@ -249,4 +249,24 @@ describe 'PennMARC::Title' do
|
|
249
249
|
expect(values).not_to include 'Linkage', '247'
|
250
250
|
end
|
251
251
|
end
|
252
|
+
|
253
|
+
describe '.host_bib_record?' do
|
254
|
+
let(:record) { marc_record fields: [marc_field(tag: '245', subfields: subfields)] }
|
255
|
+
|
256
|
+
context 'with a host record' do
|
257
|
+
let(:subfields) { { a: "#{PennMARC::Title::HOST_BIB_TITLE} for 123456789" } }
|
258
|
+
|
259
|
+
it 'returns true' do
|
260
|
+
expect(helper.host_bib_record?(record)).to be true
|
261
|
+
end
|
262
|
+
end
|
263
|
+
|
264
|
+
context 'with a non-host record' do
|
265
|
+
let(:subfields) { { a: 'Regular record' } }
|
266
|
+
|
267
|
+
it 'returns false' do
|
268
|
+
expect(helper.host_bib_record?(record)).to be false
|
269
|
+
end
|
270
|
+
end
|
271
|
+
end
|
252
272
|
end
|
metadata
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: pennmarc
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 1.0.
|
4
|
+
version: 1.0.25
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Mike Kanning
|
@@ -10,7 +10,7 @@ authors:
|
|
10
10
|
autorequire:
|
11
11
|
bindir: bin
|
12
12
|
cert_chain: []
|
13
|
-
date: 2024-06-
|
13
|
+
date: 2024-06-26 00:00:00.000000000 Z
|
14
14
|
dependencies:
|
15
15
|
- !ruby/object:Gem::Dependency
|
16
16
|
name: activesupport
|