@natlibfi/marc-record-validators-melinda 12.0.0-alpha.7 → 12.0.0-alpha.9
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/ending-punctuation-conf.js +3 -2
- package/dist/ending-punctuation-conf.js.map +2 -2
- package/dist/ending-punctuation.js +48 -9
- package/dist/ending-punctuation.js.map +3 -3
- package/dist/ending-punctuation.test.js +31 -9
- package/dist/ending-punctuation.test.js.map +2 -2
- package/dist/indicator-fixes.js +10 -0
- package/dist/indicator-fixes.js.map +2 -2
- package/dist/isbn-issn.js +7 -4
- package/dist/isbn-issn.js.map +2 -2
- package/dist/merge-fields/dataProvenance.js +1 -1
- package/dist/merge-fields/dataProvenance.js.map +2 -2
- package/dist/punctuation2.js +11 -5
- package/dist/punctuation2.js.map +2 -2
- package/dist/translate-terms.test.js +12 -2
- package/dist/translate-terms.test.js.map +2 -2
- package/dist/utils.js.map +2 -2
- package/package.json +8 -7
- package/src/ending-punctuation-conf.js +3 -3
- package/src/ending-punctuation.js +62 -11
- package/src/ending-punctuation.test.js +33 -9
- package/src/indicator-fixes.js +13 -0
- package/src/isbn-issn.js +10 -5
- package/src/merge-fields/dataProvenance.js +1 -1
- package/src/punctuation2.js +14 -5
- package/src/translate-terms.test.js +25 -2
- package/src/utils.js +6 -0
- package/test-fixtures/indicator-fixes/10/expectedResult.json +11 -0
- package/test-fixtures/indicator-fixes/10/metadata.json +4 -0
- package/test-fixtures/indicator-fixes/10/record.json +11 -0
- package/test-fixtures/translate-terms-data.js +42 -0
package/dist/utils.js.map
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
{
|
|
2
2
|
"version": 3,
|
|
3
3
|
"sources": ["../src/utils.js"],
|
|
4
|
-
"sourcesContent": ["import createDebugLogger from 'debug';\n\n//import fs from 'fs';\n//import path from 'path';\n\nconst debug = createDebugLogger('@natlibfi/melinda-marc-record-merge-reducers:utils');\n//const debugData = debug.extend('data');\nconst debugDev = debug.extend('dev');\n\nimport {melindaFieldSpecs} from './melindaCustomMergeFields.js';\n\n//JSON.parse(fs.readFileSync(path.join(__dirname, '..', 'src', 'melindaCustomMergeFields.json'), 'utf8'));\n\nexport function isElectronicMaterial(record) {\n const f337s = record.get('337');\n\n return f337s.length > 0 && f337s.some(f => fieldHasSubfield(f, 'b', 'c') && fieldHasSubfield(f, '2', 'rdamedia'));\n}\n\nexport function nvdebug(message, func = undefined) {\n if (func) {\n func(message);\n }\n //console.info(message); // eslint-disable-line no-console\n}\n\nexport function fieldHasSubfield(field, subfieldCode, subfieldValue = null) {\n if (!field.subfields) {\n return false;\n }\n if (subfieldValue === null) {\n return field.subfields.some(sf => sf.code === subfieldCode);\n }\n return field.subfields.some(sf => sf.code === subfieldCode && subfieldValue === sf.value);\n}\n\nexport function subfieldToString(sf) {\n if (!sf.value) {\n return `\u2021${sf.code}`;\n }\n return `\u2021${sf.code} ${sf.value}`;\n}\n\nfunction normalizeIndicatorValue(val) {\n if (val === ' ') {\n return '#';\n }\n return val;\n}\n\nexport function recordToString(record) {\n const ldr = `LDR ${record.leader}`;\n const fields = record.fields.map(f => fieldToString(f));\n return `${ldr}\\n${fields.join('\\n')}`;\n}\n\nexport function removeSubfield(record, tag, subfieldCode) {\n record.fields = record.fields.map(field => {\n if (field.tag !== tag || !field.subfields) { // Don't procss irrelevant fields\n return field;\n }\n field.subfields = field.subfields.filter(sf => sf.code !== subfieldCode);\n if (field.subfields.length === 0) {\n return false;\n }\n return field;\n }).filter(field => field);\n}\n\nexport function 
recordRemoveValuelessSubfields(record) {\n record.fields = record.fields.map(field => {\n if (!field.subfields) { // Keep control fields\n return field;\n }\n // Remove empty subfields from datafields:\n field.subfields = field.subfields.filter(sf => sf.value);\n\n if (field.subfields && field.subfields.length === 0) {\n return false; // Return false instead of a field if field has no subfields left. These will soon be filtered out.\n }\n\n return field; //if field has subfields return it\n }).filter(field => field); // Filter those falses out\n}\n\nexport function fieldToString(f) {\n if ('subfields' in f) {\n return `${f.tag} ${normalizeIndicatorValue(f.ind1)}${normalizeIndicatorValue(f.ind2)}${formatSubfields(f)}`;\n }\n return `${f.tag} ${f.value}`;\n\n function formatSubfields(field) {\n return field.subfields.map(sf => ` ${subfieldToString(sf)}`).join('');\n }\n}\n\nexport function fieldsToString(fields) {\n return fields.map(f => fieldToString(f)).join('\\t__SEPARATOR__\\t');\n}\n\nexport function nvdebugFieldArray(fields, prefix = ' ', func = undefined) {\n fields.forEach(field => nvdebug(`${prefix}${fieldToString(field)}`, func));\n}\n\nexport function isControlSubfieldCode(subfieldCode) {\n if (['0', '1', '2', '3', '4', '5', '6', '7', '8', '9', 'w'].includes(subfieldCode)) {\n return true;\n }\n return false;\n}\n\nexport function getCatalogingLanguage(record, defaultCatalogingLanguage = undefined) {\n const [field040] = record.get(/^040$/u);\n if (!field040) {\n return defaultCatalogingLanguage;\n }\n const [b] = field040.subfields.filter(sf => sf.code === 'b');\n if (!b) {\n return defaultCatalogingLanguage;\n }\n return b.value;\n}\n\n\nexport function uniqArray(arr) {\n return arr.filter((val, i) => arr.indexOf(val) === i);\n}\n\nexport function fieldsAreIdentical(field1, field2) {\n if (field1.tag !== field2.tag) { // NB! We are skipping normalizations here on purpose! 
They should be done beforehand...\n return false;\n }\n return fieldToString(field1) === fieldToString(field2);\n\n // The order of subfields is relevant! Bloody JS idiotisms make people use conditions such as:\n // return field1.subfields.every(sf => field2.subfields.some(sf2 => sf.code === sf2.code && sf.value === sf2.value));\n}\n\nexport function fieldHasNSubfields(field, subfieldCode/*, subfieldValue = null*/) {\n const relevantSubfields = field.subfields.filter(sf => sf.code === subfieldCode);\n //if (subfieldValue === null) {\n return relevantSubfields.length;\n //}\n //const subset = relevantSubfields.filter(value => value === subfieldValue);\n //return subset.length;\n}\n\nexport function removeCopyright(value) {\n return value.replace(/^(?:c|p|\u00A9|\u2117|Cop\\. ?) ?((?:1[0-9][0-9][0-9]|20[012][0-9])\\.?)$/ui, '$1');\n}\n\nfunction isNonStandardNonrepeatableSubfield(tag, subfieldCode) {\n // Put these into config or so...\n if (tag === '264') {\n return ['a', 'b', 'c'].includes(subfieldCode);\n }\n\n if (['336', '337', '338'].includes(tag)) {\n return ['a', 'b', '2'].includes(subfieldCode);\n }\n\n return false;\n}\n\n\nexport function subfieldIsRepeatable(tag, subfieldCode) {\n\n if (isNonStandardNonrepeatableSubfield(tag, subfieldCode)) {\n return false;\n }\n\n // These we know or \"know\":\n // NB! $5 is (according to MARC21 format) non-repeatable, and not usable in all fields, but Melinda has a local exception to this, see MET-300\n if ('0159'.indexOf(subfieldCode) > -1) {\n // Uh, can $0 appear on any field?\n return true;\n }\n\n const fieldSpecs = melindaFieldSpecs.fields.filter(field => field.tag === tag);\n if (fieldSpecs.length !== 1) {\n nvdebug(` WARNING! Getting field ${tag} data failed! ${fieldSpecs.length} hits. 
Default value true is used for'${subfieldCode}' .`, debugDev);\n return true;\n }\n\n const subfieldSpecs = fieldSpecs[0].subfields.filter(subfield => subfield.code === subfieldCode);\n // Currently we don't support multiple $6 fields due to re-indexing limitations...\n // Well, $6 is non-repeatable, isn't it?!?\n // (This might actually already be fixed... Marginal issue, but check eventually.)\n if (subfieldSpecs.length !== 1 || subfieldCode === '6') {\n return false; // repeatable if not specified, I guess. Maybe add log or warn?\n }\n return subfieldSpecs[0].repeatable;\n}\n\nfunction marc21GetTagsLegalIndicators(tag) {\n const fieldSpecs = melindaFieldSpecs.fields.filter(field => field.tag === tag);\n if (fieldSpecs.length === 0) {\n return undefined;\n }\n return fieldSpecs[0].indicators;\n}\n\nexport function marc21GetTagsLegalInd1Value(tag) {\n const indicator = marc21GetTagsLegalIndicators(tag);\n if (indicator === undefined) {\n return undefined;\n }\n return indicator.ind1;\n}\n\nexport function marc21GetTagsLegalInd2Value(tag) {\n const indicator = marc21GetTagsLegalIndicators(tag);\n if (indicator === undefined) {\n return undefined;\n }\n return indicator.ind2;\n}\n\nexport function nvdebugSubfieldArray(subfields, prefix = ' ', func = undefined) {\n subfields.forEach(subfield => nvdebug(`${prefix}${subfieldToString(subfield)}`, func));\n}\n\nexport function subfieldsAreIdentical(subfieldA, subfieldB) {\n return subfieldA.code === subfieldB.code && subfieldA.value === subfieldB.value;\n}\n\nexport function fieldHasMultipleSubfields(field, subfieldCode/*, subfieldValue = null*/) {\n return fieldHasNSubfields(field, subfieldCode) > 1;\n}\n\nexport function hasCopyright(value) {\n const modValue = removeCopyright(value);\n return value !== modValue;\n}\n\n\n\nexport function subfieldArraysContainSameData(arr1, arr2) {\n if ( !arr1.every(sf => arr2.some(sf2 => subfieldsAreIdentical(sf, sf2))) ) {\n return false;\n }\n\n return arr2.every(sf2 => 
arr1.some(sf => subfieldsAreIdentical(sf, sf2)));\n}"],
|
|
5
|
-
"mappings": "AAAA,OAAO,uBAAuB;AAK9B,MAAM,QAAQ,kBAAkB,oDAAoD;AAEpF,MAAM,WAAW,MAAM,OAAO,KAAK;AAEnC,SAAQ,yBAAwB;AAIzB,gBAAS,qBAAqB,QAAQ;AAC3C,QAAM,QAAQ,OAAO,IAAI,KAAK;AAE9B,SAAO,MAAM,SAAS,KAAK,MAAM,KAAK,OAAK,iBAAiB,GAAG,KAAK,GAAG,KAAK,iBAAiB,GAAG,KAAK,UAAU,CAAC;AAClH;AAEO,gBAAS,QAAQ,SAAS,OAAO,QAAW;AACjD,MAAI,MAAM;AACR,SAAK,OAAO;AAAA,EACd;AAEF;AAEO,gBAAS,iBAAiB,OAAO,cAAc,gBAAgB,MAAM;AAC1E,MAAI,CAAC,MAAM,WAAW;AACpB,WAAO;AAAA,EACT;AACA,MAAI,kBAAkB,MAAM;AAC1B,WAAO,MAAM,UAAU,KAAK,QAAM,GAAG,SAAS,YAAY;AAAA,EAC5D;AACA,SAAO,MAAM,UAAU,KAAK,QAAM,GAAG,SAAS,gBAAgB,kBAAkB,GAAG,KAAK;AAC1F;AAEO,gBAAS,iBAAiB,IAAI;AACnC,MAAI,CAAC,GAAG,OAAO;AACb,WAAO,SAAI,GAAG,IAAI;AAAA,EACpB;AACA,SAAO,SAAI,GAAG,IAAI,IAAI,GAAG,KAAK;AAChC;AAEA,SAAS,wBAAwB,KAAK;AACpC,MAAI,QAAQ,KAAK;AACf,WAAO;AAAA,EACT;AACA,SAAO;AACT;AAEO,gBAAS,eAAe,QAAQ;AACrC,QAAM,MAAM,SAAS,OAAO,MAAM;AAClC,QAAM,SAAS,OAAO,OAAO,IAAI,OAAK,cAAc,CAAC,CAAC;AACtD,SAAO,GAAG,GAAG;AAAA,EAAK,OAAO,KAAK,IAAI,CAAC;AACrC;AAEO,gBAAS,eAAe,QAAQ,KAAK,cAAc;AACxD,SAAO,SAAS,OAAO,OAAO,IAAI,WAAS;AACzC,QAAI,MAAM,QAAQ,OAAO,CAAC,MAAM,WAAW;AACzC,aAAO;AAAA,IACT;AACA,UAAM,YAAY,MAAM,UAAU,OAAO,QAAM,GAAG,SAAS,YAAY;AACvE,QAAI,MAAM,UAAU,WAAW,GAAG;AAChC,aAAO;AAAA,IACT;AACA,WAAO;AAAA,EACT,CAAC,EAAE,OAAO,WAAS,KAAK;AAC1B;AAEO,gBAAS,+BAA+B,QAAQ;AACrD,SAAO,SAAS,OAAO,OAAO,IAAI,WAAS;AACzC,QAAI,CAAC,MAAM,WAAW;AACpB,aAAO;AAAA,IACT;AAEA,UAAM,YAAY,MAAM,UAAU,OAAO,QAAM,GAAG,KAAK;AAEvD,QAAI,MAAM,aAAa,MAAM,UAAU,WAAW,GAAG;AACnD,aAAO;AAAA,IACT;AAEA,WAAO;AAAA,EACT,CAAC,EAAE,OAAO,WAAS,KAAK;AAC1B;AAEO,gBAAS,cAAc,GAAG;AAC/B,MAAI,eAAe,GAAG;AACpB,WAAO,GAAG,EAAE,GAAG,IAAI,wBAAwB,EAAE,IAAI,CAAC,GAAG,wBAAwB,EAAE,IAAI,CAAC,GAAG,gBAAgB,CAAC,CAAC;AAAA,EAC3G;AACA,SAAO,GAAG,EAAE,GAAG,OAAO,EAAE,KAAK;AAE7B,WAAS,gBAAgB,OAAO;AAC9B,WAAO,MAAM,UAAU,IAAI,QAAM,IAAI,iBAAiB,EAAE,CAAC,EAAE,EAAE,KAAK,EAAE;AAAA,EACtE;AACF;AAEO,gBAAS,eAAe,QAAQ;AACrC,SAAO,OAAO,IAAI,OAAK,cAAc,CAAC,CAAC,EAAE,KAAK,iBAAmB;AACnE;AAEO,gBAAS,kBAAkB,QAAQ,SAAS,MAAM,OAAO,QAAW;AACzE,SAAO,QAAQ,WAAS,QAAQ,GAAG,MAAM,GAAG,cAAc,KAAK,CAAC,IAAI,IAAI,CAAC;A
AC3E;AAEO,gBAAS,sBAAsB,cAAc;
|
|
4
|
+
"sourcesContent": ["import createDebugLogger from 'debug';\n\n//import fs from 'fs';\n//import path from 'path';\n\nconst debug = createDebugLogger('@natlibfi/melinda-marc-record-merge-reducers:utils');\n//const debugData = debug.extend('data');\nconst debugDev = debug.extend('dev');\n\nimport {melindaFieldSpecs} from './melindaCustomMergeFields.js';\n\n//JSON.parse(fs.readFileSync(path.join(__dirname, '..', 'src', 'melindaCustomMergeFields.json'), 'utf8'));\n\nexport function isElectronicMaterial(record) {\n const f337s = record.get('337');\n\n return f337s.length > 0 && f337s.some(f => fieldHasSubfield(f, 'b', 'c') && fieldHasSubfield(f, '2', 'rdamedia'));\n}\n\nexport function nvdebug(message, func = undefined) {\n if (func) {\n func(message);\n }\n //console.info(message); // eslint-disable-line no-console\n}\n\nexport function fieldHasSubfield(field, subfieldCode, subfieldValue = null) {\n if (!field.subfields) {\n return false;\n }\n if (subfieldValue === null) {\n return field.subfields.some(sf => sf.code === subfieldCode);\n }\n return field.subfields.some(sf => sf.code === subfieldCode && subfieldValue === sf.value);\n}\n\nexport function subfieldToString(sf) {\n if (!sf.value) {\n return `\u2021${sf.code}`;\n }\n return `\u2021${sf.code} ${sf.value}`;\n}\n\nfunction normalizeIndicatorValue(val) {\n if (val === ' ') {\n return '#';\n }\n return val;\n}\n\nexport function recordToString(record) {\n const ldr = `LDR ${record.leader}`;\n const fields = record.fields.map(f => fieldToString(f));\n return `${ldr}\\n${fields.join('\\n')}`;\n}\n\nexport function removeSubfield(record, tag, subfieldCode) {\n record.fields = record.fields.map(field => {\n if (field.tag !== tag || !field.subfields) { // Don't procss irrelevant fields\n return field;\n }\n field.subfields = field.subfields.filter(sf => sf.code !== subfieldCode);\n if (field.subfields.length === 0) {\n return false;\n }\n return field;\n }).filter(field => field);\n}\n\nexport function 
recordRemoveValuelessSubfields(record) {\n record.fields = record.fields.map(field => {\n if (!field.subfields) { // Keep control fields\n return field;\n }\n // Remove empty subfields from datafields:\n field.subfields = field.subfields.filter(sf => sf.value);\n\n if (field.subfields && field.subfields.length === 0) {\n return false; // Return false instead of a field if field has no subfields left. These will soon be filtered out.\n }\n\n return field; //if field has subfields return it\n }).filter(field => field); // Filter those falses out\n}\n\nexport function fieldToString(f) {\n if ('subfields' in f) {\n return `${f.tag} ${normalizeIndicatorValue(f.ind1)}${normalizeIndicatorValue(f.ind2)}${formatSubfields(f)}`;\n }\n return `${f.tag} ${f.value}`;\n\n function formatSubfields(field) {\n return field.subfields.map(sf => ` ${subfieldToString(sf)}`).join('');\n }\n}\n\nexport function fieldsToString(fields) {\n return fields.map(f => fieldToString(f)).join('\\t__SEPARATOR__\\t');\n}\n\nexport function nvdebugFieldArray(fields, prefix = ' ', func = undefined) {\n fields.forEach(field => nvdebug(`${prefix}${fieldToString(field)}`, func));\n}\n\nexport function isControlSubfieldCode(subfieldCode) {\n // NB! Only $w, $0, $1, $5, $6 and $8 are really control subfields. In Finland $9 is oft a control subfield\n // $3 material (part of the whole thing)\n // $4 means 'relationship' (similar to relator terms at least in X00 and similar)\n // $7 is usually provinance subfield. However, it can be stored in other subfields as well. See merge-fields/dataProvenance.js for details\n // However, change this only if needed. 
Maybe all provinance subfields should return true?\n // This may become relevant when AI starts to create stuff...\n if (['0', '1', '2', '3', '4', '5', '6', '7', '8', '9', 'w'].includes(subfieldCode)) {\n return true;\n }\n return false;\n}\n\nexport function getCatalogingLanguage(record, defaultCatalogingLanguage = undefined) {\n const [field040] = record.get(/^040$/u);\n if (!field040) {\n return defaultCatalogingLanguage;\n }\n const [b] = field040.subfields.filter(sf => sf.code === 'b');\n if (!b) {\n return defaultCatalogingLanguage;\n }\n return b.value;\n}\n\n\nexport function uniqArray(arr) {\n return arr.filter((val, i) => arr.indexOf(val) === i);\n}\n\nexport function fieldsAreIdentical(field1, field2) {\n if (field1.tag !== field2.tag) { // NB! We are skipping normalizations here on purpose! They should be done beforehand...\n return false;\n }\n return fieldToString(field1) === fieldToString(field2);\n\n // The order of subfields is relevant! Bloody JS idiotisms make people use conditions such as:\n // return field1.subfields.every(sf => field2.subfields.some(sf2 => sf.code === sf2.code && sf.value === sf2.value));\n}\n\nexport function fieldHasNSubfields(field, subfieldCode/*, subfieldValue = null*/) {\n const relevantSubfields = field.subfields.filter(sf => sf.code === subfieldCode);\n //if (subfieldValue === null) {\n return relevantSubfields.length;\n //}\n //const subset = relevantSubfields.filter(value => value === subfieldValue);\n //return subset.length;\n}\n\nexport function removeCopyright(value) {\n return value.replace(/^(?:c|p|\u00A9|\u2117|Cop\\. ?) 
?((?:1[0-9][0-9][0-9]|20[012][0-9])\\.?)$/ui, '$1');\n}\n\nfunction isNonStandardNonrepeatableSubfield(tag, subfieldCode) {\n // Put these into config or so...\n if (tag === '264') {\n return ['a', 'b', 'c'].includes(subfieldCode);\n }\n\n if (['336', '337', '338'].includes(tag)) {\n return ['a', 'b', '2'].includes(subfieldCode);\n }\n\n return false;\n}\n\n\nexport function subfieldIsRepeatable(tag, subfieldCode) {\n\n if (isNonStandardNonrepeatableSubfield(tag, subfieldCode)) {\n return false;\n }\n\n // These we know or \"know\":\n // NB! $5 is (according to MARC21 format) non-repeatable, and not usable in all fields, but Melinda has a local exception to this, see MET-300\n if ('0159'.indexOf(subfieldCode) > -1) {\n // Uh, can $0 appear on any field?\n return true;\n }\n\n const fieldSpecs = melindaFieldSpecs.fields.filter(field => field.tag === tag);\n if (fieldSpecs.length !== 1) {\n nvdebug(` WARNING! Getting field ${tag} data failed! ${fieldSpecs.length} hits. Default value true is used for'${subfieldCode}' .`, debugDev);\n return true;\n }\n\n const subfieldSpecs = fieldSpecs[0].subfields.filter(subfield => subfield.code === subfieldCode);\n // Currently we don't support multiple $6 fields due to re-indexing limitations...\n // Well, $6 is non-repeatable, isn't it?!?\n // (This might actually already be fixed... Marginal issue, but check eventually.)\n if (subfieldSpecs.length !== 1 || subfieldCode === '6') {\n return false; // repeatable if not specified, I guess. 
Maybe add log or warn?\n }\n return subfieldSpecs[0].repeatable;\n}\n\nfunction marc21GetTagsLegalIndicators(tag) {\n const fieldSpecs = melindaFieldSpecs.fields.filter(field => field.tag === tag);\n if (fieldSpecs.length === 0) {\n return undefined;\n }\n return fieldSpecs[0].indicators;\n}\n\nexport function marc21GetTagsLegalInd1Value(tag) {\n const indicator = marc21GetTagsLegalIndicators(tag);\n if (indicator === undefined) {\n return undefined;\n }\n return indicator.ind1;\n}\n\nexport function marc21GetTagsLegalInd2Value(tag) {\n const indicator = marc21GetTagsLegalIndicators(tag);\n if (indicator === undefined) {\n return undefined;\n }\n return indicator.ind2;\n}\n\nexport function nvdebugSubfieldArray(subfields, prefix = ' ', func = undefined) {\n subfields.forEach(subfield => nvdebug(`${prefix}${subfieldToString(subfield)}`, func));\n}\n\nexport function subfieldsAreIdentical(subfieldA, subfieldB) {\n return subfieldA.code === subfieldB.code && subfieldA.value === subfieldB.value;\n}\n\nexport function fieldHasMultipleSubfields(field, subfieldCode/*, subfieldValue = null*/) {\n return fieldHasNSubfields(field, subfieldCode) > 1;\n}\n\nexport function hasCopyright(value) {\n const modValue = removeCopyright(value);\n return value !== modValue;\n}\n\n\n\nexport function subfieldArraysContainSameData(arr1, arr2) {\n if ( !arr1.every(sf => arr2.some(sf2 => subfieldsAreIdentical(sf, sf2))) ) {\n return false;\n }\n\n return arr2.every(sf2 => arr1.some(sf => subfieldsAreIdentical(sf, sf2)));\n}"],
|
|
5
|
+
"mappings": "AAAA,OAAO,uBAAuB;AAK9B,MAAM,QAAQ,kBAAkB,oDAAoD;AAEpF,MAAM,WAAW,MAAM,OAAO,KAAK;AAEnC,SAAQ,yBAAwB;AAIzB,gBAAS,qBAAqB,QAAQ;AAC3C,QAAM,QAAQ,OAAO,IAAI,KAAK;AAE9B,SAAO,MAAM,SAAS,KAAK,MAAM,KAAK,OAAK,iBAAiB,GAAG,KAAK,GAAG,KAAK,iBAAiB,GAAG,KAAK,UAAU,CAAC;AAClH;AAEO,gBAAS,QAAQ,SAAS,OAAO,QAAW;AACjD,MAAI,MAAM;AACR,SAAK,OAAO;AAAA,EACd;AAEF;AAEO,gBAAS,iBAAiB,OAAO,cAAc,gBAAgB,MAAM;AAC1E,MAAI,CAAC,MAAM,WAAW;AACpB,WAAO;AAAA,EACT;AACA,MAAI,kBAAkB,MAAM;AAC1B,WAAO,MAAM,UAAU,KAAK,QAAM,GAAG,SAAS,YAAY;AAAA,EAC5D;AACA,SAAO,MAAM,UAAU,KAAK,QAAM,GAAG,SAAS,gBAAgB,kBAAkB,GAAG,KAAK;AAC1F;AAEO,gBAAS,iBAAiB,IAAI;AACnC,MAAI,CAAC,GAAG,OAAO;AACb,WAAO,SAAI,GAAG,IAAI;AAAA,EACpB;AACA,SAAO,SAAI,GAAG,IAAI,IAAI,GAAG,KAAK;AAChC;AAEA,SAAS,wBAAwB,KAAK;AACpC,MAAI,QAAQ,KAAK;AACf,WAAO;AAAA,EACT;AACA,SAAO;AACT;AAEO,gBAAS,eAAe,QAAQ;AACrC,QAAM,MAAM,SAAS,OAAO,MAAM;AAClC,QAAM,SAAS,OAAO,OAAO,IAAI,OAAK,cAAc,CAAC,CAAC;AACtD,SAAO,GAAG,GAAG;AAAA,EAAK,OAAO,KAAK,IAAI,CAAC;AACrC;AAEO,gBAAS,eAAe,QAAQ,KAAK,cAAc;AACxD,SAAO,SAAS,OAAO,OAAO,IAAI,WAAS;AACzC,QAAI,MAAM,QAAQ,OAAO,CAAC,MAAM,WAAW;AACzC,aAAO;AAAA,IACT;AACA,UAAM,YAAY,MAAM,UAAU,OAAO,QAAM,GAAG,SAAS,YAAY;AACvE,QAAI,MAAM,UAAU,WAAW,GAAG;AAChC,aAAO;AAAA,IACT;AACA,WAAO;AAAA,EACT,CAAC,EAAE,OAAO,WAAS,KAAK;AAC1B;AAEO,gBAAS,+BAA+B,QAAQ;AACrD,SAAO,SAAS,OAAO,OAAO,IAAI,WAAS;AACzC,QAAI,CAAC,MAAM,WAAW;AACpB,aAAO;AAAA,IACT;AAEA,UAAM,YAAY,MAAM,UAAU,OAAO,QAAM,GAAG,KAAK;AAEvD,QAAI,MAAM,aAAa,MAAM,UAAU,WAAW,GAAG;AACnD,aAAO;AAAA,IACT;AAEA,WAAO;AAAA,EACT,CAAC,EAAE,OAAO,WAAS,KAAK;AAC1B;AAEO,gBAAS,cAAc,GAAG;AAC/B,MAAI,eAAe,GAAG;AACpB,WAAO,GAAG,EAAE,GAAG,IAAI,wBAAwB,EAAE,IAAI,CAAC,GAAG,wBAAwB,EAAE,IAAI,CAAC,GAAG,gBAAgB,CAAC,CAAC;AAAA,EAC3G;AACA,SAAO,GAAG,EAAE,GAAG,OAAO,EAAE,KAAK;AAE7B,WAAS,gBAAgB,OAAO;AAC9B,WAAO,MAAM,UAAU,IAAI,QAAM,IAAI,iBAAiB,EAAE,CAAC,EAAE,EAAE,KAAK,EAAE;AAAA,EACtE;AACF;AAEO,gBAAS,eAAe,QAAQ;AACrC,SAAO,OAAO,IAAI,OAAK,cAAc,CAAC,CAAC,EAAE,KAAK,iBAAmB;AACnE;AAEO,gBAAS,kBAAkB,QAAQ,SAAS,MAAM,OAAO,QAAW;AACzE,SAAO,QAAQ,WAAS,QAAQ,GAAG,MAAM,GAAG,cAAc,KAAK,CAAC,IAAI,IAAI,CAAC;A
AC3E;AAEO,gBAAS,sBAAsB,cAAc;AAOlD,MAAI,CAAC,KAAK,KAAK,KAAK,KAAK,KAAK,KAAK,KAAK,KAAK,KAAK,KAAK,GAAG,EAAE,SAAS,YAAY,GAAG;AAClF,WAAO;AAAA,EACT;AACA,SAAO;AACT;AAEO,gBAAS,sBAAsB,QAAQ,4BAA4B,QAAW;AACnF,QAAM,CAAC,QAAQ,IAAI,OAAO,IAAI,QAAQ;AACtC,MAAI,CAAC,UAAU;AACb,WAAO;AAAA,EACT;AACA,QAAM,CAAC,CAAC,IAAI,SAAS,UAAU,OAAO,QAAM,GAAG,SAAS,GAAG;AAC3D,MAAI,CAAC,GAAG;AACN,WAAO;AAAA,EACT;AACA,SAAO,EAAE;AACX;AAGO,gBAAS,UAAU,KAAK;AAC7B,SAAO,IAAI,OAAO,CAAC,KAAK,MAAM,IAAI,QAAQ,GAAG,MAAM,CAAC;AACtD;AAEO,gBAAS,mBAAmB,QAAQ,QAAQ;AACjD,MAAI,OAAO,QAAQ,OAAO,KAAK;AAC7B,WAAO;AAAA,EACT;AACA,SAAO,cAAc,MAAM,MAAM,cAAc,MAAM;AAIvD;AAEO,gBAAS,mBAAmB,OAAO,cAAwC;AAChF,QAAM,oBAAoB,MAAM,UAAU,OAAO,QAAM,GAAG,SAAS,YAAY;AAE/E,SAAO,kBAAkB;AAI3B;AAEO,gBAAS,gBAAgB,OAAO;AACrC,SAAO,MAAM,QAAQ,mEAAmE,IAAI;AAC9F;AAEA,SAAS,mCAAmC,KAAK,cAAc;AAE7D,MAAI,QAAQ,OAAO;AACjB,WAAO,CAAC,KAAK,KAAK,GAAG,EAAE,SAAS,YAAY;AAAA,EAC9C;AAEA,MAAI,CAAC,OAAO,OAAO,KAAK,EAAE,SAAS,GAAG,GAAG;AACvC,WAAO,CAAC,KAAK,KAAK,GAAG,EAAE,SAAS,YAAY;AAAA,EAC9C;AAEA,SAAO;AACT;AAGO,gBAAS,qBAAqB,KAAK,cAAc;AAEtD,MAAI,mCAAmC,KAAK,YAAY,GAAG;AACzD,WAAO;AAAA,EACT;AAIA,MAAI,OAAO,QAAQ,YAAY,IAAI,IAAI;AAErC,WAAO;AAAA,EACT;AAEA,QAAM,aAAa,kBAAkB,OAAO,OAAO,WAAS,MAAM,QAAQ,GAAG;AAC7E,MAAI,WAAW,WAAW,GAAG;AAC3B,YAAQ,2BAA2B,GAAG,iBAAiB,WAAW,MAAM,yCAAyC,YAAY,OAAO,QAAQ;AAC5I,WAAO;AAAA,EACT;AAEA,QAAM,gBAAgB,WAAW,CAAC,EAAE,UAAU,OAAO,cAAY,SAAS,SAAS,YAAY;AAI/F,MAAI,cAAc,WAAW,KAAK,iBAAiB,KAAK;AACtD,WAAO;AAAA,EACT;AACA,SAAO,cAAc,CAAC,EAAE;AAC1B;AAEA,SAAS,6BAA6B,KAAK;AACzC,QAAM,aAAa,kBAAkB,OAAO,OAAO,WAAS,MAAM,QAAQ,GAAG;AAC7E,MAAI,WAAW,WAAW,GAAG;AAC3B,WAAO;AAAA,EACT;AACA,SAAO,WAAW,CAAC,EAAE;AACvB;AAEO,gBAAS,4BAA4B,KAAK;AAC/C,QAAM,YAAY,6BAA6B,GAAG;AAClD,MAAI,cAAc,QAAW;AAC3B,WAAO;AAAA,EACT;AACA,SAAO,UAAU;AACnB;AAEO,gBAAS,4BAA4B,KAAK;AAC/C,QAAM,YAAY,6BAA6B,GAAG;AAClD,MAAI,cAAc,QAAW;AAC3B,WAAO;AAAA,EACT;AACA,SAAO,UAAU;AACnB;AAEO,gBAAS,qBAAqB,WAAW,SAAS,MAAM,OAAO,QAAW;AAC/E,YAAU,QAAQ,cAAY,QAAQ,GAAG,MAAM,GAAG,iBAAiB,QAAQ,CAAC,IAAI,IAAI,CAAC;AACvF;AAEO,gBAAS,sBAAsB,WAAW,WAAW;AAC1D,SAAO,UAAU,SAAS,
UAAU,QAAQ,UAAU,UAAU,UAAU;AAC5E;AAEO,gBAAS,0BAA0B,OAAO,cAAwC;AACvF,SAAO,mBAAmB,OAAO,YAAY,IAAI;AACnD;AAEO,gBAAS,aAAa,OAAO;AAClC,QAAM,WAAW,gBAAgB,KAAK;AACtC,SAAO,UAAU;AACnB;AAIO,gBAAS,8BAA8B,MAAM,MAAM;AACxD,MAAK,CAAC,KAAK,MAAM,QAAM,KAAK,KAAK,SAAO,sBAAsB,IAAI,GAAG,CAAC,CAAC,GAAI;AACzE,WAAO;AAAA,EACT;AAEA,SAAO,KAAK,MAAM,SAAO,KAAK,KAAK,QAAM,sBAAsB,IAAI,GAAG,CAAC,CAAC;AAC1E;",
|
|
6
6
|
"names": []
|
|
7
7
|
}
|
package/package.json
CHANGED
|
@@ -14,7 +14,7 @@
|
|
|
14
14
|
"url": "https://github.com/NatLibFi/marc-record-validators-melinda"
|
|
15
15
|
},
|
|
16
16
|
"license": "MIT",
|
|
17
|
-
"version": "12.0.0-alpha.7",
|
|
17
|
+
"version": "12.0.0-alpha.9",
|
|
18
18
|
"main": "./dist/index.js",
|
|
19
19
|
"publishConfig": {
|
|
20
20
|
"access": "public"
|
|
@@ -33,19 +33,20 @@
|
|
|
33
33
|
"dev:debug": "cross-env LOG_LEVEL=debug DEBUG=@natlibfi/* NODE_ENV=test"
|
|
34
34
|
},
|
|
35
35
|
"dependencies": {
|
|
36
|
+
"@natlibfi/iso9-1995": "next",
|
|
36
37
|
"@natlibfi/issn-verify": "^1.0.6",
|
|
37
38
|
"@natlibfi/marc-record": "next",
|
|
38
39
|
"@natlibfi/marc-record-serializers": "next",
|
|
39
40
|
"@natlibfi/marc-record-validate": "next",
|
|
40
41
|
"@natlibfi/melinda-commons": "next",
|
|
41
42
|
"@natlibfi/sfs-4900": "next",
|
|
42
|
-
"@natlibfi/iso9-1995": "next",
|
|
43
43
|
"@natlibfi/sru-client": "next",
|
|
44
44
|
"cld3-asm": "^4.0.0",
|
|
45
45
|
"clone": "^2.1.2",
|
|
46
46
|
"debug": "^4.4.3",
|
|
47
|
-
"isbn3": "^
|
|
47
|
+
"isbn3": "^2.0.0",
|
|
48
48
|
"langs": "^2.0.0",
|
|
49
|
+
"undici": "^7.16.0",
|
|
49
50
|
"xml2js": "^0.6.2",
|
|
50
51
|
"xregexp": "^5.1.2"
|
|
51
52
|
},
|
|
@@ -56,12 +57,12 @@
|
|
|
56
57
|
"@natlibfi/fixugen": "next",
|
|
57
58
|
"@natlibfi/fixura": "next",
|
|
58
59
|
"cross-env": "^10.0.0",
|
|
59
|
-
"esbuild": "^0.25.
|
|
60
|
-
"eslint": "^9.
|
|
61
|
-
"fetch-mock": "^12.
|
|
60
|
+
"esbuild": "^0.25.12",
|
|
61
|
+
"eslint": "^9.39.1",
|
|
62
|
+
"fetch-mock": "^12.6.0"
|
|
62
63
|
},
|
|
63
64
|
"overrides": {
|
|
64
65
|
"nanoid": "^3.3.8"
|
|
65
66
|
},
|
|
66
|
-
"nvolkComment": "cld3-asm 4.0.0 uses emscripten-wasm-loader ^3.0.3 which uses problematic, non-secure nanoid version 2.X.X"
|
|
67
|
+
"nvolkComment": "cld3-asm 4.0.0 uses emscripten-wasm-loader ^3.0.3 which uses problematic, non-secure nanoid version 2.X.X. Isbn3 has breaking changes in 1.2.16-18 at least."
|
|
67
68
|
}
|
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
// Const finnishTerms = ['ysa', 'yso', 'kassu', 'seko', 'valo', 'kulo', 'puho', 'oiko', 'mero', 'liito', 'fast', 'allars', 'kaunokki'];
|
|
2
2
|
const finnishTerms = [
|
|
3
3
|
/^(?:allars|bella|fast|juho|jupo|kassu|kauno|kaunokki|keko|koko|kulo|liiko|liito|local|mero|mts|musa|oiko|puho|seko|woto|valo|ysa|yso)$/u,
|
|
4
|
-
/^(?:kauno|slm|yso)\//u
|
|
4
|
+
/^(?:kauno|slm|yso)\//u // <= yso/* etc
|
|
5
5
|
];
|
|
6
6
|
|
|
7
7
|
const validPuncMarks = '?-!.'; // NB! ')' and ']' are only valid for some fields!
|
|
@@ -501,7 +501,7 @@ const confSpec = [
|
|
|
501
501
|
index: null,
|
|
502
502
|
punc: false,
|
|
503
503
|
special: {
|
|
504
|
-
|
|
504
|
+
termSubfieldCode: '2',
|
|
505
505
|
finnishTerms,
|
|
506
506
|
else: true
|
|
507
507
|
}
|
|
@@ -517,7 +517,7 @@ const confSpec = [
|
|
|
517
517
|
index: null,
|
|
518
518
|
punc: false,
|
|
519
519
|
special: {
|
|
520
|
-
|
|
520
|
+
termSubfieldCode: '2',
|
|
521
521
|
finnishTerms,
|
|
522
522
|
else: true
|
|
523
523
|
}
|
|
@@ -65,12 +65,6 @@ export default function () {
|
|
|
65
65
|
|
|
66
66
|
// Field validation with punctuation rules for normal and special cases in subfunction (to reduce complexity to please travisci)
|
|
67
67
|
function validateField(field, linkedTag, fix, message) {
|
|
68
|
-
// This is used to find last subfield that should have punctuation
|
|
69
|
-
function findLastSubfield(field) {
|
|
70
|
-
const subfields = field.subfields.filter(sf => isNaN(sf.code) && 'value' in sf);
|
|
71
|
-
return subfields.slice(-1).shift();
|
|
72
|
-
}
|
|
73
|
-
|
|
74
68
|
function getDefaultPuncMarks(tag) {
|
|
75
69
|
if (tag.match(/^[1678](?:00|10|11|30)/u) || tag === '740') { // As defined in Loppupisteohje
|
|
76
70
|
return `${validPuncMarks})`;
|
|
@@ -98,7 +92,7 @@ function validateField(field, linkedTag, fix, message) {
|
|
|
98
92
|
|
|
99
93
|
// Last char should be punc, but it's not one of listed punctuation marks nor dot
|
|
100
94
|
if (punc && !(lastPuncMark || lastPuncDot)) {
|
|
101
|
-
console.log(puncMarks)
|
|
95
|
+
//console.log(puncMarks)
|
|
102
96
|
if (penultimateCharacter && validQuoteChars.includes(lastChar) && puncMarks.includes(penultimateCharacter)) {
|
|
103
97
|
// Exception: do nothing! Ending in punc+quote combo is all right, and does not imply a missing punc
|
|
104
98
|
}
|
|
@@ -189,12 +183,17 @@ function validateField(field, linkedTag, fix, message) {
|
|
|
189
183
|
normalPuncRules(lastSubField, res.punc, tag, false, false);
|
|
190
184
|
|
|
191
185
|
// Search for Finnish terms
|
|
192
|
-
} else if (res.special.
|
|
186
|
+
} else if (res.special.termSubfieldCode) {
|
|
193
187
|
lastSubField = findLastSubfield(field);
|
|
194
188
|
|
|
195
189
|
if (lastSubField) {
|
|
196
|
-
const
|
|
197
|
-
|
|
190
|
+
const lexicon = getLexicon(field, res.special.termSubfieldCode);
|
|
191
|
+
const proceed = !finnishException(field, res.special.termSubfieldCode, false);
|
|
192
|
+
|
|
193
|
+
|
|
194
|
+
//const languageField = field.subfields.find(({code}) => code === res.special.termSubfieldCode);
|
|
195
|
+
//if (languageField && languageField.value && finnishTerms.some(p => p.test(languageField.value))) {
|
|
196
|
+
if (lexicon && finnishTerms.some(p => p.test(lexicon)) && proceed) {
|
|
198
197
|
// If (languageField && languageField.value && finnishTerms.indexOf(languageField.value) > -1) {
|
|
199
198
|
normalPuncRules(lastSubField, res.punc, tag, true, false);
|
|
200
199
|
} else {
|
|
@@ -272,8 +271,12 @@ function validateField(field, linkedTag, fix, message) {
|
|
|
272
271
|
return;
|
|
273
272
|
}
|
|
274
273
|
|
|
274
|
+
const forceNormal = res.special ? finnishException(field, res.special.termSubfieldCode, true) : false;
|
|
275
275
|
// Normal rules
|
|
276
|
-
if (typeof res.special === 'undefined' || res.special === null) {
|
|
276
|
+
if (typeof res.special === 'undefined' || res.special === null || forceNormal) {
|
|
277
|
+
if (forceNormal) {
|
|
278
|
+
console.info("EXCEPTION. SKIP FINNISH RULES");
|
|
279
|
+
}
|
|
277
280
|
lastSubField = findLastSubfield(field);
|
|
278
281
|
|
|
279
282
|
if (lastSubField) {
|
|
@@ -300,3 +303,51 @@ export function validateSingleField(field, linkedTag, fix) {
|
|
|
300
303
|
return message;
|
|
301
304
|
}
|
|
302
305
|
|
|
306
|
+
/**
 * Return the lexicon (term source) named in a field, but only when it is one
 * of the Finnish lexicons matched by `finnishTerms`.
 *
 * @param {object} field - MARC field; data fields carry a `subfields` array.
 * @param {string} subfieldCode - Code of the subfield that names the lexicon
 *   (the configuration passes its `termSubfieldCode`, e.g. '2').
 * @returns {string|undefined} The lexicon value (e.g. 'yso/fin'), or
 *   `undefined` when the field has no such subfield, the subfield has no
 *   value, or the value does not match any pattern in `finnishTerms`.
 */
function getLexicon(field, subfieldCode) {
  // Fields without a subfields array (control fields) cannot name a lexicon.
  if (!Array.isArray(field.subfields)) {
    return undefined;
  }

  // Only the first subfield carrying the given code is consulted.
  const lexiconSubfield = field.subfields.find(({code}) => code === subfieldCode);
  if (!lexiconSubfield || !lexiconSubfield.value) {
    return undefined;
  }

  const isFinnishLexicon = finnishTerms.some(pattern => pattern.test(lexiconSubfield.value));
  return isFinnishLexicon ? lexiconSubfield.value : undefined;
}
|
|
316
|
+
|
|
317
|
+
/**
 * Tell whether a field using a Finnish lexicon is an exception to the usual
 * Finnish-term punctuation handling because its last data subfield ends in
 * an abbreviation that legitimately carries a trailing dot.
 *
 * Only field 648 with lexicon 'yso/fin' or 'yso/swe' is recognised.
 *
 * @param {object} field - MARC data field (`tag`, `subfields`).
 * @param {string} termSubfieldCode - Code of the subfield naming the lexicon.
 * @param {boolean} [hasDot=true] - When true, test for the abbreviation WITH
 *   its trailing dot (a dot that is not to be removed). When false, test for
 *   the abbreviation WITHOUT the dot (a term that needs a dot).
 * @returns {boolean} True when the last data subfield ends in one of the
 *   listed abbreviations in the requested form.
 */
function finnishException(field, termSubfieldCode, hasDot = true) {
  const lexicon = getLexicon(field, termSubfieldCode);
  if (!lexicon) {
    return false;
  }

  const lastSubfield = findLastSubfield(field);
  if (!lastSubfield || !lastSubfield.value) {
    return false;
  }

  // Some terms can end in '.' that we want to keep. Currently only the
  // yso-aika terms of field 648 are checked.
  // yso has 'MODEL.LA.' and 'Corel R.A.V.E.' but these are so rare they are not listed.
  if (field.tag !== '648') {
    return false;
  }

  const {value} = lastSubfield;

  if (lexicon === 'yso/fin') { // 'eaa.' appears in prefLabels and 'eKr.' in altLabels
    // Every alternative sits inside the group, so each one requires the
    // preceding space and is anchored to the end of the value.
    const pattern = hasDot ? / (?:eaa|[ej]Kr|jaa)\.$/u : / (?:eaa|[ej]Kr|jaa)$/u;
    return pattern.test(value);
  }

  if (lexicon === 'yso/swe') {
    const pattern = hasDot ? / (?:[ef]\.Kr|f\.v\.t)\.$/u : / (?:[ef]\.Kr|f\.v\.t)$/u;
    return pattern.test(value);
  }

  return false;
}
|
|
348
|
+
|
|
349
|
+
// This is used to find last subfield that should have punctuation
|
|
350
|
+
/**
 * Finds the last subfield that should carry the field's ending punctuation.
 *
 * Subfields whose code coerces to a number (e.g. '0', '2', '9') are skipped,
 * as are subfields that have no `value` property at all.
 *
 * @param {object} field - MARC field. Fields without a `subfields` array (e.g. control fields) yield undefined.
 * @returns {object|undefined} The last qualifying subfield, or undefined when there is none.
 */
function findLastSubfield(field) {
  if (!field || !Array.isArray(field.subfields)) {
    return undefined;
  }
  // Number() coercion is intentional: subfield codes are strings and numeric ones are to be ignored.
  const candidates = field.subfields.filter(sf => Number.isNaN(Number(sf.code)) && 'value' in sf);
  return candidates[candidates.length - 1];
}
|
|
@@ -1585,7 +1585,7 @@ describe('ending-punctuation', () => {
|
|
|
1585
1585
|
]
|
|
1586
1586
|
});
|
|
1587
1587
|
|
|
1588
|
-
const
|
|
1588
|
+
const recordValid648FinNo = new MarcRecord({
|
|
1589
1589
|
leader: '',
|
|
1590
1590
|
fields: [
|
|
1591
1591
|
{
|
|
@@ -1596,6 +1596,16 @@ describe('ending-punctuation', () => {
|
|
|
1596
1596
|
{code: 'a', value: '1900-luku'},
|
|
1597
1597
|
{code: '2', value: 'yso/swe'}
|
|
1598
1598
|
]
|
|
1599
|
+
},
|
|
1600
|
+
{ // Exception: term ending in dot:
|
|
1601
|
+
tag : '648',
|
|
1602
|
+
ind1: ' ',
|
|
1603
|
+
ind2: '7',
|
|
1604
|
+
subfields: [
|
|
1605
|
+
{code: 'a', value: '1200-luku eaa.'},
|
|
1606
|
+
{code: '2', value: 'yso/fin'},
|
|
1607
|
+
{code: '0', value: 'http://www.yso.fi/onto/yso/p1129911200'}
|
|
1608
|
+
]
|
|
1599
1609
|
}
|
|
1600
1610
|
]
|
|
1601
1611
|
});
|
|
@@ -1668,7 +1678,7 @@ describe('ending-punctuation', () => {
|
|
|
1668
1678
|
|
|
1669
1679
|
it('Finds record valid - 648 Finnish, without punc', async () => {
|
|
1670
1680
|
const validator = await validatorFactory();
|
|
1671
|
-
const result = await validator.validate(
|
|
1681
|
+
const result = await validator.validate(recordValid648FinNo);
|
|
1672
1682
|
assert.equal(result.valid, true);
|
|
1673
1683
|
});
|
|
1674
1684
|
|
|
@@ -1713,7 +1723,7 @@ describe('ending-punctuation', () => {
|
|
|
1713
1723
|
]
|
|
1714
1724
|
});
|
|
1715
1725
|
|
|
1716
|
-
const
|
|
1726
|
+
const recordInvalid648FinYes = new MarcRecord({
|
|
1717
1727
|
leader: '',
|
|
1718
1728
|
fields: [
|
|
1719
1729
|
{
|
|
@@ -1724,6 +1734,15 @@ describe('ending-punctuation', () => {
|
|
|
1724
1734
|
{code: 'a', value: '1900-luku.'},
|
|
1725
1735
|
{code: '2', value: 'yso/swe'}
|
|
1726
1736
|
]
|
|
1737
|
+
}, { // Exception:
|
|
1738
|
+
tag: '648',
|
|
1739
|
+
ind1: ' ',
|
|
1740
|
+
ind2: '7',
|
|
1741
|
+
subfields: [
|
|
1742
|
+
{code: 'a', value: '1200-luku eaa'},
|
|
1743
|
+
{code: '2', value: 'yso/fin'},
|
|
1744
|
+
{code: '0', value: 'http://www.yso.fi/onto/yso/p1129911200'}
|
|
1745
|
+
]
|
|
1727
1746
|
}
|
|
1728
1747
|
]
|
|
1729
1748
|
});
|
|
@@ -1799,9 +1818,9 @@ describe('ending-punctuation', () => {
|
|
|
1799
1818
|
|
|
1800
1819
|
it('Finds record invalid - 648 Finnish, with punc', async () => {
|
|
1801
1820
|
const validator = await validatorFactory();
|
|
1802
|
-
const result = await validator.validate(
|
|
1821
|
+
const result = await validator.validate(recordInvalid648FinYes);
|
|
1803
1822
|
assert.deepEqual(result, {
|
|
1804
|
-
message: ['Field 648 has unwanted ending punctuation \'.\''],
|
|
1823
|
+
message: ['Field 648 has unwanted ending punctuation \'.\'', "Field 648 requires ending punctuation, ends in 'a'"],
|
|
1805
1824
|
valid: false
|
|
1806
1825
|
});
|
|
1807
1826
|
});
|
|
@@ -1857,11 +1876,16 @@ describe('ending-punctuation', () => {
|
|
|
1857
1876
|
|
|
1858
1877
|
it('Repairs the invalid record - 648 Finnish, removes punc $a', async () => {
|
|
1859
1878
|
const validator = await validatorFactory();
|
|
1860
|
-
const result = await validator.fix(
|
|
1861
|
-
|
|
1879
|
+
const result = await validator.fix(recordInvalid648FinYes);
|
|
1880
|
+
//console.info("NV-------");
|
|
1881
|
+
//console.info(JSON.stringify(recordInvalid648FinYes));
|
|
1882
|
+
//console.info(JSON.stringify(recordValid648FinNo));
|
|
1883
|
+
//assert.equal(recordInvalid648FinYes.equalsTo(recordValid648FinNo), true);
|
|
1884
|
+
assert.deepEqual(recordInvalid648FinYes, recordValid648FinNo);
|
|
1885
|
+
//console.info(JSON.stringify(result));
|
|
1862
1886
|
assert.deepEqual(result, {
|
|
1863
|
-
message: ['Field 648 has unwanted ending punctuation \'.\''],
|
|
1864
|
-
fix: ['Field 648 - Removed punctuation from $a'],
|
|
1887
|
+
message: ['Field 648 has unwanted ending punctuation \'.\'', "Field 648 requires ending punctuation, ends in 'a'"],
|
|
1888
|
+
fix: ['Field 648 - Removed punctuation from $a', 'Field 648 - Added punctuation to $a'],
|
|
1865
1889
|
valid: false
|
|
1866
1890
|
});
|
|
1867
1891
|
});
|
package/src/indicator-fixes.js
CHANGED
|
@@ -171,6 +171,18 @@ function normalize245Indicator1(field, record) {
|
|
|
171
171
|
field.ind1 = field1XX.length === 0 ? '0' : '1';
|
|
172
172
|
}
|
|
173
173
|
|
|
174
|
+
/**
 * Sets the first indicator of a 520 field to '8' ("no display constant
 * generated") when the field's only $a is merely a label such as 'Abstract.'
 * (part of MELKEHITYS-2579). Fields with any other tag, with no subfields,
 * or with zero or several $a subfields are left untouched.
 *
 * @param {object} field - MARC field; `ind1` is modified in place.
 * @returns {undefined}
 */
function noDisplayConstantGenerated520Indicator1(field) {
  if (field.tag !== '520' || !Array.isArray(field.subfields)) {
    return;
  }
  const labelOnlyValues = ['Abstract.', 'Abstrakt.', 'Abstrakti.', 'English Summary.', 'Sammandrag.', 'Tiivistelmä.'];
  const as = field.subfields.filter(sf => sf.code === 'a');
  // Inspect the $a itself, not whatever subfield happens to be first in the field
  if (as.length === 1 && labelOnlyValues.includes(as[0].value)) {
    field.ind1 = '8';
  }
}
|
|
185
|
+
|
|
174
186
|
function normalize776Indicator2(field) {
|
|
175
187
|
if (field.tag !== '776') {
|
|
176
188
|
return;
|
|
@@ -242,6 +254,7 @@ function recordNormalizeIndicators(record) {
|
|
|
242
254
|
function fieldNormalizeIndicators(field, record, languages) {
|
|
243
255
|
normalize084Indicator1(field);
|
|
244
256
|
normalize245Indicator1(field, record);
|
|
257
|
+
noDisplayConstantGenerated520Indicator1(field);
|
|
245
258
|
normalizeNonFilingIndicator1(field, languages);
|
|
246
259
|
normalizeNonFilingIndicator2(field, languages);
|
|
247
260
|
normalize776Indicator2(field);
|
package/src/isbn-issn.js
CHANGED
|
@@ -29,8 +29,14 @@ export default ({hyphenateISBN = false, handleInvalid = false} = {}) => {
|
|
|
29
29
|
|
|
30
30
|
/**
 * Decides whether a subfield value fails ISBN validation.
 *
 * Only the first word of the value (as returned by `getFirstWord`) is
 * audited with `ISBN.audit`.
 *
 * @param {string} isbn - Raw subfield value.
 * @returns {boolean} True when the audit reports the ISBN as not valid or when the audit throws.
 */
function invalidISBN(isbn) {
  const candidate = getFirstWord(isbn);
  try {
    const {validIsbn} = ISBN.audit(candidate);
    return !validIsbn;
  } catch {
    // An audit that throws is treated the same way as a failed audit
    return true;
  }
}
|
|
35
41
|
|
|
36
42
|
function invalidSubfield(subfield) {
|
|
@@ -238,9 +244,8 @@ export default ({hyphenateISBN = false, handleInvalid = false} = {}) => {
|
|
|
238
244
|
function normalizeIsbnValue(value) {
|
|
239
245
|
const trimmedValue = getFirstWord(value);
|
|
240
246
|
//const trimmedValue = trimISBN(value); // NB! This might lose information that should be stored in $q...
|
|
241
|
-
|
|
242
|
-
|
|
243
|
-
return undefined;
|
|
247
|
+
if (invalidISBN(trimmedValue)) {
|
|
248
|
+
return undefined; // should this return value (= nothing normalized), not undefined?
|
|
244
249
|
}
|
|
245
250
|
const numbersOnly = trimmedValue.replace(/[^0-9Xx]+/ug, '');
|
|
246
251
|
const parsedIsbn = ISBN.parse(trimmedValue);
|
package/src/punctuation2.js
CHANGED
|
@@ -10,9 +10,10 @@
|
|
|
10
10
|
* (They are jumped over when looking for next (non-controlfield subfield)
|
|
11
11
|
*/
|
|
12
12
|
import {validateSingleField} from './ending-punctuation.js';
|
|
13
|
+
import {tagToDataProvenanceSubfieldCode} from './merge-fields/dataProvenance.js';
|
|
13
14
|
import {fieldGetUnambiguousTag} from './subfield6Utils.js';
|
|
14
15
|
//import createDebugLogger from 'debug';
|
|
15
|
-
import {fieldToString, nvdebug} from './utils.js';
|
|
16
|
+
import {fieldToString, isControlSubfieldCode, nvdebug} from './utils.js';
|
|
16
17
|
import clone from 'clone';
|
|
17
18
|
|
|
18
19
|
//const debug = createDebugLogger('debug/punctuation2');
|
|
@@ -49,12 +50,19 @@ export default function () {
|
|
|
49
50
|
}
|
|
50
51
|
}
|
|
51
52
|
|
|
52
|
-
|
|
53
|
-
|
|
53
|
+
|
|
54
|
+
|
|
55
|
+
/**
 * Tells whether a subfield is to be jumped over when looking for the next
 * subfield that matters for punctuation.
 *
 * @param {object} subfield - Subfield whose `code` is inspected.
 * @param {string} tag - Tag of the field the subfield belongs to; selects the data provenance subfield code.
 * @returns {boolean} True for the tag's data provenance subfield, otherwise whatever `isControlSubfieldCode` says about the code.
 */
function isIrrelevantSubfield(subfield, tag) {
  const provenanceCode = tagToDataProvenanceSubfieldCode(tag);
  const {code} = subfield;
  // isControlSubfieldCode() currently covers other stuff as well ($3, $4, $7, $9...)
  return code === provenanceCode || isControlSubfieldCode(code);
}
|
|
55
62
|
|
|
63
|
+
|
|
56
64
|
/**
 * Returns the first subfield located after the given index that is not
 * classified as irrelevant by `isIrrelevantSubfield`.
 *
 * @param {object} field - MARC data field (`subfields` and `tag` are read).
 * @param {number} currSubfieldIndex - Index of the current subfield; only later subfields are considered.
 * @returns {object|undefined} The next relevant subfield, or undefined when there is none.
 */
function getNextRelevantSubfield(field, currSubfieldIndex) {
  for (const [position, candidate] of field.subfields.entries()) {
    if (position > currSubfieldIndex && !isIrrelevantSubfield(candidate, field.tag)) {
      return candidate;
    }
  }
  return undefined;
}
|
|
59
67
|
|
|
60
68
|
export function fieldGetFixedString(field, add = true) {
|
|
@@ -155,7 +163,8 @@ const remove490And830Whatever = [{'code': 'axyzv', 'followedBy': 'axyzv', 'remov
|
|
|
155
163
|
// Punctuation removal rules for linking entry fields. Each rule names the subfield
// codes it applies to ('code'), optionally the codes of the following subfield
// ('followedBy') and the pattern that is stripped from the end of the value ('remove').
const linkingEntryRemoveWhatever = [
  {code: 'i', followedBy: 'at', remove: / ?:$/u}, // ':'
  {code: 'at', remove: /\.$/u},
  // Only the ". -" separator is still used in music. We can strip it, but can only create the non-music punctuation!
  {code: 'abdghiklmnopqrstuwxyz', followedBy: 'abdghiklmnopqrstuwxyz#', remove: /\. -$/u}
];
|
|
160
169
|
|
|
161
170
|
|
|
@@ -1,9 +1,23 @@
|
|
|
1
1
|
import assert from 'node:assert';
|
|
2
|
-
import
|
|
2
|
+
import createDebugLogger from 'debug';
|
|
3
|
+
import fetchMock from 'fetch-mock';
|
|
4
|
+
|
|
3
5
|
import validatorFactory from './translate-terms.js';
|
|
6
|
+
|
|
7
|
+
import {MarcRecord} from '@natlibfi/marc-record';
|
|
4
8
|
import {READERS} from '@natlibfi/fixura';
|
|
5
9
|
import generateTests from '@natlibfi/fixugen';
|
|
6
|
-
import
|
|
10
|
+
import {fakeData} from '../test-fixtures/translate-terms-data.js';
|
|
11
|
+
|
|
12
|
+
const uris = [
|
|
13
|
+
'http://www.yso.fi/onto/yso/p13299',
|
|
14
|
+
'http://www.yso.fi/onto/yso/p111739',
|
|
15
|
+
'http://www.yso.fi/onto/yso/p6197061979',
|
|
16
|
+
'http://www.yso.fi/onto/yso/p6196061969',
|
|
17
|
+
'http://urn.fi/URN:NBN:fi:au:slm:s161'
|
|
18
|
+
];
|
|
19
|
+
|
|
20
|
+
|
|
7
21
|
|
|
8
22
|
generateTests({
|
|
9
23
|
callback,
|
|
@@ -15,6 +29,15 @@ generateTests({
|
|
|
15
29
|
},
|
|
16
30
|
hooks: {
|
|
17
31
|
before: async () => {
|
|
32
|
+
|
|
33
|
+
fetchMock.mockGlobal()
|
|
34
|
+
.get(`https://api.finto.fi/rest/v1/data?uri=${uris[0]}&format=application%2Fjson`, {status: 200, headers: {}, body: fakeData})
|
|
35
|
+
.get(`https://api.finto.fi/rest/v1/data?uri=${uris[1]}&format=application%2Fjson`, {status: 200, headers: {}, body: fakeData})
|
|
36
|
+
.get(`https://api.finto.fi/rest/v1/data?uri=${uris[2]}&format=application%2Fjson`, {status: 200, headers: {}, body: fakeData})
|
|
37
|
+
.get(`https://api.finto.fi/rest/v1/data?uri=${uris[3]}&format=application%2Fjson`, {status: 200, headers: {}, body: fakeData})
|
|
38
|
+
.get(`https://api.finto.fi/rest/v1/data?uri=${uris[4]}&format=application%2Fjson`, {status: 200, headers: {}, body: fakeData});
|
|
39
|
+
|
|
40
|
+
|
|
18
41
|
testValidatorFactory();
|
|
19
42
|
}
|
|
20
43
|
}
|
package/src/utils.js
CHANGED
|
@@ -103,6 +103,12 @@ export function nvdebugFieldArray(fields, prefix = ' ', func = undefined) {
|
|
|
103
103
|
}
|
|
104
104
|
|
|
105
105
|
export function isControlSubfieldCode(subfieldCode) {
|
|
106
|
+
// NB! Only $w, $0, $1, $5, $6 and $8 are really control subfields. In Finland $9 is often a control subfield as well.
|
|
107
|
+
// $3 material (part of the whole thing)
|
|
108
|
+
// $4 means 'relationship' (similar to relator terms at least in X00 and similar)
|
|
109
|
+
// $7 is usually the provenance subfield. However, provenance can be stored in other subfields as well. See merge-fields/dataProvenance.js for details
|
|
110
|
+
// However, change this only if needed. Maybe all provenance subfields should return true?
|
|
111
|
+
// This may become relevant when AI starts to create stuff...
|
|
106
112
|
if (['0', '1', '2', '3', '4', '5', '6', '7', '8', '9', 'w'].includes(subfieldCode)) {
|
|
107
113
|
return true;
|
|
108
114
|
}
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
{
|
|
2
|
+
"_validationOptions": {},
|
|
3
|
+
"fields": [
|
|
4
|
+
{ "tag": "005", "value": "20220202020202.0" },
|
|
5
|
+
{ "tag": "520", "ind1": "8", "ind2": " ", "subfields": [ {"code": "a", "value": "Abstrakti."}, {"code": "9", "value": "TESTI<KEEP>"} ]},
|
|
6
|
+
{ "tag": "520", "ind1": " ", "ind2": " ", "subfields": [ {"code": "a", "value": "Whatever."}]},
|
|
7
|
+
{ "tag": "520", "ind1": "8", "ind2": " ", "subfields": [ {"code": "a", "value": "Tiivistelmä."}]}
|
|
8
|
+
|
|
9
|
+
],
|
|
10
|
+
"leader": ""
|
|
11
|
+
}
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
{
|
|
2
|
+
"_validationOptions": {},
|
|
3
|
+
"fields": [
|
|
4
|
+
{ "tag": "005", "value": "20220202020202.0" },
|
|
5
|
+
{ "tag": "520", "ind1": " ", "ind2": " ", "subfields": [ {"code": "a", "value": "Abstrakti."}, {"code": "9", "value": "TESTI<KEEP>"} ]},
|
|
6
|
+
{ "tag": "520", "ind1": " ", "ind2": " ", "subfields": [ {"code": "a", "value": "Whatever."}]},
|
|
7
|
+
{ "tag": "520", "ind1": "3", "ind2": " ", "subfields": [ {"code": "a", "value": "Tiivistelmä."}]}
|
|
8
|
+
|
|
9
|
+
],
|
|
10
|
+
"leader": ""
|
|
11
|
+
}
|
|
@@ -0,0 +1,42 @@
|
|
|
1
|
+
const fakeTerms = {
|
|
2
|
+
graph: [
|
|
3
|
+
{
|
|
4
|
+
uri: 'http://www.yso.fi/onto/yso/p13299',
|
|
5
|
+
prefLabel: [
|
|
6
|
+
{ lang: 'fi', value: 'laiturit' },
|
|
7
|
+
{ lang: 'sv', value: 'bryggor'}
|
|
8
|
+
]
|
|
9
|
+
},
|
|
10
|
+
{
|
|
11
|
+
uri: 'http://www.yso.fi/onto/yso/p111739',
|
|
12
|
+
prefLabel: [
|
|
13
|
+
{ lang: 'fi', value: 'Ivalo (Inari)' },
|
|
14
|
+
{ lang: 'sv', value: 'Ivalo (Enare)'}
|
|
15
|
+
]
|
|
16
|
+
},
|
|
17
|
+
{
|
|
18
|
+
uri: 'http://www.yso.fi/onto/yso/p6197061979',
|
|
19
|
+
prefLabel: [
|
|
20
|
+
{ lang: 'fi', value: '1970-luku' },
|
|
21
|
+
{ lang: 'sv', value: '1970-talet' }
|
|
22
|
+
]
|
|
23
|
+
},
|
|
24
|
+
{
|
|
25
|
+
uri: 'http://www.yso.fi/onto/yso/p6196061969',
|
|
26
|
+
prefLabel: [
|
|
27
|
+
{ lang: 'fi', value: '1960-luku' },
|
|
28
|
+
{ lang: 'sv', value: '1960-talet' }
|
|
29
|
+
]
|
|
30
|
+
},
|
|
31
|
+
{
|
|
32
|
+
uri: 'http://urn.fi/URN:NBN:fi:au:slm:s161',
|
|
33
|
+
prefLabel: [
|
|
34
|
+
{ lang: 'fi', value: 'naistenlehdet' },
|
|
35
|
+
{ lang: 'sv', value: 'damtidningar' }
|
|
36
|
+
]
|
|
37
|
+
}
|
|
38
|
+
]
|
|
39
|
+
|
|
40
|
+
};
|
|
41
|
+
|
|
42
|
+
export const fakeData = JSON.stringify(fakeTerms);
|