@natlibfi/melinda-record-match-validator
Version:
Validates if two records matched by melinda-record-matching can be merged and sets merge priority
52 lines (46 loc) • 1.87 kB
JavaScript
import {recordGetSubfieldValuesFromNonRepeatableField} from '../utils.js';
//// Scores for various values in 040$b Language Cataloging
// Sorry, my Finlandswedish colleagues and friends: I've given Finnis top priority.
// 'fin', 'swe', and 'mul' so 'mul' comes third. It's typically seen in copycatalogued records,
// that have not (yet) been fully translated. These werethe original three.
// However, NL has done English-only records for Nordenskiöld collection, so we'll prefer 'eng' over other languages.
const scoreFor040b = {'fin': 4, 'swe': 3, 'mul': 2, 'eng': 1};
export function check040b({record1, record2}) {
const score1 = recordScore040FieldLanguage(record1);
const score2 = recordScore040FieldLanguage(record2);
//nvdebug(`040$b scores: ${score1} vs ${score2}`);
if (score1 > score2) {
return 'A';
}
if (score1 < score2) {
return 'B';
}
return true; // This test does not fail
function recordScore040FieldLanguage(record) {
const bs = recordGetSubfieldValuesFromNonRepeatableField(record, '040', 'b');
if (bs.length !== 1 || !(bs[0] in scoreFor040b)) {
return 0;
}
return scoreFor040b[bs[0]];
}
}
export function check040e({record1, record2}) {
const score1 = recordScore040FieldDescriptionConvention(record1);
const score2 = recordScore040FieldDescriptionConvention(record2);
//nvdebug(`040$e scores: ${score1} vs ${score2}`);
if (score1 > score2) {
return 'A';
}
if (score1 < score2) {
return 'B';
}
return true; // This test does not fail
function recordScore040FieldDescriptionConvention(record) {
const es = recordGetSubfieldValuesFromNonRepeatableField(record, '040', 'e');
// Is multiple $e's a problem? Once I thought so, but not anymore. However, keep this comment here for discussion.
if (es.includes('rda')) {
return 1;
}
return 0;
}
}