UNPKG

@natlibfi/melinda-record-match-validator

Version:

Validates if two records matched by melinda-record-matching can be merged and sets merge priority

93 lines (70 loc) 2.82 kB
import createDebugLogger from 'debug'; import {hasFields} from './collectFunctions/collectUtils'; //import {nvdebug} from './utils'; const debug = createDebugLogger('@natlibfi/melinda-record-match-validator:alephFunctions'); const debugDev = debug.extend('dev'); //const debugData = debug.extend('data'); // Collect SID export function getSID(record) { const SIDs = hasFields('SID', record).map(field => sidToJson(field)); debugDev('SIDs: %o', SIDs); return SIDs; function sidToJson(sid) { const [database] = sid.subfields.filter(sub => sub.code === 'b').map(sub => sub.value); const [id] = sid.subfields.filter(sub => sub.code === 'c').map(sub => sub.value); return {id, database}; } } // Compare SID export function compareSID(recordValuesA, recordValuesB) { const SIDsA = recordValuesA.SID; const SIDsB = recordValuesB.SID; return compareSIDValues(SIDsA, SIDsB); } function compareSIDValues(SIDsA, SIDsB) { debugDev('A: %o vs B: %o', SIDsA, SIDsB); return compareSIDContent(); // eslint-disable-next-line max-statements function compareSIDContent() { if (SIDsB.length === 0) { if (SIDsA.length > 0) { debugDev('SIDs A contains values and B is empty'); return 'A'; } debugDev('Both SIDS are empty'); return true; } if (SIDsA.length === 0) { debugDev('SIDs B contains values and A is empty'); return 'B'; } // Same database & different id => HARD failure if (SIDsA.some(sidA => SIDsB.some(sidB => sidA.database === sidB.database && sidA.id !== sidB.id))) { debugDev('SIDs: same db but diffent ids: fail'); return false; } const onlyA = SIDsA.filter(SIDA => SIDsB.every(SIDB => SIDA.database !== SIDB.database)); const onlyB = SIDsB.filter(SIDB => SIDsA.every(SIDA => SIDA.database !== SIDB.database)); if (onlyA.length === 0 && onlyB.length === 0) { debugDev('SIDs A and B are same'); return true; } // It's union: same result both ways... And anyway we are interested in the different values, not the same ones. //const SIDsBContainsFromA = SIDsA.filter(SIDA => SIDsB.some(SIDB => SIDA.database === SIDB.database && SIDA.id === SIDB.id)); //const SIDsAContainsFromB = SIDsB.filter(SIDB => SIDsA.some(SIDA => SIDA.database === SIDB.database && SIDA.id === SIDB.id)); if (onlyA.length > 0 && onlyB.length === 0) { debugDev('SIDs A contains all values from B'); return 'A'; } if (onlyB.length > 0 && onlyA.length === 0) { debugDev('SIDs B contains all values from A'); return 'B'; } return true; // default to true } } export function checkSID({record1, record2}) { const fields1 = getSID(record1); const fields2 = getSID(record2); return compareSIDValues(fields1, fields2); }