UNPKG

wink-nlp

Version:

Developer friendly Natural Language Processing ✨

81 lines (73 loc) 3.17 kB
// wink-nlp // // Copyright (C) GRAYPE Systems Private Limited // // This file is part of “wink-nlp”. // // Permission is hereby granted, free of charge, to any // person obtaining a copy of this software and // associated documentation files (the "Software"), to // deal in the Software without restriction, including // without limitation the rights to use, copy, modify, // merge, publish, distribute, sublicense, and/or sell // copies of the Software, and to permit persons to // whom the Software is furnished to do so, subject to // the following conditions: // // The above copyright notice and this permission notice // shall be included in all copies or substantial // portions of the Software. // // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF // ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED // TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A // PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL // THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, // DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF // CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN // CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER // DEALINGS IN THE SOFTWARE. // var its = require( '../its.js' ); var as = require( '../as.js' ); var allowed = require( '../allowed.js' ); var reconstructSpaces = require( '../reconstruct-spaces.js' ); var constants = require( '../constants.js' ); // Size of a single token. var tkSize = constants.tkSize; // Mask for preceding spaces. var psMask = constants.psMask; // ## selTokensOut /** * Out for selection of tokens. Note: the out always returns a Javascript * data type or data structure. * @param {number[]} selTokens Array containing indexes to the selected tokens. * @param {obejct} rdd Raw document data structure. * @param {function} itsf Desired `its` mapper. * @param {function} asf Desired `as` reducer. * @param {object} addons The addons from the model. * @return {*} Reduced value. * @private */ var selTokensOut = function ( selTokens, rdd, itsf, asf, addons ) { // Not a vector request, perform map-reduce. var mappedTkns = []; var itsfn = ( itsf && allowed.its4selTokens.has( itsf ) ) ? itsf : its.value; var asfn = ( asf && allowed.as4selTokens.has( asf ) ) ? asf : as.array; if ( itsfn !== its.value && itsfn !== its.normal && itsfn !== its.lemma && asfn === as.vector ) { throw Error( 'winkNLP: as.vector is allowed only with its value or normal or lemma.' ); } // Note, `as.text` needs special attention to include preceeding spaces. // No `markedUpText` allowed here. if ( asfn === as.text ) { for ( let i = 0; i < selTokens.length; i += 1 ) { mappedTkns.push( reconstructSpaces( selTokens[ i ], rdd ), itsf( selTokens[ i ], rdd, addons ) ); } } else { for ( let i = 0; i < selTokens.length; i += 1 ) { mappedTkns.push( itsfn( selTokens[ i ], rdd, addons ) ); } } return asfn( mappedTkns, rdd ); }; // selTokensOut() module.exports = selTokensOut;