wink-nlp
Version:
Developer friendly Natural Language Processing ✨
81 lines (73 loc) • 3.17 kB
JavaScript
// wink-nlp
//
// Copyright (C) GRAYPE Systems Private Limited
//
// This file is part of “wink-nlp”.
//
// Permission is hereby granted, free of charge, to any
// person obtaining a copy of this software and
// associated documentation files (the "Software"), to
// deal in the Software without restriction, including
// without limitation the rights to use, copy, modify,
// merge, publish, distribute, sublicense, and/or sell
// copies of the Software, and to permit persons to
// whom the Software is furnished to do so, subject to
// the following conditions:
//
// The above copyright notice and this permission notice
// shall be included in all copies or substantial
// portions of the Software.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF
// ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED
// TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A
// PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
// THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM,
// DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF
// CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
// CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
// DEALINGS IN THE SOFTWARE.
//
var its = require( '../its.js' );
var as = require( '../as.js' );
var allowed = require( '../allowed.js' );
var reconstructSpaces = require( '../reconstruct-spaces.js' );
var constants = require( '../constants.js' );
// Size of a single token.
var tkSize = constants.tkSize;
// Mask for preceding spaces.
var psMask = constants.psMask;
// ## selTokensOut
/**
* Out for selection of tokens. Note: the out always returns a Javascript
* data type or data structure.
* @param {number[]} selTokens Array containing indexes to the selected tokens.
* @param {obejct} rdd Raw document data structure.
* @param {function} itsf Desired `its` mapper.
* @param {function} asf Desired `as` reducer.
* @param {object} addons The addons from the model.
* @return {*} Reduced value.
* @private
*/
var selTokensOut = function ( selTokens, rdd, itsf, asf, addons ) {
// Not a vector request, perform map-reduce.
var mappedTkns = [];
var itsfn = ( itsf && allowed.its4selTokens.has( itsf ) ) ? itsf : its.value;
var asfn = ( asf && allowed.as4selTokens.has( asf ) ) ? asf : as.array;
if ( itsfn !== its.value && itsfn !== its.normal && itsfn !== its.lemma && asfn === as.vector ) {
throw Error( 'winkNLP: as.vector is allowed only with its value or normal or lemma.' );
}
// Note, `as.text` needs special attention to include preceeding spaces.
// No `markedUpText` allowed here.
if ( asfn === as.text ) {
for ( let i = 0; i < selTokens.length; i += 1 ) {
mappedTkns.push( reconstructSpaces( selTokens[ i ], rdd ), itsf( selTokens[ i ], rdd, addons ) );
}
} else {
for ( let i = 0; i < selTokens.length; i += 1 ) {
mappedTkns.push( itsfn( selTokens[ i ], rdd, addons ) );
}
}
return asfn( mappedTkns, rdd );
}; // selTokensOut()
module.exports = selTokensOut;