node-nlp
Version:
Library for NLU (Natural Language Understanding) done in Node.js
127 lines (117 loc) • 3.83 kB
JavaScript
/*
* Copyright (c) AXA Shared Services Spain S.A.
*
* Permission is hereby granted, free of charge, to any person obtaining
* a copy of this software and associated documentation files (the
* "Software"), to deal in the Software without restriction, including
* without limitation the rights to use, copy, modify, merge, publish,
* distribute, sublicense, and/or sell copies of the Software, and to
* permit persons to whom the Software is furnished to do so, subject to
* the following conditions:
*
* The above copyright notice and this permission notice shall be
* included in all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
* NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
* LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
* OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
* WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
*/
const NamedEntity = require('./named-entity');
/**
* Class for the Regular Expression Named Entity.
*/
class RegexNamedEntity extends NamedEntity {
  /**
   * Constructor of the class.
   * @param {Object} settings Settings for the instance, forwarded to the
   * base class constructor.
   */
  constructor(settings) {
    super(settings);
    this.type = 'regex';
  }

  /**
   * Assign a regular expression for the given languages.
   * The same RegExp instance is stored on the locale object of every language.
   * @param {String|String[]} srcLanguages Target language or languages.
   * @param {RegExp} regex Regular expression.
   */
  addRegex(srcLanguages, regex) {
    const languages = Array.isArray(srcLanguages)
      ? srcLanguages
      : [srcLanguages];
    languages.forEach(language => {
      const locale = this.getLocale(language);
      locale.regex = regex;
    });
  }

  /**
   * Adds a regular expression from a string.
   * @param {String|String[]} srcLanguages Target language or languages.
   * @param {String} regex Regular expression as string, in the
   * `/pattern/flags` form accepted by str2regex.
   */
  addStrRegex(srcLanguages, regex) {
    this.addRegex(srcLanguages, RegexNamedEntity.str2regex(regex));
  }

  /**
   * Get the matches of the regular expression over the utterance.
   *
   * A regex with the global or sticky flag is scanned from the beginning of
   * the utterance and yields one edge per match; a regex without those flags
   * yields at most one edge (its first match). Zero-length matches carry no
   * entity text, so they are skipped instead of being reported.
   *
   * @param {String} utterance Input utterance.
   * @param {RegExp} regex Regular expression.
   * @returns {Object[]} Edges found.
   */
  getMatchs(utterance, regex) {
    const result = [];
    if (!regex) {
      return result;
    }
    const input = String(utterance);
    // exec() only honours lastIndex for global/sticky regexes; for any other
    // regex a loop would return the very same match forever.
    const iterates = regex.global || regex.sticky;
    if (iterates) {
      // The regex instance is shared between calls, so discard any stale
      // position left behind by a previous user.
      regex.lastIndex = 0;
    }
    let match = regex.exec(input);
    while (match) {
      const text = match[0];
      if (text.length > 0) {
        result.push({
          start: match.index,
          end: match.index + text.length,
          accuracy: 1,
          sourceText: text,
          utteranceText: text,
          entity: this.name,
        });
      } else if (iterates) {
        // An empty match does not move lastIndex; step over one character
        // (a whole surrogate pair in unicode mode) to guarantee progress.
        const isAstral =
          regex.unicode && input.codePointAt(match.index) > 0xffff;
        regex.lastIndex = match.index + (isAstral ? 2 : 1);
      }
      match = iterates ? regex.exec(input) : null;
    }
    return result;
  }

  /**
   * Extract edges of an utterance.
   * @param {String} utterance Input utterance.
   * @param {String} language Language of the utterance.
   * @returns {Object[]} Edges extracted; empty when the language has no
   * locale rules or no regular expression assigned.
   */
  extract(utterance, language) {
    const locale = this.getLocaleRules(language);
    if (!locale || !locale.regex) {
      return [];
    }
    return this.getMatchs(utterance, locale.regex);
  }

  /**
   * Transforms a string to a regular expression.
   * The string is expected in the `/pattern/flags` form produced by
   * regex2str: everything between the first character and the last slash is
   * the pattern, everything after the last slash is the flags. Other shapes
   * are not validated.
   * @param {String} str String to be converted.
   * @returns {RegExp} Regular expression.
   */
  static str2regex(str) {
    const index = str.lastIndexOf('/');
    return new RegExp(str.slice(1, index), str.slice(index + 1));
  }

  /**
   * Transforms a regular expression to a string.
   * @param {RegExp} regex Regular expression.
   * @returns {String} String representing the regular expression.
   */
  static regex2str(regex) {
    return regex.toString();
  }
}
module.exports = RegexNamedEntity;