node-nlp
Version:
Library for NLU (Natural Language Understanding) done in Node.js
65 lines (51 loc) • 2.01 kB
JavaScript
/*
*/
var moment = require('moment');
var Parser = require('../parser').Parser;
var ParsedResult = require('../../result').ParsedResult;
var updateParsedComponent = require('../EN/ENWeekdayParser').updateParsedComponent;
var DAYS_OFFSET = { 'dimanche': 0, 'dim': 0, 'lundi': 1, 'lun': 1,'mardi': 2, 'mar':2, 'mercredi': 3, 'mer': 3,
'jeudi': 4, 'jeu':4, 'vendredi': 5, 'ven': 5,'samedi': 6, 'sam': 6};
var PATTERN = new RegExp('(\\s|^)' +
'(?:(?:\\,|\\(|\\()\\s*)?' +
'(?:(ce)\\s*)?' +
'(' + Object.keys(DAYS_OFFSET).join('|') + ')' +
'(?:\\s*(?:\\,|\\)|\\)))?' +
'(?:\\s*(dernier|prochain)\\s*)?' +
'(?=\\W|$)', 'i');
var PREFIX_GROUP = 2;
var WEEKDAY_GROUP = 3;
var POSTFIX_GROUP = 4;
exports.Parser = function FRWeekdayParser() {
Parser.apply(this, arguments);
this.pattern = function() { return PATTERN; };
this.extract = function(text, ref, match, opt){
var index = match.index + match[1].length;
var text = match[0].substr(match[1].length, match[0].length - match[1].length);
var result = new ParsedResult({
index: index,
text: text,
ref: ref
});
var dayOfWeek = match[WEEKDAY_GROUP].toLowerCase();
var offset = DAYS_OFFSET[dayOfWeek];
if(offset === undefined) return null;
var modifier = null;
var prefix = match[PREFIX_GROUP];
var postfix = match[POSTFIX_GROUP];
if (prefix || postfix) {
var norm = prefix || postfix;
norm = norm.toLowerCase();
if(norm == 'dernier') {
modifier = 'last';
} else if(norm == 'prochain') {
modifier = 'next';
} else if(norm== 'ce') {
modifier = 'this';
}
}
updateParsedComponent(result, ref, offset, modifier);
result.tags['FRWeekdayParser'] = true;
return result;
}
};