UNPKG

node-nlp

Version:

Library for NLU (Natural Language Understanding) done in Node.js

114 lines (91 loc) 4.03 kB
/* */ var moment = require('moment'); var Parser = require('../parser').Parser; var ParsedResult = require('../../result').ParsedResult; var util = require('../../utils/EN'); var PATTERN = new RegExp('(\\W|^)' + '(next|last|past)\\s*' + '('+ util.INTEGER_WORDS_PATTERN + '|[0-9]+|few|half(?:\\s*an?)?)?\\s*' + '(seconds?|min(?:ute)?s?|hours?|days?|weeks?|months?|years?)(?=\\s*)' + '(?=\\W|$)', 'i' ); var MODIFIER_WORD_GROUP = 2; var MULTIPLIER_WORD_GROUP = 3; var RELATIVE_WORD_GROUP = 4; exports.Parser = function ENRelativeDateFormatParser(){ Parser.apply(this, arguments); this.pattern = function() { return PATTERN; }; this.extract = function(text, ref, match, opt){ var index = match.index + match[1].length; var modifier = match[MODIFIER_WORD_GROUP].toLowerCase().match(/^next/) ? 1 : -1; var text = match[0]; text = match[0].substr(match[1].length, match[0].length - match[1].length); var result = new ParsedResult({ index: index, text: text, ref: ref }); result.tags['ENRelativeDateFormatParser'] = true; var num = match[MULTIPLIER_WORD_GROUP] === undefined ? '' : match[3].toLowerCase(); if (util.INTEGER_WORDS[num] !== undefined) { num = util.INTEGER_WORDS[num]; } else if (num === ''){ num = 1; } else if (num.match(/few/i)){ num = 3; } else if (num.match(/half/i)) { num = 0.5; } else { num = parseInt(num); } num *= modifier; var date = moment(ref); if (match[RELATIVE_WORD_GROUP].match(/day|week|month|year/i)) { if (match[RELATIVE_WORD_GROUP].match(/day/i)) { date.add(num, 'd'); result.start.assign('year', date.year()); result.start.assign('month', date.month() + 1); result.start.assign('day', date.date()); } else if (match[RELATIVE_WORD_GROUP].match(/week/i)) { date.add(num * 7, 'd'); // We don't know the exact date for next/last week so we imply // them result.start.imply('day', date.date()); result.start.imply('month', date.month() + 1); result.start.imply('year', date.year()); } else if (match[RELATIVE_WORD_GROUP].match(/month/i)) { date.add(num, 'month'); // We don't know the exact day for next/last month result.start.imply('day', date.date()); result.start.assign('year', date.year()); result.start.assign('month', date.month() + 1); } else if (match[RELATIVE_WORD_GROUP].match(/year/i)) { date.add(num, 'year'); // We don't know the exact day for month on next/last year result.start.imply('day', date.date()); result.start.imply('month', date.month() + 1); result.start.assign('year', date.year()); } return result; } if (match[RELATIVE_WORD_GROUP].match(/hour/i)) { date.add(num, 'hour'); result.start.imply('minute', date.minute()); result.start.imply('second', date.second()); } else if (match[RELATIVE_WORD_GROUP].match(/min/i)) { date.add(num, 'minute'); result.start.assign('minute', date.minute()); result.start.imply('second', date.second()); } else if (match[RELATIVE_WORD_GROUP].match(/second/i)) { date.add(num, 'second'); result.start.assign('second', date.second()); result.start.assign('minute', date.minute()); } result.start.assign('hour', date.hour()); result.start.assign('year', date.year()); result.start.assign('month', date.month() + 1); result.start.assign('day', date.date()); return result; }; };