node-nlp
Version:
Library for NLU (Natural Language Understanding) done in Node.js
95 lines (72 loc) • 2.89 kB
JavaScript
/*
The parser for parsing month name and year.
EX.
- Januar
- Januar 2012
*/
var moment = require('moment');
var Parser = require('../parser').Parser;
var ParsedResult = require('../../result').ParsedResult;
var util = require('../../utils/DE');
var PATTERN = new RegExp('(^|\\D\\s+|[^\\w\\s])' +
'(Jan\\.?|Januar|Feb\\.?|Februar|Mär\\.?|M(?:ä|ae)rz|Mrz\\.?|Apr\\.?|April|Mai\\.?|Jun\\.?|Juni|Jul\\.?|Juli|Aug\\.?|August|Sep\\.?|Sept\\.?|September|Okt\\.?|Oktober|Nov\\.?|November|Dez\\.?|Dezember)' +
'\\s*' +
'(?:' +
',?\\s*(?:([0-9]{4})(\\s*[vn]\\.?\\s*C(?:hr)?\\.?)?|([0-9]{1,4})\\s*([vn]\\.?\\s*C(?:hr)?\\.?))' +
')?' +
'(?=[^\\s\\w]|$)', 'i');
var MONTH_NAME_GROUP = 2;
var YEAR_GROUP = 3;
var YEAR_BE_GROUP = 4;
var YEAR_GROUP2 = 5;
var YEAR_BE_GROUP2 = 6;
exports.Parser = function ENMonthNameParser(){
Parser.apply(this, arguments);
this.pattern = function() { return PATTERN; }
this.extract = function(text, ref, match, opt){
var result = new ParsedResult({
text: match[0].substr(match[1].length, match[0].length - match[1].length),
index: match.index + match[1].length,
ref: ref,
});
var month = match[MONTH_NAME_GROUP];
month = util.MONTH_OFFSET[month.toLowerCase()];
var day = 1;
var year = null;
if (match[YEAR_GROUP] || match[YEAR_GROUP2]) {
year = match[YEAR_GROUP] || match[YEAR_GROUP2];
year = parseInt(year);
if (match[YEAR_BE_GROUP] || match[YEAR_BE_GROUP2]) {
if (/v/i.test(match[YEAR_BE_GROUP] || match[YEAR_BE_GROUP2])) {
// v.Chr.
year = -year;
}
} else if (year < 100){
year = year + 2000;
}
}
if(year){
result.start.imply('day', day);
result.start.assign('month', month);
result.start.assign('year', year);
} else {
//Find the most appropriated year
var refMoment = moment(ref);
refMoment.month(month - 1);
refMoment.date(day);
var nextYear = refMoment.clone().add(1, 'y');
var lastYear = refMoment.clone().add(-1, 'y');
if( Math.abs(nextYear.diff(moment(ref))) < Math.abs(refMoment.diff(moment(ref))) ){
refMoment = nextYear;
}
else if( Math.abs(lastYear.diff(moment(ref))) < Math.abs(refMoment.diff(moment(ref))) ){
refMoment = lastYear;
}
result.start.imply('day', day);
result.start.assign('month', month);
result.start.imply('year', refMoment.year());
}
result.tags['DEMonthNameParser'] = true;
return result;
}
}