chrono-node
Version:
A natural language date parser in Javascript
48 lines (41 loc) • 1.75 kB
text/typescript
import { TIME_UNITS_PATTERN, parseTimeUnits, TIME_UNITS_NO_ABBR_PATTERN } from "../constants";
import { ParsingContext } from "../../../chrono";
import { ParsingComponents } from "../../../results";
import { AbstractParserWithWordBoundaryChecking } from "../../../common/parsers/AbstractParserWithWordBoundary";
const PATTERN_WITH_OPTIONAL_PREFIX = new RegExp(
`(?:(?:within|in|for)\\s*)?` +
`(?:(?:about|around|roughly|approximately|just)\\s*(?:~\\s*)?)?(${TIME_UNITS_PATTERN})(?=\\W|$)`,
"i"
);
const PATTERN_WITH_PREFIX = new RegExp(
`(?:within|in|for)\\s*` +
`(?:(?:about|around|roughly|approximately|just)\\s*(?:~\\s*)?)?(${TIME_UNITS_PATTERN})(?=\\W|$)`,
"i"
);
const PATTERN_WITH_PREFIX_STRICT = new RegExp(
`(?:within|in|for)\\s*` +
`(?:(?:about|around|roughly|approximately|just)\\s*(?:~\\s*)?)?(${TIME_UNITS_NO_ABBR_PATTERN})(?=\\W|$)`,
"i"
);
export default class ENTimeUnitWithinFormatParser extends AbstractParserWithWordBoundaryChecking {
constructor(private strictMode: boolean) {
super();
}
innerPattern(context: ParsingContext): RegExp {
if (this.strictMode) {
return PATTERN_WITH_PREFIX_STRICT;
}
return context.option.forwardDate ? PATTERN_WITH_OPTIONAL_PREFIX : PATTERN_WITH_PREFIX;
}
innerExtract(context: ParsingContext, match: RegExpMatchArray) {
// Exclude "for the unit" phases, e.g. "for the year"
if (match[0].match(/^for\s*the\s*\w+/)) {
return null;
}
const timeUnits = parseTimeUnits(match[1]);
if (!timeUnits) {
return null;
}
return ParsingComponents.createRelativeFromReference(context.reference, timeUnits);
}
}