compromise
Version:
modest natural language processing
103 lines (91 loc) • 2.09 kB
JavaScript
const prp = ['Possessive', 'Pronoun']
//words that can't be compressed, for whatever reason
let misc = {
// numbers
'20th century fox': 'Organization',
'7 eleven': 'Organization',
'motel 6': 'Organization',
g8: 'Organization',
vh1: 'Organization',
'76ers': 'SportsTeam',
'49ers': 'SportsTeam',
q1: 'Date',
q2: 'Date',
q3: 'Date',
q4: 'Date',
km2: 'Unit',
m2: 'Unit',
dm2: 'Unit',
cm2: 'Unit',
mm2: 'Unit',
mile2: 'Unit',
in2: 'Unit',
yd2: 'Unit',
ft2: 'Unit',
m3: 'Unit',
dm3: 'Unit',
cm3: 'Unit',
in3: 'Unit',
ft3: 'Unit',
yd3: 'Unit',
// ampersands
'at&t': 'Organization',
'black & decker': 'Organization',
'h & m': 'Organization',
'johnson & johnson': 'Organization',
'procter & gamble': 'Organization',
"ben & jerry's": 'Organization',
'&': 'Conjunction',
//pronouns
i: ['Pronoun', 'Singular'],
he: ['Pronoun', 'Singular'],
she: ['Pronoun', 'Singular'],
it: ['Pronoun', 'Singular'],
they: ['Pronoun', 'Plural'],
we: ['Pronoun', 'Plural'],
was: ['Copula', 'PastTense'],
is: ['Copula', 'PresentTense'],
are: ['Copula', 'PresentTense'],
am: ['Copula', 'PresentTense'],
were: ['Copula', 'PastTense'],
// possessive pronouns
her: prp,
his: prp,
hers: prp,
their: prp,
theirs: prp,
themselves: prp,
your: prp,
our: prp,
ours: prp,
my: prp,
its: prp,
// misc
vs: ['Conjunction', 'Abbreviation'],
if: ['Condition', 'Preposition'],
closer: 'Comparative',
closest: 'Superlative',
much: 'Adverb',
may: 'Modal',
// irregular conjugations with two forms
babysat: 'PastTense',
blew: 'PastTense',
drank: 'PastTense',
drove: 'PastTense',
forgave: 'PastTense',
skiied: 'PastTense',
spilt: 'PastTense',
stung: 'PastTense',
swam: 'PastTense',
swung: 'PastTense',
guaranteed: 'PastTense',
shrunk: 'PastTense',
// support 'near', 'nears', 'nearing'
nears: 'PresentTense',
nearing: 'Gerund',
neared: 'PastTense',
no: ['Negative', 'Expression'],
// '-': 'Preposition', //june - july
// there: 'There'
}
export default misc