UNPKG

textlint-rule-terminology

Version:

TextLint rule to check correct terms spelling

github.com/sapegin/textlint-rule-terminology

sapegin/textlint-rule-terminology

141 lines • 5.97 kB

JavaScript

import fs from 'node:fs';
import { createRequire } from 'node:module';
import stripJsonComments from 'strip-json-comments';
import { RuleHelper } from 'textlint-rule-helper';
import upperFirst from 'lodash/upperFirst.js';

/** Option values used for any key the user does not supply. */
const DEFAULT_OPTIONS = {
  terms: [],
  skip: ['BlockQuote'],
  defaultTerms: true,
  exclude: [],
};

// Text that ends with "<word><!, . or ?>", an optional ")" and one space:
// whatever follows it is treated as the start of a new sentence.
const sentenceStartRegExp = /\w+[!.?]\)? $/;

// Character class (as regexp source) of punctuation allowed right after a term.
const punctuation = String.raw`[\.,;:!?'"’”)]`;

/**
 * Escape regexp metacharacters so that `text` is matched literally when it is
 * embedded into a larger regexp source.
 *
 * @param {string} text
 * @returns {string}
 */
function escapeRegExp(text) {
  return text.replace(/[.*+?^${}()|[\]\\]/g, '\\$&');
}

/**
 * Create the textlint handlers that report (and offer fixes for) incorrectly
 * spelled terms in `Str` nodes.
 *
 * @param {object} context - Rule context; `Syntax`, `RuleError`, `report`,
 *   `fixer` and `getSource` are read from it.
 * @param {object} [userOptions] - Overrides for `DEFAULT_OPTIONS`.
 * @returns {object} Map of node type to handler.
 */
function reporter(context, userOptions = {}) {
  const options = { ...DEFAULT_OPTIONS, ...userOptions };
  const terms = getTerms(options.defaultTerms, options.terms, options.exclude);

  // All plain-string terms are matched with a single combined regexp. With no
  // plain words the combined regexp could never match, so it is not created.
  const words = terms.filter((rule) => typeof rule === 'string');
  const exactWordRules =
    words.length > 0 ? [[getMultipleWordRegExp(words), words]] : [];

  // Every array term ([pattern, replacement]) gets a regexp of its own
  const advancedRules = terms.filter((rule) => typeof rule !== 'string');

  // Compile each rule once here instead of once per visited node
  const compiledRules = [...exactWordRules, ...advancedRules].map(
    ([pattern, replacements]) => ({
      pattern,
      replacements,
      regExp: new RegExp(
        typeof pattern === 'string' ? getAdvancedRegExp(pattern) : pattern,
        'igm',
      ),
    }),
  );

  const helper = new RuleHelper(context);
  const { Syntax, RuleError, report, fixer, getSource } = context;
  const skippedTypes = options.skip.map((rule) => Syntax[rule]);

  /** Report every incorrect term found in the source text of `node`. */
  const checkNode = (node) => {
    if (helper.isChildNode(node, skippedTypes)) {
      return;
    }

    const text = getSource(node);
    for (const { pattern, replacements, regExp } of compiledRules) {
      // The regexps are global and shared between nodes: always scan from 0
      regExp.lastIndex = 0;

      let match;
      while ((match = regExp.exec(text)) !== null) {
        const { index } = match;
        const [matched] = match;

        // exec() does not move lastIndex past a zero-length match, so without
        // this step a look-around-only pattern would loop forever
        if (matched.length === 0) {
          regExp.lastIndex += 1;
          continue;
        }

        let replacement = getReplacement(pattern, replacements, matched);
        if (replacement === undefined) {
          throw new Error('No replacement found');
        }

        // Capitalize word in the beginning of a sentence if the original
        // word was capitalized
        const isSentenceStart =
          index === 0 || sentenceStartRegExp.test(text.slice(0, index));
        if (isSentenceStart && upperFirst(matched) === matched) {
          replacement = upperFirst(replacement);
        }

        // Skip correct spelling
        if (matched === replacement) {
          continue;
        }

        const fix = fixer.replaceTextRange(
          [index, index + matched.length],
          replacement,
        );
        const message = `Incorrect term: “${matched.trim()}”, use “${replacement.trim()}” instead`;
        report(node, new RuleError(message, { index, fix }));
      }
    }
  };

  return {
    [Syntax.Str](node) {
      // The work is synchronous; running it inside the executor keeps the
      // handler's contract of returning a promise that rejects on errors
      return new Promise((resolve) => {
        checkNode(node);
        resolve();
      });
    },
  };
}

/**
 * Build the list of terms to check.
 *
 * @param {boolean} defaultTerms - Whether to include the bundled
 *   `../terms.jsonc` list.
 * @param {Array|string} terms - Extra terms, or a module path of a JSON(C)
 *   file to load them from.
 * @param {Array} exclude - Terms to drop: plain words, or the pattern (first
 *   item) of array terms. Ignored when it is not an array.
 * @returns {Array} User terms first, then defaults, minus excluded ones.
 */
export function getTerms(defaultTerms, terms, exclude) {
  const defaults = defaultTerms ? loadJson('../terms.jsonc') : [];
  const extras = typeof terms === 'string' ? loadJson(terms) : terms;

  // Order matters, the first term to match is used. We prioritize user
  // 'extras' before defaults
  const listTerms = [...(Array.isArray(extras) ? extras : []), ...defaults];

  if (!Array.isArray(exclude)) {
    return listTerms;
  }

  // Array terms are identified by their pattern, plain terms by themselves
  return listTerms.filter(
    (term) => !exclude.includes(Array.isArray(term) ? term[0] : term),
  );
}

/**
 * Read and parse a JSON file that may contain comments.
 *
 * @param {string} modulePath - Path resolved with `require.resolve` created
 *   for this module's URL.
 * @returns {*} Parsed content of the file.
 */
function loadJson(modulePath) {
  const require = createRequire(import.meta.url);
  const resolvedModule = require.resolve(modulePath);
  const json = fs.readFileSync(resolvedModule, 'utf8');
  return JSON.parse(stripJsonComments(json));
}

/**
 * Match exact word in the middle of the text
 *
 * @param {string} pattern - Regexp source to wrap.
 * @returns {string} Regexp source.
 */
export function getExactMatchRegExp(pattern) {
  // 1. Beginning of the string, or any character that isn't "-"
  //    or alphanumeric
  // 2. Not a dot "." (to make it ignore file extensions)
  // 3. Word boundary
  // 4. Exact match of the pattern
  // 5. Word boundary
  // 6. Space, punctuation + space, punctuation + punctuation,
  //    or punctuation at the end of the string, end of the string
  return `(?<=^|[^-\\w])(?<!\\.)\\b${pattern}\\b(?= |${punctuation} |${punctuation}${punctuation}|${punctuation}$|$)`;
}

/**
 * Match any of given words exactly in the middle of the text
 *
 * Words are literal terms, not patterns, so regexp metacharacters in them are
 * escaped: otherwise a term such as "Node.js" would also match "nodexjs" (for
 * which no replacement can be found) and "C++" would be an invalid regexp.
 *
 * @param {string[]} words
 * @returns {string} Regexp source.
 */
export function getMultipleWordRegExp(words) {
  const alternatives = words.map((word) => escapeRegExp(word)).join('|');
  return getExactMatchRegExp(`(?:${alternatives})`);
}

/**
 * Match pattern on word boundaries in the middle of the text unless the pattern
 * has look behinds or look aheads
 *
 * @param {string} pattern - Regexp source.
 * @returns {string} Regexp source.
 */
export function getAdvancedRegExp(pattern) {
  const hasLookAround =
    // Look behind: (?<=...) and (?<!...)
    pattern.startsWith('(?<') ||
    // Positive look ahead: (?=...)
    pattern.includes('(?=') ||
    // Negative look ahead: (?!...)
    pattern.includes('(?!');

  return hasLookAround ? pattern : getExactMatchRegExp(pattern);
}

/**
 * Find the correct spelling for a matched piece of text.
 *
 * @param {string|RegExp} pattern - Pattern of the rule that matched.
 * @param {string|string[]} replacements - A list of correct words to look the
 *   match up in, or a replacement string applied through `pattern`.
 * @param {string} matched - The matched text.
 * @returns {string|undefined} The replacement; `undefined` when a word list
 *   has no entry for `matched`.
 */
export function getReplacement(pattern, replacements, matched) {
  if (Array.isArray(replacements)) {
    return findWord(replacements, matched);
  }

  // Surround the match with a dummy word and spaces before applying the
  // pattern, then cut the padding off again
  const tag = 'xyz';
  return `${tag} ${matched} ${tag}`
    .replace(new RegExp(pattern, 'i'), replacements)
    .slice(tag.length + 1, -(tag.length + 1));
}

/**
 * Find the item equal to `match`, ignoring case.
 *
 * @param {string[]} items
 * @param {string} match
 * @returns {string|undefined} The first such item, if any.
 */
export function findWord(items, match) {
  const lowerCaseMatch = match.toLowerCase();
  return items.find((word) => word.toLowerCase() === lowerCaseMatch);
}

// The same reporter serves both linting and fixing
const rule = {
  linter: reporter,
  fixer: reporter,
};

export default rule;
//# sourceMappingURL=index.js.map