UNPKG

ohm-js

Version:

An object-oriented language for parsing and pattern matching

150 lines (129 loc) • 4.41 kB

JavaScript

import * as ohm from 'ohm-js'; export const grammarsSource = String.raw` /* Superset of the Ohm grammar that allows examples to be embedded in comments. Any valid Ohm grammar will also be matched by this grammar. */ // Example: //+ "//+ \"x\"\nG {\n//- \"\"\nstart = \"x\"}" OhmWithExamples <: Ohm { Grammar := ident SuperGrammar? "{" (#exampleComments Rule)* #exampleComments "}" exampleComments = (spacesNoExampleComment exampleComment)* // Examples: //+ "//+ \"blah\"" //+ "//- \"one\", \"two\"" //- "// - \"x\", "//-\"x\" exampleComment = "//+" examples -- positive | "//-" examples -- negative examples = spaceNoNl+ nonemptyListOf<jsonString, exampleSep> spaceNoNl* exampleSep = "," spaces exampleCommentPrefix = "//+" | "//-" spaceNoNl = ~"\n" space spacesNoExampleComment = (~exampleCommentPrefix space)* jsonString = "\"" jsonChar* "\"" jsonChar = jsonEscape | ~"\\" ~"\"" "\u{0020}".."\u{10FFFF}" //+ "\\n", "\\u1234" jsonEscape (a JSON escape sequence) = "\\\"" | "\\\\" | "\\/" | "\\b" | "\\f" | "\\n" | "\\r" | "\\t" | "\\u" hexDigit hexDigit hexDigit hexDigit -- unicodeEscape } /* A stricter version of the grammar that prevents many malformed example comments from being parsed as regular comments. */ OhmWithExamplesStrict <: OhmWithExamples { // Redefine 'comment' to avoid malformed example comments from silently // being parsed as regular comments. comment := | ~exampleCommentPrefix comment_singleLine | comment_multiLine } `; export const grammars = ohm.grammars(grammarsSource, {Ohm: ohm.ohmGrammar}); const semantics = grammars.OhmWithExamples.createSemantics().addOperation('hasExamples', { _iter(...children) { return children.some(c => c.hasExamples()); }, exampleComments(_, commentIter) { return commentIter.numChildren > 0; }, }); semantics.addOperation('examples', { Grammars(grammarIter) { return grammarIter.children.flatMap(c => c.examples()); }, Grammar(name, _, _open, exampleCommentsIter, ruleIter, trailingCommentsIter, _close) { const result = []; const grammar = this.grammarName(); for (let i = 0; i < ruleIter.numChildren; i++) { const rule = ruleIter.child(i).ruleName(); // Augment each of the examples with the grammar and rule name. const examples = exampleCommentsIter.child(i).examples(); const augmentedExamples = examples.map(ex => ({...ex, grammar, rule})); result.push(...augmentedExamples); } if (trailingCommentsIter.hasExamples()) { const defaultExamples = trailingCommentsIter.examples(); result.push(...defaultExamples.map(ex => ({...ex, grammar, rule: ''}))); } return result; }, exampleComments(_, commentIter) { return commentIter.children.flatMap(c => c.examples()); }, exampleComment_positive(_, examples) { return examples.examples().map(ex => ({...ex, shouldMatch: true})); }, exampleComment_negative(_, examples) { return examples.examples().map(ex => ({...ex, shouldMatch: false})); }, examples(_ws, jsonStringList, _) { return jsonStringList.asIteration().children.map(t => { return {example: JSON.parse(t.sourceString)}; }); }, comment_singleLine(_, commentCharIter, _nl) { return []; }, comment_multiLine(_, commentCharIter, _nl) { return []; }, }); semantics.addOperation('grammarName', { Grammar(name, _, _open, exampleCommentsIter, ruleIter, trailingCommentsIter, _close) { return name.sourceString; }, }); semantics.addOperation('ruleName', { Rule_define(ident, _formals, _desc, _, _body) { return ident.sourceString; }, Rule_override(ident, _formals, _, _body) { return ident.sourceString; }, Rule_extend(ident, _formals, _, _body) { return ident.sourceString; }, }); /** @typedef {{grammar: string, rule: string, example: string, shouldMatch: boolean}} Example */ /** * @param {string} grammarsDef - A string containing one or more grammar definitions. * @return {[Example]} */ export function extractExamples(grammarsDef) { const matchResult = grammars.OhmWithExamples.match(grammarsDef); if (matchResult.failed()) { throw new Error(matchResult.message); } return semantics(matchResult).examples(); }