UNPKG

antlr4ts

Version:

ANTLR 4 runtime for JavaScript, written in TypeScript

github.com/tunnelvisionlabs/antlr4ts

tunnelvisionlabs/antlr4ts

489 lines • 17.6 kB

JavaScript

"use strict";
/*!
 * Copyright 2016 The ANTLR Project. All rights reserved.
 * Licensed under the BSD-3-Clause license. See LICENSE file in the project root for license information.
 */
// Applies `decorators` from last to first, either to a class (fewer than three
// arguments) or to a member of `target`; defers to `Reflect.decorate` when it exists.
var __decorate = (this && this.__decorate) || function (decorators, target, key, desc) {
    var c = arguments.length, r = c < 3 ? target : desc === null ? desc = Object.getOwnPropertyDescriptor(target, key) : desc, d;
    if (typeof Reflect === "object" && typeof Reflect.decorate === "function") r = Reflect.decorate(decorators, target, key, desc);
    else for (var i = decorators.length - 1; i >= 0; i--) if (d = decorators[i]) r = (c < 3 ? d(r) : c > 3 ? d(target, key, r) : d(target, key)) || r;
    return c > 3 && r && Object.defineProperty(target, key, r), r;
};
// Wraps a parameter decorator so that it receives the parameter position as its third argument.
var __param = (this && this.__param) || function (paramIndex, decorator) {
    return function (target, key) { decorator(target, key, paramIndex); }
};
Object.defineProperty(exports, "__esModule", { value: true });
exports.BufferedTokenStream = void 0;
// ConvertTo-TS run at 2016-10-04T11:26:49.6074365-07:00
const assert = require("assert");
const CommonToken_1 = require("./CommonToken");
const Interval_1 = require("./misc/Interval");
const Lexer_1 = require("./Lexer");
const Decorators_1 = require("./Decorators");
const Token_1 = require("./Token");
/**
 * A {@link TokenStream} that pulls tokens from a {@link TokenSource} only when
 * they are needed and keeps every fetched token in a buffer, so that any
 * earlier token can be retrieved by index.
 *
 * The value of {@link Token#getChannel} is ignored by this stream. If the
 * parser needs to see only the tokens of one channel, such as
 * {@link Token#DEFAULT_CHANNEL} or {@link Token#HIDDEN_CHANNEL}, use a
 * filtering token stream such as {@link CommonTokenStream}.
 */
let BufferedTokenStream = class BufferedTokenStream {
    /**
     * @param tokenSource The source tokens are fetched from.
     * @throws Error if `tokenSource` is `null` or `undefined`.
     */
    constructor(tokenSource) {
        /**
         * Every token fetched from the token source so far. Once
         * {@link #fetchedEOF} is `true` this list is a complete view of the
         * input.
         */
        this.tokens = [];
        /**
         * Index into {@link #tokens} of the current token, i.e. the next token
         * to {@link #consume}. {@link #tokens}`[`{@link #p}`]` should be
         * {@link #LT LT(1)}.
         *
         * The value is -1 right after construction and after
         * {@link #setTokenSource} is called, meaning that the first token has
         * not been fetched yet. See the description of Initializing Methods in
         * the documentation of {@link IntStream} for more information.
         */
        this.p = -1;
        /**
         * Whether the {@link Token#EOF} token has already been fetched from
         * {@link #tokenSource} and appended to {@link #tokens}. Keeping this
         * flag speeds up two cases:
         *
         * * {@link #consume}: the check that prevents consuming EOF can look at
         *   {@link #fetchedEOF} and {@link #p} instead of calling {@link #LA}.
         * * {@link #fetch}: avoiding a second EOF token in {@link #tokens}
         *   becomes a trivial test.
         */
        this.fetchedEOF = false;
        if (tokenSource == null) {
            throw new Error("tokenSource cannot be null");
        }
        this._tokenSource = tokenSource;
    }
    /** The token source this stream reads from. */
    get tokenSource() {
        return this._tokenSource;
    }
    /** Replaces the token source and resets the stream: buffer emptied, position and EOF flag cleared. */
    set tokenSource(tokenSource) {
        this._tokenSource = tokenSource;
        this.tokens.length = 0;
        this.p = -1;
        this.fetchedEOF = false;
    }
    /** Index of the current token (the raw value of {@link #p}). */
    get index() {
        return this.p;
    }
    /** Marks need no bookkeeping in this stream; the returned marker is always 0. */
    mark() {
        return 0;
    }
    /** Counterpart of {@link #mark}; does nothing. */
    release(marker) {
        // no resources to release
    }
    /** Moves the current position to `index`, after passing it through {@link #adjustSeekIndex}. */
    seek(index) {
        this.lazyInit();
        this.p = this.adjustSeekIndex(index);
    }
    /** Number of tokens currently held in the buffer. */
    get size() {
        return this.tokens.length;
    }
    /**
     * Advances the stream by one token.
     *
     * @throws Error if the current token is EOF.
     */
    consume() {
        // The LA(1) lookup can be skipped when p is known to index a buffered,
        // non-EOF token. Before initialization (p < 0) the check always runs.
        let skipEofCheck = false;
        if (this.p >= 0) {
            // With EOF buffered, the last slot holds EOF and must be excluded;
            // without it, every buffered slot is a regular token.
            const limit = this.fetchedEOF ? this.tokens.length - 1 : this.tokens.length;
            skipEofCheck = this.p < limit;
        }
        if (!skipEofCheck && this.LA(1) === Token_1.Token.EOF) {
            throw new Error("cannot consume EOF");
        }
        if (this.sync(this.p + 1)) {
            this.p = this.adjustSeekIndex(this.p + 1);
        }
    }
    /**
     * Ensures the buffer holds a token at index `i`, fetching more if needed.
     *
     * @returns `true` if a token is located at index `i`, otherwise
     * `false`.
     * @see #get(int i)
     */
    sync(i) {
        assert(i >= 0);
        // Number of tokens still missing before index i is covered.
        const missing = i - this.tokens.length + 1;
        if (missing <= 0) {
            return true;
        }
        return this.fetch(missing) >= missing;
    }
    /**
     * Appends up to `n` tokens from the token source to the buffer, stopping
     * early once EOF has been added.
     *
     * @returns The actual number of elements added to the buffer.
     */
    fetch(n) {
        if (this.fetchedEOF) {
            return 0;
        }
        for (let added = 0; added < n; added++) {
            const token = this.tokenSource.nextToken();
            if (this.isWritableToken(token)) {
                token.tokenIndex = this.tokens.length;
            }
            this.tokens.push(token);
            if (token.type === Token_1.Token.EOF) {
                this.fetchedEOF = true;
                return added + 1;
            }
        }
        return n;
    }
    /**
     * Returns the buffered token at index `i`.
     *
     * @throws RangeError if `i` is outside the buffered range.
     */
    get(i) {
        if (i < 0 || i >= this.tokens.length) {
            throw new RangeError(`token index ${i} out of range 0..${this.tokens.length - 1}`);
        }
        return this.tokens[i];
    }
    /**
     * Returns the buffered tokens from `start` to `stop` inclusive, ending
     * before the EOF token if it lies in that range. A negative bound yields
     * an empty array.
     */
    getRange(start, stop) {
        if (start < 0 || stop < 0) {
            return [];
        }
        this.lazyInit();
        const collected = [];
        const last = stop >= this.tokens.length ? this.tokens.length - 1 : stop;
        for (let index = start; index <= last; index++) {
            const token = this.tokens[index];
            if (token.type === Token_1.Token.EOF) {
                break;
            }
            collected.push(token);
        }
        return collected;
    }
    /** Type of the token {@link #LT} returns for `i`, or `Token.INVALID_TYPE` if there is none. */
    LA(i) {
        const token = this.LT(i);
        return token ? token.type : Token_1.Token.INVALID_TYPE;
    }
    /** Token `k` positions before the current one, or `undefined` if that would precede index 0. */
    tryLB(k) {
        const index = this.p - k;
        return index < 0 ? undefined : this.tokens[index];
    }
    /**
     * Same as {@link #tryLT}, but a missing token is an error.
     *
     * @throws RangeError if {@link #tryLT} returns `undefined`.
     */
    LT(k) {
        const token = this.tryLT(k);
        if (token === undefined) {
            throw new RangeError("requested lookback index out of range");
        }
        return token;
    }
    /**
     * Looks `k` tokens ahead (`k > 0`) or behind (`k < 0`) of the current
     * position.
     *
     * @throws RangeError if `k` is 0.
     */
    tryLT(k) {
        this.lazyInit();
        if (k === 0) {
            throw new RangeError("0 is not a valid lookahead index");
        }
        if (k < 0) {
            return this.tryLB(-k);
        }
        const index = this.p + k - 1;
        this.sync(index);
        // Beyond the buffer: answer with the last buffered token, which must be EOF.
        // if ( i>range ) range = i;
        return index >= this.tokens.length
            ? this.tokens[this.tokens.length - 1]
            : this.tokens[index];
    }
    /**
     * Allows derived classes to modify the behavior of operations which change
     * the current stream position, by adjusting the target index of a seek.
     * This default implementation returns `i` unchanged. If this method
     * throws, the current stream index should not be changed.
     *
     * For example, {@link CommonTokenStream} overrides this method to ensure that
     * the seek target is always an on-channel token.
     *
     * @param i The target token index.
     * @returns The adjusted target token index.
     */
    adjustSeekIndex(i) {
        return i;
    }
    /** Runs {@link #setup} while the stream is still uninitialized (`p === -1`). */
    lazyInit() {
        if (this.p === -1) {
            this.setup();
        }
    }
    /** Buffers the first token and places the position at the adjusted index 0. */
    setup() {
        this.sync(0);
        this.p = this.adjustSeekIndex(0);
    }
    /**
     * Returns buffered tokens between `start` and `stop` (inclusive),
     * optionally restricted to the given token type(s). On- and off-channel
     * tokens are treated alike. With no arguments the internal token array
     * itself is returned; an omitted `stop` means the last buffered token.
     *
     * @param types A single token type or a set of token types to keep.
     * @throws RangeError if `start` or `stop` is outside the buffered range.
     */
    getTokens(start, stop, types) {
        this.lazyInit();
        if (start === undefined) {
            assert(stop === undefined && types === undefined);
            return this.tokens;
        }
        const last = stop === undefined ? this.tokens.length - 1 : stop;
        if (start < 0 || last >= this.tokens.length || last < 0 || start >= this.tokens.length) {
            throw new RangeError(`start ${start} or stop ${last} not in 0..${this.tokens.length - 1}`);
        }
        if (start > last) {
            return [];
        }
        const range = this.tokens.slice(start, last + 1);
        if (types === undefined) {
            return range;
        }
        // list = tokens[start:stop]:{T t, t.type in types}
        const typesSet = typeof types === "number" ? new Set().add(types) : types;
        return range.filter((token) => typesSet.has(token.type));
    }
    /**
     * Starting at index `i`, finds the index of the next token on `channel`.
     * Returns `i` itself if `tokens[i]` is on that channel, and the index of
     * the EOF token if no token between `i` and EOF is on it.
     */
    nextTokenOnChannel(i, channel) {
        this.sync(i);
        if (i >= this.size) {
            return this.size - 1;
        }
        let index = i;
        let token = this.tokens[index];
        // Stop on the first on-channel token, or on EOF, whichever comes first.
        while (token.channel !== channel && token.type !== Token_1.Token.EOF) {
            index++;
            this.sync(index);
            token = this.tokens[index];
        }
        return index;
    }
    /**
     * Starting at index `i` and moving backwards, finds the index of the
     * previous token on `channel`. Returns `i` itself if `tokens[i]` is on
     * that channel, and -1 if no token between `i` and 0 is on it.
     *
     * If `i` is at or after the EOF token, the EOF token index is returned,
     * because EOF is treated as though it were on every channel.
     */
    previousTokenOnChannel(i, channel) {
        this.sync(i);
        if (i >= this.size) {
            // the EOF token is on every channel
            return this.size - 1;
        }
        let index = i;
        for (; index >= 0; index--) {
            const token = this.tokens[index];
            if (token.type === Token_1.Token.EOF || token.channel === channel) {
                return index;
            }
        }
        return index;
    }
    /**
     * Collects the tokens on `channel` that follow `tokenIndex`, up to the
     * next token on {@link Lexer#DEFAULT_TOKEN_CHANNEL} or EOF. With
     * `channel` equal to `-1`, every token not on the default channel is
     * collected.
     *
     * @throws RangeError if `tokenIndex` is outside the buffered range.
     */
    getHiddenTokensToRight(tokenIndex, channel = -1) {
        this.lazyInit();
        if (tokenIndex < 0 || tokenIndex >= this.tokens.length) {
            throw new RangeError(`${tokenIndex} not in 0..${this.tokens.length - 1}`);
        }
        const from = tokenIndex + 1;
        const nextOnChannel = this.nextTokenOnChannel(from, Lexer_1.Lexer.DEFAULT_TOKEN_CHANNEL);
        // if none onchannel to right, nextOnChannel=-1 so set to = last token
        const to = nextOnChannel === -1 ? this.size - 1 : nextOnChannel;
        return this.filterForChannel(from, to, channel);
    }
    /**
     * Collects the tokens on `channel` that precede `tokenIndex`, back to the
     * previous token on {@link Lexer#DEFAULT_TOKEN_CHANNEL}. With `channel`
     * equal to `-1`, every token not on the default channel is collected.
     *
     * @throws RangeError if `tokenIndex` is outside the buffered range.
     */
    getHiddenTokensToLeft(tokenIndex, channel = -1) {
        this.lazyInit();
        if (tokenIndex < 0 || tokenIndex >= this.tokens.length) {
            throw new RangeError(`${tokenIndex} not in 0..${this.tokens.length - 1}`);
        }
        if (tokenIndex === 0) {
            // obviously no tokens can appear before the first token
            return [];
        }
        const to = tokenIndex - 1;
        const prevOnChannel = this.previousTokenOnChannel(to, Lexer_1.Lexer.DEFAULT_TOKEN_CHANNEL);
        if (prevOnChannel === to) {
            return [];
        }
        // if none onchannel to left, prevOnChannel=-1 then from=0
        return this.filterForChannel(prevOnChannel + 1, to, channel);
    }
    /**
     * Returns the buffered tokens in `from..to` (inclusive) that are on
     * `channel`, or, when `channel` is `-1`, those that are not on
     * {@link Lexer#DEFAULT_TOKEN_CHANNEL}.
     */
    filterForChannel(from, to, channel) {
        const hidden = [];
        for (let index = from; index <= to; index++) {
            const token = this.tokens[index];
            const matches = channel === -1
                ? token.channel !== Lexer_1.Lexer.DEFAULT_TOKEN_CHANNEL
                : token.channel === channel;
            if (matches) {
                hidden.push(token);
            }
        }
        return hidden;
    }
    /** Source name reported by the underlying token source. */
    get sourceName() {
        return this.tokenSource.sourceName;
    }
    /**
     * Concatenates the text of the tokens in `interval`, stopping before EOF.
     * The whole token source is read first. Without an argument the entire
     * buffer is used; an argument that is not an `Interval` contributes its
     * `sourceInterval` property instead.
     *
     * @returns The combined text, or `""` if either bound is negative.
     */
    getText(interval) {
        let range;
        if (interval === undefined) {
            range = Interval_1.Interval.of(0, this.size - 1);
        }
        else if (interval instanceof Interval_1.Interval) {
            range = interval;
        }
        else {
            // Note: the more obvious check for 'instanceof RuleContext' results in a circular dependency problem
            range = interval.sourceInterval;
        }
        const start = range.a;
        const stop = range.b;
        if (start < 0 || stop < 0) {
            return "";
        }
        this.fill();
        const last = stop >= this.tokens.length ? this.tokens.length - 1 : stop;
        let text = "";
        for (let index = start; index <= last; index++) {
            const token = this.tokens[index];
            if (token.type === Token_1.Token.EOF) {
                break;
            }
            text += token.text;
        }
        return text;
    }
    /**
     * Text of the tokens between `start` and `stop` (by their `tokenIndex`),
     * or `""` unless both arguments pass {@link #isToken}.
     */
    getTextFromRange(start, stop) {
        if (!this.isToken(start) || !this.isToken(stop)) {
            return "";
        }
        return this.getText(Interval_1.Interval.of(start.tokenIndex, stop.tokenIndex));
    }
    /** Get all tokens from lexer until EOF. */
    fill() {
        this.lazyInit();
        const blockSize = 1000;
        // A short block means the source ran out (EOF was reached).
        while (this.fetch(blockSize) >= blockSize) {
            // keep fetching
        }
    }
    // TODO: Figure out a way to make this more flexible?
    /** Whether `t` is a `CommonToken`, the only kind whose `tokenIndex` {@link #fetch} assigns. */
    isWritableToken(t) {
        return t instanceof CommonToken_1.CommonToken;
    }
    // TODO: Figure out a way to make this more flexible?
    /** Whether `t` is a `CommonToken`. */
    isToken(t) {
        return t instanceof CommonToken_1.CommonToken;
    }
};
__decorate([
    Decorators_1.NotNull
], BufferedTokenStream.prototype, "_tokenSource", void 0);
__decorate([
    Decorators_1.Override
], BufferedTokenStream.prototype, "tokenSource", null);
__decorate([
    Decorators_1.Override
], BufferedTokenStream.prototype, "index", null);
__decorate([
    Decorators_1.Override
], BufferedTokenStream.prototype, "mark", null);
__decorate([
    Decorators_1.Override
], BufferedTokenStream.prototype, "release", null);
__decorate([
    Decorators_1.Override
], BufferedTokenStream.prototype, "seek", null);
__decorate([
    Decorators_1.Override
], BufferedTokenStream.prototype, "size", null);
__decorate([
    Decorators_1.Override
], BufferedTokenStream.prototype, "consume", null);
__decorate([
    Decorators_1.Override
], BufferedTokenStream.prototype, "get", null);
__decorate([
    Decorators_1.Override
], BufferedTokenStream.prototype, "LA", null);
__decorate([
    Decorators_1.NotNull,
    Decorators_1.Override
], BufferedTokenStream.prototype, "LT", null);
__decorate([
    Decorators_1.Override
], BufferedTokenStream.prototype, "sourceName", null);
__decorate([
    Decorators_1.NotNull,
    Decorators_1.Override
], BufferedTokenStream.prototype, "getText", null);
__decorate([
    Decorators_1.NotNull,
    Decorators_1.Override
], BufferedTokenStream.prototype, "getTextFromRange", null);
BufferedTokenStream = __decorate([
    __param(0, Decorators_1.NotNull)
], BufferedTokenStream);
exports.BufferedTokenStream = BufferedTokenStream;
//# sourceMappingURL=BufferedTokenStream.js.map