// antlr4-runtime — JavaScript runtime for ANTLR4
/* Copyright (c) 2012-2022 The ANTLR Project. All rights reserved.
* Use of this file is governed by the BSD 3-clause license that
* can be found in the LICENSE.txt file in the project root.
*/
import Token from './Token.js';
import Lexer from './Lexer.js';
import Interval from './misc/Interval.js';
import TokenStream from "./TokenStream.js";
/**
* This implementation of {@link TokenStream} loads tokens from a
* {@link TokenSource} on-demand, and places the tokens in a buffer to provide
* access to any previous token by index.
*
* <p>
 * This token stream ignores the value of {@link Token//getChannel}. If your
 * parser requires the token stream to filter tokens down to only those on a
 * particular channel, such as {@link Token//DEFAULT_CHANNEL} or
 * {@link Token//HIDDEN_CHANNEL}, use a filtering token stream such as
 * {@link CommonTokenStream}.</p>
*/
export default class BufferedTokenStream extends TokenStream {
    constructor(tokenSource) {
        super();
        // The {@link TokenSource} from which tokens for this stream are fetched.
        this.tokenSource = tokenSource;
        /**
         * A collection of all tokens fetched from the token source. The list is
         * considered a complete view of the input once {@link //fetchedEOF} is set
         * to {@code true}.
         */
        this.tokens = [];
        /**
         * The index into {@link //tokens} of the current token (next token to
         * {@link //consume}). {@link //tokens}{@code [}{@link //p}{@code ]} should
         * be {@link //LT LT(1)}.
         *
         * <p>This field is set to -1 when the stream is first constructed or when
         * {@link //setTokenSource} is called, indicating that the first token has
         * not yet been fetched from the token source. For additional information,
         * see the documentation of {@link IntStream} for a description of
         * Initializing Methods.</p>
         */
        this.index = -1;
        /**
         * Indicates whether the {@link Token//EOF} token has been fetched from
         * {@link //tokenSource} and added to {@link //tokens}. This field improves
         * performance for the following cases:
         *
         * <ul>
         * <li>{@link //consume}: The lookahead check in {@link //consume} to
         * prevent consuming the EOF symbol is optimized by checking the values of
         * {@link //fetchedEOF} and {@link //p} instead of calling
         * {@link //LA}.</li>
         * <li>{@link //fetch}: The check to prevent adding multiple EOF symbols
         * into {@link //tokens} is trivial with this field.</li>
         * </ul>
         */
        this.fetchedEOF = false;
    }

    // Buffered streams support arbitrary lookback, so marks are free.
    mark() {
        return 0;
    }

    release(marker) {
        // no resources to release
    }

    // Rewind the stream to the first token.
    reset() {
        this.seek(0);
    }

    seek(index) {
        this.lazyInit();
        this.index = this.adjustSeekIndex(index);
    }

    // Number of tokens fetched so far (the full count only after {@link //fill}).
    get size() {
        return this.tokens.length;
    }

    // Return the token at absolute index {@code index} (fetching lazily first).
    get(index) {
        this.lazyInit();
        return this.tokens[index];
    }

    // Advance the stream by one token; throws when already at EOF.
    consume() {
        let skipEofCheck = false;
        if (this.index >= 0) {
            if (this.fetchedEOF) {
                // the last token in tokens is EOF. skip check if p indexes any
                // fetched token except the last.
                skipEofCheck = this.index < this.tokens.length - 1;
            } else {
                // no EOF token in tokens. skip check if p indexes a fetched token.
                skipEofCheck = this.index < this.tokens.length;
            }
        } else {
            // not yet initialized
            skipEofCheck = false;
        }
        if (!skipEofCheck && this.LA(1) === Token.EOF) {
            // NOTE: a plain string is thrown (not an Error) to preserve the
            // runtime's established behavior for existing catch sites.
            throw "cannot consume EOF";
        }
        if (this.sync(this.index + 1)) {
            this.index = this.adjustSeekIndex(this.index + 1);
        }
    }

    /**
     * Make sure index {@code i} in tokens has a token.
     *
     * @return {Boolean} {@code true} if a token is located at index {@code i},
     * otherwise {@code false}.
     * @see //get(int i)
     */
    sync(i) {
        const n = i - this.tokens.length + 1; // how many more elements we need?
        if (n > 0) {
            const fetched = this.fetch(n);
            return fetched >= n;
        }
        return true;
    }

    /**
     * Add {@code n} elements to buffer.
     *
     * @return {Number} The actual number of elements added to the buffer.
     */
    fetch(n) {
        if (this.fetchedEOF) {
            return 0;
        }
        for (let i = 0; i < n; i++) {
            const t = this.tokenSource.nextToken();
            t.tokenIndex = this.tokens.length;
            this.tokens.push(t);
            if (t.type === Token.EOF) {
                this.fetchedEOF = true;
                return i + 1;
            }
        }
        return n;
    }

    /**
     * Get all tokens from start..stop inclusively, optionally restricted to the
     * given token types.
     *
     * @param {Number} start First token index (inclusive).
     * @param {Number} stop Last token index (inclusive; clamped to buffer end).
     * @param types Optional collection of accepted token types; either an array
     * (uses {@code includes}) or a Set-like object exposing {@code contains}.
     * @return {Array} The matching tokens, or {@code null} for negative indices.
     */
    getTokens(start, stop, types) {
        if (types === undefined) {
            types = null;
        }
        if (start < 0 || stop < 0) {
            return null;
        }
        this.lazyInit();
        const subset = [];
        if (stop >= this.tokens.length) {
            stop = this.tokens.length - 1;
        }
        // BUG FIX: the range is documented as inclusive (and is inclusive in the
        // Java reference implementation); the original loop used `i < stop` and
        // silently dropped the last token.
        for (let i = start; i <= stop; i++) {
            const t = this.tokens[i];
            if (t.type === Token.EOF) {
                break;
            }
            // Accept both Set-like objects with contains() (original interface)
            // and plain arrays via includes().
            const accepted = types === null ||
                (typeof types.contains === "function" ? types.contains(t.type) : types.includes(t.type));
            if (accepted) {
                subset.push(t);
            }
        }
        return subset;
    }

    // Token type of the token {@code i} positions ahead (see {@link //LT}).
    LA(i) {
        return this.LT(i).type;
    }

    // Look back {@code k} tokens; {@code null} when that would precede index 0.
    LB(k) {
        if (this.index - k < 0) {
            return null;
        }
        return this.tokens[this.index - k];
    }

    // Lookahead: token {@code k} positions ahead (k>0), behind (k<0), or null (k=0).
    LT(k) {
        this.lazyInit();
        if (k === 0) {
            return null;
        }
        if (k < 0) {
            return this.LB(-k);
        }
        const i = this.index + k - 1;
        this.sync(i);
        if (i >= this.tokens.length) { // return EOF token
            // EOF must be last token
            return this.tokens[this.tokens.length - 1];
        }
        return this.tokens[i];
    }

    /**
     * Allowed derived classes to modify the behavior of operations which change
     * the current stream position by adjusting the target token index of a seek
     * operation. The default implementation simply returns {@code i}. If an
     * exception is thrown in this method, the current stream index should not be
     * changed.
     *
     * <p>For example, {@link CommonTokenStream} overrides this method to ensure
     * that the seek target is always an on-channel token.</p>
     *
     * @param {Number} i The target token index.
     * @return {Number} The adjusted target token index.
     */
    adjustSeekIndex(i) {
        return i;
    }

    // Perform first-use initialization exactly once (index === -1 sentinel).
    lazyInit() {
        if (this.index === -1) {
            this.setup();
        }
    }

    setup() {
        this.sync(0);
        this.index = this.adjustSeekIndex(0);
    }

    // Reset this token stream by setting its token source.
    setTokenSource(tokenSource) {
        this.tokenSource = tokenSource;
        this.tokens = [];
        this.index = -1;
        this.fetchedEOF = false;
    }

    /**
     * Given a starting index, return the index of the next token on channel.
     * Return i if tokens[i] is on channel. Return -1 if there are no tokens
     * on channel between i and EOF.
     */
    nextTokenOnChannel(i, channel) {
        this.sync(i);
        if (i >= this.tokens.length) {
            return -1;
        }
        let token = this.tokens[i];
        // BUG FIX: compare against the `channel` parameter, not `this.channel`.
        // BufferedTokenStream has no `channel` property, so the original
        // comparison was always against undefined and the loop could only
        // terminate at EOF, making the method return -1 for every input.
        while (token.channel !== channel) {
            if (token.type === Token.EOF) {
                return -1;
            }
            i += 1;
            this.sync(i);
            token = this.tokens[i];
        }
        return i;
    }

    /**
     * Given a starting index, return the index of the previous token on channel.
     * Return i if tokens[i] is on channel. Return -1 if there are no tokens
     * on channel between i and 0.
     */
    previousTokenOnChannel(i, channel) {
        while (i >= 0 && this.tokens[i].channel !== channel) {
            i -= 1;
        }
        return i;
    }

    /**
     * Collect all tokens on specified channel to the right of
     * the current token up until we see a token on DEFAULT_TOKEN_CHANNEL or
     * EOF. If channel is -1, find any non default channel token.
     */
    getHiddenTokensToRight(tokenIndex, channel) {
        if (channel === undefined) {
            channel = -1;
        }
        this.lazyInit();
        if (tokenIndex < 0 || tokenIndex >= this.tokens.length) {
            // BUG FIX: the original message concatenated then subtracted
            // ("..." + length - 1), which evaluates to NaN; parenthesize the
            // arithmetic so the real upper bound appears in the message.
            throw "" + tokenIndex + " not in 0.." + (this.tokens.length - 1);
        }
        const nextOnChannel = this.nextTokenOnChannel(tokenIndex + 1, Lexer.DEFAULT_TOKEN_CHANNEL);
        const from_ = tokenIndex + 1;
        // if none onchannel to right, nextOnChannel=-1 so set to = last token
        const to = nextOnChannel === -1 ? this.tokens.length - 1 : nextOnChannel;
        return this.filterForChannel(from_, to, channel);
    }

    /**
     * Collect all tokens on specified channel to the left of
     * the current token up until we see a token on DEFAULT_TOKEN_CHANNEL.
     * If channel is -1, find any non default channel token.
     */
    getHiddenTokensToLeft(tokenIndex, channel) {
        if (channel === undefined) {
            channel = -1;
        }
        this.lazyInit();
        if (tokenIndex < 0 || tokenIndex >= this.tokens.length) {
            // BUG FIX: same NaN-producing precedence bug as getHiddenTokensToRight.
            throw "" + tokenIndex + " not in 0.." + (this.tokens.length - 1);
        }
        const prevOnChannel = this.previousTokenOnChannel(tokenIndex - 1, Lexer.DEFAULT_TOKEN_CHANNEL);
        if (prevOnChannel === tokenIndex - 1) {
            return null;
        }
        // if none on channel to left, prevOnChannel=-1 then from=0
        const from_ = prevOnChannel + 1;
        const to = tokenIndex - 1;
        return this.filterForChannel(from_, to, channel);
    }

    // Collect tokens in [left, right] on `channel` (-1 = any non-default channel);
    // returns null instead of an empty array when nothing matches.
    filterForChannel(left, right, channel) {
        const hidden = [];
        for (let i = left; i < right + 1; i++) {
            const t = this.tokens[i];
            if (channel === -1) {
                if (t.channel !== Lexer.DEFAULT_TOKEN_CHANNEL) {
                    hidden.push(t);
                }
            } else if (t.channel === channel) {
                hidden.push(t);
            }
        }
        if (hidden.length === 0) {
            return null;
        }
        return hidden;
    }

    getSourceName() {
        return this.tokenSource.getSourceName();
    }

    // Get the text of all tokens in this buffer (or in the given interval).
    getText(interval) {
        this.lazyInit();
        this.fill();
        if (!interval) {
            interval = new Interval(0, this.tokens.length - 1);
        }
        let start = interval.start;
        if (start instanceof Token) {
            start = start.tokenIndex;
        }
        let stop = interval.stop;
        if (stop instanceof Token) {
            stop = stop.tokenIndex;
        }
        if (start === null || stop === null || start < 0 || stop < 0) {
            return "";
        }
        if (stop >= this.tokens.length) {
            stop = this.tokens.length - 1;
        }
        let s = "";
        for (let i = start; i < stop + 1; i++) {
            const t = this.tokens[i];
            if (t.type === Token.EOF) {
                break;
            }
            s = s + t.text;
        }
        return s;
    }

    // Get all tokens from lexer until EOF.
    fill() {
        this.lazyInit();
        // noinspection StatementWithEmptyBodyJS
        while (this.fetch(1000) === 1000);
    }
}
// NOTE(review): this installs a *static* getter on the constructor itself, so
// inside the getter `this` is the class object — `this.tokens` is undefined and
// accessing `BufferedTokenStream.size` would throw a TypeError. The class above
// already defines a working instance-level `get size()`. This block appears to
// be dead/broken code; confirm nothing relies on the static property and
// consider removing it.
Object.defineProperty(BufferedTokenStream, "size", {
get: function() {
return this.tokens.length;
}
})