diff options
Diffstat (limited to 'runtime/Java/src/main/java/org/antlr/runtime/RecognizerSharedState.java')
-rw-r--r-- | runtime/Java/src/main/java/org/antlr/runtime/RecognizerSharedState.java | 144 |
1 files changed, 144 insertions, 0 deletions
/*
 [The "BSD license"]
 Copyright (c) 2005-2009 Terence Parr
 All rights reserved.

 Redistribution and use in source and binary forms, with or without
 modification, are permitted provided that the following conditions
 are met:
 1. Redistributions of source code must retain the above copyright
     notice, this list of conditions and the following disclaimer.
 2. Redistributions in binary form must reproduce the above copyright
     notice, this list of conditions and the following disclaimer in the
     documentation and/or other materials provided with the distribution.
 3. The name of the author may not be used to endorse or promote products
     derived from this software without specific prior written permission.

 THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
 IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
 OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
 IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
 INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
 NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
 THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */
package org.antlr.runtime;

import java.util.Map;

/** The set of fields needed by an abstract recognizer to recognize input
 *  and recover from errors etc...  As a separate state object, it can be
 *  shared among multiple grammars; e.g., when one grammar imports another.
 *
 *  These fields are publicly visible but the actual state pointer per
 *  parser is protected.
 */
public class RecognizerSharedState {
    /** Track the set of token types that can follow any rule invocation.
     *  Stack grows upwards.  When it hits the max, it grows 2x in size
     *  and keeps going.
     */
    public BitSet[] following = new BitSet[BaseRecognizer.INITIAL_FOLLOW_STACK_SIZE];

    /** Index of the top of the {@link #following} stack; -1 when empty. */
    public int _fsp = -1;

    /** This is true when we see an error and before having successfully
     *  matched a token.  Prevents generation of more than one error message
     *  per error.
     */
    public boolean errorRecovery = false;

    /** The index into the input stream where the last error occurred.
     *  This is used to prevent infinite loops where an error is found
     *  but no token is consumed during recovery...another error is found,
     *  ad nauseam.  This is a failsafe mechanism to guarantee that at least
     *  one token/tree node is consumed for two errors.
     */
    public int lastErrorIndex = -1;

    /** In lieu of a return value, this indicates that a rule or token
     *  has failed to match.  Reset to false upon valid token match.
     */
    public boolean failed = false;

    /** Did the recognizer encounter a syntax error?  Track how many. */
    public int syntaxErrors = 0;

    /** If 0, no backtracking is going on.  Safe to exec actions etc...
     *  If &gt;0 then it's the level of backtracking.
     */
    public int backtracking = 0;

    /** An array[size num rules] of {@code Map<Integer,Integer>} that tracks
     *  the stop token index for each rule.  ruleMemo[ruleIndex] is
     *  the memoization table for ruleIndex.  For key ruleStartIndex, you
     *  get back the stop token for associated rule or MEMO_RULE_FAILED.
     *
     *  This is only used if rule memoization is on (which it is by default).
     *
     *  The element type is left raw so that existing code assigning a raw
     *  {@code Map[]} to this field keeps compiling unchanged.
     */
    public Map[] ruleMemo;


    // LEXER FIELDS (must be in same state object to avoid casting
    //               constantly in generated code and Lexer object) :(


    /** The goal of all lexer rules/methods is to create a token object.
     *  This is an instance variable as multiple rules may collaborate to
     *  create a single token.  nextToken will return this object after
     *  matching lexer rule(s).  If you subclass to allow multiple token
     *  emissions, then set this to the last token to be matched or
     *  something nonnull so that the auto token emit mechanism will not
     *  emit another token.
     */
    public Token token;

    /** What character index in the stream did the current token start at?
     *  Needed, for example, to get the text for current token.  Set at
     *  the start of nextToken.
     */
    public int tokenStartCharIndex = -1;

    /** The line on which the first character of the token resides */
    public int tokenStartLine;

    /** The character position of first character within the line */
    public int tokenStartCharPositionInLine;

    /** The channel number for the current token */
    public int channel;

    /** The token type for the current token */
    public int type;

    /** You can set the text for the current token to override what is in
     *  the input char buffer.  Use setText() or can set this instance var.
     */
    public String text;

    /** Create a fresh state object with every field at its declared default. */
    public RecognizerSharedState() {
    }

    /** Create a copy of {@code state}.
     *
     *  The copy is shallow: this object gets its own {@code following} and
     *  {@code ruleMemo} arrays, but the array elements and the {@code token}
     *  reference are shared with {@code state}.  {@code ruleMemo} stays
     *  {@code null} when {@code state.ruleMemo} is {@code null}.
     *
     *  @param state the state to copy from; must not be {@code null}
     */
    public RecognizerSharedState(RecognizerSharedState state) {
        // Only reallocate when the source stack does not fit in the
        // default-sized array created by the field initializer.
        if ( this.following.length < state.following.length ) {
            this.following = new BitSet[state.following.length];
        }
        System.arraycopy(state.following, 0, this.following, 0, state.following.length);
        this._fsp = state._fsp;
        this.errorRecovery = state.errorRecovery;
        this.lastErrorIndex = state.lastErrorIndex;
        this.failed = state.failed;
        this.syntaxErrors = state.syntaxErrors;
        this.backtracking = state.backtracking;
        if ( state.ruleMemo!=null ) {
            this.ruleMemo = new Map[state.ruleMemo.length];
            System.arraycopy(state.ruleMemo, 0, this.ruleMemo, 0, state.ruleMemo.length);
        }
        this.token = state.token;
        this.tokenStartCharIndex = state.tokenStartCharIndex;
        // Previously omitted: without this the copy reported line 0 for the
        // current token even though every other token-start field was copied.
        this.tokenStartLine = state.tokenStartLine;
        this.tokenStartCharPositionInLine = state.tokenStartCharPositionInLine;
        this.channel = state.channel;
        this.type = state.type;
        this.text = state.text;
    }
}