You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
551 lines
17 KiB
551 lines
17 KiB
5 years ago
|
package com.fr.third.antlr;
|
||
|
|
||
|
/* ANTLR Translator Generator
|
||
|
* Project led by Terence Parr at http://www.cs.usfca.edu
|
||
|
* Software rights: http://www.antlr.org/license.html
|
||
|
*/
|
||
|
|
||
|
|
||
|
import java.util.*;
|
||
|
|
||
|
import com.fr.third.antlr.ASdebug.ASDebugStream;
|
||
|
import com.fr.third.antlr.ASdebug.IASDebugStream;
|
||
|
import com.fr.third.antlr.ASdebug.TokenOffsetInfo;
|
||
|
import com.fr.third.antlr.collections.impl.BitSet;
|
||
|
|
||
|
/** This token stream tracks the *entire* token stream coming from
|
||
|
* a lexer, but does not pass on the whitespace (or whatever else
|
||
|
* you want to discard) to the parser.
|
||
|
*
|
||
|
* This class can then be asked for the ith token in the input stream.
|
||
|
* Useful for dumping out the input stream exactly after doing some
|
||
|
* augmentation or other manipulations. Tokens are index from 0..n-1
|
||
|
*
|
||
|
* You can insert stuff, replace, and delete chunks. Note that the
|
||
|
* operations are done lazily--only if you convert the buffer to a
|
||
|
* String. This is very efficient because you are not moving data around
|
||
|
* all the time. As the buffer of tokens is converted to strings, the
|
||
|
* toString() method(s) check to see if there is an operation at the
|
||
|
* current index. If so, the operation is done and then normal String
|
||
|
* rendering continues on the buffer. This is like having multiple Turing
|
||
|
* machine instruction streams (programs) operating on a single input tape. :)
|
||
|
*
|
||
|
* Since the operations are done lazily at toString-time, operations do not
|
||
|
* screw up the token index values. That is, an insert operation at token
|
||
|
* index i does not change the index values for tokens i+1..n-1.
|
||
|
*
|
||
|
* Because operations never actually alter the buffer, you may always get
|
||
|
* the original token stream back without undoing anything. Since
|
||
|
* the instructions are queued up, you can easily simulate transactions and
|
||
|
* roll back any changes if there is an error just by removing instructions.
|
||
|
* For example,
|
||
|
*
|
||
|
* TokenStreamRewriteEngine rewriteEngine =
|
||
|
* new TokenStreamRewriteEngine(lexer);
|
||
|
* JavaRecognizer parser = new JavaRecognizer(rewriteEngine);
|
||
|
* ...
|
||
|
* rewriteEngine.insertAfter("pass1", t, "foobar");}
|
||
|
* rewriteEngine.insertAfter("pass2", u, "start");}
|
||
|
* System.out.println(rewriteEngine.toString("pass1"));
|
||
|
* System.out.println(rewriteEngine.toString("pass2"));
|
||
|
*
|
||
|
* You can also have multiple "instruction streams" and get multiple
|
||
|
* rewrites from a single pass over the input. Just name the instruction
|
||
|
* streams and use that name again when printing the buffer. This could be
|
||
|
* useful for generating a C file and also its header file--all from the
|
||
|
* same buffer.
|
||
|
*
|
||
|
* If you don't use named rewrite streams, a "default" stream is used.
|
||
|
*
|
||
|
* Terence Parr, parrt at antlr.org
|
||
|
* University of San Francisco
|
||
|
* February 2004
|
||
|
*/
|
||
|
public class TokenStreamRewriteEngine implements TokenStream, IASDebugStream {
|
||
|
public static final int MIN_TOKEN_INDEX = 0;
|
||
|
|
||
|
static class RewriteOperation {
|
||
|
protected int index;
|
||
|
protected String text;
|
||
|
protected RewriteOperation(int index, String text) {
|
||
|
this.index = index;
|
||
|
this.text = text;
|
||
|
}
|
||
|
/** Execute the rewrite operation by possibly adding to the buffer.
|
||
|
* Return the index of the next token to operate on.
|
||
|
*/
|
||
|
public int execute(StringBuffer buf) {
|
||
|
return index;
|
||
|
}
|
||
|
public String toString() {
|
||
|
String opName = getClass().getName();
|
||
|
int $index = opName.indexOf('$');
|
||
|
opName = opName.substring($index+1, opName.length());
|
||
|
return opName+"@"+index+'"'+text+'"';
|
||
|
}
|
||
|
}
|
||
|
|
||
|
static class InsertBeforeOp extends RewriteOperation {
|
||
|
public InsertBeforeOp(int index, String text) {
|
||
|
super(index,text);
|
||
|
}
|
||
|
public int execute(StringBuffer buf) {
|
||
|
buf.append(text);
|
||
|
return index;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
/** I'm going to try replacing range from x..y with (y-x)+1 ReplaceOp
|
||
|
* instructions.
|
||
|
*/
|
||
|
static class ReplaceOp extends RewriteOperation {
|
||
|
protected int lastIndex;
|
||
|
public ReplaceOp(int from, int to, String text) {
|
||
|
super(from,text);
|
||
|
lastIndex = to;
|
||
|
}
|
||
|
public int execute(StringBuffer buf) {
|
||
|
if ( text!=null ) {
|
||
|
buf.append(text);
|
||
|
}
|
||
|
return lastIndex+1;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
static class DeleteOp extends ReplaceOp {
|
||
|
public DeleteOp(int from, int to) {
|
||
|
super(from, to, null);
|
||
|
}
|
||
|
}
|
||
|
|
||
|
public static final String DEFAULT_PROGRAM_NAME = "default";
|
||
|
public static final int PROGRAM_INIT_SIZE = 100;
|
||
|
|
||
|
/** Track the incoming list of tokens */
|
||
|
protected List tokens;
|
||
|
|
||
|
/** You may have multiple, named streams of rewrite operations.
|
||
|
* I'm calling these things "programs."
|
||
|
* Maps String (name) -> rewrite (List)
|
||
|
*/
|
||
|
protected Map programs = null;
|
||
|
|
||
|
/** Map String (program name) -> Integer index */
|
||
|
protected Map lastRewriteTokenIndexes = null;
|
||
|
|
||
|
/** track index of tokens */
|
||
|
protected int index = MIN_TOKEN_INDEX;
|
||
|
|
||
|
/** Who do we suck tokens from? */
|
||
|
protected TokenStream stream;
|
||
|
|
||
|
/** Which (whitespace) token(s) to throw out */
|
||
|
protected BitSet discardMask = new BitSet();
|
||
|
|
||
|
public TokenStreamRewriteEngine(TokenStream upstream) {
|
||
|
this(upstream,1000);
|
||
|
}
|
||
|
|
||
|
public TokenStreamRewriteEngine(TokenStream upstream, int initialSize) {
|
||
|
stream = upstream;
|
||
|
tokens = new ArrayList(initialSize);
|
||
|
programs = new HashMap();
|
||
|
programs.put(DEFAULT_PROGRAM_NAME,
|
||
|
new ArrayList(PROGRAM_INIT_SIZE));
|
||
|
lastRewriteTokenIndexes = new HashMap();
|
||
|
}
|
||
|
|
||
|
public Token nextToken() throws TokenStreamException {
|
||
|
TokenWithIndex t;
|
||
|
// suck tokens until end of stream or we find a non-discarded token
|
||
|
do {
|
||
|
t = (TokenWithIndex)stream.nextToken();
|
||
|
if ( t!=null ) {
|
||
|
t.setIndex(index); // what is t's index in list?
|
||
|
if ( t.getType()!=Token.EOF_TYPE ) {
|
||
|
tokens.add(t); // track all tokens except EOF
|
||
|
}
|
||
|
index++; // move to next position
|
||
|
}
|
||
|
} while ( t!=null && discardMask.member(t.getType()) );
|
||
|
return t;
|
||
|
}
|
||
|
|
||
|
public void rollback(int instructionIndex) {
|
||
|
rollback(DEFAULT_PROGRAM_NAME, instructionIndex);
|
||
|
}
|
||
|
|
||
|
/** Rollback the instruction stream for a program so that
|
||
|
* the indicated instruction (via instructionIndex) is no
|
||
|
* longer in the stream. UNTESTED!
|
||
|
*/
|
||
|
public void rollback(String programName, int instructionIndex) {
|
||
|
List is = (List)programs.get(programName);
|
||
|
if ( is!=null ) {
|
||
|
programs.put(programName, is.subList(MIN_TOKEN_INDEX,instructionIndex));
|
||
|
}
|
||
|
}
|
||
|
|
||
|
public void deleteProgram() {
|
||
|
deleteProgram(DEFAULT_PROGRAM_NAME);
|
||
|
}
|
||
|
|
||
|
/** Reset the program so that no instructions exist */
|
||
|
public void deleteProgram(String programName) {
|
||
|
rollback(programName, MIN_TOKEN_INDEX);
|
||
|
}
|
||
|
|
||
|
/** If op.index > lastRewriteTokenIndexes, just add to the end.
|
||
|
* Otherwise, do linear */
|
||
|
protected void addToSortedRewriteList(RewriteOperation op) {
|
||
|
addToSortedRewriteList(DEFAULT_PROGRAM_NAME, op);
|
||
|
}
|
||
|
|
||
|
/** old; before moving v3 stuff in
|
||
|
protected void addToSortedRewriteList(String programName, RewriteOperation op) {
|
||
|
List rewrites = getProgram(programName);
|
||
|
// if at or beyond last op's index, just append
|
||
|
if ( op.index>=getLastRewriteTokenIndex(programName) ) {
|
||
|
rewrites.add(op); // append to list of operations
|
||
|
// record the index of this operation for next time through
|
||
|
setLastRewriteTokenIndex(programName, op.index);
|
||
|
return;
|
||
|
}
|
||
|
// not after the last one, so must insert to ordered list
|
||
|
Comparator comparator = new Comparator() {
|
||
|
public int compare(Object o, Object o1) {
|
||
|
RewriteOperation a = (RewriteOperation)o;
|
||
|
RewriteOperation b = (RewriteOperation)o1;
|
||
|
if ( a.index<b.index ) return -1;
|
||
|
if ( a.index>b.index ) return 1;
|
||
|
return 0;
|
||
|
}
|
||
|
};
|
||
|
int pos = Collections.binarySearch(rewrites, op, comparator);
|
||
|
if ( pos<0 ) {
|
||
|
rewrites.add(-pos-1, op);
|
||
|
}
|
||
|
}
|
||
|
*/
|
||
|
|
||
|
/** Add an instruction to the rewrite instruction list ordered by
|
||
|
* the instruction number (use a binary search for efficiency).
|
||
|
* The list is ordered so that toString() can be done efficiently.
|
||
|
*
|
||
|
* When there are multiple instructions at the same index, the instructions
|
||
|
* must be ordered to ensure proper behavior. For example, a delete at
|
||
|
* index i must kill any replace operation at i. Insert-before operations
|
||
|
* must come before any replace / delete instructions. If there are
|
||
|
* multiple insert instructions for a single index, they are done in
|
||
|
* reverse insertion order so that "insert foo" then "insert bar" yields
|
||
|
* "foobar" in front rather than "barfoo". This is convenient because
|
||
|
* I can insert new InsertOp instructions at the index returned by
|
||
|
* the binary search. A ReplaceOp kills any previous replace op. Since
|
||
|
* delete is the same as replace with null text, i can check for
|
||
|
* ReplaceOp and cover DeleteOp at same time. :)
|
||
|
*/
|
||
|
protected void addToSortedRewriteList(String programName, RewriteOperation op) {
|
||
|
List rewrites = getProgram(programName);
|
||
|
//System.out.println("### add "+op+"; rewrites="+rewrites);
|
||
|
Comparator comparator = new Comparator() {
|
||
|
public int compare(Object o, Object o1) {
|
||
|
RewriteOperation a = (RewriteOperation)o;
|
||
|
RewriteOperation b = (RewriteOperation)o1;
|
||
|
if ( a.index<b.index ) return -1;
|
||
|
if ( a.index>b.index ) return 1;
|
||
|
return 0;
|
||
|
}
|
||
|
};
|
||
|
int pos = Collections.binarySearch(rewrites, op, comparator);
|
||
|
//System.out.println("bin search returns: pos="+pos);
|
||
|
|
||
|
if ( pos>=0 ) {
|
||
|
// binarySearch does not guarantee first element when multiple
|
||
|
// are found. I must seach backwards for first op with op.index
|
||
|
for (; pos>=0; pos--) {
|
||
|
RewriteOperation prevOp = (RewriteOperation)rewrites.get(pos);
|
||
|
if ( prevOp.index<op.index ) {
|
||
|
break;
|
||
|
}
|
||
|
}
|
||
|
pos++; // pos points at first op before ops with op.index; go back up one
|
||
|
// now pos is the index in rewrites of first op with op.index
|
||
|
//System.out.println("first op with op.index: pos="+pos);
|
||
|
|
||
|
// an instruction operating already on that index was found;
|
||
|
// make this one happen after all the others
|
||
|
//System.out.println("found instr for index="+op.index);
|
||
|
if ( op instanceof ReplaceOp ) {
|
||
|
boolean replaced = false;
|
||
|
int i;
|
||
|
// look for an existing replace
|
||
|
for (i=pos; i<rewrites.size(); i++) {
|
||
|
RewriteOperation prevOp = (RewriteOperation)rewrites.get(pos);
|
||
|
if ( prevOp.index!=op.index ) {
|
||
|
break;
|
||
|
}
|
||
|
if ( prevOp instanceof ReplaceOp ) {
|
||
|
rewrites.set(pos, op); // replace old with new
|
||
|
replaced=true;
|
||
|
break;
|
||
|
}
|
||
|
// keep going; must be an insert
|
||
|
}
|
||
|
if ( !replaced ) {
|
||
|
// add replace op to the end of all the inserts
|
||
|
rewrites.add(i, op);
|
||
|
}
|
||
|
}
|
||
|
else {
|
||
|
// inserts are added in front of existing inserts
|
||
|
rewrites.add(pos, op);
|
||
|
}
|
||
|
}
|
||
|
else {
|
||
|
//System.out.println("no instruction at pos=="+pos);
|
||
|
rewrites.add(-pos-1, op);
|
||
|
}
|
||
|
//System.out.println("after, rewrites="+rewrites);
|
||
|
}
|
||
|
|
||
|
public void insertAfter(Token t, String text) {
|
||
|
insertAfter(DEFAULT_PROGRAM_NAME, t, text);
|
||
|
}
|
||
|
|
||
|
public void insertAfter(int index, String text) {
|
||
|
insertAfter(DEFAULT_PROGRAM_NAME, index, text);
|
||
|
}
|
||
|
|
||
|
public void insertAfter(String programName, Token t, String text) {
|
||
|
insertAfter(programName,((TokenWithIndex)t).getIndex(), text);
|
||
|
}
|
||
|
|
||
|
public void insertAfter(String programName, int index, String text) {
|
||
|
// to insert after, just insert before next index (even if past end)
|
||
|
insertBefore(programName,index+1, text);
|
||
|
}
|
||
|
|
||
|
public void insertBefore(Token t, String text) {
|
||
|
insertBefore(DEFAULT_PROGRAM_NAME, t, text);
|
||
|
}
|
||
|
|
||
|
public void insertBefore(int index, String text) {
|
||
|
insertBefore(DEFAULT_PROGRAM_NAME, index, text);
|
||
|
}
|
||
|
|
||
|
public void insertBefore(String programName, Token t, String text) {
|
||
|
insertBefore(programName, ((TokenWithIndex)t).getIndex(), text);
|
||
|
}
|
||
|
|
||
|
public void insertBefore(String programName, int index, String text) {
|
||
|
addToSortedRewriteList(programName, new InsertBeforeOp(index,text));
|
||
|
}
|
||
|
|
||
|
public void replace(int index, String text) {
|
||
|
replace(DEFAULT_PROGRAM_NAME, index, index, text);
|
||
|
}
|
||
|
|
||
|
public void replace(int from, int to, String text) {
|
||
|
replace(DEFAULT_PROGRAM_NAME, from, to, text);
|
||
|
}
|
||
|
|
||
|
public void replace(Token indexT, String text) {
|
||
|
replace(DEFAULT_PROGRAM_NAME, indexT, indexT, text);
|
||
|
}
|
||
|
|
||
|
public void replace(Token from, Token to, String text) {
|
||
|
replace(DEFAULT_PROGRAM_NAME, from, to, text);
|
||
|
}
|
||
|
|
||
|
public void replace(String programName, int from, int to, String text) {
|
||
|
addToSortedRewriteList(new ReplaceOp(from, to, text));
|
||
|
}
|
||
|
|
||
|
public void replace(String programName, Token from, Token to, String text) {
|
||
|
replace(programName,
|
||
|
((TokenWithIndex)from).getIndex(),
|
||
|
((TokenWithIndex)to).getIndex(),
|
||
|
text);
|
||
|
}
|
||
|
|
||
|
public void delete(int index) {
|
||
|
delete(DEFAULT_PROGRAM_NAME, index, index);
|
||
|
}
|
||
|
|
||
|
public void delete(int from, int to) {
|
||
|
delete(DEFAULT_PROGRAM_NAME, from, to);
|
||
|
}
|
||
|
|
||
|
public void delete(Token indexT) {
|
||
|
delete(DEFAULT_PROGRAM_NAME, indexT, indexT);
|
||
|
}
|
||
|
|
||
|
public void delete(Token from, Token to) {
|
||
|
delete(DEFAULT_PROGRAM_NAME, from, to);
|
||
|
}
|
||
|
|
||
|
public void delete(String programName, int from, int to) {
|
||
|
replace(programName,from,to,null);
|
||
|
}
|
||
|
|
||
|
public void delete(String programName, Token from, Token to) {
|
||
|
replace(programName,from,to,null);
|
||
|
}
|
||
|
|
||
|
public void discard(int ttype) {
|
||
|
discardMask.add(ttype);
|
||
|
}
|
||
|
|
||
|
public TokenWithIndex getToken(int i) {
|
||
|
return (TokenWithIndex)tokens.get(i);
|
||
|
}
|
||
|
|
||
|
public int getTokenStreamSize() {
|
||
|
return tokens.size();
|
||
|
}
|
||
|
|
||
|
public String toOriginalString() {
|
||
|
return toOriginalString(MIN_TOKEN_INDEX, getTokenStreamSize()-1);
|
||
|
}
|
||
|
|
||
|
public String toOriginalString(int start, int end) {
|
||
|
StringBuffer buf = new StringBuffer();
|
||
|
for (int i=start; i>=MIN_TOKEN_INDEX && i<=end && i<tokens.size(); i++) {
|
||
|
buf.append(getToken(i).getText());
|
||
|
}
|
||
|
return buf.toString();
|
||
|
}
|
||
|
|
||
|
public String toString() {
|
||
|
return toString(MIN_TOKEN_INDEX, getTokenStreamSize()-1);
|
||
|
}
|
||
|
|
||
|
public String toString(String programName) {
|
||
|
return toString(programName, MIN_TOKEN_INDEX, getTokenStreamSize()-1);
|
||
|
}
|
||
|
|
||
|
public String toString(int start, int end) {
|
||
|
return toString(DEFAULT_PROGRAM_NAME, start, end);
|
||
|
}
|
||
|
|
||
|
public String toString(String programName, int start, int end) {
|
||
|
List rewrites = (List)programs.get(programName);
|
||
|
if ( rewrites==null || rewrites.size()==0 ) {
|
||
|
return toOriginalString(start,end); // no instructions to execute
|
||
|
}
|
||
|
StringBuffer buf = new StringBuffer();
|
||
|
|
||
|
/// Index of first rewrite we have not done
|
||
|
int rewriteOpIndex = 0;
|
||
|
|
||
|
int tokenCursor=start;
|
||
|
while ( tokenCursor>=MIN_TOKEN_INDEX &&
|
||
|
tokenCursor<=end &&
|
||
|
tokenCursor<tokens.size() )
|
||
|
{
|
||
|
//System.out.println("tokenCursor="+tokenCursor);
|
||
|
// execute instructions associated with this token index
|
||
|
if ( rewriteOpIndex<rewrites.size() ) {
|
||
|
RewriteOperation op =
|
||
|
(RewriteOperation)rewrites.get(rewriteOpIndex);
|
||
|
|
||
|
// skip all ops at lower index
|
||
|
while ( op.index<tokenCursor && rewriteOpIndex<rewrites.size() ) {
|
||
|
rewriteOpIndex++;
|
||
|
if ( rewriteOpIndex<rewrites.size() ) {
|
||
|
op = (RewriteOperation)rewrites.get(rewriteOpIndex);
|
||
|
}
|
||
|
}
|
||
|
|
||
|
// while we have ops for this token index, exec them
|
||
|
while ( tokenCursor==op.index && rewriteOpIndex<rewrites.size() ) {
|
||
|
//System.out.println("execute "+op+" at instruction "+rewriteOpIndex);
|
||
|
tokenCursor = op.execute(buf);
|
||
|
//System.out.println("after execute tokenCursor = "+tokenCursor);
|
||
|
rewriteOpIndex++;
|
||
|
if ( rewriteOpIndex<rewrites.size() ) {
|
||
|
op = (RewriteOperation)rewrites.get(rewriteOpIndex);
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
// dump the token at this index
|
||
|
if ( tokenCursor<=end ) {
|
||
|
buf.append(getToken(tokenCursor).getText());
|
||
|
tokenCursor++;
|
||
|
}
|
||
|
}
|
||
|
// now see if there are operations (append) beyond last token index
|
||
|
for (int opi=rewriteOpIndex; opi<rewrites.size(); opi++) {
|
||
|
RewriteOperation op =
|
||
|
(RewriteOperation)rewrites.get(opi);
|
||
|
if ( op.index>=size() ) {
|
||
|
op.execute(buf); // must be insertions if after last token
|
||
|
}
|
||
|
//System.out.println("execute "+op+" at "+opi);
|
||
|
//op.execute(buf); // must be insertions if after last token
|
||
|
}
|
||
|
|
||
|
return buf.toString();
|
||
|
}
|
||
|
|
||
|
public String toDebugString() {
|
||
|
return toDebugString(MIN_TOKEN_INDEX, getTokenStreamSize()-1);
|
||
|
}
|
||
|
|
||
|
public String toDebugString(int start, int end) {
|
||
|
StringBuffer buf = new StringBuffer();
|
||
|
for (int i=start; i>=MIN_TOKEN_INDEX && i<=end && i<tokens.size(); i++) {
|
||
|
buf.append(getToken(i));
|
||
|
}
|
||
|
return buf.toString();
|
||
|
}
|
||
|
|
||
|
public int getLastRewriteTokenIndex() {
|
||
|
return getLastRewriteTokenIndex(DEFAULT_PROGRAM_NAME);
|
||
|
}
|
||
|
|
||
|
protected int getLastRewriteTokenIndex(String programName) {
|
||
|
Integer I = (Integer)lastRewriteTokenIndexes.get(programName);
|
||
|
if ( I==null ) {
|
||
|
return -1;
|
||
|
}
|
||
|
return I.intValue();
|
||
|
}
|
||
|
|
||
|
protected void setLastRewriteTokenIndex(String programName, int i) {
|
||
|
lastRewriteTokenIndexes.put(programName, new Integer(i));
|
||
|
}
|
||
|
|
||
|
protected List getProgram(String name) {
|
||
|
List is = (List)programs.get(name);
|
||
|
if ( is==null ) {
|
||
|
is = initializeProgram(name);
|
||
|
}
|
||
|
return is;
|
||
|
}
|
||
|
|
||
|
private List initializeProgram(String name) {
|
||
|
List is = new ArrayList(PROGRAM_INIT_SIZE);
|
||
|
programs.put(name, is);
|
||
|
return is;
|
||
|
}
|
||
|
|
||
|
public int size() {
|
||
|
return tokens.size();
|
||
|
}
|
||
|
|
||
|
public int index() {
|
||
|
return index;
|
||
|
}
|
||
|
|
||
|
public String getEntireText()
|
||
|
{
|
||
|
return ASDebugStream.getEntireText(this.stream);
|
||
|
}
|
||
|
|
||
|
public TokenOffsetInfo getOffsetInfo(Token token)
|
||
|
{
|
||
|
return ASDebugStream.getOffsetInfo(this.stream, token);
|
||
|
}
|
||
|
}
|