changed grammar to allow <assoc=right> on | operator for alt. still allowed on token refs but ignored. Simplified left-recursion elemination rules. see CHANGES.TXT Aug 7, 2013. BREAKING CHANGE. Must alter ternary op alts in grammars.

This commit is contained in:
Terence Parr 2013-08-07 16:46:52 -07:00 committed by Sam Harwell
parent 185ee4e18e
commit 531afe5af8
7 changed files with 140 additions and 114 deletions

View File

@ -1,5 +1,44 @@
ANTLR v4 Honey Badger ANTLR v4 Honey Badger
August 7, 2013
* [BREAKING CHANGE] Altered left-recursion elimination to be simpler. Now,
we use the following patterns:
* Binary expressions are expressions which contain a recursive invocation of
the rule as the first and last element of the alternative.
* Suffix expressions contain a recursive invocation of the rule as the first
element of the alternative, but not as the last element.
* Prefix expressions contain a recursive invocation of the rule as the last
element of the alternative, but not as the first element.
There is no such thing as a "ternary" expression--they are just binary
expressions in disguise.
The right associativity specifiers no longer on the individual tokens because
it's done on alternative basis anyway. The option is now on the individual
alternative; e.g.,
e : e '*' e
| e '+' e
|<assoc=right> e '?' e ':' e
|<assoc=right> e '=' e
| INT
;
If your language uses a right-associative ternary operator, you will need
to update your grammar to include <assoc=right> on the alternative operator.
This also fixes #245 and fixes #268:
https://github.com/antlr/antlr4/issues/245
https://github.com/antlr/antlr4/issues/268
To smooth the transition, <assoc=right> is still allowed on token references
but it is ignored.
June 30, 2013 -- 4.1 release June 30, 2013 -- 4.1 release
June 24, 2013 June 24, 2013

View File

@ -38,11 +38,11 @@ import org.antlr.v4.Tool;
import org.antlr.v4.codegen.CodeGenerator; import org.antlr.v4.codegen.CodeGenerator;
import org.antlr.v4.parse.GrammarASTAdaptor; import org.antlr.v4.parse.GrammarASTAdaptor;
import org.antlr.v4.parse.LeftRecursiveRuleWalker; import org.antlr.v4.parse.LeftRecursiveRuleWalker;
import org.antlr.v4.runtime.misc.IntervalSet;
import org.antlr.v4.runtime.misc.Pair; import org.antlr.v4.runtime.misc.Pair;
import org.antlr.v4.tool.ErrorType; import org.antlr.v4.tool.ErrorType;
import org.antlr.v4.tool.ast.AltAST; import org.antlr.v4.tool.ast.AltAST;
import org.antlr.v4.tool.ast.GrammarAST; import org.antlr.v4.tool.ast.GrammarAST;
import org.antlr.v4.tool.ast.GrammarASTWithOptions;
import org.stringtemplate.v4.ST; import org.stringtemplate.v4.ST;
import org.stringtemplate.v4.STGroup; import org.stringtemplate.v4.STGroup;
import org.stringtemplate.v4.STGroupFile; import org.stringtemplate.v4.STGroupFile;
@ -115,11 +115,10 @@ public class LeftRecursiveRuleAnalyzer extends LeftRecursiveRuleWalker {
} }
@Override @Override
public void setTokenAssoc(GrammarAST t, int alt) { public void setAltAssoc(AltAST t, int alt) {
ASSOC assoc = ASSOC.left; ASSOC assoc = ASSOC.left;
if ( t instanceof GrammarASTWithOptions ) { if ( t.getOptions()!=null ) {
if ( ((GrammarASTWithOptions)t).getOptions()!=null ) { String a = t.getOptionString("assoc");
String a = ((GrammarASTWithOptions)t).getOptionString("assoc");
if ( a!=null ) { if ( a!=null ) {
if ( a.equals(ASSOC.right.toString()) ) { if ( a.equals(ASSOC.right.toString()) ) {
assoc = ASSOC.right; assoc = ASSOC.right;
@ -132,14 +131,13 @@ public class LeftRecursiveRuleAnalyzer extends LeftRecursiveRuleWalker {
} }
} }
} }
}
if ( altAssociativity.get(alt)!=null && altAssociativity.get(alt)!=assoc ) { if ( altAssociativity.get(alt)!=null && altAssociativity.get(alt)!=assoc ) {
tool.errMgr.toolError(ErrorType.ALL_OPS_NEED_SAME_ASSOC, alt); tool.errMgr.toolError(ErrorType.ALL_OPS_NEED_SAME_ASSOC, alt);
} }
altAssociativity.put(alt, assoc); altAssociativity.put(alt, assoc);
//System.out.println("op " + alt + ": " + t.getText()+", assoc="+assoc); System.out.println("setAltAssoc: op " + alt + ": " + t.getText()+", assoc="+assoc);
} }
@Override @Override
@ -169,32 +167,6 @@ public class LeftRecursiveRuleAnalyzer extends LeftRecursiveRuleWalker {
//System.out.println("binaryAlt " + alt + ": " + altText + ", rewrite=" + rewriteText); //System.out.println("binaryAlt " + alt + ": " + altText + ", rewrite=" + rewriteText);
} }
/** Convert e ? e : e -> ? e : e_[nextPrec] */
@Override
public void ternaryAlt(AltAST originalAltTree, int alt) {
AltAST altTree = (AltAST)originalAltTree.dupTree();
String altLabel = altTree.altLabel!=null ? altTree.altLabel.getText() : null;
GrammarAST lrlabel = stripLeftRecursion(altTree);
String label = lrlabel != null ? lrlabel.getText() : null;
if ( lrlabel!=null ) {
leftRecursiveRuleRefLabels.add(new Pair<GrammarAST,String>(lrlabel,altLabel));
}
stripAssocOptions(altTree);
stripAltLabel(altTree);
int nextPrec = nextPrecedence(alt);
altTree = addPrecedenceArgToLastRule(altTree, nextPrec);
String altText = text(altTree);
altText = altText.trim();
LeftRecursiveRuleAltInfo a =
new LeftRecursiveRuleAltInfo(alt, altText, label, altLabel, originalAltTree);
a.nextPrec = nextPrec;
ternaryAlts.put(alt, a);
//System.out.println("ternaryAlt " + alt + ": " + altText + ", rewrite=" + rewriteText);
}
@Override @Override
public void prefixAlt(AltAST originalAltTree, int alt) { public void prefixAlt(AltAST originalAltTree, int alt) {
AltAST altTree = (AltAST)originalAltTree.dupTree(); AltAST altTree = (AltAST)originalAltTree.dupTree();
@ -282,24 +254,18 @@ public class LeftRecursiveRuleAnalyzer extends LeftRecursiveRuleWalker {
public AltAST addPrecedenceArgToRules(AltAST t, int prec) { public AltAST addPrecedenceArgToRules(AltAST t, int prec) {
if ( t==null ) return null; if ( t==null ) return null;
for (GrammarAST rref : t.getNodesWithType(RULE_REF)) { // get all top-level rule refs from ALT
if ( rref.getText().equals(ruleName) ) { List<GrammarAST> outerAltRuleRefs = t.getNodesWithTypePreorderDFS(IntervalSet.of(RULE_REF));
for (GrammarAST rref : outerAltRuleRefs) {
boolean recursive = rref.getText().equals(ruleName);
boolean rightmost = rref == outerAltRuleRefs.get(outerAltRuleRefs.size()-1);
if ( recursive && rightmost ) {
rref.setText(ruleName+"["+prec+"]"); rref.setText(ruleName+"["+prec+"]");
} }
} }
return t; return t;
} }
public AltAST addPrecedenceArgToLastRule(AltAST t, int prec) {
if ( t==null ) return null;
GrammarAST last = null;
for (GrammarAST rref : t.getNodesWithType(RULE_REF)) { last = rref; }
if ( last !=null && last.getText().equals(ruleName) ) {
last.setText(ruleName+"["+prec+"]");
}
return t;
}
public void stripAssocOptions(GrammarAST t) { public void stripAssocOptions(GrammarAST t) {
if ( t==null ) return; if ( t==null ) return;
for (GrammarAST options : t.getNodesWithType(ELEMENT_OPTIONS)) { for (GrammarAST options : t.getNodesWithType(ELEMENT_OPTIONS)) {
@ -347,15 +313,21 @@ public class LeftRecursiveRuleAnalyzer extends LeftRecursiveRuleWalker {
public GrammarAST stripLeftRecursion(GrammarAST altAST) { public GrammarAST stripLeftRecursion(GrammarAST altAST) {
GrammarAST lrlabel=null; GrammarAST lrlabel=null;
GrammarAST first = (GrammarAST)altAST.getChild(0); GrammarAST first = (GrammarAST)altAST.getChild(0);
int leftRecurRuleIndex = 0;
if ( first.getType() == ELEMENT_OPTIONS ) {
first = (GrammarAST)altAST.getChild(1);
leftRecurRuleIndex = 1;
}
Tree rref = first.getChild(1); // if label=rule Tree rref = first.getChild(1); // if label=rule
if ( (first.getType()==RULE_REF && first.getText().equals(ruleName)) || if ( (first.getType()==RULE_REF && first.getText().equals(ruleName)) ||
(rref!=null && rref.getType()==RULE_REF && rref.getText().equals(ruleName)) ) (rref!=null && rref.getType()==RULE_REF && rref.getText().equals(ruleName)) )
{ {
if ( first.getType()==ASSIGN ) lrlabel = (GrammarAST)first.getChild(0); if ( first.getType()==ASSIGN ) lrlabel = (GrammarAST)first.getChild(0);
// remove rule ref (first child) // remove rule ref (first child unless options present)
altAST.deleteChild(0); altAST.deleteChild(leftRecurRuleIndex);
// reset index so it prints properly // reset index so it prints properly (sets token range of
GrammarAST newFirstChild = (GrammarAST)altAST.getChild(0); // ALT to start to right of left recur rule we deleted)
GrammarAST newFirstChild = (GrammarAST)altAST.getChild(leftRecurRuleIndex);
altAST.setTokenStartIndex(newFirstChild.getTokenStartIndex()); altAST.setTokenStartIndex(newFirstChild.getTokenStartIndex());
} }
return lrlabel; return lrlabel;
@ -385,10 +357,11 @@ public class LeftRecursiveRuleAnalyzer extends LeftRecursiveRuleWalker {
return numAlts-alt+1; return numAlts-alt+1;
} }
// Assumes left assoc
public int nextPrecedence(int alt) { public int nextPrecedence(int alt) {
int p = precedence(alt); int p = precedence(alt);
if ( altAssociativity.get(alt)==ASSOC.left ) p++; if ( altAssociativity.get(alt)==ASSOC.right ) return p;
return p; return p+1;
} }
@Override @Override

View File

@ -654,8 +654,12 @@ altList
// An individual alt with an optional alt option like <assoc=right> // An individual alt with an optional alt option like <assoc=right>
alternative alternative
@init { paraphrases.push("matching alternative"); } @init { paraphrases.push("matching alternative"); }
@after { paraphrases.pop(); } @after {
: ruleElementOptions? e+=element+ -> ^(ALT<AltAST> ruleElementOptions? $e+) paraphrases.pop();
Grammar.setNodeOptions($tree, $o.tree);
}
: o=ruleElementOptions?
e+=element+ -> ^(ALT<AltAST> ruleElementOptions? $e+)
| -> ^(ALT<AltAST> EPSILON) // empty alt | -> ^(ALT<AltAST> EPSILON) // empty alt
; ;
@ -879,7 +883,8 @@ if ( options!=null ) {
// Terminals may be adorned with certain options when // Terminals may be adorned with certain options when
// reference in the grammar: TOK<,,,> // reference in the grammar: TOK<,,,>
ruleElementOptions ruleElementOptions
: LT (elementOption (COMMA elementOption)*)? GT -> ^(ELEMENT_OPTIONS[$LT,"ELEMENT_OPTIONS"] elementOption*) : LT (elementOption (COMMA elementOption)*)? GT
-> ^(ELEMENT_OPTIONS[$LT,"ELEMENT_OPTIONS"] elementOption*)
; ;
// When used with elements we can specify what the tree node type can // When used with elements we can specify what the tree node type can

View File

@ -49,9 +49,8 @@ private String ruleName;
private int currentOuterAltNumber; // which outer alt of rule? private int currentOuterAltNumber; // which outer alt of rule?
public int numAlts; // how many alts for this rule total? public int numAlts; // how many alts for this rule total?
public void setTokenAssoc(GrammarAST t, int alt) {} public void setAltAssoc(AltAST altTree, int alt) {}
public void binaryAlt(AltAST altTree, int alt) {} public void binaryAlt(AltAST altTree, int alt) {}
public void ternaryAlt(AltAST altTree, int alt) {}
public void prefixAlt(AltAST altTree, int alt) {} public void prefixAlt(AltAST altTree, int alt) {}
public void suffixAlt(AltAST altTree, int alt) {} public void suffixAlt(AltAST altTree, int alt) {}
public void otherAlt(AltAST altTree, int alt) {} public void otherAlt(AltAST altTree, int alt) {}
@ -112,46 +111,36 @@ ruleBlock returns [boolean isLeftRec]
/** An alt is either prefix, suffix, binary, or ternary operation or "other" */ /** An alt is either prefix, suffix, binary, or ternary operation or "other" */
outerAlternative returns [boolean isLeftRec] outerAlternative returns [boolean isLeftRec]
: (binaryMultipleOp)=> binaryMultipleOp : (binary)=> binary
{binaryAlt((AltAST)$start, currentOuterAltNumber); $isLeftRec=true;} {binaryAlt((AltAST)$start, currentOuterAltNumber); $isLeftRec=true;}
| (binary)=> binary
{binaryAlt((AltAST)$start, currentOuterAltNumber); $isLeftRec=true;}
| (ternary)=> ternary
{ternaryAlt((AltAST)$start, currentOuterAltNumber); $isLeftRec=true;}
| (prefix)=> prefix | (prefix)=> prefix
{prefixAlt((AltAST)$start, currentOuterAltNumber);} {prefixAlt((AltAST)$start, currentOuterAltNumber);}
| (suffix)=> suffix | (suffix)=> suffix
{suffixAlt((AltAST)$start, currentOuterAltNumber); $isLeftRec=true;} {suffixAlt((AltAST)$start, currentOuterAltNumber); $isLeftRec=true;}
| ^(ALT element+) // "other" case | nonLeftRecur {otherAlt((AltAST)$start, currentOuterAltNumber);}
{otherAlt((AltAST)$start, currentOuterAltNumber);}
;
// (ALT (= a e) (= op (SET '*' '/')) (= b e) {}) (ALT INT {}) (ALT '(' (= x e) ')' {})
binaryMultipleOp
: ^( ALT recurse bops recurse ACTION? )
;
bops: ^(ASSIGN ID bops)
| ^( BLOCK ( ^( ALT (op=token)+ {setTokenAssoc($op.t, currentOuterAltNumber);} ) )+ )
| ^(SET (op=token)+ {setTokenAssoc($op.t, currentOuterAltNumber);})
; ;
binary binary
: ^( ALT recurse (op=token)+ {setTokenAssoc($op.t, currentOuterAltNumber);} recurse ACTION? ) : ^( ALT ruleElementOptions? recurse element+ recurse ACTION? )
; {setAltAssoc((AltAST)$ALT,currentOuterAltNumber);}
ternary
: ^( ALT recurse op=token recurse token recurse ACTION? ) {setTokenAssoc($op.t, currentOuterAltNumber);}
; ;
prefix prefix
: ^( ALT {setTokenAssoc((GrammarAST)input.LT(1), currentOuterAltNumber);} : ^( ALT ruleElementOptions?
({!((CommonTree)input.LT(1)).getText().equals(ruleName)}? element)+ ({!((CommonTree)input.LT(1)).getText().equals(ruleName)}? element)+
recurse ACTION? recurse ACTION?
) )
{setAltAssoc((AltAST)$ALT,currentOuterAltNumber);}
; ;
suffix : ^( ALT recurse {setTokenAssoc((GrammarAST)input.LT(1), currentOuterAltNumber);} element+ ) ; suffix
: ^( ALT ruleElementOptions? recurse element+ )
{setAltAssoc((AltAST)$ALT,currentOuterAltNumber);}
;
nonLeftRecur
: ^(ALT element+) // no assoc for these; ignore if <assoc=...> present
;
recurse recurse
: ^(ASSIGN ID recurseNoLabel) : ^(ASSIGN ID recurseNoLabel)
@ -164,16 +153,16 @@ token returns [GrammarAST t=null]
: ^(ASSIGN ID s=token {$t = $s.t;}) : ^(ASSIGN ID s=token {$t = $s.t;})
| ^(PLUS_ASSIGN ID s=token {$t = $s.t;}) | ^(PLUS_ASSIGN ID s=token {$t = $s.t;})
| b=STRING_LITERAL {$t = $b;} | b=STRING_LITERAL {$t = $b;}
| ^(b=STRING_LITERAL elementOptions) {$t = $b;} | ^(b=STRING_LITERAL ruleElementOptions) {$t = $b;}
| ^(c=TOKEN_REF elementOptions) {$t = $c;} | ^(c=TOKEN_REF ruleElementOptions) {$t = $c;}
| c=TOKEN_REF {$t = $c;} | c=TOKEN_REF {$t = $c;}
; ;
elementOptions ruleElementOptions
: ^(ELEMENT_OPTIONS elementOption*) : ^(ELEMENT_OPTIONS ruleElementOption*)
; ;
elementOption ruleElementOption
: ID : ID
| ^(ASSIGN ID ID) | ^(ASSIGN ID ID)
| ^(ASSIGN ID STRING_LITERAL) | ^(ASSIGN ID STRING_LITERAL)
@ -211,16 +200,16 @@ block
; ;
alternative alternative
: ^(ALT elementOptions? element+) : ^(ALT ruleElementOptions? element+)
; ;
atom atom
: ^(RULE_REF ARG_ACTION?) : ^(RULE_REF ARG_ACTION?)
| ^(STRING_LITERAL elementOptions) | ^(STRING_LITERAL ruleElementOptions)
| STRING_LITERAL | STRING_LITERAL
| ^(TOKEN_REF elementOptions) | ^(TOKEN_REF ruleElementOptions)
| TOKEN_REF | TOKEN_REF
| ^(WILDCARD elementOptions) | ^(WILDCARD ruleElementOptions)
| WILDCARD | WILDCARD
| ^(DOT ID element) | ^(DOT ID element)
; ;

View File

@ -754,6 +754,7 @@ public class Grammar implements AttributeResolver {
* set option assoc=right in TOKEN_REF. * set option assoc=right in TOKEN_REF.
*/ */
public static void setNodeOptions(GrammarAST node, GrammarAST options) { public static void setNodeOptions(GrammarAST node, GrammarAST options) {
if ( options==null ) return;
GrammarASTWithOptions t = (GrammarASTWithOptions)node; GrammarASTWithOptions t = (GrammarASTWithOptions)node;
if ( t.getChildCount()==0 || options.getChildCount()==0 ) return; if ( t.getChildCount()==0 || options.getChildCount()==0 ) return;
for (Object o : options.getChildren()) { for (Object o : options.getChildren()) {

View File

@ -115,6 +115,21 @@ public class GrammarAST extends CommonTree {
return nodes; return nodes;
} }
public List<GrammarAST> getNodesWithTypePreorderDFS(IntervalSet types) {
ArrayList<GrammarAST> nodes = new ArrayList<GrammarAST>();
getNodesWithTypePreorderDFS_(nodes, types);
return nodes;
}
public void getNodesWithTypePreorderDFS_(List<GrammarAST> nodes, IntervalSet types) {
if ( types.contains(this.getType()) ) nodes.add(this);
// walk all children of root.
for (int i= 0; i < getChildCount(); i++) {
GrammarAST child = (GrammarAST)getChild(i);
child.getNodesWithTypePreorderDFS_(nodes, types);
}
}
public AltAST getOutermostAltNode() { public AltAST getOutermostAltNode() {
if ( this instanceof AltAST && parent.parent instanceof RuleAST ) { if ( this instanceof AltAST && parent.parent instanceof RuleAST ) {
return (AltAST)this; return (AltAST)this;

View File

@ -33,7 +33,8 @@ package org.antlr.v4.test;
import org.antlr.v4.tool.ErrorType; import org.antlr.v4.tool.ErrorType;
import org.junit.Test; import org.junit.Test;
import static org.junit.Assert.*; import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertNull;
/** */ /** */
public class TestLeftRecursion extends BaseTest { public class TestLeftRecursion extends BaseTest {
@ -115,8 +116,8 @@ public class TestLeftRecursion extends BaseTest {
"s @after {System.out.println($ctx.toStringTree(this));} : e EOF ;\n" + // must indicate EOF can follow or 'a<EOF>' won't match "s @after {System.out.println($ctx.toStringTree(this));} : e EOF ;\n" + // must indicate EOF can follow or 'a<EOF>' won't match
"e : e '*' e" + "e : e '*' e" +
" | e '+' e" + " | e '+' e" +
" | e '?'<assoc=right> e ':' e" + " |<assoc=right> e '?' e ':' e" +
" | e '='<assoc=right> e" + " |<assoc=right> e '=' e" +
" | ID" + " | ID" +
" ;\n" + " ;\n" +
"ID : 'a'..'z'+ ;\n" + "ID : 'a'..'z'+ ;\n" +
@ -198,23 +199,24 @@ public class TestLeftRecursion extends BaseTest {
" | e 'instanceof' e\n" + " | e 'instanceof' e\n" +
" | e ('==' | '!=') e\n" + " | e ('==' | '!=') e\n" +
" | e '&' e\n" + " | e '&' e\n" +
" | e '^'<assoc=right> e\n" + " |<assoc=right> e '^' e\n" +
" | e '|' e\n" + " | e '|' e\n" +
" | e '&&' e\n" + " | e '&&' e\n" +
" | e '||' e\n" + " | e '||' e\n" +
" | e '?' e ':' e\n" + " | e '?' e ':' e\n" +
" | e ('='<assoc=right>\n" + " |<assoc=right>" +
" |'+='<assoc=right>\n" + " e ('='\n" +
" |'-='<assoc=right>\n" + " |'+='\n" +
" |'*='<assoc=right>\n" + " |'-='\n" +
" |'/='<assoc=right>\n" + " |'*='\n" +
" |'&='<assoc=right>\n" + " |'/='\n" +
" |'|='<assoc=right>\n" + " |'&='\n" +
" |'^='<assoc=right>\n" + " |'|='\n" +
" |'>>='<assoc=right>\n" + " |'^='\n" +
" |'>>>='<assoc=right>\n" + " |'>>='\n" +
" |'<<='<assoc=right>\n" + " |'>>>='\n" +
" |'%='<assoc=right>) e\n" + " |'<<='\n" +
" |'%=') e\n" +
" ;\n" + " ;\n" +
"type: ID \n" + "type: ID \n" +
" | ID '[' ']'\n" + " | ID '[' ']'\n" +
@ -229,6 +231,8 @@ public class TestLeftRecursion extends BaseTest {
"(a|b)&c", "(s (e (e ( (e (e a) | (e b)) )) & (e c)) <EOF>)", "(a|b)&c", "(s (e (e ( (e (e a) | (e b)) )) & (e c)) <EOF>)",
"a > b", "(s (e (e a) > (e b)) <EOF>)", "a > b", "(s (e (e a) > (e b)) <EOF>)",
"a >> b", "(s (e (e a) >> (e b)) <EOF>)", "a >> b", "(s (e (e a) >> (e b)) <EOF>)",
"a=b=c", "(s (e (e a) = (e (e b) = (e c))) <EOF>)",
"a^b^c", "(s (e (e a) ^ (e (e b) ^ (e c))) <EOF>)",
"(T)x", "(s (e ( (type T) ) (e x)) <EOF>)", "(T)x", "(s (e ( (type T) ) (e x)) <EOF>)",
"new A().b", "(s (e (e new (type A) ( )) . b) <EOF>)", "new A().b", "(s (e (e new (type A) ( )) . b) <EOF>)",
"(T)t.f()", "(s (e (e ( (type T) ) (e (e t) . f)) ( )) <EOF>)", "(T)t.f()", "(s (e (e ( (type T) ) (e (e t) . f)) ( )) <EOF>)",