1 package edu.berkeley.sbp.meta;
2 import edu.berkeley.sbp.util.*;
3 import edu.berkeley.sbp.*;
4 import edu.berkeley.sbp.chr.*;
5 import edu.berkeley.sbp.misc.*;
6 import edu.berkeley.sbp.bind.*;
8 import java.lang.annotation.*;
9 import java.lang.reflect.*;
/** The Java classes typically used to represent a parsed grammar AST. */
13 public class MetaGrammarBindings {
15 /** A grammar (a set of nonterminals) */
16 public static class Grammar extends HashMap<String,NonTerminal> {
/**
 * Builds the grammar by storing each nonterminal in this map under its own name.
 * A later entry replaces an earlier one that has the same name (ordinary map put).
 */
public @bind Grammar(NonTerminal[] nonterminals) {
    for (int i = 0; i < nonterminals.length; i++) {
        NonTerminal current = nonterminals[i];
        this.put(current.name, current);
    }
}
19 public String toString() {
21 for(NonTerminal nt : values()) ret += nt + ", ";
26 public abstract static class Un extends El {
27 public Seq[][] sequences;
28 public void build(MetaGrammar.Context cx, Union u) {
29 HashSet<Sequence> bad2 = new HashSet<Sequence>();
30 for(int i=0; i<sequences.length; i++) {
31 Seq[] group = sequences[i];
32 Union u2 = new Union();
33 if (sequences.length==1) u2 = u;
34 for(int j=0; j<group.length; j++) {
35 group[j].build(cx, u2, false);
37 if (sequences.length==1) break;
38 Sequence seq = Sequence.singleton(u2);
39 for(Sequence s : bad2) {
44 bad2.add(Sequence.singleton(u2));
49 public static class NonTerminal extends Un {
51 public String name = null;
/** Bound constructor: delegates to the three-argument constructor, passing {@code false} for {@code rep}. */
public @bind NonTerminal(@bind.arg String name, @bind.arg Seq[][] sequences) {
    this(name, sequences, false);
}
53 public NonTerminal(String name, Seq[][] sequences, boolean rep) {
55 this.sequences = sequences;
58 public Element build(MetaGrammar.Context cx) { return cx.get(name); }
60 public static @bind.as("=") NonTerminal go(@bind.arg String name, @bind.arg Seq[][] sequences) { return new NonTerminal(name, sequences, true); }
62 public static class AnonUn extends Un {
63 public @bind.as("(") AnonUn(Seq[][] sequences) {
64 this.sequences = sequences;
66 public Element build(MetaGrammar.Context cx) {
67 Union ret = new Union();
73 public static class Range {
/** Single-character range: both endpoints are set to {@code only}. */
public @bind Range(char only) {
    this.first = only;
    this.last = only;
}
/** Range with explicit endpoints; both are stored exactly as given (no ordering check happens here). */
public @bind Range(char first, char last) {
    this.last = last;
    this.first = first;
}
79 public static abstract class El {
80 public String getLabel() { return null; }
81 public String getOwnerTag() { return null; }
82 public boolean drop() { return false; }
/** Produces the {@code Element} for this node using the supplied context; each concrete subclass provides the implementation. */
public abstract Element build(MetaGrammar.Context cx);
85 public static class Drop extends El {
/** Wraps {@code e}; the wrapper reports {@code drop() == true} while delegating tag and build to {@code e}. */
public Drop(El e) {
    this.e = e;
}
88 public String getLabel() { return null; }
89 public boolean drop() { return true; }
90 public String getOwnerTag() { return e.getOwnerTag(); }
91 public Element build(MetaGrammar.Context cx) { return e.build(cx); }
93 public static class Label extends El {
/** Attaches {@code label} to the element {@code e}. */
public Label(String label, El e) {
    this.label = label;
    this.e = e;
}
97 public String getLabel() { return label; }
98 public String getOwnerTag() { return e.getOwnerTag(); }
99 public Element build(MetaGrammar.Context cx) { return e.build(cx); }
101 public static /*abstract*/ class Seq {
102 HashSet<Seq> and = new HashSet<Seq>();
103 HashSet<Seq> not = new HashSet<Seq>();
/** Convenience constructor: a sequence consisting of the single element {@code e}. */
public Seq(El e) {
    this(new El[] { e });
}
/** Creates a sequence over {@code elements}; the array reference is stored as-is (not copied). */
public Seq(El[] elements) {
    this.elements = elements;
}
110 public Seq tag(String tag) { this.tag = tag; return this; }
111 public Seq follow(El follow) { this.follow = follow; return this; }
113 Seq ret = new Seq(elements);
120 public Seq and(Seq s) { and.add(s); s.lame = true; return this; }
121 public Seq andnot(Seq s) { not.add(s); s.lame = true; return this; }
122 public Seq separate(El sep) {
123 El[] elements = new El[this.elements.length * 2 - 1];
124 for(int i=0; i<this.elements.length; i++) {
125 elements[i*2] = this.elements[i];
126 if (i<this.elements.length-1)
127 elements[i*2+1] = new Drop(sep);
129 this.elements = elements;
132 public Sequence build(MetaGrammar.Context cx, Union u, boolean lame) {
133 Sequence ret = build0(cx, lame || this.lame);
134 for(Seq s : and) { Sequence dork = s.build(cx, u, true); ret = ret.and(dork); }
135 for(Seq s : not) { Sequence dork = s.build(cx, u, true); ret = ret.not(dork); }
140 public Sequence build0(MetaGrammar.Context cx, boolean lame) {
141 boolean unwrap = false;
142 boolean dropAll = lame;
143 if (tag!=null && tag.equals("[]")) unwrap = true;
144 if (tag!=null && "()".equals(tag)) dropAll = true;
145 Object[] labels = new Object[elements.length];
146 boolean[] drops = new boolean[elements.length];
147 Element[] els = new Element[elements.length];
148 for(int i=0; i<elements.length; i++) {
149 labels[i] = elements[i].getLabel();
150 drops[i] = elements[i].drop();
151 els[i] = elements[i].build(cx);
152 if (elements[i].getOwnerTag() != null)
153 tag = elements[i].getOwnerTag();
156 if (dropAll) ret = Sequence.drop(els, false);
157 else if (unwrap) ret = Sequence.unwrap(els, cx.rm.repeatTag(), drops);
158 else if (tag!=null) {
159 ret = cx.rm.resolveTag(tag, cx.cnt, els, labels, drops);
161 ret = cx.rm.tryResolveTag(tag, cx.cnt, els, labels, drops);
164 for(int i=0; i<els.length; i++)
166 if (idx==-1) idx = i;
167 else throw new Error("multiple non-dropped elements in sequence: " + Sequence.drop(els,false));
168 if (idx != -1) ret = Sequence.singleton(els, idx);
169 else ret = Sequence.drop(els, false);
172 if (this.follow != null)
173 ret.follow = infer(this.follow.build(cx));
174 ret.lame = this.lame;
178 public static @bind.as("&") Seq and2(Seq s, Seq a) { return s.and(a); }
179 public static @bind.as("&~") Seq andnot2(Seq s, Seq a) { return s.andnot(a); }
180 public static @bind.as("->") Seq arrow(Seq s, El e) { return s.follow(e); }
181 public static @bind.as("::") Seq tag(String tagname, Seq s) { return s.tag(tagname); }
182 public static @bind.as("/") Seq slash(Seq s, El e) { return s.separate(e); }
184 public static Seq seq(El[] elements) { return new Seq(elements); }
185 public static @bind.as("Elements") Seq seq2(El[] elements) { return new Seq(elements); }
186 public static @bind.as Seq psx(Seq s) { return s; }
187 public static @bind.as(":") El colon(String s, El e) { return new Label(s, e); }
188 public static @bind.as(")") void close(String foo) { throw new Error("not supported"); }
189 public static @bind.as("()") El epsilon() { return new Constant(Union.epsilon); }
191 public static @bind class NonTerminalReference extends El {
192 public @bind.arg String nonTerminal;
193 public Element build(MetaGrammar.Context cx) { return cx.get(nonTerminal); }
196 public static class Literal extends Constant {
/** A literal is a constant whose element is {@code CharRange.string(string)}. */
public @bind Literal(@bind.arg String string) {
    super(CharRange.string(string));
}
198 public boolean drop() { return true; }
201 public static class CharClass extends El {
/** Binding for {@code "["}: a character class over {@code ranges}; the array reference is stored as-is. */
public @bind.as("[") CharClass(Range[] ranges) {
    this.ranges = ranges;
}
204 public Element build(MetaGrammar.Context cx) {
205 edu.berkeley.sbp.util.Range.Set set = new edu.berkeley.sbp.util.Range.Set();
206 for(Range r : ranges)
207 set.add(r.first, r.last);
208 return CharRange.set(set);
212 public static @bind.as("{") class XTree extends El {
213 public @bind.arg Seq body;
214 public Element build(MetaGrammar.Context cx) {
219 public static class Rep extends El {
221 public boolean zero, many, max;
/**
 * Stores the repeated element, its separator ({@code null} when there is none),
 * and the {@code zero} / {@code many} / {@code max} flags that {@code build} later
 * passes on to the {@code Sequence.repeat*} factories.
 */
public Rep(El e, El sep, boolean zero, boolean many, boolean max) {
    this.e = e;
    this.sep = sep;
    this.zero = zero;
    this.many = many;
    this.max = max;
}
224 public Element build(MetaGrammar.Context cx) {
226 ? Sequence.repeat(e.build(cx), zero, many, sep==null ? null : sep.build(cx), cx.rm.repeatTag())
228 ? Sequence.repeatMaximal(infer(e.build(cx)), zero, many, cx.rm.repeatTag())
229 : Sequence.repeatMaximal(e.build(cx), zero, many, infer(sep.build(cx)), cx.rm.repeatTag());
232 public static class Constant extends El {
/** Wraps an already-built {@code Element} so it can appear where an {@code El} is expected. */
public Constant(Element constant) {
    this.constant = constant;
}
235 public Element build(MetaGrammar.Context cx) { return constant; }
237 public abstract static class PostProcess extends El {
/** Remembers the element whose built form will be handed to {@code postProcess}. */
public PostProcess(El e) {
    this.e = e;
}
240 public Element build(MetaGrammar.Context cx) { return postProcess(e.build(cx)); }
/** Transforms the element built from the wrapped {@code El}; the result becomes the return value of {@code build}. */
public abstract Element postProcess(Element e);
244 // FIXME: it would be nice if we could hoist this into "Rep"
245 public static @bind.as("++") El plusmax(final El e) { return new Rep(e, null, false, true, true); }
246 public static @bind.as("+") El plus(final El e) { return new Rep(e, null, false, true, false); }
247 public static @bind.as("++/") El plusmaxfollow(final El e, final El sep) { return new Rep(e, sep, false, true, true); }
248 public static @bind.as("+/") El plusfollow(final El e, final El sep) { return new Rep(e, sep, false, true, false); }
249 public static @bind.as("**") El starmax(final El e) { return new Rep(e, null, true, true, true); }
250 public static @bind.as("*") El star(final El e) { return new Rep(e, null, true, true, false); }
251 public static @bind.as("**/") El starmaxfollow(final El e, final El sep) { return new Rep(e, sep, true, true, true); }
252 public static @bind.as("*/") El starfollow(final El e, final El sep) { return new Rep(e, sep, true, true, false); }
253 public static @bind.as("?") El question(final El e) { return new Rep(e, null, true, true, false); }
255 public static @bind.as("!") El bang(final El e) { return new Drop(e); }
257 public static @bind.as("^") El caret(final String s) {
258 return new Drop(new Constant(CharRange.string(s)) {
259 public String getOwnerTag() { return s; }
263 public static @bind.as("~") El tilde(final El e) {
264 return new PostProcess(e) {
265 public Element postProcess(Element e) {
266 return infer((Topology<Character>)Atom.toAtom(e).complement());
269 public static @bind.as("^^") void doublecaret(final El e) { throw new Error("not implemented"); }
271 //public static @bind.as("(") El subexpression(Seq[][] rhs) { return new NonTerminal(rhs); }
273 public static @bind.as("Word") String word(String s) { return s; }
274 public static @bind.as("Quoted") String quoted(String s) { return s; }
275 public static @bind.as("escaped") String c(char c) { return c+""; }
276 public static @bind.as("EmptyString") String emptystring() { return ""; }
277 public static @bind.as("\n") String retur() { return "\n"; }
278 public static @bind.as("\r") String lf() { return "\r"; }
280 static Atom infer(Element e) { return infer((Topology<Character>)Atom.toAtom(e)); }
281 static Atom infer(Topology<Character> t) { return new CharRange(new CharTopology(t)); }