1 package edu.berkeley.sbp.meta;
2 import edu.berkeley.sbp.util.*;
3 import edu.berkeley.sbp.*;
4 import edu.berkeley.sbp.chr.*;
5 import edu.berkeley.sbp.misc.*;
6 import edu.berkeley.sbp.bind.*;
8 import java.lang.annotation.*;
9 import java.lang.reflect.*;
/** The Java classes typically used to represent a parsed grammar AST. */
13 public class MetaGrammarBindings {
15 /** A grammar (a set of nonterminals) */
16 public static class Grammar extends HashMap<String,NonTerminal> {
/**
 * Builds a grammar from an array of nonterminals, storing each one in this
 * map under its own {@code name}. Because the backing store is a map, a
 * nonterminal appearing later in the array replaces an earlier one that
 * has the same name.
 *
 * @param nonterminals the nonterminals to register
 */
public @bind Grammar(NonTerminal[] nonterminals) {
    for (int i = 0; i < nonterminals.length; i++) {
        NonTerminal current = nonterminals[i];
        this.put(current.name, current);
    }
}
19 public String toString() {
21 for(NonTerminal nt : values()) ret += nt + ", ";
26 public abstract static class Un extends El {
27 public Seq[][] sequences;
28 public void build(MetaGrammar.Context cx, Union u) {
29 HashSet<Sequence> bad2 = new HashSet<Sequence>();
30 for(int i=0; i<sequences.length; i++) {
31 Seq[] group = sequences[i];
32 Union u2 = new Union();
33 if (sequences.length==1) u2 = u;
34 for(int j=0; j<group.length; j++) {
35 group[j].build(cx, u2, false);
37 if (sequences.length==1) break;
38 Sequence seq = Sequence.singleton(u2);
39 for(Sequence s : bad2) {
44 bad2.add(Sequence.singleton(u2));
49 public static class NonTerminal extends Un {
51 public String name = null;
52 public String sep = null;
/**
 * Bound constructor: creates a nonterminal with {@code rep} set to
 * {@code false} by delegating to the three-argument constructor.
 *
 * @param name      the nonterminal's name
 * @param sequences the groups of alternative sequences
 */
public @bind NonTerminal(@bind.arg String name,
                         @bind.arg Seq[][] sequences) {
    this(name, sequences, false);
}
/**
 * Creates a nonterminal without a separator by delegating to the
 * four-argument constructor with a {@code null} separator.
 *
 * @param name      the nonterminal's name
 * @param sequences the groups of alternative sequences
 * @param rep       the repetition flag forwarded to the full constructor
 */
public NonTerminal(String name, Seq[][] sequences, boolean rep) {
    this(name, sequences, rep, null);
}
55 public NonTerminal(String name, Seq[][] sequences, boolean rep, String sep) {
57 this.sequences = sequences;
61 public Element build(MetaGrammar.Context cx) { return cx.get(name); }
62 public void build(MetaGrammar.Context cx, Union u) {
63 if (!rep) { super.build(cx, u); return; }
64 HashSet<Sequence> bad2 = new HashSet<Sequence>();
66 Union urep = new Union();
67 urep.add(Sequence.empty);
68 urep.add(Sequence.singleton(new Element[] { cx.get(sep), u }, 1));
70 for(int i=0; i<sequences.length; i++) {
71 Seq[] group = sequences[i];
72 Union u2 = new Union();
73 if (sequences.length==1) u2 = u;
74 for(int j=0; j<group.length; j++) {
75 Union u3 = new Union();
76 group[j].build(cx, u3, false);
77 Sequence s = Sequence.unwrap(new Element[] { u3, urep },
79 new boolean[] { false, false });
82 if (sequences.length==1) break;
83 Sequence seq = Sequence.singleton(u2);
84 for(Sequence s : bad2) {
89 bad2.add(Sequence.singleton(u2));
93 public static @bind.as("=") NonTerminal go(@bind.arg String name, @bind.arg Seq[][] sequences) { return new NonTerminal(name, sequences, true); }
94 public static @bind.as("=") NonTerminal go(@bind.arg String name, @bind.arg String sep, @bind.arg Seq[][] sequences) {
95 return new NonTerminal(name, sequences, true, sep);
98 public static class AnonUn extends Un {
99 public @bind.as("(") AnonUn(Seq[][] sequences) {
100 this.sequences = sequences;
102 public Element build(MetaGrammar.Context cx) {
103 Union ret = new Union();
109 public static class Range {
/**
 * Creates a range containing a single character; both endpoints are set
 * to {@code only}.
 *
 * @param only the sole character in the range
 */
public @bind Range(char only) {
    this(only, only);
}
/**
 * Creates a range with the given endpoints. No ordering check is made on
 * the two characters.
 *
 * @param first stored as the {@code first} endpoint
 * @param last  stored as the {@code last} endpoint
 */
public @bind Range(char first, char last) {
    this.last = last;
    this.first = first;
}
115 public static abstract class El {
116 public String getLabel() { return null; }
117 public String getOwnerTag() { return null; }
118 public boolean drop() { return false; }
/**
 * Produces the {@code Element} corresponding to this grammar node.
 *
 * @param cx the build context
 * @return the element built for this node
 */
public abstract Element build(MetaGrammar.Context cx);
121 public static class Drop extends El {
/**
 * Wraps another element so that it reports itself as dropped.
 *
 * @param e the element being wrapped
 */
public Drop(El e) {
    this.e = e;
}
124 public String getLabel() { return null; }
125 public boolean drop() { return true; }
126 public String getOwnerTag() { return e.getOwnerTag(); }
127 public Element build(MetaGrammar.Context cx) { return e.build(cx); }
129 public static class Label extends El {
/**
 * Attaches a label to another element.
 *
 * @param label the label reported by {@code getLabel()}
 * @param e     the element being labelled
 */
public Label(String label, El e) {
    this.label = label;
    this.e = e;
}
133 public String getLabel() { return label; }
134 public String getOwnerTag() { return e.getOwnerTag(); }
135 public Element build(MetaGrammar.Context cx) { return e.build(cx); }
137 public static /*abstract*/ class Seq {
138 HashSet<Seq> and = new HashSet<Seq>();
139 HashSet<Seq> not = new HashSet<Seq>();
144 public void append(El e) {
145 El[] elements = new El[this.elements.length+1];
146 System.arraycopy(this.elements, 0, elements, 0, this.elements.length);
147 this.elements = elements;
148 elements[elements.length-1] = e;
/**
 * Creates a sequence holding exactly one element.
 *
 * @param e the single element of the sequence
 */
public Seq(El e) {
    this(new El[] { e });
}
/**
 * Creates a sequence over the given elements. The array reference is
 * stored as-is; no copy is taken.
 *
 * @param elements the elements of the sequence, in order
 */
public Seq(El[] elements) {
    this.elements = elements;
}
152 public Seq tag(String tag) { this.tag = tag; return this; }
153 public Seq follow(El follow) { this.follow = follow; return this; }
155 Seq ret = new Seq(elements);
162 public Seq and(Seq s) { and.add(s); s.lame = true; return this; }
163 public Seq andnot(Seq s) { not.add(s); s.lame = true; return this; }
164 public Seq separate(El sep) {
165 El[] elements = new El[this.elements.length * 2 - 1];
166 for(int i=0; i<this.elements.length; i++) {
167 elements[i*2] = this.elements[i];
168 if (i<this.elements.length-1)
169 elements[i*2+1] = new Drop(sep);
171 this.elements = elements;
174 public Sequence build(MetaGrammar.Context cx, Union u, boolean lame) {
175 Sequence ret = build0(cx, lame || this.lame);
176 for(Seq s : and) { Sequence dork = s.build(cx, u, true); ret = ret.and(dork); }
177 for(Seq s : not) { Sequence dork = s.build(cx, u, true); ret = ret.not(dork); }
182 public Sequence build0(MetaGrammar.Context cx, boolean lame) {
183 boolean unwrap = false;
184 boolean dropAll = lame;
185 if (tag!=null && tag.equals("[]")) unwrap = true;
186 if (tag!=null && "()".equals(tag)) dropAll = true;
187 Object[] labels = new Object[elements.length];
188 boolean[] drops = new boolean[elements.length];
189 Element[] els = new Element[elements.length];
190 for(int i=0; i<elements.length; i++) {
191 labels[i] = elements[i].getLabel();
192 drops[i] = elements[i].drop();
193 els[i] = elements[i].build(cx);
194 if (elements[i].getOwnerTag() != null)
195 tag = elements[i].getOwnerTag();
198 if (dropAll) ret = Sequence.drop(els, false);
199 else if (unwrap) ret = Sequence.unwrap(els, cx.rm.repeatTag(), drops);
201 if (tag != null) ret = cx.rm.resolveTag(tag, cx.cnt, els, labels, drops);
202 else ret = cx.rm.tryResolveTag(tag, cx.cnt, els, labels, drops);
205 for(int i=0; i<els.length; i++)
207 if (idx==-1) idx = i;
208 else throw new Error("multiple non-dropped elements in sequence: " + Sequence.drop(els,false));
209 if (idx != -1) ret = Sequence.singleton(els, idx);
210 else ret = Sequence.drop(els, false);
213 if (this.follow != null)
214 ret.follow = infer(this.follow.build(cx));
215 ret.lame = this.lame;
219 public static @bind.as("&") Seq and2(Seq s, Seq a) { return s.and(a); }
220 public static @bind.as("&~") Seq andnot2(Seq s, Seq a) { return s.andnot(a); }
221 public static @bind.as("->") Seq arrow(Seq s, El e) { return s.follow(e); }
222 public static @bind.as("::") Seq tag(String tagname, Seq s) { return s.tag(tagname); }
223 public static @bind.as("/") Seq slash(Seq s, El e) { return s.separate(e); }
225 public static Seq seq(El[] elements) { return new Seq(elements); }
226 public static @bind.as("Elements") Seq seq2(El[] elements) { return new Seq(elements); }
227 public static @bind.as Seq psx(Seq s) { return s; }
228 public static @bind.as(":") El colon(String s, El e) { return new Label(s, e); }
229 public static @bind.as(")") void close(String foo) { throw new Error("not supported"); }
230 public static @bind.as("()") El epsilon() { return new Constant(Union.epsilon); }
232 public static @bind class NonTerminalReference extends El {
233 public @bind.arg String nonTerminal;
234 public Element build(MetaGrammar.Context cx) { return cx.get(nonTerminal); }
237 public static class Literal extends Constant {
/**
 * Creates a literal whose constant element is
 * {@code CharRange.string(string)}.
 *
 * @param string the literal text
 */
public @bind Literal(@bind.arg String string) {
    super(CharRange.string(string));
}
239 public boolean drop() { return true; }
242 public static class CharClass extends El {
/**
 * Binding for "[": creates a character class from the given ranges. The
 * array reference is stored as-is; no copy is taken.
 *
 * @param ranges the ranges making up the class
 */
public @bind.as("[") CharClass(Range[] ranges) {
    this.ranges = ranges;
}
245 public Element build(MetaGrammar.Context cx) {
246 edu.berkeley.sbp.util.Range.Set set = new edu.berkeley.sbp.util.Range.Set();
247 for(Range r : ranges)
248 set.add(r.first, r.last);
249 return CharRange.set(set);
253 public static @bind.as("{") class XTree extends El {
254 public @bind.arg Seq body;
255 public Element build(MetaGrammar.Context cx) {
256 Union u = new Union();
257 Sequence s = body.build(cx, u, false);
258 Union u2 = new Union();
259 u2.add(Sequence.singleton(new Element[] {
270 public static class Rep extends El {
272 public boolean zero, many, max;
/**
 * Creates a repetition node; every argument is stored in the field of
 * the same name.
 *
 * @param e    the repeated element
 * @param sep  the separator element, or {@code null} for none
 * @param zero stored in {@code zero}
 * @param many stored in {@code many}
 * @param max  stored in {@code max}
 */
public Rep(El e, El sep, boolean zero, boolean many, boolean max) {
    this.e = e;
    this.sep = sep;
    this.zero = zero;
    this.many = many;
    this.max = max;
}
275 public Element build(MetaGrammar.Context cx) {
277 ? Sequence.repeat(e.build(cx), zero, many, sep==null ? null : sep.build(cx), cx.rm.repeatTag())
279 ? Sequence.repeatMaximal(infer(e.build(cx)), zero, many, cx.rm.repeatTag())
280 : Sequence.repeatMaximal(e.build(cx), zero, many, infer(sep.build(cx)), cx.rm.repeatTag());
283 public static class Constant extends El {
/**
 * Wraps an already-built element.
 *
 * @param constant the element that {@code build} will return
 */
public Constant(Element constant) {
    this.constant = constant;
}
286 public Element build(MetaGrammar.Context cx) { return constant; }
288 public abstract static class PostProcess extends El {
/**
 * Wraps an element whose built form will be passed through
 * {@code postProcess}.
 *
 * @param e the element being wrapped
 */
public PostProcess(El e) {
    this.e = e;
}
291 public Element build(MetaGrammar.Context cx) { return postProcess(e.build(cx)); }
/**
 * Transforms the element produced by building the wrapped {@code El};
 * {@code build} returns whatever this method returns.
 *
 * @param e the element built from the wrapped {@code El}
 * @return the element to use in its place
 */
public abstract Element postProcess(Element e);
295 // FIXME: it would be nice if we could hoist this into "Rep"
296 public static @bind.as("++") El plusmax(final El e) { return new Rep(e, null, false, true, true); }
297 public static @bind.as("+") El plus(final El e) { return new Rep(e, null, false, true, false); }
298 public static @bind.as("++/") El plusmaxfollow(final El e, final El sep) { return new Rep(e, sep, false, true, true); }
299 public static @bind.as("+/") El plusfollow(final El e, final El sep) { return new Rep(e, sep, false, true, false); }
300 public static @bind.as("**") El starmax(final El e) { return new Rep(e, null, true, true, true); }
301 public static @bind.as("*") El star(final El e) { return new Rep(e, null, true, true, false); }
302 public static @bind.as("**/") El starmaxfollow(final El e, final El sep) { return new Rep(e, sep, true, true, true); }
303 public static @bind.as("*/") El starfollow(final El e, final El sep) { return new Rep(e, sep, true, true, false); }
304 public static @bind.as("?") El question(final El e) { return new Rep(e, null, true, true, false); }
306 public static @bind.as("!") El bang(final El e) { return new Drop(e); }
308 public static @bind.as("^") El caret(final String s) {
309 return new Drop(new Constant(CharRange.string(s)) {
310 public String getOwnerTag() { return s; }
314 public static @bind.as("~") El tilde(final El e) {
315 return new PostProcess(e) {
316 public Element postProcess(Element e) {
317 return infer((Topology<Character>)Atom.toAtom(e).complement());
320 public static @bind.as("^^") void doublecaret(final El e) { throw new Error("not implemented"); }
322 //public static @bind.as("(") El subexpression(Seq[][] rhs) { return new NonTerminal(rhs); }
324 public static @bind.as("Word") String word(String s) { return s; }
325 public static @bind.as("Quoted") String quoted(String s) { return s; }
326 public static @bind.as("escaped") String c(char c) { return c+""; }
327 public static @bind.as("EmptyString") String emptystring() { return ""; }
328 public static @bind.as("\n") String retur() { return "\n"; }
329 public static @bind.as("\r") String lf() { return "\r"; }
331 static Atom infer(Element e) { return infer((Topology<Character>)Atom.toAtom(e)); }
332 static Atom infer(Topology<Character> t) { return new CharRange(new CharTopology(t)); }