X-Git-Url: http://git.megacz.com/?p=sbp.git;a=blobdiff_plain;f=src%2Fedu%2Fberkeley%2Fsbp%2FParser.java;h=e8e0dc8e641a5c5ffc52d30de57a8712c6dc3847;hp=6986a4b900de9f22a9fe3416159d17eac25d684d;hb=fd97655ce34c3aff1a47bfb2f45775ac711923b1;hpb=6caa23ec64fa689a91c0b81238d04ff7322a945c diff --git a/src/edu/berkeley/sbp/Parser.java b/src/edu/berkeley/sbp/Parser.java index 6986a4b..e8e0dc8 100644 --- a/src/edu/berkeley/sbp/Parser.java +++ b/src/edu/berkeley/sbp/Parser.java @@ -9,20 +9,30 @@ import java.util.*; import java.lang.reflect.*; /** a parser which translates streams of Tokens of type T into a Forest */ -public class Parser { +public abstract class Parser { private final Table pt; - //public Parser( Topology top) { this(new Table( top)); } - //public Parser(String s, Topology top) { this(new Table(s, top)); } + private static void reachable(Element e, HashSet h) { + if (e instanceof Atom) return; + for(Sequence s : ((Union)e)) + reachable(s.firstp(), h); + } + private static void reachable(Position p, HashSet h) { + if (h.contains(p)) return; + h.add(p); + if (p.element() != null) reachable(p.element(), h); + } /** * create a parser to parse the grammar with start symbol u - * @param top a "sample" Topology that can be cloned (FIXME, demanding this is lame) */ - public Parser(Union u, Topology top) { this(new Table(u, top)); } + protected Parser(Union u) { this.pt = new Table(u, top()); } + protected Parser(Table pt) { this.pt = pt; } + + public abstract Forest shiftedToken(T t, Token.Location loc); + public abstract Topology top(); - Parser(Table pt) { this.pt = pt; } /** parse input for a exactly one unique result, throwing Ambiguous if not unique or Failed if none */ public Tree parse1(Token.Stream input) throws IOException, Failed, Ambiguous { return parse(input).expand1(); } @@ -30,12 +40,15 @@ public class Parser { /** parse input, using the table pt to drive the parser */ public Forest parse(Token.Stream input) throws IOException, Failed { GSS gss = new GSS(); - GSS.Phase current = gss.new Phase(null, input.next()); + Token.Location loc = input.getLocation(); + GSS.Phase current = gss.new Phase(null, input.next(), loc); current.newNode(null, null, pt.start, true, null); for(;;) { - GSS.Phase next = gss.new Phase(current, input.next()); + loc = input.getLocation(); + GSS.Phase next = gss.new Phase(current, input.next(), loc); current.reduce(); - current.shift(next); + Forest forest = current.token==null ? null : shiftedToken((T)current.token, loc); + current.shift(next, forest); if (current.isDone()) return (Forest)current.finalResult; current.checkFailure(); current = next; @@ -51,7 +64,7 @@ public class Parser { public Failed() { this("", null); } public Failed(String message, Token.Location loc) { this.location = loc; this.message = message; } public Token.Location getLocation() { return location; } - public String toString() { return message + (location==null ? "" : (" at " + location + "\n" + location.getContext())); } + public String toString() { return message + (location==null ? "" : (" at " + location)); } } public static class Ambiguous extends RuntimeException { @@ -69,18 +82,19 @@ public class Parser { // Table ////////////////////////////////////////////////////////////////////////////// + static class Top extends Union { public Top() { super("0"); } } + /** an SLR(1) parse table which may contain conflicts */ static class Table { private final Union start0 = new Top(); private final Sequence start0seq; - static class Top extends Union { public Top() { super("0"); } } public final Walk.Cache cache = new Walk.Cache(); public HashSet closure() { HashSet hp = new HashSet(); - start0.reachable(hp); + reachable(start0, hp); return hp; } public Position firstPosition() { return start0seq.firstp(); } @@ -144,7 +158,7 @@ public class Parser { // FIXME: how does right-nullability interact with follow restrictions? // all right-nullable rules get a reduction [Johnstone 2000] if (p.isRightNullable(cache)) { - Walk.Follow wf = new Walk.Follow(top.fresh(), p.owner(), all_elements, cache); + Walk.Follow wf = new Walk.Follow(top.empty(), p.owner(), all_elements, cache); Reduction red = new Reduction(p); state.reductions.put(wf.walk(p.owner()), red); if (wf.includesEof()) state.eofReductions.add(red, true); @@ -153,7 +167,7 @@ public class Parser { // if the element following this position is an atom, copy the corresponding // set of rows out of the "master" goto table and into this state's shift table if (p.element() != null && p.element() instanceof Atom) - state.shifts.addAll(state.gotoSetTerminals.subset(((Atom)p.element()).dup())); + state.shifts.addAll(state.gotoSetTerminals.subset(((Atom)p.element()))); } } @@ -223,8 +237,8 @@ public class Parser { if (position.isLast() || !(position.element() instanceof Atom)) continue; Atom a = (Atom)position.element(); HashSet hp = new HashSet(); - position.next().reachable(hp); - bag0.addAll(a.dup(), /*clo.walk()*/hp); + reachable(position.next(), hp); + bag0.addAll(a, /*clo.walk()*/hp); } // Step 1b: for each _minimal, contiguous_ set of characters having an identical next-position @@ -262,7 +276,7 @@ public class Parser { if (ys != null) { for(Element y : ys) { HashSet hp = new HashSet(); - p.next().reachable(hp); + reachable(p.next(), hp); move.addAll(y, hp); } }