X-Git-Url: http://git.megacz.com/?p=sbp.git;a=blobdiff_plain;f=src%2Fedu%2Fberkeley%2Fsbp%2FGSS.java;h=816c0860364e43c5c2f78b32ee53cd835826521e;hp=1adb8e445ee2dfb192f5a242b0a619bac940383e;hb=ae0cef03f2e46f6ae6438f9a3e60ca36ff1a4643;hpb=526da96dd06e152d194ec92c9ef9df6085a1251b diff --git a/src/edu/berkeley/sbp/GSS.java b/src/edu/berkeley/sbp/GSS.java index 1adb8e4..816c086 100644 --- a/src/edu/berkeley/sbp/GSS.java +++ b/src/edu/berkeley/sbp/GSS.java @@ -1,9 +1,8 @@ package edu.berkeley.sbp; import edu.berkeley.sbp.*; import edu.berkeley.sbp.util.*; +import edu.berkeley.sbp.Parser.Table.*; import edu.berkeley.sbp.Sequence.Position; -import edu.berkeley.sbp.Parser.Table.State; -import edu.berkeley.sbp.Parser.Table.Reduction; import java.io.*; import java.util.*; import java.lang.reflect.*; @@ -11,154 +10,85 @@ import java.lang.reflect.*; /** implements Tomita's Graph Structured Stack */ class GSS { + static int count = 0; + static int shifts = 0; + static int reductions = 0; + int resets = 0; + int waits = 0; + public GSS() { } private Phase.Node[] reducing_list = null; - public int resets = 0; - public int waits = 0; - - HashMapBag inhibited = new HashMapBag(); - HashMapBag assumed = new HashMapBag(); - HashMapBag waiting = new HashMapBag(); - HashMapBag performed = new HashMapBag(); - HashSet tail = new HashSet(); + + // FIXME: right now, these are the performance bottleneck + HashMapBag waiting = new HashMapBag(); + HashMapBag performed = new HashMapBag(); + HashMapBag lastperformed = new HashMapBag(); + HashMapBag expected = new HashMapBag(); + /** FIXME */ + Forest.Many finalResult; + /** corresponds to a positions between tokens the input stream; same as Tomita's U_i's */ - public class Phase implements Invokable { + class Phase implements Invokable.Node>, IntegerMappable, GraphViz.ToGraphViz, Iterable { - /** the token immediately after this phase */ - public final Token token; + public Iterator iterator() { return hash.iterator(); } + public void invoke(State st, Forest result, Node n) { + shifts++; + good |= next.newNode(n, result, st, false); + } - boolean reducing; + /** the token immediately after this phase */ + final Tok token; - /** currently this is necessary only for the code() hack -- it doesn't actually correspond to the input */ private final int pos; - /** FIXME */ - public Forest.Ref finalResult; - - /** all nodes, keyed by the value returned by code() */ - /*private*/ HashMap hash; /* ALLOC */ - - /** the number of nodes in this phase */ - private int numNodes; - - boolean closed; - + boolean reducing; + private IntPairMap hash; /* ALLOC */ + private boolean closed; private boolean good; private Phase next = null; - - private Token.Location location; + private Phase prev; + private Input.Location location; public final Parser parser; private Forest forest; - Phase prev; - public Phase(Phase prev, Parser parser, Phase previous, Token token, Token.Location location, Forest forest) { + + public Phase(Phase prev, Parser parser, Phase previous, Tok token, Input.Location location, Forest forest) throws ParseFailed { this.prev = prev; this.forest = forest; this.parser = parser; this.pos = previous==null ? 0 : previous.pos+1; this.token = token; this.location = location; - inhibited.clear(); - assumed.clear(); + performed.clear(); reset(); } - public void reset() { - tail.clear(); + public void reset() throws ParseFailed { waiting.clear(); + expected.clear(); + lastperformed.clear(); + lastperformed.addAll(performed); performed.clear(); - hash = new HashMap(); + hash = new IntPairMap(); + reset = false; good = false; closed = false; - numNodes = 0; reducing = false; finalResult = null; if (prev != null) prev.shift(this, forest); } - public void complain(Node n, HashMap> errors, boolean force) { - if (n.touched) return; - n.touched = true; - for(Position p : n.state) { - //if (!p.isLast()) { - if (((p.isFirst() || p.isLast()) && !force) || p.owner().name==null) { - for(Node n2 : n.parents()) - complain(n2, errors, force | p.isFirst()); - } else { - String seqname = p.owner().name; - HashSet hs = errors.get(seqname); - if (hs==null) errors.put(seqname, hs = new HashSet()); - hs.add(p.element()+""); - //String s = " while parsing " + seqname + ": expected a " + p.element(); - //"\n"; - /* - s += " parsed: "; - for(Position p2 = p.owner().firstp(); p2 != null && p2 != p && !p2.isLast(); p2 = p2.next()) s += (p2.element() + " "); - s += "\n"; - s += " expected: "; - for(Position p2 = p; p2 != null && !p2.isLast(); p2 = p2.next()) s += (p2.element() + " "); - */ - //s += "\n"; - //errors.add(s); - } - } - } - - public String black(Object o) { return "\033[30m"+o+"\033[0m"; } - public String red(Object o) { return "\033[31m"+o+"\033[0m"; } - public String green(Object o) { return "\033[32m"+o+"\033[0m"; } - public String yellow(Object o) { return "\033[33m"+o+"\033[0m"; } - public String blue(Object o) { return "\033[34m"+o+"\033[0m"; } - public String purple(Object o) { return "\033[35m"+o+"\033[0m"; } - public String cyan(Object o) { return "\033[36m"+o+"\033[0m"; } - public String el(Object e) { - String s = e.toString(); - if (s.length()==0 || s.charAt(0)!='\"' || s.charAt(s.length()-1)!='\"') return yellow(s); - s = s.substring(1); - s = s.substring(0, s.length()-1); - StringBuffer ret = new StringBuffer(); - for(int i=0; i" : token.toString(); - StringBuffer ret = new StringBuffer(); - ret.append("\n "); - ret.append(message); - HashMap> errors = new HashMap>(); - for(Node n : hash.values()) complain(n, errors, false); - for(String s : errors.keySet()) { - ret.append(" while parsing " + yellow(s)); - HashSet hs = errors.get(s); - if (hs.size()==1) ret.append(" expected " + yellow(el(hs.iterator().next())) + "\n"); - else { - ret.append(" expected "); - boolean first = true; - for(String s2 : hs) { - if (!first) ret.append(" or "); - first = false; - ret.append(yellow(el(s2))); - } - ret.append("\n"); - } - } - return ret.toString(); - } - - public boolean isDone() throws Parser.Failed { + + public boolean isDone() throws ParseFailed { if (token != null) return false; if (token==null && finalResult==null) - throw new Parser.Failed(error(red("unexpected end of file\n")), - getLocation()); + throw new ParseFailed(ParseFailed.error(ANSI.red("unexpected end of file\n"), token, hash.values()), getLocation()); return true; } - public Token.Location getLocation() { return location; } + public Input.Location getLocation() { return location; } /** add a new node (merging with existing nodes if possible) * @param parent the parent of the new node @@ -168,35 +98,42 @@ class GSS { * @param start the earliest part of the input contributing to this node (used to make merging decisions) */ public boolean newNode(Node parent, Forest pending, State state, boolean fromEmptyReduction) { - Node p = hash.get(code(state, parent==null?null:parent.phase())); + Node p = hash.get(state, parent==null?null:parent.phase()); if (p != null) return newNode2(p, parent, pending, state, fromEmptyReduction); else return newNode3(parent, pending, state, fromEmptyReduction); } - public void newNode(Node parent, Forest pending, State state, boolean fromEmptyReduction, Reduction reduction) { + public void newNode(Node parent, Forest pending, State state, boolean fromEmptyReduction, Position reduction) { int pos = parent==null?0:parent.phase()==null?0:parent.phase().pos; - Sequence owner = reduction==null ? null : reduction.position.owner(); + Sequence owner = reduction==null ? null : reduction.owner(); if (reduction!=null) { - if (inhibited.contains(pos, owner)) return; - /* - if (assumed.contains(pos, owner)) { - tail.add(new Waiting(parent, pending, state, fromEmptyReduction, reduction)); - return; + if (owner.hates!=null) { + for (Sequence s : performed.getAll(pos)) + if (owner.hates.contains(s)) + return; + for (Sequence s : lastperformed.getAll(pos)) + if (owner.hates.contains(s)) { + //System.out.println("now expecting ["+pos+"] => " + s); + expected.add(pos, s); + return; + } } - */ if (owner.needs != null) for(Sequence s : owner.needs) if (!performed.contains(pos, s)) { waiting.add(s, new Waiting(parent, pending, state, fromEmptyReduction, reduction)); return; } - if ((owner.needed != null && owner.needed.size()>0) || - (owner.hated != null && owner.hated.size()>0) || - (owner.hates != null && owner.hates.size()>0)) + if (!performed.contains(pos, owner)) { performed.add(pos, owner); + if (owner.hated != null) + for(Sequence seq : owner.hated) + if (performed.contains(pos, seq)) { + performed.remove(pos, seq); + reset = true; + } + } } - if (!owner.lame) - newNode(parent, pending, state, fromEmptyReduction); - if (reduction!=null) inhibit(reduction, parent==null?0:parent.phase().pos); + newNode(parent, pending, state, fromEmptyReduction); if (reduction != null) { boolean redo = true; while(redo) { @@ -212,126 +149,113 @@ class GSS { } } } + private boolean newNode2(Node p, Node parent, Forest pending, State state, boolean fromEmptyReduction) { - p.holder.merge(pending); - if (p.parents().contains(parent)) return true; + if (p.merge(parent, pending)) return true; p.parents().add(parent, true); - if (p!=parent && !fromEmptyReduction) p.queueReductions(parent); + if (p!=parent && !fromEmptyReduction && reducing) p.performReductions(parent); return true; } + private boolean newNode3(Node parent, Forest pending, State state, boolean fromEmptyReduction) { do { if (token != null && state.canShift(token)) break; if (state.isAccepting()) break; if (token==null) break; - //if (!state.canReduce(token)) return false; + if (!state.canReduce(token)) return false; //if (count > 1) break; //if (r.numPop == 0) break; //r.reduce(pending, parent, null, Phase.this, null); //return; } while(false); - Node n = new Node(parent, pending, state, fromEmptyReduction); // ALLOC - n.queueEmptyReductions(); - if (!fromEmptyReduction) n.queueReductions(parent); + Node n = new Node(parent, pending, state); // ALLOC + if (reducing) { + n.performEmptyReductions(); + if (!fromEmptyReduction) n.performReductions(parent); + } return true; } - public void uninhibit(int p, Sequence s) { - if (s.hated!=null) - for(Sequence s2 : s.hated) - inhibited.remove(p, s2); - } - - public void inhibit(Reduction r, int p) { - if (r.position.owner().hated == null) return; - // remember that dead states are still allowed to shift -- just not allowed to reduce - boolean reset = false; - for(Sequence seq : r.position.owner().hated) { - if (performed.contains(p,seq)) { - uninhibit(p, seq); - //System.out.println("\nresetting due to " + r.position.owner() + " killing " + seq); - //inhibited.clear(); - inhibited.add(p, seq); - //assumed = inhibited; - //inhibited = new HashMapBag(); - reset = true; - resets++; - throw new Reset(); - } - inhibited.add(p, seq); - } - } - /** perform all reduction operations */ - public void reduce() { + public void reduce() throws ParseFailed { try { reducing = true; if (reducing_list==null || reducing_list.length < hash.size()) reducing_list = new Phase.Node[hash.size() * 4]; - Collection hv = hash.values(); - hv.toArray(reducing_list); - int num = hv.size(); + hash.toArray(reducing_list); + int num = hash.size(); for(int i=0; inext */ - public void shift(Phase next, Forest result) throws Parser.Failed { - if (prev!=null) prev.hash = null; + public void shift(Phase next, Forest result) throws ParseFailed { + // this massively improves GC performance + if (prev!=null && parser.helpgc) { + prev.hash = null; + } this.next = next; closed = true; Forest res = null; boolean ok = false; for(Phase.Node n : hash.values()) { - //if (n.holder().empty() && pos>0) continue; if (token == null && n.state.isAccepting()) { - if (finalResult==null) finalResult = new Forest.Ref(); - finalResult.merge(n.holder); + if (finalResult==null) finalResult = new Forest.Many(); + for(Object f : n.results()) + finalResult.merge((Forest)f); } if (token == null) continue; n.state.invokeShifts(token, this, result, n); } if (!good && token!=null) - throw new Parser.Failed(error(red("unexpected character")+" "+purple(token)+" encountered at "+green(getLocation())+"\n"), + throw new ParseFailed(ParseFailed.error(ANSI.red("unexpected character ")+" \'"+ + ANSI.purple(StringUtil.escapify(token+"", "\\\'\r\n"))+ + "\' encountered at "+ + ANSI.green(getLocation())+"\n", token, hash.values()), getLocation()); if (token==null && finalResult==null) - throw new Parser.Failed(error(red("unexpected end of file\n")), + throw new ParseFailed(ParseFailed.error(ANSI.red("unexpected end of file\n"), token, hash.values()), getLocation()); - - // this massively improves GC performance - //hash = null; } - public class Waiting { + class Waiting { Node parent; Forest pending; State state; boolean fromEmptyReduction; - Reduction reduction; - public Waiting(Node parent, Forest pending, State state, boolean fromEmptyReduction, Reduction reduction) { + Position reduction; + public Waiting(Node parent, Forest pending, State state, boolean fromEmptyReduction, Position reduction) { waits++; this.parent = parent; this.pending = pending; @@ -345,79 +269,139 @@ class GSS { } } - // GSS Nodes ////////////////////////////////////////////////////////////////////////////// + // Node ///////////////////////////////////////////////////////////////////////////////// /** a node in the GSS */ - public final class Node extends FastSet implements Invokable { + final class Node implements Invokable, IntegerMappable, GraphViz.ToGraphViz { + public FastSet set = new FastSet(); - public boolean touched = false; - private Forest.Ref holder = null; + private boolean allqueued = false; /** what state this node is in */ - public final State state; + public final Parser.Table.State state; /** which Phase this Node belongs to (node that Node is also a non-static inner class of Phase) */ - public Phase phase() { return Phase.this; } - - public Forest.Ref holder() { return holder==null ? (holder = new Forest.Ref()) : holder; } - public Forest pending() { return Phase.this.closed ? holder().resolve() : holder; } - public FastSet parents() { return this; } + public Phase phase() { return Phase.this; } + + private HashSet resultMap = new HashSet(); + public Iterable results() { return resultMap; } + public FastSet parents() { return set; } + public boolean merge(Node parent, Forest result) { + // FIXME: inefficient! + for(Forest.Many f : results()) { + if (f.parents.contains(parent) /* UGLY: */ && f.parents.size()==1) { + f.merge(result); + return true; + } + } + Forest.Many f = new Forest.Many(); + f.parents.add(parent); + f.merge(result); + resultMap.add(f); + set.add(parent, true); + return false; + } - public void queueReductions() { - if (!reducing) return; + public void performReductions() { if (allqueued) return; allqueued = true; - int where = parents().size(); state.invokeReductions(token, this, this, null); } - public void queueReductions(Node n2) { - if (!allqueued) { queueReductions(); return; } - state.invokeReductions(token, this, this, n2); + public void performReductions(Node n2) { + if (!allqueued) performReductions(); + else state.invokeReductions(token, this, this, n2); } - public final void invoke(Reduction r, Node n, Node n2) { - if (n==null) { - if (r.numPop==0) r.reduce(this); - return; + public void performEmptyReductions() { state.invokeReductions(token, this, null, null); } + public final void invoke(Position r, Node n, Node n2) { + reductions++; + if (n==null || n2==null || r.pos==0) { + if (r.pos==0) { + if (n==null) n = this; + else return; + } + if (n==null) return; + Forest[] holder = new Forest[r.pos]; + if (r.pos==0) n.finish(r, r.zero(), n.phase()); + else n.reduce(r, r.pos-1, n.phase(), null); + } else { + if (r.pos<=0) throw new Error("called wrong form of reduce()"); + int pos = r.pos-1; + n.reduce(r, pos, n.phase(), n2); } - if (r.numPop==0) return; - if (n2==null) r.reduce(n); - else r.reduce(n, n2); } - public void queueEmptyReductions() { - if (!reducing) return; - state.invokeReductions(token, this, null, null); + + public void reduce(Position r, int pos, Phase target, Node only) { + Forest[] holder = r.holder; + Forest old = holder[pos]; + + HashSet rr = new HashSet(); + for(Forest result : results()) rr.add(result); + for(Forest result : rr) + for(Node child : ((Forest.Many)result).parents) { + if (only != null && child!=only) continue; + holder[pos] = result; + if (pos==0) child.finish(r, r.rewrite(child.phase().getLocation().createRegion(phase().getLocation())), target); + else child.reduce(r, pos-1, target, null); + } + + holder[pos] = old; } - private boolean fe; - public boolean dead = false; - public boolean redo = false; - private Node(Node parent, Forest pending, State state, boolean fe) { - this.fe = fe; + public void finish(Position r, Forest result, Phase target) { + Parser.Table.State state0 = state.gotoSetNonTerminals.get(r.owner()); + if (result==null) throw new Error(); + if (state0!=null) + target.newNode(this, result, state0, r.pos<=0, r); + } + + private Node(Node parent, Forest pending, State state) { this.state = state; - this.holder().merge(pending); - //if (holder().empty()) throw new Error(holder()+""); + this.merge(parent, pending); Phase start = parent==null ? null : parent.phase(); if (parent != null) parents().add(parent, true); - if (Phase.this.hash.get(code(state, start)) != null) throw new Error("severe problem!"); - Phase.this.hash.put(code(state, start), this); - Phase.this.numNodes++; + if (Phase.this.hash.get(state, start) != null) throw new Error("severe problem!"); + Phase.this.hash.put(state, start, this); } + public int toInt() { return idx; } + private final int idx = node_idx++; + + // GraphViz ////////////////////////////////////////////////////////////////////////////// + + public GraphViz.Node toGraphViz(GraphViz gv) { + if (gv.hasNode(this)) return gv.createNode(this); + GraphViz.Node n = gv.createNode(this); + n.label = ""+state.toStringx(); + n.shape = "rectangle"; + n.fill = "green"; + for(Forest result : results()) n.edge(result, ""); + for(Node parent : parents()) n.edge(parent, ""); + ((GraphViz.Group)phase().toGraphViz(gv)).add(n); + return n; + } + public boolean isTransparent() { return false; } + public boolean isHidden() { return false; } + } + private int node_idx = 0; - } + public int toInt() { return pos+1; } + public int size() { return hash==null ? 0 : hash.size(); } - /** helper method */ - private static boolean equal(Object a, Object b) { - if (a==null && b==null) return true; - if (a==null || b==null) return false; - return a.equals(b); - } + // GraphViz ////////////////////////////////////////////////////////////////////////////// + + public GraphViz.Node toGraphViz(GraphViz gv) { + if (gv.hasNode(this)) return gv.createNode(this); + GraphViz.Group g = gv.createGroup(this); + g.label = "Phase " + pos; + g.color = "gray"; + g.cluster = true; + return g; + } + public boolean isTransparent() { return false; } + public boolean isHidden() { return false; } - /** this is something of a hack right now */ - private static long code(State state, Phase start) { - return (((long)state.idx) << 32) | (start==null ? 0 : (start.pos+1)); } }