X-Git-Url: http://git.megacz.com/?p=sbp.git;a=blobdiff_plain;f=src%2Fedu%2Fberkeley%2Fsbp%2FForest.java;h=073e37bc84185ea26970216ed2ee2db153ecdc13;hp=dbcd3c06036df2727d53026031a1367beddb4380;hb=HEAD;hpb=e14f41fe193ceef8dfd8b4bc2f327e3550231a4c diff --git a/src/edu/berkeley/sbp/Forest.java b/src/edu/berkeley/sbp/Forest.java index dbcd3c0..073e37b 100644 --- a/src/edu/berkeley/sbp/Forest.java +++ b/src/edu/berkeley/sbp/Forest.java @@ -1,177 +1,324 @@ +// Copyright 2006-2007 all rights reserved; see LICENSE file for BSD-style license + package edu.berkeley.sbp; -import edu.berkeley.sbp.*; -import edu.berkeley.sbp.*; import edu.berkeley.sbp.util.*; import java.io.*; import java.util.*; -import java.lang.reflect.*; -/** an efficient representation of a collection of trees (Tomita's shared packed parse forest) */ -public abstract class Forest { +/** + * + * An efficient representation of a collection of trees (Tomita's + * shared packed parse forest). + * + */ +public abstract class Forest implements GraphViz.ToGraphViz { /** assume that this forest contains exactly one tree and return it; otherwise throw an exception */ - public final Tree expand1() throws Parser.Ambiguous, Parser.Failed { - Iterator> it = expand(true).iterator(); - if (!it.hasNext()) throw new Parser.Failed(); - return it.next(); - } + public abstract Tree expand1() throws Ambiguous; /** expand this forest into a set of trees */ - public abstract HashSet> expand(boolean toss); + public Iterable> expand() { + HashSet> ht = new HashSet>(); + expand(ht, new HashSet>(), null); + return ht; + } + + /** returns the input Region which this Forest was parsed from */ + public abstract Input.Region getRegion(); - static Forest singleton(Token.Location loc) { return create(loc, null, new Forest[] { }, false, true); } - static Forest singleton(Token.Location loc, Forest body) { return create(loc, null, new Forest[] { body }, false, true); } - static Forest leaf(Token.Location loc, T tag) { return create(loc, tag, null, false, false); } - public static Forest create(Token.Location loc, T tag, Forest[] tokens, boolean unwrap, boolean singleton) { - return new MultiForest(loc, tag, tokens, unwrap, singleton); + // Package-Private ////////////////////////////////////////////////////////////////////////////// + + public static Forest create(Input.Region region, NodeType head, Forest[] children) { + return create(region, head, children, new boolean[children==null ? 0 : children.length]); } + public static Forest create(Input.Region region, NodeType head, Forest[] children, boolean[] lifts) { + if (region == null) throw new RuntimeException("invoked Forest.create(region=null) -- this should never happen"); + return new One(region, head, children, lifts); } - // Body ////////////////////////////////////////////////////////////////////////////// + abstract void expand(HashSet> ht, HashSet> ignore, Tree bogus); + abstract void gather(HashSet> ignore); + abstract void edges(GraphViz.StateNode n); + boolean ambiguous() { return false; } + + // One ////////////////////////////////////////////////////////////////////////////// - protected static class Body { + /** A "single" forest with a head and child subforests */ + private static class One extends Forest { - private final Token.Location location; - private final T tag; - private final Forest[] tokens; - private final boolean unwrap; - private final boolean singleton; + private final Input.Region location; + private final NodeType head; + private final Forest[] children; - private Body(Token.Location loc, T tag, Forest[] tokens, boolean unwrap, boolean singleton) { - this.location = loc; - this.tag = tag; - this.tokens = tokens==null ? emptyForestArray : new Forest[tokens.length]; - if (tokens != null) System.arraycopy(tokens, 0, this.tokens, 0, tokens.length); - if (tokens != null) for(int i=0; i> expand(boolean toss, ArrayList> toks, int i, HashSet> h) { - if (singleton) { - for(Body b : (IterableForest)tokens[0]) b.expand(toss, toks, i, h); + public Input.Region getRegion() { return location; } - } else if (i==tokens.length) { - h.add(new Tree(null, tag, toks.toArray(tree_hint))); + private One(Input.Region loc, NodeType head, Forest[] children, boolean[] lifts) { + this.location = loc; + this.head = head; + if (head==null) throw new RuntimeException("invoked Forest.create(,null,,,) -- this should never happen"); + this.children = children==null ? emptyForestArray : new Forest[children.length]; + if (children != null) System.arraycopy(children, 0, this.children, 0, children.length); + if (children != null) for(int i=0; i)tokens[i]) - b.expand(toss, toks, 0, h); + public Tree expand1() throws Ambiguous { + if (children.length == 0) + return new Tree(location, head); + else + return expand1ForOneAndMany((Forest)this); + } + void gather(HashSet> hf) { + hf.add(this); + for(Forest f : children) f.gather(hf); + } + void expand(HashSet> ht, HashSet> ignore, Tree bogus) { + if (ignore.contains(this)) { ht.add(bogus); return; } + expand(0, new Tree[children.length], ht, ignore, bogus); + } + private void expand(final int i, Tree[] ta, HashSet> ht, HashSet> ignore, + Tree bogus) { + if (i==children.length) { + ht.add(new Tree(location, head, ta, lifts)); } else { - boolean hit = false; - for(Tree r : tokens[i].expand(toss)) { - hit = true; - int old = toks.size(); - toks.add(r); - expand(toss, toks, i+1, h); - while(toks.size() > old) toks.remove(toks.size()-1); + HashSet> ht2 = new HashSet>(); + children[i].expand(ht2, ignore, bogus); + for(Tree tc : ht2) { + ta[i] = tc; + expand(i+1, ta, ht, ignore, bogus); + ta[i] = null; } - //if (!hit) throw new Error(); } - return h; } - void addTo(FastSet h) { - if (!singleton) h.add(this, true); - else for(Body b : (IterableForest)tokens[0]) b.addTo(h); - } + // GraphViz, ToInt ////////////////////////////////////////////////////////////////////////////// - public String toString() { - StringBuffer ret = new StringBuffer(); - for(int i=0; i 0) { - ret.append(q); - ret.append(" "); + public boolean isTransparent() { return false; } + public boolean isHidden() { return false; } + public GraphViz.StateNode toGraphViz(GraphViz gv) { + if (gv.hasNode(this)) return gv.createNode(this); + GraphViz.StateNode n = gv.createNode(this); + n.label = headToString()==null?"":headToString(); + n.directed = true; + edges(n); + return n; + } + boolean edges = false; // FIXME ?? + public void edges(GraphViz.StateNode n) { + if (edges) return; + edges = true; + for(int i=0; i 0 ? tag+":" : tag+"") : ""; - if (tail.length() > 0) tail = "{" + tail + "}"; - return head + tail; } + + protected String headToString() { return head==null?null:head.toString(); } + protected String headToJava() { return "null"; } + protected String left() { return "{"; } + protected String right() { return "}"; } + protected boolean ignoreSingleton() { return false; } } - // Ref ////////////////////////////////////////////////////////////////////////////// + // Many ////////////////////////////////////////////////////////////////////////////// - private static abstract class IterableForest extends Forest implements Iterable> { - public abstract Iterator> iterator(); - } + /** An "ambiguity node"; this is immutable once it has been "looked at" */ + static class Many extends Forest { - /** - * This class represents a partially complete collection of - * forests to be viewed as a forest at some later date; once - * viewed, it becomes immutable - */ - static class Ref extends IterableForest { - private FastSet hp = new FastSet(); - private Forest res = null; - public Ref() { } - public void merge(Forest p) { - if (res != null) throw new Error("already resolved!"); - if (p==null) throw new Error(); - if (p!=this) hp.add(p, true); - } - public Iterator> iterator() { return ((IterableForest)resolve()).iterator(); } - public HashSet> expand(boolean toss) { return resolve().expand(toss); } - public String toString() { return resolve().toString(); } - public Forest resolve() { - if (hp==null) return res; - FastSet nh = new FastSet(); - for(Forest p : hp) - for(Body b : (IterableForest)p) - b.addTo(nh); - res = new MultiForest(nh); - hp = null; - return res; - } - } + private FastSet> hp = new FastSet>(); + private boolean touched = false; + + public Many() { } - // Implementations ////////////////////////////////////////////////////////////////////////////// + public Input.Region getRegion() { return hp.iterator().next().getRegion(); } // all should be identical + + Forest simplify() throws Ambiguous { + touched(); + if (hp.size() > 1) { + HashSet> hf0 = new HashSet>(); + Iterator> ih = hp.iterator(); + ih.next().gather(hf0); + for(Forest f : hp) { + HashSet> hf1 = new HashSet>(); + f.gather(hf1); + hf0.retainAll(hf1); + } + HashSet> ht = new HashSet>(); + expand(ht, hf0, new Tree(null, "*")); + throw new Ambiguous((Forest)this, + (HashSet>)(Object)ht); + } - private static class MultiForest extends IterableForest { - private final FastSet> results; - private MultiForest(FastSet> results) { this.results = results; } - public MultiForest(Token.Location loc, T tag, Forest[] tokens, boolean unwrap, boolean singleton) { - this.results = new FastSet>(new Body(loc, tag, tokens, unwrap, singleton)); + return hp.iterator().next(); } - public Iterator> iterator() { return results.iterator(); } - public HashSet> expand(boolean toss) { - HashSet> ret = new HashSet>(); - for(Body b : results) - ret.addAll(b.expand(toss, new ArrayList>(), 0, new HashSet>())); - if (toss && ret.size() > 1) throw new Parser.Ambiguous(this); - return ret; + public Tree expand1() throws Ambiguous { + return simplify().expand1(); } - // Display ////////////////////////////////////////////////////////////////////////////// - - private String toString = null; - public String toString() { - if (toString != null) return toString; - StringBuffer ret = new StringBuffer(); - if (results.size()==1) { - for(Forest.Body r : results) - ret.append(r); - return toString = ret.toString(); - } - ret.append(" r : results) { - if (!first) ret.append(' '); - first = false; - ret.append(r); + void gather(HashSet> ht) { + touched(); + + // FIXME: do something more sensible here + if (ht.contains(this)) { + System.err.println("WARNING: grammar produced a circular forest\n" + this); + //throw new Error("grammar produced a circular forest:\n" + this); + return; } - ret.append("?>"); - return toString = ret.toString(); + + ht.add(this); + for(Forest f : hp) f.gather(ht); + } + + private void touched() { + if (touched) return; + touched = true; + /* + FastSet> f2 = new FastSet>(); + for(Forest f : hp) + if (f instanceof Forest.One) f2.add(f); + else for(Forest ff : ((Forest.Many)f)) + f2.add(ff); + hp = f2; + */ + } + public boolean contains(Forest f) { + touched(); + return hp.contains(f); + } + public void merge(Forest p) { + if (touched) throw new RuntimeException("attempt to merge() on a Forest.Many that has already been examined"); + if (p==this) throw new RuntimeException("attempt to merge() a Forest.Many to itself!"); + hp.add(p, true); + } + boolean ambiguous() { + touched(); + if (hp.size()==0) return false; + if (hp.size()==1) return hp.iterator().next().ambiguous(); + return true; + } + + void expand(HashSet> ht, HashSet> ignore, Tree bogus) { + touched(); + if (ignore.contains(this)) { ht.add(bogus); return; } + for (Forest f : hp) f.expand(ht, ignore, bogus); + } + + + // GraphViz, ToInt ////////////////////////////////////////////////////////////////////////////// + + public boolean isTransparent() { return hp.size()==1; } + public boolean isHidden() { return hp.size()==0; } + public void edges(GraphViz.StateNode n) { + if (hp.size()==1) { hp.iterator().next().edges(n); return; } + for(Forest f : hp) f.edges(n); + } + public GraphViz.StateNode toGraphViz(GraphViz gv) { + if (hp.size()==1) return hp.iterator().next().toGraphViz(gv); + if (gv.hasNode(this)) return gv.createNode(this); + GraphViz.StateNode n = gv.createNode(this); + n.label = "?"; + n.color = "red"; + for(Forest f : hp) n.edge(f, null); + return n; } } + // Statics ////////////////////////////////////////////////////////////////////////////// + /** Depth-first expansion, handling .One and .Many without recursion. */ + private static Tree expand1ForOneAndMany( + Forest forest) throws Ambiguous { + List> nodes = new ArrayList>(); + List> build = new ArrayList>(); + + // path stack + List> path = new ArrayList>(); + List sizes = new ArrayList(), + poss = new ArrayList(); + + // handle the left-most leaf + expand1Descend(path, nodes, sizes, poss, forest); + + for (Forest.One f; path.size() > 0;) { + // up one + f = pop(path); + int size = pop(sizes) + 1; + int pos = pop(poss) + 1; + Forest[] children = f.children; + if (pos < children.length) { + // down the next branch + path.add(f); + sizes.add(new Integer(size)); + poss.add(new Integer(pos)); + + // handle the left-most leaf + expand1Descend(path, nodes, sizes, poss, children[pos]); + } else { + if (path.size() > 0 && peek(path).lifts[peek(poss)]) { + // skip assembling this node, lift children + sizes.add(pop(sizes) + size - 1); + continue; + } + // assemble this node + for (int i=size; i > 0; i--) + build.add(nodes.remove(nodes.size() - i)); + nodes.add(new Tree(f.location, f.head, build)); + build.clear(); + } + } + + return pop(nodes); + } + + /** Descend to the left-most leaf, building the path. */ + private static void expand1Descend( + List> path, List> nodes, + List sizes, List poss, Forest f) + throws Ambiguous { + while (true) { + if (f instanceof Forest.Many) + f = ((Forest.Many)f).simplify(); + else if (f instanceof Forest.One) { + Forest.One one = (Forest.One)f; + if (one.children.length == 0) + break; + path.add(one); + sizes.add(0); + poss.add(0); + f = one.children[0]; + } else { + nodes.add(f.expand1()); + return; + } + } + + if (path.size() > 0 && peek(path).lifts[peek(poss)]) + sizes.add(pop(sizes) - 1); // ignore lifted leafs + else + nodes.add(f.expand1()); + } + + private static T pop(List list) { + return list.remove(list.size() - 1); } + private static T peek(List list) { + return list.get(list.size() - 1); } + private static Tree[] tree_hint = new Tree[0]; + private static String[] string_hint = new String[0]; private static final Forest[] emptyForestArray = new Forest[0]; + + protected String headToString() { return null; } + protected String headToJava() { return "null"; } + protected String left() { return ""; } + protected boolean ignoreSingleton() { return true; } }