X-Git-Url: http://git.megacz.com/?p=sbp.git;a=blobdiff_plain;f=src%2Fedu%2Fberkeley%2Fsbp%2FForest.java;h=3795c9ad19d5cdb17a2a72d9f9d1195567a82086;hp=34759e366148392ceb9fa07e9e5ed322c1a107a9;hb=815430f1fa820e28981bf4cff3fe15a4b9f5d97d;hpb=4cc825538bcfaacea47ba7c89a1e47321a95baab diff --git a/src/edu/berkeley/sbp/Forest.java b/src/edu/berkeley/sbp/Forest.java index 34759e3..3795c9a 100644 --- a/src/edu/berkeley/sbp/Forest.java +++ b/src/edu/berkeley/sbp/Forest.java @@ -1,135 +1,222 @@ package edu.berkeley.sbp; import edu.berkeley.sbp.*; -import edu.berkeley.sbp.*; +import edu.berkeley.sbp.Sequence.Position; import edu.berkeley.sbp.util.*; import java.io.*; import java.util.*; import java.lang.reflect.*; -/** an efficient representation of a collection of trees (Tomita's shared packed parse forest) */ -public abstract class Forest /*extends PrintableTree>*/ implements Iterable> { +/** + * An efficient representation of a collection of trees (Tomita's + * shared packed parse forest). + */ +public abstract class Forest implements GraphViz.ToGraphViz { + /** assume that this forest contains exactly one tree and return it; otherwise throw an exception */ - public final Tree expand1() throws Ambiguous, ParseFailed { - Iterator> it = expand(true).iterator(); - if (!it.hasNext()) throw new ParseFailed(); - return it.next(); - } + public abstract Tree expand1() throws Ambiguous; /** expand this forest into a set of trees */ - public HashSet> expand(boolean toss) { - HashSet> ret = new HashSet>(); - for(Body b : this) - ret.addAll(b.expand(toss, new ArrayList>(), 0, new HashSet>())); - if (toss && ret.size() > 1) throw new Ambiguous(this); - return ret; - } + public void expand(HashSet> ht) { expand(ht, new HashSet>(), null); } - static Forest singleton(Input.Location loc) { return create(loc, null, new Forest[] { }, false, true); } - static Forest singleton(Input.Location loc, Forest body) { return create(loc, null, new Forest[] { body }, false, true); } - static Forest leaf(Input.Location loc, T tag) { return create(loc, tag, null, false, false); } - public static Forest create(Input.Location loc, T tag, Forest[] tokens, boolean unwrap, boolean singleton) { - return new MyBody(loc, tag, tokens, unwrap, singleton); + /** create a new forest */ + public static Forest create(Input.Region loc, T head, Forest[] children, boolean unwrap) { + return new One(loc, head, children, unwrap); } - // Body ////////////////////////////////////////////////////////////////////////////// - protected static interface Body { - HashSet> expand(boolean toss, ArrayList> toks, int i, HashSet> h); - } + // Package-Private ////////////////////////////////////////////////////////////////////////////// + + abstract void expand(HashSet> ht, HashSet> ignore, Tree bogus); + abstract void gather(HashSet> ignore); + boolean ambiguous() { return false; } + + public abstract void edges(GraphViz.Node n); + + + // One ////////////////////////////////////////////////////////////////////////////// + + /** A "single" forest with a head and child subforests */ + public static class One extends Forest { - protected static class MyBody extends Forest implements Body /* extends PrintableTree> implements Iterable>*/ { - public Iterator> iterator() { return new SingletonIterator>(this); } + private final Input.Region location; + private final T head; + private final Forest[] children; - private final Input.Location location; - private final T tag; - private final Forest[] tokens; + /** if true, the last child's children are considered children of this node */ private final boolean unwrap; - private final boolean singleton; - private MyBody(Input.Location loc, T tag, Forest[] tokens, boolean unwrap, boolean singleton) { + private One(Input.Region loc, T head, Forest[] children, boolean unwrap) { this.location = loc; - this.tag = tag; - this.tokens = tokens==null ? emptyForestArray : new Forest[tokens.length]; - if (tokens != null) System.arraycopy(tokens, 0, this.tokens, 0, tokens.length); - if (tokens != null) for(int i=0; i> expand(boolean toss, ArrayList> toks, int i, HashSet> h) { - if (singleton) { - for(Body b : tokens[0]) b.expand(toss, toks, i, h); - - } else if (i==tokens.length) { - h.add(new Tree(null, tag, toks.toArray(tree_hint))); - - } else if (unwrap && i==tokens.length-1) { - if (tokens[i] != null) - for(Body b : tokens[i]) - b.expand(toss, toks, 0, h); + public Tree expand1() throws Ambiguous { + Tree[] ret = new Tree[children.length]; + for(int i=0; i(location, head, ret, unwrap); + } + public void gather(HashSet> hf) { + hf.add(this); + for(Forest f : children) f.gather(hf); + } + public void expand(HashSet> ht, HashSet> ignore, Tree bogus) { + if (ignore.contains(this)) { ht.add(bogus); return; } + expand(0, new Tree[children.length], ht, ignore, bogus); + } + private void expand(final int i, Tree[] ta, HashSet> ht, HashSet> ignore, Tree bogus) { + if (i==children.length) { + ht.add(new Tree(location, head, ta, unwrap)); } else { - boolean hit = false; - for(Tree r : tokens[i].expand(toss)) { - hit = true; - int old = toks.size(); - toks.add(r); - expand(toss, toks, i+1, h); - while(toks.size() > old) toks.remove(toks.size()-1); + HashSet> ht2 = new HashSet>(); + children[i].expand(ht2, ignore, bogus); + for(Tree tc : ht2) { + ta[i] = tc; + expand(i+1, ta, ht, ignore, bogus); + ta[i] = null; + } + } + } + + // GraphViz, ToInt ////////////////////////////////////////////////////////////////////////////// + + public boolean isTransparent() { return false; } + public boolean isHidden() { return false; } + public GraphViz.Node toGraphViz(GraphViz gv) { + if (gv.hasNode(this)) return gv.createNode(this); + GraphViz.Node n = gv.createNode(this); + n.label = headToString()==null?"":headToString(); + n.directed = true; + edges(n); + return n; + } + boolean edges = false; + public void edges(GraphViz.Node n) { + if (edges) return; + edges = true; + for(int i=0; i extends Forest { + /** An "ambiguity node"; this is immutable once it has been "looked at" */ + public static class Many extends Forest { + + HashSet parents = new HashSet(); private FastSet> hp = new FastSet>(); - public Ref() { } - public void merge(Forest p) { if (p!=this) hp.add(p, true); } - public Iterator> iterator() { - final Iterator> ift = hp==null ? null : hp.iterator(); - return new Iterator>() { - Iterator> ibt = ift==null ? null : ift.hasNext() ? ift.next().iterator() : null; - public void remove() { throw new RuntimeException("not supported"); } - public boolean hasNext() { - if (ibt==null) return false; - if (ibt.hasNext()) return true; - ibt = ift.hasNext() ? ift.next().iterator() : null; - return hasNext(); - } - public Body next() { - return ibt.next(); + private boolean touched = false; + + public Many() { } + + public Iterator> iterator() { + touched(); + return (Iterator>)hp.iterator(); // FIXME: fastset's iterator is not safe! + } + + public Tree expand1() throws Ambiguous { + touched(); + if (hp.size() > 1) { + HashSet> hf0 = new HashSet>(); + Iterator> ih = hp.iterator(); + ih.next().gather(hf0); + for(Forest f : hp) { + HashSet> hf1 = new HashSet>(); + f.gather(hf1); + hf0.retainAll(hf1); } - }; + HashSet> ht = new HashSet>(); + expand(ht, hf0, new Tree(null, "*")); + throw new Ambiguous((Forest)this, + (HashSet>)(Object)ht); + } + return hp.iterator().next().expand1(); + } + + public void gather(HashSet> ht) { + touched(); + ht.add(this); + for(Forest f : hp) f.gather(ht); + } + private void touched() { + if (touched) return; + touched = true; + FastSet> f2 = new FastSet>(); + for(Forest f : hp) + if (f instanceof Forest.One) f2.add(f); + else for(Forest ff : ((Forest.Many)f)) + f2.add(ff); + hp = f2; + } + public boolean contains(Forest f) { + touched(); + return hp.contains(f); + } + public void merge(Forest p) { + if (touched) throw new RuntimeException("attempt to merge() on a Forest.Many that has already been examined"); + if (p==this) throw new RuntimeException("attempt to merge() a Forest.Many to itself!"); + hp.add(p, true); + } + boolean ambiguous() { + touched(); + if (hp.size()==0) return false; + if (hp.size()==1) return hp.iterator().next().ambiguous(); + return true; + } + + public void expand(HashSet> ht, HashSet> ignore, Tree bogus) { + touched(); + if (ignore.contains(this)) { ht.add(bogus); return; } + for (Forest f : hp) f.expand(ht, ignore, bogus); } - public Forest resolve() { return this; } - } + // GraphViz, ToInt ////////////////////////////////////////////////////////////////////////////// + + public boolean isTransparent() { return hp.size()==1; } + public boolean isHidden() { return hp.size()==0; } + public void edges(GraphViz.Node n) { + if (hp.size()==1) { hp.iterator().next().edges(n); return; } + for(Forest f : hp) f.edges(n); + } + public GraphViz.Node toGraphViz(GraphViz gv) { + if (hp.size()==1) return hp.iterator().next().toGraphViz(gv); + if (gv.hasNode(this)) return gv.createNode(this); + GraphViz.Node n = gv.createNode(this); + n.label = "?"; + n.color = "red"; + for(Forest f : hp) n.edge(f, null); + return n; + } + } + // Statics ////////////////////////////////////////////////////////////////////////////// private static Tree[] tree_hint = new Tree[0]; + private static String[] string_hint = new String[0]; private static final Forest[] emptyForestArray = new Forest[0]; protected String headToString() { return null; } - protected String headToJava() { return null; } + protected String headToJava() { return "null"; } protected String left() { return ""; } protected boolean ignoreSingleton() { return true; }