X-Git-Url: http://git.megacz.com/?p=sbp.git;a=blobdiff_plain;f=src%2Fedu%2Fberkeley%2Fsbp%2FForest.java;h=1730f607eba82daeb513f88053b53d08137a33e2;hp=34759e366148392ceb9fa07e9e5ed322c1a107a9;hb=0ddfec9ac2783f59115205dc0f3806137265c59c;hpb=4cc825538bcfaacea47ba7c89a1e47321a95baab diff --git a/src/edu/berkeley/sbp/Forest.java b/src/edu/berkeley/sbp/Forest.java index 34759e3..1730f60 100644 --- a/src/edu/berkeley/sbp/Forest.java +++ b/src/edu/berkeley/sbp/Forest.java @@ -1,135 +1,237 @@ +// Copyright 2006 all rights reserved; see LICENSE file for BSD-style license + package edu.berkeley.sbp; import edu.berkeley.sbp.*; -import edu.berkeley.sbp.*; +import edu.berkeley.sbp.Sequence.Position; import edu.berkeley.sbp.util.*; import java.io.*; import java.util.*; import java.lang.reflect.*; -/** an efficient representation of a collection of trees (Tomita's shared packed parse forest) */ -public abstract class Forest /*extends PrintableTree>*/ implements Iterable> { +/** + * + * An efficient representation of a collection of trees (Tomita's + * shared packed parse forest). + * + */ +public abstract class Forest implements GraphViz.ToGraphViz { /** assume that this forest contains exactly one tree and return it; otherwise throw an exception */ - public final Tree expand1() throws Ambiguous, ParseFailed { - Iterator> it = expand(true).iterator(); - if (!it.hasNext()) throw new ParseFailed(); - return it.next(); - } + public abstract Tree expand1() throws Ambiguous; /** expand this forest into a set of trees */ - public HashSet> expand(boolean toss) { - HashSet> ret = new HashSet>(); - for(Body b : this) - ret.addAll(b.expand(toss, new ArrayList>(), 0, new HashSet>())); - if (toss && ret.size() > 1) throw new Ambiguous(this); - return ret; - } + public void expand(HashSet> ht) { expand(ht, new HashSet>(), null); } - static Forest singleton(Input.Location loc) { return create(loc, null, new Forest[] { }, false, true); } - static Forest singleton(Input.Location loc, Forest body) { return create(loc, null, new Forest[] { body }, false, true); } - static Forest leaf(Input.Location loc, T tag) { return create(loc, tag, null, false, false); } - public static Forest create(Input.Location loc, T tag, Forest[] tokens, boolean unwrap, boolean singleton) { - return new MyBody(loc, tag, tokens, unwrap, singleton); + static Forest create(Input.Region loc, NodeType head, Forest[] children, boolean lift) { + if (loc == null) throw new RuntimeException("invoked Forest.create(null,,,,) -- this should never happen"); + return new One(loc, head, children, lift); } - // Body ////////////////////////////////////////////////////////////////////////////// + /** create a new forest */ + public static Forest create(Input.Region loc, NodeType head, Forest[] children) { + return Forest.create(loc, head, children, false); } - protected static interface Body { - HashSet> expand(boolean toss, ArrayList> toks, int i, HashSet> h); - } + // Package-Private ////////////////////////////////////////////////////////////////////////////// - protected static class MyBody extends Forest implements Body /* extends PrintableTree> implements Iterable>*/ { - public Iterator> iterator() { return new SingletonIterator>(this); } + abstract void expand(HashSet> ht, HashSet> ignore, Tree bogus); + abstract void gather(HashSet> ignore); + abstract void edges(GraphViz.Node n); + boolean ambiguous() { return false; } + + abstract Input.Region getRegion(); - private final Input.Location location; - private final T tag; - private final Forest[] tokens; - private final boolean unwrap; - private final boolean singleton; + // One ////////////////////////////////////////////////////////////////////////////// - private MyBody(Input.Location loc, T tag, Forest[] tokens, boolean unwrap, boolean singleton) { - this.location = loc; - this.tag = tag; - this.tokens = tokens==null ? emptyForestArray : new Forest[tokens.length]; - if (tokens != null) System.arraycopy(tokens, 0, this.tokens, 0, tokens.length); - if (tokens != null) for(int i=0; i extends Forest { - public HashSet> expand(boolean toss, ArrayList> toks, int i, HashSet> h) { - if (singleton) { - for(Body b : tokens[0]) b.expand(toss, toks, i, h); + private final Input.Region location; + private final NodeType head; + private final Forest[] children; - } else if (i==tokens.length) { - h.add(new Tree(null, tag, toks.toArray(tree_hint))); + /** if true, the last child's children are considered children of this node */ + private final boolean lift; - } else if (unwrap && i==tokens.length-1) { - if (tokens[i] != null) - for(Body b : tokens[i]) - b.expand(toss, toks, 0, h); + Input.Region getRegion() { return location; } + private One(Input.Region loc, NodeType head, Forest[] children, boolean lift) { + this.location = loc; + this.head = head; + if (head==null) throw new RuntimeException("invoked Forest.create(,null,,,) -- this should never happen"); + this.children = children==null ? emptyForestArray : new Forest[children.length]; + if (children != null) System.arraycopy(children, 0, this.children, 0, children.length); + if (children != null) for(int i=0; i expand1() throws Ambiguous { + Tree[] ret = new Tree[children.length]; + for(int i=0; i(location, head, ret, lift); + } + + void gather(HashSet> hf) { + hf.add(this); + for(Forest f : children) f.gather(hf); + } + void expand(HashSet> ht, HashSet> ignore, Tree bogus) { + if (ignore.contains(this)) { ht.add(bogus); return; } + expand(0, new Tree[children.length], ht, ignore, bogus); + } + private void expand(final int i, Tree[] ta, HashSet> ht, HashSet> ignore, Tree bogus) { + if (i==children.length) { + ht.add(new Tree(location, head, ta, lift)); } else { - boolean hit = false; - for(Tree r : tokens[i].expand(toss)) { - hit = true; - int old = toks.size(); - toks.add(r); - expand(toss, toks, i+1, h); - while(toks.size() > old) toks.remove(toks.size()-1); + HashSet> ht2 = new HashSet>(); + children[i].expand(ht2, ignore, bogus); + for(Tree tc : ht2) { + ta[i] = tc; + expand(i+1, ta, ht, ignore, bogus); + ta[i] = null; + } + } + } + + // GraphViz, ToInt ////////////////////////////////////////////////////////////////////////////// + + public boolean isTransparent() { return false; } + public boolean isHidden() { return false; } + public GraphViz.Node toGraphViz(GraphViz gv) { + if (gv.hasNode(this)) return gv.createNode(this); + GraphViz.Node n = gv.createNode(this); + n.label = headToString()==null?"":headToString(); + n.directed = true; + edges(n); + return n; + } + boolean edges = false; // FIXME ?? + public void edges(GraphViz.Node n) { + if (edges) return; + edges = true; + for(int i=0; i extends Forest { - private FastSet> hp = new FastSet>(); - public Ref() { } - public void merge(Forest p) { if (p!=this) hp.add(p, true); } - public Iterator> iterator() { - final Iterator> ift = hp==null ? null : hp.iterator(); - return new Iterator>() { - Iterator> ibt = ift==null ? null : ift.hasNext() ? ift.next().iterator() : null; - public void remove() { throw new RuntimeException("not supported"); } - public boolean hasNext() { - if (ibt==null) return false; - if (ibt.hasNext()) return true; - ibt = ift.hasNext() ? ift.next().iterator() : null; - return hasNext(); - } - public Body next() { - return ibt.next(); + // Many ////////////////////////////////////////////////////////////////////////////// + + /** An "ambiguity node"; this is immutable once it has been "looked at" */ + static class Many extends Forest { + + private FastSet> hp = new FastSet>(); + private boolean touched = false; + + public Many() { } + + Input.Region getRegion() { return hp.iterator().next().getRegion(); } // all should be identical + + public Tree expand1() throws Ambiguous { + touched(); + if (hp.size() > 1) { + HashSet> hf0 = new HashSet>(); + Iterator> ih = hp.iterator(); + ih.next().gather(hf0); + for(Forest f : hp) { + HashSet> hf1 = new HashSet>(); + f.gather(hf1); + hf0.retainAll(hf1); } - }; + HashSet> ht = new HashSet>(); + expand(ht, hf0, new Tree(null, "*")); + throw new Ambiguous((Forest)this, + (HashSet>)(Object)ht); + } + return hp.iterator().next().expand1(); + } + + void gather(HashSet> ht) { + touched(); + + // FIXME: do something more sensible here + if (ht.contains(this)) { + System.err.println("WARNING: grammar produced a circular forest\n" + this); + //throw new Error("grammar produced a circular forest:\n" + this); + return; + } + ht.add(this); + for(Forest f : hp) f.gather(ht); + } + + private void touched() { + if (touched) return; + touched = true; + /* + FastSet> f2 = new FastSet>(); + for(Forest f : hp) + if (f instanceof Forest.One) f2.add(f); + else for(Forest ff : ((Forest.Many)f)) + f2.add(ff); + hp = f2; + */ + } + public boolean contains(Forest f) { + touched(); + return hp.contains(f); + } + public void merge(Forest p) { + if (touched) throw new RuntimeException("attempt to merge() on a Forest.Many that has already been examined"); + if (p==this) throw new RuntimeException("attempt to merge() a Forest.Many to itself!"); + hp.add(p, true); + } + boolean ambiguous() { + touched(); + if (hp.size()==0) return false; + if (hp.size()==1) return hp.iterator().next().ambiguous(); + return true; + } + + void expand(HashSet> ht, HashSet> ignore, Tree bogus) { + touched(); + if (ignore.contains(this)) { ht.add(bogus); return; } + for (Forest f : hp) f.expand(ht, ignore, bogus); } - public Forest resolve() { return this; } - } + // GraphViz, ToInt ////////////////////////////////////////////////////////////////////////////// + + public boolean isTransparent() { return hp.size()==1; } + public boolean isHidden() { return hp.size()==0; } + public void edges(GraphViz.Node n) { + if (hp.size()==1) { hp.iterator().next().edges(n); return; } + for(Forest f : hp) f.edges(n); + } + public GraphViz.Node toGraphViz(GraphViz gv) { + if (hp.size()==1) return hp.iterator().next().toGraphViz(gv); + if (gv.hasNode(this)) return gv.createNode(this); + GraphViz.Node n = gv.createNode(this); + n.label = "?"; + n.color = "red"; + for(Forest f : hp) n.edge(f, null); + return n; + } + } + // Statics ////////////////////////////////////////////////////////////////////////////// private static Tree[] tree_hint = new Tree[0]; + private static String[] string_hint = new String[0]; private static final Forest[] emptyForestArray = new Forest[0]; protected String headToString() { return null; } - protected String headToJava() { return null; } + protected String headToJava() { return "null"; } protected String left() { return ""; } protected boolean ignoreSingleton() { return true; }