X-Git-Url: http://git.megacz.com/?p=sbp.git;a=blobdiff_plain;f=src%2Fedu%2Fberkeley%2Fsbp%2FForest.java;h=636ad4f08af8c101d3db45b78628422ec5fcfe02;hp=643734147623c7db7e735d7b2bbf984a84aa0d6d;hb=24219bdf084b45273e869cd19382d1640b396566;hpb=014de68a21aa2d17fdfd0bac7e404a725997a246 diff --git a/src/edu/berkeley/sbp/Forest.java b/src/edu/berkeley/sbp/Forest.java index 6437341..636ad4f 100644 --- a/src/edu/berkeley/sbp/Forest.java +++ b/src/edu/berkeley/sbp/Forest.java @@ -1,224 +1,239 @@ +// Copyright 2006-2007 all rights reserved; see LICENSE file for BSD-style license + package edu.berkeley.sbp; -import edu.berkeley.sbp.*; -import edu.berkeley.sbp.*; import edu.berkeley.sbp.util.*; import java.io.*; import java.util.*; -import java.lang.reflect.*; -/** an efficient representation of a collection of trees (Tomita's shared packed parse forest) */ -public abstract class Forest { +/** + * + * An efficient representation of a collection of trees (Tomita's + * shared packed parse forest). + * + */ +public abstract class Forest implements GraphViz.ToGraphViz { /** assume that this forest contains exactly one tree and return it; otherwise throw an exception */ - public final Tree expand1() throws Parser.Ambiguous, Parser.Failed { - Iterator> it = expand(true).iterator(); - if (!it.hasNext()) throw new Parser.Failed(); - return it.next(); - } + public abstract Tree expand1() throws Ambiguous; /** expand this forest into a set of trees */ - public abstract HashSet> expand(boolean toss); + public Iterable> expand() { + HashSet> ht = new HashSet>(); + expand(ht, new HashSet>(), null); + return ht; + } - abstract boolean valid(); + /** returns the input Region which this Forest was parsed from */ + public abstract Input.Region getRegion(); - static Forest singleton(Token.Location loc, Sequence creator) { return create(loc, null, new Forest[] { }, creator, false, true); } - static Forest singleton(Token.Location loc, Forest body, Sequence creator) { return create(loc, null, new Forest[] { body }, creator, false, true); } - static Forest leaf(Token.Location loc, T tag, Sequence creator) { return create(loc, tag, null, creator, false, false); } - public static Forest create(Token.Location loc, T tag, Forest[] tokens, Sequence creator, boolean unwrap, boolean singleton) { - return new MultiForest(loc, tag, tokens, creator, unwrap, singleton); + // Package-Private ////////////////////////////////////////////////////////////////////////////// + + public static Forest create(Input.Region region, NodeType head, Forest[] children) { + return create(region, head, children, new boolean[children==null ? 0 : children.length]); } + public static Forest create(Input.Region region, NodeType head, Forest[] children, boolean[] lifts) { + if (region == null) throw new RuntimeException("invoked Forest.create(region=null) -- this should never happen"); + return new One(region, head, children, lifts); } - // Body ////////////////////////////////////////////////////////////////////////////// + abstract void expand(HashSet> ht, HashSet> ignore, Tree bogus); + abstract void gather(HashSet> ignore); + abstract void edges(GraphViz.StateNode n); + boolean ambiguous() { return false; } + + // One ////////////////////////////////////////////////////////////////////////////// - protected static class Body { + /** A "single" forest with a head and child subforests */ + private static class One extends Forest { - private final Token.Location location; - private final T tag; - private final Forest[] tokens; - private final Sequence creator; - private final boolean unwrap; - private final boolean singleton; + private final Input.Region location; + private final NodeType head; + private final Forest[] children; - private Body(Token.Location loc, T tag, Forest[] tokens, Sequence creator, boolean unwrap, boolean singleton) { - this.location = loc; - this.tag = tag; - this.tokens = tokens==null ? emptyForestArray : new Forest[tokens.length]; - if (tokens != null) System.arraycopy(tokens, 0, this.tokens, 0, tokens.length); - this.creator = creator; - this.unwrap = unwrap; - this.singleton = singleton; - } + /** if true, the last child's children are considered children of this node */ + private final boolean[] lifts; - private HashSet> expand(boolean toss, ArrayList> toks, int i, HashSet> h) { - if (singleton) { - for(Body b : (IterableForest)tokens[0]) b.expand(toss, toks, i, h); + public Input.Region getRegion() { return location; } - } else if (i==tokens.length) { - h.add(new Tree(null, tag, toks.toArray(tree_hint))); + private One(Input.Region loc, NodeType head, Forest[] children, boolean[] lifts) { + this.location = loc; + this.head = head; + if (head==null) throw new RuntimeException("invoked Forest.create(,null,,,) -- this should never happen"); + this.children = children==null ? emptyForestArray : new Forest[children.length]; + if (children != null) System.arraycopy(children, 0, this.children, 0, children.length); + if (children != null) for(int i=0; i)tokens[i]) - b.expand(toss, toks, 0, h); + public Tree expand1() throws Ambiguous { + Tree[] ret = new Tree[children.length]; + for(int i=0; i(location, head, ret, lifts); + } + void gather(HashSet> hf) { + hf.add(this); + for(Forest f : children) f.gather(hf); + } + void expand(HashSet> ht, HashSet> ignore, Tree bogus) { + if (ignore.contains(this)) { ht.add(bogus); return; } + expand(0, new Tree[children.length], ht, ignore, bogus); + } + private void expand(final int i, Tree[] ta, HashSet> ht, HashSet> ignore, + Tree bogus) { + if (i==children.length) { + ht.add(new Tree(location, head, ta, lifts)); } else { - if (tokens[i]!=null) { - HashSet> exp = tokens[i].expand(toss); - if (exp != null) - for(Tree r : exp) { - int old = toks.size(); - toks.add(r); - expand(toss, toks, i+1, h); - while(toks.size() > old) toks.remove(toks.size()-1); - } + HashSet> ht2 = new HashSet>(); + children[i].expand(ht2, ignore, bogus); + for(Tree tc : ht2) { + ta[i] = tc; + expand(i+1, ta, ht, ignore, bogus); + ta[i] = null; } } - return h; - } - void addTo(HashSet h) { - if (!singleton) h.add(this); - else for(Body b : (IterableForest)tokens[0]) b.addTo(h); - } - void addTo(FastSet h) { - if (!singleton) h.add(this, true); - else for(Body b : (IterableForest)tokens[0]) b.addTo(h); - } - - private boolean kcache = false; - private boolean keep = false; - public boolean keep() { - if (kcache) return keep; - kcache = true; - for(Forest token : tokens) if (!token.valid()) return keep = false; - return keep = creator==null || (creator.needs.size()==0 && creator.hates.size()==0); - } - public boolean keep(Iterable> h) { - if (keep()) return true; - for(Forest token : tokens) if (!token.valid()) return false; - int needs = 0; - for(Body b : h) { - if (creator.hates.contains(b.creator) && b.keep(h)) return false; - if (creator.needs.contains(b.creator) && b.keep(h)) needs--; - } - return needs <= -1 * creator.needs.size(); } - - public String toString() { - StringBuffer ret = new StringBuffer(); - for(int i=0; i 0) { - ret.append(q); - ret.append(" "); + // GraphViz, ToInt ////////////////////////////////////////////////////////////////////////////// + + public boolean isTransparent() { return false; } + public boolean isHidden() { return false; } + public GraphViz.StateNode toGraphViz(GraphViz gv) { + if (gv.hasNode(this)) return gv.createNode(this); + GraphViz.StateNode n = gv.createNode(this); + n.label = headToString()==null?"":headToString(); + n.directed = true; + edges(n); + return n; + } + boolean edges = false; // FIXME ?? + public void edges(GraphViz.StateNode n) { + if (edges) return; + edges = true; + for(int i=0; i 0 ? tag+":" : tag+"") : ""; - if (tail.length() > 0) tail = "{" + tail + "}"; - return head + tail; } + + protected String headToString() { return head==null?null:head.toString(); } + protected String headToJava() { return "null"; } + protected String left() { return "{"; } + protected String right() { return "}"; } + protected boolean ignoreSingleton() { return false; } } - // Ref ////////////////////////////////////////////////////////////////////////////// + // Many ////////////////////////////////////////////////////////////////////////////// - static abstract class IterableForest extends Forest implements Iterable> { - public abstract Iterator> iterator(); - } + /** An "ambiguity node"; this is immutable once it has been "looked at" */ + static class Many extends Forest { - /** - * This class represents a partially complete collection of - * forests to be viewed as a forest at some later date; once - * viewed, it becomes immutable - */ - static class Ref extends IterableForest { - private FastSet hp = new FastSet(); - private Forest res = null; - public boolean valid = false; - public Ref() { } - public void merge(Forest p) { - if (res != null) throw new Error("already resolved!"); - if (p==null) throw new Error(); - if (p!=this) hp.add(p); - } - public Iterator> iterator() { return ((IterableForest)resolve()).iterator(); } - public HashSet> expand(boolean toss) { return resolve().expand(toss); } - public boolean valid() { if (valid) return true; resolve(); return valid; } - public String toString() { return resolve().toString(); } - public Forest resolve() { - if (hp==null) return res; - HashSet results = null; - FastSet nh = new FastSet(); - for(Forest p : hp) - for(Body b : (IterableForest)p) { - if (b.keep() && (b.creator==null || !b.creator.lame)) { valid = true; b.addTo(nh); } - else results = new HashSet(); - } - if (results != null) { - for(Forest p : hp) - for(Body b : (IterableForest)p) - results.add(b); - for(Body b : results) { - if (b.keep() && (b.creator==null || !b.creator.lame)) continue; - if (b.creator!=null && b.creator.lame) continue; - if (!b.keep(results)) continue; - valid = true; - b.addTo(nh); + private FastSet> hp = new FastSet>(); + private boolean touched = false; + + public Many() { } + + public Input.Region getRegion() { return hp.iterator().next().getRegion(); } // all should be identical + + public Tree expand1() throws Ambiguous { + touched(); + if (hp.size() > 1) { + HashSet> hf0 = new HashSet>(); + Iterator> ih = hp.iterator(); + ih.next().gather(hf0); + for(Forest f : hp) { + HashSet> hf1 = new HashSet>(); + f.gather(hf1); + hf0.retainAll(hf1); } + HashSet> ht = new HashSet>(); + expand(ht, hf0, new Tree(null, "*")); + throw new Ambiguous((Forest)this, + (HashSet>)(Object)ht); } - hp = null; - return res = new MultiForest(nh, valid); + return hp.iterator().next().expand1(); } - } + + void gather(HashSet> ht) { + touched(); + + // FIXME: do something more sensible here + if (ht.contains(this)) { + System.err.println("WARNING: grammar produced a circular forest\n" + this); + //throw new Error("grammar produced a circular forest:\n" + this); + return; + } - // Implementations ////////////////////////////////////////////////////////////////////////////// + ht.add(this); + for(Forest f : hp) f.gather(ht); + } + + private void touched() { + if (touched) return; + touched = true; + /* + FastSet> f2 = new FastSet>(); + for(Forest f : hp) + if (f instanceof Forest.One) f2.add(f); + else for(Forest ff : ((Forest.Many)f)) + f2.add(ff); + hp = f2; + */ + } + public boolean contains(Forest f) { + touched(); + return hp.contains(f); + } + public void merge(Forest p) { + if (touched) throw new RuntimeException("attempt to merge() on a Forest.Many that has already been examined"); + if (p==this) throw new RuntimeException("attempt to merge() a Forest.Many to itself!"); + hp.add(p, true); + } + boolean ambiguous() { + touched(); + if (hp.size()==0) return false; + if (hp.size()==1) return hp.iterator().next().ambiguous(); + return true; + } - private static class MultiForest extends IterableForest { - private final FastSet> results; - private boolean valid; - public boolean valid() { return valid; } - private MultiForest(FastSet> results, boolean valid) { this.results = results; this.valid = valid; } - public MultiForest(Token.Location loc, T tag, Forest[] tokens, Sequence creator, boolean unwrap, boolean singleton) { - this.results = new FastSet>(new Body(loc, tag, tokens, creator, unwrap, singleton)); - this.valid = true; + void expand(HashSet> ht, HashSet> ignore, Tree bogus) { + touched(); + if (ignore.contains(this)) { ht.add(bogus); return; } + for (Forest f : hp) f.expand(ht, ignore, bogus); } - public Iterator> iterator() { return results.iterator(); } - public HashSet> expand(boolean toss) { - HashSet> ret = new HashSet>(); - for(Body b : results) - ret.addAll(b.expand(toss, new ArrayList>(), 0, new HashSet>())); - if (toss && ret.size() > 1) throw new Parser.Ambiguous(this); - return ret; + + // GraphViz, ToInt ////////////////////////////////////////////////////////////////////////////// + + public boolean isTransparent() { return hp.size()==1; } + public boolean isHidden() { return hp.size()==0; } + public void edges(GraphViz.StateNode n) { + if (hp.size()==1) { hp.iterator().next().edges(n); return; } + for(Forest f : hp) f.edges(n); } - - // Display ////////////////////////////////////////////////////////////////////////////// - - private String toString = null; - public String toString() { - if (toString != null) return toString; - StringBuffer ret = new StringBuffer(); - if (results.size()==1) { - for(Forest.Body r : results) - ret.append(r); - return toString = ret.toString(); - } - ret.append(" r : results) { - if (!first) ret.append(' '); - first = false; - ret.append(r); - } - ret.append("?>"); - return toString = ret.toString(); + public GraphViz.StateNode toGraphViz(GraphViz gv) { + if (hp.size()==1) return hp.iterator().next().toGraphViz(gv); + if (gv.hasNode(this)) return gv.createNode(this); + GraphViz.StateNode n = gv.createNode(this); + n.label = "?"; + n.color = "red"; + for(Forest f : hp) n.edge(f, null); + return n; } } // Statics ////////////////////////////////////////////////////////////////////////////// private static Tree[] tree_hint = new Tree[0]; - private static Body[] body_hint = new Body[0]; + private static String[] string_hint = new String[0]; private static final Forest[] emptyForestArray = new Forest[0]; + + protected String headToString() { return null; } + protected String headToJava() { return "null"; } + protected String left() { return ""; } + protected boolean ignoreSingleton() { return true; } }