X-Git-Url: http://git.megacz.com/?p=sbp.git;a=blobdiff_plain;f=src%2Fedu%2Fberkeley%2Fsbp%2FForest.java;h=cf64ed272a57322dd12473acf5c44049a07bf920;hp=9dabf6064cfc4649667a5f700ce41d83e0b46292;hb=dc9bb3a45ed306e2e35549076842b3e74efecb48;hpb=eda544585c2304faa82d249c4744fd5cecbf9211 diff --git a/src/edu/berkeley/sbp/Forest.java b/src/edu/berkeley/sbp/Forest.java index 9dabf60..cf64ed2 100644 --- a/src/edu/berkeley/sbp/Forest.java +++ b/src/edu/berkeley/sbp/Forest.java @@ -1,176 +1,214 @@ +// Copyright 2006 all rights reserved; see LICENSE file for BSD-style license + package edu.berkeley.sbp; -import edu.berkeley.sbp.*; -import edu.berkeley.sbp.Sequence.Position; import edu.berkeley.sbp.util.*; import java.io.*; import java.util.*; -import java.lang.reflect.*; - -/** an efficient representation of a collection of trees (Tomita's shared packed parse forest) */ -public abstract class Forest /*extends PrintableTree>*/ - implements Visitable>, - IntegerMappable, - GraphViz.ToGraphViz { - private static int master_idx = 0; - private final int idx = master_idx++; - public int toInt() { return idx; } +/** + * + * An efficient representation of a collection of trees (Tomita's + * shared packed parse forest). + * + */ +public abstract class Forest implements GraphViz.ToGraphViz { /** assume that this forest contains exactly one tree and return it; otherwise throw an exception */ - public final Tree expand1() throws Ambiguous, ParseFailed { - try { - Iterator> it = expand(true).iterator(); - if (!it.hasNext()) throw new ParseFailed(); - return it.next(); - } catch (InnerAmbiguous ia) { throw new Ambiguous(ia.f); } - } + public abstract Tree expand1() throws Ambiguous; /** expand this forest into a set of trees */ - public HashSet> expand(boolean toss) { - final HashSetTreeConsumer ret = new HashSetTreeConsumer(); - visit(new TreeMaker2(toss, ret), null, null); - if (toss && ret.size() > 1) throw new InnerAmbiguous(this); - return ret; + public Iterable> expand() { + HashSet> ht = new HashSet>(); + expand(ht, new HashSet>(), null); + return ht; } - private static class InnerAmbiguous extends RuntimeException { - public final Forest f; - public InnerAmbiguous(Forest f) { this.f = f; } - } + /** returns the input Region which this Forest was parsed from */ + public abstract Input.Region getRegion(); - static interface TreeConsumer { - public void addTree(Tree t); + // Package-Private ////////////////////////////////////////////////////////////////////////////// + + static Forest create(Input.Region region, NodeType head, Forest[] children, boolean lift) { + if (region == null) throw new RuntimeException("invoked Forest.create(region=null) -- this should never happen"); + return new One(region, head, children, lift); } - static class HashSetTreeConsumer extends HashSet> implements TreeConsumer { - public void addTree(Tree t) { - super.add(t); + + /** create a new forest */ + public static Forest create(Input.Region region, NodeType head, Forest[] children) { + return Forest.create(region, head, children, false); } + + abstract void expand(HashSet> ht, HashSet> ignore, Tree bogus); + abstract void gather(HashSet> ignore); + abstract void edges(GraphViz.Node n); + boolean ambiguous() { return false; } + + // One ////////////////////////////////////////////////////////////////////////////// + + /** A "single" forest with a head and child subforests */ + private static class One extends Forest { + + private final Input.Region location; + private final NodeType head; + private final Forest[] children; + + /** if true, the last child's children are considered children of this node */ + private final boolean lift; + + public Input.Region getRegion() { return location; } + + private One(Input.Region loc, NodeType head, Forest[] children, boolean lift) { + this.location = loc; + this.head = head; + if (head==null) throw new RuntimeException("invoked Forest.create(,null,,,) -- this should never happen"); + this.children = children==null ? emptyForestArray : new Forest[children.length]; + if (children != null) System.arraycopy(children, 0, this.children, 0, children.length); + if (children != null) for(int i=0; i Forest singleton(Input.Location loc, Position p) { - return create(loc, null, new Forest[] { }, new Object[0], false, true, p); } - static Forest singleton(Input.Location loc, Forest body, Position p) { - //return create(loc, null, new Forest[] { body }, false, true, p); - return body; - } - static Forest leaf(Input.Location loc, T tag, Position p) { return create(loc, tag, null, null, false, false, p); } - public static Forest create(Input.Location loc, T tag, Forest[] tokens, Object[] labels, boolean unwrap, boolean singleton, Position p) { - return new MyBody(loc, tag, tokens, labels, unwrap, singleton, p); - } - // Body ////////////////////////////////////////////////////////////////////////////// + public Tree expand1() throws Ambiguous { + Tree[] ret = new Tree[children.length]; + for(int i=0; i(location, head, ret, lift); + } - protected static interface Body extends GraphViz.ToGraphViz { - void expand(int i, TreeMaker h); - } - public abstract void edges(GraphViz.Node n); - public boolean ambiguous() { return false; } - protected static class MyBody extends Forest implements Body /* extends PrintableTree> implements */ { + void gather(HashSet> hf) { + hf.add(this); + for(Forest f : children) f.gather(hf); + } + void expand(HashSet> ht, HashSet> ignore, Tree bogus) { + if (ignore.contains(this)) { ht.add(bogus); return; } + expand(0, new Tree[children.length], ht, ignore, bogus); + } + private void expand(final int i, Tree[] ta, HashSet> ht, HashSet> ignore, + Tree bogus) { + if (i==children.length) { + ht.add(new Tree(location, head, ta, lift)); + } else { + HashSet> ht2 = new HashSet>(); + children[i].expand(ht2, ignore, bogus); + for(Tree tc : ht2) { + ta[i] = tc; + expand(i+1, ta, ht, ignore, bogus); + ta[i] = null; + } + } + } + + // GraphViz, ToInt ////////////////////////////////////////////////////////////////////////////// public boolean isTransparent() { return false; } public boolean isHidden() { return false; } public GraphViz.Node toGraphViz(GraphViz gv) { if (gv.hasNode(this)) return gv.createNode(this); GraphViz.Node n = gv.createNode(this); - n.label = StringUtil.escapify(headToString()==null?"":headToString(), "\r\n"); + n.label = headToString()==null?"":headToString(); n.directed = true; - n.comment = reduction==null?null:reduction+""; edges(n); return n; } - boolean edges = false; + boolean edges = false; // FIXME ?? public void edges(GraphViz.Node n) { if (edges) return; edges = true; - for(int i=0; i void visit(Invokable,B,C> ivbc, B b, C c) { - ivbc.invoke(this, b, c); - } + protected String headToString() { return head==null?null:head.toString(); } + protected String headToJava() { return "null"; } + protected String left() { return "{"; } + protected String right() { return "}"; } + protected boolean ignoreSingleton() { return false; } + } - private final Input.Location location; - private final T tag; - private final Forest[] tokens; - private final Object[] labels; - private final boolean unwrap; - private final boolean singleton; - private final Sequence.Position reduction; - private MyBody(Input.Location loc, T tag, Forest[] tokens, Object[] labels, boolean unwrap, boolean singleton, Position reduction) { - this.location = loc; - this.tag = tag; - this.tokens = tokens==null ? emptyForestArray : new Forest[tokens.length]; - if (tokens != null) System.arraycopy(tokens, 0, this.tokens, 0, tokens.length); - if (tokens != null) for(int i=0; i h) { - if (singleton) { - tokens[0].visit(h, null, i); - return; - } - if (i==0) h.start(tag, location); + // Many ////////////////////////////////////////////////////////////////////////////// - if (i==tokens.length) { - h.finish(tag, location); + /** An "ambiguity node"; this is immutable once it has been "looked at" */ + static class Many extends Forest { - } else if (unwrap && i==tokens.length-1) { - if (tokens[i] != null) - tokens[i].visit(h, null, 0); + private FastSet> hp = new FastSet>(); + private boolean touched = false; - } else { - tokens[i].visit(new TreeMaker(h.toss) { - public void start(T head, Input.Location loc) { } - public void addTree(Tree t, Object label) { toks.add(t); labs.add(label); } - public void finish(T head, Input.Location loc) { - int old = h.toks.size(); - h.addTree(new Tree(loc, head, toks.toArray(tree_hint), labs.toArray(string_hint)), labels==null?null:labels[i]); - expand(i+1, h); - while(h.toks.size() > old) h.toks.remove(h.toks.size()-1); - while(h.labs.size() > old) h.labs.remove(h.labs.size()-1); - } - }, null, null); - } - } + public Many() { } - protected String headToString() { return tag==null?null:tag.toString(); } - protected String headToJava() { return null; } - protected String left() { return "{"; } - protected String right() { return "}"; } - protected boolean ignoreSingleton() { return false; } - } + public Input.Region getRegion() { return hp.iterator().next().getRegion(); } // all should be identical + public Tree expand1() throws Ambiguous { + touched(); + if (hp.size() > 1) { + HashSet> hf0 = new HashSet>(); + Iterator> ih = hp.iterator(); + ih.next().gather(hf0); + for(Forest f : hp) { + HashSet> hf1 = new HashSet>(); + f.gather(hf1); + hf0.retainAll(hf1); + } + HashSet> ht = new HashSet>(); + expand(ht, hf0, new Tree(null, "*")); + throw new Ambiguous((Forest)this, + (HashSet>)(Object)ht); + } + return hp.iterator().next().expand1(); + } + + void gather(HashSet> ht) { + touched(); + + // FIXME: do something more sensible here + if (ht.contains(this)) { + System.err.println("WARNING: grammar produced a circular forest\n" + this); + //throw new Error("grammar produced a circular forest:\n" + this); + return; + } - // Ref ////////////////////////////////////////////////////////////////////////////// + ht.add(this); + for(Forest f : hp) f.gather(ht); + } - /** - * This class represents a partially complete collection of - * forests to be viewed as a forest at some later date; once - * viewed, it becomes immutable - */ - static class Ref extends Forest { - public boolean ambiguous() { + private void touched() { + if (touched) return; + touched = true; + /* + FastSet> f2 = new FastSet>(); + for(Forest f : hp) + if (f instanceof Forest.One) f2.add(f); + else for(Forest ff : ((Forest.Many)f)) + f2.add(ff); + hp = f2; + */ + } + public boolean contains(Forest f) { + touched(); + return hp.contains(f); + } + public void merge(Forest p) { + if (touched) throw new RuntimeException("attempt to merge() on a Forest.Many that has already been examined"); + if (p==this) throw new RuntimeException("attempt to merge() a Forest.Many to itself!"); + hp.add(p, true); + } + boolean ambiguous() { + touched(); if (hp.size()==0) return false; if (hp.size()==1) return hp.iterator().next().ambiguous(); return true; } - private FastSet> hp = new FastSet>(); - public Ref() { } - public int toInt() { - if (hp.size()==1) return hp.iterator().next().toInt(); - return super.toInt(); + + void expand(HashSet> ht, HashSet> ignore, Tree bogus) { + touched(); + if (ignore.contains(this)) { ht.add(bogus); return; } + for (Forest f : hp) f.expand(ht, ignore, bogus); } - public void merge(Forest p) { if (p!=this) hp.add(p, true); } + + + // GraphViz, ToInt ////////////////////////////////////////////////////////////////////////////// public boolean isTransparent() { return hp.size()==1; } public boolean isHidden() { return hp.size()==0; } @@ -179,7 +217,6 @@ public abstract class Forest /*extends PrintableTree>*/ for(Forest f : hp) f.edges(n); } public GraphViz.Node toGraphViz(GraphViz gv) { - //if (hp.size()==0) return null; if (hp.size()==1) return hp.iterator().next().toGraphViz(gv); if (gv.hasNode(this)) return gv.createNode(this); GraphViz.Node n = gv.createNode(this); @@ -188,45 +225,6 @@ public abstract class Forest /*extends PrintableTree>*/ for(Forest f : hp) n.edge(f, null); return n; } - - public void visit(Invokable,B,C> ivbc, B b, C c) { - if (hp==null) return; - for(Forest f : hp) - f.visit(ivbc, b, c); - } - public Forest resolve() { return this; } - } - - public abstract void visit(Invokable,B,C> ivbc, B b, C c); - private static class TreeMaker2 extends TreeMaker { - private TreeConsumer tc; - public TreeMaker2(boolean toss, TreeConsumer tc) { super(toss); this.tc = tc; } - public void finish(T head, Input.Location loc) { tc.addTree(new Tree(loc, head, toks.toArray(tree_hint), labs.toArray(string_hint)));; } - public void start(T head, Input.Location loc) { } - public void addTree(Tree t, Object label) { toks.add(t); labs.add(label); } - } - private static abstract class TreeMaker implements Invokable,Boolean,Integer>/*, TreeConsumer*/ { - public ArrayList> toks = new ArrayList>(); - public ArrayList labs = new ArrayList(); - private boolean toss; - protected T head; - public TreeMaker(boolean toss) { this.toss = toss; } - public abstract void start(T head, Input.Location loc); - public abstract void finish(T head, Input.Location loc); - public abstract void addTree(Tree t, Object label); - public void invoke(Forest.Body bod, Boolean o, Integer i) { - if (i==null) { - ArrayList> toks = this.toks; - this.toks = new ArrayList>(); - ArrayList labs = this.labs; - this.labs = new ArrayList(); - bod.expand(0, this); - this.toks = toks; - this.labs = labs; - } else { - bod.expand(i, this); - } - } } // Statics ////////////////////////////////////////////////////////////////////////////// @@ -236,7 +234,7 @@ public abstract class Forest /*extends PrintableTree>*/ private static final Forest[] emptyForestArray = new Forest[0]; protected String headToString() { return null; } - protected String headToJava() { return null; } + protected String headToJava() { return "null"; } protected String left() { return ""; } protected boolean ignoreSingleton() { return true; }