X-Git-Url: http://git.megacz.com/?p=sbp.git;a=blobdiff_plain;f=src%2Fedu%2Fberkeley%2Fsbp%2FForest.java;h=cf64ed272a57322dd12473acf5c44049a07bf920;hp=7fde86e681d3ec06854a39ec798576b0b9430559;hb=dc9bb3a45ed306e2e35549076842b3e74efecb48;hpb=a26089cd0d7c95cad657b745e836cb4cba35a97a diff --git a/src/edu/berkeley/sbp/Forest.java b/src/edu/berkeley/sbp/Forest.java index 7fde86e..cf64ed2 100644 --- a/src/edu/berkeley/sbp/Forest.java +++ b/src/edu/berkeley/sbp/Forest.java @@ -1,78 +1,93 @@ +// Copyright 2006 all rights reserved; see LICENSE file for BSD-style license + package edu.berkeley.sbp; -import edu.berkeley.sbp.*; -import edu.berkeley.sbp.Sequence.Position; import edu.berkeley.sbp.util.*; import java.io.*; import java.util.*; -import java.lang.reflect.*; - -/** an efficient representation of a collection of trees (Tomita's shared packed parse forest) */ -public abstract class Forest /*extends PrintableTree>*/ - implements IntegerMappable, - GraphViz.ToGraphViz { - private static int master_idx = 0; - private final int idx = master_idx++; - public int toInt() { return idx; } +/** + * + * An efficient representation of a collection of trees (Tomita's + * shared packed parse forest). + * + */ +public abstract class Forest implements GraphViz.ToGraphViz { /** assume that this forest contains exactly one tree and return it; otherwise throw an exception */ - public abstract Tree expand1() throws Ambiguous; + public abstract Tree expand1() throws Ambiguous; /** expand this forest into a set of trees */ - public void expand(HashSet> ht) { expand(ht, new HashSet>(), null); } - public abstract void expand(HashSet> ht, HashSet> ignore, Tree bogus); - public abstract void gather(HashSet> ignore); - public HashSet> expand(boolean toss) { - HashSet> ret = new HashSet>(); - expand(ret); - return ret; + public Iterable> expand() { + HashSet> ht = new HashSet>(); + expand(ht, new HashSet>(), null); + return ht; } - public static Forest create(Input.Region loc, T tag, Forest[] tokens, boolean unwrap) { - return new Body(loc, tag, tokens, unwrap); + /** returns the input Region which this Forest was parsed from */ + public abstract Input.Region getRegion(); + + // Package-Private ////////////////////////////////////////////////////////////////////////////// + + static Forest create(Input.Region region, NodeType head, Forest[] children, boolean lift) { + if (region == null) throw new RuntimeException("invoked Forest.create(region=null) -- this should never happen"); + return new One(region, head, children, lift); } - public abstract void edges(GraphViz.Node n); - public boolean ambiguous() { return false; } - // Body ////////////////////////////////////////////////////////////////////////////// + /** create a new forest */ + public static Forest create(Input.Region region, NodeType head, Forest[] children) { + return Forest.create(region, head, children, false); } + + abstract void expand(HashSet> ht, HashSet> ignore, Tree bogus); + abstract void gather(HashSet> ignore); + abstract void edges(GraphViz.Node n); + boolean ambiguous() { return false; } + + // One ////////////////////////////////////////////////////////////////////////////// - public /*protected*/ static class Body extends Forest /* extends PrintableTree> implements */ { + /** A "single" forest with a head and child subforests */ + private static class One extends Forest { private final Input.Region location; - private final T tag; - private final Forest[] tokens; - private final boolean unwrap; + private final NodeType head; + private final Forest[] children; + + /** if true, the last child's children are considered children of this node */ + private final boolean lift; - private Body(Input.Region loc, T tag, Forest[] tokens, boolean unwrap) { + public Input.Region getRegion() { return location; } + + private One(Input.Region loc, NodeType head, Forest[] children, boolean lift) { this.location = loc; - this.tag = tag; - this.tokens = tokens==null ? emptyForestArray : new Forest[tokens.length]; - if (tokens != null) System.arraycopy(tokens, 0, this.tokens, 0, tokens.length); - if (tokens != null) for(int i=0; i expand1() throws Ambiguous { - Tree[] ret = new Tree[tokens.length]; - for(int i=0; i(location, tag, ret, unwrap); + public Tree expand1() throws Ambiguous { + Tree[] ret = new Tree[children.length]; + for(int i=0; i(location, head, ret, lift); } - public void gather(HashSet> hf) { + + void gather(HashSet> hf) { hf.add(this); - for(Forest f : tokens) f.gather(hf); + for(Forest f : children) f.gather(hf); } - public void expand(HashSet> ht, HashSet> ignore, Tree bogus) { + void expand(HashSet> ht, HashSet> ignore, Tree bogus) { if (ignore.contains(this)) { ht.add(bogus); return; } - expand(0, new Tree[tokens.length], ht, ignore, bogus); + expand(0, new Tree[children.length], ht, ignore, bogus); } - public void expand(final int i, Tree[] ta, HashSet> ht, HashSet> ignore, Tree bogus) { - if (i==tokens.length) { - ht.add(new Tree(location, tag, ta, unwrap)); + private void expand(final int i, Tree[] ta, HashSet> ht, HashSet> ignore, + Tree bogus) { + if (i==children.length) { + ht.add(new Tree(location, head, ta, lift)); } else { - HashSet> ht2 = new HashSet>(); - tokens[i].expand(ht2, ignore, bogus); - for(Tree tc : ht2) { + HashSet> ht2 = new HashSet>(); + children[i].expand(ht2, ignore, bogus); + for(Tree tc : ht2) { ta[i] = tc; expand(i+1, ta, ht, ignore, bogus); ta[i] = null; @@ -92,20 +107,20 @@ public abstract class Forest /*extends PrintableTree>*/ edges(n); return n; } - boolean edges = false; + boolean edges = false; // FIXME ?? public void edges(GraphViz.Node n) { if (edges) return; edges = true; - for(int i=0; i /*extends PrintableTree>*/ } - // Ref ////////////////////////////////////////////////////////////////////////////// + // Many ////////////////////////////////////////////////////////////////////////////// + + /** An "ambiguity node"; this is immutable once it has been "looked at" */ + static class Many extends Forest { - /** - * This class represents a partially complete collection of - * forests to be viewed as a forest at some later date; once - * viewed, it becomes immutable - */ - static class Ref extends Forest { - public HashSet parents = new HashSet(); - private FastSet> hp = new FastSet>(); + private FastSet> hp = new FastSet>(); + private boolean touched = false; - public Ref() { } + public Many() { } - public Tree expand1() throws Ambiguous { - if (hp.size() > 1) throw new Ambiguous(this); + public Input.Region getRegion() { return hp.iterator().next().getRegion(); } // all should be identical + + public Tree expand1() throws Ambiguous { + touched(); + if (hp.size() > 1) { + HashSet> hf0 = new HashSet>(); + Iterator> ih = hp.iterator(); + ih.next().gather(hf0); + for(Forest f : hp) { + HashSet> hf1 = new HashSet>(); + f.gather(hf1); + hf0.retainAll(hf1); + } + HashSet> ht = new HashSet>(); + expand(ht, hf0, new Tree(null, "*")); + throw new Ambiguous((Forest)this, + (HashSet>)(Object)ht); + } return hp.iterator().next().expand1(); } - public void gather(HashSet> ht) { + void gather(HashSet> ht) { + touched(); + + // FIXME: do something more sensible here + if (ht.contains(this)) { + System.err.println("WARNING: grammar produced a circular forest\n" + this); + //throw new Error("grammar produced a circular forest:\n" + this); + return; + } + ht.add(this); - for(Forest f : hp) f.gather(ht); + for(Forest f : hp) f.gather(ht); } - public Forest resolve() { return this; } - public void expand(HashSet> ht, HashSet> ignore, Tree bogus) { - if (ignore.contains(this)) { ht.add(bogus); return; } - for (Forest f : hp) f.expand(ht, ignore, bogus); + private void touched() { + if (touched) return; + touched = true; + /* + FastSet> f2 = new FastSet>(); + for(Forest f : hp) + if (f instanceof Forest.One) f2.add(f); + else for(Forest ff : ((Forest.Many)f)) + f2.add(ff); + hp = f2; + */ + } + public boolean contains(Forest f) { + touched(); + return hp.contains(f); + } + public void merge(Forest p) { + if (touched) throw new RuntimeException("attempt to merge() on a Forest.Many that has already been examined"); + if (p==this) throw new RuntimeException("attempt to merge() a Forest.Many to itself!"); + hp.add(p, true); } - public boolean contains(Forest f) { return hp.contains(f); } - public void merge(Forest p) { if (p!=this) hp.add(p, true); } - public boolean ambiguous() { + boolean ambiguous() { + touched(); if (hp.size()==0) return false; if (hp.size()==1) return hp.iterator().next().ambiguous(); return true; } + void expand(HashSet> ht, HashSet> ignore, Tree bogus) { + touched(); + if (ignore.contains(this)) { ht.add(bogus); return; } + for (Forest f : hp) f.expand(ht, ignore, bogus); + } + + // GraphViz, ToInt ////////////////////////////////////////////////////////////////////////////// - public int toInt() { - if (hp.size()==1) return hp.iterator().next().toInt(); - return super.toInt(); - } public boolean isTransparent() { return hp.size()==1; } public boolean isHidden() { return hp.size()==0; } public void edges(GraphViz.Node n) { @@ -162,7 +217,6 @@ public abstract class Forest /*extends PrintableTree>*/ for(Forest f : hp) f.edges(n); } public GraphViz.Node toGraphViz(GraphViz gv) { - //if (hp.size()==0) return null; if (hp.size()==1) return hp.iterator().next().toGraphViz(gv); if (gv.hasNode(this)) return gv.createNode(this); GraphViz.Node n = gv.createNode(this);