X-Git-Url: http://git.megacz.com/?p=sbp.git;a=blobdiff_plain;f=src%2Fedu%2Fberkeley%2Fsbp%2FSequence.java;h=430f29813c37952956b6cf0762f4a4c03219840f;hp=2530a211cf0a996591a4248f6ab83e447fa66579;hb=260e46cff8995fb5a01e94c1a707d0ffff0a5382;hpb=9b031db4cefc550c82a8bb6da3b061d3790c2cdc diff --git a/src/edu/berkeley/sbp/Sequence.java b/src/edu/berkeley/sbp/Sequence.java index 2530a21..430f298 100644 --- a/src/edu/berkeley/sbp/Sequence.java +++ b/src/edu/berkeley/sbp/Sequence.java @@ -1,3 +1,5 @@ +// Copyright 2006-2007 all rights reserved; see LICENSE file for BSD-style license + package edu.berkeley.sbp; import edu.berkeley.sbp.util.*; import edu.berkeley.sbp.*; @@ -8,148 +10,230 @@ import java.lang.reflect.*; import java.lang.ref.*; /** juxtaposition; zero or more adjacent Elements; can specify a rewriting */ -public abstract class Sequence extends Element implements Iterable { +public abstract class Sequence implements Iterable, SequenceOrElement { protected final Element[] elements; - final HashSet hated = new HashSet(); + boolean needed_or_hated = false; + boolean in_a_union = false; final HashSet needs = new HashSet(); final HashSet hates = new HashSet(); - final Position firstp; + // FIXME: these are ugly -- migrate into Grammar + HashMap canNeed = new HashMap(); + HashMap canKill = new HashMap(); - Atom follow = null; + final Position firstp; - // Static Constructors ////////////////////////////////////////////////////////////////////////////// + Atom follow = null; - abstract Sequence _clone(); - Sequence dup() { - Sequence ret = _clone(); - for(Sequence s : needs) { ret.needs.add(s); } - for(Sequence s : hates) { ret.hates.add(s); s.hated.add(ret); } - ret.follow = follow; + private static int global_sernum = 0; + private int sernum = global_sernum++; + int[] needs_int() { + int[] ret = new int[needs.size()]; + int i = 0; + for(Sequence s : needs) ret[i++] = s.sernum; + return ret; + } + int[] hates_int() { + int[] ret = new int[hates.size()]; + int i = 0; + for(Sequence s : hates) ret[i++] = s.sernum; return ret; } - /** create an empty sequence (matches the empty string) */ - public static Sequence create() { return new Sequence.Constant.Empty(); } + + // Static Constructors ////////////////////////////////////////////////////////////////////////////// /** create a sequence of one element */ public static Sequence create(Element e) { return create(new Element[] { e }, 0); } /** create a sequence which drops the result of all but one of its element */ - public static Sequence create(Element[] e, int idx) { return new Singleton(e, idx); } + public static Sequence create(Element[] e, int which) { + return new Singleton(e, which); } - /** after matching the sequence, insert a constant into the output tree */ - public static Sequence newConstantSequence(Element[] e, Object o) { return new Constant(e, o); } + /** create a sequence which always evaluates to a constant result */ + public static Sequence create(Object result, Element[] e) { + return new RewritingSequence(result, e, trues(e.length)); } + private static boolean[] trues(int length) { + boolean[] ret = new boolean[length]; + for(int i=0; ie whose corresponding boolean in drops + * @param drop only elements of e whose corresponding boolean in drops * is false will be included in the output tree - * @param unwrap if true, all children of the last child (ie - * grandchildren) are promoted to children of this node; this is very useful for matching repetitions + * @param lifts which (if any) child trees to lift **/ - public static Sequence create(Object tag, Element[] e, boolean[] drops, boolean unwrap) { - return unwrap - ? new Unwrap(e, tag, drops) - : new RewritingSequence(tag, e, drops); + public static Sequence create(Object head, Element[] e, boolean[] drop) { + return create(head, e, drop, new boolean[e.length]); } + public static Sequence create(Object head, Element[] e, boolean[] drop, boolean[] lifts) { + if (lifts==null) lifts = new boolean[e.length]; + return new RewritingSequence(head, e, drop, lifts); } - //////////////////////////////////////////////////////////////////////////////// - /** return a new sequence identical to this one, but with a positive conjunct s */ - public Sequence and(Sequence s) { Sequence ret = dup(); ret.needs.add(s); return ret; } + public Sequence and(Sequence s) { + if (s.in_a_union) + throw new RuntimeException("you may not use a sequence as a conjunct if it belongs to a Union"); + Sequence ret = dup(); + ret.needs.add(s); + s.needed_or_hated=true; + return ret; + } /** return a new sequence identical to this one, but with a negative conjunct s */ - public Sequence not(Sequence s) { Sequence ret = dup(); ret.hates.add(s); s.hated.add(ret); return ret; } + public Sequence andnot(Sequence s) { + if (s.in_a_union) + throw new RuntimeException("you may not use a sequence as a conjunct if it belongs to a Union"); + Sequence ret = dup(); + ret.hates.add(s); + s.needed_or_hated=true; + return ret; + } /** return a new sequence identical to this one, but with a follow-set restricted to a */ public Sequence followedBy(Atom a) { Sequence ret = dup(); ret.follow = a; return ret; } + //////////////////////////////////////////////////////////////////////////////// + + abstract Sequence _clone(); + private Sequence dup() { + Sequence ret = _clone(); + for(Sequence s : needs) { ret.needs.add(s); } + for(Sequence s : hates) { ret.hates.add(s); } + ret.follow = follow; + return ret; + } + Iterable needs() { return needs; } Iterable hates() { return hates; } - Position firstp() { return firstp; } + Pos firstp() { return firstp; } + Pos lastp() { return firstp().last(); } public Iterator iterator() { return new ArrayIterator(elements); } protected Sequence(Element[] elements) { this.elements = elements; - this.firstp = new Position(0); + for(int i=0; i Forest postReduce(Input.Region loc, Forest[] args, Position p); // Position ////////////////////////////////////////////////////////////////////////////// - /** the imaginary position before or after an element of a sequence; corresponds to an "LR item" */ - class Position implements IntegerMappable { + static abstract class Pos implements IntegerMappable, Comparable, Serializable { + + public int ord = -1; + private transient Sequence owner; + + public int ord() { return ord; } + + final Forest[] holder; + + Pos(int len, Sequence owner) { + this.owner = owner; + this.holder = new Forest[len]; + } + + public abstract int provides(); + public abstract int[] needs(); + public abstract int[] hates(); + public abstract boolean owner_needed_or_hated(); - private Forest zero = null; - public Forest zero() { - if (zero != null) return zero; - if (pos > 0) throw new Error(); - return zero = rewrite(null); + public abstract boolean isFirst(); + public abstract boolean isLast(); + public abstract Pos last(); + public abstract Pos prev(); + public abstract Pos next(); + + /** the element which produces the sequence to which this Position belongs */ + public Sequence owner() { return owner; } + + abstract Element element(); + + public abstract int numPops(); + public abstract Forest rewrite(Input.Region loc); + } + + /** the imaginary position before or after an element of a sequence; corresponds to an "LR item" */ + private static class Position extends Pos implements IntegerMappable { + /* + public Pos getPos() { + return new DumbPos(elements.length, provides(), needs(), hates(), owner_needed_or_hated(), numPops(), + public int provides(); + public int[] needs(); + public int[] hates(); + public boolean owner_needed_or_hated(); + public int numPops(); + public Forest rewrite(Input.Region loc) + }; } + */ + public int numPops() { return pos; } + final int pos; + private final Position next; + private final Position prev; - final int pos; - private final Position next; - final Forest[] holder; + public int provides() { return owner().sernum; } + public int[] needs() { return owner().needs_int(); } + public int[] hates() { return owner().hates_int(); } + public boolean owner_needed_or_hated() { return owner().needed_or_hated; } - private Position(int pos) { + private Position(Sequence owner, int pos, Position prev) { + super(owner.elements.length,owner); this.pos = pos; - this.next = pos==elements.length ? null : new Position(pos+1); - this.holder = new Forest[elements.length]; + this.next = pos==owner.elements.length ? null : new Position(owner, pos+1, this); + this.prev = prev; } - boolean isFirst() { return pos==0; } + public int compareTo(Pos p) { + return ord - ((Position)p).ord; + } - /** the element immediately after this Position, or null if this is the last Position */ - public Element element() { return pos>=elements.length ? null : elements[pos]; } + public boolean isFirst() { return pos==0; } + public int pos() { return pos; } - /** the element which produces the sequence to which this Position belongs */ - public Sequence owner() { return Sequence.this; } + /** the element immediately after this Position, or null if this is the last Position */ + public Element element() { return pos>=owner().elements.length ? null : owner().elements[pos]; } /** the next Position (the Position after this.element()) */ public Position next() { return next; } /** true iff this Position is the last one in the sequence */ public boolean isLast() { return next()==null; } + public Position last() { return isLast() ? this : next().last(); } + public Position prev() { return prev; } // Position ///////////////////////////////////////////////////////////////////////////////// - final Forest rewrite(Input.Region loc) { return rewrite(loc, true); } - private final Forest rewrite(Input.Region loc, boolean epsilonCheck) { - if (epsilonCheck && this==firstp()) return epsilonForm(); + public final Forest rewrite(Input.Region loc) { + if (isFirst()) return owner().epsilonForm(loc); for(int i=0; i ret = Sequence.this.postReduce(loc, holder, this); - //for(int k=0; k { } private static int master_position_idx = 0; + // toString ////////////////////////////////////////////////////////////////////////////// public String toString() { return toString(new StringBuffer(), false).toString(); } StringBuffer toString(StringBuffer sb) { return toString(sb, true); } StringBuffer toString(StringBuffer sb, boolean spacing) { for(int i=0; i "); sb.append(follow); } + for(Sequence s : needs) { + sb.append("& "); + sb.append(s); + } + for(Sequence s : hates) { + sb.append("&~ "); + sb.append(s); + } return sb; } - // Specialized Subclasses ////////////////////////////////////////////////////////////////////////////// - static class Constant extends Sequence { - private final Object result; - public Constant(Element[] e, Object result) { super(e); this.result = result; } - Sequence _clone() { return new Constant(elements, result); } - public Forest postReduce(Input.Region loc, Forest[] args, Position p) { - return (Forest)Forest.create(loc, result, null, false); - } - static class Drop extends Constant { - Sequence _clone() { return new Drop(elements); } - public Drop(Element[] e) { super(e, null); } - } - static class Empty extends Sequence.Constant.Drop { - Sequence _clone() { return new Empty(); } - public Empty() { super(new Element[] { }); } } - } - static class Singleton extends Sequence { private final int idx; public Singleton(Element e) { this(new Element[] { e }, 0); } public Singleton(Element[] e, int idx) { super(e); this.idx = idx; } public Forest postReduce(Input.Region loc, Forest[] args, Position p) { return args[idx]; } Sequence _clone() { return new Singleton(elements,idx); } - } - - static class Unwrap extends Sequence { - private boolean[] drops; - private final Object tag; - public Unwrap(Element[] e, Object tag) { super(e); this.drops = null; this.tag = tag; } - public Unwrap(Element[] e, Object tag, boolean[] drops) { super(e); this.drops = drops; this.tag = tag; } - Sequence _clone() { return new Unwrap(elements, tag, drops); } - public Forest postReduce(Input.Region loc, Forest[] args, Position p) { - for(int i=0; i[] args2 = new Forest[count]; - int j = 0; - for(int i=0; i tagf; - public RegionRewritingSequence(Functor tagfunctor, Element[] e, boolean[] drops) { - super(null, e, drops); - this.tagf = tagfunctor; - } - public Forest postReduce(Input.Region loc, Forest[] args, Position p) { - this.tag = tagf.invoke(loc); - Forest ret = super.postReduce(loc, args, p); - this.tag = null; - return ret; + Forest epsilonForm(Input.Region loc) { + return ((Union)elements[idx]).epsilonForm(loc); } } static class RewritingSequence extends Sequence { - /*private*/public /*final*/ Object tag; + private final Object tag; private final boolean[] drops; - private int count = 0; + private final boolean[] lifts; Sequence _clone() { return new RewritingSequence(tag, elements, drops); } public RewritingSequence(Object tag, Element[] e) { this(tag, e, null); } - public RewritingSequence(Object tag, Element[] e, boolean[] drops) { + public RewritingSequence(Object tag, Element[] e, boolean[] drops) { this(tag, e, drops, new boolean[e.length]); } + public RewritingSequence(Object tag, Element[] e, boolean[] drops, boolean[] lifts) { super(e); + if (tag==null) throw new Error(); this.tag = tag; this.drops = drops == null ? new boolean[e.length] : drops; + int count = 0; for(int i=0; i Forest postReduce(Input.Region loc, Forest[] args, Position p) { - Forest[] args2 = new Forest[count]; + Forest[] args2 = new Forest[lifts.length]; int j = 0; for(int i=0; i { if (spacing) for(int i=0; i<50-len; i++) sb.append(' '); return sb; } + Forest epsilonForm(Input.Region loc) { + return Forest.create(loc, tag, new Forest[0], lifts); + } } - }