--- /dev/null
// This file was derived from org.mozilla.javascript.TokenStream; it
// is covered by the NPL 1.1.

/**
 * The contents of this file are subject to the Netscape Public
 * License Version 1.1 (the "License"); you may not use this file
 * except in compliance with the License. You may obtain a copy of
 * the License at http://www.mozilla.org/NPL/
 *
 * Software distributed under the License is distributed on an "AS
 * IS" basis, WITHOUT WARRANTY OF ANY KIND, either express or
 * implied. See the License for the specific language governing
 * rights and limitations under the License.
 *
 * The Initial Developer of the Original Code is Netscape
 * Communications Corporation.
 *
 * Contributor(s): Roger Lawrence, Mike McCabe
 */

+package org.xwt.js;\r
+import java.io.*;\r
+\r
/**
 * Tokenizer for XWT scripts, derived from Rhino's TokenStream.
 *
 * Each call to {@link #getToken()} consumes one token from the underlying reader and
 * returns its type (one of the int constants below, or -1 at end of input).  Details of
 * the token are left in the {@link #op}, {@link #number} and {@link #string} fields.
 */
class Lexer {

    /** Character source: one character of pushback plus optional capture of the text read. */
    SmartReader in;

    /**
     * Operator subtype of the most recent token, for token types that carry one
     * (ASSIGN, EQOP, RELOP, SHOP, UNARYOP, PRIMARY).  Keywords always overwrite it
     * (with 0 when the keyword has no subtype); punctuation tokens without a subtype
     * leave the previous value in place.
     */
    int op;

    /**
     * Value of the most recent NUMBER token: the narrowest of Byte, Short or Integer that
     * holds an integer literal, otherwise a Double.
     */
    Number number;

    /** Text of the most recent NAME token, or the unescaped contents of the most recent STRING. */
    String string;

    public Lexer(Reader r) { in = new SmartReader(r); }

    // Token Constants //////////////////////////////////////////////////////////

    public final static int
        EOL          = 1,   // end of line
        RETURN       = 5,
        GOTO         = 6,
        BITOR        = 11,
        BITXOR       = 12,
        BITAND       = 13,
        EQ           = 14,
        NE           = 15,
        LT           = 16,
        LE           = 17,
        GT           = 18,
        GE           = 19,
        LSH          = 20,
        RSH          = 21,
        URSH         = 22,
        ADD          = 23,
        SUB          = 24,
        MUL          = 25,
        DIV          = 26,
        MOD          = 27,
        BITNOT       = 28,
        DELPROP      = 31,
        TYPEOF       = 32,
        NAME         = 44,
        NUMBER       = 45,
        STRING       = 46,
        NULL         = 49,
        THIS         = 50,
        FALSE        = 51,
        TRUE         = 52,
        SHEQ         = 53,  // shallow equality (===)
        SHNE         = 54,  // shallow inequality (!==)
        THROW        = 62,
        IN           = 63,
        INSTANCEOF   = 64,
        TRY          = 75,
        SEMI         = 89,  // semicolon
        LB           = 90,  // left bracket
        RB           = 91,  // right bracket
        LC           = 92,  // left curly brace
        RC           = 93,  // right curly brace
        LP           = 94,  // left paren
        RP           = 95,  // right paren
        COMMA        = 96,  // comma operator
        ASSIGN       = 97,  // assignment ops (= += -= etc.)
        HOOK         = 98,  // conditional (?:)
        COLON        = 99,  // colon
        OR           = 100, // logical or (||)
        AND          = 101, // logical and (&&)
        EQOP         = 102, // equality ops (== !=)
        RELOP        = 103, // relational ops (< <= > >=)
        SHOP         = 104, // shift ops (<< >> >>>)
        UNARYOP      = 105, // unary prefix operator
        INC          = 106, // increment (++)
        DEC          = 107, // decrement (--)
        DOT          = 108, // member operator (.)
        PRIMARY      = 109, // true, false, null, this
        FUNCTION     = 110, // function keyword

        IF           = 113, // if keyword
        ELSE         = 114, // else keyword
        SWITCH       = 115, // switch keyword
        CASE         = 116, // case keyword
        DEFAULT      = 117, // default keyword
        WHILE        = 118, // while keyword
        DO           = 119, // do keyword
        FOR          = 120, // for keyword
        BREAK        = 121, // break keyword
        CONTINUE     = 122, // continue keyword
        VAR          = 123, // var keyword
        WITH         = 124, // with keyword
        CATCH        = 125, // catch keyword
        FINALLY      = 126, // finally keyword
        RESERVED     = 127, // reserved keywords
        NOP          = 128, // NOP
        VOID         = 132, // void keyword
        ASSERT       = 150; // assert keyword


    // Predicates ///////////////////////////////////////////////////////////////////////

    /**
     * Returns true if s is non-empty, starts with a Java identifier-start character and
     * continues with Java identifier-part characters only.  Backslash escapes are not
     * accepted, matching getToken(), which rejects \\u escapes.
     */
    protected static boolean isJSIdentifier(String s) {
        int length = s.length();
        if (length == 0 || !Character.isJavaIdentifierStart(s.charAt(0))) return false;
        for (int i = 1; i < length; i++) {
            if (!Character.isJavaIdentifierPart(s.charAt(i))) return false;
        }
        return true;
    }

    private static boolean isAlpha(int c) { return ((c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z')); }
    private static boolean isDigit(int c) { return (c >= '0' && c <= '9'); }
    // currently not called from within this class
    private static boolean isLineBreak(int c) { return (c == '\n' || c == '\r' || c == 0x2028 || c == 0x2029); }

    /** Value of the hex digit c (0..15), or -1 if c is not a hex digit. */
    private static int xDigitToInt(int c) {
        if ('0' <= c && c <= '9') return c - '0';
        if ('a' <= c && c <= 'f') return c - ('a' - 10);
        if ('A' <= c && c <= 'F') return c - ('A' - 10);
        return -1;
    }

    /** True for space, tab, form feed, vertical tab, no-break space and Unicode space separators. */
    public static boolean isWhiteSpace(int c) {
        if (c == '\u0020' || c == '\u0009' || c == '\u000C' || c == '\u000B' || c == '\u00A0') return true;
        return Character.getType((char)c) == Character.SPACE_SEPARATOR;
    }


    // Token Subtype Handlers /////////////////////////////////////////////////////////

    /**
     * Classifies an identifier-shaped word.
     *
     * The word's length plus one distinguishing character select the single keyword it
     * could possibly be; a full string comparison then confirms or rejects that candidate.
     *
     * @param name the word to classify
     * @return the token type if name is a keyword (with this.op set to the keyword's
     *         subtype, or 0 if it has none), or -1 if name is an ordinary identifier
     * @throws IOException if name is exactly one of the keywords this dialect forbids
     *         (new, const, delete, instanceof)
     */
    private int getKeyword(String name) throws IOException {
        String candidate = null;    // the only keyword that name could be
        String banned = null;       // error message if the candidate is a forbidden keyword
        int id = -1;                // token type in the low byte, subtype in the bits above

        switch (name.length()) {
        case 2:
            switch (name.charAt(1)) {
            case 'f': candidate = "if"; id = IF; break;
            case 'n': candidate = "in"; id = RELOP | (IN << 8); break;
            case 'o': candidate = "do"; id = DO; break;
            }
            break;
        case 3:
            switch (name.charAt(0)) {
            case 'f': candidate = "for"; id = FOR; break;
            case 'i': candidate = "int"; id = RESERVED; break;
            case 'n': candidate = "new"; banned = "the new keyword is not permitted in XWT scripts"; break;
            case 't': candidate = "try"; id = TRY; break;
            case 'v': candidate = "var"; id = VAR; break;
            }
            break;
        case 4:
            switch (name.charAt(0)) {
            case 'b': candidate = "byte"; id = RESERVED; break;
            case 'c':
                if (name.charAt(3) == 'e') { candidate = "case"; id = CASE; }
                else if (name.charAt(3) == 'r') { candidate = "char"; id = RESERVED; }
                break;
            case 'e':
                if (name.charAt(3) == 'e') { candidate = "else"; id = ELSE; }
                else if (name.charAt(3) == 'm') { candidate = "enum"; id = RESERVED; }
                break;
            case 'g': candidate = "goto"; id = RESERVED; break;
            case 'l': candidate = "long"; id = RESERVED; break;
            case 'n': candidate = "null"; id = PRIMARY | (NULL << 8); break;
            case 't':
                if (name.charAt(3) == 'e') { candidate = "true"; id = PRIMARY | (TRUE << 8); }
                else if (name.charAt(3) == 's') { candidate = "this"; id = PRIMARY | (THIS << 8); }
                break;
            case 'v': candidate = "void"; id = UNARYOP | (VOID << 8); break;
            case 'w': candidate = "with"; id = WITH; break;
            }
            break;
        case 5:
            switch (name.charAt(2)) {
            case 'a': candidate = "class"; id = RESERVED; break;
            case 'e': candidate = "break"; id = BREAK; break;
            case 'i': candidate = "while"; id = WHILE; break;
            case 'l': candidate = "false"; id = PRIMARY | (FALSE << 8); break;
            case 'n':
                if (name.charAt(0) == 'c') { candidate = "const"; banned = "the const keyword is not permitted in XWT"; }
                else if (name.charAt(0) == 'f') { candidate = "final"; id = RESERVED; }
                break;
            case 'o':
                if (name.charAt(0) == 'f') { candidate = "float"; id = RESERVED; }
                else if (name.charAt(0) == 's') { candidate = "short"; id = RESERVED; }
                break;
            case 'p': candidate = "super"; id = RESERVED; break;
            case 'r': candidate = "throw"; id = THROW; break;
            case 't': candidate = "catch"; id = CATCH; break;
            }
            break;
        case 6:
            // note: "static" has no entry here, so it is lexed as an ordinary NAME
            switch (name.charAt(1)) {
            case 'a': candidate = "native"; id = RESERVED; break;
            case 'e':
                if (name.charAt(0) == 'd') { candidate = "delete"; banned = "the delete keyword is not permitted in XWT scripts"; }
                else if (name.charAt(0) == 'r') { candidate = "return"; id = RETURN; }
                break;
            case 'h': candidate = "throws"; id = RESERVED; break;
            case 'o': candidate = "double"; id = RESERVED; break;
            case 's': candidate = "assert"; id = ASSERT; break;
            case 'u': candidate = "public"; id = RESERVED; break;
            case 'w': candidate = "switch"; id = SWITCH; break;
            case 'y': candidate = "typeof"; id = UNARYOP | (TYPEOF << 8); break;
            }
            break;
        case 7:
            switch (name.charAt(1)) {
            case 'a': candidate = "package"; id = RESERVED; break;
            case 'e': candidate = "default"; id = DEFAULT; break;
            case 'i': candidate = "finally"; id = FINALLY; break;
            case 'o': candidate = "boolean"; id = RESERVED; break;
            case 'r': candidate = "private"; id = RESERVED; break;
            case 'x': candidate = "extends"; id = RESERVED; break;
            }
            break;
        case 8:
            switch (name.charAt(0)) {
            case 'a': candidate = "abstract"; id = RESERVED; break;
            case 'c': candidate = "continue"; id = CONTINUE; break;
            case 'd': candidate = "debugger"; id = RESERVED; break;
            case 'f': candidate = "function"; id = FUNCTION; break;
            case 'v': candidate = "volatile"; id = RESERVED; break;
            }
            break;
        case 9:
            switch (name.charAt(0)) {
            case 'i': candidate = "interface"; id = RESERVED; break;
            case 'p': candidate = "protected"; id = RESERVED; break;
            case 't': candidate = "transient"; id = RESERVED; break;
            }
            break;
        case 10:
            if (name.charAt(1) == 'm') { candidate = "implements"; id = RESERVED; }
            else if (name.charAt(1) == 'n') { candidate = "instanceof"; banned = "the instanceof keyword is not permitted in XWT scripts"; }
            break;
        case 12:
            candidate = "synchronized"; id = RESERVED;
            break;
        }

        if (candidate == null || !candidate.equals(name)) return -1;

        // Only reject a forbidden keyword once the whole word is known to match;
        // identifiers such as "design" or "initialize" merely share a prefix with one.
        if (banned != null) throw new IOException(banned);

        this.op = id >> 8;
        return id & 0xff;
    }

    /**
     * Reads the rest of an identifier or keyword.
     *
     * @param c the first character of the word, already consumed from the reader
     * @return the keyword's token type, or NAME with this.string set to the identifier
     */
    private int getIdentifier(int c) throws IOException {
        in.startString();   // capture begins with the character already consumed
        do { c = in.read(); } while (c != -1 && Character.isJavaIdentifierPart((char)c));
        in.unread();        // hand the terminating character back
        String str = in.getString();
        int result = getKeyword(str);
        if (result != -1) return result;
        this.string = str;
        return NAME;
    }

    /**
     * Reads a numeric literal: decimal (with optional fraction and exponent), octal
     * (leading 0 followed by a digit) or hexadecimal (leading 0x / 0X).
     *
     * @param c the first character of the literal (a digit or '.'), already consumed
     * @return NUMBER, with this.number set to the literal's value
     * @throws IOException if the literal is malformed
     */
    private int getNumber(int c) throws IOException {
        int base = 10;
        boolean isInteger = true;
        in.startString();   // capture begins with the character already consumed

        // figure out what base we're using
        if (c == '0') {
            c = in.read();
            if (c == 'x' || c == 'X') {
                base = 16;
                c = in.read();
                in.startString();   // restart capture at the first digit after "0x"
            } else if (isDigit(c)) {
                base = 8;
            }
        }

        // digits of the integer part; letters only count as digits in base 16
        while (0 <= xDigitToInt(c) && !(base < 16 && isAlpha(c))) c = in.read();

        if (base == 10 && (c == '.' || c == 'e' || c == 'E')) {
            isInteger = false;
            if (c == '.') do { c = in.read(); } while (isDigit(c));
            if (c == 'e' || c == 'E') {
                c = in.read();
                if (c == '+' || c == '-') c = in.read();
                if (!isDigit(c)) throw new IOException("msg.missing.exponent");
                do { c = in.read(); } while (isDigit(c));
            }
        }
        in.unread();        // hand the terminating character back

        String numString = in.getString();
        double dval;
        long longval = 0;
        if (isInteger) {
            try {
                longval = Long.parseLong(numString, base);
                dval = (double)longval;
            } catch (NumberFormatException ex) {
                // Either a digit that is illegal in this base ("08", "0x") or a value
                // that does not fit in a long; only the latter can be rescued, and only
                // for decimal literals.
                if (base != 10) throw new IOException("msg.caught.nfe");
                isInteger = false;
                try { dval = (Double.valueOf(numString)).doubleValue(); }
                catch (NumberFormatException ex2) { throw new IOException("msg.caught.nfe"); }
            }
        } else {
            try { dval = (Double.valueOf(numString)).doubleValue(); }
            catch (NumberFormatException ex) { throw new IOException("msg.caught.nfe"); }
        }

        // box integers in the narrowest type that holds them
        if (!isInteger) this.number = new Double(dval);
        else if (Byte.MIN_VALUE <= longval && longval <= Byte.MAX_VALUE) this.number = new Byte((byte)longval);
        else if (Short.MIN_VALUE <= longval && longval <= Short.MAX_VALUE) this.number = new Short((short)longval);
        else if (Integer.MIN_VALUE <= longval && longval <= Integer.MAX_VALUE) this.number = new Integer((int)longval);
        else this.number = new Double((double)longval);
        return NUMBER;
    }

    /**
     * Reads a quoted string literal.
     *
     * @param c the opening quote character (single or double), already consumed
     * @return STRING, with this.string set to the literal's contents, escapes resolved
     * @throws IOException if the literal runs into a newline or end of input, or uses an
     *         unsupported escape sequence
     */
    private int getString(int c) throws IOException {
        StringBuffer stringBuf = null;  // only allocated once an escape is seen
        int quoteChar = c;
        c = in.read();
        in.startString(); // start after the first "
        while (c != quoteChar) {
            if (c == '\n' || c == -1) throw new IOException("msg.unterminated.string.lit");
            if (c == '\\') {
                if (stringBuf == null) {
                    // First escape: switch from raw capture to building the value by hand.
                    in.unread(); // Don't include the backslash
                    stringBuf = new StringBuffer(in.getString());
                    in.read();
                }
                switch (c = in.read()) {
                case 'b': c = '\b'; break;
                case 'f': c = '\f'; break;
                case 'n': c = '\n'; break;
                case 'r': c = '\r'; break;
                case 't': c = '\t'; break;
                case 'v': c = '\u000B'; break;
                case '\\': case '\'': case '"': break;  // the character stands for itself
                case -1: throw new IOException("msg.unterminated.string.lit");
                default: throw new IOException("\\u and \\0 escapes not currently supported -- use XML entities");
                }
            }
            if (stringBuf != null) stringBuf.append((char) c);
            c = in.read();
        }
        if (stringBuf != null) this.string = stringBuf.toString();
        else {
            in.unread(); // miss the trailing "
            this.string = in.getString();
            in.read();
        }
        return STRING;
    }

    // hack because you can't do "foo ? 1 : (bar(); 2)" in Java
    /** Stores set in this.op and returns ret, so both can happen inside one expression. */
    final int op(int set, int ret) { this.op = set; return ret; }

    /**
     * Consumes and returns the next token.  Whitespace and comments are skipped; a
     * newline is reported as EOL.
     *
     * @return the token type, or -1 at end of input
     * @throws IOException on a read error or on malformed input
     */
    public int getToken() throws IOException {
        int c;
        // Skip horizontal whitespace.  A carriage return is skipped as well, so that a
        // CRLF pair yields exactly one EOL (from its line feed).
        do { c = in.read(); } while (c != '\n' && (isWhiteSpace(c) || c == '\r'));
        if (c == -1) return -1;
        if (c == '\\' && in.peek() == 'u') throw new IOException("\\u and \\0 escapes not currently supported -- use XML entities");
        if (Character.isJavaIdentifierStart((char)c)) return getIdentifier(c);
        if (isDigit(c) || (c == '.' && isDigit(in.peek()))) return getNumber(c);
        if (c == '"' || c == '\'') return getString(c);
        switch (c) {
        case '\n': return EOL;
        case ';': return SEMI;
        case '[': return LB;
        case ']': return RB;
        case '{': return LC;
        case '}': return RC;
        case '(': return LP;
        case ')': return RP;
        case ',': return COMMA;
        case '?': return HOOK;
        case ':': return COLON;
        case '.': return DOT;
        case '|':
            if (in.match('|')) return OR;
            if (in.match('=')) return op(BITOR, ASSIGN);
            return BITOR;
        case '^':
            if (in.match('=')) return op(BITXOR, ASSIGN);
            return BITXOR;
        case '&':
            if (in.match('&')) return AND;
            if (in.match('=')) return op(BITAND, ASSIGN);
            return BITAND;
        case '=':
            if (!in.match('=')) return op(NOP, ASSIGN);
            return op(in.match('=') ? SHEQ : EQ, EQOP);
        case '!':
            if (!in.match('=')) return op(NOP, UNARYOP);
            return op(in.match('=') ? SHNE : NE, EQOP);
        case '%': return op(MOD, in.match('=') ? ASSIGN : MOD);
        case '~': return op(BITNOT, UNARYOP);
        case '+':
            if (in.match('=')) return op(ADD, ASSIGN);
            if (in.match('+')) return INC;
            return ADD;
        case '-':
            if (in.match('=')) return op(SUB, ASSIGN);
            if (in.match('-')) return DEC;
            return SUB;
        case '*':
            if (in.match('=')) return op(MUL, ASSIGN);
            return MUL;
        case '<':
            if (!in.match('<')) return op(in.match('=') ? LE : LT, RELOP);
            return op(LSH, in.match('=') ? ASSIGN : SHOP);
        case '>':
            if (!in.match('>')) return op(in.match('=') ? GE : GT, RELOP);
            if (in.match('>')) return op(URSH, in.match('=') ? ASSIGN : SHOP);
            return op(RSH, in.match('=') ? ASSIGN : SHOP);
        case '/':
            if (in.match('=')) return op(DIV, ASSIGN);
            if (in.match('/')) {
                // line comment: skip to the newline, but leave it to be reported as EOL
                do { c = in.read(); } while (c != -1 && c != '\n');
                in.unread();
                return getToken();
            }
            if (!in.match('*')) return DIV;
            // block comment: runs to the next "*/"
            while ((c = in.read()) != -1 && !(c == '*' && in.match('/'))) {
                if (c != '/' || !in.match('*')) continue;
                // saw "/*" inside the comment: "/*/" closes it, anything else is an error
                if (in.match('/')) return getToken();
                throw new IOException("msg.nested.comment");
            }
            if (c == -1) throw new IOException("msg.unterminated.comment");
            return getToken();  // `goto retry'
        default: throw new IOException("illegal character: " + c);
        }
    }

    /**
     * Reader wrapper offering peek/match lookahead, a single character of pushback, and
     * capture of the characters consumed between startString() and getString().
     */
    private static class SmartReader {
        PushbackReader reader = null;

        /** Result of the most recent read(); -1 before the first read and at end of input. */
        int lastread = -1;

        // FIXME: could be much more efficient
        /** Text captured since startString(); null while no capture is in progress. */
        StringBuffer accumulator = null;

        public SmartReader(Reader r) { reader = new PushbackReader(r); }

        /**
         * Pushes the most recently read character back and drops it from the capture.
         * Does nothing after end of input: there is no character to give back, and the
         * underlying reader will report end of input again by itself.
         */
        public void unread() throws IOException {
            if (lastread == -1) return;
            reader.unread(lastread);
            if (accumulator != null && accumulator.length() > 0) accumulator.setLength(accumulator.length() - 1);
        }

        /** Consumes the next character if it equals c; returns whether it did. */
        public boolean match(char c) throws IOException {
            if (peek() != c) return false;
            read();
            return true;
        }

        /** Returns the next character without consuming it, or -1 at end of input. */
        public int peek() throws IOException {
            int peeked = reader.read();
            if (peeked != -1) reader.unread(peeked);
            return peeked;
        }

        /** Consumes and returns the next character (-1 at end of input), capturing it if active. */
        public int read() throws IOException {
            lastread = reader.read();
            if (accumulator != null && lastread != -1) accumulator.append((char)lastread);
            return lastread;
        }

        /**
         * Starts capturing.  The capture begins with the most recently read character,
         * because callers only discover that a token has begun after consuming its
         * first character.
         */
        public void startString() {
            accumulator = new StringBuffer();
            if (lastread != -1) accumulator.append((char)lastread);
        }

        /** Ends the capture and returns the captured text. */
        public String getString() throws IOException {
            String ret = accumulator.toString();
            accumulator = null;
            return ret;
        }
    }

}