mirror of
https://github.com/mozilla/gecko-dev.git
synced 2024-12-31 21:21:08 +00:00
1103 lines
28 KiB
C
1103 lines
28 KiB
C
/* -*- Mode: C; tab-width: 8; indent-tabs-mode: nil; c-basic-offset: 4 -*-
|
|
*
|
|
* The contents of this file are subject to the Netscape Public License
|
|
* Version 1.0 (the "NPL"); you may not use this file except in
|
|
* compliance with the NPL. You may obtain a copy of the NPL at
|
|
* http://www.mozilla.org/NPL/
|
|
*
|
|
* Software distributed under the NPL is distributed on an "AS IS" basis,
|
|
* WITHOUT WARRANTY OF ANY KIND, either express or implied. See the NPL
|
|
* for the specific language governing rights and limitations under the
|
|
* NPL.
|
|
*
|
|
* The Initial Developer of this code under the NPL is Netscape
|
|
* Communications Corporation. Portions created by Netscape are
|
|
* Copyright (C) 1998 Netscape Communications Corporation. All Rights
|
|
* Reserved.
|
|
*/
|
|
|
|
/*
|
|
* JS lexical scanner.
|
|
*/
|
|
#include "jsstddef.h"
|
|
#include <stdio.h> /* first to avoid trouble on some systems */
|
|
#include <errno.h>
|
|
#include <limits.h>
|
|
#include <math.h>
|
|
#include <memory.h>
|
|
#include <stdarg.h>
|
|
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include "prtypes.h"
|
|
#include "prarena.h"
|
|
#include "prassert.h"
|
|
#include "prdtoa.h"
|
|
#include "prprintf.h"
|
|
#include "jsapi.h"
|
|
#include "jsatom.h"
|
|
#include "jscntxt.h"
|
|
#include "jsconfig.h"
|
|
#include "jsnum.h"
|
|
#include "jsopcode.h"
|
|
#include "jsregexp.h"
|
|
#include "jsscan.h"
|
|
|
|
#define RESERVE_JAVA_KEYWORDS
|
|
#define RESERVE_ECMA_KEYWORDS
|
|
|
|
static struct keyword {
|
|
char *name;
|
|
int16 tokentype; /* JSTokenType */
|
|
int8 op; /* JSOp */
|
|
uint8 version; /* JSVersion */
|
|
} keywords[] = {
|
|
{"break", TOK_BREAK, JSOP_NOP},
|
|
{"case", TOK_CASE, JSOP_NOP},
|
|
{"continue", TOK_CONTINUE, JSOP_NOP},
|
|
{"default", TOK_DEFAULT, JSOP_NOP},
|
|
{js_delete_str, TOK_DELETE, JSOP_NOP},
|
|
{"do", TOK_DO, JSOP_NOP},
|
|
{"else", TOK_ELSE, JSOP_NOP},
|
|
{"export", TOK_EXPORT, JSOP_NOP, JSVERSION_1_2},
|
|
{js_false_str, TOK_PRIMARY, JSOP_FALSE},
|
|
{"for", TOK_FOR, JSOP_NOP},
|
|
{"function", TOK_FUNCTION, JSOP_NOP},
|
|
{"if", TOK_IF, JSOP_NOP},
|
|
{js_in_str, TOK_IN, JSOP_IN},
|
|
{js_new_str, TOK_NEW, JSOP_NEW},
|
|
{js_null_str, TOK_PRIMARY, JSOP_NULL},
|
|
{"return", TOK_RETURN, JSOP_NOP},
|
|
{"switch", TOK_SWITCH, JSOP_NOP},
|
|
{js_this_str, TOK_PRIMARY, JSOP_THIS},
|
|
{js_true_str, TOK_PRIMARY, JSOP_TRUE},
|
|
{js_typeof_str, TOK_UNARYOP, JSOP_TYPEOF},
|
|
{"var", TOK_VAR, JSOP_NOP},
|
|
{js_void_str, TOK_UNARYOP, JSOP_VOID},
|
|
{"while", TOK_WHILE, JSOP_NOP},
|
|
{"with", TOK_WITH, JSOP_NOP},
|
|
|
|
#if JS_HAS_EXCEPTIONS
|
|
{"try", TOK_TRY, JSOP_NOP},
|
|
{"catch", TOK_CATCH, JSOP_NOP},
|
|
{"finally", TOK_FINALLY, JSOP_NOP},
|
|
{"throw", TOK_THROW, JSOP_NOP},
|
|
#else
|
|
{"try", TOK_RESERVED, JSOP_NOP},
|
|
{"catch", TOK_RESERVED, JSOP_NOP},
|
|
{"finally", TOK_RESERVED, JSOP_NOP},
|
|
{"throw", TOK_RESERVED, JSOP_NOP},
|
|
#endif
|
|
|
|
#if JS_HAS_INSTANCEOF
|
|
{js_instanceof_str, TOK_INSTANCEOF, JSOP_INSTANCEOF},
|
|
#else
|
|
{js_instanceof_str, TOK_RESERVED, JSOP_NOP},
|
|
#endif
|
|
|
|
#ifdef RESERVE_JAVA_KEYWORDS
|
|
{"abstract", TOK_RESERVED, JSOP_NOP},
|
|
{"boolean", TOK_RESERVED, JSOP_NOP},
|
|
{"byte", TOK_RESERVED, JSOP_NOP},
|
|
{"char", TOK_RESERVED, JSOP_NOP},
|
|
{"class", TOK_RESERVED, JSOP_NOP},
|
|
{"const", TOK_RESERVED, JSOP_NOP},
|
|
{"double", TOK_RESERVED, JSOP_NOP},
|
|
{"extends", TOK_RESERVED, JSOP_NOP},
|
|
{"final", TOK_RESERVED, JSOP_NOP},
|
|
{"float", TOK_RESERVED, JSOP_NOP},
|
|
{"goto", TOK_RESERVED, JSOP_NOP},
|
|
{"implements", TOK_RESERVED, JSOP_NOP},
|
|
{"import", TOK_IMPORT, JSOP_NOP},
|
|
{"int", TOK_RESERVED, JSOP_NOP},
|
|
{"interface", TOK_RESERVED, JSOP_NOP},
|
|
{"long", TOK_RESERVED, JSOP_NOP},
|
|
{"native", TOK_RESERVED, JSOP_NOP},
|
|
{"package", TOK_RESERVED, JSOP_NOP},
|
|
{"private", TOK_RESERVED, JSOP_NOP},
|
|
{"protected", TOK_RESERVED, JSOP_NOP},
|
|
{"public", TOK_RESERVED, JSOP_NOP},
|
|
{"short", TOK_RESERVED, JSOP_NOP},
|
|
{"static", TOK_RESERVED, JSOP_NOP},
|
|
{"super", TOK_PRIMARY, JSOP_NOP},
|
|
{"synchronized", TOK_RESERVED, JSOP_NOP},
|
|
{"throws", TOK_RESERVED, JSOP_NOP},
|
|
{"transient", TOK_RESERVED, JSOP_NOP},
|
|
{"volatile", TOK_RESERVED, JSOP_NOP},
|
|
#endif
|
|
|
|
#ifdef RESERVE_ECMA_KEYWORDS
|
|
{"debugger", TOK_RESERVED, JSOP_NOP, JSVERSION_1_3},
|
|
{"enum", TOK_RESERVED, JSOP_NOP, JSVERSION_1_3},
|
|
#endif
|
|
|
|
{0}
|
|
};
|
|
|
|
JSBool
|
|
js_InitScanner(JSContext *cx)
|
|
{
|
|
struct keyword *kw;
|
|
JSAtom *atom;
|
|
|
|
for (kw = keywords; kw->name; kw++) {
|
|
atom = js_Atomize(cx, kw->name, strlen(kw->name), ATOM_PINNED);
|
|
if (!atom)
|
|
return JS_FALSE;
|
|
atom->kwindex = (JSVERSION_IS_ECMA(cx->version)
|
|
|| kw->version <= cx->version) ? kw - keywords : -1;
|
|
}
|
|
return JS_TRUE;
|
|
}
|
|
|
|
JS_FRIEND_API(void)
|
|
js_MapKeywords(void (*mapfun)(const char *))
|
|
{
|
|
struct keyword *kw;
|
|
|
|
for (kw = keywords; kw->name; kw++)
|
|
mapfun(kw->name);
|
|
}
|
|
|
|
JSTokenStream *
|
|
js_NewTokenStream(JSContext *cx, const jschar *base, size_t length,
|
|
const char *filename, uintN lineno,
|
|
JSPrincipals *principals)
|
|
{
|
|
JSTokenStream *ts;
|
|
|
|
ts = js_NewBufferTokenStream(cx, base, length);
|
|
if (!ts)
|
|
return NULL;
|
|
ts->filename = filename;
|
|
ts->lineno = lineno;
|
|
if (principals)
|
|
JSPRINCIPALS_HOLD(cx, principals);
|
|
ts->principals = principals;
|
|
return ts;
|
|
}
|
|
|
|
JS_FRIEND_API(JSTokenStream *)
|
|
js_NewBufferTokenStream(JSContext *cx, const jschar *base, size_t length)
|
|
{
|
|
size_t nb;
|
|
JSTokenStream *ts;
|
|
|
|
nb = sizeof(JSTokenStream) + JS_LINE_LIMIT * sizeof(jschar);
|
|
PR_ARENA_ALLOCATE(ts, &cx->tempPool, nb);
|
|
if (!ts) {
|
|
JS_ReportOutOfMemory(cx);
|
|
return NULL;
|
|
}
|
|
memset(ts, 0, nb);
|
|
CLEAR_PUSHBACK(ts);
|
|
ts->lineno = 1;
|
|
ts->linebuf.base = ts->linebuf.limit = ts->linebuf.ptr = (jschar *)(ts + 1);
|
|
ts->userbuf.base = (jschar *)base;
|
|
ts->userbuf.limit = (jschar *)base + length;
|
|
ts->userbuf.ptr = (jschar *)base;
|
|
#ifdef JSD_LOWLEVEL_SOURCE
|
|
ts->jsdc = JSD_JSDContextForJSContext(cx);
|
|
#endif
|
|
return ts;
|
|
}
|
|
|
|
#ifdef JSFILE
|
|
JS_FRIEND_API(JSTokenStream *)
|
|
js_NewFileTokenStream(JSContext *cx, const char *filename, FILE *defaultfp)
|
|
{
|
|
jschar *base;
|
|
JSTokenStream *ts;
|
|
FILE *file;
|
|
|
|
PR_ARENA_ALLOCATE(base, &cx->tempPool, JS_LINE_LIMIT * sizeof(jschar));
|
|
if (!base)
|
|
return NULL;
|
|
ts = js_NewBufferTokenStream(cx, base, JS_LINE_LIMIT);
|
|
if (!ts)
|
|
return NULL;
|
|
if (!filename || strcmp(filename, "-") == 0) {
|
|
file = defaultfp;
|
|
} else {
|
|
file = fopen(filename, "r");
|
|
if (!file) {
|
|
JS_ReportError(cx, "can't open %s: %s", filename, strerror(errno));
|
|
return NULL;
|
|
}
|
|
}
|
|
ts->userbuf.ptr = ts->userbuf.limit;
|
|
ts->file = file;
|
|
ts->filename = filename;
|
|
return ts;
|
|
}
|
|
#endif /* JSFILE */
|
|
|
|
JS_FRIEND_API(JSBool)
|
|
js_CloseTokenStream(JSContext *cx, JSTokenStream *ts)
|
|
{
|
|
if (ts->principals)
|
|
JSPRINCIPALS_DROP(cx, ts->principals);
|
|
#ifdef JSFILE
|
|
return !ts->file || fclose(ts->file) == 0;
|
|
#else
|
|
return JS_TRUE;
|
|
#endif
|
|
}
|
|
|
|
#ifdef JSD_LOWLEVEL_SOURCE
|
|
static void
|
|
SendSourceToJSDebugger(JSTokenStream *ts, jschar *str, size_t length)
|
|
{
|
|
if (!ts->jsdsrc) {
|
|
ts->jsdsrc = JSD_NewSourceText(ts->jsdc,
|
|
ts->filename ? ts->filename : "typein");
|
|
}
|
|
if (ts->jsdsrc) {
|
|
/* here we convert our Unicode into a C string to pass to JSD */
|
|
#define JSD_BUF_SIZE 1024
|
|
static char* buf = NULL;
|
|
int remaining = length;
|
|
|
|
if (!buf)
|
|
buf = malloc(JSD_BUF_SIZE);
|
|
if (buf)
|
|
{
|
|
while (remaining && ts->jsdsrc) {
|
|
int bytes = PR_MIN(remaining, JSD_BUF_SIZE);
|
|
int i;
|
|
for (i = 0; i < bytes; i++)
|
|
buf[i] = (const char) *(str++);
|
|
ts->jsdsrc = JSD_AppendSourceText(ts->jsdc,ts->jsdsrc,
|
|
buf, bytes,
|
|
JSD_SOURCE_PARTIAL);
|
|
remaining -= bytes;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
#endif
|
|
|
|
static int32
|
|
GetChar(JSTokenStream *ts)
|
|
{
|
|
int32 c;
|
|
ptrdiff_t len, olen;
|
|
jschar *nl;
|
|
|
|
if (ts->ungetpos != 0) {
|
|
c = ts->ungetbuf[--ts->ungetpos];
|
|
} else {
|
|
if (ts->linebuf.ptr == ts->linebuf.limit) {
|
|
len = PTRDIFF(ts->userbuf.limit, ts->userbuf.ptr, jschar);
|
|
if (len <= 0) {
|
|
#ifdef JSFILE
|
|
/* Fill ts->userbuf so that \r and \r\n convert to \n. */
|
|
if (ts->file) {
|
|
JSBool crflag;
|
|
char cbuf[JS_LINE_LIMIT];
|
|
jschar *ubuf;
|
|
ptrdiff_t i, j;
|
|
|
|
crflag = (ts->flags & TSF_CRFLAG) != 0;
|
|
if (!fgets(cbuf, JS_LINE_LIMIT - crflag, ts->file)) {
|
|
ts->flags |= TSF_EOF;
|
|
return EOF;
|
|
}
|
|
len = olen = strlen(cbuf);
|
|
PR_ASSERT(len > 0);
|
|
ubuf = ts->userbuf.base;
|
|
i = 0;
|
|
if (crflag) {
|
|
ts->flags &= ~TSF_CRFLAG;
|
|
if (cbuf[0] != '\n') {
|
|
ubuf[i++] = '\n';
|
|
len++;
|
|
ts->linepos--;
|
|
}
|
|
}
|
|
for (j = 0; i < len; i++, j++)
|
|
ubuf[i] = (jschar) (unsigned char) cbuf[j];
|
|
ts->userbuf.limit = ubuf + len;
|
|
ts->userbuf.ptr = ubuf;
|
|
} else
|
|
#endif /* JSFILE */
|
|
{
|
|
ts->flags |= TSF_EOF;
|
|
return EOF;
|
|
}
|
|
}
|
|
|
|
#ifdef JSD_LOWLEVEL_SOURCE
|
|
if (ts->jsdc)
|
|
SendSourceToJSDebugger(ts, ts->userbuf.ptr, len);
|
|
#endif
|
|
|
|
/*
|
|
* Any one of \n, \r, or \r\n ends a line (longest match wins).
|
|
*/
|
|
for (nl = ts->userbuf.ptr; nl < ts->userbuf.limit; nl++) {
|
|
if (*nl == '\n')
|
|
break;
|
|
if (*nl == '\r') {
|
|
if (nl + 1 < ts->userbuf.limit && nl[1] == '\n')
|
|
nl++;
|
|
break;
|
|
}
|
|
}
|
|
|
|
/*
|
|
* If there was a line terminator, copy thru it into linebuf.
|
|
* Else copy JS_LINE_LIMIT-1 bytes into linebuf.
|
|
*/
|
|
if (nl < ts->userbuf.limit)
|
|
len = PTRDIFF(nl, ts->userbuf.ptr, jschar) + 1;
|
|
if (len >= JS_LINE_LIMIT)
|
|
len = JS_LINE_LIMIT - 1;
|
|
js_strncpy(ts->linebuf.base, ts->userbuf.ptr, len);
|
|
ts->userbuf.ptr += len;
|
|
olen = len;
|
|
|
|
/*
|
|
* Make sure linebuf contains \n for EOL (don't do this in
|
|
* userbuf because the user's string might be readonly).
|
|
*/
|
|
if (nl < ts->userbuf.limit) {
|
|
if (*nl == '\r') {
|
|
if (ts->linebuf.base[len-1] == '\r') {
|
|
#ifdef JSFILE
|
|
/*
|
|
* Does the line segment end in \r? We must check
|
|
* for a \n at the front of the next segment before
|
|
* storing a \n into linebuf.
|
|
*/
|
|
if (nl + 1 == ts->userbuf.limit) {
|
|
len--;
|
|
ts->flags |= TSF_CRFLAG;
|
|
} else
|
|
#endif
|
|
ts->linebuf.base[len-1] = '\n';
|
|
}
|
|
} else if (*nl == '\n') {
|
|
if (nl > ts->userbuf.base &&
|
|
nl[-1] == '\r' &&
|
|
ts->linebuf.base[len-2] == '\r') {
|
|
len--;
|
|
PR_ASSERT(ts->linebuf.base[len] == '\n');
|
|
ts->linebuf.base[len-1] = '\n';
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Reset linebuf based on adjusted segment length. */
|
|
ts->linebuf.limit = ts->linebuf.base + len;
|
|
ts->linebuf.ptr = ts->linebuf.base;
|
|
|
|
/* Update position of linebuf within physical line in userbuf. */
|
|
if (!(ts->flags & TSF_NLFLAG))
|
|
ts->linepos += ts->linelen;
|
|
else
|
|
ts->linepos = 0;
|
|
if (ts->linebuf.limit[-1] == '\n')
|
|
ts->flags |= TSF_NLFLAG;
|
|
else
|
|
ts->flags &= ~TSF_NLFLAG;
|
|
|
|
/* Update linelen from original segment length. */
|
|
ts->linelen = olen;
|
|
}
|
|
c = *ts->linebuf.ptr++;
|
|
}
|
|
if (c == '\n')
|
|
ts->lineno++;
|
|
return c;
|
|
}
|
|
|
|
static void
|
|
UngetChar(JSTokenStream *ts, int32 c)
|
|
{
|
|
if (c == EOF)
|
|
return;
|
|
PR_ASSERT(ts->ungetpos < sizeof ts->ungetbuf / sizeof ts->ungetbuf[0]);
|
|
if (c == '\n')
|
|
ts->lineno--;
|
|
ts->ungetbuf[ts->ungetpos++] = (jschar)c;
|
|
}
|
|
|
|
static int32
|
|
PeekChar(JSTokenStream *ts)
|
|
{
|
|
int32 c;
|
|
|
|
c = GetChar(ts);
|
|
UngetChar(ts, c);
|
|
return c;
|
|
}
|
|
|
|
static JSBool
|
|
PeekChars(JSTokenStream *ts, intN n, jschar *cp)
|
|
{
|
|
intN i, j;
|
|
int32 c;
|
|
|
|
for (i = 0; i < n; i++) {
|
|
c = GetChar(ts);
|
|
if (c == EOF)
|
|
break;
|
|
cp[i] = (jschar)c;
|
|
}
|
|
for (j = i - 1; j >= 0; j--)
|
|
UngetChar(ts, cp[j]);
|
|
return i == n;
|
|
}
|
|
|
|
static void
|
|
SkipChars(JSTokenStream *ts, intN n)
|
|
{
|
|
while (--n >= 0)
|
|
GetChar(ts);
|
|
}
|
|
|
|
static int32
|
|
MatchChar(JSTokenStream *ts, int32 nextChar)
|
|
{
|
|
int32 c;
|
|
|
|
c = GetChar(ts);
|
|
if (c == nextChar)
|
|
return 1;
|
|
UngetChar(ts, c);
|
|
return 0;
|
|
}
|
|
|
|
void
|
|
js_ReportCompileError(JSContext *cx, JSTokenStream *ts, const char *format,
|
|
...)
|
|
{
|
|
va_list ap;
|
|
char *message;
|
|
jschar *limit, lastc;
|
|
JSErrorReporter onError;
|
|
JSErrorReport report;
|
|
JSString *linestr;
|
|
|
|
va_start(ap, format);
|
|
message = PR_vsmprintf(format, ap);
|
|
va_end(ap);
|
|
if (!message) {
|
|
JS_ReportOutOfMemory(cx);
|
|
return;
|
|
}
|
|
|
|
PR_ASSERT(ts->linebuf.limit < ts->linebuf.base + JS_LINE_LIMIT);
|
|
limit = ts->linebuf.limit;
|
|
lastc = limit[-1];
|
|
if (lastc == '\n')
|
|
limit[-1] = 0;
|
|
onError = cx->errorReporter;
|
|
if (onError) {
|
|
report.filename = ts->filename;
|
|
report.lineno = ts->lineno;
|
|
linestr = js_NewStringCopyZ(cx, ts->linebuf.base, 0);
|
|
report.linebuf = linestr
|
|
? JS_GetStringBytes(linestr)
|
|
: NULL;
|
|
report.tokenptr = linestr
|
|
? report.linebuf + (ts->token.ptr - ts->linebuf.base)
|
|
: NULL;
|
|
report.uclinebuf = ts->linebuf.base;
|
|
report.uctokenptr = ts->token.ptr;
|
|
(*onError)(cx, message, &report);
|
|
#if !defined XP_PC || !defined _MSC_VER || _MSC_VER > 800
|
|
} else {
|
|
if (!(ts->flags & TSF_INTERACTIVE))
|
|
fprintf(stderr, "JavaScript error: ");
|
|
if (ts->filename)
|
|
fprintf(stderr, "%s, ", ts->filename);
|
|
if (ts->lineno)
|
|
fprintf(stderr, "line %u: ", ts->lineno);
|
|
fprintf(stderr, "%s:\n%s\n",message,
|
|
js_DeflateString(cx, ts->linebuf.base,
|
|
ts->linebuf.limit - ts->linebuf.base));
|
|
|
|
#endif
|
|
}
|
|
if (lastc == '\n')
|
|
limit[-1] = lastc;
|
|
free(message);
|
|
}
|
|
|
|
JSTokenType
|
|
js_PeekToken(JSContext *cx, JSTokenStream *ts)
|
|
{
|
|
JSTokenType tt;
|
|
|
|
tt = ts->pushback.type;
|
|
if (tt == TOK_EOF) {
|
|
tt = js_GetToken(cx, ts);
|
|
js_UngetToken(ts);
|
|
}
|
|
return tt;
|
|
}
|
|
|
|
JSTokenType
|
|
js_PeekTokenSameLine(JSContext *cx, JSTokenStream *ts)
|
|
{
|
|
uintN newlines;
|
|
JSTokenType tt;
|
|
|
|
newlines = ts->flags & TSF_NEWLINES;
|
|
if (!newlines)
|
|
SCAN_NEWLINES(ts);
|
|
tt = js_PeekToken(cx, ts);
|
|
if (!newlines)
|
|
HIDE_NEWLINES(ts);
|
|
return tt;
|
|
}
|
|
|
|
#define TBINCR 64
|
|
|
|
static JSBool
|
|
GrowTokenBuf(JSContext *cx, JSTokenBuf *tb)
|
|
{
|
|
jschar *base;
|
|
ptrdiff_t offset, length;
|
|
size_t tbincr, tbsize;
|
|
PRArenaPool *pool;
|
|
|
|
base = tb->base;
|
|
offset = PTRDIFF(tb->ptr, base, jschar);
|
|
length = PTRDIFF(tb->limit, base, jschar);
|
|
tbincr = TBINCR * sizeof(jschar);
|
|
pool = &cx->tempPool;
|
|
if (!base) {
|
|
PR_ARENA_ALLOCATE(base, pool, tbincr);
|
|
} else {
|
|
tbsize = (size_t)(length * sizeof(jschar));
|
|
PR_ARENA_GROW(base, pool, tbsize, tbincr);
|
|
}
|
|
if (!base) {
|
|
JS_ReportOutOfMemory(cx);
|
|
return JS_FALSE;
|
|
}
|
|
tb->base = base;
|
|
tb->limit = base + length + TBINCR;
|
|
tb->ptr = base + offset;
|
|
return JS_TRUE;
|
|
}
|
|
|
|
static JSBool
|
|
AddToTokenBuf(JSContext *cx, JSTokenBuf *tb, jschar c)
|
|
{
|
|
if (tb->ptr == tb->limit && !GrowTokenBuf(cx, tb))
|
|
return JS_FALSE;
|
|
*tb->ptr++ = c;
|
|
return JS_TRUE;
|
|
}
|
|
|
|
JSTokenType
|
|
js_GetToken(JSContext *cx, JSTokenStream *ts)
|
|
{
|
|
int32 c;
|
|
JSAtom *atom;
|
|
|
|
#define INIT_TOKENBUF(tb) ((tb)->ptr = (tb)->base)
|
|
#define FINISH_TOKENBUF(tb) if (!AddToTokenBuf(cx, tb, 0)) RETURN(TOK_ERROR)
|
|
#define TOKEN_LENGTH(tb) ((tb)->ptr - (tb)->base - 1)
|
|
#define RETURN(tt) { if (tt == TOK_ERROR) ts->flags |= TSF_ERROR; \
|
|
ts->token.pos.end.index = ts->linepos + \
|
|
(ts->linebuf.ptr - ts->linebuf.base) - \
|
|
ts->ungetpos; \
|
|
return (ts->token.type = tt); }
|
|
|
|
/* If there was a fatal error, keep returning TOK_ERROR. */
|
|
if (ts->flags & TSF_ERROR)
|
|
return TOK_ERROR;
|
|
|
|
/* Check for a pushed-back token resulting from mismatching lookahead. */
|
|
if (ts->pushback.type != TOK_EOF) {
|
|
ts->token = ts->pushback;
|
|
CLEAR_PUSHBACK(ts);
|
|
return ts->token.type;
|
|
}
|
|
|
|
retry:
|
|
do {
|
|
c = GetChar(ts);
|
|
if (c == '\n' && (ts->flags & TSF_NEWLINES))
|
|
break;
|
|
} while (JS_ISSPACE(c));
|
|
|
|
ts->token.ptr = ts->linebuf.ptr - 1;
|
|
ts->token.pos.begin.index = ts->linepos + (ts->token.ptr-ts->linebuf.base);
|
|
ts->token.pos.begin.lineno = ts->token.pos.end.lineno = ts->lineno;
|
|
|
|
if (c == EOF)
|
|
RETURN(TOK_EOF);
|
|
|
|
if (JS_ISIDENT(c)) {
|
|
INIT_TOKENBUF(&ts->tokenbuf);
|
|
do {
|
|
if (!AddToTokenBuf(cx, &ts->tokenbuf, (jschar)c))
|
|
RETURN(TOK_ERROR);
|
|
c = GetChar(ts);
|
|
} while (JS_ISIDENT2(c));
|
|
UngetChar(ts, c);
|
|
FINISH_TOKENBUF(&ts->tokenbuf);
|
|
|
|
atom = js_AtomizeChars(cx,
|
|
ts->tokenbuf.base,
|
|
TOKEN_LENGTH(&ts->tokenbuf),
|
|
0);
|
|
if (!atom)
|
|
RETURN(TOK_ERROR);
|
|
if (atom->kwindex >= 0) {
|
|
struct keyword *kw;
|
|
|
|
kw = &keywords[atom->kwindex];
|
|
ts->token.t_op = kw->op;
|
|
RETURN(kw->tokentype);
|
|
}
|
|
ts->token.t_op = JSOP_NAME;
|
|
ts->token.t_atom = atom;
|
|
RETURN(TOK_NAME);
|
|
}
|
|
|
|
if (JS7_ISDEC(c) || (c == '.' && JS7_ISDEC(PeekChar(ts)))) {
|
|
jsint radix;
|
|
const jschar *endptr;
|
|
jsdouble dval;
|
|
|
|
radix = 10;
|
|
INIT_TOKENBUF(&ts->tokenbuf);
|
|
|
|
if (c == '0') {
|
|
if (!AddToTokenBuf(cx, &ts->tokenbuf, (jschar)c))
|
|
RETURN(TOK_ERROR);
|
|
c = GetChar(ts);
|
|
if (JS_TOLOWER(c) == 'x') {
|
|
if (!AddToTokenBuf(cx, &ts->tokenbuf, (jschar)c))
|
|
RETURN(TOK_ERROR);
|
|
c = GetChar(ts);
|
|
radix = 16;
|
|
} else if (JS7_ISDEC(c) && c < '8') {
|
|
/*
|
|
* XXX Warning needed. Checking against c < '8' above is
|
|
* non-ECMA, but is required to support legacy code; it's
|
|
* likely that "08" and "09" are in use in code having to do
|
|
* with dates. So we need to support it, which makes our
|
|
* behavior a superset of ECMA in this area. We should be
|
|
* raising a warning if '8' or '9' is encountered.
|
|
*/
|
|
radix = 8;
|
|
}
|
|
}
|
|
|
|
while (JS7_ISHEX(c)) {
|
|
if (radix < 16 && (JS7_ISLET(c) || (radix == 8 && c >= '8')))
|
|
break;
|
|
if (!AddToTokenBuf(cx, &ts->tokenbuf, (jschar)c))
|
|
RETURN(TOK_ERROR);
|
|
c = GetChar(ts);
|
|
}
|
|
|
|
if (radix == 10 && (c == '.' || JS_TOLOWER(c) == 'e')) {
|
|
if (c == '.') {
|
|
do {
|
|
if (!AddToTokenBuf(cx, &ts->tokenbuf, (jschar)c))
|
|
RETURN(TOK_ERROR);
|
|
c = GetChar(ts);
|
|
} while (JS7_ISDEC(c));
|
|
}
|
|
if (JS_TOLOWER(c) == 'e') {
|
|
if (!AddToTokenBuf(cx, &ts->tokenbuf, (jschar)c))
|
|
RETURN(TOK_ERROR);
|
|
c = GetChar(ts);
|
|
if (c == '+' || c == '-') {
|
|
if (!AddToTokenBuf(cx, &ts->tokenbuf, (jschar)c))
|
|
RETURN(TOK_ERROR);
|
|
c = GetChar(ts);
|
|
}
|
|
if (!JS7_ISDEC(c)) {
|
|
js_ReportCompileError(cx, ts, "missing exponent");
|
|
RETURN(TOK_ERROR);
|
|
}
|
|
do {
|
|
if (!AddToTokenBuf(cx, &ts->tokenbuf, (jschar)c))
|
|
RETURN(TOK_ERROR);
|
|
c = GetChar(ts);
|
|
} while (JS7_ISDEC(c));
|
|
}
|
|
}
|
|
|
|
UngetChar(ts, c);
|
|
FINISH_TOKENBUF(&ts->tokenbuf);
|
|
|
|
if (radix == 10) {
|
|
if (!js_strtod(cx, ts->tokenbuf.base, &endptr, &dval)) {
|
|
js_ReportCompileError(cx, ts, "out of memory");
|
|
RETURN(TOK_ERROR);
|
|
}
|
|
} else {
|
|
if (!js_strtointeger(cx, ts->tokenbuf.base, &endptr, radix, &dval)) {
|
|
js_ReportCompileError(cx, ts, "out of memory");
|
|
RETURN(TOK_ERROR);
|
|
}
|
|
}
|
|
ts->token.t_dval = dval;
|
|
RETURN(TOK_NUMBER);
|
|
}
|
|
|
|
if (c == '"' || c == '\'') {
|
|
int32 val, qc = c;
|
|
|
|
INIT_TOKENBUF(&ts->tokenbuf);
|
|
while ((c = GetChar(ts)) != qc) {
|
|
if (c == '\n' || c == EOF) {
|
|
UngetChar(ts, c);
|
|
js_ReportCompileError(cx, ts, "unterminated string literal");
|
|
RETURN(TOK_ERROR);
|
|
}
|
|
if (c == '\\') {
|
|
switch (c = GetChar(ts)) {
|
|
case 'b': c = '\b'; break;
|
|
case 'f': c = '\f'; break;
|
|
case 'n': c = '\n'; break;
|
|
case 'r': c = '\r'; break;
|
|
case 't': c = '\t'; break;
|
|
case 'v': c = '\v'; break;
|
|
|
|
default:
|
|
if ('0' <= c && c < '8') {
|
|
val = JS7_UNDEC(c);
|
|
c = PeekChar(ts);
|
|
if ('0' <= c && c < '8') {
|
|
val = 8 * val + JS7_UNDEC(c);
|
|
GetChar(ts);
|
|
c = PeekChar(ts);
|
|
if ('0' <= c && c < '8') {
|
|
int32 save = val;
|
|
val = 8 * val + JS7_UNDEC(c);
|
|
if (val <= 0377)
|
|
GetChar(ts);
|
|
else
|
|
val = save;
|
|
}
|
|
}
|
|
c = (jschar)val;
|
|
} else if (c == 'u') {
|
|
jschar cp[4];
|
|
if (PeekChars(ts, 4, cp) &&
|
|
JS7_ISHEX(cp[0]) && JS7_ISHEX(cp[1]) &&
|
|
JS7_ISHEX(cp[2]) && JS7_ISHEX(cp[3])) {
|
|
c = (((((JS7_UNHEX(cp[0]) << 4)
|
|
+ JS7_UNHEX(cp[1])) << 4)
|
|
+ JS7_UNHEX(cp[2])) << 4)
|
|
+ JS7_UNHEX(cp[3]);
|
|
SkipChars(ts, 4);
|
|
}
|
|
} else if (c == 'x') {
|
|
jschar cp[2];
|
|
if (PeekChars(ts, 2, cp) &&
|
|
JS7_ISHEX(cp[0]) && JS7_ISHEX(cp[1])) {
|
|
c = (JS7_UNHEX(cp[0]) << 4) + JS7_UNHEX(cp[1]);
|
|
SkipChars(ts, 2);
|
|
}
|
|
}
|
|
break;
|
|
}
|
|
}
|
|
if (!AddToTokenBuf(cx, &ts->tokenbuf, (jschar)c))
|
|
RETURN(TOK_ERROR);
|
|
}
|
|
FINISH_TOKENBUF(&ts->tokenbuf);
|
|
atom = js_AtomizeChars(cx,
|
|
ts->tokenbuf.base,
|
|
TOKEN_LENGTH(&ts->tokenbuf),
|
|
0);
|
|
if (!atom)
|
|
RETURN(TOK_ERROR);
|
|
ts->token.pos.end.lineno = ts->lineno;
|
|
ts->token.t_op = JSOP_STRING;
|
|
ts->token.t_atom = atom;
|
|
RETURN(TOK_STRING);
|
|
}
|
|
|
|
switch (c) {
|
|
case '\n': c = TOK_EOL; break;
|
|
case ';': c = TOK_SEMI; break;
|
|
case '.': c = TOK_DOT; break;
|
|
case '[': c = TOK_LB; break;
|
|
case ']': c = TOK_RB; break;
|
|
case '{': c = TOK_LC; break;
|
|
case '}': c = TOK_RC; break;
|
|
case '(': c = TOK_LP; break;
|
|
case ')': c = TOK_RP; break;
|
|
case ',': c = TOK_COMMA; break;
|
|
case '?': c = TOK_HOOK; break;
|
|
case ':': c = TOK_COLON; break;
|
|
|
|
case '|':
|
|
if (MatchChar(ts, c)) {
|
|
c = TOK_OR;
|
|
} else if (MatchChar(ts, '=')) {
|
|
ts->token.t_op = JSOP_BITOR;
|
|
c = TOK_ASSIGN;
|
|
} else {
|
|
c = TOK_BITOR;
|
|
}
|
|
break;
|
|
|
|
case '^':
|
|
if (MatchChar(ts, '=')) {
|
|
ts->token.t_op = JSOP_BITXOR;
|
|
c = TOK_ASSIGN;
|
|
} else {
|
|
c = TOK_BITXOR;
|
|
}
|
|
break;
|
|
|
|
case '&':
|
|
if (MatchChar(ts, c)) {
|
|
c = TOK_AND;
|
|
} else if (MatchChar(ts, '=')) {
|
|
ts->token.t_op = JSOP_BITAND;
|
|
c = TOK_ASSIGN;
|
|
} else {
|
|
c = TOK_BITAND;
|
|
}
|
|
break;
|
|
|
|
case '=':
|
|
if (MatchChar(ts, c)) {
|
|
#if JS_HAS_TRIPLE_EQOPS
|
|
ts->token.t_op = MatchChar(ts, c) ? JSOP_NEW_EQ : cx->jsop_eq;
|
|
#else
|
|
ts->token.t_op = cx->jsop_eq;
|
|
#endif
|
|
c = TOK_EQOP;
|
|
} else {
|
|
ts->token.t_op = JSOP_NOP;
|
|
c = TOK_ASSIGN;
|
|
}
|
|
break;
|
|
|
|
case '!':
|
|
if (MatchChar(ts, '=')) {
|
|
#if JS_HAS_TRIPLE_EQOPS
|
|
ts->token.t_op = MatchChar(ts, '=') ? JSOP_NEW_NE : cx->jsop_ne;
|
|
#else
|
|
ts->token.t_op = cx->jsop_ne;
|
|
#endif
|
|
c = TOK_EQOP;
|
|
} else {
|
|
ts->token.t_op = JSOP_NOT;
|
|
c = TOK_UNARYOP;
|
|
}
|
|
break;
|
|
|
|
case '<':
|
|
/* NB: treat HTML begin-comment as comment-till-end-of-line */
|
|
if (MatchChar(ts, '!')) {
|
|
if (MatchChar(ts, '-')) {
|
|
if (MatchChar(ts, '-'))
|
|
goto skipline;
|
|
UngetChar(ts, '-');
|
|
}
|
|
UngetChar(ts, '!');
|
|
}
|
|
if (MatchChar(ts, c)) {
|
|
ts->token.t_op = JSOP_LSH;
|
|
c = MatchChar(ts, '=') ? TOK_ASSIGN : TOK_SHOP;
|
|
} else {
|
|
ts->token.t_op = MatchChar(ts, '=') ? JSOP_LE : JSOP_LT;
|
|
c = TOK_RELOP;
|
|
}
|
|
break;
|
|
|
|
case '>':
|
|
if (MatchChar(ts, c)) {
|
|
ts->token.t_op = MatchChar(ts, c) ? JSOP_URSH : JSOP_RSH;
|
|
c = MatchChar(ts, '=') ? TOK_ASSIGN : TOK_SHOP;
|
|
} else {
|
|
ts->token.t_op = MatchChar(ts, '=') ? JSOP_GE : JSOP_GT;
|
|
c = TOK_RELOP;
|
|
}
|
|
break;
|
|
|
|
case '*':
|
|
ts->token.t_op = JSOP_MUL;
|
|
c = MatchChar(ts, '=') ? TOK_ASSIGN : TOK_STAR;
|
|
break;
|
|
|
|
case '/':
|
|
if (MatchChar(ts, '/')) {
|
|
skipline:
|
|
while ((c = GetChar(ts)) != EOF && c != '\n')
|
|
/* skip to end of line */;
|
|
UngetChar(ts, c);
|
|
goto retry;
|
|
}
|
|
if (MatchChar(ts, '*')) {
|
|
while ((c = GetChar(ts)) != EOF &&
|
|
!(c == '*' && MatchChar(ts, '/'))) {
|
|
if (c == '/' && MatchChar(ts, '*')) {
|
|
if (MatchChar(ts, '/'))
|
|
goto retry;
|
|
js_ReportCompileError(cx, ts, "nested comment");
|
|
}
|
|
}
|
|
if (c == EOF) {
|
|
js_ReportCompileError(cx, ts, "unterminated comment");
|
|
RETURN(TOK_ERROR);
|
|
}
|
|
goto retry;
|
|
}
|
|
|
|
#if JS_HAS_REGEXPS
|
|
if (ts->flags & TSF_REGEXP) {
|
|
JSObject *obj;
|
|
uintN flags;
|
|
|
|
INIT_TOKENBUF(&ts->tokenbuf);
|
|
while ((c = GetChar(ts)) != '/') {
|
|
if (c == '\n' || c == EOF) {
|
|
UngetChar(ts, c);
|
|
js_ReportCompileError(cx, ts,
|
|
"unterminated regular expression literal");
|
|
RETURN(TOK_ERROR);
|
|
}
|
|
if (c == '\\') {
|
|
if (!AddToTokenBuf(cx, &ts->tokenbuf, (jschar)c))
|
|
RETURN(TOK_ERROR);
|
|
c = GetChar(ts);
|
|
}
|
|
if (!AddToTokenBuf(cx, &ts->tokenbuf, (jschar)c))
|
|
RETURN(TOK_ERROR);
|
|
}
|
|
FINISH_TOKENBUF(&ts->tokenbuf);
|
|
for (flags = 0; ; ) {
|
|
if (MatchChar(ts, 'g'))
|
|
flags |= JSREG_GLOB;
|
|
else if (MatchChar(ts, 'i'))
|
|
flags |= JSREG_FOLD;
|
|
else
|
|
break;
|
|
}
|
|
c = PeekChar(ts);
|
|
if (JS7_ISLET(c)) {
|
|
ts->token.ptr = ts->linebuf.ptr - 1;
|
|
js_ReportCompileError(cx, ts,
|
|
"invalid flag after regular expression");
|
|
(void) GetChar(ts);
|
|
RETURN(TOK_ERROR);
|
|
}
|
|
obj = js_NewRegExpObject(cx,
|
|
ts->tokenbuf.base,
|
|
TOKEN_LENGTH(&ts->tokenbuf),
|
|
flags);
|
|
if (!obj)
|
|
RETURN(TOK_ERROR);
|
|
atom = js_AtomizeObject(cx, obj, 0);
|
|
if (!atom)
|
|
RETURN(TOK_ERROR);
|
|
ts->token.t_op = JSOP_OBJECT;
|
|
ts->token.t_atom = atom;
|
|
RETURN(TOK_OBJECT);
|
|
}
|
|
#endif /* JS_HAS_REGEXPS */
|
|
|
|
ts->token.t_op = JSOP_DIV;
|
|
c = MatchChar(ts, '=') ? TOK_ASSIGN : TOK_DIVOP;
|
|
break;
|
|
|
|
case '%':
|
|
ts->token.t_op = JSOP_MOD;
|
|
c = MatchChar(ts, '=') ? TOK_ASSIGN : TOK_DIVOP;
|
|
break;
|
|
|
|
case '~':
|
|
ts->token.t_op = JSOP_BITNOT;
|
|
c = TOK_UNARYOP;
|
|
break;
|
|
|
|
case '+':
|
|
case '-':
|
|
if (MatchChar(ts, '=')) {
|
|
ts->token.t_op = (c == '+') ? JSOP_ADD : JSOP_SUB;
|
|
c = TOK_ASSIGN;
|
|
} else if (MatchChar(ts, c)) {
|
|
c = (c == '+') ? TOK_INC : TOK_DEC;
|
|
} else if (c == '-') {
|
|
ts->token.t_op = JSOP_NEG;
|
|
c = TOK_MINUS;
|
|
} else {
|
|
ts->token.t_op = JSOP_POS;
|
|
c = TOK_PLUS;
|
|
}
|
|
break;
|
|
|
|
#if JS_HAS_SHARP_VARS
|
|
case '#':
|
|
{
|
|
uint32 n;
|
|
|
|
c = GetChar(ts);
|
|
if (!JS7_ISDEC(c)) {
|
|
UngetChar(ts, c);
|
|
goto badchar;
|
|
}
|
|
n = (uint32)JS7_UNDEC(c);
|
|
for (;;) {
|
|
c = GetChar(ts);
|
|
if (!JS7_ISDEC(c))
|
|
break;
|
|
n = 10 * n + JS7_UNDEC(c);
|
|
if (n >= ATOM_INDEX_LIMIT) {
|
|
js_ReportCompileError(cx, ts,
|
|
"overlarge sharp variable number");
|
|
RETURN(TOK_ERROR);
|
|
}
|
|
}
|
|
ts->token.t_dval = (jsdouble) n;
|
|
if (c == '=')
|
|
RETURN(TOK_DEFSHARP);
|
|
if (c == '#')
|
|
RETURN(TOK_USESHARP);
|
|
goto badchar;
|
|
}
|
|
|
|
badchar:
|
|
#endif /* JS_HAS_SHARP_VARS */
|
|
|
|
default:
|
|
js_ReportCompileError(cx, ts, "illegal character");
|
|
RETURN(TOK_ERROR);
|
|
}
|
|
|
|
PR_ASSERT(c < TOK_LIMIT);
|
|
RETURN(c);
|
|
|
|
#undef INIT_TOKENBUF
|
|
#undef FINISH_TOKENBUF
|
|
#undef TOKEN_LENGTH
|
|
#undef RETURN
|
|
}
|
|
|
|
void
|
|
js_UngetToken(JSTokenStream *ts)
|
|
{
|
|
PR_ASSERT(ts->pushback.type == TOK_EOF);
|
|
if (ts->flags & TSF_ERROR)
|
|
return;
|
|
ts->pushback = ts->token;
|
|
}
|
|
|
|
JSBool
|
|
js_MatchToken(JSContext *cx, JSTokenStream *ts, JSTokenType tt)
|
|
{
|
|
if (js_GetToken(cx, ts) == tt)
|
|
return JS_TRUE;
|
|
js_UngetToken(ts);
|
|
return JS_FALSE;
|
|
}
|