summaryrefslogtreecommitdiffstats
path: root/kjs/lexer.h
diff options
context:
space:
mode:
Diffstat (limited to 'kjs/lexer.h')
-rw-r--r--kjs/lexer.h165
1 files changed, 165 insertions, 0 deletions
diff --git a/kjs/lexer.h b/kjs/lexer.h
new file mode 100644
index 000000000..c6cb6aa88
--- /dev/null
+++ b/kjs/lexer.h
@@ -0,0 +1,165 @@
+// -*- c-basic-offset: 2 -*-
+/*
+ * This file is part of the KDE libraries
+ * Copyright (C) 1999-2000 Harri Porten (porten@kde.org)
+ *
+ * This library is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Library General Public
+ * License as published by the Free Software Foundation; either
+ * version 2 of the License, or (at your option) any later version.
+ *
+ * This library is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ * Library General Public License for more details.
+ *
+ * You should have received a copy of the GNU Library General Public License
+ * along with this library; see the file COPYING.LIB. If not, write to
+ * the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
+ * Boston, MA 02110-1301, USA.
+ *
+ */
+
+#ifndef _KJSLEXER_H_
+#define _KJSLEXER_H_
+
+#include "ustring.h"
+
+
+namespace KJS {
+
+ class Identifier;
+
+ class RegExp;
+
+ class Lexer {
+ public:
+ Lexer();
+ ~Lexer();
+ static Lexer *curr();
+
+ void setCode(const UChar *c, unsigned int len);
+ int lex();
+
+ int lineNo() const { return yylineno + 1; }
+
+ bool prevTerminator() const { return terminator; }
+
+ enum State { Start,
+ IdentifierOrKeyword,
+ Identifier,
+ InIdentifierOrKeyword,
+ InIdentifier,
+ InIdentifierUnicodeEscapeStart,
+ InIdentifierUnicodeEscape,
+ InSingleLineComment,
+ InMultiLineComment,
+ InNum,
+ InNum0,
+ InHex,
+ InOctal,
+ InDecimal,
+ InExponentIndicator,
+ InExponent,
+ Hex,
+ Octal,
+ Number,
+ String,
+ Eof,
+ InString,
+ InEscapeSequence,
+ InHexEscape,
+ InUnicodeEscape,
+ Other,
+ Bad };
+
+ bool scanRegExp();
+ UString pattern, flags;
+ bool hadError() const { return foundBad; }
+
+ static bool isWhiteSpace(unsigned short c);
+ static bool isIdentLetter(unsigned short c);
+ static bool isDecimalDigit(unsigned short c);
+ static bool isHexDigit(unsigned short c);
+ static bool isOctalDigit(unsigned short c);
+
+ private:
+ int yylineno;
+ bool done;
+ char *buffer8;
+ UChar *buffer16;
+ unsigned int size8, size16;
+ unsigned int pos8, pos16;
+ bool terminator;
+ bool restrKeyword;
+ // encountered delimiter like "'" and "}" on last run
+ bool delimited;
+ bool skipLF;
+ bool skipCR;
+ bool convertNextIdentifier;
+ int stackToken;
+ int lastToken;
+ bool foundBad;
+
+ State state;
+ void setDone(State s);
+ unsigned int pos;
+ void shift(unsigned int p);
+ void nextLine();
+ int lookupKeyword(const char *);
+
+ int matchPunctuator(unsigned short c1, unsigned short c2,
+ unsigned short c3, unsigned short c4);
+ unsigned short singleEscape(unsigned short c) const;
+ unsigned short convertOctal(unsigned short c1, unsigned short c2,
+ unsigned short c3) const;
+ public:
+ static unsigned char convertHex(unsigned short c1);
+ static unsigned char convertHex(unsigned short c1, unsigned short c2);
+ static UChar convertUnicode(unsigned short c1, unsigned short c2,
+ unsigned short c3, unsigned short c4);
+
+#ifdef KJS_DEBUG_MEM
+ /**
+ * Clear statically allocated resources
+ */
+ static void globalClear();
+#endif
+
+ void doneParsing();
+
+ private:
+
+ void record8(unsigned short c);
+ void record16(int c);
+ void record16(UChar c);
+
+ KJS::Identifier *makeIdentifier(UChar *buffer, unsigned int pos);
+ UString *makeUString(UChar *buffer, unsigned int pos);
+
+ const UChar *code;
+ unsigned int length;
+ int yycolumn;
+#ifndef KJS_PURE_ECMA
+ int bol; // begin of line
+#endif
+
+ // current and following unicode characters (int to allow for -1 for end-of-file marker)
+ int current, next1, next2, next3;
+
+ UString **strings;
+ unsigned int numStrings;
+ unsigned int stringsCapacity;
+
+ KJS::Identifier **identifiers;
+ unsigned int numIdentifiers;
+ unsigned int identifiersCapacity;
+
+ // for future extensions
+ class LexerPrivate;
+ LexerPrivate *priv;
+ };
+
+} // namespace
+
+#endif