/**************************************************************************** ** ** Copyright (C) 2009 Nokia Corporation and/or its subsidiary(-ies). ** All rights reserved. ** Contact: Nokia Corporation (qt-info@nokia.com) ** ** This file is part of the tools applications of the Qt Toolkit. ** ** $QT_BEGIN_LICENSE:LGPL$ ** No Commercial Usage ** This file contains pre-release code and may not be distributed. ** You may use this file in accordance with the terms and conditions ** contained in the Technology Preview License Agreement accompanying ** this package. ** ** GNU Lesser General Public License Usage ** Alternatively, this file may be used under the terms of the GNU Lesser ** General Public License version 2.1 as published by the Free Software ** Foundation and appearing in the file LICENSE.LGPL included in the ** packaging of this file. Please review the following information to ** ensure the GNU Lesser General Public License version 2.1 requirements ** will be met: http://www.gnu.org/licenses/old-licenses/lgpl-2.1.html. ** ** In addition, as a special exception, Nokia gives you certain additional ** rights. These rights are described in the Nokia Qt LGPL Exception ** version 1.1, included in the file LGPL_EXCEPTION.txt in this package. ** ** If you have questions regarding the use of this file, please contact ** Nokia at qt-info@nokia.com. ** ** ** ** ** ** ** ** ** $QT_END_LICENSE$ ** ****************************************************************************/ /* tokenizer.h */ #ifndef TOKENIZER_H #define TOKENIZER_H #include <qstack.h> #include <qstring.h> #include <stdio.h> #include "location.h" QT_BEGIN_NAMESPACE /* Here come the C++ tokens we support. The first part contains all-purpose tokens; then come keywords. If you add a keyword, make sure to modify the keyword array in tokenizer.cpp as well, and possibly adjust Tok_FirstKeyword and Tok_LastKeyword. 
*/
enum {
    /* All-purpose tokens. */
    Tok_Eoi,
    Tok_Ampersand,
    Tok_Aster,
    Tok_Caret,
    Tok_LeftParen,
    Tok_RightParen,
    Tok_LeftParenAster,
    Tok_Equal,
    Tok_LeftBrace,
    Tok_RightBrace,
    Tok_Semicolon,
    Tok_Colon,
    Tok_LeftAngle,
    Tok_RightAngle,
    Tok_Comma,
    Tok_Ellipsis,
    Tok_Gulbrandsen,
    Tok_LeftBracket,
    Tok_RightBracket,
    Tok_Tilde,
    Tok_SomeOperator,
    Tok_Number,
    Tok_String,
    Tok_Doc,
    Tok_Comment,
    Tok_Ident,
    Tok_At,

    /* Keywords; Tok_char must remain the first entry of this group. */
    Tok_char,
    Tok_class,
    Tok_const,
    Tok_double,
    Tok_enum,
    Tok_explicit,
    Tok_friend,
    Tok_inline,
    Tok_int,
    Tok_long,
    Tok_namespace,
    Tok_operator,
    Tok_private,
    Tok_protected,
    Tok_public,
    Tok_short,
    Tok_signals,
    Tok_signed,
    Tok_slots,
    Tok_static,
    Tok_struct,
    Tok_template,
    Tok_typedef,
    Tok_typename,
    Tok_union,
    Tok_unsigned,
    Tok_using,
    Tok_virtual,
    Tok_void,
    Tok_volatile,
    Tok_int64,
    Tok_Q_OBJECT,
    Tok_Q_OVERRIDE,
    Tok_Q_PROPERTY,
    Tok_Q_DECLARE_SEQUENTIAL_ITERATOR,
    Tok_Q_DECLARE_MUTABLE_SEQUENTIAL_ITERATOR,
    Tok_Q_DECLARE_ASSOCIATIVE_ITERATOR,
    Tok_Q_DECLARE_MUTABLE_ASSOCIATIVE_ITERATOR,
    Tok_Q_DECLARE_FLAGS,
    Tok_Q_SIGNALS,
    Tok_Q_SLOTS,
    Tok_QT_COMPAT,
    Tok_QT_COMPAT_CONSTRUCTOR,
    Tok_QT_DEPRECATED,
    Tok_QT_MOC_COMPAT,
    Tok_QT_MODULE,
    Tok_QT3_SUPPORT,
    Tok_QT3_SUPPORT_CONSTRUCTOR,
    Tok_QT3_MOC_SUPPORT,
    Tok_QDOC_PROPERTY,      /* must remain the last keyword entry */

    /* Inclusive bounds of the keyword range above. */
    Tok_FirstKeyword = Tok_char,
    Tok_LastKeyword = Tok_QDOC_PROPERTY
};

/*
  The Tokenizer class implements lexical analysis of C++ source
  files.

  Not every operator or keyword of C++ is recognized; only those
  that are interesting to us. Some Qt keywords or macros are also
  recognized.
*/ class Tokenizer { public: Tokenizer(const Location& loc, const QByteArray &in); Tokenizer(const Location& loc, FILE *in); ~Tokenizer(); int getToken(); void setParsingFnOrMacro(bool macro) { parsingMacro = macro; } bool parsingFnOrMacro() const { return parsingMacro; } const Location &location() const { return yyTokLoc; } QString previousLexeme() const { return QString(yyPrevLex); } QString lexeme() const { return QString(yyLex); } QString version() const { return yyVersion; } int braceDepth() const { return yyBraceDepth; } int parenDepth() const { return yyParenDepth; } int bracketDepth() const { return yyBracketDepth; } static void initialize(const Config &config); static void terminate(); static bool isTrue(const QString &condition); private: void init(); void start(const Location& loc); /* This limit on the length of a lexeme seems fairly high, but a doc comment can be arbitrarily long. The previous 65,536 limit was reached by Mark Summerfield. */ enum { yyLexBufSize = 524288 }; int getch() { return yyPos == yyIn.size() ? EOF : yyIn[yyPos++]; } inline int getChar() { if (yyCh == EOF) return EOF; if (yyLexLen < yyLexBufSize - 1) { yyLex[yyLexLen++] = (char) yyCh; yyLex[yyLexLen] = '\0'; } yyCurLoc.advance(yyCh); int ch = getch(); if (ch == EOF) return EOF; // cast explicitely to make sure the value of ch // is in range [0..255] to avoid assert messages // when using debug CRT that checks its input. return int(uint(uchar(ch))); } int getTokenAfterPreprocessor(); void pushSkipping(bool skip); bool popSkipping(); Location yyTokLoc; Location yyCurLoc; char *yyLexBuf1; char *yyLexBuf2; char *yyPrevLex; char *yyLex; size_t yyLexLen; QStack<bool> yyPreprocessorSkipping; int yyNumPreprocessorSkipping; int yyBraceDepth; int yyParenDepth; int yyBracketDepth; int yyCh; QString yyVersion; bool parsingMacro; protected: QByteArray yyIn; int yyPos; }; QT_END_NAMESPACE #endif