//===- AsmLexer.h - Lexer for Assembly Files --------------------*- C++ -*-===// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// // // This class declares the lexer for assembly files. // //===----------------------------------------------------------------------===// #ifndef ASMLEXER_H #define ASMLEXER_H #include "llvm/ADT/StringRef.h" #include "llvm/MC/MCAsmLexer.h" #include "llvm/Support/DataTypes.h" #include #include namespace llvm { class MemoryBuffer; class SourceMgr; class SMLoc; namespace asmtok { enum TokKind { // Markers Eof, Error, // String values. Identifier, Register, String, // Integer values. IntVal, // No-value. EndOfStatement, Colon, Plus, Minus, Tilde, Slash, // '/' LParen, RParen, Star, Comma, Dollar, Equal, EqualEqual, Pipe, PipePipe, Caret, Amp, AmpAmp, Exclaim, ExclaimEqual, Percent, Less, LessEqual, LessLess, LessGreater, Greater, GreaterEqual, GreaterGreater }; } /// AsmLexer - Lexer class for assembly files. class AsmLexer : public MCAsmLexer { SourceMgr &SrcMgr; const char *CurPtr; const MemoryBuffer *CurBuf; // A llvm::StringSet<>, which provides uniqued and null-terminated strings. void *TheStringSet; // Information about the current token. const char *TokStart; asmtok::TokKind CurKind; const char *CurStrVal; // This is valid for Identifier. int64_t CurIntVal; /// CurBuffer - This is the current buffer index we're lexing from as managed /// by the SourceMgr object. int CurBuffer; void operator=(const AsmLexer&); // DO NOT IMPLEMENT AsmLexer(const AsmLexer&); // DO NOT IMPLEMENT public: AsmLexer(SourceMgr &SrcMgr); ~AsmLexer(); asmtok::TokKind Lex() { return CurKind = LexToken(); } asmtok::TokKind getKind() const { return CurKind; } bool is(asmtok::TokKind K) const { return CurKind == K; } bool isNot(asmtok::TokKind K) const { return CurKind != K; } /// getCurStrVal - Get the string for the current token, this includes all /// characters (for example, the quotes on strings) in the token. /// /// The returned StringRef points into the source manager's memory buffer, and /// is safe to store across calls to Lex(). StringRef getCurStrVal() const { assert((CurKind == asmtok::Identifier || CurKind == asmtok::Register || CurKind == asmtok::String) && "This token doesn't have a string value"); return CurStrVal; } int64_t getCurIntVal() const { assert(CurKind == asmtok::IntVal && "This token isn't an integer"); return CurIntVal; } SMLoc getLoc() const; /// EnterIncludeFile - Enter the specified file. This returns true on failure. bool EnterIncludeFile(const std::string &Filename); void PrintMessage(SMLoc Loc, const std::string &Msg, const char *Type) const; private: int getNextChar(); asmtok::TokKind ReturnError(const char *Loc, const std::string &Msg); /// LexToken - Read the next token and return its code. asmtok::TokKind LexToken(); asmtok::TokKind LexIdentifier(); asmtok::TokKind LexPercent(); asmtok::TokKind LexSlash(); asmtok::TokKind LexLineComment(); asmtok::TokKind LexDigit(); asmtok::TokKind LexQuote(); }; } // end namespace llvm #endif