2007-11-18 02:57:27 +00:00
|
|
|
//===- TGLexer.h - Lexer for TableGen Files ---------------------*- C++ -*-===//
|
|
|
|
//
|
|
|
|
// The LLVM Compiler Infrastructure
|
|
|
|
//
|
2007-12-29 20:37:13 +00:00
|
|
|
// This file is distributed under the University of Illinois Open Source
|
|
|
|
// License. See LICENSE.TXT for details.
|
2007-11-18 02:57:27 +00:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
//
|
|
|
|
// This class represents the Lexer for tablegen files.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#ifndef TGLEXER_H
|
|
|
|
#define TGLEXER_H
|
|
|
|
|
2010-11-29 18:47:54 +00:00
|
|
|
#include "llvm/Support/DataTypes.h"
|
2007-11-18 02:57:27 +00:00
|
|
|
#include <string>
|
2011-06-01 13:10:15 +00:00
|
|
|
#include <vector>
|
2007-11-22 23:19:05 +00:00
|
|
|
#include <cassert>
|
2007-11-18 02:57:27 +00:00
|
|
|
|
|
|
|
namespace llvm {
|
|
|
|
class MemoryBuffer;
|
2009-06-21 03:41:50 +00:00
|
|
|
class SourceMgr;
|
2009-06-21 03:39:35 +00:00
|
|
|
class SMLoc;
|
2010-09-27 17:42:11 +00:00
|
|
|
class Twine;
|
|
|
|
|
2007-11-22 20:49:04 +00:00
|
|
|
namespace tgtok {
|
|
|
|
enum TokKind {
|
|
|
|
// Markers
|
|
|
|
Eof, Error,
|
|
|
|
|
|
|
|
// Tokens with no info.
|
|
|
|
minus, plus, // - +
|
|
|
|
l_square, r_square, // [ ]
|
|
|
|
l_brace, r_brace, // { }
|
|
|
|
l_paren, r_paren, // ( )
|
|
|
|
less, greater, // < >
|
2011-03-14 02:30:32 +00:00
|
|
|
colon, semi, // : ;
|
2007-11-22 20:49:04 +00:00
|
|
|
comma, period, // , .
|
|
|
|
equal, question, // = ?
|
2011-10-19 13:04:43 +00:00
|
|
|
paste, // #
|
|
|
|
|
2007-11-22 20:49:04 +00:00
|
|
|
// Keywords.
|
2011-10-07 18:25:05 +00:00
|
|
|
Bit, Bits, Class, Code, Dag, Def, Defm, Field, In, Int, Let, List,
|
2007-11-22 20:49:04 +00:00
|
|
|
MultiClass, String,
|
|
|
|
|
|
|
|
// !keywords.
|
2010-10-06 00:19:21 +00:00
|
|
|
XConcat, XSRA, XSRL, XSHL, XStrConcat, XCast, XSubst,
|
2011-01-07 17:05:37 +00:00
|
|
|
XForEach, XHead, XTail, XEmpty, XIf, XEq,
|
2009-04-22 20:18:10 +00:00
|
|
|
|
2007-11-22 20:49:04 +00:00
|
|
|
// Integer value.
|
|
|
|
IntVal,
|
|
|
|
|
|
|
|
// String valued tokens.
|
|
|
|
Id, StrVal, VarName, CodeFragment
|
|
|
|
};
|
|
|
|
}
|
2007-11-18 02:57:27 +00:00
|
|
|
|
2007-11-22 20:49:04 +00:00
|
|
|
/// TGLexer - TableGen Lexer class.
|
2007-11-18 02:57:27 +00:00
|
|
|
class TGLexer {
|
2009-06-21 03:41:50 +00:00
|
|
|
SourceMgr &SrcMgr;
|
2009-03-13 07:05:43 +00:00
|
|
|
|
2007-11-18 02:57:27 +00:00
|
|
|
const char *CurPtr;
|
2009-03-13 07:05:43 +00:00
|
|
|
const MemoryBuffer *CurBuf;
|
2007-11-18 02:57:27 +00:00
|
|
|
|
2007-11-22 20:49:04 +00:00
|
|
|
// Information about the current token.
|
|
|
|
const char *TokStart;
|
|
|
|
tgtok::TokKind CurCode;
|
|
|
|
std::string CurStrVal; // This is valid for ID, STRVAL, VARNAME, CODEFRAGMENT
|
2008-10-17 01:33:43 +00:00
|
|
|
int64_t CurIntVal; // This is valid for INTVAL.
|
2009-03-13 07:05:43 +00:00
|
|
|
|
|
|
|
/// CurBuffer - This is the current buffer index we're lexing from as managed
|
|
|
|
/// by the SourceMgr object.
|
|
|
|
int CurBuffer;
|
2011-06-01 13:10:15 +00:00
|
|
|
/// Dependencies - This is the list of all included files.
|
|
|
|
std::vector<std::string> Dependencies;
|
2007-11-18 02:57:27 +00:00
|
|
|
|
|
|
|
public:
|
2009-06-21 03:41:50 +00:00
|
|
|
TGLexer(SourceMgr &SrcMgr);
|
2009-03-13 07:05:43 +00:00
|
|
|
~TGLexer() {}
|
2007-11-18 02:57:27 +00:00
|
|
|
|
2007-11-22 20:49:04 +00:00
|
|
|
tgtok::TokKind Lex() {
|
|
|
|
return CurCode = LexToken();
|
|
|
|
}
|
2011-06-01 13:10:15 +00:00
|
|
|
|
|
|
|
const std::vector<std::string> &getDependencies() const {
|
|
|
|
return Dependencies;
|
|
|
|
}
|
2007-11-22 20:49:04 +00:00
|
|
|
|
|
|
|
tgtok::TokKind getCode() const { return CurCode; }
|
2007-11-18 02:57:27 +00:00
|
|
|
|
2007-11-22 20:49:04 +00:00
|
|
|
const std::string &getCurStrVal() const {
|
|
|
|
assert((CurCode == tgtok::Id || CurCode == tgtok::StrVal ||
|
|
|
|
CurCode == tgtok::VarName || CurCode == tgtok::CodeFragment) &&
|
|
|
|
"This token doesn't have a string value");
|
|
|
|
return CurStrVal;
|
|
|
|
}
|
2008-10-17 01:33:43 +00:00
|
|
|
int64_t getCurIntVal() const {
|
2007-11-22 20:49:04 +00:00
|
|
|
assert(CurCode == tgtok::IntVal && "This token isn't an integer");
|
|
|
|
return CurIntVal;
|
|
|
|
}
|
2007-11-19 07:43:52 +00:00
|
|
|
|
2009-06-21 03:39:35 +00:00
|
|
|
SMLoc getLoc() const;
|
2007-11-19 07:38:58 +00:00
|
|
|
|
2007-11-18 02:57:27 +00:00
|
|
|
private:
|
2007-11-22 20:49:04 +00:00
|
|
|
/// LexToken - Read the next token and return its code.
|
|
|
|
tgtok::TokKind LexToken();
|
|
|
|
|
2010-09-27 17:42:11 +00:00
|
|
|
tgtok::TokKind ReturnError(const char *Loc, const Twine &Msg);
|
2007-11-19 07:38:58 +00:00
|
|
|
|
2007-11-18 02:57:27 +00:00
|
|
|
int getNextChar();
|
2011-10-19 13:03:35 +00:00
|
|
|
int peekNextChar(int Index);
|
2007-11-18 02:57:27 +00:00
|
|
|
void SkipBCPLComment();
|
|
|
|
bool SkipCComment();
|
2007-11-22 20:49:04 +00:00
|
|
|
tgtok::TokKind LexIdentifier();
|
2007-11-18 02:57:27 +00:00
|
|
|
bool LexInclude();
|
2007-11-22 20:49:04 +00:00
|
|
|
tgtok::TokKind LexString();
|
|
|
|
tgtok::TokKind LexVarName();
|
|
|
|
tgtok::TokKind LexNumber();
|
|
|
|
tgtok::TokKind LexBracket();
|
|
|
|
tgtok::TokKind LexExclaim();
|
2007-11-18 02:57:27 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
} // end namespace llvm
|
|
|
|
|
|
|
|
#endif
|