2001-06-06 20:29:01 +00:00
|
|
|
//===-- ReaderInternals.h - Definitions internal to the reader ---*- C++ -*--=//
|
|
|
|
//
|
|
|
|
// This header file defines various stuff that is used by the bytecode reader.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#ifndef READER_INTERNALS_H
|
|
|
|
#define READER_INTERNALS_H
|
|
|
|
|
2003-09-22 23:38:23 +00:00
|
|
|
#include "llvm/Constant.h"
#include "llvm/DerivedTypes.h"
#include "llvm/Function.h"
#include "llvm/ModuleProvider.h"
#include "llvm/Bytecode/Primitives.h"
#include <cstddef>
#include <utility>
#include <map>
#include <memory>
|
|
|
|
class Module;
|
2001-06-06 20:29:01 +00:00
|
|
|
|
2001-09-07 16:37:43 +00:00
|
|
|
// Enable to trace to figure out what the heck is going on when parsing fails
|
2003-09-04 23:47:07 +00:00
|
|
|
//#define TRACE_LEVEL 10
|
2001-09-07 16:37:43 +00:00
|
|
|
|
2003-09-22 23:38:23 +00:00
|
|
|
#if TRACE_LEVEL    // ByteCodeReading_TRACEr
// BCR_TRACE(n, X) - When tracing is enabled, stream X to std::cerr, indented
// by two spaces per level 'n', but only if 'n' is below TRACE_LEVEL.
//
// The expansion is written as "if (!cond) {} else <stream>" rather than
// "if (cond) <stream>" so that an 'else' following the macro at the call site
// cannot silently bind to the macro's own 'if'.  The macro still ends in a
// stream expression, so callers may keep appending with '<<'.  'n' is
// parenthesized so that compound expressions expand correctly.
#define BCR_TRACE(n, X) \
    if (!((n) < TRACE_LEVEL)) {} else std::cerr << std::string((n)*2, ' ') << X
#else
// Tracing disabled: the macro expands to nothing.
#define BCR_TRACE(n, X)
#endif
|
|
|
|
|
2001-06-06 20:29:01 +00:00
|
|
|
struct RawInst { // The raw fields out of the bytecode stream...
|
|
|
|
unsigned NumOperands;
|
|
|
|
unsigned Opcode;
|
|
|
|
const Type *Ty;
|
|
|
|
unsigned Arg1, Arg2;
|
|
|
|
union {
|
|
|
|
unsigned Arg3;
|
2002-01-20 22:54:45 +00:00
|
|
|
std::vector<unsigned> *VarArgs; // Contains arg #3,4,5... if NumOperands > 3
|
2001-06-06 20:29:01 +00:00
|
|
|
};
|
|
|
|
};
|
|
|
|
|
2003-09-22 23:38:23 +00:00
|
|
|
// LazyFunctionInfo - Record describing one function body that has not been
// read in yet: the extent of its bytes in the buffer plus its function slot.
struct LazyFunctionInfo {
  const unsigned char *Buf;      // Begin pointer of the function in the buffer
  const unsigned char *EndBuf;   // End pointer of the function in the buffer
  unsigned FunctionSlot;         // The function's slot number
};
|
|
|
|
|
|
|
|
class BytecodeParser : public AbstractTypeUser, public AbstractModuleProvider {
|
2002-08-17 22:01:27 +00:00
|
|
|
BytecodeParser(const BytecodeParser &); // DO NOT IMPLEMENT
|
|
|
|
void operator=(const BytecodeParser &); // DO NOT IMPLEMENT
|
2001-06-06 20:29:01 +00:00
|
|
|
public:
|
2003-09-22 23:58:08 +00:00
|
|
|
BytecodeParser() {
|
2001-06-06 20:29:01 +00:00
|
|
|
// Define this in case we don't see a ModuleGlobalInfo block.
|
|
|
|
FirstDerivedTyID = Type::FirstDerivedTyID;
|
|
|
|
}
|
2003-09-22 23:38:23 +00:00
|
|
|
|
2003-03-19 20:54:26 +00:00
|
|
|
~BytecodeParser() {
|
2003-05-22 18:26:48 +00:00
|
|
|
freeState();
|
|
|
|
}
|
|
|
|
void freeState() {
|
2003-03-19 20:54:26 +00:00
|
|
|
freeTable(Values);
|
|
|
|
freeTable(LateResolveValues);
|
|
|
|
freeTable(ModuleValues);
|
|
|
|
}
|
2001-06-06 20:29:01 +00:00
|
|
|
|
2003-09-22 23:38:23 +00:00
|
|
|
Module* releaseModule() {
|
|
|
|
// Since we're losing control of this Module, we must hand it back complete
|
|
|
|
materializeModule();
|
|
|
|
freeState();
|
|
|
|
Module *tempM = TheModule;
|
|
|
|
TheModule = 0;
|
|
|
|
return tempM;
|
|
|
|
}
|
2001-10-24 01:15:12 +00:00
|
|
|
|
2003-09-22 23:38:23 +00:00
|
|
|
void ParseBytecode(const unsigned char *Buf, unsigned Length,
|
|
|
|
const std::string &ModuleID);
|
2001-10-24 01:15:12 +00:00
|
|
|
|
2002-04-04 19:24:11 +00:00
|
|
|
void dump() const {
|
2002-06-25 20:44:04 +00:00
|
|
|
std::cerr << "BytecodeParser instance!\n";
|
2002-04-04 19:24:11 +00:00
|
|
|
}
|
|
|
|
|
2001-06-06 20:29:01 +00:00
|
|
|
private: // All of this data is transient across calls to ParseBytecode
|
2003-03-19 20:54:26 +00:00
|
|
|
struct ValueList : public User {
|
|
|
|
ValueList() : User(Type::TypeTy, Value::TypeVal) {
|
|
|
|
}
|
|
|
|
~ValueList() {}
|
|
|
|
|
|
|
|
// vector compatibility methods
|
|
|
|
unsigned size() const { return getNumOperands(); }
|
|
|
|
void push_back(Value *V) { Operands.push_back(Use(V, this)); }
|
|
|
|
Value *back() const { return Operands.back(); }
|
|
|
|
void pop_back() { Operands.pop_back(); }
|
|
|
|
bool empty() const { return Operands.empty(); }
|
|
|
|
|
|
|
|
virtual void print(std::ostream& OS) const {
|
|
|
|
OS << "Bytecode Reader UseHandle!";
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2003-03-06 17:55:45 +00:00
|
|
|
// Information about the module, extracted from the bytecode revision number.
|
|
|
|
unsigned char RevisionNum; // The rev # itself
|
|
|
|
unsigned char FirstDerivedTyID; // First variable index to use for type
|
|
|
|
bool HasImplicitZeroInitializer; // Is entry 0 of every slot implicity zeros?
|
2003-04-16 21:16:05 +00:00
|
|
|
bool hasInternalMarkerOnly; // Only types of linkage are intern/external
|
2003-03-06 17:55:45 +00:00
|
|
|
|
2003-03-19 20:54:26 +00:00
|
|
|
typedef std::vector<ValueList*> ValueTable;
|
2001-06-06 20:29:01 +00:00
|
|
|
ValueTable Values, LateResolveValues;
|
2003-03-19 20:54:26 +00:00
|
|
|
ValueTable ModuleValues;
|
2001-09-07 16:37:43 +00:00
|
|
|
|
2002-08-17 22:01:27 +00:00
|
|
|
// GlobalRefs - This maintains a mapping between <Type, Slot #>'s and forward
|
|
|
|
// references to global values or constants. Such values may be referenced
|
|
|
|
// before they are defined, and if so, the temporary object that they
|
|
|
|
// represent is held here.
|
|
|
|
//
|
2003-03-19 20:54:26 +00:00
|
|
|
typedef std::map<std::pair<const Type *, unsigned>, Value*> GlobalRefsType;
|
2002-08-17 22:01:27 +00:00
|
|
|
GlobalRefsType GlobalRefs;
|
2001-10-13 06:47:01 +00:00
|
|
|
|
2001-09-07 16:37:43 +00:00
|
|
|
// TypesLoaded - This vector mirrors the Values[TypeTyID] plane. It is used
|
|
|
|
// to deal with forward references to types.
|
|
|
|
//
|
2003-06-18 19:22:36 +00:00
|
|
|
typedef std::vector<PATypeHandle> TypeValuesListTy;
|
2001-09-07 16:37:43 +00:00
|
|
|
TypeValuesListTy ModuleTypeValues;
|
2003-03-06 17:18:14 +00:00
|
|
|
TypeValuesListTy FunctionTypeValues;
|
2001-06-06 20:29:01 +00:00
|
|
|
|
2003-03-19 20:54:26 +00:00
|
|
|
// When the ModuleGlobalInfo section is read, we create a function object for
|
|
|
|
// each function in the module. When the function is loaded, this function is
|
|
|
|
// filled in.
|
|
|
|
//
|
|
|
|
std::vector<std::pair<Function*, unsigned> > FunctionSignatureList;
|
|
|
|
|
|
|
|
// Constant values are read in after global variables. Because of this, we
|
|
|
|
// must defer setting the initializers on global variables until after module
|
|
|
|
// level constants have been read. In the mean time, this list keeps track of
|
|
|
|
// what we must do.
|
2001-06-06 20:29:01 +00:00
|
|
|
//
|
2003-03-19 20:54:26 +00:00
|
|
|
std::vector<std::pair<GlobalVariable*, unsigned> > GlobalInits;
|
2001-06-06 20:29:01 +00:00
|
|
|
|
2003-09-22 23:38:23 +00:00
|
|
|
// For lazy reading-in of functions, we need to save away several pieces of
|
|
|
|
// information about each function: its begin and end pointer in the buffer
|
|
|
|
// and its FunctionSlot.
|
|
|
|
//
|
|
|
|
std::map<Function*, LazyFunctionInfo*> LazyFunctionLoadMap;
|
|
|
|
|
2001-06-06 20:29:01 +00:00
|
|
|
private:
|
2003-03-19 20:54:26 +00:00
|
|
|
void freeTable(ValueTable &Tab) {
|
|
|
|
while (!Tab.empty()) {
|
|
|
|
delete Tab.back();
|
|
|
|
Tab.pop_back();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2003-09-22 23:38:23 +00:00
|
|
|
public:
|
|
|
|
void ParseModule(const unsigned char * Buf, const unsigned char *End);
|
|
|
|
void materializeFunction(Function *F);
|
|
|
|
|
|
|
|
private:
|
|
|
|
void ParseVersionInfo (const unsigned char *&Buf, const unsigned char *End);
|
|
|
|
void ParseModuleGlobalInfo(const unsigned char *&Buf, const unsigned char *E);
|
|
|
|
void ParseSymbolTable(const unsigned char *&Buf, const unsigned char *End,
|
|
|
|
SymbolTable *);
|
|
|
|
void ParseFunction(const unsigned char *&Buf, const unsigned char *End);
|
|
|
|
void ParseGlobalTypes(const unsigned char *&Buf, const unsigned char *EndBuf);
|
|
|
|
|
|
|
|
std::auto_ptr<BasicBlock>
|
|
|
|
ParseBasicBlock(const unsigned char *&Buf, const unsigned char *End);
|
|
|
|
|
2003-05-22 18:08:30 +00:00
|
|
|
bool ParseInstruction (const unsigned char *&Buf, const unsigned char *End,
|
2003-09-08 18:04:16 +00:00
|
|
|
Instruction *&);
|
2003-09-23 16:17:50 +00:00
|
|
|
std::auto_ptr<RawInst> ParseRawInst(const unsigned char *&Buf,
|
|
|
|
const unsigned char *End);
|
2003-05-22 18:08:30 +00:00
|
|
|
|
2003-09-22 23:38:23 +00:00
|
|
|
void ParseConstantPool(const unsigned char *&Buf, const unsigned char *EndBuf,
|
|
|
|
ValueTable &Tab, TypeValuesListTy &TypeTab);
|
|
|
|
void parseConstantValue(const unsigned char *&Buf, const unsigned char *End,
|
2001-12-03 22:26:30 +00:00
|
|
|
const Type *Ty, Constant *&V);
|
2003-09-22 23:38:23 +00:00
|
|
|
void parseTypeConstants(const unsigned char *&Buf,
|
2003-05-22 18:08:30 +00:00
|
|
|
const unsigned char *EndBuf,
|
2003-09-22 23:38:23 +00:00
|
|
|
TypeValuesListTy &Tab, unsigned NumEntries);
|
2003-05-22 18:08:30 +00:00
|
|
|
const Type *parseTypeConstant(const unsigned char *&Buf,
|
|
|
|
const unsigned char *EndBuf);
|
2001-06-06 20:29:01 +00:00
|
|
|
|
|
|
|
Value *getValue(const Type *Ty, unsigned num, bool Create = true);
|
|
|
|
const Type *getType(unsigned ID);
|
2002-10-14 03:33:02 +00:00
|
|
|
Constant *getConstantValue(const Type *Ty, unsigned num);
|
2001-06-06 20:29:01 +00:00
|
|
|
|
2003-03-19 20:54:26 +00:00
|
|
|
int insertValue(Value *V, ValueTable &Table); // -1 = Failure
|
|
|
|
void setValueTo(ValueTable &D, unsigned Slot, Value *V);
|
2003-09-22 23:38:23 +00:00
|
|
|
void postResolveValues(ValueTable &ValTab);
|
2001-06-06 20:29:01 +00:00
|
|
|
|
2003-09-22 23:38:23 +00:00
|
|
|
void getTypeSlot(const Type *Ty, unsigned &Slot);
|
2001-09-07 16:37:43 +00:00
|
|
|
|
2002-08-17 22:01:27 +00:00
|
|
|
// resolve all references to the placeholder (if any) for the given value
|
|
|
|
void ResolveReferencesToValue(Value *Val, unsigned Slot);
|
|
|
|
|
2002-07-14 23:05:09 +00:00
|
|
|
|
2001-09-07 16:37:43 +00:00
|
|
|
// refineAbstractType - The callback method is invoked when one of the
|
|
|
|
// elements of TypeValues becomes more concrete...
|
|
|
|
//
|
|
|
|
virtual void refineAbstractType(const DerivedType *OldTy, const Type *NewTy);
|
2001-06-06 20:29:01 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
template<class SuperType>
|
|
|
|
class PlaceholderDef : public SuperType {
|
|
|
|
unsigned ID;
|
2002-08-17 22:01:27 +00:00
|
|
|
PlaceholderDef(); // DO NOT IMPLEMENT
|
|
|
|
void operator=(const PlaceholderDef &); // DO NOT IMPLEMENT
|
2001-06-06 20:29:01 +00:00
|
|
|
public:
|
|
|
|
PlaceholderDef(const Type *Ty, unsigned id) : SuperType(Ty), ID(id) {}
|
|
|
|
unsigned getID() { return ID; }
|
|
|
|
};
|
|
|
|
|
|
|
|
struct InstPlaceHolderHelper : public Instruction {
|
|
|
|
InstPlaceHolderHelper(const Type *Ty) : Instruction(Ty, UserOp1, "") {}
|
2001-07-07 19:24:15 +00:00
|
|
|
virtual const char *getOpcodeName() const { return "placeholder"; }
|
2001-06-06 20:29:01 +00:00
|
|
|
|
|
|
|
virtual Instruction *clone() const { abort(); return 0; }
|
|
|
|
};
|
|
|
|
|
|
|
|
struct BBPlaceHolderHelper : public BasicBlock {
|
|
|
|
BBPlaceHolderHelper(const Type *Ty) : BasicBlock() {
|
2002-04-08 21:59:36 +00:00
|
|
|
assert(Ty == Type::LabelTy);
|
2001-06-06 20:29:01 +00:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2002-07-14 23:05:09 +00:00
|
|
|
struct ConstantPlaceHolderHelper : public Constant {
|
|
|
|
ConstantPlaceHolderHelper(const Type *Ty)
|
|
|
|
: Constant(Ty) {}
|
|
|
|
virtual bool isNullValue() const { return false; }
|
|
|
|
};
|
|
|
|
|
2002-08-17 22:01:27 +00:00
|
|
|
// Concrete placeholder types, one per helper base class:
//   ValPHolder   - placeholder built on InstPlaceHolderHelper
//   BBPHolder    - placeholder built on BBPlaceHolderHelper
//   ConstPHolder - placeholder built on ConstantPlaceHolderHelper
typedef PlaceholderDef<InstPlaceHolderHelper>      ValPHolder;
typedef PlaceholderDef<BBPlaceHolderHelper>        BBPHolder;
typedef PlaceholderDef<ConstantPlaceHolderHelper>  ConstPHolder;
|
|
|
|
|
2003-09-22 23:38:23 +00:00
|
|
|
// Messages for the errors the reader reports most often.  Each is a
// file-static std::string.
static const std::string Error_readvbr("read_vbr(): error reading.");
static const std::string Error_read("read(): error reading.");
static const std::string Error_inputdata("input_data(): error reading.");
static const std::string Error_DestSlot("No destination slot found.");
|
2001-06-06 20:29:01 +00:00
|
|
|
|
2002-08-17 22:01:27 +00:00
|
|
|
// getValueIDNumberFromPlaceHolder - Return the ID stored in the placeholder
// object Val.  The concrete placeholder class is chosen from the value
// itself: constants are ConstPHolders, values of label type are BBPHolders,
// and everything else is treated as a ValPHolder.
static inline unsigned getValueIDNumberFromPlaceHolder(Value *Val) {
  // Constants are recognized first, regardless of their type.
  if (isa<Constant>(Val))
    return static_cast<ConstPHolder*>(Val)->getID();

  // Otherwise discriminate by type: label-typed values are basic blocks.
  if (Val->getType()->getPrimitiveID() == Type::LabelTyID)
    return static_cast<BBPHolder*>(Val)->getID();

  return static_cast<ValPHolder*>(Val)->getID();
}
|
|
|
|
|
2003-09-22 23:38:23 +00:00
|
|
|
static inline void readBlock(const unsigned char *&Buf,
|
2003-05-22 18:08:30 +00:00
|
|
|
const unsigned char *EndBuf,
|
2003-09-22 23:38:23 +00:00
|
|
|
unsigned &Type, unsigned &Size) {
|
2001-06-06 20:29:01 +00:00
|
|
|
#if DEBUG_OUTPUT
|
|
|
|
bool Result = read(Buf, EndBuf, Type) || read(Buf, EndBuf, Size);
|
2002-06-25 20:44:04 +00:00
|
|
|
std::cerr << "StartLoc = " << ((unsigned)Buf & 4095)
|
2001-06-06 20:29:01 +00:00
|
|
|
<< " Type = " << Type << " Size = " << Size << endl;
|
2003-09-22 23:38:23 +00:00
|
|
|
if (Result) throw Error_read;
|
2001-06-06 20:29:01 +00:00
|
|
|
#else
|
2003-09-22 23:38:23 +00:00
|
|
|
if (read(Buf, EndBuf, Type) || read(Buf, EndBuf, Size)) throw Error_read;
|
2001-06-06 20:29:01 +00:00
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
|
|
|
#endif
|