//===- ReadConst.cpp - Code to constants and constant pools ---------------===// // // This file implements functionality to deserialize constants and entire // constant pools. // // Note that this library should be as fast as possible, reentrant, and // thread-safe!! // //===----------------------------------------------------------------------===// #include "ReaderInternals.h" #include "llvm/Module.h" #include "llvm/Constants.h" #include const Type *BytecodeParser::parseTypeConstant(const unsigned char *&Buf, const unsigned char *EndBuf) { unsigned PrimType; if (read_vbr(Buf, EndBuf, PrimType)) throw Error_readvbr; const Type *Val = 0; if ((Val = Type::getPrimitiveType((Type::PrimitiveID)PrimType))) return Val; switch (PrimType) { case Type::FunctionTyID: { unsigned Typ; if (read_vbr(Buf, EndBuf, Typ)) return Val; const Type *RetType = getType(Typ); if (RetType == 0) return Val; unsigned NumParams; if (read_vbr(Buf, EndBuf, NumParams)) return Val; std::vector Params; while (NumParams--) { if (read_vbr(Buf, EndBuf, Typ)) return Val; const Type *Ty = getType(Typ); if (Ty == 0) return Val; Params.push_back(Ty); } bool isVarArg = Params.size() && Params.back() == Type::VoidTy; if (isVarArg) Params.pop_back(); return FunctionType::get(RetType, Params, isVarArg); } case Type::ArrayTyID: { unsigned ElTyp; if (read_vbr(Buf, EndBuf, ElTyp)) return Val; const Type *ElementType = getType(ElTyp); if (ElementType == 0) return Val; unsigned NumElements; if (read_vbr(Buf, EndBuf, NumElements)) return Val; BCR_TRACE(5, "Array Type Constant #" << ElTyp << " size=" << NumElements << "\n"); return ArrayType::get(ElementType, NumElements); } case Type::StructTyID: { unsigned Typ; std::vector Elements; if (read_vbr(Buf, EndBuf, Typ)) return Val; while (Typ) { // List is terminated by void/0 typeid const Type *Ty = getType(Typ); if (Ty == 0) return Val; Elements.push_back(Ty); if (read_vbr(Buf, EndBuf, Typ)) return Val; } return StructType::get(Elements); } case Type::PointerTyID: { unsigned ElTyp; if (read_vbr(Buf, EndBuf, ElTyp)) return Val; BCR_TRACE(5, "Pointer Type Constant #" << ElTyp << "\n"); const Type *ElementType = getType(ElTyp); if (ElementType == 0) return Val; return PointerType::get(ElementType); } case Type::OpaqueTyID: { return OpaqueType::get(); } default: std::cerr << __FILE__ << ":" << __LINE__ << ": Don't know how to deserialize" << " primitive Type " << PrimType << "\n"; return Val; } } // parseTypeConstants - We have to use this weird code to handle recursive // types. We know that recursive types will only reference the current slab of // values in the type plane, but they can forward reference types before they // have been read. For example, Type #0 might be '{ Ty#1 }' and Type #1 might // be 'Ty#0*'. When reading Type #0, type number one doesn't exist. To fix // this ugly problem, we pessimistically insert an opaque type for each type we // are about to read. This means that forward references will resolve to // something and when we reread the type later, we can replace the opaque type // with a new resolved concrete type. // void debug_type_tables(); void BytecodeParser::parseTypeConstants(const unsigned char *&Buf, const unsigned char *EndBuf, TypeValuesListTy &Tab, unsigned NumEntries) { assert(Tab.size() == 0 && "should not have read type constants in before!"); // Insert a bunch of opaque types to be resolved later... for (unsigned i = 0; i < NumEntries; ++i) Tab.push_back(OpaqueType::get()); // Loop through reading all of the types. Forward types will make use of the // opaque types just inserted. // for (unsigned i = 0; i < NumEntries; ++i) { const Type *NewTy = parseTypeConstant(Buf, EndBuf), *OldTy = Tab[i].get(); if (NewTy == 0) throw std::string("Parsed invalid type."); BCR_TRACE(4, "#" << i << ": Read Type Constant: '" << NewTy << "' Replacing: " << OldTy << "\n"); // Don't insertValue the new type... instead we want to replace the opaque // type with the new concrete value... // // Refine the abstract type to the new type. This causes all uses of the // abstract type to use the newty. This also will cause the opaque type // to be deleted... // ((DerivedType*)Tab[i].get())->refineAbstractTypeTo(NewTy); // This should have replace the old opaque type with the new type in the // value table... or with a preexisting type that was already in the system assert(Tab[i] != OldTy && "refineAbstractType didn't work!"); } BCR_TRACE(5, "Resulting types:\n"); for (unsigned i = 0; i < NumEntries; ++i) { BCR_TRACE(5, (void*)Tab[i].get() << " - " << Tab[i].get() << "\n"); } debug_type_tables(); } void BytecodeParser::parseConstantValue(const unsigned char *&Buf, const unsigned char *EndBuf, const Type *Ty, Constant *&V) { // We must check for a ConstantExpr before switching by type because // a ConstantExpr can be of any type, and has no explicit value. // unsigned isExprNumArgs; // 0 if not expr; numArgs if is expr if (read_vbr(Buf, EndBuf, isExprNumArgs)) throw Error_readvbr; if (isExprNumArgs) { // FIXME: Encoding of constant exprs could be much more compact! unsigned Opcode; std::vector ArgVec; ArgVec.reserve(isExprNumArgs); if (read_vbr(Buf, EndBuf, Opcode)) throw Error_readvbr; // Read the slot number and types of each of the arguments for (unsigned i = 0; i != isExprNumArgs; ++i) { unsigned ArgValSlot, ArgTypeSlot; if (read_vbr(Buf, EndBuf, ArgValSlot)) throw Error_readvbr; if (read_vbr(Buf, EndBuf, ArgTypeSlot)) throw Error_readvbr; const Type *ArgTy = getType(ArgTypeSlot); if (ArgTy == 0) throw std::string("Argument type slot not found."); BCR_TRACE(4, "CE Arg " << i << ": Type: '" << ArgTy << "' slot: " << ArgValSlot << "\n"); // Get the arg value from its slot if it exists, otherwise a placeholder Constant *C = getConstantValue(ArgTy, ArgValSlot); if (C == 0) throw std::string("No arg value or placeholder found."); ArgVec.push_back(C); } // Construct a ConstantExpr of the appropriate kind if (isExprNumArgs == 1) { // All one-operand expressions assert(Opcode == Instruction::Cast); V = ConstantExpr::getCast(ArgVec[0], Ty); } else if (Opcode == Instruction::GetElementPtr) { // GetElementPtr std::vector IdxList(ArgVec.begin()+1, ArgVec.end()); V = ConstantExpr::getGetElementPtr(ArgVec[0], IdxList); } else { // All other 2-operand expressions V = ConstantExpr::get(Opcode, ArgVec[0], ArgVec[1]); } return; } // Ok, not an ConstantExpr. We now know how to read the given type... switch (Ty->getPrimitiveID()) { case Type::BoolTyID: { unsigned Val; if (read_vbr(Buf, EndBuf, Val)) throw Error_readvbr; if (Val != 0 && Val != 1) throw std::string("Invalid boolean value read."); V = ConstantBool::get(Val == 1); break; } case Type::UByteTyID: // Unsigned integer types... case Type::UShortTyID: case Type::UIntTyID: { unsigned Val; if (read_vbr(Buf, EndBuf, Val)) throw Error_readvbr; if (!ConstantUInt::isValueValidForType(Ty, Val)) throw std::string("Invalid unsigned byte/short/int read."); V = ConstantUInt::get(Ty, Val); break; } case Type::ULongTyID: { uint64_t Val; if (read_vbr(Buf, EndBuf, Val)) throw Error_readvbr; V = ConstantUInt::get(Ty, Val); break; } case Type::SByteTyID: // Signed integer types... case Type::ShortTyID: case Type::IntTyID: { case Type::LongTyID: int64_t Val; if (read_vbr(Buf, EndBuf, Val)) throw Error_readvbr; if (!ConstantSInt::isValueValidForType(Ty, Val)) throw std::string("Invalid signed byte/short/int/long read."); V = ConstantSInt::get(Ty, Val); break; } case Type::FloatTyID: { float F; if (input_data(Buf, EndBuf, &F, &F+1)) throw Error_inputdata; V = ConstantFP::get(Ty, F); break; } case Type::DoubleTyID: { double Val; if (input_data(Buf, EndBuf, &Val, &Val+1)) throw Error_inputdata; V = ConstantFP::get(Ty, Val); break; } case Type::TypeTyID: assert(0 && "Type constants should be handled separately!!!"); abort(); case Type::ArrayTyID: { const ArrayType *AT = cast(Ty); unsigned NumElements = AT->getNumElements(); std::vector Elements; while (NumElements--) { // Read all of the elements of the constant. unsigned Slot; if (read_vbr(Buf, EndBuf, Slot)) throw Error_readvbr; Constant *C = getConstantValue(AT->getElementType(), Slot); if (!C) throw std::string("Unable to get const value of array slot."); Elements.push_back(C); } V = ConstantArray::get(AT, Elements); break; } case Type::StructTyID: { const StructType *ST = cast(Ty); const StructType::ElementTypes &ET = ST->getElementTypes(); std::vector Elements; for (unsigned i = 0; i < ET.size(); ++i) { unsigned Slot; if (read_vbr(Buf, EndBuf, Slot)) throw Error_readvbr; Constant *C = getConstantValue(ET[i], Slot); if (!C) throw std::string("Could not read const value in struct slot."); Elements.push_back(C); } V = ConstantStruct::get(ST, Elements); break; } case Type::PointerTyID: { const PointerType *PT = cast(Ty); unsigned SubClass; if (HasImplicitZeroInitializer) SubClass = 1; else if (read_vbr(Buf, EndBuf, SubClass)) throw Error_readvbr; switch (SubClass) { case 0: // ConstantPointerNull value... V = ConstantPointerNull::get(PT); break; case 1: { // ConstantPointerRef value... unsigned Slot; if (read_vbr(Buf, EndBuf, Slot)) throw Error_readvbr; BCR_TRACE(4, "CPR: Type: '" << Ty << "' slot: " << Slot << "\n"); // Check to see if we have already read this global variable... Value *Val = getValue(PT, Slot, false); GlobalValue *GV; if (Val) { if (!(GV = dyn_cast(Val))) throw std::string("Value of ConstantPointerRef not in ValueTable!"); BCR_TRACE(5, "Value Found in ValueTable!\n"); } else if (RevisionNum > 0) { // Revision #0 could have forward references to globals that were weird. // We got rid of this in subsequent revs. throw std::string("Forward references to globals not allowed."); } else { // Nope... find or create a forward ref. for it GlobalRefsType::iterator I = GlobalRefs.find(std::make_pair(PT, Slot)); if (I != GlobalRefs.end()) { BCR_TRACE(5, "Previous forward ref found!\n"); GV = cast(I->second); } else { BCR_TRACE(5, "Creating new forward ref to a global variable!\n"); // Create a placeholder for the global variable reference... GlobalVariable *GVar = new GlobalVariable(PT->getElementType(), false, GlobalValue::InternalLinkage); // Keep track of the fact that we have a forward ref to recycle it GlobalRefs.insert(std::make_pair(std::make_pair(PT, Slot), GVar)); // Must temporarily push this value into the module table... TheModule->getGlobalList().push_back(GVar); GV = GVar; } } V = ConstantPointerRef::get(GV); break; } default: BCR_TRACE(5, "UNKNOWN Pointer Constant Type!\n"); throw std::string("Unknown pointer constant type."); } break; } default: std::cerr << __FILE__ << ":" << __LINE__ << ": Don't know how to deserialize constant value of type '" << Ty->getName() << "'\n"; throw std::string("Don't know how to deserialize constant value of type '"+ Ty->getName()); } } void BytecodeParser::ParseGlobalTypes(const unsigned char *&Buf, const unsigned char *EndBuf) { ValueTable T; ParseConstantPool(Buf, EndBuf, T, ModuleTypeValues); } void BytecodeParser::ParseConstantPool(const unsigned char *&Buf, const unsigned char *EndBuf, ValueTable &Tab, TypeValuesListTy &TypeTab) { while (Buf < EndBuf) { unsigned NumEntries, Typ; if (read_vbr(Buf, EndBuf, NumEntries) || read_vbr(Buf, EndBuf, Typ)) throw Error_readvbr; const Type *Ty = getType(Typ); if (Ty == 0) throw std::string("Invalid type read."); BCR_TRACE(3, "Type: '" << Ty << "' NumEntries: " << NumEntries << "\n"); if (Typ == Type::TypeTyID) { parseTypeConstants(Buf, EndBuf, TypeTab, NumEntries); } else { for (unsigned i = 0; i < NumEntries; ++i) { Constant *C; int Slot; parseConstantValue(Buf, EndBuf, Ty, C); assert(C && "parseConstantValue returned NULL!"); BCR_TRACE(4, "Read Constant: '" << *C << "'\n"); if ((Slot = insertValue(C, Tab)) == -1) throw std::string("Could not insert value into ValueTable."); // If we are reading a function constant table, make sure that we adjust // the slot number to be the real global constant number. // if (&Tab != &ModuleValues && Typ < ModuleValues.size()) Slot += ModuleValues[Typ]->size(); ResolveReferencesToValue(C, (unsigned)Slot); } } } if (Buf > EndBuf) throw std::string("Read past end of buffer."); }