2004-11-06 08:51:45 +00:00
|
|
|
//===-- Archive.cpp - Generic LLVM archive functions ------------*- C++ -*-===//
|
2005-04-21 21:13:18 +00:00
|
|
|
//
|
2004-11-06 08:51:45 +00:00
|
|
|
// The LLVM Compiler Infrastructure
|
|
|
|
//
|
2005-04-21 21:13:18 +00:00
|
|
|
// This file was developed by Reid Spencer and is distributed under the
|
2004-11-06 08:51:45 +00:00
|
|
|
// University of Illinois Open Source License. See LICENSE.TXT for details.
|
2005-04-21 21:13:18 +00:00
|
|
|
//
|
2004-11-06 08:51:45 +00:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
//
|
2004-11-14 21:56:59 +00:00
|
|
|
// This file contains the implementation of the Archive and ArchiveMember
|
|
|
|
// classes that is common to both reading and writing archives.
|
2004-11-06 08:51:45 +00:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#include "ArchiveInternals.h"
|
2004-11-14 21:56:59 +00:00
|
|
|
#include "llvm/ModuleProvider.h"
|
2007-02-07 23:53:17 +00:00
|
|
|
#include "llvm/Module.h"
|
|
|
|
#include "llvm/Bytecode/Reader.h"
|
2005-04-21 17:49:57 +00:00
|
|
|
#include "llvm/System/Process.h"
|
2004-11-06 08:51:45 +00:00
|
|
|
using namespace llvm;
|
|
|
|
|
2004-11-14 21:56:59 +00:00
|
|
|
// getMemberSize - compute the actual physical size of the file member as seen
|
|
|
|
// on disk. This isn't the size of member's payload. Use getSize() for that.
|
|
|
|
unsigned
|
|
|
|
ArchiveMember::getMemberSize() const {
|
|
|
|
// Basically its the file size plus the header size
|
|
|
|
unsigned result = info.fileSize + sizeof(ArchiveMemberHeader);
|
|
|
|
|
|
|
|
// If it has a long filename, include the name length
|
|
|
|
if (hasLongFilename())
|
2004-12-11 00:14:15 +00:00
|
|
|
result += path.toString().length() + 1;
|
2004-11-14 21:56:59 +00:00
|
|
|
|
|
|
|
// If its now odd lengthed, include the padding byte
|
2005-04-21 21:13:18 +00:00
|
|
|
if (result % 2 != 0 )
|
2004-11-14 21:56:59 +00:00
|
|
|
result++;
|
|
|
|
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
|
|
|
// This default constructor is only use by the ilist when it creates its
|
|
|
|
// sentry node. We give it specific static values to make it stand out a bit.
|
2005-04-21 21:13:18 +00:00
|
|
|
ArchiveMember::ArchiveMember()
|
2006-05-06 23:25:53 +00:00
|
|
|
: next(0), prev(0), parent(0), path("--invalid--"), flags(0), data(0)
|
2004-11-14 21:56:59 +00:00
|
|
|
{
|
2005-04-21 17:49:57 +00:00
|
|
|
info.user = sys::Process::GetCurrentUserId();
|
2005-04-21 21:13:18 +00:00
|
|
|
info.group = sys::Process::GetCurrentGroupId();
|
|
|
|
info.mode = 0777;
|
|
|
|
info.fileSize = 0;
|
2004-11-14 21:56:59 +00:00
|
|
|
info.modTime = sys::TimeValue::now();
|
|
|
|
}
|
|
|
|
|
|
|
|
// This is the constructor that the Archive class uses when it is building or
|
|
|
|
// reading an archive. It just defaults a few things and ensures the parent is
|
2005-04-21 21:13:18 +00:00
|
|
|
// set for the iplist. The Archive class fills in the ArchiveMember's data.
|
|
|
|
// This is required because correctly setting the data may depend on other
|
2004-11-14 21:56:59 +00:00
|
|
|
// things in the Archive.
|
|
|
|
ArchiveMember::ArchiveMember(Archive* PAR)
|
|
|
|
: next(0), prev(0), parent(PAR), path(), flags(0), data(0)
|
|
|
|
{
|
|
|
|
}
|
|
|
|
|
2005-04-21 21:13:18 +00:00
|
|
|
// This method allows an ArchiveMember to be replaced with the data for a
|
2004-11-14 21:56:59 +00:00
|
|
|
// different file, presumably as an update to the member. It also makes sure
|
|
|
|
// the flags are reset correctly.
|
2006-08-24 23:45:08 +00:00
|
|
|
bool ArchiveMember::replaceWith(const sys::Path& newFile, std::string* ErrMsg) {
|
2006-12-15 19:44:51 +00:00
|
|
|
if (!newFile.exists()) {
|
|
|
|
if (ErrMsg)
|
|
|
|
*ErrMsg = "Can not replace an archive member with a non-existent file";
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2004-11-14 21:56:59 +00:00
|
|
|
data = 0;
|
|
|
|
path = newFile;
|
|
|
|
|
2004-11-20 07:29:40 +00:00
|
|
|
// SVR4 symbol tables have an empty name
|
2004-12-11 00:14:15 +00:00
|
|
|
if (path.toString() == ARFILE_SVR4_SYMTAB_NAME)
|
2004-11-20 07:29:40 +00:00
|
|
|
flags |= SVR4SymbolTableFlag;
|
2004-11-14 21:56:59 +00:00
|
|
|
else
|
2004-11-20 07:29:40 +00:00
|
|
|
flags &= ~SVR4SymbolTableFlag;
|
|
|
|
|
|
|
|
// BSD4.4 symbol tables have a special name
|
2004-12-11 00:14:15 +00:00
|
|
|
if (path.toString() == ARFILE_BSD4_SYMTAB_NAME)
|
2004-11-20 07:29:40 +00:00
|
|
|
flags |= BSD4SymbolTableFlag;
|
|
|
|
else
|
|
|
|
flags &= ~BSD4SymbolTableFlag;
|
2004-11-14 21:56:59 +00:00
|
|
|
|
|
|
|
// LLVM symbol tables have a very specific name
|
2004-12-11 00:14:15 +00:00
|
|
|
if (path.toString() == ARFILE_LLVM_SYMTAB_NAME)
|
2004-11-14 21:56:59 +00:00
|
|
|
flags |= LLVMSymbolTableFlag;
|
|
|
|
else
|
|
|
|
flags &= ~LLVMSymbolTableFlag;
|
|
|
|
|
|
|
|
// String table name
|
2004-12-11 00:14:15 +00:00
|
|
|
if (path.toString() == ARFILE_STRTAB_NAME)
|
2004-11-14 21:56:59 +00:00
|
|
|
flags |= StringTableFlag;
|
|
|
|
else
|
|
|
|
flags &= ~StringTableFlag;
|
|
|
|
|
|
|
|
// If it has a slash then it has a path
|
2004-12-11 00:14:15 +00:00
|
|
|
bool hasSlash = path.toString().find('/') != std::string::npos;
|
2004-11-14 21:56:59 +00:00
|
|
|
if (hasSlash)
|
|
|
|
flags |= HasPathFlag;
|
|
|
|
else
|
|
|
|
flags &= ~HasPathFlag;
|
|
|
|
|
|
|
|
// If it has a slash or its over 15 chars then its a long filename format
|
2004-12-11 00:14:15 +00:00
|
|
|
if (hasSlash || path.toString().length() > 15)
|
2004-11-14 21:56:59 +00:00
|
|
|
flags |= HasLongFilenameFlag;
|
|
|
|
else
|
|
|
|
flags &= ~HasLongFilenameFlag;
|
|
|
|
|
|
|
|
// Get the signature and status info
|
|
|
|
const char* signature = (const char*) data;
|
2006-07-28 22:03:44 +00:00
|
|
|
std::string magic;
|
2004-11-14 21:56:59 +00:00
|
|
|
if (!signature) {
|
|
|
|
path.getMagicNumber(magic,4);
|
|
|
|
signature = magic.c_str();
|
2006-07-28 22:03:44 +00:00
|
|
|
std::string err;
|
2007-04-07 19:45:30 +00:00
|
|
|
const sys::FileStatus *FSinfo =
|
|
|
|
sys::PathWithStatus(path).getFileStatus(false, ErrMsg);
|
2007-03-29 19:05:44 +00:00
|
|
|
if (FSinfo)
|
|
|
|
info = *FSinfo;
|
|
|
|
else
|
2006-08-24 23:45:08 +00:00
|
|
|
return true;
|
2004-11-14 21:56:59 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Determine what kind of file it is
|
|
|
|
switch (sys::IdentifyFileType(signature,4)) {
|
2007-04-04 06:31:04 +00:00
|
|
|
case sys::Bytecode_FileType:
|
2004-11-14 21:56:59 +00:00
|
|
|
flags |= BytecodeFlag;
|
|
|
|
break;
|
2007-04-04 06:31:04 +00:00
|
|
|
case sys::CompressedBytecode_FileType:
|
2004-11-14 21:56:59 +00:00
|
|
|
flags |= CompressedBytecodeFlag;
|
|
|
|
flags &= ~CompressedFlag;
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
flags &= ~(BytecodeFlag|CompressedBytecodeFlag);
|
|
|
|
break;
|
|
|
|
}
|
2006-08-24 23:45:08 +00:00
|
|
|
return false;
|
2004-11-14 21:56:59 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Archive constructor - this is the only constructor that gets used for the
|
2005-04-21 21:13:18 +00:00
|
|
|
// Archive class. Everything else (default,copy) is deprecated. This just
|
2004-11-14 21:56:59 +00:00
|
|
|
// initializes and maps the file into memory, if requested.
|
2007-02-07 21:41:02 +00:00
|
|
|
Archive::Archive(const sys::Path& filename, BCDecompressor_t *BCDC)
|
2004-11-16 06:47:07 +00:00
|
|
|
: archPath(filename), members(), mapfile(0), base(0), symTab(), strtab(),
|
2007-02-07 21:41:02 +00:00
|
|
|
symTabSize(0), firstFileOffset(0), modules(), foreignST(0),
|
|
|
|
Decompressor(BCDC) {
|
2006-08-24 23:45:08 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
bool
|
|
|
|
Archive::mapToMemory(std::string* ErrMsg)
|
|
|
|
{
|
|
|
|
mapfile = new sys::MappedFile();
|
|
|
|
if (mapfile->open(archPath, sys::MappedFile::READ_ACCESS, ErrMsg))
|
|
|
|
return true;
|
|
|
|
if (!(base = (char*) mapfile->map(ErrMsg)))
|
|
|
|
return true;
|
|
|
|
return false;
|
2004-11-06 08:51:45 +00:00
|
|
|
}
|
|
|
|
|
2005-11-30 05:21:10 +00:00
|
|
|
void Archive::cleanUpMemory() {
|
2004-11-14 21:56:59 +00:00
|
|
|
// Shutdown the file mapping
|
|
|
|
if (mapfile) {
|
2005-01-28 01:17:07 +00:00
|
|
|
mapfile->close();
|
2004-11-14 21:56:59 +00:00
|
|
|
delete mapfile;
|
2005-11-30 05:21:10 +00:00
|
|
|
|
|
|
|
mapfile = 0;
|
|
|
|
base = 0;
|
2004-11-14 21:56:59 +00:00
|
|
|
}
|
2005-11-30 05:21:10 +00:00
|
|
|
|
|
|
|
// Forget the entire symbol table
|
|
|
|
symTab.clear();
|
|
|
|
symTabSize = 0;
|
|
|
|
|
|
|
|
firstFileOffset = 0;
|
|
|
|
|
|
|
|
// Free the foreign symbol table member
|
|
|
|
if (foreignST) {
|
|
|
|
delete foreignST;
|
|
|
|
foreignST = 0;
|
|
|
|
}
|
|
|
|
|
2004-11-14 21:56:59 +00:00
|
|
|
// Delete any ModuleProviders and ArchiveMember's we've allocated as a result
|
|
|
|
// of symbol table searches.
|
|
|
|
for (ModuleMap::iterator I=modules.begin(), E=modules.end(); I != E; ++I ) {
|
|
|
|
delete I->second.first;
|
|
|
|
delete I->second.second;
|
|
|
|
}
|
2004-11-06 08:51:45 +00:00
|
|
|
}
|
|
|
|
|
2005-11-30 05:21:10 +00:00
|
|
|
// Archive destructor - just clean up memory
|
|
|
|
Archive::~Archive() {
|
|
|
|
cleanUpMemory();
|
|
|
|
}
|
|
|
|
|
2007-02-07 23:53:17 +00:00
|
|
|
|
|
|
|
|
|
|
|
// getSymbols - Append to 'symbols' the name of every global variable and then
// every function in M that is not a mere declaration, does not have internal
// linkage, and has a non-empty name.
static void getSymbols(Module*M, std::vector<std::string>& symbols) {
  // Global variables come first.
  Module::global_iterator Var = M->global_begin();
  Module::global_iterator VarEnd = M->global_end();
  for (; Var != VarEnd; ++Var) {
    if (Var->isDeclaration() || Var->hasInternalLinkage())
      continue;
    if (Var->getName().empty())
      continue;
    symbols.push_back(Var->getName());
  }

  // Functions follow, filtered by the same three tests.
  Module::iterator Fn = M->begin();
  Module::iterator FnEnd = M->end();
  for (; Fn != FnEnd; ++Fn) {
    if (Fn->isDeclaration() || Fn->hasInternalLinkage())
      continue;
    if (Fn->getName().empty())
      continue;
    symbols.push_back(Fn->getName());
  }
}
|
|
|
|
|
|
|
|
// Get just the externally visible defined symbols from the bytecode
|
|
|
|
bool llvm::GetBytecodeSymbols(const sys::Path& fName,
|
|
|
|
std::vector<std::string>& symbols,
|
|
|
|
BCDecompressor_t *BCDC,
|
|
|
|
std::string* ErrMsg) {
|
|
|
|
ModuleProvider *MP = getBytecodeModuleProvider(fName.toString(), BCDC,ErrMsg);
|
|
|
|
if (!MP)
|
|
|
|
return true;
|
|
|
|
|
|
|
|
// Get the module from the provider
|
|
|
|
Module* M = MP->materializeModule();
|
|
|
|
if (M == 0) {
|
|
|
|
delete MP;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Get the symbols
|
|
|
|
getSymbols(M, symbols);
|
|
|
|
|
|
|
|
// Done with the module.
|
|
|
|
delete MP;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Collect the externally visible defined symbols from bytecode held in a
// memory buffer and append them to 'symbols'. Returns 0 if the module provider
// cannot be created or the module cannot be materialized; otherwise returns
// the ModuleProvider, which the caller is responsible for deleting.
ModuleProvider*
llvm::GetBytecodeSymbols(const unsigned char*Buffer, unsigned Length,
                         const std::string& ModuleID,
                         std::vector<std::string>& symbols,
                         BCDecompressor_t *BCDC,
                         std::string* ErrMsg) {
  // Wrap the buffer in a module provider.
  ModuleProvider* Provider =
    getBytecodeBufferModuleProvider(Buffer, Length, ModuleID, BCDC, ErrMsg, 0);
  if (Provider == 0)
    return 0;

  // Materialize the module; on success harvest its symbols and hand the
  // provider back to the caller.
  if (Module* Mod = Provider->materializeModule()) {
    getSymbols(Mod, symbols);

    // Per the original note, the ModuleProvider deletes the Module when the
    // provider itself is deleted, so only the provider is returned.
    return Provider;
  }

  // Materialization failed: the provider is of no use to the caller.
  delete Provider;
  return 0;
}
|