mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2024-12-21 16:31:16 +00:00
539d8d8a72
- Adds support for sniffing PE/COFF files on win32 (.exe and .dll) which are COFF files that have an MS-DOS compatibility stub on the front of them. - Fixes a bug in the COFFObjectFile's support for the Microsoft COFF extension for long symbol names, wherein it was attempting to parse the leading '/' in an extended symbol name reference as part of the integer offset. - Fixes bugs in COFFObjectFile and ELFObjectFile wherein section and symbol iterators were being returned with uninitialized bytes; the type DataRefImpl is a union between 2 32-bit words (d.a and d.b) and a single intptr_t word (p). Only p was being initialized, so in 32-bit builds the result would be iterators with random upper 32-bit words in their DataRefImpls. This caused random failures when seeking around in object files. Patch by Graydon Hoare! git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@128799 91177308-0d34-0410-b5e6-96231b3b80d8
392 lines
12 KiB
C++
392 lines
12 KiB
C++
//===- COFFObjectFile.cpp - COFF object file implementation -----*- C++ -*-===//
|
|
//
|
|
// The LLVM Compiler Infrastructure
|
|
//
|
|
// This file is distributed under the University of Illinois Open Source
|
|
// License. See LICENSE.TXT for details.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file declares and implements the COFFObjectFile class.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "llvm/ADT/StringSwitch.h"
|
|
#include "llvm/ADT/Triple.h"
|
|
#include "llvm/Object/ObjectFile.h"
|
|
#include "llvm/Support/COFF.h"
|
|
#include "llvm/Support/Endian.h"
|
|
|
|
using namespace llvm;
|
|
using namespace object;
|
|
|
|
namespace {
|
|
using support::ulittle8_t;
|
|
using support::ulittle16_t;
|
|
using support::ulittle32_t;
|
|
using support::little16_t;
|
|
}
|
|
|
|
namespace {
|
|
struct coff_file_header {
|
|
ulittle16_t Machine;
|
|
ulittle16_t NumberOfSections;
|
|
ulittle32_t TimeDateStamp;
|
|
ulittle32_t PointerToSymbolTable;
|
|
ulittle32_t NumberOfSymbols;
|
|
ulittle16_t SizeOfOptionalHeader;
|
|
ulittle16_t Characteristics;
|
|
};
|
|
}
|
|
|
|
extern char coff_file_header_layout_static_assert
|
|
[sizeof(coff_file_header) == 20 ? 1 : -1];
|
|
|
|
namespace {
|
|
struct coff_symbol {
|
|
struct StringTableOffset {
|
|
ulittle32_t Zeroes;
|
|
ulittle32_t Offset;
|
|
};
|
|
|
|
union {
|
|
char ShortName[8];
|
|
StringTableOffset Offset;
|
|
} Name;
|
|
|
|
ulittle32_t Value;
|
|
little16_t SectionNumber;
|
|
|
|
struct {
|
|
ulittle8_t BaseType;
|
|
ulittle8_t ComplexType;
|
|
} Type;
|
|
|
|
ulittle8_t StorageClass;
|
|
ulittle8_t NumberOfAuxSymbols;
|
|
};
|
|
}
|
|
|
|
extern char coff_coff_symbol_layout_static_assert
|
|
[sizeof(coff_symbol) == 18 ? 1 : -1];
|
|
|
|
namespace {
|
|
struct coff_section {
|
|
char Name[8];
|
|
ulittle32_t VirtualSize;
|
|
ulittle32_t VirtualAddress;
|
|
ulittle32_t SizeOfRawData;
|
|
ulittle32_t PointerToRawData;
|
|
ulittle32_t PointerToRelocations;
|
|
ulittle32_t PointerToLinenumbers;
|
|
ulittle16_t NumberOfRelocations;
|
|
ulittle16_t NumberOfLinenumbers;
|
|
ulittle32_t Characteristics;
|
|
};
|
|
}
|
|
|
|
extern char coff_coff_section_layout_static_assert
|
|
[sizeof(coff_section) == 40 ? 1 : -1];
|
|
|
|
namespace {
|
|
class COFFObjectFile : public ObjectFile {
|
|
private:
|
|
uint64_t HeaderOff;
|
|
const coff_file_header *Header;
|
|
const coff_section *SectionTable;
|
|
const coff_symbol *SymbolTable;
|
|
const char *StringTable;
|
|
|
|
const coff_section *getSection(std::size_t index) const;
|
|
const char *getString(std::size_t offset) const;
|
|
|
|
protected:
|
|
virtual SymbolRef getSymbolNext(DataRefImpl Symb) const;
|
|
virtual StringRef getSymbolName(DataRefImpl Symb) const;
|
|
virtual uint64_t getSymbolAddress(DataRefImpl Symb) const;
|
|
virtual uint64_t getSymbolSize(DataRefImpl Symb) const;
|
|
virtual char getSymbolNMTypeChar(DataRefImpl Symb) const;
|
|
virtual bool isSymbolInternal(DataRefImpl Symb) const;
|
|
|
|
virtual SectionRef getSectionNext(DataRefImpl Sec) const;
|
|
virtual StringRef getSectionName(DataRefImpl Sec) const;
|
|
virtual uint64_t getSectionAddress(DataRefImpl Sec) const;
|
|
virtual uint64_t getSectionSize(DataRefImpl Sec) const;
|
|
virtual StringRef getSectionContents(DataRefImpl Sec) const;
|
|
virtual bool isSectionText(DataRefImpl Sec) const;
|
|
|
|
public:
|
|
COFFObjectFile(MemoryBuffer *Object);
|
|
virtual symbol_iterator begin_symbols() const;
|
|
virtual symbol_iterator end_symbols() const;
|
|
virtual section_iterator begin_sections() const;
|
|
virtual section_iterator end_sections() const;
|
|
|
|
virtual uint8_t getBytesInAddress() const;
|
|
virtual StringRef getFileFormatName() const;
|
|
virtual unsigned getArch() const;
|
|
};
|
|
} // end namespace
|
|
|
|
// Returns a reference to the symbol record that follows Symb in the table,
// stepping over any auxiliary records attached to Symb.
SymbolRef COFFObjectFile::getSymbolNext(DataRefImpl Symb) const {
  const coff_symbol *Current = reinterpret_cast<const coff_symbol*>(Symb.p);
  // One slot for the symbol itself plus NumberOfAuxSymbols trailing slots.
  const coff_symbol *Following = Current + (1 + Current->NumberOfAuxSymbols);
  Symb.p = reinterpret_cast<intptr_t>(Following);
  return SymbolRef(Symb, this);
}
|
|
|
|
// Returns the name of the symbol record referenced by Symb.
//
// A record whose first four name bytes are zero stores its name in the string
// table; otherwise the name is held inline in the 8-byte ShortName field.
// If a string table offset lies outside the table, an empty StringRef is
// returned.
StringRef COFFObjectFile::getSymbolName(DataRefImpl Symb) const {
  const coff_symbol *symb = reinterpret_cast<const coff_symbol*>(Symb.p);
  // Check for string table entry. First 4 bytes are 0.
  if (symb->Name.Offset.Zeroes == 0) {
    uint32_t Offset = symb->Name.Offset.Offset;
    // getString() yields a null pointer for an out-of-range offset; building
    // a StringRef from it would run strlen on null, so bail out first.
    const char *LongName = getString(Offset);
    if (!LongName)
      return StringRef();
    return StringRef(LongName);
  }

  if (symb->Name.ShortName[7] == 0)
    // Null terminated, let ::strlen figure out the length.
    return StringRef(symb->Name.ShortName);
  // Not null terminated, use all 8 bytes.
  return StringRef(symb->Name.ShortName, 8);
}
|
|
|
|
// Returns the address of the symbol referenced by Symb: its Value, offset by
// the VirtualAddress of its section when the section number maps to a table
// entry. Symbols typed 'U' or 'w' yield UnknownAddressOrSize.
uint64_t COFFObjectFile::getSymbolAddress(DataRefImpl Symb) const {
  const coff_symbol *Sym = reinterpret_cast<const coff_symbol*>(Symb.p);
  const coff_section *Home = getSection(Sym->SectionNumber);
  const uint32_t SymValue = Sym->Value;

  switch (getSymbolNMTypeChar(Symb)) {
  case 'U':
  case 'w':
    return UnknownAddressOrSize;
  default:
    break;
  }

  // No backing section: the raw value is all there is to report.
  if (!Home)
    return SymValue;
  return Home->VirtualAddress + SymValue;
}
|
|
|
|
// Returns an estimate of the size of the symbol referenced by Symb: the
// distance from the symbol's Value to the end of its section's raw data.
// Symbols typed 'U' or 'w' yield UnknownAddressOrSize; symbols without a
// section table entry yield 0.
uint64_t COFFObjectFile::getSymbolSize(DataRefImpl Symb) const {
  // FIXME: Return the correct size. This requires looking at all the symbols
  //        in the same section as this symbol, and looking for either the
  //        next symbol, or the end of the section.
  const coff_symbol *Sym = reinterpret_cast<const coff_symbol*>(Symb.p);
  const coff_section *Home = getSection(Sym->SectionNumber);
  const uint32_t SymValue = Sym->Value;

  const char Kind = getSymbolNMTypeChar(Symb);
  const bool Unresolved = (Kind == 'U') || (Kind == 'w');
  if (Unresolved)
    return UnknownAddressOrSize;

  if (!Home)
    return 0;
  return Home->SizeOfRawData - SymValue;
}
|
|
|
|
// Returns a single-character type code for the symbol referenced by Symb.
//
// Names starting with ".debug" or ".sxdata" are reported as 'N' outright.
// Otherwise the code is picked from the symbol's section number (undefined,
// absolute, debug) or, for ordinary sections, from the section's
// Characteristics flags. Symbols with external storage class get the
// upper-case form of the code, except weak externals, which are always 'w'.
// '?' is returned when nothing matches.
char COFFObjectFile::getSymbolNMTypeChar(DataRefImpl Symb) const {
  const coff_symbol *symb = reinterpret_cast<const coff_symbol*>(Symb.p);
  char ret = StringSwitch<char>(getSymbolName(Symb))
    .StartsWith(".debug", 'N')
    .StartsWith(".sxdata", 'N')
    .Default('?');

  if (ret != '?')
    return ret;

  // Flags of the owning section; stays 0 when the section number does not
  // map to a section table entry.
  uint32_t Characteristics = 0;
  if (const coff_section *Section = getSection(symb->SectionNumber))
    Characteristics = Section->Characteristics;

  switch (symb->SectionNumber) {
  case COFF::IMAGE_SYM_UNDEFINED:
    // Check storage classes.
    if (symb->StorageClass == COFF::IMAGE_SYM_CLASS_WEAK_EXTERNAL)
      return 'w'; // Don't do ::toupper.
    else
      ret = 'u';
    break;
  case COFF::IMAGE_SYM_ABSOLUTE:
    ret = 'a';
    break;
  case COFF::IMAGE_SYM_DEBUG:
    ret = 'n';
    break;
  default:
    // Check section type.
    if (Characteristics & COFF::IMAGE_SCN_CNT_CODE)
      ret = 't';
    else if (   Characteristics & COFF::IMAGE_SCN_MEM_READ
            && ~Characteristics & COFF::IMAGE_SCN_MEM_WRITE) // Read only.
      ret = 'r';
    else if (Characteristics & COFF::IMAGE_SCN_CNT_INITIALIZED_DATA)
      ret = 'd';
    else if (Characteristics & COFF::IMAGE_SCN_CNT_UNINITIALIZED_DATA)
      ret = 'b';
    else if (Characteristics & COFF::IMAGE_SCN_LNK_INFO)
      ret = 'i';

    // Check for section symbol.
    else if (  symb->StorageClass == COFF::IMAGE_SYM_CLASS_STATIC
            && symb->Value == 0)
      ret = 's';
  }

  if (symb->StorageClass == COFF::IMAGE_SYM_CLASS_EXTERNAL)
    ret = ::toupper(ret);

  return ret;
}
|
|
|
|
// Always answers false: this implementation does not inspect Symb and never
// classifies a symbol as internal.
bool COFFObjectFile::isSymbolInternal(DataRefImpl Symb) const {
  const bool Internal = false;
  return Internal;
}
|
|
|
|
// Returns a reference to the section table entry immediately after Sec.
SectionRef COFFObjectFile::getSectionNext(DataRefImpl Sec) const {
  const coff_section *Following =
    reinterpret_cast<const coff_section*>(Sec.p) + 1;
  Sec.p = reinterpret_cast<intptr_t>(Following);
  return SectionRef(Sec, this);
}
|
|
|
|
// Returns the name of the section table entry referenced by Sec.
//
// The 8-byte Name field either holds the name inline or holds '/' followed by
// a decimal offset into the string table. When the offset form cannot be
// resolved (the digits do not parse, or the offset lies outside the string
// table) the raw contents of the Name field are returned instead.
StringRef COFFObjectFile::getSectionName(DataRefImpl Sec) const {
  const coff_section *sec = reinterpret_cast<const coff_section*>(Sec.p);
  StringRef name;
  if (sec->Name[7] == 0)
    // Null terminated, let ::strlen figure out the length.
    name = sec->Name;
  else
    // Not null terminated, use all 8 bytes.
    name = StringRef(sec->Name, 8);

  // Check for string table entry. First byte is '/'.
  // An all-zero Name field gives an empty StringRef, which must not be
  // indexed.
  if (!name.empty() && name[0] == '/') {
    uint32_t Offset;
    // getAsInteger() returns true on failure and leaves Offset unset, so the
    // offset is only used when parsing succeeded.
    if (!name.substr(1).getAsInteger(10, Offset)) {
      // getString() yields a null pointer for an out-of-range offset.
      if (const char *LongName = getString(Offset))
        return StringRef(LongName);
    }
  }

  // It's just a normal name (or an unresolvable long-name reference).
  return name;
}
|
|
|
|
// Returns the VirtualAddress field of the section table entry referenced by
// Sec.
uint64_t COFFObjectFile::getSectionAddress(DataRefImpl Sec) const {
  const coff_section *Entry = reinterpret_cast<const coff_section*>(Sec.p);
  const uint32_t Address = Entry->VirtualAddress;
  return Address;
}
|
|
|
|
// Returns the SizeOfRawData field of the section table entry referenced by
// Sec.
uint64_t COFFObjectFile::getSectionSize(DataRefImpl Sec) const {
  const coff_section *Entry = reinterpret_cast<const coff_section*>(Sec.p);
  const uint32_t RawSize = Entry->SizeOfRawData;
  return RawSize;
}
|
|
|
|
// Returns a view of the raw bytes of the section referenced by Sec: the
// SizeOfRawData bytes located PointerToRawData bytes past the start of the
// buffer. No bounds check is made against the buffer size.
StringRef COFFObjectFile::getSectionContents(DataRefImpl Sec) const {
  const coff_section *Entry = reinterpret_cast<const coff_section*>(Sec.p);
  const char *Begin =
    reinterpret_cast<const char *>(base + Entry->PointerToRawData);
  return StringRef(Begin, Entry->SizeOfRawData);
}
|
|
|
|
// Reports whether the section referenced by Sec has the
// COFF::IMAGE_SCN_CNT_CODE flag set in its Characteristics.
bool COFFObjectFile::isSectionText(DataRefImpl Sec) const {
  const coff_section *Entry = reinterpret_cast<const coff_section*>(Sec.p);
  return (Entry->Characteristics & COFF::IMAGE_SCN_CNT_CODE) != 0;
}
|
|
|
|
// Locates the COFF file header, section table, symbol table and string table
// inside the buffer. All pointers are computed from offsets stored in the
// file; none of them is validated against the buffer size.
COFFObjectFile::COFFObjectFile(MemoryBuffer *Object)
  : ObjectFile(Object) {

  // A buffer starting with the bytes 0x4d 0x5a ("MZ") is a PE/COFF image:
  // the 32-bit value at 0x3c locates the 4-byte PE signature, and the
  // 'normal' COFF header comes right after that signature.
  const bool HasDosStub = (base[0] == 0x4d) && (base[1] == 0x5a);
  HeaderOff = 0;
  if (HasDosStub) {
    const uint32_t SignatureOff =
      *reinterpret_cast<const ulittle32_t *>(base + 0x3c);
    HeaderOff += SignatureOff;
    HeaderOff += 4;
  }

  Header = reinterpret_cast<const coff_file_header *>(base + HeaderOff);

  // The section table sits after the file header and the optional header.
  const char *AfterHeader =
    reinterpret_cast<const char *>(Header) + sizeof(coff_file_header);
  SectionTable = reinterpret_cast<const coff_section *>(
    AfterHeader + Header->SizeOfOptionalHeader);

  SymbolTable =
    reinterpret_cast<const coff_symbol *>(base + Header->PointerToSymbolTable);

  // Find string table: it begins where the symbol table ends, and every
  // symbol record occupies 18 bytes.
  StringTable = reinterpret_cast<const char *>(SymbolTable)
              + Header->NumberOfSymbols * 18;
}
|
|
|
|
// Returns an iterator positioned at the first record of the symbol table.
ObjectFile::symbol_iterator COFFObjectFile::begin_symbols() const {
  DataRefImpl First;
  // Zero the whole object before setting p, so that no byte of it is left
  // uninitialized.
  memset(&First, 0, sizeof(First));
  First.p = reinterpret_cast<intptr_t>(SymbolTable);
  return symbol_iterator(SymbolRef(First, this));
}
|
|
|
|
// Returns the past-the-end iterator for the symbol table.
ObjectFile::symbol_iterator COFFObjectFile::end_symbols() const {
  DataRefImpl Last;
  // Zero the whole object before setting p, so that no byte of it is left
  // uninitialized.
  memset(&Last, 0, sizeof(Last));
  // The symbol table ends where the string table begins.
  Last.p = reinterpret_cast<intptr_t>(StringTable);
  return symbol_iterator(SymbolRef(Last, this));
}
|
|
|
|
// Returns an iterator positioned at the first entry of the section table.
ObjectFile::section_iterator COFFObjectFile::begin_sections() const {
  DataRefImpl First;
  // Zero the whole object before setting p, so that no byte of it is left
  // uninitialized.
  memset(&First, 0, sizeof(First));
  First.p = reinterpret_cast<intptr_t>(SectionTable);
  return section_iterator(SectionRef(First, this));
}
|
|
|
|
// Returns the past-the-end iterator for the section table, i.e. the position
// NumberOfSections entries after its start.
ObjectFile::section_iterator COFFObjectFile::end_sections() const {
  DataRefImpl Last;
  // Zero the whole object before setting p, so that no byte of it is left
  // uninitialized.
  memset(&Last, 0, sizeof(Last));
  const coff_section *TableEnd = SectionTable + Header->NumberOfSections;
  Last.p = reinterpret_cast<intptr_t>(TableEnd);
  return section_iterator(SectionRef(Last, this));
}
|
|
|
|
uint8_t COFFObjectFile::getBytesInAddress() const {
|
|
return getArch() == Triple::x86_64 ? 8 : 4;
|
|
}
|
|
|
|
// Returns a fixed display name for the file format, chosen by the header's
// Machine field.
StringRef COFFObjectFile::getFileFormatName() const {
  const uint16_t Machine = Header->Machine;
  if (Machine == COFF::IMAGE_FILE_MACHINE_I386)
    return "COFF-i386";
  if (Machine == COFF::IMAGE_FILE_MACHINE_AMD64)
    return "COFF-x86-64";
  return "COFF-<unknown arch>";
}
|
|
|
|
unsigned COFFObjectFile::getArch() const {
|
|
switch(Header->Machine) {
|
|
case COFF::IMAGE_FILE_MACHINE_I386:
|
|
return Triple::x86;
|
|
case COFF::IMAGE_FILE_MACHINE_AMD64:
|
|
return Triple::x86_64;
|
|
default:
|
|
return Triple::UnknownArch;
|
|
}
|
|
}
|
|
|
|
// Looks up a section table entry by its 1-based section number. Returns 0
// for index 0 and for any index past NumberOfSections.
const coff_section *COFFObjectFile::getSection(std::size_t index) const {
  const bool OutOfRange = (index == 0) || (index > Header->NumberOfSections);
  if (OutOfRange)
    return 0;
  // Section numbers start at 1; the table itself is 0-based.
  return SectionTable + (index - 1);
}
|
|
|
|
const char *COFFObjectFile::getString(std::size_t offset) const {
|
|
const ulittle32_t *StringTableSize =
|
|
reinterpret_cast<const ulittle32_t *>(StringTable);
|
|
if (offset < *StringTableSize)
|
|
return StringTable + offset;
|
|
return 0;
|
|
}
|
|
|
|
namespace llvm {
|
|
|
|
ObjectFile *ObjectFile::createCOFFObjectFile(MemoryBuffer *Object) {
|
|
return new COFFObjectFile(Object);
|
|
}
|
|
|
|
} // end namespace llvm
|