Hemant Kulkarni 2217577fa7 Added program header emission
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@168195 91177308-0d34-0410-b5e6-96231b3b80d8
2012-11-16 20:51:32 +00:00

286 lines
10 KiB
Python
Executable File

#!/usr/bin/env python
import struct
import sys
import StringIO
import common_dump
class Reader:
    """Seekable, endian-aware reader over the raw bytes of an ELF image.

    Each fixed-width reader returns a ``(value, bits)`` tuple so the field
    width travels with the value.

    Attributes (expected to be filled in by the caller once known):
      file    -- underlying seekable file object.
      isLSB   -- True for little-endian data, False for big-endian.  While
                 it is still None the multi-byte readers raise TypeError.
      is64Bit -- True when readWord() should read 64 bits instead of 32.
      isN64   -- plain flag stored for callers; not used by Reader itself.
    """

    def __init__(self, path):
        """Open `path` for binary reading; "-" means standard input."""
        if path == "-":
            # Snarf all the data so we can seek.
            self.file = StringIO.StringIO(sys.stdin.read())
        else:
            self.file = open(path, "rb")
        self.isLSB = None
        self.is64Bit = None
        self.isN64 = False

    def seek(self, pos):
        """Move the read position to absolute offset `pos`."""
        self.file.seek(pos)

    def read(self, N):
        """Return exactly `N` bytes; raise ValueError if fewer remain."""
        data = self.file.read(N)
        if len(data) != N:
            raise ValueError("Out of data!")
        return data

    def _readInt(self, code, nbytes):
        """Read an unsigned integer with struct code `code` of `nbytes` bytes."""
        # '><'[False] is '>' (big-endian); '><'[True] is '<' (little-endian).
        fmt = '><'[self.isLSB] + code
        return (struct.unpack(fmt, self.read(nbytes))[0], nbytes * 8)

    def read8(self):
        """Read one byte as ``(value, 8)``."""
        return (ord(self.read(1)), 8)

    def read16(self):
        """Read an unsigned 16-bit integer as ``(value, 16)``."""
        return self._readInt('H', 2)

    def read32(self):
        """Read an unsigned 32-bit integer as ``(value, 32)``."""
        return self._readInt('I', 4)

    def read64(self):
        """Read an unsigned 64-bit integer as ``(value, 64)``."""
        return self._readInt('Q', 8)

    def readWord(self):
        """Read a 64-bit value when is64Bit is true, else a 32-bit value."""
        if self.is64Bit:
            return self.read64()
        return self.read32()
class StringTable:
    """Table of NUL-terminated strings addressed by starting offset."""

    def __init__(self, strings):
        # Raw table contents, kept exactly as handed in.
        self.string_table = strings

    def __getitem__(self, index):
        """Return the text from `index` up to (not including) the next NUL.

        Raises ValueError when no NUL follows `index`.
        """
        table = self.string_table
        terminator = table.index('\x00', index)
        return table[index:terminator]
class ProgramHeader:
    """One ELF program header, read from the reader's current position.

    Every ``p_*`` attribute stores what the reader returned for that field
    (a ``(value, bits)`` tuple when given this file's Reader).
    """

    def __init__(self, f):
        """Read the header fields from `f` in on-disk order.

        p_flags sits right after p_type when `f.is64Bit` is true, and
        between p_memsz and p_align otherwise.
        """
        self.p_type = f.read32()
        if f.is64Bit:
            self.p_flags = f.read32()
        self.p_offset = f.readWord()
        self.p_vaddr = f.readWord()
        self.p_paddr = f.readWord()
        self.p_filesz = f.readWord()
        self.p_memsz = f.readWord()
        if not f.is64Bit:
            self.p_flags = f.read32()
        self.p_align = f.readWord()

    def dump(self):
        """Print the header as one tuple-of-pairs entry on stdout."""
        # Parenthesised single-argument print gives the same output under
        # Python 2's print statement and also parses on Python 3.
        print(" (('p_type', %s)" % common_dump.HexDump(self.p_type))
        # Output order is fixed (p_flags always second), independent of the
        # order in which the fields were read.
        for field in ('p_flags', 'p_offset', 'p_vaddr', 'p_paddr',
                      'p_filesz', 'p_memsz', 'p_align'):
            print(" ('%s', %s)" % (field,
                                   common_dump.HexDump(getattr(self, field))))
        print(" ),")
class Section:
    """One ELF section header, read from the reader's current position.

    Every ``sh_*`` attribute stores what the reader returned for that field
    (a ``(value, bits)`` tuple when given this file's Reader), so the raw
    number is element ``[0]``.
    """

    def __init__(self, f):
        """Read the ten section-header fields from `f` in on-disk order."""
        self.sh_name = f.read32()
        self.sh_type = f.read32()
        self.sh_flags = f.readWord()
        self.sh_addr = f.readWord()
        self.sh_offset = f.readWord()
        self.sh_size = f.readWord()
        self.sh_link = f.read32()
        self.sh_info = f.read32()
        self.sh_addralign = f.readWord()
        self.sh_entsize = f.readWord()

    def _hasFileContents(self):
        """Return False for SHT_NOBITS (type 8) sections, True otherwise."""
        # sh_type is a (value, bits) tuple: comparing the tuple itself with 8
        # is always "not equal", so the numeric value must be compared.
        return self.sh_type[0] != 8

    def dump(self, shstrtab, f, strtab, dumpdata):
        """Print this section header, plus its contents where applicable.

        shstrtab -- string table indexed by sh_name to annotate the name.
        f        -- reader used to fetch symbols, relocations or raw data.
        strtab   -- string table passed on to dumpSymtab for symbol names.
        dumpdata -- when true, sections that are neither symbol tables nor
                    relocation tables also get a '_section_data' entry.
        """
        # Parenthesised single-argument print gives the same output under
        # Python 2's print statement and also parses on Python 3.
        name_field = " (('sh_name', %s)" % common_dump.HexDump(self.sh_name)
        name_note = "# %r" % shstrtab[self.sh_name[0]]
        print(name_field + " " + name_note)
        for field in ('sh_type', 'sh_flags', 'sh_addr', 'sh_offset',
                      'sh_size', 'sh_link', 'sh_info', 'sh_addralign',
                      'sh_entsize'):
            print(" ('%s', %s)" % (field,
                                   common_dump.HexDump(getattr(self, field))))

        sh_type = self.sh_type[0]
        if sh_type == 2: # SHT_SYMTAB
            print(" ('_symbols', [")
            dumpSymtab(f, self, strtab)
            print(" ])")
        elif sh_type in (4, 9): # SHT_RELA / SHT_REL
            print(" ('_relocations', [")
            dumpRel(f, self, sh_type == 4)
            print(" ])")
        elif dumpdata:
            if self._hasFileContents():
                f.seek(self.sh_offset[0])
                data = f.read(self.sh_size[0])
                print(" ('_section_data', '%s')" % common_dump.dataToHex(data))
            else:
                # SHT_NOBITS: emit an empty payload instead of reading
                # sh_size bytes from the file.
                print(" ('_section_data', '')")
        print(" ),")
def dumpSymtab(f, section, strtab):
    """Print every symbol-table entry stored in `section`.

    f       -- reader positioned by this function at each entry in turn.
    section -- section header supplying sh_offset, sh_size and sh_entsize
               as (value, bits) tuples.
    strtab  -- string table indexed by st_name to annotate symbol names.

    The number of entries is sh_size // sh_entsize.  When `f.is64Bit` is
    false, st_value and st_size are read right after st_name; otherwise
    they are read after st_shndx, as 64-bit values.
    """
    # Loop-invariant header values, fetched once.
    table_start = section.sh_offset[0]
    entry_size = section.sh_entsize[0]
    entries = section.sh_size[0] // entry_size

    # Parenthesised single-argument print gives the same output under
    # Python 2's print statement and also parses on Python 3.
    for index in range(entries):
        f.seek(table_start + index * entry_size)
        print(" # Symbol %s" % index)

        name = f.read32()
        name_field = " (('st_name', %s)" % common_dump.HexDump(name)
        name_note = "# %r" % strtab[name[0]]
        print(name_field + " " + name_note)

        if not f.is64Bit:
            print(" ('st_value', %s)" % common_dump.HexDump(f.read32()))
            print(" ('st_size', %s)" % common_dump.HexDump(f.read32()))

        # st_info packs the binding in the high nibble, the type in the low.
        st_info = f.read8()[0]
        st_bind = (st_info >> 4, 4)
        st_type = (st_info & 0xf, 4)
        print(" ('st_bind', %s)" % common_dump.HexDump(st_bind))
        print(" ('st_type', %s)" % common_dump.HexDump(st_type))
        print(" ('st_other', %s)" % common_dump.HexDump(f.read8()))
        print(" ('st_shndx', %s)" % common_dump.HexDump(f.read16()))

        if f.is64Bit:
            print(" ('st_value', %s)" % common_dump.HexDump(f.read64()))
            print(" ('st_size', %s)" % common_dump.HexDump(f.read64()))
        print(" ),")
def dumpRel(f, section, dumprela = False):
    """Print every relocation entry stored in `section`.

    f        -- reader positioned by this function at each entry in turn.
    section  -- section header supplying sh_offset, sh_size and sh_entsize
                as (value, bits) tuples.
    dumprela -- when true, an extra word is read after the info field and
                printed as r_addend.

    The number of entries is sh_size // sh_entsize.
    """
    # Loop-invariant header values, fetched once.
    table_start = section.sh_offset[0]
    entry_size = section.sh_entsize[0]
    entries = section.sh_size[0] // entry_size

    # Parenthesised single-argument print gives the same output under
    # Python 2's print statement and also parses on Python 3.
    for index in range(entries):
        f.seek(table_start + index * entry_size)
        print(" # Relocation %s" % index)
        print(" (('r_offset', %s)" % common_dump.HexDump(f.readWord()))

        if f.isN64:
            # With isN64 set, the info area is read as a 32-bit symbol index
            # followed by four single-byte fields, in this file order.
            r_sym = f.read32()
            r_ssym = f.read8()
            r_type3 = f.read8()
            r_type2 = f.read8()
            r_type = f.read8()
            for label, field in (('r_sym', r_sym), ('r_ssym', r_ssym),
                                 ('r_type3', r_type3), ('r_type2', r_type2),
                                 ('r_type', r_type)):
                print(" ('%s', %s)" % (label, common_dump.HexDump(field)))
        else:
            r_info = f.readWord()[0]
            if f.is64Bit:
                # 64-bit: symbol in the upper 32 bits, type in the lower 32.
                r_sym = (r_info >> 32, 32)
                r_type = (r_info & 0xffffffff, 32)
            else:
                # 32-bit: symbol in the upper 24 bits, type in the low byte.
                r_sym = (r_info >> 8, 24)
                r_type = (r_info & 0xff, 8)
            print(" ('r_sym', %s)" % common_dump.HexDump(r_sym))
            print(" ('r_type', %s)" % common_dump.HexDump(r_type))

        if dumprela:
            print(" ('r_addend', %s)" % common_dump.HexDump(f.readWord()))
        print(" ),")
def dumpELF(path, opts):
    """Dump the ELF file at `path` ("-" for standard input) to stdout.

    path -- file name handed to Reader.
    opts -- options object; `opts.dumpSectionData` is forwarded to every
            section's dump() call.

    Raises ValueError when the magic bytes, file class or byte ordering
    are not recognised.
    """
    f = Reader(path)
    try:
        _dumpELFContents(f, opts)
    finally:
        # Reader offers no close(); release its underlying file directly so
        # dumping many files does not accumulate open handles.
        f.file.close()


def _dumpELFContents(f, opts):
    """Parse the ELF image behind reader `f` and print its dump."""
    # Parenthesised single-argument print gives the same output under
    # Python 2's print statement and also parses on Python 3.
    magic = f.read(4)
    # Explicit check instead of assert: asserts are stripped by "python -O".
    if magic != '\x7FELF':
        raise ValueError("Not an ELF file (bad magic %r)" % (magic,))

    fileclass = f.read8()
    if fileclass[0] == 1: # ELFCLASS32
        f.is64Bit = False
    elif fileclass[0] == 2: # ELFCLASS64
        f.is64Bit = True
    else:
        raise ValueError("Unknown file class %s" % common_dump.HexDump(fileclass))
    print("('e_indent[EI_CLASS]', %s)" % common_dump.HexDump(fileclass))

    byteordering = f.read8()
    if byteordering[0] == 1: # ELFDATA2LSB
        f.isLSB = True
    elif byteordering[0] == 2: # ELFDATA2MSB
        f.isLSB = False
    else:
        raise ValueError("Unknown byte ordering %s" % common_dump.HexDump(byteordering))
    print("('e_indent[EI_DATA]', %s)" % common_dump.HexDump(byteordering))

    print("('e_indent[EI_VERSION]', %s)" % common_dump.HexDump(f.read8()))
    print("('e_indent[EI_OSABI]', %s)" % common_dump.HexDump(f.read8()))
    print("('e_indent[EI_ABIVERSION]', %s)" % common_dump.HexDump(f.read8()))

    f.seek(16) # Seek to end of e_ident.

    print("('e_type', %s)" % common_dump.HexDump(f.read16()))

    # Does any other architecture use N64?
    e_machine = f.read16()
    if e_machine[0] == 0x0008 and f.is64Bit: # EM_MIPS && 64 bit
        f.isN64 = True
    print("('e_machine', %s)" % common_dump.HexDump(e_machine))

    print("('e_version', %s)" % common_dump.HexDump(f.read32()))
    print("('e_entry', %s)" % common_dump.HexDump(f.readWord()))
    e_phoff = f.readWord()
    print("('e_phoff', %s)" % common_dump.HexDump(e_phoff))
    e_shoff = f.readWord()
    print("('e_shoff', %s)" % common_dump.HexDump(e_shoff))
    print("('e_flags', %s)" % common_dump.HexDump(f.read32()))
    print("('e_ehsize', %s)" % common_dump.HexDump(f.read16()))
    e_phentsize = f.read16()
    print("('e_phentsize', %s)" % common_dump.HexDump(e_phentsize))
    e_phnum = f.read16()
    print("('e_phnum', %s)" % common_dump.HexDump(e_phnum))
    e_shentsize = f.read16()
    print("('e_shentsize', %s)" % common_dump.HexDump(e_shentsize))
    e_shnum = f.read16()
    print("('e_shnum', %s)" % common_dump.HexDump(e_shnum))
    e_shstrndx = f.read16()
    print("('e_shstrndx', %s)" % common_dump.HexDump(e_shstrndx))

    # Read all section headers
    sections = []
    for index in range(e_shnum[0]):
        f.seek(e_shoff[0] + index * e_shentsize[0])
        sections.append(Section(f))

    shstrtab = None
    strtab = None
    # With no section headers there is no name table to load; skipping the
    # lookup avoids indexing an empty list.
    if sections:
        # Read .shstrtab so we can resolve section names
        names_section = sections[e_shstrndx[0]]
        f.seek(names_section.sh_offset[0])
        shstrtab = StringTable(f.read(names_section.sh_size[0]))

        # Get the symbol string table
        for section in sections:
            if shstrtab[section.sh_name[0]] == ".strtab":
                f.seek(section.sh_offset[0])
                strtab = StringTable(f.read(section.sh_size[0]))
                break

    print("('_sections', [")
    for index, section in enumerate(sections):
        print(" # Section %s" % index)
        section.dump(shstrtab, f, strtab, opts.dumpSectionData)
    print("])")

    # Read all program headers
    headers = []
    for index in range(e_phnum[0]):
        f.seek(e_phoff[0] + index * e_phentsize[0])
        headers.append(ProgramHeader(f))

    print("('_ProgramHeaders', [")
    for index, header in enumerate(headers):
        print(" # Program Header %s" % index)
        header.dump()
    print("])")
if __name__ == "__main__":
    from optparse import OptionParser, OptionGroup

    # Command-line driver: parse the options, then dump each named file.
    parser = OptionParser("usage: %prog [options] {files}")
    parser.add_option(
        "", "--dump-section-data",
        action="store_true",
        default=False,
        dest="dumpSectionData",
        help="Dump the contents of sections")
    opts, args = parser.parse_args()

    # Without any file argument, fall back to "-".
    if len(args) == 0:
        args.append('-')

    for path in args:
        dumpELF(path, opts)