| #!/usr/bin/env python |
| |
| import struct |
| import sys |
| import StringIO |
| |
| import common_dump |
| |
| class Reader: |
| def __init__(self, path): |
| if path == "-": |
| # Snarf all the data so we can seek. |
| self.file = StringIO.StringIO(sys.stdin.read()) |
| else: |
| self.file = open(path, "rb") |
| self.isLSB = None |
| self.is64Bit = None |
| self.isN64 = False |
| |
| def seek(self, pos): |
| self.file.seek(pos) |
| |
| def read(self, N): |
| data = self.file.read(N) |
| if len(data) != N: |
| raise ValueError, "Out of data!" |
| return data |
| |
| def read8(self): |
| return (ord(self.read(1)), 8) |
| |
| def read16(self): |
| return (struct.unpack('><'[self.isLSB] + 'H', self.read(2))[0], 16) |
| |
| def read32(self): |
| return (struct.unpack('><'[self.isLSB] + 'I', self.read(4))[0], 32) |
| |
| def read64(self): |
| return (struct.unpack('><'[self.isLSB] + 'Q', self.read(8))[0], 64) |
| |
| def readWord(self): |
| if self.is64Bit: |
| return self.read64() |
| else: |
| return self.read32() |
| |
| class StringTable: |
| def __init__(self, strings): |
| self.string_table = strings |
| |
| def __getitem__(self, index): |
| end = self.string_table.index('\x00', index) |
| return self.string_table[index:end] |
| |
| class ProgramHeader: |
| def __init__(self, f): |
| self.p_type = f.read32() |
| if f.is64Bit: |
| self.p_flags = f.read32() |
| self.p_offset = f.readWord() |
| self.p_vaddr = f.readWord() |
| self.p_paddr = f.readWord() |
| self.p_filesz = f.readWord() |
| self.p_memsz = f.readWord() |
| if not f.is64Bit: |
| self.p_flags = f.read32() |
| self.p_align = f.readWord() |
| |
| def dump(self): |
| print " (('p_type', %s)" % common_dump.HexDump(self.p_type) |
| print " ('p_flags', %s)" % common_dump.HexDump(self.p_flags) |
| print " ('p_offset', %s)" % common_dump.HexDump(self.p_offset) |
| print " ('p_vaddr', %s)" % common_dump.HexDump(self.p_vaddr) |
| print " ('p_paddr', %s)" % common_dump.HexDump(self.p_paddr) |
| print " ('p_filesz', %s)" % common_dump.HexDump(self.p_filesz) |
| print " ('p_memsz', %s)" % common_dump.HexDump(self.p_memsz) |
| print " ('p_align', %s)" % common_dump.HexDump(self.p_align) |
| print " )," |
| |
| class Section: |
| def __init__(self, f): |
| self.sh_name = f.read32() |
| self.sh_type = f.read32() |
| self.sh_flags = f.readWord() |
| self.sh_addr = f.readWord() |
| self.sh_offset = f.readWord() |
| self.sh_size = f.readWord() |
| self.sh_link = f.read32() |
| self.sh_info = f.read32() |
| self.sh_addralign = f.readWord() |
| self.sh_entsize = f.readWord() |
| |
| def dump(self, shstrtab, f, strtab, dumpdata): |
| print " (('sh_name', %s)" % common_dump.HexDump(self.sh_name), "# %r" % shstrtab[self.sh_name[0]] |
| print " ('sh_type', %s)" % common_dump.HexDump(self.sh_type) |
| print " ('sh_flags', %s)" % common_dump.HexDump(self.sh_flags) |
| print " ('sh_addr', %s)" % common_dump.HexDump(self.sh_addr) |
| print " ('sh_offset', %s)" % common_dump.HexDump(self.sh_offset) |
| print " ('sh_size', %s)" % common_dump.HexDump(self.sh_size) |
| print " ('sh_link', %s)" % common_dump.HexDump(self.sh_link) |
| print " ('sh_info', %s)" % common_dump.HexDump(self.sh_info) |
| print " ('sh_addralign', %s)" % common_dump.HexDump(self.sh_addralign) |
| print " ('sh_entsize', %s)" % common_dump.HexDump(self.sh_entsize) |
| if self.sh_type[0] == 2: # SHT_SYMTAB |
| print " ('_symbols', [" |
| dumpSymtab(f, self, strtab) |
| print " ])" |
| elif self.sh_type[0] == 4 or self.sh_type[0] == 9: # SHT_RELA / SHT_REL |
| print " ('_relocations', [" |
| dumpRel(f, self, self.sh_type[0] == 4) |
| print " ])" |
| elif dumpdata: |
| f.seek(self.sh_offset[0]) |
| if self.sh_type != 8: # != SHT_NOBITS |
| data = f.read(self.sh_size[0]) |
| print " ('_section_data', '%s')" % common_dump.dataToHex(data) |
| else: |
| print " ('_section_data', '')" |
| print " )," |
| |
| def dumpSymtab(f, section, strtab): |
| entries = section.sh_size[0] // section.sh_entsize[0] |
| |
| for index in range(entries): |
| f.seek(section.sh_offset[0] + index * section.sh_entsize[0]) |
| print " # Symbol %s" % index |
| name = f.read32() |
| print " (('st_name', %s)" % common_dump.HexDump(name), "# %r" % strtab[name[0]] |
| if not f.is64Bit: |
| print " ('st_value', %s)" % common_dump.HexDump(f.read32()) |
| print " ('st_size', %s)" % common_dump.HexDump(f.read32()) |
| st_info = f.read8()[0] |
| st_bind = (st_info >> 4, 4) |
| st_type = (st_info & 0xf, 4) |
| print " ('st_bind', %s)" % common_dump.HexDump(st_bind) |
| print " ('st_type', %s)" % common_dump.HexDump(st_type) |
| print " ('st_other', %s)" % common_dump.HexDump(f.read8()) |
| print " ('st_shndx', %s)" % common_dump.HexDump(f.read16()) |
| if f.is64Bit: |
| print " ('st_value', %s)" % common_dump.HexDump(f.read64()) |
| print " ('st_size', %s)" % common_dump.HexDump(f.read64()) |
| print " )," |
| |
| def dumpRel(f, section, dumprela = False): |
| entries = section.sh_size[0] // section.sh_entsize[0] |
| |
| for index in range(entries): |
| f.seek(section.sh_offset[0] + index * section.sh_entsize[0]) |
| print " # Relocation %s" % index |
| print " (('r_offset', %s)" % common_dump.HexDump(f.readWord()) |
| |
| if f.isN64: |
| r_sym = f.read32() |
| r_ssym = f.read8() |
| r_type3 = f.read8() |
| r_type2 = f.read8() |
| r_type = f.read8() |
| print " ('r_sym', %s)" % common_dump.HexDump(r_sym) |
| print " ('r_ssym', %s)" % common_dump.HexDump(r_ssym) |
| print " ('r_type3', %s)" % common_dump.HexDump(r_type3) |
| print " ('r_type2', %s)" % common_dump.HexDump(r_type2) |
| print " ('r_type', %s)" % common_dump.HexDump(r_type) |
| else: |
| r_info = f.readWord()[0] |
| if f.is64Bit: |
| r_sym = (r_info >> 32, 32) |
| r_type = (r_info & 0xffffffff, 32) |
| else: |
| r_sym = (r_info >> 8, 24) |
| r_type = (r_info & 0xff, 8) |
| print " ('r_sym', %s)" % common_dump.HexDump(r_sym) |
| print " ('r_type', %s)" % common_dump.HexDump(r_type) |
| if dumprela: |
| print " ('r_addend', %s)" % common_dump.HexDump(f.readWord()) |
| print " )," |
| |
| def dumpELF(path, opts): |
| f = Reader(path) |
| |
| magic = f.read(4) |
| assert magic == '\x7FELF' |
| |
| fileclass = f.read8() |
| if fileclass[0] == 1: # ELFCLASS32 |
| f.is64Bit = False |
| elif fileclass[0] == 2: # ELFCLASS64 |
| f.is64Bit = True |
| else: |
| raise ValueError, "Unknown file class %s" % common_dump.HexDump(fileclass) |
| print "('e_indent[EI_CLASS]', %s)" % common_dump.HexDump(fileclass) |
| |
| byteordering = f.read8() |
| if byteordering[0] == 1: # ELFDATA2LSB |
| f.isLSB = True |
| elif byteordering[0] == 2: # ELFDATA2MSB |
| f.isLSB = False |
| else: |
| raise ValueError, "Unknown byte ordering %s" % common_dump.HexDump(byteordering) |
| print "('e_indent[EI_DATA]', %s)" % common_dump.HexDump(byteordering) |
| |
| print "('e_indent[EI_VERSION]', %s)" % common_dump.HexDump(f.read8()) |
| print "('e_indent[EI_OSABI]', %s)" % common_dump.HexDump(f.read8()) |
| print "('e_indent[EI_ABIVERSION]', %s)" % common_dump.HexDump(f.read8()) |
| |
| f.seek(16) # Seek to end of e_ident. |
| |
| print "('e_type', %s)" % common_dump.HexDump(f.read16()) |
| |
| # Does any other architecture use N64? |
| e_machine = f.read16() |
| if e_machine[0] == 0x0008 and f.is64Bit: # EM_MIPS && 64 bit |
| f.isN64 = True |
| |
| print "('e_machine', %s)" % common_dump.HexDump(e_machine) |
| print "('e_version', %s)" % common_dump.HexDump(f.read32()) |
| print "('e_entry', %s)" % common_dump.HexDump(f.readWord()) |
| e_phoff = f.readWord() |
| print "('e_phoff', %s)" % common_dump.HexDump(e_phoff) |
| e_shoff = f.readWord() |
| print "('e_shoff', %s)" % common_dump.HexDump(e_shoff) |
| print "('e_flags', %s)" % common_dump.HexDump(f.read32()) |
| print "('e_ehsize', %s)" % common_dump.HexDump(f.read16()) |
| e_phentsize = f.read16() |
| print "('e_phentsize', %s)" % common_dump.HexDump(e_phentsize) |
| e_phnum = f.read16() |
| print "('e_phnum', %s)" % common_dump.HexDump(e_phnum) |
| e_shentsize = f.read16() |
| print "('e_shentsize', %s)" % common_dump.HexDump(e_shentsize) |
| e_shnum = f.read16() |
| print "('e_shnum', %s)" % common_dump.HexDump(e_shnum) |
| e_shstrndx = f.read16() |
| print "('e_shstrndx', %s)" % common_dump.HexDump(e_shstrndx) |
| |
| |
| # Read all section headers |
| sections = [] |
| for index in range(e_shnum[0]): |
| f.seek(e_shoff[0] + index * e_shentsize[0]) |
| s = Section(f) |
| sections.append(s) |
| |
| # Read .shstrtab so we can resolve section names |
| f.seek(sections[e_shstrndx[0]].sh_offset[0]) |
| shstrtab = StringTable(f.read(sections[e_shstrndx[0]].sh_size[0])) |
| |
| # Get the symbol string table |
| strtab = None |
| for section in sections: |
| if shstrtab[section.sh_name[0]] == ".strtab": |
| f.seek(section.sh_offset[0]) |
| strtab = StringTable(f.read(section.sh_size[0])) |
| break |
| |
| print "('_sections', [" |
| for index in range(e_shnum[0]): |
| print " # Section %s" % index |
| sections[index].dump(shstrtab, f, strtab, opts.dumpSectionData) |
| print "])" |
| |
| # Read all program headers |
| headers = [] |
| for index in range(e_phnum[0]): |
| f.seek(e_phoff[0] + index * e_phentsize[0]) |
| h = ProgramHeader(f) |
| headers.append(h) |
| |
| print "('_ProgramHeaders', [" |
| for index in range(e_phnum[0]): |
| print " # Program Header %s" % index |
| headers[index].dump() |
| print "])" |
| |
| if __name__ == "__main__": |
| from optparse import OptionParser, OptionGroup |
| parser = OptionParser("usage: %prog [options] {files}") |
| parser.add_option("", "--dump-section-data", dest="dumpSectionData", |
| help="Dump the contents of sections", |
| action="store_true", default=False) |
| (opts, args) = parser.parse_args() |
| |
| if not args: |
| args.append('-') |
| |
| for arg in args: |
| dumpELF(arg, opts) |