Benjamin Kramer | a754be4 | 2010-09-09 15:00:41 +0000 | [diff] [blame] | 1 | #!/usr/bin/env python |
| 2 | |
| 3 | import struct |
| 4 | import sys |
| 5 | import StringIO |
| 6 | |
Rafael Espindola | 228290c | 2010-09-11 15:25:58 +0000 | [diff] [blame] | 7 | import common_dump |
| 8 | |
class Reader:
    """Seekable binary reader with endianness- and word-size-aware decoding.

    ``isLSB`` and ``is64Bit`` both start out as ``None``; the caller must set
    them (``isLSB`` before any multi-byte read, ``is64Bit`` before any
    ``readWord``/``readWordS``) once the corresponding header bytes are known.
    """

    def __init__(self, path):
        """Open *path* in binary mode; the path ``"-"`` means standard input."""
        if path == "-":
            # Function-scope import so this class does not depend on the
            # file's top-level import list.
            import io
            # Snarf all the data so we can seek.  Python 3 exposes the raw
            # byte stream as ``sys.stdin.buffer``; on Python 2 ``sys.stdin``
            # itself already yields byte strings.
            stream = getattr(sys.stdin, "buffer", sys.stdin)
            self.file = io.BytesIO(stream.read())
        else:
            self.file = open(path, "rb")
        self.isLSB = None
        self.is64Bit = None

    def seek(self, pos):
        """Move the read position to absolute offset *pos*."""
        self.file.seek(pos)

    def read(self, N):
        """Return exactly *N* bytes.

        Raises:
            ValueError: if fewer than *N* bytes remain.
        """
        data = self.file.read(N)
        if len(data) != N:
            raise ValueError("Out of data!")
        return data

    def _unpack(self, code, size):
        """Read *size* bytes and decode them with struct format *code*."""
        # '><'[False] is '>' (big-endian), '><'[True] is '<' (little-endian).
        return struct.unpack('><'[self.isLSB] + code, self.read(size))[0]

    def read8(self):
        """Read one unsigned byte."""
        return ord(self.read(1))

    def read16(self):
        """Read an unsigned 16-bit integer."""
        return self._unpack('H', 2)

    def read32(self):
        """Read an unsigned 32-bit integer."""
        return self._unpack('I', 4)

    def read32S(self):
        """Read a signed 32-bit integer."""
        return self._unpack('i', 4)

    def read64(self):
        """Read an unsigned 64-bit integer."""
        return self._unpack('Q', 8)

    def read64S(self):
        """Read a signed 64-bit integer."""
        return self._unpack('q', 8)

    def readWord(self):
        """Read an unsigned word: 64 bits if ``is64Bit`` is true, else 32."""
        if self.is64Bit:
            return self.read64()
        else:
            return self.read32()

    def readWordS(self):
        """Read a signed word: 64 bits if ``is64Bit`` is true, else 32."""
        if self.is64Bit:
            return self.read64S()
        else:
            return self.read32S()
| 57 | |
class StringTable:
    """A blob of NUL-terminated strings addressed by starting offset.

    The blob may be a byte string (what a binary-mode read returns) or a
    text string; looked-up entries have the same type as the blob.
    """

    def __init__(self, strings):
        """Wrap *strings*, the raw contents of the string table."""
        self.string_table = strings

    def __getitem__(self, index):
        """Return the string starting at offset *index*, without its NUL.

        Raises:
            ValueError: if no NUL terminator occurs at or after *index*.
        """
        table = self.string_table
        # The terminator must have the same type as the table: on Python 3 a
        # bytes table cannot be searched for a text NUL.  On Python 2
        # ``bytes`` is ``str``, so the lookup is unchanged there.
        terminator = b'\x00' if isinstance(table, bytes) else u'\x00'
        end = table.index(terminator, index)
        return table[index:end]
| 65 | |
class Section:
    """One section header, decoded from a reader positioned at its start."""

    # Header fields in the order they are read, each paired with the name of
    # the reader method that decodes it.
    _LAYOUT = (
        ('sh_name', 'read32'),
        ('sh_type', 'read32'),
        ('sh_flags', 'readWord'),
        ('sh_addr', 'readWord'),
        ('sh_offset', 'readWord'),
        ('sh_size', 'readWord'),
        ('sh_link', 'read32'),
        ('sh_info', 'read32'),
        ('sh_addralign', 'readWord'),
        ('sh_entsize', 'readWord'),
    )

    def __init__(self, f):
        """Read all header fields, in layout order, from reader *f*."""
        for attribute, method in self._LAYOUT:
            setattr(self, attribute, getattr(f, method)())

    def dump(self, shstrtab, f, strtab, dumpdata):
        """Print this header and, depending on its type, its contents.

        shstrtab -- string table used to resolve ``sh_name`` for the comment
        f        -- reader used to fetch symbols, relocations or raw data
        strtab   -- string table passed on to ``dumpSymtab``
        dumpdata -- when true, sections that are neither symbol tables nor
                    relocation tables get their raw bytes dumped as well
        """
        hexdump = common_dump.HexDump

        header = " (('sh_name', %s)" % hexdump(self.sh_name)
        comment = "# %r" % shstrtab[self.sh_name]
        print(header + " " + comment)
        # Every field after sh_name is printed the same way.
        for attribute, _ in self._LAYOUT[1:]:
            print(" ('%s', %s)" % (attribute, hexdump(getattr(self, attribute))))

        kind = self.sh_type
        if kind == 2:  # SHT_SYMTAB
            print(" ('_symbols', [")
            dumpSymtab(f, self, strtab)
            print(" ])")
        elif kind in (4, 9):  # SHT_RELA / SHT_REL
            print(" ('_relocations', [")
            dumpRel(f, self, kind == 4)
            print(" ])")
        elif dumpdata:
            f.seek(self.sh_offset)
            if kind == 8:  # SHT_NOBITS: nothing is read for this type
                print(" ('_section_data', '')")
            else:
                payload = f.read(self.sh_size)
                print(" ('_section_data', '%s')" % common_dump.dataToHex(payload))
        print(" ),")
| 106 | |
def dumpSymtab(f, section, strtab):
    """Print every entry of the symbol table described by *section*.

    f       -- reader; its ``is64Bit`` flag selects the entry layout
    section -- header supplying ``sh_offset``, ``sh_size`` and ``sh_entsize``
    strtab  -- string table used to resolve each ``st_name`` for the comment
    """
    hexdump = common_dump.HexDump
    count = section.sh_size // section.sh_entsize

    for index in range(count):
        f.seek(section.sh_offset + index * section.sh_entsize)
        print(" # Symbol %s" % hexdump(index))

        name = f.read32()
        header = " (('st_name', %s)" % hexdump(name)
        comment = "# %r" % strtab[name]
        print(header + " " + comment)

        wide = f.is64Bit
        # 32-bit entries carry value and size right after the name ...
        if not wide:
            for field in ('st_value', 'st_size'):
                print(" ('%s', %s)" % (field, hexdump(f.read32())))

        # One byte holds both binding (high nibble) and type (low nibble).
        st_info = f.read8()
        print(" ('st_bind', %s)" % hexdump(st_info >> 4))
        print(" ('st_type', %s)" % hexdump(st_info & 0xf))
        print(" ('st_other', %s)" % hexdump(f.read8()))
        print(" ('st_shndx', %s)" % hexdump(f.read16()))

        # ... while 64-bit entries carry them last.  The extra 64 passed to
        # HexDump is presumably a bit width -- confirm in common_dump.
        if wide:
            for field in ('st_value', 'st_size'):
                print(" ('%s', %s)" % (field, hexdump(f.read64(), 64)))
        print(" ),")
| 127 | |
def dumpRel(f, section, dumprela = False):
    """Print every entry of the relocation table described by *section*.

    f        -- reader; its ``is64Bit`` flag selects how ``r_info`` is split
    section  -- header supplying ``sh_offset``, ``sh_size`` and ``sh_entsize``
    dumprela -- when true, each entry is followed by a signed ``r_addend``
    """
    hexdump = common_dump.HexDump
    count = section.sh_size // section.sh_entsize

    for index in range(count):
        f.seek(section.sh_offset + index * section.sh_entsize)
        print(" # Relocation %s" % hexdump(index))
        print(" (('r_offset', %s)" % hexdump(f.readWord()))

        r_info = f.readWord()
        # r_info packs the symbol index above the relocation type: the type
        # takes the low 32 bits in 64-bit files and the low 8 bits otherwise.
        if f.is64Bit:
            shift, mask = 32, 0xffffffff
        else:
            shift, mask = 8, 0xff
        print(" ('r_sym', %s)" % hexdump(r_info >> shift))
        print(" ('r_type', %s)" % hexdump(r_info & mask))

        if dumprela:
            print(" ('r_addend', %s)" % hexdump(f.readWordS()))
        print(" ),")
| 145 | |
def dumpELF(path, opts):
    """Print the ELF header and every section of the file at *path*.

    path -- file to dump; ``"-"`` makes ``Reader`` consume standard input
    opts -- parsed options; only ``opts.dumpSectionData`` is consulted

    Raises:
        ValueError: on a bad magic number, an unknown file class or byte
            ordering, or when the file ends before a requested read.
    """
    def emit(name, value):
        # One "('name', <hex>)" line of top-level header output.
        print("('%s', %s)" % (name, common_dump.HexDump(value)))

    f = Reader(path)
    try:
        # Validate with a real exception: an ``assert`` disappears under
        # ``python -O`` and would let arbitrary data be parsed as ELF.
        # (Byte-string literals are plain ``str`` on Python 2.)
        magic = f.read(4)
        if magic != b'\x7FELF':
            raise ValueError("Not an ELF file (bad magic %r)" % (magic,))

        fileclass = f.read8()
        if fileclass == 1:  # ELFCLASS32
            f.is64Bit = False
        elif fileclass == 2:  # ELFCLASS64
            f.is64Bit = True
        else:
            raise ValueError("Unknown file class %s" % common_dump.HexDump(fileclass))
        emit('e_indent[EI_CLASS]', fileclass)

        byteordering = f.read8()
        if byteordering == 1:  # ELFDATA2LSB
            f.isLSB = True
        elif byteordering == 2:  # ELFDATA2MSB
            f.isLSB = False
        else:
            raise ValueError("Unknown byte ordering %s" % common_dump.HexDump(byteordering))
        emit('e_indent[EI_DATA]', byteordering)

        emit('e_indent[EI_VERSION]', f.read8())
        emit('e_indent[EI_OSABI]', f.read8())
        emit('e_indent[EI_ABIVERSION]', f.read8())

        f.seek(16)  # Seek to end of e_ident.

        emit('e_type', f.read16())
        emit('e_machine', f.read16())
        emit('e_version', f.read32())
        emit('e_entry', f.readWord())
        emit('e_phoff', f.readWord())
        e_shoff = f.readWord()
        emit('e_shoff', e_shoff)
        emit('e_flags', f.read32())
        emit('e_ehsize', f.read16())
        emit('e_phentsize', f.read16())
        emit('e_phnum', f.read16())
        e_shentsize = f.read16()
        emit('e_shentsize', e_shentsize)
        e_shnum = f.read16()
        emit('e_shnum', e_shnum)
        e_shstrndx = f.read16()
        emit('e_shstrndx', e_shstrndx)

        # Read all section headers
        sections = []
        for index in range(e_shnum):
            f.seek(e_shoff + index * e_shentsize)
            sections.append(Section(f))

        shstrtab = None
        strtab = None
        # A file without section headers has no string tables to load;
        # indexing ``sections`` unconditionally would raise IndexError.
        if sections:
            # Read .shstrtab so we can resolve section names
            names = sections[e_shstrndx]
            f.seek(names.sh_offset)
            shstrtab = StringTable(f.read(names.sh_size))

            # Get the symbol string table
            for section in sections:
                if shstrtab[section.sh_name] == b".strtab":
                    f.seek(section.sh_offset)
                    strtab = StringTable(f.read(section.sh_size))
                    break

        print("('_sections', [")
        for index, section in enumerate(sections):
            print(" # Section %s" % common_dump.HexDump(index))
            section.dump(shstrtab, f, strtab, opts.dumpSectionData)
        print("])")
    finally:
        # Release the file handle (or in-memory buffer) even on error.
        f.file.close()
| 218 | |
if __name__ == "__main__":
    from optparse import OptionParser, OptionGroup

    # Command line: an optional --dump-section-data flag, then input files.
    parser = OptionParser("usage: %prog [options] {files}")
    parser.add_option("", "--dump-section-data",
                      action="store_true", default=False,
                      dest="dumpSectionData",
                      help="Dump the contents of sections")
    opts, args = parser.parse_args()

    # With no file arguments, dump a single image read from standard input.
    for arg in (args or ['-']):
        dumpELF(arg, opts)