Eli Bendersky | 3edefab | 2011-09-16 14:52:54 +0300 | [diff] [blame] | 1 | #!/usr/bin/env python |
Eli Bendersky | 933f699 | 2011-09-09 08:11:06 +0300 | [diff] [blame] | 2 | #------------------------------------------------------------------------------- |
Eli Bendersky | 2fc0f2a | 2011-09-17 10:39:29 +0300 | [diff] [blame] | 3 | # scripts/readelf.py |
Eli Bendersky | 933f699 | 2011-09-09 08:11:06 +0300 | [diff] [blame] | 4 | # |
| 5 | # A clone of 'readelf' in Python, based on the pyelftools library |
| 6 | # |
| 7 | # Eli Bendersky (eliben@gmail.com) |
| 8 | # This code is in the public domain |
| 9 | #------------------------------------------------------------------------------- |
Eli Bendersky | 53e86db | 2011-09-18 06:04:30 +0300 | [diff] [blame] | 10 | import os, sys |
Eli Bendersky | 933f699 | 2011-09-09 08:11:06 +0300 | [diff] [blame] | 11 | from optparse import OptionParser |
Eli Bendersky | 53e86db | 2011-09-18 06:04:30 +0300 | [diff] [blame] | 12 | import string |
| 13 | |
Eli Bendersky | 933f699 | 2011-09-09 08:11:06 +0300 | [diff] [blame] | 14 | |
| 15 | # If elftools is not installed, maybe we're running from the root or scripts |
| 16 | # dir of the source distribution |
| 17 | # |
| 18 | try: |
| 19 | import elftools |
| 20 | except ImportError: |
| 21 | sys.path.extend(['.', '..']) |
| 22 | |
Eli Bendersky | 0b27ba4 | 2011-09-17 06:44:02 +0300 | [diff] [blame] | 23 | from elftools import __version__ |
Eli Bendersky | 933f699 | 2011-09-09 08:11:06 +0300 | [diff] [blame] | 24 | from elftools.common.exceptions import ELFError |
| 25 | from elftools.elf.elffile import ELFFile |
Eli Bendersky | 3f4de3e | 2011-09-14 05:58:06 +0300 | [diff] [blame] | 26 | from elftools.elf.segments import InterpSegment |
Eli Bendersky | 149315a | 2011-11-24 08:12:37 +0200 | [diff] [blame] | 27 | from elftools.elf.sections import SymbolTableSection |
| 28 | from elftools.elf.relocation import RelocationSection |
Eli Bendersky | 933f699 | 2011-09-09 08:11:06 +0300 | [diff] [blame] | 29 | from elftools.elf.descriptions import ( |
| 30 | describe_ei_class, describe_ei_data, describe_ei_version, |
Eli Bendersky | de8d71e | 2011-09-09 08:22:35 +0300 | [diff] [blame] | 31 | describe_ei_osabi, describe_e_type, describe_e_machine, |
Eli Bendersky | 26de2ac | 2011-09-13 06:50:28 +0300 | [diff] [blame] | 32 | describe_e_version_numeric, describe_p_type, describe_p_flags, |
Eli Bendersky | 377bd86 | 2011-09-16 11:10:44 +0300 | [diff] [blame] | 33 | describe_sh_type, describe_sh_flags, |
Eli Bendersky | 3edefab | 2011-09-16 14:52:54 +0300 | [diff] [blame] | 34 | describe_symbol_type, describe_symbol_bind, describe_symbol_visibility, |
Eli Bendersky | 89a824f | 2011-09-23 10:59:59 +0300 | [diff] [blame] | 35 | describe_symbol_shndx, describe_reloc_type, |
Eli Bendersky | 933f699 | 2011-09-09 08:11:06 +0300 | [diff] [blame] | 36 | ) |
Eli Bendersky | 149315a | 2011-11-24 08:12:37 +0200 | [diff] [blame] | 37 | from elftools.dwarf.dwarfinfo import DWARFInfo |
eliben | aee11d2 | 2011-10-26 10:42:34 +0200 | [diff] [blame] | 38 | from elftools.dwarf.descriptions import describe_attr_value |
Eli Bendersky | 933f699 | 2011-09-09 08:11:06 +0300 | [diff] [blame] | 39 | |
| 40 | |
class ReadElf(object):
    """ display_* methods are used to emit output into the output stream
    """
    # NOTE(review): whitespace inside the string literals below is kept
    # exactly as found; column padding may have been collapsed upstream --
    # confirm against real readelf output before relying on alignment.

    def __init__(self, file, output):
        """ file:
                stream object with the ELF file to read

            output:
                output stream to write to
        """
        self.elffile = ELFFile(file)
        self.output = output

        # Lazily initialized if a debug dump is requested
        self._dwarfinfo = None

    def display_file_header(self):
        """ Display the ELF file header
        """
        self._emitline('ELF Header:')
        self._emit(' Magic: ')
        # bytearray() yields integers for both a Python 2 str and a Python 3
        # bytes object, so no ord() call is needed (ord() fails on ints).
        self._emitline(' '.join('%2.2x' % b
                                for b in bytearray(self.elffile.e_ident_raw)))
        header = self.elffile.header
        e_ident = header['e_ident']
        self._emitline(' Class: %s' %
                       describe_ei_class(e_ident['EI_CLASS']))
        self._emitline(' Data: %s' %
                       describe_ei_data(e_ident['EI_DATA']))
        self._emitline(' Version: %s' %
                       describe_ei_version(e_ident['EI_VERSION']))
        self._emitline(' OS/ABI: %s' %
                       describe_ei_osabi(e_ident['EI_OSABI']))
        self._emitline(' ABI Version: %d' %
                       e_ident['EI_ABIVERSION'])
        self._emitline(' Type: %s' %
                       describe_e_type(header['e_type']))
        self._emitline(' Machine: %s' %
                       describe_e_machine(header['e_machine']))
        self._emitline(' Version: %s' %
                       describe_e_version_numeric(header['e_version']))
        self._emitline(' Entry point address: %s' %
                       self._format_hex(header['e_entry']))
        self._emit(' Start of program headers: %s' %
                   header['e_phoff'])
        self._emitline(' (bytes into file)')
        self._emit(' Start of section headers: %s' %
                   header['e_shoff'])
        self._emitline(' (bytes into file)')
        self._emitline(' Flags: %s' %
                       self._format_hex(header['e_flags']))
        self._emitline(' Size of this header: %s (bytes)' %
                       header['e_ehsize'])
        self._emitline(' Size of program headers: %s (bytes)' %
                       header['e_phentsize'])
        self._emitline(' Number of program headers: %s' %
                       header['e_phnum'])
        self._emitline(' Size of section headers: %s (bytes)' %
                       header['e_shentsize'])
        self._emitline(' Number of section headers: %s' %
                       header['e_shnum'])
        self._emitline(' Section header string table index: %s' %
                       header['e_shstrndx'])

    def display_program_headers(self, show_heading=True):
        """ Display the ELF program headers.
            If show_heading is True, displays the heading for this information
            (Elf file type is...)
        """
        self._emitline()
        if self.elffile.num_segments() == 0:
            self._emitline('There are no program headers in this file.')
            return

        elfheader = self.elffile.header
        if show_heading:
            self._emitline('Elf file type is %s' %
                           describe_e_type(elfheader['e_type']))
            self._emitline('Entry point is %s' %
                           self._format_hex(elfheader['e_entry']))
            # readelf weirdness - why isn't e_phoff printed as hex? (for
            # section headers, it is...)
            self._emitline('There are %s program headers, starting at offset %s' % (
                elfheader['e_phnum'], elfheader['e_phoff']))
            self._emitline()

        self._emitline('Program Headers:')

        # Now comes the table of program headers with their attributes. Note
        # that due to different formatting constraints of 32-bit and 64-bit
        # addresses, there are some conditions on elfclass here.
        #
        # First comes the table heading
        #
        if self.elffile.elfclass == 32:
            self._emitline(' Type Offset VirtAddr PhysAddr FileSiz MemSiz Flg Align')
        else:
            self._emitline(' Type Offset VirtAddr PhysAddr')
            self._emitline(' FileSiz MemSiz Flags Align')

        # Now the entries
        #
        for segment in self.elffile.iter_segments():
            self._emit(' %-14s ' % describe_p_type(segment['p_type']))

            if self.elffile.elfclass == 32:
                self._emitline('%s %s %s %s %s %-3s %s' % (
                    self._format_hex(segment['p_offset'], fieldsize=6),
                    self._format_hex(segment['p_vaddr'], fullhex=True),
                    self._format_hex(segment['p_paddr'], fullhex=True),
                    self._format_hex(segment['p_filesz'], fieldsize=5),
                    self._format_hex(segment['p_memsz'], fieldsize=5),
                    describe_p_flags(segment['p_flags']),
                    self._format_hex(segment['p_align'])))
            else:  # 64
                self._emitline('%s %s %s' % (
                    self._format_hex(segment['p_offset'], fullhex=True),
                    self._format_hex(segment['p_vaddr'], fullhex=True),
                    self._format_hex(segment['p_paddr'], fullhex=True)))
                self._emitline(' %s %s %-3s %s' % (
                    self._format_hex(segment['p_filesz'], fullhex=True),
                    self._format_hex(segment['p_memsz'], fullhex=True),
                    describe_p_flags(segment['p_flags']),
                    # lead0x set to False for p_align, to mimic readelf.
                    # No idea why the difference from 32-bit mode :-|
                    self._format_hex(segment['p_align'], lead0x=False)))

            if isinstance(segment, InterpSegment):
                self._emitline(' [Requesting program interpreter: %s]' %
                               segment.get_interp_name())

        # Sections to segments mapping
        #
        if self.elffile.num_sections() == 0:
            # No sections? We're done
            return

        self._emitline('\n Section to Segment mapping:')
        self._emitline(' Segment Sections...')

        for nseg, segment in enumerate(self.elffile.iter_segments()):
            self._emit(' %2.2d ' % nseg)

            for section in self.elffile.iter_sections():
                if (not section.is_null() and
                        segment.section_in_segment(section)):
                    self._emit('%s ' % section.name)

            self._emitline('')

    def display_section_headers(self, show_heading=True):
        """ Display the ELF section headers.
            If show_heading is True, first emits the line stating how many
            section headers there are and at which offset they start.
        """
        elfheader = self.elffile.header
        if show_heading:
            self._emitline('There are %s section headers, starting at offset %s' % (
                elfheader['e_shnum'], self._format_hex(elfheader['e_shoff'])))

        self._emitline('\nSection Header%s:' % (
            's' if elfheader['e_shnum'] > 1 else ''))

        # Different formatting constraints of 32-bit and 64-bit addresses
        #
        if self.elffile.elfclass == 32:
            self._emitline(' [Nr] Name Type Addr Off Size ES Flg Lk Inf Al')
        else:
            self._emitline(' [Nr] Name Type Address Offset')
            self._emitline(' Size EntSize Flags Link Info Align')

        # Now the entries
        #
        for nsec, section in enumerate(self.elffile.iter_sections()):
            self._emit(' [%2u] %-17.17s %-15.15s ' % (
                nsec, section.name, describe_sh_type(section['sh_type'])))

            if self.elffile.elfclass == 32:
                self._emitline('%s %s %s %s %3s %2s %3s %2s' % (
                    self._format_hex(section['sh_addr'], fieldsize=8, lead0x=False),
                    self._format_hex(section['sh_offset'], fieldsize=6, lead0x=False),
                    self._format_hex(section['sh_size'], fieldsize=6, lead0x=False),
                    self._format_hex(section['sh_entsize'], fieldsize=2, lead0x=False),
                    describe_sh_flags(section['sh_flags']),
                    section['sh_link'], section['sh_info'],
                    section['sh_addralign']))
            else:  # 64
                self._emitline(' %s %s' % (
                    self._format_hex(section['sh_addr'], fullhex=True, lead0x=False),
                    # The offset field widens to 16 digits only when the
                    # value does not fit in 32 bits
                    self._format_hex(section['sh_offset'],
                        fieldsize=16 if section['sh_offset'] > 0xffffffff else 8,
                        lead0x=False)))
                self._emitline(' %s %s %3s %2s %3s %s' % (
                    self._format_hex(section['sh_size'], fullhex=True, lead0x=False),
                    self._format_hex(section['sh_entsize'], fullhex=True, lead0x=False),
                    describe_sh_flags(section['sh_flags']),
                    section['sh_link'], section['sh_info'],
                    section['sh_addralign']))

        self._emitline('Key to Flags:')
        self._emit(' W (write), A (alloc), X (execute), M (merge), S (strings)')
        if self.elffile['e_machine'] in ('EM_X86_64', 'EM_L10M'):
            self._emitline(', l (large)')
        else:
            self._emitline()
        self._emitline(' I (info), L (link order), G (group), T (TLS), E (exclude), x (unknown)')
        self._emitline(' O (extra OS processing required) o (OS specific), p (processor specific)')

    def display_symbol_tables(self):
        """ Display the symbol tables contained in the file
        """
        for section in self.elffile.iter_sections():
            if not isinstance(section, SymbolTableSection):
                continue

            if section['sh_entsize'] == 0:
                self._emitline("\nSymbol table '%s' has a sh_entsize of zero!" % (
                    section.name))
                continue

            self._emitline("\nSymbol table '%s' contains %s entries:" % (
                section.name, section.num_symbols()))

            # NOTE(review): both headings read identically here; presumably
            # they differ only in column padding -- confirm.
            if self.elffile.elfclass == 32:
                self._emitline(' Num: Value Size Type Bind Vis Ndx Name')
            else:  # 64
                self._emitline(' Num: Value Size Type Bind Vis Ndx Name')

            for nsym, symbol in enumerate(section.iter_symbols()):
                # symbol names are truncated to 25 chars, similarly to readelf
                self._emitline('%6d: %s %5d %-7s %-6s %-7s %4s %.25s' % (
                    nsym,
                    self._format_hex(symbol['st_value'], fullhex=True, lead0x=False),
                    symbol['st_size'],
                    describe_symbol_type(symbol['st_info']['type']),
                    describe_symbol_bind(symbol['st_info']['bind']),
                    describe_symbol_visibility(symbol['st_other']['visibility']),
                    describe_symbol_shndx(symbol['st_shndx']),
                    symbol.name))

    def display_relocations(self):
        """ Display the relocations contained in the file
        """
        has_relocation_sections = False
        # Width of the offset/info columns depends only on the ELF class
        hexwidth = 8 if self.elffile.elfclass == 32 else 12

        for section in self.elffile.iter_sections():
            if not isinstance(section, RelocationSection):
                continue

            has_relocation_sections = True
            self._emitline("\nRelocation section '%s' at offset %s contains %s entries:" % (
                section.name,
                self._format_hex(section['sh_offset']),
                section.num_relocations()))
            if section.is_RELA():
                self._emitline(" Offset Info Type Sym. Value Sym. Name + Addend")
            else:
                self._emitline(" Offset Info Type Sym.Value Sym. Name")

            # The symbol table section pointed to in sh_link
            symtable = self.elffile.get_section(section['sh_link'])

            for rel in section.iter_relocations():
                self._emit('%s %s %-17.17s' % (
                    self._format_hex(rel['r_offset'],
                        fieldsize=hexwidth, lead0x=False),
                    self._format_hex(rel['r_info'],
                        fieldsize=hexwidth, lead0x=False),
                    describe_reloc_type(
                        rel['r_info_type'], self.elffile)))

                if rel['r_info_sym'] == 0:
                    # No associated symbol: the line ends after the type
                    self._emitline()
                    continue

                symbol = symtable.get_symbol(rel['r_info_sym'])
                # Some symbols have zero 'st_name', so instead what's used is
                # the name of the section they point at
                if symbol['st_name'] == 0:
                    symsec = self.elffile.get_section(symbol['st_shndx'])
                    symbol_name = symsec.name
                else:
                    symbol_name = symbol.name
                self._emit(' %s %s%22.22s' % (
                    self._format_hex(
                        symbol['st_value'],
                        fullhex=True, lead0x=False),
                    ' ' if self.elffile.elfclass == 32 else '',
                    symbol_name))
                if section.is_RELA():
                    self._emit(' %s %x' % (
                        '+' if rel['r_addend'] >= 0 else '-',
                        abs(rel['r_addend'])))
                self._emitline()

        if not has_relocation_sections:
            self._emitline('\nThere are no relocations in this file.')

    def display_hex_dump(self, section_spec):
        """ Display a hex dump of a section. section_spec is either a section
            number or a name.
        """
        section = self._section_from_spec(section_spec)
        if section is None:
            self._emitline("Section '%s' does not exist in the file!" % (
                section_spec))
            return

        self._emitline("\nHex dump of section '%s':" % section.name)
        self._note_relocs_for_section(section)
        addr = section['sh_addr']
        # Work on integer byte values so the dump behaves the same whether
        # the section data is a Python 2 str or a Python 3 bytes object.
        data = bytearray(section.data())
        dataptr = 0

        while dataptr < len(data):
            # chunks of 16 bytes per line
            linebytes = min(16, len(data) - dataptr)
            chunk = data[dataptr:dataptr + linebytes]

            self._emit(' %s ' % self._format_hex(addr, fieldsize=8))
            for i in range(16):
                if i < linebytes:
                    self._emit('%2.2x' % chunk[i])
                else:
                    # pad a short final line
                    self._emit(' ')
                if i % 4 == 3:
                    # separator after every group of 4 bytes
                    self._emit(' ')

            for byte in chunk:
                # printable ASCII range is space (0x20) through '~' (0x7e)
                if 0x20 <= byte < 0x7f:
                    self._emit(chr(byte))
                else:
                    self._emit('.')

            self._emitline()
            addr += linebytes
            dataptr += linebytes

        self._emitline()

    def display_string_dump(self, section_spec):
        """ Display a strings dump of a section. section_spec is either a
            section number or a name.
        """
        section = self._section_from_spec(section_spec)
        if section is None:
            self._emitline("Section '%s' does not exist in the file!" % (
                section_spec))
            return

        # Compare integer byte values rather than characters, so the scan
        # works for both a Python 2 str and a Python 3 bytes object.
        printables = frozenset(bytearray(string.printable.encode('ascii')))
        self._emitline("\nString dump of section '%s':" % section.name)

        found = False
        raw = section.data()
        data = bytearray(raw)
        datalen = len(data)
        dataptr = 0

        while dataptr < datalen:
            # Skip to the start of the next candidate string
            while dataptr < datalen and data[dataptr] not in printables:
                dataptr += 1

            if dataptr >= datalen:
                break

            # The string runs up to (not including) the next NUL byte
            endptr = dataptr
            while endptr < datalen and data[endptr] != 0:
                endptr += 1

            found = True
            self._emitline(' [%6x] %s' % (
                dataptr, self._bytes_to_text(raw[dataptr:endptr])))

            dataptr = endptr

        if not found:
            self._emitline(' No strings found in this section.')
        else:
            self._emitline()

    def display_debug_dump(self, section_name):
        """ Dump a DWARF section. Only 'info' is handled; for any other
            section_name a "not yet supported" message is emitted. Nothing
            is emitted when the file has no DWARF info.
        """
        self._init_dwarfinfo()
        if self._dwarfinfo is None:
            return

        if section_name == 'info':
            self._dump_debug_info()
        else:
            self._emitline('debug dump not yet supported for "%s"' % section_name)

    def _format_hex(self, addr, fieldsize=None, fullhex=False, lead0x=True):
        """ Format an address into a hexadecimal string.

            fieldsize:
                Size of the hexadecimal field (with leading zeros to fit the
                address into). For example with fieldsize=8, the format will
                be %08x
                If None, the minimal required field size will be used.

            fullhex:
                If True, override fieldsize to set it to the maximal size
                needed for the elfclass

            lead0x:
                If True, leading 0x is added
        """
        prefix = '0x' if lead0x else ''
        if fullhex:
            fieldsize = 8 if self.elffile.elfclass == 32 else 16
        if fieldsize is None:
            field = '%x'
        else:
            field = '%' + '0%sx' % fieldsize
        return prefix + field % addr

    def _section_from_spec(self, spec):
        """ Retrieve a section given a "spec" (either number or name).
            Return None if no such section exists in the file.
        """
        try:
            num = int(spec)
        except ValueError:
            # Not a number. Must be a name then
            return self.elffile.get_section_by_name(spec)

        # Negative numbers are rejected as well: they do not name a section
        if 0 <= num < self.elffile.num_sections():
            return self.elffile.get_section(num)
        return None

    def _note_relocs_for_section(self, section):
        """ If there are relocation sections pointing to the given section,
            emit a note about it.
        """
        for relsec in self.elffile.iter_sections():
            if isinstance(relsec, RelocationSection):
                info_idx = relsec['sh_info']
                if self.elffile.get_section(info_idx) == section:
                    self._emitline(' Note: This section has relocations against it, but these have NOT been applied to this dump.')
                    # one note is enough
                    return

    def _init_dwarfinfo(self):
        """ Initialize the DWARF info contained in the file and assign it to
            self._dwarfinfo.
            Leave self._dwarfinfo at None if no DWARF info was found in the file
        """
        if self._dwarfinfo is not None:
            return

        if self.elffile.has_dwarf_info():
            self._dwarfinfo = self.elffile.get_dwarf_info()

    def _dump_debug_info(self):
        """ Dump the debugging info section.
        """
        self._emitline('Contents of the .debug_info section:\n')

        # Offset of the .debug_info section in the stream
        section_offset = self._dwarfinfo.debug_info_sec.global_offset

        for cu in self._dwarfinfo.iter_CUs():
            self._emitline(' Compilation Unit @ offset %s:' %
                           self._format_hex(cu.cu_offset))
            self._emitline(' Length: %s (%s)' % (
                self._format_hex(cu['unit_length']),
                '%s-bit' % cu.dwarf_format()))
            self._emitline(' Version: %s' % cu['version'])
            self._emitline(' Abbrev Offset: %s' % cu['debug_abbrev_offset'])
            self._emitline(' Pointer Size: %s' % cu['address_size'])

            # The nesting depth of each DIE within the tree of DIEs must be
            # displayed. To implement this, a counter is incremented each time
            # the current DIE has children, and decremented when a null die is
            # encountered. Due to the way the DIE tree is serialized, this will
            # correctly reflect the nesting depth
            #
            die_depth = 0
            for die in cu.iter_DIEs():
                if die.is_null():
                    die_depth -= 1
                    continue
                self._emitline(' <%s><%x>: Abbrev Number: %s (%s)' % (
                    die_depth,
                    die.offset,
                    die.abbrev_code,
                    die.tag))

                # values() rather than itervalues(): the latter exists only
                # on Python 2 dictionaries
                for attr in die.attributes.values():
                    self._emitline(' <%2x> %-18s: %s' % (
                        attr.offset,
                        attr.name,
                        describe_attr_value(
                            attr, die, section_offset)))

                if die.has_children:
                    die_depth += 1

        self._emitline()

    @staticmethod
    def _bytes_to_text(data):
        """ Return data as a native string suitable for %-formatting.
            A str is returned unchanged; anything else is decoded as latin-1,
            which maps every byte value to exactly one character.
        """
        if isinstance(data, str):
            return data
        return data.decode('latin-1')

    def _emit(self, s=''):
        """ Emit an object to output
        """
        self.output.write(str(s))

    def _emitline(self, s=''):
        """ Emit an object to output, followed by a newline
        """
        self.output.write(str(s) + '\n')
| 550 | |
| 551 | |
# Description text for the command-line option parser
SCRIPT_DESCRIPTION = (
    'Display information about the contents of ELF format files')

# The doubled '%%' survives the %-formatting below as a literal '%prog'
# placeholder in the resulting version string
VERSION_STRING = '%%prog: based on pyelftools %s' % __version__
| 554 | |
| 555 | |
def main(stream=None):
    """ Command-line entry point: parse the command-line arguments and
        invoke ReadElf on the file named by the first positional argument.

        stream:
            Writable object that receives the report. When None (the
            default), sys.stdout is used.

        Exits with status 0 after printing the help text (requested with
        -H/--help, or when no file argument was given), and with status 1
        after reporting an ELFError on stderr.
    """
    optparser = OptionParser(
            usage='usage: %prog [options] <elf-file>',
            description=SCRIPT_DESCRIPTION,
            add_help_option=False, # -h is a real option of readelf
            prog='readelf.py',
            version=VERSION_STRING)
    optparser.add_option('-H', '--help',
            action='store_true', dest='help',
            help='Display this information')
    optparser.add_option('-h', '--file-header',
            action='store_true', dest='show_file_header',
            help='Display the ELF file header')
    optparser.add_option('-l', '--program-headers', '--segments',
            action='store_true', dest='show_program_header',
            help='Display the program headers')
    optparser.add_option('-S', '--section-headers', '--sections',
            action='store_true', dest='show_section_header',
            help="Display the sections' headers")
    optparser.add_option('-e', '--headers',
            action='store_true', dest='show_all_headers',
            help='Equivalent to: -h -l -S')
    optparser.add_option('-s', '--symbols', '--syms',
            action='store_true', dest='show_symbols',
            help='Display the symbol table')
    optparser.add_option('-r', '--relocs',
            action='store_true', dest='show_relocs',
            help='Display the relocations (if present)')
    optparser.add_option('-x', '--hex-dump',
            action='store', dest='show_hex_dump', metavar='<number|name>',
            help='Dump the contents of section <number|name> as bytes')
    optparser.add_option('-p', '--string-dump',
            action='store', dest='show_string_dump', metavar='<number|name>',
            help='Dump the contents of section <number|name> as strings')
    optparser.add_option('--debug-dump',
            action='store', dest='debug_dump_section', metavar='<section>',
            help='Display the contents of DWARF debug sections')

    options, args = optparser.parse_args()

    if options.help or not args:
        optparser.print_help()
        sys.exit(0)

    # -e/--headers switches on all three header displays at once
    if options.show_all_headers:
        do_file_header = do_section_header = do_program_header = True
    else:
        do_file_header = options.show_file_header
        do_section_header = options.show_section_header
        do_program_header = options.show_program_header

    # Compare against None explicitly, so that a caller-supplied stream is
    # honoured even if the object happens to evaluate as false
    output = sys.stdout if stream is None else stream

    with open(args[0], 'rb') as elf_stream:
        try:
            readelf = ReadElf(elf_stream, output)
            if do_file_header:
                readelf.display_file_header()
            # The section and program header displays are asked to show
            # their own heading only when the file header is not displayed
            if do_section_header:
                readelf.display_section_headers(
                        show_heading=not do_file_header)
            if do_program_header:
                readelf.display_program_headers(
                        show_heading=not do_file_header)
            if options.show_symbols:
                readelf.display_symbol_tables()
            if options.show_relocs:
                readelf.display_relocations()
            if options.show_hex_dump:
                readelf.display_hex_dump(options.show_hex_dump)
            if options.show_string_dump:
                readelf.display_string_dump(options.show_string_dump)
            if options.debug_dump_section:
                readelf.display_debug_dump(options.debug_dump_section)
        except ELFError as ex:
            sys.stderr.write('ELF error: %s\n' % ex)
            sys.exit(1)
| 632 | |
| 633 | |
def profile_main():
    """ Run main() under cProfile and print a summary of the results.

        The output of main() is redirected to readelfout.txt and the raw
        profiling data is saved in readelf.profile. Afterwards the saved
        stats are sorted by cumulative time and printed, limited to 25
        entries.
    """
    import cProfile
    import pstats

    PROFFILE = 'readelf.profile'

    # Open the output file here rather than inside the profiled statement,
    # so that it is closed deterministically once main() is done.
    # runctx evaluates the statement against this module's globals, so
    # 'main' is found even when this module is not running as __main__.
    with open('readelfout.txt', 'w') as outfile:
        cProfile.runctx(
                'main(outfile)', globals(), {'outfile': outfile}, PROFFILE)

    # Dig in some profiling stats
    stats = pstats.Stats(PROFFILE)
    stats.sort_stats('cumulative').print_stats(25)
| 645 | |
| 646 | |
Eli Bendersky | 933f699 | 2011-09-09 08:11:06 +0300 | [diff] [blame] | 647 | #------------------------------------------------------------------------------- |
if __name__ == '__main__':
    # Run the command-line tool only when this file is executed as a script
    main()
    # To profile a run instead, enable the call below in place of main()
    #profile_main()
Eli Bendersky | 0193fb8 | 2011-11-26 16:16:16 +0200 | [diff] [blame] | 651 | |
Eli Bendersky | 933f699 | 2011-09-09 08:11:06 +0300 | [diff] [blame] | 652 | |