#------------------------------------------------------------------------------- # elftools: dwarf/descriptions.py # # Textual descriptions of the various values and enums of DWARF # # Eli Bendersky (eliben@gmail.com) # This code is in the public domain #------------------------------------------------------------------------------- from collections import defaultdict from .constants import * from .dwarf_expr import DWARFExprParser from .die import DIE from ..common.utils import preserve_stream_pos, dwarf_assert, bytes2str from .callframe import instruction_name, CIE, FDE def set_global_machine_arch(machine_arch): global _MACHINE_ARCH _MACHINE_ARCH = machine_arch def describe_attr_value(attr, die, section_offset): """ Given an attribute attr, return the textual representation of its value, suitable for tools like readelf. To cover all cases, this function needs some extra arguments: die: the DIE this attribute was extracted from section_offset: offset in the stream of the section the DIE belongs to """ descr_func = _ATTR_DESCRIPTION_MAP[attr.form] val_description = descr_func(attr, die, section_offset) # For some attributes we can display further information extra_info_func = _EXTRA_INFO_DESCRIPTION_MAP[attr.name] extra_info = extra_info_func(attr, die, section_offset) return str(val_description) + '\t' + extra_info def describe_CFI_instructions(entry): """ Given a CFI entry (CIE or FDE), return the textual description of its instructions. """ def _assert_FDE_instruction(instr): dwarf_assert( isinstance(entry, FDE), 'Unexpected instruction "%s" for a CIE' % instr) def _full_reg_name(regnum): regname = describe_reg_name(regnum, _MACHINE_ARCH, False) if regname: return 'r%s (%s)' % (regnum, regname) else: return 'r%s' % regnum if isinstance(entry, CIE): cie = entry else: # FDE cie = entry.cie pc = entry['initial_location'] s = '' for instr in entry.instructions: name = instruction_name(instr.opcode) if name in ('DW_CFA_offset', 'DW_CFA_offset_extended', 'DW_CFA_offset_extended_sf', 'DW_CFA_val_offset', 'DW_CFA_val_offset_sf'): s += ' %s: %s at cfa%+d\n' % ( name, _full_reg_name(instr.args[0]), instr.args[1] * cie['data_alignment_factor']) elif name in ( 'DW_CFA_restore', 'DW_CFA_restore_extended', 'DW_CFA_undefined', 'DW_CFA_same_value', 'DW_CFA_def_cfa_register'): s += ' %s: %s\n' % (name, _full_reg_name(instr.args[0])) elif name == 'DW_CFA_register': s += ' %s: %s in %s' % ( name, _full_reg_name(instr.args[0]), _full_reg_name(instr.args[1])) elif name == 'DW_CFA_set_loc': pc = instr.args[0] s += ' %s: %08x\n' % (name, pc) elif name in ( 'DW_CFA_advance_loc1', 'DW_CFA_advance_loc2', 'DW_CFA_advance_loc4', 'DW_CFA_advance_loc'): _assert_FDE_instruction(instr) factored_offset = instr.args[0] * cie['code_alignment_factor'] s += ' %s: %s to %08x\n' % ( name, factored_offset, factored_offset + pc) pc += factored_offset elif name in ( 'DW_CFA_remember_state', 'DW_CFA_restore_state', 'DW_CFA_nop'): s += ' %s\n' % name elif name == 'DW_CFA_def_cfa': s += ' %s: %s ofs %s\n' % ( name, _full_reg_name(instr.args[0]), instr.args[1]) elif name == 'DW_CFA_def_cfa_sf': s += ' %s: %s ofs %s\n' % ( name, _full_reg_name(instr.args[0]), instr.args[1] * cie['data_alignment_factor']) elif name in ('DW_CFA_def_cfa_offset', 'DW_CFA_GNU_args_size'): s += ' %s: %s\n' % (name, instr.args[0]) elif name == 'DW_CFA_def_cfa_expression': expr_dumper = ExprDumper(entry.structs) # readelf output is missing a colon for DW_CFA_def_cfa_expression s += ' %s (%s)\n' % (name, expr_dumper.dump_expr(instr.args[0])) elif name == 'DW_CFA_expression': expr_dumper = ExprDumper(entry.structs) s += ' %s: %s (%s)\n' % ( name, _full_reg_name(instr.args[0]), expr_dumper.dump_expr(instr.args[1])) else: s += ' %s: \n' % name return s def describe_CFI_register_rule(rule): s = _DESCR_CFI_REGISTER_RULE_TYPE[rule.type] if rule.type in ('OFFSET', 'VAL_OFFSET'): s += '%+d' % rule.arg elif rule.type == 'REGISTER': s += describe_reg_name(rule.arg) return s def describe_CFI_CFA_rule(rule): if rule.expr: return 'exp' else: return '%s%+d' % (describe_reg_name(rule.reg), rule.offset) def describe_DWARF_expr(expr, structs, cu_offset=None): """ Textual description of a DWARF expression encoded in 'expr'. structs should come from the entity encompassing the expression - it's needed to be able to parse it correctly. """ # Since this function can be called a lot, initializing a fresh new # ExprDumper per call is expensive. So a rudimentary caching scheme is in # place to create only one such dumper per instance of structs. cache_key = id(structs) if cache_key not in _DWARF_EXPR_DUMPER_CACHE: _DWARF_EXPR_DUMPER_CACHE[cache_key] = \ ExprDumper(structs) dwarf_expr_dumper = _DWARF_EXPR_DUMPER_CACHE[cache_key] return '(' + dwarf_expr_dumper.dump_expr(expr, cu_offset) + ')' def describe_reg_name(regnum, machine_arch=None, default=True): """ Provide a textual description for a register name, given its serial number. The number is expected to be valid. """ if machine_arch is None: machine_arch = _MACHINE_ARCH if machine_arch == 'x86': return _REG_NAMES_x86[regnum] elif machine_arch == 'x64': return _REG_NAMES_x64[regnum] elif machine_arch == 'AArch64': return _REG_NAMES_AArch64[regnum] elif default: return 'r%s' % regnum else: return None def describe_form_class(form): """For a given form name, determine its value class. For example, given 'DW_FORM_data1' returns 'constant'. For some forms, like DW_FORM_indirect and DW_FORM_sec_offset, the class is not hard-coded and extra information is required. For these, None is returned. """ return _FORM_CLASS[form] #------------------------------------------------------------------------------- # The machine architecture. Set globally via set_global_machine_arch # _MACHINE_ARCH = None # Implements the alternative format of readelf: lowercase hex, prefixed with 0x unless 0 def _format_hex(n): return '0x%x' % n if n != 0 else '0' def _describe_attr_ref(attr, die, section_offset): return '<%s>' % _format_hex(attr.value + die.cu.cu_offset) def _describe_attr_ref_sig8(attr, die, section_offset): return 'signature: %s' % _format_hex(attr.value) def _describe_attr_value_passthrough(attr, die, section_offset): return attr.value def _describe_attr_hex(attr, die, section_offset): return '%s' % _format_hex(attr.value) def _describe_attr_hex_addr(attr, die, section_offset): return '<%s>' % _format_hex(attr.value) def _describe_attr_split_64bit(attr, die, section_offset): low_word = attr.value & 0xFFFFFFFF high_word = (attr.value >> 32) & 0xFFFFFFFF return '%s %s' % (_format_hex(low_word), _format_hex(high_word)) def _describe_attr_strp(attr, die, section_offset): return '(indirect string, offset: %s): %s' % ( _format_hex(attr.raw_value), bytes2str(attr.value)) def _describe_attr_line_strp(attr, die, section_offset): return '(indirect line string, offset: %s): %s' % ( _format_hex(attr.raw_value), bytes2str(attr.value)) def _describe_attr_string(attr, die, section_offset): return bytes2str(attr.value) def _describe_attr_debool(attr, die, section_offset): """ To be consistent with readelf, generate 1 for True flags, 0 for False flags. """ return '1' if attr.value else '0' def _describe_attr_present(attr, die, section_offset): """ Some forms may simply mean that an attribute is present, without providing any value. """ return '1' def _describe_attr_block(attr, die, section_offset): s = '%s byte block: ' % len(attr.value) s += ' '.join('%x' % item for item in attr.value) + ' ' return s _ATTR_DESCRIPTION_MAP = defaultdict( lambda: _describe_attr_value_passthrough, # default_factory DW_FORM_ref1=_describe_attr_ref, DW_FORM_ref2=_describe_attr_ref, DW_FORM_ref4=_describe_attr_ref, DW_FORM_ref8=_describe_attr_split_64bit, DW_FORM_ref_udata=_describe_attr_ref, DW_FORM_ref_addr=_describe_attr_hex_addr, DW_FORM_data4=_describe_attr_hex, DW_FORM_data8=_describe_attr_hex, DW_FORM_addr=_describe_attr_hex, DW_FORM_sec_offset=_describe_attr_hex, DW_FORM_flag=_describe_attr_debool, DW_FORM_data1=_describe_attr_value_passthrough, DW_FORM_data2=_describe_attr_value_passthrough, DW_FORM_sdata=_describe_attr_value_passthrough, DW_FORM_udata=_describe_attr_value_passthrough, DW_FORM_string=_describe_attr_string, DW_FORM_strp=_describe_attr_strp, DW_FORM_line_strp=_describe_attr_line_strp, DW_FORM_block1=_describe_attr_block, DW_FORM_block2=_describe_attr_block, DW_FORM_block4=_describe_attr_block, DW_FORM_block=_describe_attr_block, DW_FORM_flag_present=_describe_attr_present, DW_FORM_exprloc=_describe_attr_block, DW_FORM_ref_sig8=_describe_attr_ref_sig8, ) _FORM_CLASS = dict( DW_FORM_addr='address', DW_FORM_block2='block', DW_FORM_block4='block', DW_FORM_data2='constant', DW_FORM_data4='constant', DW_FORM_data8='constant', DW_FORM_string='string', DW_FORM_block='block', DW_FORM_block1='block', DW_FORM_data1='constant', DW_FORM_flag='flag', DW_FORM_sdata='constant', DW_FORM_strp='string', DW_FORM_udata='constant', DW_FORM_ref_addr='reference', DW_FORM_ref1='reference', DW_FORM_ref2='reference', DW_FORM_ref4='reference', DW_FORM_ref8='reference', DW_FORM_ref_udata='reference', DW_FORM_indirect=None, DW_FORM_sec_offset=None, DW_FORM_exprloc='exprloc', DW_FORM_flag_present='flag', DW_FORM_ref_sig8='reference', ) _DESCR_DW_INL = { DW_INL_not_inlined: '(not inlined)', DW_INL_inlined: '(inlined)', DW_INL_declared_not_inlined: '(declared as inline but ignored)', DW_INL_declared_inlined: '(declared as inline and inlined)', } _DESCR_DW_LANG = { DW_LANG_C89: '(ANSI C)', DW_LANG_C: '(non-ANSI C)', DW_LANG_Ada83: '(Ada)', DW_LANG_C_plus_plus: '(C++)', DW_LANG_Cobol74: '(Cobol 74)', DW_LANG_Cobol85: '(Cobol 85)', DW_LANG_Fortran77: '(FORTRAN 77)', DW_LANG_Fortran90: '(Fortran 90)', DW_LANG_Pascal83: '(ANSI Pascal)', DW_LANG_Modula2: '(Modula 2)', DW_LANG_Java: '(Java)', DW_LANG_C99: '(ANSI C99)', DW_LANG_Ada95: '(ADA 95)', DW_LANG_Fortran95: '(Fortran 95)', DW_LANG_PLI: '(PLI)', DW_LANG_ObjC: '(Objective C)', DW_LANG_ObjC_plus_plus: '(Objective C++)', DW_LANG_UPC: '(Unified Parallel C)', DW_LANG_D: '(D)', DW_LANG_Python: '(Python)', DW_LANG_OpenCL: '(OpenCL)', DW_LANG_Go: '(Go)', DW_LANG_Modula3: '(Modula 3)', DW_LANG_Haskell: '(Haskell)', DW_LANG_C_plus_plus_03: '(C++03)', DW_LANG_C_plus_plus_11: '(C++11)', DW_LANG_OCaml: '(OCaml)', DW_LANG_Rust: '(Rust)', DW_LANG_C11: '(C11)', DW_LANG_Swift: '(Swift)', DW_LANG_Julia: '(Julia)', DW_LANG_Dylan: '(Dylan)', DW_LANG_C_plus_plus_14: '(C++14)', DW_LANG_Fortran03: '(Fortran 03)', DW_LANG_Fortran08: '(Fortran 08)', DW_LANG_RenderScript: '(RenderScript)', DW_LANG_BLISS: '(Bliss)', # Not in binutils DW_LANG_Mips_Assembler: '(MIPS assembler)', DW_LANG_HP_Bliss: '(HP Bliss)', DW_LANG_HP_Basic91: '(HP Basic 91)', DW_LANG_HP_Pascal91: '(HP Pascal 91)', DW_LANG_HP_IMacro: '(HP IMacro)', DW_LANG_HP_Assembler: '(HP assembler)' } _DESCR_DW_ATE = { DW_ATE_void: '(void)', DW_ATE_address: '(machine address)', DW_ATE_boolean: '(boolean)', DW_ATE_complex_float: '(complex float)', DW_ATE_float: '(float)', DW_ATE_signed: '(signed)', DW_ATE_signed_char: '(signed char)', DW_ATE_unsigned: '(unsigned)', DW_ATE_unsigned_char: '(unsigned char)', DW_ATE_imaginary_float: '(imaginary float)', DW_ATE_decimal_float: '(decimal float)', DW_ATE_packed_decimal: '(packed_decimal)', DW_ATE_numeric_string: '(numeric_string)', DW_ATE_edited: '(edited)', DW_ATE_signed_fixed: '(signed_fixed)', DW_ATE_unsigned_fixed: '(unsigned_fixed)', DW_ATE_UTF: '(unicode string)', DW_ATE_HP_float80: '(HP_float80)', DW_ATE_HP_complex_float80: '(HP_complex_float80)', DW_ATE_HP_float128: '(HP_float128)', DW_ATE_HP_complex_float128: '(HP_complex_float128)', DW_ATE_HP_floathpintel: '(HP_floathpintel)', DW_ATE_HP_imaginary_float80: '(HP_imaginary_float80)', DW_ATE_HP_imaginary_float128: '(HP_imaginary_float128)', } _DESCR_DW_ACCESS = { DW_ACCESS_public: '(public)', DW_ACCESS_protected: '(protected)', DW_ACCESS_private: '(private)', } _DESCR_DW_VIS = { DW_VIS_local: '(local)', DW_VIS_exported: '(exported)', DW_VIS_qualified: '(qualified)', } _DESCR_DW_VIRTUALITY = { DW_VIRTUALITY_none: '(none)', DW_VIRTUALITY_virtual: '(virtual)', DW_VIRTUALITY_pure_virtual: '(pure virtual)', } _DESCR_DW_ID_CASE = { DW_ID_case_sensitive: '(case_sensitive)', DW_ID_up_case: '(up_case)', DW_ID_down_case: '(down_case)', DW_ID_case_insensitive: '(case_insensitive)', } _DESCR_DW_CC = { DW_CC_normal: '(normal)', DW_CC_program: '(program)', DW_CC_nocall: '(nocall)', } _DESCR_DW_ORD = { DW_ORD_row_major: '(row major)', DW_ORD_col_major: '(column major)', } _DESCR_CFI_REGISTER_RULE_TYPE = dict( UNDEFINED='u', SAME_VALUE='s', OFFSET='c', VAL_OFFSET='v', REGISTER='', EXPRESSION='exp', VAL_EXPRESSION='vexp', ARCHITECTURAL='a', ) def _make_extra_mapper(mapping, default, default_interpolate_value=False): """ Create a mapping function from attribute parameters to an extra value that should be displayed. """ def mapper(attr, die, section_offset): if default_interpolate_value: d = default % attr.value else: d = default return mapping.get(attr.value, d) return mapper def _make_extra_string(s=''): """ Create an extra function that just returns a constant string. """ def extra(attr, die, section_offset): return s return extra _DWARF_EXPR_DUMPER_CACHE = {} def _location_list_extra(attr, die, section_offset): # According to section 2.6 of the DWARF spec v3, class loclistptr means # a location list, and class block means a location expression. # DW_FORM_sec_offset is new in DWARFv4 as a section offset. if attr.form in ('DW_FORM_data4', 'DW_FORM_data8', 'DW_FORM_sec_offset'): return '(location list)' else: return describe_DWARF_expr(attr.value, die.cu.structs, die.cu.cu_offset) def _data_member_location_extra(attr, die, section_offset): # According to section 5.5.6 of the DWARF spec v4, a data member location # can be an integer offset, or a location description. # if attr.form in ('DW_FORM_data1', 'DW_FORM_data2', 'DW_FORM_data4', 'DW_FORM_data8', 'DW_FORM_sdata'): return '' # No extra description needed else: return describe_DWARF_expr(attr.value, die.cu.structs, die.cu.cu_offset) def _import_extra(attr, die, section_offset): # For DW_AT_import the value points to a DIE (that can be either in the # current DIE's CU or in another CU, depending on the FORM). The extra # information for it is the abbreviation number in this DIE and its tag. if attr.form == 'DW_FORM_ref_addr': # Absolute offset value ref_die_offset = section_offset + attr.value else: # Relative offset to the current DIE's CU ref_die_offset = attr.value + die.cu.cu_offset # Now find the CU this DIE belongs to (since we have to find its abbrev # table). This is done by linearly scanning through all CUs, looking for # one spanning an address space containing the referred DIE's offset. for cu in die.dwarfinfo.iter_CUs(): if cu['unit_length'] + cu.cu_offset > ref_die_offset >= cu.cu_offset: # Once we have the CU, we can actually parse this DIE from the # stream. with preserve_stream_pos(die.stream): ref_die = DIE(cu, die.stream, ref_die_offset) #print '&&& ref_die', ref_die return '[Abbrev Number: %s (%s)]' % ( ref_die.abbrev_code, ref_die.tag) return '[unknown]' _EXTRA_INFO_DESCRIPTION_MAP = defaultdict( lambda: _make_extra_string(''), # default_factory DW_AT_inline=_make_extra_mapper( _DESCR_DW_INL, '(Unknown inline attribute value: %x', default_interpolate_value=True), DW_AT_language=_make_extra_mapper( _DESCR_DW_LANG, '(Unknown: %x)', default_interpolate_value=True), DW_AT_encoding=_make_extra_mapper(_DESCR_DW_ATE, '(unknown type)'), DW_AT_accessibility=_make_extra_mapper( _DESCR_DW_ACCESS, '(unknown accessibility)'), DW_AT_visibility=_make_extra_mapper( _DESCR_DW_VIS, '(unknown visibility)'), DW_AT_virtuality=_make_extra_mapper( _DESCR_DW_VIRTUALITY, '(unknown virtuality)'), DW_AT_identifier_case=_make_extra_mapper( _DESCR_DW_ID_CASE, '(unknown case)'), DW_AT_calling_convention=_make_extra_mapper( _DESCR_DW_CC, '(unknown convention)'), DW_AT_ordering=_make_extra_mapper( _DESCR_DW_ORD, '(undefined)'), DW_AT_frame_base=_location_list_extra, DW_AT_location=_location_list_extra, DW_AT_string_length=_location_list_extra, DW_AT_return_addr=_location_list_extra, DW_AT_data_member_location=_data_member_location_extra, DW_AT_vtable_elem_location=_location_list_extra, DW_AT_segment=_location_list_extra, DW_AT_static_link=_location_list_extra, DW_AT_use_location=_location_list_extra, DW_AT_allocated=_location_list_extra, DW_AT_associated=_location_list_extra, DW_AT_data_location=_location_list_extra, DW_AT_stride=_location_list_extra, DW_AT_call_value=_location_list_extra, DW_AT_import=_import_extra, DW_AT_GNU_call_site_value=_location_list_extra, DW_AT_GNU_call_site_data_value=_location_list_extra, DW_AT_GNU_call_site_target=_location_list_extra, DW_AT_GNU_call_site_target_clobbered=_location_list_extra, ) # 8 in a line, for easier counting _REG_NAMES_x86 = [ 'eax', 'ecx', 'edx', 'ebx', 'esp', 'ebp', 'esi', 'edi', 'eip', 'eflags', '', 'st0', 'st1', 'st2', 'st3', 'st4', 'st5', 'st6', 'st7', '', '', 'xmm0', 'xmm1', 'xmm2', 'xmm3', 'xmm4', 'xmm5', 'xmm6', 'xmm7', 'mm0', 'mm1', 'mm2', 'mm3', 'mm4', 'mm5', 'mm6', 'mm7', 'fcw', 'fsw', 'mxcsr', 'es', 'cs', 'ss', 'ds', 'fs', 'gs', '', '', 'tr', 'ldtr' ] _REG_NAMES_x64 = [ 'rax', 'rdx', 'rcx', 'rbx', 'rsi', 'rdi', 'rbp', 'rsp', 'r8', 'r9', 'r10', 'r11', 'r12', 'r13', 'r14', 'r15', 'rip', 'xmm0', 'xmm1', 'xmm2', 'xmm3', 'xmm4', 'xmm5', 'xmm6', 'xmm7', 'xmm8', 'xmm9', 'xmm10', 'xmm11', 'xmm12', 'xmm13', 'xmm14', 'xmm15', 'st0', 'st1', 'st2', 'st3', 'st4', 'st5', 'st6', 'st7', 'mm0', 'mm1', 'mm2', 'mm3', 'mm4', 'mm5', 'mm6', 'mm7', 'rflags', 'es', 'cs', 'ss', 'ds', 'fs', 'gs', '', '', 'fs.base', 'gs.base', '', '', 'tr', 'ldtr', 'mxcsr', 'fcw', 'fsw' ] # https://developer.arm.com/documentation/ihi0057/e/?lang=en#dwarf-register-names _REG_NAMES_AArch64 = [ 'x0', 'x1', 'x2', 'x3', 'x4', 'x5', 'x6', 'x7', 'x8', 'x9', 'x10', 'x11', 'x12', 'x13', 'x14', 'x15', 'x16', 'x17', 'x18', 'x19', 'x20', 'x21', 'x22', 'x23', 'x24', 'x25', 'x26', 'x27', 'x28', 'x29', 'x30', 'sp', '', 'ELR_mode', 'RA_SIGN_STATE', '', '', '', '', '', '', '', '', '', '', '', 'VG', 'FFR', 'p0', 'p1', 'p2', 'p3', 'p4', 'p5', 'p6', 'p7', 'p8', 'p9', 'p10', 'p11', 'p12', 'p13', 'p14', 'p15', 'v0', 'v1', 'v2', 'v3', 'v4', 'v5', 'v6', 'v7', 'v8', 'v9', 'v10', 'v11', 'v12', 'v13', 'v14', 'v15', 'v16', 'v17', 'v18', 'v19', 'v20', 'v21', 'v22', 'v23', 'v24', 'v25', 'v26', 'v27', 'v28', 'v29', 'v30', 'v31', 'z0', 'z1', 'z2', 'z3', 'z4', 'z5', 'z6', 'z7', 'z8', 'z9', 'z10', 'z11', 'z12', 'z13', 'z14', 'z15', 'z16', 'z17', 'z18', 'z19', 'z20', 'z21', 'z22', 'z23', 'z24', 'z25', 'z26', 'z27', 'z28', 'z29', 'z30', 'z31' ] class ExprDumper(object): """ A dumper for DWARF expressions that dumps a textual representation of the complete expression. Usage: after creation, call dump_expr repeatedly - it's stateless. """ def __init__(self, structs): self.structs = structs self.expr_parser = DWARFExprParser(self.structs) self._init_lookups() def dump_expr(self, expr, cu_offset=None): """ Parse and dump a DWARF expression. expr should be a list of (integer) byte values. cu_offset is the cu_offset value from the CU object where the expression resides. Only affects a handful of GNU opcodes, if None is provided, that's not a crash condition, only the expression dump will not be consistent of that of readelf. Returns a string representing the expression. """ parsed = self.expr_parser.parse_expr(expr) s = [] for deo in parsed: s.append(self._dump_to_string(deo.op, deo.op_name, deo.args, cu_offset)) return '; '.join(s) def _init_lookups(self): self._ops_with_decimal_arg = set([ 'DW_OP_const1u', 'DW_OP_const1s', 'DW_OP_const2u', 'DW_OP_const2s', 'DW_OP_const4u', 'DW_OP_const4s', 'DW_OP_const8u', 'DW_OP_const8s', 'DW_OP_constu', 'DW_OP_consts', 'DW_OP_pick', 'DW_OP_plus_uconst', 'DW_OP_bra', 'DW_OP_skip', 'DW_OP_fbreg', 'DW_OP_piece', 'DW_OP_deref_size', 'DW_OP_xderef_size', 'DW_OP_regx',]) for n in range(0, 32): self._ops_with_decimal_arg.add('DW_OP_breg%s' % n) self._ops_with_two_decimal_args = set(['DW_OP_bregx', 'DW_OP_bit_piece']) self._ops_with_hex_arg = set( ['DW_OP_addr', 'DW_OP_call2', 'DW_OP_call4', 'DW_OP_call_ref']) def _dump_to_string(self, opcode, opcode_name, args, cu_offset=None): # Some GNU ops contain an offset from the current CU as an argument, # but readelf emits those ops with offset from the info section # so we need the base offset of the parent CU. # If omitted, arguments on some GNU opcodes will be off. if cu_offset is None: cu_offset = 0 if len(args) == 0: if opcode_name.startswith('DW_OP_reg'): regnum = int(opcode_name[9:]) return '%s (%s)' % ( opcode_name, describe_reg_name(regnum, _MACHINE_ARCH)) else: return opcode_name elif opcode_name in self._ops_with_decimal_arg: if opcode_name.startswith('DW_OP_breg'): regnum = int(opcode_name[10:]) return '%s (%s): %s' % ( opcode_name, describe_reg_name(regnum, _MACHINE_ARCH), args[0]) elif opcode_name.endswith('regx'): # applies to both regx and bregx return '%s: %s (%s)' % ( opcode_name, args[0], describe_reg_name(args[0], _MACHINE_ARCH)) else: return '%s: %s' % (opcode_name, args[0]) elif opcode_name in self._ops_with_hex_arg: return '%s: %x' % (opcode_name, args[0]) elif opcode_name in self._ops_with_two_decimal_args: return '%s: %s %s' % (opcode_name, args[0], args[1]) elif opcode_name in ('DW_OP_GNU_entry_value', 'DW_OP_entry_value'): return '%s: (%s)' % (opcode_name, ','.join([self._dump_to_string(deo.op, deo.op_name, deo.args, cu_offset) for deo in args[0]])) elif opcode_name == 'DW_OP_implicit_value': return "%s %s byte block: %s" % (opcode_name, len(args[0]), ''.join(["%x " % b for b in args[0]])) elif opcode_name == 'DW_OP_GNU_parameter_ref': return "%s: <0x%x>" % (opcode_name, args[0] + cu_offset) elif opcode_name in ('DW_OP_GNU_implicit_pointer', 'DW_OP_implicit_pointer'): return "%s: <0x%x> %d" % (opcode_name, args[0], args[1]) elif opcode_name in ('DW_OP_GNU_convert', 'DW_OP_convert'): return "%s <0x%x>" % (opcode_name, args[0] + cu_offset) elif opcode_name in ('DW_OP_GNU_deref_type', 'DW_OP_deref_type'): return "%s: %d <0x%x>" % (opcode_name, args[0], args[1] + cu_offset) elif opcode_name in ('DW_OP_GNU_const_type', 'DW_OP_const_type'): return "%s: <0x%x> %d byte block: %s " % (opcode_name, args[0] + cu_offset, len(args[1]), ' '.join("%x" % b for b in args[1])) elif opcode_name in ('DW_OP_GNU_regval_type', 'DW_OP_regval_type'): return "%s: %d (%s) <0x%x>" % (opcode_name, args[0], describe_reg_name(args[0], _MACHINE_ARCH), args[1] + cu_offset) else: return '' % opcode_name