677 lines
26 KiB
Python
677 lines
26 KiB
Python
#-------------------------------------------------------------------------------
|
|
# elftools: dwarf/descriptions.py
|
|
#
|
|
# Textual descriptions of the various values and enums of DWARF
|
|
#
|
|
# Eli Bendersky (eliben@gmail.com)
|
|
# This code is in the public domain
|
|
#-------------------------------------------------------------------------------
|
|
from collections import defaultdict
|
|
|
|
from .constants import *
|
|
from .dwarf_expr import DWARFExprParser
|
|
from .die import DIE
|
|
from ..common.utils import preserve_stream_pos, dwarf_assert, bytes2str
|
|
from .callframe import instruction_name, CIE, FDE
|
|
|
|
|
|
def set_global_machine_arch(machine_arch):
|
|
global _MACHINE_ARCH
|
|
_MACHINE_ARCH = machine_arch
|
|
|
|
|
|
def describe_attr_value(attr, die, section_offset):
|
|
""" Given an attribute attr, return the textual representation of its
|
|
value, suitable for tools like readelf.
|
|
|
|
To cover all cases, this function needs some extra arguments:
|
|
|
|
die: the DIE this attribute was extracted from
|
|
section_offset: offset in the stream of the section the DIE belongs to
|
|
"""
|
|
descr_func = _ATTR_DESCRIPTION_MAP[attr.form]
|
|
val_description = descr_func(attr, die, section_offset)
|
|
|
|
# For some attributes we can display further information
|
|
extra_info_func = _EXTRA_INFO_DESCRIPTION_MAP[attr.name]
|
|
extra_info = extra_info_func(attr, die, section_offset)
|
|
return str(val_description) + '\t' + extra_info
|
|
|
|
|
|
def describe_CFI_instructions(entry):
|
|
""" Given a CFI entry (CIE or FDE), return the textual description of its
|
|
instructions.
|
|
"""
|
|
def _assert_FDE_instruction(instr):
|
|
dwarf_assert(
|
|
isinstance(entry, FDE),
|
|
'Unexpected instruction "%s" for a CIE' % instr)
|
|
|
|
def _full_reg_name(regnum):
|
|
regname = describe_reg_name(regnum, _MACHINE_ARCH, False)
|
|
if regname:
|
|
return 'r%s (%s)' % (regnum, regname)
|
|
else:
|
|
return 'r%s' % regnum
|
|
|
|
if isinstance(entry, CIE):
|
|
cie = entry
|
|
else: # FDE
|
|
cie = entry.cie
|
|
pc = entry['initial_location']
|
|
|
|
s = ''
|
|
for instr in entry.instructions:
|
|
name = instruction_name(instr.opcode)
|
|
|
|
if name in ('DW_CFA_offset',
|
|
'DW_CFA_offset_extended', 'DW_CFA_offset_extended_sf',
|
|
'DW_CFA_val_offset', 'DW_CFA_val_offset_sf'):
|
|
s += ' %s: %s at cfa%+d\n' % (
|
|
name, _full_reg_name(instr.args[0]),
|
|
instr.args[1] * cie['data_alignment_factor'])
|
|
elif name in ( 'DW_CFA_restore', 'DW_CFA_restore_extended',
|
|
'DW_CFA_undefined', 'DW_CFA_same_value',
|
|
'DW_CFA_def_cfa_register'):
|
|
s += ' %s: %s\n' % (name, _full_reg_name(instr.args[0]))
|
|
elif name == 'DW_CFA_register':
|
|
s += ' %s: %s in %s' % (
|
|
name, _full_reg_name(instr.args[0]),
|
|
_full_reg_name(instr.args[1]))
|
|
elif name == 'DW_CFA_set_loc':
|
|
pc = instr.args[0]
|
|
s += ' %s: %08x\n' % (name, pc)
|
|
elif name in ( 'DW_CFA_advance_loc1', 'DW_CFA_advance_loc2',
|
|
'DW_CFA_advance_loc4', 'DW_CFA_advance_loc'):
|
|
_assert_FDE_instruction(instr)
|
|
factored_offset = instr.args[0] * cie['code_alignment_factor']
|
|
s += ' %s: %s to %08x\n' % (
|
|
name, factored_offset, factored_offset + pc)
|
|
pc += factored_offset
|
|
elif name in ( 'DW_CFA_remember_state', 'DW_CFA_restore_state',
|
|
'DW_CFA_nop'):
|
|
s += ' %s\n' % name
|
|
elif name == 'DW_CFA_def_cfa':
|
|
s += ' %s: %s ofs %s\n' % (
|
|
name, _full_reg_name(instr.args[0]), instr.args[1])
|
|
elif name == 'DW_CFA_def_cfa_sf':
|
|
s += ' %s: %s ofs %s\n' % (
|
|
name, _full_reg_name(instr.args[0]),
|
|
instr.args[1] * cie['data_alignment_factor'])
|
|
elif name in ('DW_CFA_def_cfa_offset', 'DW_CFA_GNU_args_size'):
|
|
s += ' %s: %s\n' % (name, instr.args[0])
|
|
elif name == 'DW_CFA_def_cfa_expression':
|
|
expr_dumper = ExprDumper(entry.structs)
|
|
# readelf output is missing a colon for DW_CFA_def_cfa_expression
|
|
s += ' %s (%s)\n' % (name, expr_dumper.dump_expr(instr.args[0]))
|
|
elif name == 'DW_CFA_expression':
|
|
expr_dumper = ExprDumper(entry.structs)
|
|
s += ' %s: %s (%s)\n' % (
|
|
name, _full_reg_name(instr.args[0]),
|
|
expr_dumper.dump_expr(instr.args[1]))
|
|
else:
|
|
s += ' %s: <??>\n' % name
|
|
|
|
return s
|
|
|
|
|
|
def describe_CFI_register_rule(rule):
|
|
s = _DESCR_CFI_REGISTER_RULE_TYPE[rule.type]
|
|
if rule.type in ('OFFSET', 'VAL_OFFSET'):
|
|
s += '%+d' % rule.arg
|
|
elif rule.type == 'REGISTER':
|
|
s += describe_reg_name(rule.arg)
|
|
return s
|
|
|
|
|
|
def describe_CFI_CFA_rule(rule):
|
|
if rule.expr:
|
|
return 'exp'
|
|
else:
|
|
return '%s%+d' % (describe_reg_name(rule.reg), rule.offset)
|
|
|
|
|
|
def describe_DWARF_expr(expr, structs, cu_offset=None):
|
|
""" Textual description of a DWARF expression encoded in 'expr'.
|
|
structs should come from the entity encompassing the expression - it's
|
|
needed to be able to parse it correctly.
|
|
"""
|
|
# Since this function can be called a lot, initializing a fresh new
|
|
# ExprDumper per call is expensive. So a rudimentary caching scheme is in
|
|
# place to create only one such dumper per instance of structs.
|
|
cache_key = id(structs)
|
|
if cache_key not in _DWARF_EXPR_DUMPER_CACHE:
|
|
_DWARF_EXPR_DUMPER_CACHE[cache_key] = \
|
|
ExprDumper(structs)
|
|
dwarf_expr_dumper = _DWARF_EXPR_DUMPER_CACHE[cache_key]
|
|
return '(' + dwarf_expr_dumper.dump_expr(expr, cu_offset) + ')'
|
|
|
|
|
|
def describe_reg_name(regnum, machine_arch=None, default=True):
|
|
""" Provide a textual description for a register name, given its serial
|
|
number. The number is expected to be valid.
|
|
"""
|
|
if machine_arch is None:
|
|
machine_arch = _MACHINE_ARCH
|
|
|
|
if machine_arch == 'x86':
|
|
return _REG_NAMES_x86[regnum]
|
|
elif machine_arch == 'x64':
|
|
return _REG_NAMES_x64[regnum]
|
|
elif machine_arch == 'AArch64':
|
|
return _REG_NAMES_AArch64[regnum]
|
|
elif default:
|
|
return 'r%s' % regnum
|
|
else:
|
|
return None
|
|
|
|
def describe_form_class(form):
|
|
"""For a given form name, determine its value class.
|
|
|
|
For example, given 'DW_FORM_data1' returns 'constant'.
|
|
|
|
For some forms, like DW_FORM_indirect and DW_FORM_sec_offset, the class is
|
|
not hard-coded and extra information is required. For these, None is
|
|
returned.
|
|
"""
|
|
return _FORM_CLASS[form]
|
|
|
|
|
|
#-------------------------------------------------------------------------------
|
|
|
|
# The machine architecture. Set globally via set_global_machine_arch
|
|
#
|
|
_MACHINE_ARCH = None
|
|
|
|
# Implements the alternative format of readelf: lowercase hex, prefixed with 0x unless 0
|
|
def _format_hex(n):
|
|
return '0x%x' % n if n != 0 else '0'
|
|
|
|
def _describe_attr_ref(attr, die, section_offset):
|
|
return '<%s>' % _format_hex(attr.value + die.cu.cu_offset)
|
|
|
|
def _describe_attr_ref_sig8(attr, die, section_offset):
|
|
return 'signature: %s' % _format_hex(attr.value)
|
|
|
|
def _describe_attr_value_passthrough(attr, die, section_offset):
|
|
return attr.value
|
|
|
|
def _describe_attr_hex(attr, die, section_offset):
|
|
return '%s' % _format_hex(attr.value)
|
|
|
|
def _describe_attr_hex_addr(attr, die, section_offset):
|
|
return '<%s>' % _format_hex(attr.value)
|
|
|
|
def _describe_attr_split_64bit(attr, die, section_offset):
|
|
low_word = attr.value & 0xFFFFFFFF
|
|
high_word = (attr.value >> 32) & 0xFFFFFFFF
|
|
return '%s %s' % (_format_hex(low_word), _format_hex(high_word))
|
|
|
|
def _describe_attr_strp(attr, die, section_offset):
|
|
return '(indirect string, offset: %s): %s' % (
|
|
_format_hex(attr.raw_value), bytes2str(attr.value))
|
|
|
|
def _describe_attr_line_strp(attr, die, section_offset):
|
|
return '(indirect line string, offset: %s): %s' % (
|
|
_format_hex(attr.raw_value), bytes2str(attr.value))
|
|
|
|
def _describe_attr_string(attr, die, section_offset):
|
|
return bytes2str(attr.value)
|
|
|
|
def _describe_attr_debool(attr, die, section_offset):
|
|
""" To be consistent with readelf, generate 1 for True flags, 0 for False
|
|
flags.
|
|
"""
|
|
return '1' if attr.value else '0'
|
|
|
|
def _describe_attr_present(attr, die, section_offset):
|
|
""" Some forms may simply mean that an attribute is present,
|
|
without providing any value.
|
|
"""
|
|
return '1'
|
|
|
|
def _describe_attr_block(attr, die, section_offset):
|
|
s = '%s byte block: ' % len(attr.value)
|
|
s += ' '.join('%x' % item for item in attr.value) + ' '
|
|
return s
|
|
|
|
|
|
_ATTR_DESCRIPTION_MAP = defaultdict(
|
|
lambda: _describe_attr_value_passthrough, # default_factory
|
|
|
|
DW_FORM_ref1=_describe_attr_ref,
|
|
DW_FORM_ref2=_describe_attr_ref,
|
|
DW_FORM_ref4=_describe_attr_ref,
|
|
DW_FORM_ref8=_describe_attr_split_64bit,
|
|
DW_FORM_ref_udata=_describe_attr_ref,
|
|
DW_FORM_ref_addr=_describe_attr_hex_addr,
|
|
DW_FORM_data4=_describe_attr_hex,
|
|
DW_FORM_data8=_describe_attr_hex,
|
|
DW_FORM_addr=_describe_attr_hex,
|
|
DW_FORM_sec_offset=_describe_attr_hex,
|
|
DW_FORM_flag=_describe_attr_debool,
|
|
DW_FORM_data1=_describe_attr_value_passthrough,
|
|
DW_FORM_data2=_describe_attr_value_passthrough,
|
|
DW_FORM_sdata=_describe_attr_value_passthrough,
|
|
DW_FORM_udata=_describe_attr_value_passthrough,
|
|
DW_FORM_string=_describe_attr_string,
|
|
DW_FORM_strp=_describe_attr_strp,
|
|
DW_FORM_line_strp=_describe_attr_line_strp,
|
|
DW_FORM_block1=_describe_attr_block,
|
|
DW_FORM_block2=_describe_attr_block,
|
|
DW_FORM_block4=_describe_attr_block,
|
|
DW_FORM_block=_describe_attr_block,
|
|
DW_FORM_flag_present=_describe_attr_present,
|
|
DW_FORM_exprloc=_describe_attr_block,
|
|
DW_FORM_ref_sig8=_describe_attr_ref_sig8,
|
|
)
|
|
|
|
_FORM_CLASS = dict(
|
|
DW_FORM_addr='address',
|
|
DW_FORM_block2='block',
|
|
DW_FORM_block4='block',
|
|
DW_FORM_data2='constant',
|
|
DW_FORM_data4='constant',
|
|
DW_FORM_data8='constant',
|
|
DW_FORM_string='string',
|
|
DW_FORM_block='block',
|
|
DW_FORM_block1='block',
|
|
DW_FORM_data1='constant',
|
|
DW_FORM_flag='flag',
|
|
DW_FORM_sdata='constant',
|
|
DW_FORM_strp='string',
|
|
DW_FORM_udata='constant',
|
|
DW_FORM_ref_addr='reference',
|
|
DW_FORM_ref1='reference',
|
|
DW_FORM_ref2='reference',
|
|
DW_FORM_ref4='reference',
|
|
DW_FORM_ref8='reference',
|
|
DW_FORM_ref_udata='reference',
|
|
DW_FORM_indirect=None,
|
|
DW_FORM_sec_offset=None,
|
|
DW_FORM_exprloc='exprloc',
|
|
DW_FORM_flag_present='flag',
|
|
DW_FORM_ref_sig8='reference',
|
|
)
|
|
|
|
_DESCR_DW_INL = {
|
|
DW_INL_not_inlined: '(not inlined)',
|
|
DW_INL_inlined: '(inlined)',
|
|
DW_INL_declared_not_inlined: '(declared as inline but ignored)',
|
|
DW_INL_declared_inlined: '(declared as inline and inlined)',
|
|
}
|
|
|
|
_DESCR_DW_LANG = {
|
|
DW_LANG_C89: '(ANSI C)',
|
|
DW_LANG_C: '(non-ANSI C)',
|
|
DW_LANG_Ada83: '(Ada)',
|
|
DW_LANG_C_plus_plus: '(C++)',
|
|
DW_LANG_Cobol74: '(Cobol 74)',
|
|
DW_LANG_Cobol85: '(Cobol 85)',
|
|
DW_LANG_Fortran77: '(FORTRAN 77)',
|
|
DW_LANG_Fortran90: '(Fortran 90)',
|
|
DW_LANG_Pascal83: '(ANSI Pascal)',
|
|
DW_LANG_Modula2: '(Modula 2)',
|
|
DW_LANG_Java: '(Java)',
|
|
DW_LANG_C99: '(ANSI C99)',
|
|
DW_LANG_Ada95: '(ADA 95)',
|
|
DW_LANG_Fortran95: '(Fortran 95)',
|
|
DW_LANG_PLI: '(PLI)',
|
|
DW_LANG_ObjC: '(Objective C)',
|
|
DW_LANG_ObjC_plus_plus: '(Objective C++)',
|
|
DW_LANG_UPC: '(Unified Parallel C)',
|
|
DW_LANG_D: '(D)',
|
|
DW_LANG_Python: '(Python)',
|
|
DW_LANG_OpenCL: '(OpenCL)',
|
|
DW_LANG_Go: '(Go)',
|
|
DW_LANG_Modula3: '(Modula 3)',
|
|
DW_LANG_Haskell: '(Haskell)',
|
|
DW_LANG_C_plus_plus_03: '(C++03)',
|
|
DW_LANG_C_plus_plus_11: '(C++11)',
|
|
DW_LANG_OCaml: '(OCaml)',
|
|
DW_LANG_Rust: '(Rust)',
|
|
DW_LANG_C11: '(C11)',
|
|
DW_LANG_Swift: '(Swift)',
|
|
DW_LANG_Julia: '(Julia)',
|
|
DW_LANG_Dylan: '(Dylan)',
|
|
DW_LANG_C_plus_plus_14: '(C++14)',
|
|
DW_LANG_Fortran03: '(Fortran 03)',
|
|
DW_LANG_Fortran08: '(Fortran 08)',
|
|
DW_LANG_RenderScript: '(RenderScript)',
|
|
DW_LANG_BLISS: '(Bliss)', # Not in binutils
|
|
DW_LANG_Mips_Assembler: '(MIPS assembler)',
|
|
DW_LANG_HP_Bliss: '(HP Bliss)',
|
|
DW_LANG_HP_Basic91: '(HP Basic 91)',
|
|
DW_LANG_HP_Pascal91: '(HP Pascal 91)',
|
|
DW_LANG_HP_IMacro: '(HP IMacro)',
|
|
DW_LANG_HP_Assembler: '(HP assembler)'
|
|
}
|
|
|
|
_DESCR_DW_ATE = {
|
|
DW_ATE_void: '(void)',
|
|
DW_ATE_address: '(machine address)',
|
|
DW_ATE_boolean: '(boolean)',
|
|
DW_ATE_complex_float: '(complex float)',
|
|
DW_ATE_float: '(float)',
|
|
DW_ATE_signed: '(signed)',
|
|
DW_ATE_signed_char: '(signed char)',
|
|
DW_ATE_unsigned: '(unsigned)',
|
|
DW_ATE_unsigned_char: '(unsigned char)',
|
|
DW_ATE_imaginary_float: '(imaginary float)',
|
|
DW_ATE_decimal_float: '(decimal float)',
|
|
DW_ATE_packed_decimal: '(packed_decimal)',
|
|
DW_ATE_numeric_string: '(numeric_string)',
|
|
DW_ATE_edited: '(edited)',
|
|
DW_ATE_signed_fixed: '(signed_fixed)',
|
|
DW_ATE_unsigned_fixed: '(unsigned_fixed)',
|
|
DW_ATE_UTF: '(unicode string)',
|
|
DW_ATE_HP_float80: '(HP_float80)',
|
|
DW_ATE_HP_complex_float80: '(HP_complex_float80)',
|
|
DW_ATE_HP_float128: '(HP_float128)',
|
|
DW_ATE_HP_complex_float128: '(HP_complex_float128)',
|
|
DW_ATE_HP_floathpintel: '(HP_floathpintel)',
|
|
DW_ATE_HP_imaginary_float80: '(HP_imaginary_float80)',
|
|
DW_ATE_HP_imaginary_float128: '(HP_imaginary_float128)',
|
|
}
|
|
|
|
_DESCR_DW_ACCESS = {
|
|
DW_ACCESS_public: '(public)',
|
|
DW_ACCESS_protected: '(protected)',
|
|
DW_ACCESS_private: '(private)',
|
|
}
|
|
|
|
_DESCR_DW_VIS = {
|
|
DW_VIS_local: '(local)',
|
|
DW_VIS_exported: '(exported)',
|
|
DW_VIS_qualified: '(qualified)',
|
|
}
|
|
|
|
_DESCR_DW_VIRTUALITY = {
|
|
DW_VIRTUALITY_none: '(none)',
|
|
DW_VIRTUALITY_virtual: '(virtual)',
|
|
DW_VIRTUALITY_pure_virtual: '(pure virtual)',
|
|
}
|
|
|
|
_DESCR_DW_ID_CASE = {
|
|
DW_ID_case_sensitive: '(case_sensitive)',
|
|
DW_ID_up_case: '(up_case)',
|
|
DW_ID_down_case: '(down_case)',
|
|
DW_ID_case_insensitive: '(case_insensitive)',
|
|
}
|
|
|
|
_DESCR_DW_CC = {
|
|
DW_CC_normal: '(normal)',
|
|
DW_CC_program: '(program)',
|
|
DW_CC_nocall: '(nocall)',
|
|
}
|
|
|
|
_DESCR_DW_ORD = {
|
|
DW_ORD_row_major: '(row major)',
|
|
DW_ORD_col_major: '(column major)',
|
|
}
|
|
|
|
_DESCR_CFI_REGISTER_RULE_TYPE = dict(
|
|
UNDEFINED='u',
|
|
SAME_VALUE='s',
|
|
OFFSET='c',
|
|
VAL_OFFSET='v',
|
|
REGISTER='',
|
|
EXPRESSION='exp',
|
|
VAL_EXPRESSION='vexp',
|
|
ARCHITECTURAL='a',
|
|
)
|
|
|
|
def _make_extra_mapper(mapping, default, default_interpolate_value=False):
|
|
""" Create a mapping function from attribute parameters to an extra
|
|
value that should be displayed.
|
|
"""
|
|
def mapper(attr, die, section_offset):
|
|
if default_interpolate_value:
|
|
d = default % attr.value
|
|
else:
|
|
d = default
|
|
return mapping.get(attr.value, d)
|
|
return mapper
|
|
|
|
|
|
def _make_extra_string(s=''):
|
|
""" Create an extra function that just returns a constant string.
|
|
"""
|
|
def extra(attr, die, section_offset):
|
|
return s
|
|
return extra
|
|
|
|
|
|
_DWARF_EXPR_DUMPER_CACHE = {}
|
|
|
|
def _location_list_extra(attr, die, section_offset):
|
|
# According to section 2.6 of the DWARF spec v3, class loclistptr means
|
|
# a location list, and class block means a location expression.
|
|
# DW_FORM_sec_offset is new in DWARFv4 as a section offset.
|
|
if attr.form in ('DW_FORM_data4', 'DW_FORM_data8', 'DW_FORM_sec_offset'):
|
|
return '(location list)'
|
|
else:
|
|
return describe_DWARF_expr(attr.value, die.cu.structs, die.cu.cu_offset)
|
|
|
|
|
|
def _data_member_location_extra(attr, die, section_offset):
|
|
# According to section 5.5.6 of the DWARF spec v4, a data member location
|
|
# can be an integer offset, or a location description.
|
|
#
|
|
if attr.form in ('DW_FORM_data1', 'DW_FORM_data2',
|
|
'DW_FORM_data4', 'DW_FORM_data8',
|
|
'DW_FORM_sdata'):
|
|
return '' # No extra description needed
|
|
else:
|
|
return describe_DWARF_expr(attr.value, die.cu.structs, die.cu.cu_offset)
|
|
|
|
|
|
def _import_extra(attr, die, section_offset):
|
|
# For DW_AT_import the value points to a DIE (that can be either in the
|
|
# current DIE's CU or in another CU, depending on the FORM). The extra
|
|
# information for it is the abbreviation number in this DIE and its tag.
|
|
if attr.form == 'DW_FORM_ref_addr':
|
|
# Absolute offset value
|
|
ref_die_offset = section_offset + attr.value
|
|
else:
|
|
# Relative offset to the current DIE's CU
|
|
ref_die_offset = attr.value + die.cu.cu_offset
|
|
|
|
# Now find the CU this DIE belongs to (since we have to find its abbrev
|
|
# table). This is done by linearly scanning through all CUs, looking for
|
|
# one spanning an address space containing the referred DIE's offset.
|
|
for cu in die.dwarfinfo.iter_CUs():
|
|
if cu['unit_length'] + cu.cu_offset > ref_die_offset >= cu.cu_offset:
|
|
# Once we have the CU, we can actually parse this DIE from the
|
|
# stream.
|
|
with preserve_stream_pos(die.stream):
|
|
ref_die = DIE(cu, die.stream, ref_die_offset)
|
|
#print '&&& ref_die', ref_die
|
|
return '[Abbrev Number: %s (%s)]' % (
|
|
ref_die.abbrev_code, ref_die.tag)
|
|
|
|
return '[unknown]'
|
|
|
|
|
|
_EXTRA_INFO_DESCRIPTION_MAP = defaultdict(
|
|
lambda: _make_extra_string(''), # default_factory
|
|
|
|
DW_AT_inline=_make_extra_mapper(
|
|
_DESCR_DW_INL, '(Unknown inline attribute value: %x',
|
|
default_interpolate_value=True),
|
|
DW_AT_language=_make_extra_mapper(
|
|
_DESCR_DW_LANG, '(Unknown: %x)', default_interpolate_value=True),
|
|
DW_AT_encoding=_make_extra_mapper(_DESCR_DW_ATE, '(unknown type)'),
|
|
DW_AT_accessibility=_make_extra_mapper(
|
|
_DESCR_DW_ACCESS, '(unknown accessibility)'),
|
|
DW_AT_visibility=_make_extra_mapper(
|
|
_DESCR_DW_VIS, '(unknown visibility)'),
|
|
DW_AT_virtuality=_make_extra_mapper(
|
|
_DESCR_DW_VIRTUALITY, '(unknown virtuality)'),
|
|
DW_AT_identifier_case=_make_extra_mapper(
|
|
_DESCR_DW_ID_CASE, '(unknown case)'),
|
|
DW_AT_calling_convention=_make_extra_mapper(
|
|
_DESCR_DW_CC, '(unknown convention)'),
|
|
DW_AT_ordering=_make_extra_mapper(
|
|
_DESCR_DW_ORD, '(undefined)'),
|
|
DW_AT_frame_base=_location_list_extra,
|
|
DW_AT_location=_location_list_extra,
|
|
DW_AT_string_length=_location_list_extra,
|
|
DW_AT_return_addr=_location_list_extra,
|
|
DW_AT_data_member_location=_data_member_location_extra,
|
|
DW_AT_vtable_elem_location=_location_list_extra,
|
|
DW_AT_segment=_location_list_extra,
|
|
DW_AT_static_link=_location_list_extra,
|
|
DW_AT_use_location=_location_list_extra,
|
|
DW_AT_allocated=_location_list_extra,
|
|
DW_AT_associated=_location_list_extra,
|
|
DW_AT_data_location=_location_list_extra,
|
|
DW_AT_stride=_location_list_extra,
|
|
DW_AT_call_value=_location_list_extra,
|
|
DW_AT_import=_import_extra,
|
|
DW_AT_GNU_call_site_value=_location_list_extra,
|
|
DW_AT_GNU_call_site_data_value=_location_list_extra,
|
|
DW_AT_GNU_call_site_target=_location_list_extra,
|
|
DW_AT_GNU_call_site_target_clobbered=_location_list_extra,
|
|
)
|
|
|
|
# 8 in a line, for easier counting
|
|
_REG_NAMES_x86 = [
|
|
'eax', 'ecx', 'edx', 'ebx', 'esp', 'ebp', 'esi', 'edi',
|
|
'eip', 'eflags', '<none>', 'st0', 'st1', 'st2', 'st3', 'st4',
|
|
'st5', 'st6', 'st7', '<none>', '<none>', 'xmm0', 'xmm1', 'xmm2',
|
|
'xmm3', 'xmm4', 'xmm5', 'xmm6', 'xmm7', 'mm0', 'mm1', 'mm2',
|
|
'mm3', 'mm4', 'mm5', 'mm6', 'mm7', 'fcw', 'fsw', 'mxcsr',
|
|
'es', 'cs', 'ss', 'ds', 'fs', 'gs', '<none>', '<none>', 'tr', 'ldtr'
|
|
]
|
|
|
|
_REG_NAMES_x64 = [
|
|
'rax', 'rdx', 'rcx', 'rbx', 'rsi', 'rdi', 'rbp', 'rsp',
|
|
'r8', 'r9', 'r10', 'r11', 'r12', 'r13', 'r14', 'r15',
|
|
'rip', 'xmm0', 'xmm1', 'xmm2', 'xmm3', 'xmm4', 'xmm5', 'xmm6',
|
|
'xmm7', 'xmm8', 'xmm9', 'xmm10', 'xmm11', 'xmm12', 'xmm13', 'xmm14',
|
|
'xmm15', 'st0', 'st1', 'st2', 'st3', 'st4', 'st5', 'st6',
|
|
'st7', 'mm0', 'mm1', 'mm2', 'mm3', 'mm4', 'mm5', 'mm6',
|
|
'mm7', 'rflags', 'es', 'cs', 'ss', 'ds', 'fs', 'gs',
|
|
'<none>', '<none>', 'fs.base', 'gs.base', '<none>', '<none>', 'tr', 'ldtr',
|
|
'mxcsr', 'fcw', 'fsw'
|
|
]
|
|
|
|
# https://developer.arm.com/documentation/ihi0057/e/?lang=en#dwarf-register-names
|
|
_REG_NAMES_AArch64 = [
|
|
'x0', 'x1', 'x2', 'x3', 'x4', 'x5', 'x6', 'x7',
|
|
'x8', 'x9', 'x10', 'x11', 'x12', 'x13', 'x14', 'x15',
|
|
'x16', 'x17', 'x18', 'x19', 'x20', 'x21', 'x22', 'x23',
|
|
'x24', 'x25', 'x26', 'x27', 'x28', 'x29', 'x30', 'sp',
|
|
'<none>', 'ELR_mode', 'RA_SIGN_STATE', '<none>', '<none>', '<none>', '<none>', '<none>',
|
|
'<none>', '<none>', '<none>', '<none>', '<none>', '<none>', 'VG', 'FFR',
|
|
'p0', 'p1', 'p2', 'p3', 'p4', 'p5', 'p6', 'p7',
|
|
'p8', 'p9', 'p10', 'p11', 'p12', 'p13', 'p14', 'p15',
|
|
'v0', 'v1', 'v2', 'v3', 'v4', 'v5', 'v6', 'v7',
|
|
'v8', 'v9', 'v10', 'v11', 'v12', 'v13', 'v14', 'v15',
|
|
'v16', 'v17', 'v18', 'v19', 'v20', 'v21', 'v22', 'v23',
|
|
'v24', 'v25', 'v26', 'v27', 'v28', 'v29', 'v30', 'v31',
|
|
'z0', 'z1', 'z2', 'z3', 'z4', 'z5', 'z6', 'z7',
|
|
'z8', 'z9', 'z10', 'z11', 'z12', 'z13', 'z14', 'z15',
|
|
'z16', 'z17', 'z18', 'z19', 'z20', 'z21', 'z22', 'z23',
|
|
'z24', 'z25', 'z26', 'z27', 'z28', 'z29', 'z30', 'z31'
|
|
]
|
|
|
|
|
|
class ExprDumper(object):
|
|
""" A dumper for DWARF expressions that dumps a textual
|
|
representation of the complete expression.
|
|
|
|
Usage: after creation, call dump_expr repeatedly - it's stateless.
|
|
"""
|
|
def __init__(self, structs):
|
|
self.structs = structs
|
|
self.expr_parser = DWARFExprParser(self.structs)
|
|
self._init_lookups()
|
|
|
|
def dump_expr(self, expr, cu_offset=None):
|
|
""" Parse and dump a DWARF expression. expr should be a list of
|
|
(integer) byte values. cu_offset is the cu_offset
|
|
value from the CU object where the expression resides.
|
|
Only affects a handful of GNU opcodes, if None is provided,
|
|
that's not a crash condition, only the expression dump will
|
|
not be consistent of that of readelf.
|
|
|
|
Returns a string representing the expression.
|
|
"""
|
|
parsed = self.expr_parser.parse_expr(expr)
|
|
s = []
|
|
for deo in parsed:
|
|
s.append(self._dump_to_string(deo.op, deo.op_name, deo.args, cu_offset))
|
|
return '; '.join(s)
|
|
|
|
def _init_lookups(self):
|
|
self._ops_with_decimal_arg = set([
|
|
'DW_OP_const1u', 'DW_OP_const1s', 'DW_OP_const2u', 'DW_OP_const2s',
|
|
'DW_OP_const4u', 'DW_OP_const4s', 'DW_OP_const8u', 'DW_OP_const8s',
|
|
'DW_OP_constu', 'DW_OP_consts', 'DW_OP_pick', 'DW_OP_plus_uconst',
|
|
'DW_OP_bra', 'DW_OP_skip', 'DW_OP_fbreg', 'DW_OP_piece',
|
|
'DW_OP_deref_size', 'DW_OP_xderef_size', 'DW_OP_regx',])
|
|
|
|
for n in range(0, 32):
|
|
self._ops_with_decimal_arg.add('DW_OP_breg%s' % n)
|
|
|
|
self._ops_with_two_decimal_args = set(['DW_OP_bregx', 'DW_OP_bit_piece'])
|
|
|
|
self._ops_with_hex_arg = set(
|
|
['DW_OP_addr', 'DW_OP_call2', 'DW_OP_call4', 'DW_OP_call_ref'])
|
|
|
|
def _dump_to_string(self, opcode, opcode_name, args, cu_offset=None):
|
|
# Some GNU ops contain an offset from the current CU as an argument,
|
|
# but readelf emits those ops with offset from the info section
|
|
# so we need the base offset of the parent CU.
|
|
# If omitted, arguments on some GNU opcodes will be off.
|
|
if cu_offset is None:
|
|
cu_offset = 0
|
|
|
|
if len(args) == 0:
|
|
if opcode_name.startswith('DW_OP_reg'):
|
|
regnum = int(opcode_name[9:])
|
|
return '%s (%s)' % (
|
|
opcode_name,
|
|
describe_reg_name(regnum, _MACHINE_ARCH))
|
|
else:
|
|
return opcode_name
|
|
elif opcode_name in self._ops_with_decimal_arg:
|
|
if opcode_name.startswith('DW_OP_breg'):
|
|
regnum = int(opcode_name[10:])
|
|
return '%s (%s): %s' % (
|
|
opcode_name,
|
|
describe_reg_name(regnum, _MACHINE_ARCH),
|
|
args[0])
|
|
elif opcode_name.endswith('regx'):
|
|
# applies to both regx and bregx
|
|
return '%s: %s (%s)' % (
|
|
opcode_name,
|
|
args[0],
|
|
describe_reg_name(args[0], _MACHINE_ARCH))
|
|
else:
|
|
return '%s: %s' % (opcode_name, args[0])
|
|
elif opcode_name in self._ops_with_hex_arg:
|
|
return '%s: %x' % (opcode_name, args[0])
|
|
elif opcode_name in self._ops_with_two_decimal_args:
|
|
return '%s: %s %s' % (opcode_name, args[0], args[1])
|
|
elif opcode_name in ('DW_OP_GNU_entry_value', 'DW_OP_entry_value'):
|
|
return '%s: (%s)' % (opcode_name, ','.join([self._dump_to_string(deo.op, deo.op_name, deo.args, cu_offset) for deo in args[0]]))
|
|
elif opcode_name == 'DW_OP_implicit_value':
|
|
return "%s %s byte block: %s" % (opcode_name, len(args[0]), ''.join(["%x " % b for b in args[0]]))
|
|
elif opcode_name == 'DW_OP_GNU_parameter_ref':
|
|
return "%s: <0x%x>" % (opcode_name, args[0] + cu_offset)
|
|
elif opcode_name in ('DW_OP_GNU_implicit_pointer', 'DW_OP_implicit_pointer'):
|
|
return "%s: <0x%x> %d" % (opcode_name, args[0], args[1])
|
|
elif opcode_name in ('DW_OP_GNU_convert', 'DW_OP_convert'):
|
|
return "%s <0x%x>" % (opcode_name, args[0] + cu_offset)
|
|
elif opcode_name in ('DW_OP_GNU_deref_type', 'DW_OP_deref_type'):
|
|
return "%s: %d <0x%x>" % (opcode_name, args[0], args[1] + cu_offset)
|
|
elif opcode_name in ('DW_OP_GNU_const_type', 'DW_OP_const_type'):
|
|
return "%s: <0x%x> %d byte block: %s " % (opcode_name, args[0] + cu_offset, len(args[1]), ' '.join("%x" % b for b in args[1]))
|
|
elif opcode_name in ('DW_OP_GNU_regval_type', 'DW_OP_regval_type'):
|
|
return "%s: %d (%s) <0x%x>" % (opcode_name, args[0], describe_reg_name(args[0], _MACHINE_ARCH), args[1] + cu_offset)
|
|
else:
|
|
return '<unknown %s>' % opcode_name
|