1 #-------------------------------------------------------------------------------
2 # elftools: dwarf/dwarf_expr.py
4 # Decoding DWARF expressions
6 # Eli Bendersky (eliben@gmail.com)
7 # This code is in the public domain
8 #-------------------------------------------------------------------------------
9 from collections
import namedtuple
10 from io
import BytesIO
12 from ..common
.utils
import struct_parse
, bytelist2string
, read_blob
13 from ..common
.exceptions
import DWARFError
16 # DWARF expression opcodes. name -> opcode mapping
17 DW_OP_name2opcode
= dict(
47 DW_OP_plus_uconst
=0x23,
64 DW_OP_deref_size
=0x94,
65 DW_OP_xderef_size
=0x95,
67 DW_OP_push_object_address
=0x97,
71 DW_OP_form_tls_address
=0x9b,
72 DW_OP_call_frame_cfa
=0x9c,
74 DW_OP_implicit_value
=0x9e,
75 DW_OP_stack_value
=0x9f,
76 DW_OP_implicit_pointer
=0xa0,
79 DW_OP_entry_value
=0xa3,
80 DW_OP_const_type
=0xa4,
81 DW_OP_regval_type
=0xa5,
82 DW_OP_deref_type
=0xa6,
83 DW_OP_xderef_type
=0xa7,
85 DW_OP_reinterpret
=0xa9,
87 DW_OP_GNU_push_tls_address
=0xe0,
88 DW_OP_WASM_location
=0xed,
89 DW_OP_GNU_implicit_pointer
=0xf2,
90 DW_OP_GNU_entry_value
=0xf3,
91 DW_OP_GNU_const_type
=0xf4,
92 DW_OP_GNU_regval_type
=0xf5,
93 DW_OP_GNU_deref_type
=0xf6,
94 DW_OP_GNU_convert
=0xf7,
95 DW_OP_GNU_parameter_ref
=0xfa,
99 def _generate_dynamic_values(map, prefix
, index_start
, index_end
, value_start
):
100 """ Generate values in a map (dict) dynamically. Each key starts with
101 a (string) prefix, followed by an index in the inclusive range
102 [index_start, index_end]. The values start at value_start.
104 for index
in range(index_start
, index_end
+ 1):
105 name
= '%s%s' % (prefix
, index
)
106 value
= value_start
+ index
- index_start
# Add the three numbered opcode families to the name -> opcode mapping. Each
# family has 32 members (index 0 through 31) with consecutive opcodes starting
# at the given value.
_generate_dynamic_values(
    DW_OP_name2opcode,
    prefix='DW_OP_lit', index_start=0, index_end=31, value_start=0x30)
_generate_dynamic_values(
    DW_OP_name2opcode,
    prefix='DW_OP_reg', index_start=0, index_end=31, value_start=0x50)
_generate_dynamic_values(
    DW_OP_name2opcode,
    prefix='DW_OP_breg', index_start=0, index_end=31, value_start=0x70)
# Reverse lookup: opcode -> name mapping, built by inverting
# DW_OP_name2opcode. If several names share one opcode, the name that comes
# last when iterating DW_OP_name2opcode is the one kept.
DW_OP_opcode2name = {
    opcode: name for name, opcode in DW_OP_name2opcode.items()
}
# Result type for a single parsed DWARF expression operation. Fields, in
# order: the numeric opcode (op), the op name as a string (op_name), a list of
# arguments (args) and offset.
DWARFExprOp = namedtuple(
    'DWARFExprOp', ['op', 'op_name', 'args', 'offset'])
class DWARFExprParser(object):
    """DWARF expression parser.

    When initialized, requires structs to cache a dispatch table. After that,
    parse_expr can be called repeatedly - it's stateless.
    """

    def __init__(self, structs):
        # The opcode -> argument-parser table is built once per parser and
        # reused by every parse_expr call.
        self._dispatch_table = _init_dispatch_table(structs)

    def parse_expr(self, expr):
        """ Parses expr (a list of integers) into a list of DWARFExprOp.

        The list can potentially be nested.

        Each returned DWARFExprOp carries the byte offset, within expr, at
        which its opcode was read. An opcode that has no entry in the
        dispatch table raises KeyError.
        """
        stream = BytesIO(bytelist2string(expr))
        parsed = []

        while True:
            # Get the next opcode from the stream. If nothing is left in the
            # stream, we're done.
            offset = stream.tell()
            byte = stream.read(1)
            if not byte:
                break

            # Decode the opcode and its name.
            op = ord(byte)
            op_name = DW_OP_opcode2name.get(op, 'OP:0x%x' % op)

            # Use dispatch table to parse args.
            arg_parser = self._dispatch_table[op]
            args = arg_parser(stream)

            parsed.append(DWARFExprOp(op=op, op_name=op_name, args=args,
                                      offset=offset))

        return parsed
def _init_dispatch_table(structs):
    """Creates a dispatch table for parsing args of an op.

    structs is the object providing the Dwarf_* struct factories
    (Dwarf_uint8, Dwarf_uleb128, Dwarf_offset, ...) used to decode operands.

    Returns a dict mapping opcode to a function. The function accepts a stream
    and returns a list of parsed arguments for the opcode from the stream;
    the stream is advanced by the function as needed.
    """
    table = {}

    def add(opcode_name, func):
        # Register func under the numeric opcode of opcode_name. A name that
        # is missing from DW_OP_name2opcode raises KeyError here, while the
        # table is being built.
        table[DW_OP_name2opcode[opcode_name]] = func

    def parse_noargs():
        return lambda stream: []

    def parse_op_addr():
        return lambda stream: [struct_parse(structs.Dwarf_target_addr(''),
                                            stream)]

    def parse_arg_struct(arg_struct):
        return lambda stream: [struct_parse(arg_struct, stream)]

    def parse_arg_struct2(arg1_struct, arg2_struct):
        return lambda stream: [struct_parse(arg1_struct, stream),
                               struct_parse(arg2_struct, stream)]

    # ULEB128, then an expression of that length
    def parse_nestedexpr():
        def parse(stream):
            size = struct_parse(structs.Dwarf_uleb128(''), stream)
            nested_expr_blob = read_blob(stream, size)
            # The nested expression is parsed by a fresh parser; its list of
            # ops becomes the single argument of the enclosing op.
            return [DWARFExprParser(structs).parse_expr(nested_expr_blob)]
        return parse

    # ULEB128, then a blob of that size
    def parse_blob():
        def parse(stream):
            size = struct_parse(structs.Dwarf_uleb128(''), stream)
            return [read_blob(stream, size)]
        return parse

    # ULEB128 with datatype DIE offset, then byte, then a blob of that size
    def parse_typedblob():
        def parse(stream):
            type_offset = struct_parse(structs.Dwarf_uleb128(''), stream)
            size = struct_parse(structs.Dwarf_uint8(''), stream)
            return [type_offset, read_blob(stream, size)]
        return parse

    # https://yurydelendik.github.io/webassembly-dwarf/
    # Byte, then variant: 0, 1, 2 => uleb128, 3 => uint32
    def parse_wasmloc():
        def parse(stream):
            op = struct_parse(structs.Dwarf_uint8(''), stream)
            if 0 <= op <= 2:
                return [op, struct_parse(structs.Dwarf_uleb128(''), stream)]
            elif op == 3:
                return [op, struct_parse(structs.Dwarf_uint32(''), stream)]
            else:
                raise DWARFError("Unknown operation code in DW_OP_WASM_location: %d" % (op,))
        return parse

    add('DW_OP_addr', parse_op_addr())
    add('DW_OP_addrx', parse_arg_struct(structs.Dwarf_uleb128('')))
    add('DW_OP_const1u', parse_arg_struct(structs.Dwarf_uint8('')))
    add('DW_OP_const1s', parse_arg_struct(structs.Dwarf_int8('')))
    add('DW_OP_const2u', parse_arg_struct(structs.Dwarf_uint16('')))
    add('DW_OP_const2s', parse_arg_struct(structs.Dwarf_int16('')))
    add('DW_OP_const4u', parse_arg_struct(structs.Dwarf_uint32('')))
    add('DW_OP_const4s', parse_arg_struct(structs.Dwarf_int32('')))
    add('DW_OP_const8u', parse_arg_struct(structs.Dwarf_uint64('')))
    add('DW_OP_const8s', parse_arg_struct(structs.Dwarf_int64('')))
    add('DW_OP_constu', parse_arg_struct(structs.Dwarf_uleb128('')))
    add('DW_OP_consts', parse_arg_struct(structs.Dwarf_sleb128('')))
    add('DW_OP_pick', parse_arg_struct(structs.Dwarf_uint8('')))
    add('DW_OP_plus_uconst', parse_arg_struct(structs.Dwarf_uleb128('')))
    add('DW_OP_bra', parse_arg_struct(structs.Dwarf_int16('')))
    add('DW_OP_skip', parse_arg_struct(structs.Dwarf_int16('')))

    # Operations that take no operands.
    for opname in ['DW_OP_deref', 'DW_OP_dup', 'DW_OP_drop', 'DW_OP_over',
                   'DW_OP_swap', 'DW_OP_rot', 'DW_OP_xderef',
                   'DW_OP_abs', 'DW_OP_and', 'DW_OP_div', 'DW_OP_minus',
                   'DW_OP_mod', 'DW_OP_mul', 'DW_OP_neg', 'DW_OP_not',
                   'DW_OP_or', 'DW_OP_plus', 'DW_OP_shl', 'DW_OP_shr',
                   'DW_OP_shra', 'DW_OP_xor', 'DW_OP_eq', 'DW_OP_ge',
                   'DW_OP_gt', 'DW_OP_le', 'DW_OP_lt', 'DW_OP_ne', 'DW_OP_nop',
                   'DW_OP_push_object_address', 'DW_OP_form_tls_address',
                   'DW_OP_call_frame_cfa', 'DW_OP_stack_value',
                   'DW_OP_GNU_push_tls_address']:
        add(opname, parse_noargs())

    for n in range(0, 32):
        add('DW_OP_lit%s' % n, parse_noargs())
        add('DW_OP_reg%s' % n, parse_noargs())
        add('DW_OP_breg%s' % n, parse_arg_struct(structs.Dwarf_sleb128('')))

    add('DW_OP_fbreg', parse_arg_struct(structs.Dwarf_sleb128('')))
    add('DW_OP_regx', parse_arg_struct(structs.Dwarf_uleb128('')))
    add('DW_OP_bregx', parse_arg_struct2(structs.Dwarf_uleb128(''),
                                         structs.Dwarf_sleb128('')))
    add('DW_OP_piece', parse_arg_struct(structs.Dwarf_uleb128('')))
    add('DW_OP_bit_piece', parse_arg_struct2(structs.Dwarf_uleb128(''),
                                             structs.Dwarf_uleb128('')))
    # The size operand is an unsigned byte in the DWARF standard, so it is
    # decoded with Dwarf_uint8; a signed decode would turn sizes above 127
    # into negative numbers.
    add('DW_OP_deref_size', parse_arg_struct(structs.Dwarf_uint8('')))
    add('DW_OP_xderef_size', parse_arg_struct(structs.Dwarf_uint8('')))
    add('DW_OP_call2', parse_arg_struct(structs.Dwarf_uint16('')))
    add('DW_OP_call4', parse_arg_struct(structs.Dwarf_uint32('')))
    add('DW_OP_call_ref', parse_arg_struct(structs.Dwarf_offset('')))
    add('DW_OP_implicit_value', parse_blob())
    add('DW_OP_entry_value', parse_nestedexpr())
    add('DW_OP_const_type', parse_typedblob())
    add('DW_OP_regval_type', parse_arg_struct2(structs.Dwarf_uleb128(''),
                                               structs.Dwarf_uleb128('')))
    add('DW_OP_deref_type', parse_arg_struct2(structs.Dwarf_uint8(''),
                                              structs.Dwarf_uleb128('')))
    # Same operand layout as DW_OP_deref_type: 1-byte size, then a ULEB128
    # type DIE offset.
    add('DW_OP_xderef_type', parse_arg_struct2(structs.Dwarf_uint8(''),
                                               structs.Dwarf_uleb128('')))
    add('DW_OP_implicit_pointer', parse_arg_struct2(structs.Dwarf_offset(''),
                                                    structs.Dwarf_sleb128('')))
    add('DW_OP_convert', parse_arg_struct(structs.Dwarf_uleb128('')))
    # Same operand layout as DW_OP_convert: a ULEB128 type DIE offset.
    add('DW_OP_reinterpret', parse_arg_struct(structs.Dwarf_uleb128('')))
    add('DW_OP_GNU_entry_value', parse_nestedexpr())
    add('DW_OP_GNU_const_type', parse_typedblob())
    add('DW_OP_GNU_regval_type', parse_arg_struct2(structs.Dwarf_uleb128(''),
                                                   structs.Dwarf_uleb128('')))
    add('DW_OP_GNU_deref_type', parse_arg_struct2(structs.Dwarf_uint8(''),
                                                  structs.Dwarf_uleb128('')))
    add('DW_OP_GNU_implicit_pointer', parse_arg_struct2(structs.Dwarf_offset(''),
                                                        structs.Dwarf_sleb128('')))
    add('DW_OP_GNU_parameter_ref', parse_arg_struct(structs.Dwarf_offset('')))
    add('DW_OP_GNU_convert', parse_arg_struct(structs.Dwarf_uleb128('')))
    add('DW_OP_WASM_location', parse_wasmloc())

    return table