1 /* General "disassemble this chunk" code. Used for debugging. */
2 #include "qemu/osdep.h"
3 #include "disas/dis-asm.h"
5 #include "qemu/qemu-print.h"
8 #include "disas/disas.h"
9 #include "disas/capstone.h"
11 typedef struct CPUDebug
{
12 struct disassemble_info info
;
16 /* Filled in by elfload.c. Simplistic, but will do for now. */
17 struct syminfo
*syminfos
= NULL
;
19 /* Get LENGTH bytes from info's buffer, at target address memaddr.
20 Transfer them to myaddr. */
22 buffer_read_memory(bfd_vma memaddr
, bfd_byte
*myaddr
, int length
,
23 struct disassemble_info
*info
)
25 if (memaddr
< info
->buffer_vma
26 || memaddr
+ length
> info
->buffer_vma
+ info
->buffer_length
)
27 /* Out of bounds. Use EIO because GDB uses it. */
29 memcpy (myaddr
, info
->buffer
+ (memaddr
- info
->buffer_vma
), length
);
33 /* Get LENGTH bytes from info's buffer, at target address memaddr.
34 Transfer them to myaddr. */
36 target_read_memory (bfd_vma memaddr
,
39 struct disassemble_info
*info
)
41 CPUDebug
*s
= container_of(info
, CPUDebug
, info
);
43 cpu_memory_rw_debug(s
->cpu
, memaddr
, myaddr
, length
, 0);
47 /* Print an error message. We can assume that this is in response to
48 an error return from buffer_read_memory. */
50 perror_memory (int status
, bfd_vma memaddr
, struct disassemble_info
*info
)
54 (*info
->fprintf_func
) (info
->stream
, "Unknown error %d\n", status
);
56 /* Actually, address between memaddr and memaddr + len was
58 (*info
->fprintf_func
) (info
->stream
,
59 "Address 0x%" PRIx64
" is out of bounds.\n", memaddr
);
62 /* This could be in a separate file, to save minuscule amounts of space
63 in statically linked executables. */
65 /* Just print the address is hex. This is included for completeness even
66 though both GDB and objdump provide their own (to print symbolic
70 generic_print_address (bfd_vma addr
, struct disassemble_info
*info
)
72 (*info
->fprintf_func
) (info
->stream
, "0x%" PRIx64
, addr
);
75 /* Print address in hex, truncated to the width of a host virtual address. */
77 generic_print_host_address(bfd_vma addr
, struct disassemble_info
*info
)
79 uint64_t mask
= ~0ULL >> (64 - (sizeof(void *) * 8));
80 generic_print_address(addr
& mask
, info
);
83 /* Just return the given address. */
86 generic_symbol_at_address (bfd_vma addr
, struct disassemble_info
*info
)
91 bfd_vma
bfd_getl64 (const bfd_byte
*addr
)
95 v
= (unsigned long long) addr
[0];
96 v
|= (unsigned long long) addr
[1] << 8;
97 v
|= (unsigned long long) addr
[2] << 16;
98 v
|= (unsigned long long) addr
[3] << 24;
99 v
|= (unsigned long long) addr
[4] << 32;
100 v
|= (unsigned long long) addr
[5] << 40;
101 v
|= (unsigned long long) addr
[6] << 48;
102 v
|= (unsigned long long) addr
[7] << 56;
106 bfd_vma
bfd_getl32 (const bfd_byte
*addr
)
110 v
= (unsigned long) addr
[0];
111 v
|= (unsigned long) addr
[1] << 8;
112 v
|= (unsigned long) addr
[2] << 16;
113 v
|= (unsigned long) addr
[3] << 24;
117 bfd_vma
bfd_getb32 (const bfd_byte
*addr
)
121 v
= (unsigned long) addr
[0] << 24;
122 v
|= (unsigned long) addr
[1] << 16;
123 v
|= (unsigned long) addr
[2] << 8;
124 v
|= (unsigned long) addr
[3];
128 bfd_vma
bfd_getl16 (const bfd_byte
*addr
)
132 v
= (unsigned long) addr
[0];
133 v
|= (unsigned long) addr
[1] << 8;
137 bfd_vma
bfd_getb16 (const bfd_byte
*addr
)
141 v
= (unsigned long) addr
[0] << 24;
142 v
|= (unsigned long) addr
[1] << 16;
146 static int print_insn_objdump(bfd_vma pc
, disassemble_info
*info
,
149 int i
, n
= info
->buffer_length
;
150 uint8_t *buf
= g_malloc(n
);
152 info
->read_memory_func(pc
, buf
, n
, info
);
154 for (i
= 0; i
< n
; ++i
) {
156 info
->fprintf_func(info
->stream
, "\n%s: ", prefix
);
158 info
->fprintf_func(info
->stream
, "%02x", buf
[i
]);
165 static int print_insn_od_host(bfd_vma pc
, disassemble_info
*info
)
167 return print_insn_objdump(pc
, info
, "OBJD-H");
170 static int print_insn_od_target(bfd_vma pc
, disassemble_info
*info
)
172 return print_insn_objdump(pc
, info
, "OBJD-T");
175 #ifdef CONFIG_CAPSTONE
176 /* Temporary storage for the capstone library. This will be alloced via
177 malloc with a size private to the library; thus there's no reason not
178 to share this across calls and across host vs target disassembly. */
179 static __thread cs_insn
*cap_insn
;
181 /* Initialize the Capstone library. */
182 /* ??? It would be nice to cache this. We would need one handle for the
183 host and one for the target. For most targets we can reset specific
184 parameters via cs_option(CS_OPT_MODE, new_mode), but we cannot change
185 CS_ARCH_* in this way. Thus we would need to be able to close and
186 re-open the target handle with a different arch for the target in order
187 to handle AArch64 vs AArch32 mode switching. */
188 static cs_err
cap_disas_start(disassemble_info
*info
, csh
*handle
)
190 cs_mode cap_mode
= info
->cap_mode
;
193 cap_mode
+= (info
->endian
== BFD_ENDIAN_BIG
? CS_MODE_BIG_ENDIAN
194 : CS_MODE_LITTLE_ENDIAN
);
196 err
= cs_open(info
->cap_arch
, cap_mode
, handle
);
197 if (err
!= CS_ERR_OK
) {
201 /* ??? There probably ought to be a better place to put this. */
202 if (info
->cap_arch
== CS_ARCH_X86
) {
203 /* We don't care about errors (if for some reason the library
204 is compiled without AT&T syntax); the user will just have
205 to deal with the Intel syntax. */
206 cs_option(*handle
, CS_OPT_SYNTAX
, CS_OPT_SYNTAX_ATT
);
209 /* "Disassemble" unknown insns as ".byte W,X,Y,Z". */
210 cs_option(*handle
, CS_OPT_SKIPDATA
, CS_OPT_ON
);
212 /* Allocate temp space for cs_disasm_iter. */
213 if (cap_insn
== NULL
) {
214 cap_insn
= cs_malloc(*handle
);
215 if (cap_insn
== NULL
) {
223 static void cap_dump_insn_units(disassemble_info
*info
, cs_insn
*insn
,
226 fprintf_function print
= info
->fprintf_func
;
227 FILE *stream
= info
->stream
;
229 switch (info
->cap_insn_unit
) {
231 if (info
->endian
== BFD_ENDIAN_BIG
) {
232 for (; i
< n
; i
+= 4) {
233 print(stream
, " %08x", ldl_be_p(insn
->bytes
+ i
));
237 for (; i
< n
; i
+= 4) {
238 print(stream
, " %08x", ldl_le_p(insn
->bytes
+ i
));
244 if (info
->endian
== BFD_ENDIAN_BIG
) {
245 for (; i
< n
; i
+= 2) {
246 print(stream
, " %04x", lduw_be_p(insn
->bytes
+ i
));
249 for (; i
< n
; i
+= 2) {
250 print(stream
, " %04x", lduw_le_p(insn
->bytes
+ i
));
257 print(stream
, " %02x", insn
->bytes
[i
]);
263 static void cap_dump_insn(disassemble_info
*info
, cs_insn
*insn
)
265 fprintf_function print
= info
->fprintf_func
;
268 print(info
->stream
, "0x%08" PRIx64
": ", insn
->address
);
271 split
= info
->cap_insn_split
;
273 /* Dump the first SPLIT bytes of the instruction. */
274 cap_dump_insn_units(info
, insn
, 0, MIN(n
, split
));
276 /* Add padding up to SPLIT so that mnemonics line up. */
278 int width
= (split
- n
) / info
->cap_insn_unit
;
279 width
*= (2 * info
->cap_insn_unit
+ 1);
280 print(info
->stream
, "%*s", width
, "");
283 /* Print the actual instruction. */
284 print(info
->stream
, " %-8s %s\n", insn
->mnemonic
, insn
->op_str
);
286 /* Dump any remaining part of the insn on subsequent lines. */
287 for (i
= split
; i
< n
; i
+= split
) {
288 print(info
->stream
, "0x%08" PRIx64
": ", insn
->address
+ i
);
289 cap_dump_insn_units(info
, insn
, i
, MIN(n
, i
+ split
));
290 print(info
->stream
, "\n");
294 /* Disassemble SIZE bytes at PC for the target. */
295 static bool cap_disas_target(disassemble_info
*info
, uint64_t pc
, size_t size
)
297 uint8_t cap_buf
[1024];
302 if (cap_disas_start(info
, &handle
) != CS_ERR_OK
) {
308 size_t tsize
= MIN(sizeof(cap_buf
) - csize
, size
);
309 const uint8_t *cbuf
= cap_buf
;
311 target_read_memory(pc
+ csize
, cap_buf
+ csize
, tsize
, info
);
315 while (cs_disasm_iter(handle
, &cbuf
, &csize
, &pc
, insn
)) {
316 cap_dump_insn(info
, insn
);
319 /* If the target memory is not consumed, go back for more... */
321 /* ... taking care to move any remaining fractional insn
322 to the beginning of the buffer. */
324 memmove(cap_buf
, cbuf
, csize
);
329 /* Since the target memory is consumed, we should not have
330 a remaining fractional insn. */
332 (*info
->fprintf_func
)(info
->stream
,
333 "Disassembler disagrees with translator "
334 "over instruction decoding\n"
335 "Please report this to qemu-devel@nongnu.org\n");
344 /* Disassemble SIZE bytes at CODE for the host. */
345 static bool cap_disas_host(disassemble_info
*info
, void *code
, size_t size
)
352 if (cap_disas_start(info
, &handle
) != CS_ERR_OK
) {
358 pc
= (uintptr_t)code
;
360 while (cs_disasm_iter(handle
, &cbuf
, &size
, &pc
, insn
)) {
361 cap_dump_insn(info
, insn
);
364 (*info
->fprintf_func
)(info
->stream
,
365 "Disassembler disagrees with TCG over instruction encoding\n"
366 "Please report this to qemu-devel@nongnu.org\n");
373 #if !defined(CONFIG_USER_ONLY)
374 /* Disassemble COUNT insns at PC for the target. */
375 static bool cap_disas_monitor(disassemble_info
*info
, uint64_t pc
, int count
)
382 if (cap_disas_start(info
, &handle
) != CS_ERR_OK
) {
388 /* We want to read memory for one insn, but generically we do not
389 know how much memory that is. We have a small buffer which is
390 known to be sufficient for all supported targets. Try to not
391 read beyond the page, Just In Case. For even more simplicity,
392 ignore the actual target page size and use a 1k boundary. If
393 that turns out to be insufficient, we'll come back around the
394 loop and read more. */
395 uint64_t epc
= QEMU_ALIGN_UP(pc
+ csize
+ 1, 1024);
396 size_t tsize
= MIN(sizeof(cap_buf
) - csize
, epc
- pc
);
397 const uint8_t *cbuf
= cap_buf
;
399 /* Make certain that we can make progress. */
401 info
->read_memory_func(pc
, cap_buf
+ csize
, tsize
, info
);
404 if (cs_disasm_iter(handle
, &cbuf
, &csize
, &pc
, insn
)) {
405 cap_dump_insn(info
, insn
);
410 memmove(cap_buf
, cbuf
, csize
);
416 #endif /* !CONFIG_USER_ONLY */
418 # define cap_disas_target(i, p, s) false
419 # define cap_disas_host(i, p, s) false
420 # define cap_disas_monitor(i, p, c) false
421 # define cap_disas_plugin(i, p, c) false
422 #endif /* CONFIG_CAPSTONE */
424 /* Disassemble this for me please... (debugging). */
425 void target_disas(FILE *out
, CPUState
*cpu
, target_ulong code
,
428 CPUClass
*cc
= CPU_GET_CLASS(cpu
);
433 INIT_DISASSEMBLE_INFO(s
.info
, out
, fprintf
);
436 s
.info
.read_memory_func
= target_read_memory
;
437 s
.info
.buffer_vma
= code
;
438 s
.info
.buffer_length
= size
;
439 s
.info
.print_address_func
= generic_print_address
;
440 s
.info
.cap_arch
= -1;
442 s
.info
.cap_insn_unit
= 4;
443 s
.info
.cap_insn_split
= 4;
445 #ifdef TARGET_WORDS_BIGENDIAN
446 s
.info
.endian
= BFD_ENDIAN_BIG
;
448 s
.info
.endian
= BFD_ENDIAN_LITTLE
;
451 if (cc
->disas_set_info
) {
452 cc
->disas_set_info(cpu
, &s
.info
);
455 if (s
.info
.cap_arch
>= 0 && cap_disas_target(&s
.info
, code
, size
)) {
459 if (s
.info
.print_insn
== NULL
) {
460 s
.info
.print_insn
= print_insn_od_target
;
463 for (pc
= code
; size
> 0; pc
+= count
, size
-= count
) {
464 fprintf(out
, "0x" TARGET_FMT_lx
": ", pc
);
465 count
= s
.info
.print_insn(pc
, &s
.info
);
471 "Disassembler disagrees with translator over instruction "
473 "Please report this to qemu-devel@nongnu.org\n");
479 static __thread GString plugin_disas_output
;
481 static int plugin_printf(FILE *stream
, const char *fmt
, ...)
484 GString
*s
= &plugin_disas_output
;
485 int initial_len
= s
->len
;
488 g_string_append_vprintf(s
, fmt
, va
);
491 return s
->len
- initial_len
;
494 static void plugin_print_address(bfd_vma addr
, struct disassemble_info
*info
)
500 #ifdef CONFIG_CAPSTONE
501 /* Disassemble a single instruction directly into plugin output */
503 bool cap_disas_plugin(disassemble_info
*info
, uint64_t pc
, size_t size
)
505 uint8_t cap_buf
[1024];
510 GString
*s
= &plugin_disas_output
;
512 if (cap_disas_start(info
, &handle
) != CS_ERR_OK
) {
517 size_t tsize
= MIN(sizeof(cap_buf
) - csize
, size
);
518 const uint8_t *cbuf
= cap_buf
;
519 target_read_memory(pc
, cap_buf
, tsize
, info
);
521 count
= cs_disasm(handle
, cbuf
, size
, 0, 1, &insn
);
524 g_string_printf(s
, "%s %s", insn
->mnemonic
, insn
->op_str
);
526 g_string_printf(s
, "cs_disasm failed");
535 * We should only be disassembling one instruction at a time here. If
536 * there is left over it usually indicates the front end has read more
537 * bytes than it needed.
539 char *plugin_disas(CPUState
*cpu
, uint64_t addr
, size_t size
)
541 CPUClass
*cc
= CPU_GET_CLASS(cpu
);
544 GString
*ds
= g_string_set_size(&plugin_disas_output
, 0);
546 g_assert(ds
== &plugin_disas_output
);
548 INIT_DISASSEMBLE_INFO(s
.info
, NULL
, plugin_printf
);
551 s
.info
.read_memory_func
= target_read_memory
;
552 s
.info
.buffer_vma
= addr
;
553 s
.info
.buffer_length
= size
;
554 s
.info
.print_address_func
= plugin_print_address
;
555 s
.info
.cap_arch
= -1;
557 s
.info
.cap_insn_unit
= 4;
558 s
.info
.cap_insn_split
= 4;
560 #ifdef TARGET_WORDS_BIGENDIAN
561 s
.info
.endian
= BFD_ENDIAN_BIG
;
563 s
.info
.endian
= BFD_ENDIAN_LITTLE
;
566 if (cc
->disas_set_info
) {
567 cc
->disas_set_info(cpu
, &s
.info
);
570 if (s
.info
.cap_arch
>= 0 && cap_disas_plugin(&s
.info
, addr
, size
)) {
571 return g_strdup(ds
->str
);
574 if (s
.info
.print_insn
== NULL
) {
575 s
.info
.print_insn
= print_insn_od_target
;
578 count
= s
.info
.print_insn(addr
, &s
.info
);
580 /* The decoder probably read more than it needed it's not critical */
582 warn_report("%s: %zu bytes left over", __func__
, size
- count
);
585 return g_strdup(ds
->str
);
588 /* Disassemble this for me please... (debugging). */
589 void disas(FILE *out
, void *code
, unsigned long size
)
594 int (*print_insn
)(bfd_vma pc
, disassemble_info
*info
) = NULL
;
596 INIT_DISASSEMBLE_INFO(s
.info
, out
, fprintf
);
597 s
.info
.print_address_func
= generic_print_host_address
;
599 s
.info
.buffer
= code
;
600 s
.info
.buffer_vma
= (uintptr_t)code
;
601 s
.info
.buffer_length
= size
;
602 s
.info
.cap_arch
= -1;
604 s
.info
.cap_insn_unit
= 4;
605 s
.info
.cap_insn_split
= 4;
607 #ifdef HOST_WORDS_BIGENDIAN
608 s
.info
.endian
= BFD_ENDIAN_BIG
;
610 s
.info
.endian
= BFD_ENDIAN_LITTLE
;
612 #if defined(CONFIG_TCG_INTERPRETER)
613 print_insn
= print_insn_tci
;
614 #elif defined(__i386__)
615 s
.info
.mach
= bfd_mach_i386_i386
;
616 print_insn
= print_insn_i386
;
617 s
.info
.cap_arch
= CS_ARCH_X86
;
618 s
.info
.cap_mode
= CS_MODE_32
;
619 s
.info
.cap_insn_unit
= 1;
620 s
.info
.cap_insn_split
= 8;
621 #elif defined(__x86_64__)
622 s
.info
.mach
= bfd_mach_x86_64
;
623 print_insn
= print_insn_i386
;
624 s
.info
.cap_arch
= CS_ARCH_X86
;
625 s
.info
.cap_mode
= CS_MODE_64
;
626 s
.info
.cap_insn_unit
= 1;
627 s
.info
.cap_insn_split
= 8;
628 #elif defined(_ARCH_PPC)
629 s
.info
.disassembler_options
= (char *)"any";
630 print_insn
= print_insn_ppc
;
631 s
.info
.cap_arch
= CS_ARCH_PPC
;
633 s
.info
.cap_mode
= CS_MODE_64
;
635 #elif defined(__riscv) && defined(CONFIG_RISCV_DIS)
636 #if defined(_ILP32) || (__riscv_xlen == 32)
637 print_insn
= print_insn_riscv32
;
639 print_insn
= print_insn_riscv64
;
641 #error unsupported RISC-V ABI
643 #elif defined(__aarch64__) && defined(CONFIG_ARM_A64_DIS)
644 print_insn
= print_insn_arm_a64
;
645 s
.info
.cap_arch
= CS_ARCH_ARM64
;
646 #elif defined(__alpha__)
647 print_insn
= print_insn_alpha
;
648 #elif defined(__sparc__)
649 print_insn
= print_insn_sparc
;
650 s
.info
.mach
= bfd_mach_sparc_v9b
;
651 #elif defined(__arm__)
652 print_insn
= print_insn_arm
;
653 s
.info
.cap_arch
= CS_ARCH_ARM
;
654 /* TCG only generates code for arm mode. */
655 #elif defined(__MIPSEB__)
656 print_insn
= print_insn_big_mips
;
657 #elif defined(__MIPSEL__)
658 print_insn
= print_insn_little_mips
;
659 #elif defined(__m68k__)
660 print_insn
= print_insn_m68k
;
661 #elif defined(__s390__)
662 print_insn
= print_insn_s390
;
663 #elif defined(__hppa__)
664 print_insn
= print_insn_hppa
;
667 if (s
.info
.cap_arch
>= 0 && cap_disas_host(&s
.info
, code
, size
)) {
671 if (print_insn
== NULL
) {
672 print_insn
= print_insn_od_host
;
674 for (pc
= (uintptr_t)code
; size
> 0; pc
+= count
, size
-= count
) {
675 fprintf(out
, "0x%08" PRIxPTR
": ", pc
);
676 count
= print_insn(pc
, &s
.info
);
683 /* Look up symbol for debugging purpose. Returns "" if unknown. */
684 const char *lookup_symbol(target_ulong orig_addr
)
686 const char *symbol
= "";
689 for (s
= syminfos
; s
; s
= s
->next
) {
690 symbol
= s
->lookup_symbol(s
, orig_addr
);
691 if (symbol
[0] != '\0') {
699 #if !defined(CONFIG_USER_ONLY)
701 #include "monitor/monitor.h"
704 physical_read_memory(bfd_vma memaddr
, bfd_byte
*myaddr
, int length
,
705 struct disassemble_info
*info
)
707 CPUDebug
*s
= container_of(info
, CPUDebug
, info
);
709 address_space_read(s
->cpu
->as
, memaddr
, MEMTXATTRS_UNSPECIFIED
,
714 /* Disassembler for the monitor. */
715 void monitor_disas(Monitor
*mon
, CPUState
*cpu
,
716 target_ulong pc
, int nb_insn
, int is_physical
)
718 CPUClass
*cc
= CPU_GET_CLASS(cpu
);
722 INIT_DISASSEMBLE_INFO(s
.info
, NULL
, qemu_fprintf
);
725 s
.info
.read_memory_func
726 = (is_physical
? physical_read_memory
: target_read_memory
);
727 s
.info
.print_address_func
= generic_print_address
;
728 s
.info
.buffer_vma
= pc
;
729 s
.info
.cap_arch
= -1;
731 s
.info
.cap_insn_unit
= 4;
732 s
.info
.cap_insn_split
= 4;
734 #ifdef TARGET_WORDS_BIGENDIAN
735 s
.info
.endian
= BFD_ENDIAN_BIG
;
737 s
.info
.endian
= BFD_ENDIAN_LITTLE
;
740 if (cc
->disas_set_info
) {
741 cc
->disas_set_info(cpu
, &s
.info
);
744 if (s
.info
.cap_arch
>= 0 && cap_disas_monitor(&s
.info
, pc
, nb_insn
)) {
748 if (!s
.info
.print_insn
) {
749 monitor_printf(mon
, "0x" TARGET_FMT_lx
750 ": Asm output not supported on this arch\n", pc
);
754 for(i
= 0; i
< nb_insn
; i
++) {
755 monitor_printf(mon
, "0x" TARGET_FMT_lx
": ", pc
);
756 count
= s
.info
.print_insn(pc
, &s
.info
);
757 monitor_printf(mon
, "\n");