cpu: Move can_do_io field from CPU_COMMON to CPUState
[qemu/ar7.git] / tcg / tcg.c
blobf1e0763432a80ab43baab229723ce16456891a41
1 /*
2 * Tiny Code Generator for QEMU
4 * Copyright (c) 2008 Fabrice Bellard
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
25 /* define it to use liveness analysis (better code) */
26 #define USE_LIVENESS_ANALYSIS
27 #define USE_TCG_OPTIMIZATIONS
29 #include "config.h"
31 /* Define to jump the ELF file used to communicate with GDB. */
32 #undef DEBUG_JIT
34 #if !defined(CONFIG_DEBUG_TCG) && !defined(NDEBUG)
35 /* define it to suppress various consistency checks (faster) */
36 #define NDEBUG
37 #endif
39 #include "qemu-common.h"
40 #include "qemu/cache-utils.h"
41 #include "qemu/host-utils.h"
42 #include "qemu/timer.h"
44 /* Note: the long term plan is to reduce the dependencies on the QEMU
45 CPU definitions. Currently they are used for qemu_ld/st
46 instructions */
47 #define NO_CPU_IO_DEFS
48 #include "cpu.h"
50 #include "tcg-op.h"
52 #if UINTPTR_MAX == UINT32_MAX
53 # define ELF_CLASS ELFCLASS32
54 #else
55 # define ELF_CLASS ELFCLASS64
56 #endif
57 #ifdef HOST_WORDS_BIGENDIAN
58 # define ELF_DATA ELFDATA2MSB
59 #else
60 # define ELF_DATA ELFDATA2LSB
61 #endif
63 #include "elf.h"
65 /* Forward declarations for functions declared in tcg-target.c and used here. */
66 static void tcg_target_init(TCGContext *s);
67 static void tcg_target_qemu_prologue(TCGContext *s);
68 static void patch_reloc(uint8_t *code_ptr, int type,
69 intptr_t value, intptr_t addend);
71 /* The CIE and FDE header definitions will be common to all hosts. */
72 typedef struct {
73 uint32_t len __attribute__((aligned((sizeof(void *)))));
74 uint32_t id;
75 uint8_t version;
76 char augmentation[1];
77 uint8_t code_align;
78 uint8_t data_align;
79 uint8_t return_column;
80 } DebugFrameCIE;
82 typedef struct QEMU_PACKED {
83 uint32_t len __attribute__((aligned((sizeof(void *)))));
84 uint32_t cie_offset;
85 uintptr_t func_start;
86 uintptr_t func_len;
87 } DebugFrameFDEHeader;
89 static void tcg_register_jit_int(void *buf, size_t size,
90 void *debug_frame, size_t debug_frame_size)
91 __attribute__((unused));
93 /* Forward declarations for functions declared and used in tcg-target.c. */
94 static int target_parse_constraint(TCGArgConstraint *ct, const char **pct_str);
95 static void tcg_out_ld(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg1,
96 intptr_t arg2);
97 static void tcg_out_mov(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg);
98 static void tcg_out_movi(TCGContext *s, TCGType type,
99 TCGReg ret, tcg_target_long arg);
100 static void tcg_out_op(TCGContext *s, TCGOpcode opc, const TCGArg *args,
101 const int *const_args);
102 static void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg, TCGReg arg1,
103 intptr_t arg2);
104 static int tcg_target_const_match(tcg_target_long val,
105 const TCGArgConstraint *arg_ct);
106 static void tcg_out_tb_init(TCGContext *s);
107 static void tcg_out_tb_finalize(TCGContext *s);
110 TCGOpDef tcg_op_defs[] = {
111 #define DEF(s, oargs, iargs, cargs, flags) { #s, oargs, iargs, cargs, iargs + oargs + cargs, flags },
112 #include "tcg-opc.h"
113 #undef DEF
115 const size_t tcg_op_defs_max = ARRAY_SIZE(tcg_op_defs);
117 static TCGRegSet tcg_target_available_regs[2];
118 static TCGRegSet tcg_target_call_clobber_regs;
120 static inline void tcg_out8(TCGContext *s, uint8_t v)
122 *s->code_ptr++ = v;
125 static inline void tcg_out16(TCGContext *s, uint16_t v)
127 uint8_t *p = s->code_ptr;
128 *(uint16_t *)p = v;
129 s->code_ptr = p + 2;
132 static inline void tcg_out32(TCGContext *s, uint32_t v)
134 uint8_t *p = s->code_ptr;
135 *(uint32_t *)p = v;
136 s->code_ptr = p + 4;
139 static inline void tcg_out64(TCGContext *s, uint64_t v)
141 uint8_t *p = s->code_ptr;
142 *(uint64_t *)p = v;
143 s->code_ptr = p + 8;
146 /* label relocation processing */
148 static void tcg_out_reloc(TCGContext *s, uint8_t *code_ptr, int type,
149 int label_index, intptr_t addend)
151 TCGLabel *l;
152 TCGRelocation *r;
154 l = &s->labels[label_index];
155 if (l->has_value) {
156 /* FIXME: This may break relocations on RISC targets that
157 modify instruction fields in place. The caller may not have
158 written the initial value. */
159 patch_reloc(code_ptr, type, l->u.value, addend);
160 } else {
161 /* add a new relocation entry */
162 r = tcg_malloc(sizeof(TCGRelocation));
163 r->type = type;
164 r->ptr = code_ptr;
165 r->addend = addend;
166 r->next = l->u.first_reloc;
167 l->u.first_reloc = r;
171 static void tcg_out_label(TCGContext *s, int label_index, void *ptr)
173 TCGLabel *l;
174 TCGRelocation *r;
175 intptr_t value = (intptr_t)ptr;
177 l = &s->labels[label_index];
178 if (l->has_value) {
179 tcg_abort();
181 r = l->u.first_reloc;
182 while (r != NULL) {
183 patch_reloc(r->ptr, r->type, value, r->addend);
184 r = r->next;
186 l->has_value = 1;
187 l->u.value = value;
190 int gen_new_label(void)
192 TCGContext *s = &tcg_ctx;
193 int idx;
194 TCGLabel *l;
196 if (s->nb_labels >= TCG_MAX_LABELS)
197 tcg_abort();
198 idx = s->nb_labels++;
199 l = &s->labels[idx];
200 l->has_value = 0;
201 l->u.first_reloc = NULL;
202 return idx;
205 #include "tcg-target.c"
207 /* pool based memory allocation */
208 void *tcg_malloc_internal(TCGContext *s, int size)
210 TCGPool *p;
211 int pool_size;
213 if (size > TCG_POOL_CHUNK_SIZE) {
214 /* big malloc: insert a new pool (XXX: could optimize) */
215 p = g_malloc(sizeof(TCGPool) + size);
216 p->size = size;
217 p->next = s->pool_first_large;
218 s->pool_first_large = p;
219 return p->data;
220 } else {
221 p = s->pool_current;
222 if (!p) {
223 p = s->pool_first;
224 if (!p)
225 goto new_pool;
226 } else {
227 if (!p->next) {
228 new_pool:
229 pool_size = TCG_POOL_CHUNK_SIZE;
230 p = g_malloc(sizeof(TCGPool) + pool_size);
231 p->size = pool_size;
232 p->next = NULL;
233 if (s->pool_current)
234 s->pool_current->next = p;
235 else
236 s->pool_first = p;
237 } else {
238 p = p->next;
242 s->pool_current = p;
243 s->pool_cur = p->data + size;
244 s->pool_end = p->data + p->size;
245 return p->data;
248 void tcg_pool_reset(TCGContext *s)
250 TCGPool *p, *t;
251 for (p = s->pool_first_large; p; p = t) {
252 t = p->next;
253 g_free(p);
255 s->pool_first_large = NULL;
256 s->pool_cur = s->pool_end = NULL;
257 s->pool_current = NULL;
260 #include "helper.h"
262 typedef struct TCGHelperInfo {
263 void *func;
264 const char *name;
265 } TCGHelperInfo;
267 static const TCGHelperInfo all_helpers[] = {
268 #define GEN_HELPER 2
269 #include "helper.h"
271 /* Include tcg-runtime.c functions. */
272 { tcg_helper_div_i32, "div_i32" },
273 { tcg_helper_rem_i32, "rem_i32" },
274 { tcg_helper_divu_i32, "divu_i32" },
275 { tcg_helper_remu_i32, "remu_i32" },
277 { tcg_helper_shl_i64, "shl_i64" },
278 { tcg_helper_shr_i64, "shr_i64" },
279 { tcg_helper_sar_i64, "sar_i64" },
280 { tcg_helper_div_i64, "div_i64" },
281 { tcg_helper_rem_i64, "rem_i64" },
282 { tcg_helper_divu_i64, "divu_i64" },
283 { tcg_helper_remu_i64, "remu_i64" },
284 { tcg_helper_mulsh_i64, "mulsh_i64" },
285 { tcg_helper_muluh_i64, "muluh_i64" },
288 void tcg_context_init(TCGContext *s)
290 int op, total_args, n, i;
291 TCGOpDef *def;
292 TCGArgConstraint *args_ct;
293 int *sorted_args;
294 GHashTable *helper_table;
296 memset(s, 0, sizeof(*s));
297 s->nb_globals = 0;
299 /* Count total number of arguments and allocate the corresponding
300 space */
301 total_args = 0;
302 for(op = 0; op < NB_OPS; op++) {
303 def = &tcg_op_defs[op];
304 n = def->nb_iargs + def->nb_oargs;
305 total_args += n;
308 args_ct = g_malloc(sizeof(TCGArgConstraint) * total_args);
309 sorted_args = g_malloc(sizeof(int) * total_args);
311 for(op = 0; op < NB_OPS; op++) {
312 def = &tcg_op_defs[op];
313 def->args_ct = args_ct;
314 def->sorted_args = sorted_args;
315 n = def->nb_iargs + def->nb_oargs;
316 sorted_args += n;
317 args_ct += n;
320 /* Register helpers. */
321 /* Use g_direct_hash/equal for direct pointer comparisons on func. */
322 s->helpers = helper_table = g_hash_table_new(NULL, NULL);
324 for (i = 0; i < ARRAY_SIZE(all_helpers); ++i) {
325 g_hash_table_insert(helper_table, (gpointer)all_helpers[i].func,
326 (gpointer)all_helpers[i].name);
329 tcg_target_init(s);
332 void tcg_prologue_init(TCGContext *s)
334 /* init global prologue and epilogue */
335 s->code_buf = s->code_gen_prologue;
336 s->code_ptr = s->code_buf;
337 tcg_target_qemu_prologue(s);
338 flush_icache_range((uintptr_t)s->code_buf, (uintptr_t)s->code_ptr);
340 #ifdef DEBUG_DISAS
341 if (qemu_loglevel_mask(CPU_LOG_TB_OUT_ASM)) {
342 size_t size = s->code_ptr - s->code_buf;
343 qemu_log("PROLOGUE: [size=%zu]\n", size);
344 log_disas(s->code_buf, size);
345 qemu_log("\n");
346 qemu_log_flush();
348 #endif
351 void tcg_set_frame(TCGContext *s, int reg, intptr_t start, intptr_t size)
353 s->frame_start = start;
354 s->frame_end = start + size;
355 s->frame_reg = reg;
358 void tcg_func_start(TCGContext *s)
360 tcg_pool_reset(s);
361 s->nb_temps = s->nb_globals;
363 /* No temps have been previously allocated for size or locality. */
364 memset(s->free_temps, 0, sizeof(s->free_temps));
366 s->labels = tcg_malloc(sizeof(TCGLabel) * TCG_MAX_LABELS);
367 s->nb_labels = 0;
368 s->current_frame_offset = s->frame_start;
370 #ifdef CONFIG_DEBUG_TCG
371 s->goto_tb_issue_mask = 0;
372 #endif
374 s->gen_opc_ptr = s->gen_opc_buf;
375 s->gen_opparam_ptr = s->gen_opparam_buf;
377 s->be = tcg_malloc(sizeof(TCGBackendData));
380 static inline void tcg_temp_alloc(TCGContext *s, int n)
382 if (n > TCG_MAX_TEMPS)
383 tcg_abort();
386 static inline int tcg_global_reg_new_internal(TCGType type, int reg,
387 const char *name)
389 TCGContext *s = &tcg_ctx;
390 TCGTemp *ts;
391 int idx;
393 #if TCG_TARGET_REG_BITS == 32
394 if (type != TCG_TYPE_I32)
395 tcg_abort();
396 #endif
397 if (tcg_regset_test_reg(s->reserved_regs, reg))
398 tcg_abort();
399 idx = s->nb_globals;
400 tcg_temp_alloc(s, s->nb_globals + 1);
401 ts = &s->temps[s->nb_globals];
402 ts->base_type = type;
403 ts->type = type;
404 ts->fixed_reg = 1;
405 ts->reg = reg;
406 ts->name = name;
407 s->nb_globals++;
408 tcg_regset_set_reg(s->reserved_regs, reg);
409 return idx;
412 TCGv_i32 tcg_global_reg_new_i32(int reg, const char *name)
414 int idx;
416 idx = tcg_global_reg_new_internal(TCG_TYPE_I32, reg, name);
417 return MAKE_TCGV_I32(idx);
420 TCGv_i64 tcg_global_reg_new_i64(int reg, const char *name)
422 int idx;
424 idx = tcg_global_reg_new_internal(TCG_TYPE_I64, reg, name);
425 return MAKE_TCGV_I64(idx);
428 static inline int tcg_global_mem_new_internal(TCGType type, int reg,
429 intptr_t offset,
430 const char *name)
432 TCGContext *s = &tcg_ctx;
433 TCGTemp *ts;
434 int idx;
436 idx = s->nb_globals;
437 #if TCG_TARGET_REG_BITS == 32
438 if (type == TCG_TYPE_I64) {
439 char buf[64];
440 tcg_temp_alloc(s, s->nb_globals + 2);
441 ts = &s->temps[s->nb_globals];
442 ts->base_type = type;
443 ts->type = TCG_TYPE_I32;
444 ts->fixed_reg = 0;
445 ts->mem_allocated = 1;
446 ts->mem_reg = reg;
447 #ifdef TCG_TARGET_WORDS_BIGENDIAN
448 ts->mem_offset = offset + 4;
449 #else
450 ts->mem_offset = offset;
451 #endif
452 pstrcpy(buf, sizeof(buf), name);
453 pstrcat(buf, sizeof(buf), "_0");
454 ts->name = strdup(buf);
455 ts++;
457 ts->base_type = type;
458 ts->type = TCG_TYPE_I32;
459 ts->fixed_reg = 0;
460 ts->mem_allocated = 1;
461 ts->mem_reg = reg;
462 #ifdef TCG_TARGET_WORDS_BIGENDIAN
463 ts->mem_offset = offset;
464 #else
465 ts->mem_offset = offset + 4;
466 #endif
467 pstrcpy(buf, sizeof(buf), name);
468 pstrcat(buf, sizeof(buf), "_1");
469 ts->name = strdup(buf);
471 s->nb_globals += 2;
472 } else
473 #endif
475 tcg_temp_alloc(s, s->nb_globals + 1);
476 ts = &s->temps[s->nb_globals];
477 ts->base_type = type;
478 ts->type = type;
479 ts->fixed_reg = 0;
480 ts->mem_allocated = 1;
481 ts->mem_reg = reg;
482 ts->mem_offset = offset;
483 ts->name = name;
484 s->nb_globals++;
486 return idx;
489 TCGv_i32 tcg_global_mem_new_i32(int reg, intptr_t offset, const char *name)
491 int idx = tcg_global_mem_new_internal(TCG_TYPE_I32, reg, offset, name);
492 return MAKE_TCGV_I32(idx);
495 TCGv_i64 tcg_global_mem_new_i64(int reg, intptr_t offset, const char *name)
497 int idx = tcg_global_mem_new_internal(TCG_TYPE_I64, reg, offset, name);
498 return MAKE_TCGV_I64(idx);
501 static inline int tcg_temp_new_internal(TCGType type, int temp_local)
503 TCGContext *s = &tcg_ctx;
504 TCGTemp *ts;
505 int idx, k;
507 k = type + (temp_local ? TCG_TYPE_COUNT : 0);
508 idx = find_first_bit(s->free_temps[k].l, TCG_MAX_TEMPS);
509 if (idx < TCG_MAX_TEMPS) {
510 /* There is already an available temp with the right type. */
511 clear_bit(idx, s->free_temps[k].l);
513 ts = &s->temps[idx];
514 ts->temp_allocated = 1;
515 assert(ts->base_type == type);
516 assert(ts->temp_local == temp_local);
517 } else {
518 idx = s->nb_temps;
519 #if TCG_TARGET_REG_BITS == 32
520 if (type == TCG_TYPE_I64) {
521 tcg_temp_alloc(s, s->nb_temps + 2);
522 ts = &s->temps[s->nb_temps];
523 ts->base_type = type;
524 ts->type = TCG_TYPE_I32;
525 ts->temp_allocated = 1;
526 ts->temp_local = temp_local;
527 ts->name = NULL;
528 ts++;
529 ts->base_type = type;
530 ts->type = TCG_TYPE_I32;
531 ts->temp_allocated = 1;
532 ts->temp_local = temp_local;
533 ts->name = NULL;
534 s->nb_temps += 2;
535 } else
536 #endif
538 tcg_temp_alloc(s, s->nb_temps + 1);
539 ts = &s->temps[s->nb_temps];
540 ts->base_type = type;
541 ts->type = type;
542 ts->temp_allocated = 1;
543 ts->temp_local = temp_local;
544 ts->name = NULL;
545 s->nb_temps++;
549 #if defined(CONFIG_DEBUG_TCG)
550 s->temps_in_use++;
551 #endif
552 return idx;
555 TCGv_i32 tcg_temp_new_internal_i32(int temp_local)
557 int idx;
559 idx = tcg_temp_new_internal(TCG_TYPE_I32, temp_local);
560 return MAKE_TCGV_I32(idx);
563 TCGv_i64 tcg_temp_new_internal_i64(int temp_local)
565 int idx;
567 idx = tcg_temp_new_internal(TCG_TYPE_I64, temp_local);
568 return MAKE_TCGV_I64(idx);
571 static void tcg_temp_free_internal(int idx)
573 TCGContext *s = &tcg_ctx;
574 TCGTemp *ts;
575 int k;
577 #if defined(CONFIG_DEBUG_TCG)
578 s->temps_in_use--;
579 if (s->temps_in_use < 0) {
580 fprintf(stderr, "More temporaries freed than allocated!\n");
582 #endif
584 assert(idx >= s->nb_globals && idx < s->nb_temps);
585 ts = &s->temps[idx];
586 assert(ts->temp_allocated != 0);
587 ts->temp_allocated = 0;
589 k = ts->base_type + (ts->temp_local ? TCG_TYPE_COUNT : 0);
590 set_bit(idx, s->free_temps[k].l);
593 void tcg_temp_free_i32(TCGv_i32 arg)
595 tcg_temp_free_internal(GET_TCGV_I32(arg));
598 void tcg_temp_free_i64(TCGv_i64 arg)
600 tcg_temp_free_internal(GET_TCGV_I64(arg));
603 TCGv_i32 tcg_const_i32(int32_t val)
605 TCGv_i32 t0;
606 t0 = tcg_temp_new_i32();
607 tcg_gen_movi_i32(t0, val);
608 return t0;
611 TCGv_i64 tcg_const_i64(int64_t val)
613 TCGv_i64 t0;
614 t0 = tcg_temp_new_i64();
615 tcg_gen_movi_i64(t0, val);
616 return t0;
619 TCGv_i32 tcg_const_local_i32(int32_t val)
621 TCGv_i32 t0;
622 t0 = tcg_temp_local_new_i32();
623 tcg_gen_movi_i32(t0, val);
624 return t0;
627 TCGv_i64 tcg_const_local_i64(int64_t val)
629 TCGv_i64 t0;
630 t0 = tcg_temp_local_new_i64();
631 tcg_gen_movi_i64(t0, val);
632 return t0;
635 #if defined(CONFIG_DEBUG_TCG)
636 void tcg_clear_temp_count(void)
638 TCGContext *s = &tcg_ctx;
639 s->temps_in_use = 0;
642 int tcg_check_temp_count(void)
644 TCGContext *s = &tcg_ctx;
645 if (s->temps_in_use) {
646 /* Clear the count so that we don't give another
647 * warning immediately next time around.
649 s->temps_in_use = 0;
650 return 1;
652 return 0;
654 #endif
656 /* Note: we convert the 64 bit args to 32 bit and do some alignment
657 and endian swap. Maybe it would be better to do the alignment
658 and endian swap in tcg_reg_alloc_call(). */
659 void tcg_gen_callN(TCGContext *s, TCGv_ptr func, unsigned int flags,
660 int sizemask, TCGArg ret, int nargs, TCGArg *args)
662 int i;
663 int real_args;
664 int nb_rets;
665 TCGArg *nparam;
667 #if defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64
668 for (i = 0; i < nargs; ++i) {
669 int is_64bit = sizemask & (1 << (i+1)*2);
670 int is_signed = sizemask & (2 << (i+1)*2);
671 if (!is_64bit) {
672 TCGv_i64 temp = tcg_temp_new_i64();
673 TCGv_i64 orig = MAKE_TCGV_I64(args[i]);
674 if (is_signed) {
675 tcg_gen_ext32s_i64(temp, orig);
676 } else {
677 tcg_gen_ext32u_i64(temp, orig);
679 args[i] = GET_TCGV_I64(temp);
682 #endif /* TCG_TARGET_EXTEND_ARGS */
684 *s->gen_opc_ptr++ = INDEX_op_call;
685 nparam = s->gen_opparam_ptr++;
686 if (ret != TCG_CALL_DUMMY_ARG) {
687 #if TCG_TARGET_REG_BITS < 64
688 if (sizemask & 1) {
689 #ifdef TCG_TARGET_WORDS_BIGENDIAN
690 *s->gen_opparam_ptr++ = ret + 1;
691 *s->gen_opparam_ptr++ = ret;
692 #else
693 *s->gen_opparam_ptr++ = ret;
694 *s->gen_opparam_ptr++ = ret + 1;
695 #endif
696 nb_rets = 2;
697 } else
698 #endif
700 *s->gen_opparam_ptr++ = ret;
701 nb_rets = 1;
703 } else {
704 nb_rets = 0;
706 real_args = 0;
707 for (i = 0; i < nargs; i++) {
708 #if TCG_TARGET_REG_BITS < 64
709 int is_64bit = sizemask & (1 << (i+1)*2);
710 if (is_64bit) {
711 #ifdef TCG_TARGET_CALL_ALIGN_ARGS
712 /* some targets want aligned 64 bit args */
713 if (real_args & 1) {
714 *s->gen_opparam_ptr++ = TCG_CALL_DUMMY_ARG;
715 real_args++;
717 #endif
718 /* If stack grows up, then we will be placing successive
719 arguments at lower addresses, which means we need to
720 reverse the order compared to how we would normally
721 treat either big or little-endian. For those arguments
722 that will wind up in registers, this still works for
723 HPPA (the only current STACK_GROWSUP target) since the
724 argument registers are *also* allocated in decreasing
725 order. If another such target is added, this logic may
726 have to get more complicated to differentiate between
727 stack arguments and register arguments. */
728 #if defined(TCG_TARGET_WORDS_BIGENDIAN) != defined(TCG_TARGET_STACK_GROWSUP)
729 *s->gen_opparam_ptr++ = args[i] + 1;
730 *s->gen_opparam_ptr++ = args[i];
731 #else
732 *s->gen_opparam_ptr++ = args[i];
733 *s->gen_opparam_ptr++ = args[i] + 1;
734 #endif
735 real_args += 2;
736 continue;
738 #endif /* TCG_TARGET_REG_BITS < 64 */
740 *s->gen_opparam_ptr++ = args[i];
741 real_args++;
743 *s->gen_opparam_ptr++ = GET_TCGV_PTR(func);
745 *s->gen_opparam_ptr++ = flags;
747 *nparam = (nb_rets << 16) | (real_args + 1);
749 /* total parameters, needed to go backward in the instruction stream */
750 *s->gen_opparam_ptr++ = 1 + nb_rets + real_args + 3;
752 #if defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64
753 for (i = 0; i < nargs; ++i) {
754 int is_64bit = sizemask & (1 << (i+1)*2);
755 if (!is_64bit) {
756 TCGv_i64 temp = MAKE_TCGV_I64(args[i]);
757 tcg_temp_free_i64(temp);
760 #endif /* TCG_TARGET_EXTEND_ARGS */
763 #if TCG_TARGET_REG_BITS == 32
764 void tcg_gen_shifti_i64(TCGv_i64 ret, TCGv_i64 arg1,
765 int c, int right, int arith)
767 if (c == 0) {
768 tcg_gen_mov_i32(TCGV_LOW(ret), TCGV_LOW(arg1));
769 tcg_gen_mov_i32(TCGV_HIGH(ret), TCGV_HIGH(arg1));
770 } else if (c >= 32) {
771 c -= 32;
772 if (right) {
773 if (arith) {
774 tcg_gen_sari_i32(TCGV_LOW(ret), TCGV_HIGH(arg1), c);
775 tcg_gen_sari_i32(TCGV_HIGH(ret), TCGV_HIGH(arg1), 31);
776 } else {
777 tcg_gen_shri_i32(TCGV_LOW(ret), TCGV_HIGH(arg1), c);
778 tcg_gen_movi_i32(TCGV_HIGH(ret), 0);
780 } else {
781 tcg_gen_shli_i32(TCGV_HIGH(ret), TCGV_LOW(arg1), c);
782 tcg_gen_movi_i32(TCGV_LOW(ret), 0);
784 } else {
785 TCGv_i32 t0, t1;
787 t0 = tcg_temp_new_i32();
788 t1 = tcg_temp_new_i32();
789 if (right) {
790 tcg_gen_shli_i32(t0, TCGV_HIGH(arg1), 32 - c);
791 if (arith)
792 tcg_gen_sari_i32(t1, TCGV_HIGH(arg1), c);
793 else
794 tcg_gen_shri_i32(t1, TCGV_HIGH(arg1), c);
795 tcg_gen_shri_i32(TCGV_LOW(ret), TCGV_LOW(arg1), c);
796 tcg_gen_or_i32(TCGV_LOW(ret), TCGV_LOW(ret), t0);
797 tcg_gen_mov_i32(TCGV_HIGH(ret), t1);
798 } else {
799 tcg_gen_shri_i32(t0, TCGV_LOW(arg1), 32 - c);
800 /* Note: ret can be the same as arg1, so we use t1 */
801 tcg_gen_shli_i32(t1, TCGV_LOW(arg1), c);
802 tcg_gen_shli_i32(TCGV_HIGH(ret), TCGV_HIGH(arg1), c);
803 tcg_gen_or_i32(TCGV_HIGH(ret), TCGV_HIGH(ret), t0);
804 tcg_gen_mov_i32(TCGV_LOW(ret), t1);
806 tcg_temp_free_i32(t0);
807 tcg_temp_free_i32(t1);
810 #endif
812 static inline TCGMemOp tcg_canonicalize_memop(TCGMemOp op, bool is64, bool st)
814 switch (op & MO_SIZE) {
815 case MO_8:
816 op &= ~MO_BSWAP;
817 break;
818 case MO_16:
819 break;
820 case MO_32:
821 if (!is64) {
822 op &= ~MO_SIGN;
824 break;
825 case MO_64:
826 if (!is64) {
827 tcg_abort();
829 break;
831 if (st) {
832 op &= ~MO_SIGN;
834 return op;
837 static const TCGOpcode old_ld_opc[8] = {
838 [MO_UB] = INDEX_op_qemu_ld8u,
839 [MO_SB] = INDEX_op_qemu_ld8s,
840 [MO_UW] = INDEX_op_qemu_ld16u,
841 [MO_SW] = INDEX_op_qemu_ld16s,
842 #if TCG_TARGET_REG_BITS == 32
843 [MO_UL] = INDEX_op_qemu_ld32,
844 [MO_SL] = INDEX_op_qemu_ld32,
845 #else
846 [MO_UL] = INDEX_op_qemu_ld32u,
847 [MO_SL] = INDEX_op_qemu_ld32s,
848 #endif
849 [MO_Q] = INDEX_op_qemu_ld64,
852 static const TCGOpcode old_st_opc[4] = {
853 [MO_UB] = INDEX_op_qemu_st8,
854 [MO_UW] = INDEX_op_qemu_st16,
855 [MO_UL] = INDEX_op_qemu_st32,
856 [MO_Q] = INDEX_op_qemu_st64,
859 void tcg_gen_qemu_ld_i32(TCGv_i32 val, TCGv addr, TCGArg idx, TCGMemOp memop)
861 memop = tcg_canonicalize_memop(memop, 0, 0);
863 if (TCG_TARGET_HAS_new_ldst) {
864 *tcg_ctx.gen_opc_ptr++ = INDEX_op_qemu_ld_i32;
865 tcg_add_param_i32(val);
866 tcg_add_param_tl(addr);
867 *tcg_ctx.gen_opparam_ptr++ = memop;
868 *tcg_ctx.gen_opparam_ptr++ = idx;
869 return;
872 /* The old opcodes only support target-endian memory operations. */
873 assert((memop & MO_BSWAP) == MO_TE || (memop & MO_SIZE) == MO_8);
874 assert(old_ld_opc[memop & MO_SSIZE] != 0);
876 if (TCG_TARGET_REG_BITS == 32) {
877 *tcg_ctx.gen_opc_ptr++ = old_ld_opc[memop & MO_SSIZE];
878 tcg_add_param_i32(val);
879 tcg_add_param_tl(addr);
880 *tcg_ctx.gen_opparam_ptr++ = idx;
881 } else {
882 TCGv_i64 val64 = tcg_temp_new_i64();
884 *tcg_ctx.gen_opc_ptr++ = old_ld_opc[memop & MO_SSIZE];
885 tcg_add_param_i64(val64);
886 tcg_add_param_tl(addr);
887 *tcg_ctx.gen_opparam_ptr++ = idx;
889 tcg_gen_trunc_i64_i32(val, val64);
890 tcg_temp_free_i64(val64);
894 void tcg_gen_qemu_st_i32(TCGv_i32 val, TCGv addr, TCGArg idx, TCGMemOp memop)
896 memop = tcg_canonicalize_memop(memop, 0, 1);
898 if (TCG_TARGET_HAS_new_ldst) {
899 *tcg_ctx.gen_opc_ptr++ = INDEX_op_qemu_st_i32;
900 tcg_add_param_i32(val);
901 tcg_add_param_tl(addr);
902 *tcg_ctx.gen_opparam_ptr++ = memop;
903 *tcg_ctx.gen_opparam_ptr++ = idx;
904 return;
907 /* The old opcodes only support target-endian memory operations. */
908 assert((memop & MO_BSWAP) == MO_TE || (memop & MO_SIZE) == MO_8);
909 assert(old_st_opc[memop & MO_SIZE] != 0);
911 if (TCG_TARGET_REG_BITS == 32) {
912 *tcg_ctx.gen_opc_ptr++ = old_st_opc[memop & MO_SIZE];
913 tcg_add_param_i32(val);
914 tcg_add_param_tl(addr);
915 *tcg_ctx.gen_opparam_ptr++ = idx;
916 } else {
917 TCGv_i64 val64 = tcg_temp_new_i64();
919 tcg_gen_extu_i32_i64(val64, val);
921 *tcg_ctx.gen_opc_ptr++ = old_st_opc[memop & MO_SIZE];
922 tcg_add_param_i64(val64);
923 tcg_add_param_tl(addr);
924 *tcg_ctx.gen_opparam_ptr++ = idx;
926 tcg_temp_free_i64(val64);
930 void tcg_gen_qemu_ld_i64(TCGv_i64 val, TCGv addr, TCGArg idx, TCGMemOp memop)
932 memop = tcg_canonicalize_memop(memop, 1, 0);
934 #if TCG_TARGET_REG_BITS == 32
935 if ((memop & MO_SIZE) < MO_64) {
936 tcg_gen_qemu_ld_i32(TCGV_LOW(val), addr, idx, memop);
937 if (memop & MO_SIGN) {
938 tcg_gen_sari_i32(TCGV_HIGH(val), TCGV_LOW(val), 31);
939 } else {
940 tcg_gen_movi_i32(TCGV_HIGH(val), 0);
942 return;
944 #endif
946 if (TCG_TARGET_HAS_new_ldst) {
947 *tcg_ctx.gen_opc_ptr++ = INDEX_op_qemu_ld_i64;
948 tcg_add_param_i64(val);
949 tcg_add_param_tl(addr);
950 *tcg_ctx.gen_opparam_ptr++ = memop;
951 *tcg_ctx.gen_opparam_ptr++ = idx;
952 return;
955 /* The old opcodes only support target-endian memory operations. */
956 assert((memop & MO_BSWAP) == MO_TE || (memop & MO_SIZE) == MO_8);
957 assert(old_ld_opc[memop & MO_SSIZE] != 0);
959 *tcg_ctx.gen_opc_ptr++ = old_ld_opc[memop & MO_SSIZE];
960 tcg_add_param_i64(val);
961 tcg_add_param_tl(addr);
962 *tcg_ctx.gen_opparam_ptr++ = idx;
965 void tcg_gen_qemu_st_i64(TCGv_i64 val, TCGv addr, TCGArg idx, TCGMemOp memop)
967 memop = tcg_canonicalize_memop(memop, 1, 1);
969 #if TCG_TARGET_REG_BITS == 32
970 if ((memop & MO_SIZE) < MO_64) {
971 tcg_gen_qemu_st_i32(TCGV_LOW(val), addr, idx, memop);
972 return;
974 #endif
976 if (TCG_TARGET_HAS_new_ldst) {
977 *tcg_ctx.gen_opc_ptr++ = INDEX_op_qemu_st_i64;
978 tcg_add_param_i64(val);
979 tcg_add_param_tl(addr);
980 *tcg_ctx.gen_opparam_ptr++ = memop;
981 *tcg_ctx.gen_opparam_ptr++ = idx;
982 return;
985 /* The old opcodes only support target-endian memory operations. */
986 assert((memop & MO_BSWAP) == MO_TE || (memop & MO_SIZE) == MO_8);
987 assert(old_st_opc[memop & MO_SIZE] != 0);
989 *tcg_ctx.gen_opc_ptr++ = old_st_opc[memop & MO_SIZE];
990 tcg_add_param_i64(val);
991 tcg_add_param_tl(addr);
992 *tcg_ctx.gen_opparam_ptr++ = idx;
995 static void tcg_reg_alloc_start(TCGContext *s)
997 int i;
998 TCGTemp *ts;
999 for(i = 0; i < s->nb_globals; i++) {
1000 ts = &s->temps[i];
1001 if (ts->fixed_reg) {
1002 ts->val_type = TEMP_VAL_REG;
1003 } else {
1004 ts->val_type = TEMP_VAL_MEM;
1007 for(i = s->nb_globals; i < s->nb_temps; i++) {
1008 ts = &s->temps[i];
1009 if (ts->temp_local) {
1010 ts->val_type = TEMP_VAL_MEM;
1011 } else {
1012 ts->val_type = TEMP_VAL_DEAD;
1014 ts->mem_allocated = 0;
1015 ts->fixed_reg = 0;
1017 for(i = 0; i < TCG_TARGET_NB_REGS; i++) {
1018 s->reg_to_temp[i] = -1;
1022 static char *tcg_get_arg_str_idx(TCGContext *s, char *buf, int buf_size,
1023 int idx)
1025 TCGTemp *ts;
1027 assert(idx >= 0 && idx < s->nb_temps);
1028 ts = &s->temps[idx];
1029 if (idx < s->nb_globals) {
1030 pstrcpy(buf, buf_size, ts->name);
1031 } else {
1032 if (ts->temp_local)
1033 snprintf(buf, buf_size, "loc%d", idx - s->nb_globals);
1034 else
1035 snprintf(buf, buf_size, "tmp%d", idx - s->nb_globals);
1037 return buf;
1040 char *tcg_get_arg_str_i32(TCGContext *s, char *buf, int buf_size, TCGv_i32 arg)
1042 return tcg_get_arg_str_idx(s, buf, buf_size, GET_TCGV_I32(arg));
1045 char *tcg_get_arg_str_i64(TCGContext *s, char *buf, int buf_size, TCGv_i64 arg)
1047 return tcg_get_arg_str_idx(s, buf, buf_size, GET_TCGV_I64(arg));
1050 /* Find helper name. */
1051 static inline const char *tcg_find_helper(TCGContext *s, uintptr_t val)
1053 const char *ret = NULL;
1054 if (s->helpers) {
1055 ret = g_hash_table_lookup(s->helpers, (gpointer)val);
1057 return ret;
1060 static const char * const cond_name[] =
1062 [TCG_COND_NEVER] = "never",
1063 [TCG_COND_ALWAYS] = "always",
1064 [TCG_COND_EQ] = "eq",
1065 [TCG_COND_NE] = "ne",
1066 [TCG_COND_LT] = "lt",
1067 [TCG_COND_GE] = "ge",
1068 [TCG_COND_LE] = "le",
1069 [TCG_COND_GT] = "gt",
1070 [TCG_COND_LTU] = "ltu",
1071 [TCG_COND_GEU] = "geu",
1072 [TCG_COND_LEU] = "leu",
1073 [TCG_COND_GTU] = "gtu"
1076 static const char * const ldst_name[] =
1078 [MO_UB] = "ub",
1079 [MO_SB] = "sb",
1080 [MO_LEUW] = "leuw",
1081 [MO_LESW] = "lesw",
1082 [MO_LEUL] = "leul",
1083 [MO_LESL] = "lesl",
1084 [MO_LEQ] = "leq",
1085 [MO_BEUW] = "beuw",
1086 [MO_BESW] = "besw",
1087 [MO_BEUL] = "beul",
1088 [MO_BESL] = "besl",
1089 [MO_BEQ] = "beq",
1092 void tcg_dump_ops(TCGContext *s)
1094 const uint16_t *opc_ptr;
1095 const TCGArg *args;
1096 TCGArg arg;
1097 TCGOpcode c;
1098 int i, k, nb_oargs, nb_iargs, nb_cargs, first_insn;
1099 const TCGOpDef *def;
1100 char buf[128];
1102 first_insn = 1;
1103 opc_ptr = s->gen_opc_buf;
1104 args = s->gen_opparam_buf;
1105 while (opc_ptr < s->gen_opc_ptr) {
1106 c = *opc_ptr++;
1107 def = &tcg_op_defs[c];
1108 if (c == INDEX_op_debug_insn_start) {
1109 uint64_t pc;
1110 #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS
1111 pc = ((uint64_t)args[1] << 32) | args[0];
1112 #else
1113 pc = args[0];
1114 #endif
1115 if (!first_insn) {
1116 qemu_log("\n");
1118 qemu_log(" ---- 0x%" PRIx64, pc);
1119 first_insn = 0;
1120 nb_oargs = def->nb_oargs;
1121 nb_iargs = def->nb_iargs;
1122 nb_cargs = def->nb_cargs;
1123 } else if (c == INDEX_op_call) {
1124 TCGArg arg;
1126 /* variable number of arguments */
1127 arg = *args++;
1128 nb_oargs = arg >> 16;
1129 nb_iargs = arg & 0xffff;
1130 nb_cargs = def->nb_cargs;
1132 qemu_log(" %s ", def->name);
1134 /* function name */
1135 qemu_log("%s",
1136 tcg_get_arg_str_idx(s, buf, sizeof(buf),
1137 args[nb_oargs + nb_iargs - 1]));
1138 /* flags */
1139 qemu_log(",$0x%" TCG_PRIlx, args[nb_oargs + nb_iargs]);
1140 /* nb out args */
1141 qemu_log(",$%d", nb_oargs);
1142 for(i = 0; i < nb_oargs; i++) {
1143 qemu_log(",");
1144 qemu_log("%s", tcg_get_arg_str_idx(s, buf, sizeof(buf),
1145 args[i]));
1147 for(i = 0; i < (nb_iargs - 1); i++) {
1148 qemu_log(",");
1149 if (args[nb_oargs + i] == TCG_CALL_DUMMY_ARG) {
1150 qemu_log("<dummy>");
1151 } else {
1152 qemu_log("%s", tcg_get_arg_str_idx(s, buf, sizeof(buf),
1153 args[nb_oargs + i]));
1156 } else if (c == INDEX_op_movi_i32 || c == INDEX_op_movi_i64) {
1157 tcg_target_ulong val;
1158 const char *name;
1160 nb_oargs = def->nb_oargs;
1161 nb_iargs = def->nb_iargs;
1162 nb_cargs = def->nb_cargs;
1163 qemu_log(" %s %s,$", def->name,
1164 tcg_get_arg_str_idx(s, buf, sizeof(buf), args[0]));
1165 val = args[1];
1166 name = tcg_find_helper(s, val);
1167 if (name) {
1168 qemu_log("%s", name);
1169 } else {
1170 if (c == INDEX_op_movi_i32) {
1171 qemu_log("0x%x", (uint32_t)val);
1172 } else {
1173 qemu_log("0x%" PRIx64 , (uint64_t)val);
1176 } else {
1177 qemu_log(" %s ", def->name);
1178 if (c == INDEX_op_nopn) {
1179 /* variable number of arguments */
1180 nb_cargs = *args;
1181 nb_oargs = 0;
1182 nb_iargs = 0;
1183 } else {
1184 nb_oargs = def->nb_oargs;
1185 nb_iargs = def->nb_iargs;
1186 nb_cargs = def->nb_cargs;
1189 k = 0;
1190 for(i = 0; i < nb_oargs; i++) {
1191 if (k != 0) {
1192 qemu_log(",");
1194 qemu_log("%s", tcg_get_arg_str_idx(s, buf, sizeof(buf),
1195 args[k++]));
1197 for(i = 0; i < nb_iargs; i++) {
1198 if (k != 0) {
1199 qemu_log(",");
1201 qemu_log("%s", tcg_get_arg_str_idx(s, buf, sizeof(buf),
1202 args[k++]));
1204 switch (c) {
1205 case INDEX_op_brcond_i32:
1206 case INDEX_op_setcond_i32:
1207 case INDEX_op_movcond_i32:
1208 case INDEX_op_brcond2_i32:
1209 case INDEX_op_setcond2_i32:
1210 case INDEX_op_brcond_i64:
1211 case INDEX_op_setcond_i64:
1212 case INDEX_op_movcond_i64:
1213 if (args[k] < ARRAY_SIZE(cond_name) && cond_name[args[k]]) {
1214 qemu_log(",%s", cond_name[args[k++]]);
1215 } else {
1216 qemu_log(",$0x%" TCG_PRIlx, args[k++]);
1218 i = 1;
1219 break;
1220 case INDEX_op_qemu_ld_i32:
1221 case INDEX_op_qemu_st_i32:
1222 case INDEX_op_qemu_ld_i64:
1223 case INDEX_op_qemu_st_i64:
1224 if (args[k] < ARRAY_SIZE(ldst_name) && ldst_name[args[k]]) {
1225 qemu_log(",%s", ldst_name[args[k++]]);
1226 } else {
1227 qemu_log(",$0x%" TCG_PRIlx, args[k++]);
1229 i = 1;
1230 break;
1231 default:
1232 i = 0;
1233 break;
1235 for(; i < nb_cargs; i++) {
1236 if (k != 0) {
1237 qemu_log(",");
1239 arg = args[k++];
1240 qemu_log("$0x%" TCG_PRIlx, arg);
1243 qemu_log("\n");
1244 args += nb_iargs + nb_oargs + nb_cargs;
1248 /* we give more priority to constraints with less registers */
1249 static int get_constraint_priority(const TCGOpDef *def, int k)
1251 const TCGArgConstraint *arg_ct;
1253 int i, n;
1254 arg_ct = &def->args_ct[k];
1255 if (arg_ct->ct & TCG_CT_ALIAS) {
1256 /* an alias is equivalent to a single register */
1257 n = 1;
1258 } else {
1259 if (!(arg_ct->ct & TCG_CT_REG))
1260 return 0;
1261 n = 0;
1262 for(i = 0; i < TCG_TARGET_NB_REGS; i++) {
1263 if (tcg_regset_test_reg(arg_ct->u.regs, i))
1264 n++;
1267 return TCG_TARGET_NB_REGS - n + 1;
1270 /* sort from highest priority to lowest */
1271 static void sort_constraints(TCGOpDef *def, int start, int n)
1273 int i, j, p1, p2, tmp;
1275 for(i = 0; i < n; i++)
1276 def->sorted_args[start + i] = start + i;
1277 if (n <= 1)
1278 return;
1279 for(i = 0; i < n - 1; i++) {
1280 for(j = i + 1; j < n; j++) {
1281 p1 = get_constraint_priority(def, def->sorted_args[start + i]);
1282 p2 = get_constraint_priority(def, def->sorted_args[start + j]);
1283 if (p1 < p2) {
1284 tmp = def->sorted_args[start + i];
1285 def->sorted_args[start + i] = def->sorted_args[start + j];
1286 def->sorted_args[start + j] = tmp;
1292 void tcg_add_target_add_op_defs(const TCGTargetOpDef *tdefs)
1294 TCGOpcode op;
1295 TCGOpDef *def;
1296 const char *ct_str;
1297 int i, nb_args;
1299 for(;;) {
1300 if (tdefs->op == (TCGOpcode)-1)
1301 break;
1302 op = tdefs->op;
1303 assert((unsigned)op < NB_OPS);
1304 def = &tcg_op_defs[op];
1305 #if defined(CONFIG_DEBUG_TCG)
1306 /* Duplicate entry in op definitions? */
1307 assert(!def->used);
1308 def->used = 1;
1309 #endif
1310 nb_args = def->nb_iargs + def->nb_oargs;
1311 for(i = 0; i < nb_args; i++) {
1312 ct_str = tdefs->args_ct_str[i];
1313 /* Incomplete TCGTargetOpDef entry? */
1314 assert(ct_str != NULL);
1315 tcg_regset_clear(def->args_ct[i].u.regs);
1316 def->args_ct[i].ct = 0;
1317 if (ct_str[0] >= '0' && ct_str[0] <= '9') {
1318 int oarg;
1319 oarg = ct_str[0] - '0';
1320 assert(oarg < def->nb_oargs);
1321 assert(def->args_ct[oarg].ct & TCG_CT_REG);
1322 /* TCG_CT_ALIAS is for the output arguments. The input
1323 argument is tagged with TCG_CT_IALIAS. */
1324 def->args_ct[i] = def->args_ct[oarg];
1325 def->args_ct[oarg].ct = TCG_CT_ALIAS;
1326 def->args_ct[oarg].alias_index = i;
1327 def->args_ct[i].ct |= TCG_CT_IALIAS;
1328 def->args_ct[i].alias_index = oarg;
1329 } else {
1330 for(;;) {
1331 if (*ct_str == '\0')
1332 break;
1333 switch(*ct_str) {
1334 case 'i':
1335 def->args_ct[i].ct |= TCG_CT_CONST;
1336 ct_str++;
1337 break;
1338 default:
1339 if (target_parse_constraint(&def->args_ct[i], &ct_str) < 0) {
1340 fprintf(stderr, "Invalid constraint '%s' for arg %d of operation '%s'\n",
1341 ct_str, i, def->name);
1342 exit(1);
1349 /* TCGTargetOpDef entry with too much information? */
1350 assert(i == TCG_MAX_OP_ARGS || tdefs->args_ct_str[i] == NULL);
1352 /* sort the constraints (XXX: this is just an heuristic) */
1353 sort_constraints(def, 0, def->nb_oargs);
1354 sort_constraints(def, def->nb_oargs, def->nb_iargs);
1356 #if 0
1358 int i;
1360 printf("%s: sorted=", def->name);
1361 for(i = 0; i < def->nb_oargs + def->nb_iargs; i++)
1362 printf(" %d", def->sorted_args[i]);
1363 printf("\n");
1365 #endif
1366 tdefs++;
1369 #if defined(CONFIG_DEBUG_TCG)
1370 i = 0;
1371 for (op = 0; op < ARRAY_SIZE(tcg_op_defs); op++) {
1372 const TCGOpDef *def = &tcg_op_defs[op];
1373 if (def->flags & TCG_OPF_NOT_PRESENT) {
1374 /* Wrong entry in op definitions? */
1375 if (def->used) {
1376 fprintf(stderr, "Invalid op definition for %s\n", def->name);
1377 i = 1;
1379 } else {
1380 /* Missing entry in op definitions? */
1381 if (!def->used) {
1382 fprintf(stderr, "Missing op definition for %s\n", def->name);
1383 i = 1;
1387 if (i == 1) {
1388 tcg_abort();
1390 #endif
1393 #ifdef USE_LIVENESS_ANALYSIS
1395 /* set a nop for an operation using 'nb_args' */
1396 static inline void tcg_set_nop(TCGContext *s, uint16_t *opc_ptr,
1397 TCGArg *args, int nb_args)
1399 if (nb_args == 0) {
1400 *opc_ptr = INDEX_op_nop;
1401 } else {
1402 *opc_ptr = INDEX_op_nopn;
1403 args[0] = nb_args;
1404 args[nb_args - 1] = nb_args;
1408 /* liveness analysis: end of function: all temps are dead, and globals
1409 should be in memory. */
1410 static inline void tcg_la_func_end(TCGContext *s, uint8_t *dead_temps,
1411 uint8_t *mem_temps)
1413 memset(dead_temps, 1, s->nb_temps);
1414 memset(mem_temps, 1, s->nb_globals);
1415 memset(mem_temps + s->nb_globals, 0, s->nb_temps - s->nb_globals);
1418 /* liveness analysis: end of basic block: all temps are dead, globals
1419 and local temps should be in memory. */
1420 static inline void tcg_la_bb_end(TCGContext *s, uint8_t *dead_temps,
1421 uint8_t *mem_temps)
1423 int i;
1425 memset(dead_temps, 1, s->nb_temps);
1426 memset(mem_temps, 1, s->nb_globals);
1427 for(i = s->nb_globals; i < s->nb_temps; i++) {
1428 mem_temps[i] = s->temps[i].temp_local;
1432 /* Liveness analysis : update the opc_dead_args array to tell if a
1433 given input arguments is dead. Instructions updating dead
1434 temporaries are removed. */
1435 static void tcg_liveness_analysis(TCGContext *s)
1437 int i, op_index, nb_args, nb_iargs, nb_oargs, arg, nb_ops;
1438 TCGOpcode op, op_new, op_new2;
1439 TCGArg *args;
1440 const TCGOpDef *def;
1441 uint8_t *dead_temps, *mem_temps;
1442 uint16_t dead_args;
1443 uint8_t sync_args;
1444 bool have_op_new2;
1446 s->gen_opc_ptr++; /* skip end */
1448 nb_ops = s->gen_opc_ptr - s->gen_opc_buf;
1450 s->op_dead_args = tcg_malloc(nb_ops * sizeof(uint16_t));
1451 s->op_sync_args = tcg_malloc(nb_ops * sizeof(uint8_t));
1453 dead_temps = tcg_malloc(s->nb_temps);
1454 mem_temps = tcg_malloc(s->nb_temps);
1455 tcg_la_func_end(s, dead_temps, mem_temps);
1457 args = s->gen_opparam_ptr;
1458 op_index = nb_ops - 1;
1459 while (op_index >= 0) {
1460 op = s->gen_opc_buf[op_index];
1461 def = &tcg_op_defs[op];
1462 switch(op) {
1463 case INDEX_op_call:
1465 int call_flags;
1467 nb_args = args[-1];
1468 args -= nb_args;
1469 nb_iargs = args[0] & 0xffff;
1470 nb_oargs = args[0] >> 16;
1471 args++;
1472 call_flags = args[nb_oargs + nb_iargs];
1474 /* pure functions can be removed if their result is not
1475 used */
1476 if (call_flags & TCG_CALL_NO_SIDE_EFFECTS) {
1477 for(i = 0; i < nb_oargs; i++) {
1478 arg = args[i];
1479 if (!dead_temps[arg] || mem_temps[arg]) {
1480 goto do_not_remove_call;
1483 tcg_set_nop(s, s->gen_opc_buf + op_index,
1484 args - 1, nb_args);
1485 } else {
1486 do_not_remove_call:
1488 /* output args are dead */
1489 dead_args = 0;
1490 sync_args = 0;
1491 for(i = 0; i < nb_oargs; i++) {
1492 arg = args[i];
1493 if (dead_temps[arg]) {
1494 dead_args |= (1 << i);
1496 if (mem_temps[arg]) {
1497 sync_args |= (1 << i);
1499 dead_temps[arg] = 1;
1500 mem_temps[arg] = 0;
1503 if (!(call_flags & TCG_CALL_NO_READ_GLOBALS)) {
1504 /* globals should be synced to memory */
1505 memset(mem_temps, 1, s->nb_globals);
1507 if (!(call_flags & (TCG_CALL_NO_WRITE_GLOBALS |
1508 TCG_CALL_NO_READ_GLOBALS))) {
1509 /* globals should go back to memory */
1510 memset(dead_temps, 1, s->nb_globals);
1513 /* input args are live */
1514 for(i = nb_oargs; i < nb_iargs + nb_oargs; i++) {
1515 arg = args[i];
1516 if (arg != TCG_CALL_DUMMY_ARG) {
1517 if (dead_temps[arg]) {
1518 dead_args |= (1 << i);
1520 dead_temps[arg] = 0;
1523 s->op_dead_args[op_index] = dead_args;
1524 s->op_sync_args[op_index] = sync_args;
1526 args--;
1528 break;
1529 case INDEX_op_debug_insn_start:
1530 args -= def->nb_args;
1531 break;
1532 case INDEX_op_nopn:
1533 nb_args = args[-1];
1534 args -= nb_args;
1535 break;
1536 case INDEX_op_discard:
1537 args--;
1538 /* mark the temporary as dead */
1539 dead_temps[args[0]] = 1;
1540 mem_temps[args[0]] = 0;
1541 break;
1542 case INDEX_op_end:
1543 break;
1545 case INDEX_op_add2_i32:
1546 op_new = INDEX_op_add_i32;
1547 goto do_addsub2;
1548 case INDEX_op_sub2_i32:
1549 op_new = INDEX_op_sub_i32;
1550 goto do_addsub2;
1551 case INDEX_op_add2_i64:
1552 op_new = INDEX_op_add_i64;
1553 goto do_addsub2;
1554 case INDEX_op_sub2_i64:
1555 op_new = INDEX_op_sub_i64;
1556 do_addsub2:
1557 args -= 6;
1558 nb_iargs = 4;
1559 nb_oargs = 2;
1560 /* Test if the high part of the operation is dead, but not
1561 the low part. The result can be optimized to a simple
1562 add or sub. This happens often for x86_64 guest when the
1563 cpu mode is set to 32 bit. */
1564 if (dead_temps[args[1]] && !mem_temps[args[1]]) {
1565 if (dead_temps[args[0]] && !mem_temps[args[0]]) {
1566 goto do_remove;
1568 /* Create the single operation plus nop. */
1569 s->gen_opc_buf[op_index] = op = op_new;
1570 args[1] = args[2];
1571 args[2] = args[4];
1572 assert(s->gen_opc_buf[op_index + 1] == INDEX_op_nop);
1573 tcg_set_nop(s, s->gen_opc_buf + op_index + 1, args + 3, 3);
1574 /* Fall through and mark the single-word operation live. */
1575 nb_iargs = 2;
1576 nb_oargs = 1;
1578 goto do_not_remove;
1580 case INDEX_op_mulu2_i32:
1581 op_new = INDEX_op_mul_i32;
1582 op_new2 = INDEX_op_muluh_i32;
1583 have_op_new2 = TCG_TARGET_HAS_muluh_i32;
1584 goto do_mul2;
1585 case INDEX_op_muls2_i32:
1586 op_new = INDEX_op_mul_i32;
1587 op_new2 = INDEX_op_mulsh_i32;
1588 have_op_new2 = TCG_TARGET_HAS_mulsh_i32;
1589 goto do_mul2;
1590 case INDEX_op_mulu2_i64:
1591 op_new = INDEX_op_mul_i64;
1592 op_new2 = INDEX_op_muluh_i64;
1593 have_op_new2 = TCG_TARGET_HAS_muluh_i64;
1594 goto do_mul2;
1595 case INDEX_op_muls2_i64:
1596 op_new = INDEX_op_mul_i64;
1597 op_new2 = INDEX_op_mulsh_i64;
1598 have_op_new2 = TCG_TARGET_HAS_mulsh_i64;
1599 goto do_mul2;
1600 do_mul2:
1601 args -= 4;
1602 nb_iargs = 2;
1603 nb_oargs = 2;
1604 if (dead_temps[args[1]] && !mem_temps[args[1]]) {
1605 if (dead_temps[args[0]] && !mem_temps[args[0]]) {
1606 /* Both parts of the operation are dead. */
1607 goto do_remove;
1609 /* The high part of the operation is dead; generate the low. */
1610 s->gen_opc_buf[op_index] = op = op_new;
1611 args[1] = args[2];
1612 args[2] = args[3];
1613 } else if (have_op_new2 && dead_temps[args[0]]
1614 && !mem_temps[args[0]]) {
1615 /* The low part of the operation is dead; generate the high. */
1616 s->gen_opc_buf[op_index] = op = op_new2;
1617 args[0] = args[1];
1618 args[1] = args[2];
1619 args[2] = args[3];
1620 } else {
1621 goto do_not_remove;
1623 assert(s->gen_opc_buf[op_index + 1] == INDEX_op_nop);
1624 tcg_set_nop(s, s->gen_opc_buf + op_index + 1, args + 3, 1);
1625 /* Mark the single-word operation live. */
1626 nb_oargs = 1;
1627 goto do_not_remove;
1629 default:
1630 /* XXX: optimize by hardcoding common cases (e.g. triadic ops) */
1631 args -= def->nb_args;
1632 nb_iargs = def->nb_iargs;
1633 nb_oargs = def->nb_oargs;
1635 /* Test if the operation can be removed because all
1636 its outputs are dead. We assume that nb_oargs == 0
1637 implies side effects */
1638 if (!(def->flags & TCG_OPF_SIDE_EFFECTS) && nb_oargs != 0) {
1639 for(i = 0; i < nb_oargs; i++) {
1640 arg = args[i];
1641 if (!dead_temps[arg] || mem_temps[arg]) {
1642 goto do_not_remove;
1645 do_remove:
1646 tcg_set_nop(s, s->gen_opc_buf + op_index, args, def->nb_args);
1647 #ifdef CONFIG_PROFILER
1648 s->del_op_count++;
1649 #endif
1650 } else {
1651 do_not_remove:
1653 /* output args are dead */
1654 dead_args = 0;
1655 sync_args = 0;
1656 for(i = 0; i < nb_oargs; i++) {
1657 arg = args[i];
1658 if (dead_temps[arg]) {
1659 dead_args |= (1 << i);
1661 if (mem_temps[arg]) {
1662 sync_args |= (1 << i);
1664 dead_temps[arg] = 1;
1665 mem_temps[arg] = 0;
1668 /* if end of basic block, update */
1669 if (def->flags & TCG_OPF_BB_END) {
1670 tcg_la_bb_end(s, dead_temps, mem_temps);
1671 } else if (def->flags & TCG_OPF_SIDE_EFFECTS) {
1672 /* globals should be synced to memory */
1673 memset(mem_temps, 1, s->nb_globals);
1676 /* input args are live */
1677 for(i = nb_oargs; i < nb_oargs + nb_iargs; i++) {
1678 arg = args[i];
1679 if (dead_temps[arg]) {
1680 dead_args |= (1 << i);
1682 dead_temps[arg] = 0;
1684 s->op_dead_args[op_index] = dead_args;
1685 s->op_sync_args[op_index] = sync_args;
1687 break;
1689 op_index--;
1692 if (args != s->gen_opparam_buf) {
1693 tcg_abort();
1696 #else
1697 /* dummy liveness analysis */
1698 static void tcg_liveness_analysis(TCGContext *s)
1700 int nb_ops;
1701 nb_ops = s->gen_opc_ptr - s->gen_opc_buf;
1703 s->op_dead_args = tcg_malloc(nb_ops * sizeof(uint16_t));
1704 memset(s->op_dead_args, 0, nb_ops * sizeof(uint16_t));
1705 s->op_sync_args = tcg_malloc(nb_ops * sizeof(uint8_t));
1706 memset(s->op_sync_args, 0, nb_ops * sizeof(uint8_t));
1708 #endif
1710 #ifndef NDEBUG
1711 static void dump_regs(TCGContext *s)
1713 TCGTemp *ts;
1714 int i;
1715 char buf[64];
1717 for(i = 0; i < s->nb_temps; i++) {
1718 ts = &s->temps[i];
1719 printf(" %10s: ", tcg_get_arg_str_idx(s, buf, sizeof(buf), i));
1720 switch(ts->val_type) {
1721 case TEMP_VAL_REG:
1722 printf("%s", tcg_target_reg_names[ts->reg]);
1723 break;
1724 case TEMP_VAL_MEM:
1725 printf("%d(%s)", (int)ts->mem_offset, tcg_target_reg_names[ts->mem_reg]);
1726 break;
1727 case TEMP_VAL_CONST:
1728 printf("$0x%" TCG_PRIlx, ts->val);
1729 break;
1730 case TEMP_VAL_DEAD:
1731 printf("D");
1732 break;
1733 default:
1734 printf("???");
1735 break;
1737 printf("\n");
1740 for(i = 0; i < TCG_TARGET_NB_REGS; i++) {
1741 if (s->reg_to_temp[i] >= 0) {
1742 printf("%s: %s\n",
1743 tcg_target_reg_names[i],
1744 tcg_get_arg_str_idx(s, buf, sizeof(buf), s->reg_to_temp[i]));
1749 static void check_regs(TCGContext *s)
1751 int reg, k;
1752 TCGTemp *ts;
1753 char buf[64];
1755 for(reg = 0; reg < TCG_TARGET_NB_REGS; reg++) {
1756 k = s->reg_to_temp[reg];
1757 if (k >= 0) {
1758 ts = &s->temps[k];
1759 if (ts->val_type != TEMP_VAL_REG ||
1760 ts->reg != reg) {
1761 printf("Inconsistency for register %s:\n",
1762 tcg_target_reg_names[reg]);
1763 goto fail;
1767 for(k = 0; k < s->nb_temps; k++) {
1768 ts = &s->temps[k];
1769 if (ts->val_type == TEMP_VAL_REG &&
1770 !ts->fixed_reg &&
1771 s->reg_to_temp[ts->reg] != k) {
1772 printf("Inconsistency for temp %s:\n",
1773 tcg_get_arg_str_idx(s, buf, sizeof(buf), k));
1774 fail:
1775 printf("reg state:\n");
1776 dump_regs(s);
1777 tcg_abort();
1781 #endif
1783 static void temp_allocate_frame(TCGContext *s, int temp)
1785 TCGTemp *ts;
1786 ts = &s->temps[temp];
1787 #if !(defined(__sparc__) && TCG_TARGET_REG_BITS == 64)
1788 /* Sparc64 stack is accessed with offset of 2047 */
1789 s->current_frame_offset = (s->current_frame_offset +
1790 (tcg_target_long)sizeof(tcg_target_long) - 1) &
1791 ~(sizeof(tcg_target_long) - 1);
1792 #endif
1793 if (s->current_frame_offset + (tcg_target_long)sizeof(tcg_target_long) >
1794 s->frame_end) {
1795 tcg_abort();
1797 ts->mem_offset = s->current_frame_offset;
1798 ts->mem_reg = s->frame_reg;
1799 ts->mem_allocated = 1;
1800 s->current_frame_offset += sizeof(tcg_target_long);
1803 /* sync register 'reg' by saving it to the corresponding temporary */
1804 static inline void tcg_reg_sync(TCGContext *s, int reg)
1806 TCGTemp *ts;
1807 int temp;
1809 temp = s->reg_to_temp[reg];
1810 ts = &s->temps[temp];
1811 assert(ts->val_type == TEMP_VAL_REG);
1812 if (!ts->mem_coherent && !ts->fixed_reg) {
1813 if (!ts->mem_allocated) {
1814 temp_allocate_frame(s, temp);
1816 tcg_out_st(s, ts->type, reg, ts->mem_reg, ts->mem_offset);
1818 ts->mem_coherent = 1;
1821 /* free register 'reg' by spilling the corresponding temporary if necessary */
1822 static void tcg_reg_free(TCGContext *s, int reg)
1824 int temp;
1826 temp = s->reg_to_temp[reg];
1827 if (temp != -1) {
1828 tcg_reg_sync(s, reg);
1829 s->temps[temp].val_type = TEMP_VAL_MEM;
1830 s->reg_to_temp[reg] = -1;
1834 /* Allocate a register belonging to reg1 & ~reg2 */
1835 static int tcg_reg_alloc(TCGContext *s, TCGRegSet reg1, TCGRegSet reg2)
1837 int i, reg;
1838 TCGRegSet reg_ct;
1840 tcg_regset_andnot(reg_ct, reg1, reg2);
1842 /* first try free registers */
1843 for(i = 0; i < ARRAY_SIZE(tcg_target_reg_alloc_order); i++) {
1844 reg = tcg_target_reg_alloc_order[i];
1845 if (tcg_regset_test_reg(reg_ct, reg) && s->reg_to_temp[reg] == -1)
1846 return reg;
1849 /* XXX: do better spill choice */
1850 for(i = 0; i < ARRAY_SIZE(tcg_target_reg_alloc_order); i++) {
1851 reg = tcg_target_reg_alloc_order[i];
1852 if (tcg_regset_test_reg(reg_ct, reg)) {
1853 tcg_reg_free(s, reg);
1854 return reg;
1858 tcg_abort();
1861 /* mark a temporary as dead. */
1862 static inline void temp_dead(TCGContext *s, int temp)
1864 TCGTemp *ts;
1866 ts = &s->temps[temp];
1867 if (!ts->fixed_reg) {
1868 if (ts->val_type == TEMP_VAL_REG) {
1869 s->reg_to_temp[ts->reg] = -1;
1871 if (temp < s->nb_globals || ts->temp_local) {
1872 ts->val_type = TEMP_VAL_MEM;
1873 } else {
1874 ts->val_type = TEMP_VAL_DEAD;
1879 /* sync a temporary to memory. 'allocated_regs' is used in case a
1880 temporary registers needs to be allocated to store a constant. */
1881 static inline void temp_sync(TCGContext *s, int temp, TCGRegSet allocated_regs)
1883 TCGTemp *ts;
1885 ts = &s->temps[temp];
1886 if (!ts->fixed_reg) {
1887 switch(ts->val_type) {
1888 case TEMP_VAL_CONST:
1889 ts->reg = tcg_reg_alloc(s, tcg_target_available_regs[ts->type],
1890 allocated_regs);
1891 ts->val_type = TEMP_VAL_REG;
1892 s->reg_to_temp[ts->reg] = temp;
1893 ts->mem_coherent = 0;
1894 tcg_out_movi(s, ts->type, ts->reg, ts->val);
1895 /* fallthrough*/
1896 case TEMP_VAL_REG:
1897 tcg_reg_sync(s, ts->reg);
1898 break;
1899 case TEMP_VAL_DEAD:
1900 case TEMP_VAL_MEM:
1901 break;
1902 default:
1903 tcg_abort();
1908 /* save a temporary to memory. 'allocated_regs' is used in case a
1909 temporary registers needs to be allocated to store a constant. */
1910 static inline void temp_save(TCGContext *s, int temp, TCGRegSet allocated_regs)
1912 #ifdef USE_LIVENESS_ANALYSIS
1913 /* The liveness analysis already ensures that globals are back
1914 in memory. Keep an assert for safety. */
1915 assert(s->temps[temp].val_type == TEMP_VAL_MEM || s->temps[temp].fixed_reg);
1916 #else
1917 temp_sync(s, temp, allocated_regs);
1918 temp_dead(s, temp);
1919 #endif
1922 /* save globals to their canonical location and assume they can be
1923 modified be the following code. 'allocated_regs' is used in case a
1924 temporary registers needs to be allocated to store a constant. */
1925 static void save_globals(TCGContext *s, TCGRegSet allocated_regs)
1927 int i;
1929 for(i = 0; i < s->nb_globals; i++) {
1930 temp_save(s, i, allocated_regs);
1934 /* sync globals to their canonical location and assume they can be
1935 read by the following code. 'allocated_regs' is used in case a
1936 temporary registers needs to be allocated to store a constant. */
1937 static void sync_globals(TCGContext *s, TCGRegSet allocated_regs)
1939 int i;
1941 for (i = 0; i < s->nb_globals; i++) {
1942 #ifdef USE_LIVENESS_ANALYSIS
1943 assert(s->temps[i].val_type != TEMP_VAL_REG || s->temps[i].fixed_reg ||
1944 s->temps[i].mem_coherent);
1945 #else
1946 temp_sync(s, i, allocated_regs);
1947 #endif
1951 /* at the end of a basic block, we assume all temporaries are dead and
1952 all globals are stored at their canonical location. */
1953 static void tcg_reg_alloc_bb_end(TCGContext *s, TCGRegSet allocated_regs)
1955 TCGTemp *ts;
1956 int i;
1958 for(i = s->nb_globals; i < s->nb_temps; i++) {
1959 ts = &s->temps[i];
1960 if (ts->temp_local) {
1961 temp_save(s, i, allocated_regs);
1962 } else {
1963 #ifdef USE_LIVENESS_ANALYSIS
1964 /* The liveness analysis already ensures that temps are dead.
1965 Keep an assert for safety. */
1966 assert(ts->val_type == TEMP_VAL_DEAD);
1967 #else
1968 temp_dead(s, i);
1969 #endif
1973 save_globals(s, allocated_regs);
1976 #define IS_DEAD_ARG(n) ((dead_args >> (n)) & 1)
1977 #define NEED_SYNC_ARG(n) ((sync_args >> (n)) & 1)
1979 static void tcg_reg_alloc_movi(TCGContext *s, const TCGArg *args,
1980 uint16_t dead_args, uint8_t sync_args)
1982 TCGTemp *ots;
1983 tcg_target_ulong val;
1985 ots = &s->temps[args[0]];
1986 val = args[1];
1988 if (ots->fixed_reg) {
1989 /* for fixed registers, we do not do any constant
1990 propagation */
1991 tcg_out_movi(s, ots->type, ots->reg, val);
1992 } else {
1993 /* The movi is not explicitly generated here */
1994 if (ots->val_type == TEMP_VAL_REG)
1995 s->reg_to_temp[ots->reg] = -1;
1996 ots->val_type = TEMP_VAL_CONST;
1997 ots->val = val;
1999 if (NEED_SYNC_ARG(0)) {
2000 temp_sync(s, args[0], s->reserved_regs);
2002 if (IS_DEAD_ARG(0)) {
2003 temp_dead(s, args[0]);
2007 static void tcg_reg_alloc_mov(TCGContext *s, const TCGOpDef *def,
2008 const TCGArg *args, uint16_t dead_args,
2009 uint8_t sync_args)
2011 TCGRegSet allocated_regs;
2012 TCGTemp *ts, *ots;
2013 const TCGArgConstraint *arg_ct, *oarg_ct;
2015 tcg_regset_set(allocated_regs, s->reserved_regs);
2016 ots = &s->temps[args[0]];
2017 ts = &s->temps[args[1]];
2018 oarg_ct = &def->args_ct[0];
2019 arg_ct = &def->args_ct[1];
2021 /* If the source value is not in a register, and we're going to be
2022 forced to have it in a register in order to perform the copy,
2023 then copy the SOURCE value into its own register first. That way
2024 we don't have to reload SOURCE the next time it is used. */
2025 if (((NEED_SYNC_ARG(0) || ots->fixed_reg) && ts->val_type != TEMP_VAL_REG)
2026 || ts->val_type == TEMP_VAL_MEM) {
2027 ts->reg = tcg_reg_alloc(s, arg_ct->u.regs, allocated_regs);
2028 if (ts->val_type == TEMP_VAL_MEM) {
2029 tcg_out_ld(s, ts->type, ts->reg, ts->mem_reg, ts->mem_offset);
2030 ts->mem_coherent = 1;
2031 } else if (ts->val_type == TEMP_VAL_CONST) {
2032 tcg_out_movi(s, ts->type, ts->reg, ts->val);
2034 s->reg_to_temp[ts->reg] = args[1];
2035 ts->val_type = TEMP_VAL_REG;
2038 if (IS_DEAD_ARG(0) && !ots->fixed_reg) {
2039 /* mov to a non-saved dead register makes no sense (even with
2040 liveness analysis disabled). */
2041 assert(NEED_SYNC_ARG(0));
2042 /* The code above should have moved the temp to a register. */
2043 assert(ts->val_type == TEMP_VAL_REG);
2044 if (!ots->mem_allocated) {
2045 temp_allocate_frame(s, args[0]);
2047 tcg_out_st(s, ots->type, ts->reg, ots->mem_reg, ots->mem_offset);
2048 if (IS_DEAD_ARG(1)) {
2049 temp_dead(s, args[1]);
2051 temp_dead(s, args[0]);
2052 } else if (ts->val_type == TEMP_VAL_CONST) {
2053 /* propagate constant */
2054 if (ots->val_type == TEMP_VAL_REG) {
2055 s->reg_to_temp[ots->reg] = -1;
2057 ots->val_type = TEMP_VAL_CONST;
2058 ots->val = ts->val;
2059 } else {
2060 /* The code in the first if block should have moved the
2061 temp to a register. */
2062 assert(ts->val_type == TEMP_VAL_REG);
2063 if (IS_DEAD_ARG(1) && !ts->fixed_reg && !ots->fixed_reg) {
2064 /* the mov can be suppressed */
2065 if (ots->val_type == TEMP_VAL_REG) {
2066 s->reg_to_temp[ots->reg] = -1;
2068 ots->reg = ts->reg;
2069 temp_dead(s, args[1]);
2070 } else {
2071 if (ots->val_type != TEMP_VAL_REG) {
2072 /* When allocating a new register, make sure to not spill the
2073 input one. */
2074 tcg_regset_set_reg(allocated_regs, ts->reg);
2075 ots->reg = tcg_reg_alloc(s, oarg_ct->u.regs, allocated_regs);
2077 tcg_out_mov(s, ots->type, ots->reg, ts->reg);
2079 ots->val_type = TEMP_VAL_REG;
2080 ots->mem_coherent = 0;
2081 s->reg_to_temp[ots->reg] = args[0];
2082 if (NEED_SYNC_ARG(0)) {
2083 tcg_reg_sync(s, ots->reg);
2088 static void tcg_reg_alloc_op(TCGContext *s,
2089 const TCGOpDef *def, TCGOpcode opc,
2090 const TCGArg *args, uint16_t dead_args,
2091 uint8_t sync_args)
2093 TCGRegSet allocated_regs;
2094 int i, k, nb_iargs, nb_oargs, reg;
2095 TCGArg arg;
2096 const TCGArgConstraint *arg_ct;
2097 TCGTemp *ts;
2098 TCGArg new_args[TCG_MAX_OP_ARGS];
2099 int const_args[TCG_MAX_OP_ARGS];
2101 nb_oargs = def->nb_oargs;
2102 nb_iargs = def->nb_iargs;
2104 /* copy constants */
2105 memcpy(new_args + nb_oargs + nb_iargs,
2106 args + nb_oargs + nb_iargs,
2107 sizeof(TCGArg) * def->nb_cargs);
2109 /* satisfy input constraints */
2110 tcg_regset_set(allocated_regs, s->reserved_regs);
2111 for(k = 0; k < nb_iargs; k++) {
2112 i = def->sorted_args[nb_oargs + k];
2113 arg = args[i];
2114 arg_ct = &def->args_ct[i];
2115 ts = &s->temps[arg];
2116 if (ts->val_type == TEMP_VAL_MEM) {
2117 reg = tcg_reg_alloc(s, arg_ct->u.regs, allocated_regs);
2118 tcg_out_ld(s, ts->type, reg, ts->mem_reg, ts->mem_offset);
2119 ts->val_type = TEMP_VAL_REG;
2120 ts->reg = reg;
2121 ts->mem_coherent = 1;
2122 s->reg_to_temp[reg] = arg;
2123 } else if (ts->val_type == TEMP_VAL_CONST) {
2124 if (tcg_target_const_match(ts->val, arg_ct)) {
2125 /* constant is OK for instruction */
2126 const_args[i] = 1;
2127 new_args[i] = ts->val;
2128 goto iarg_end;
2129 } else {
2130 /* need to move to a register */
2131 reg = tcg_reg_alloc(s, arg_ct->u.regs, allocated_regs);
2132 tcg_out_movi(s, ts->type, reg, ts->val);
2133 ts->val_type = TEMP_VAL_REG;
2134 ts->reg = reg;
2135 ts->mem_coherent = 0;
2136 s->reg_to_temp[reg] = arg;
2139 assert(ts->val_type == TEMP_VAL_REG);
2140 if (arg_ct->ct & TCG_CT_IALIAS) {
2141 if (ts->fixed_reg) {
2142 /* if fixed register, we must allocate a new register
2143 if the alias is not the same register */
2144 if (arg != args[arg_ct->alias_index])
2145 goto allocate_in_reg;
2146 } else {
2147 /* if the input is aliased to an output and if it is
2148 not dead after the instruction, we must allocate
2149 a new register and move it */
2150 if (!IS_DEAD_ARG(i)) {
2151 goto allocate_in_reg;
2155 reg = ts->reg;
2156 if (tcg_regset_test_reg(arg_ct->u.regs, reg)) {
2157 /* nothing to do : the constraint is satisfied */
2158 } else {
2159 allocate_in_reg:
2160 /* allocate a new register matching the constraint
2161 and move the temporary register into it */
2162 reg = tcg_reg_alloc(s, arg_ct->u.regs, allocated_regs);
2163 tcg_out_mov(s, ts->type, reg, ts->reg);
2165 new_args[i] = reg;
2166 const_args[i] = 0;
2167 tcg_regset_set_reg(allocated_regs, reg);
2168 iarg_end: ;
2171 /* mark dead temporaries and free the associated registers */
2172 for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) {
2173 if (IS_DEAD_ARG(i)) {
2174 temp_dead(s, args[i]);
2178 if (def->flags & TCG_OPF_BB_END) {
2179 tcg_reg_alloc_bb_end(s, allocated_regs);
2180 } else {
2181 if (def->flags & TCG_OPF_CALL_CLOBBER) {
2182 /* XXX: permit generic clobber register list ? */
2183 for(reg = 0; reg < TCG_TARGET_NB_REGS; reg++) {
2184 if (tcg_regset_test_reg(tcg_target_call_clobber_regs, reg)) {
2185 tcg_reg_free(s, reg);
2189 if (def->flags & TCG_OPF_SIDE_EFFECTS) {
2190 /* sync globals if the op has side effects and might trigger
2191 an exception. */
2192 sync_globals(s, allocated_regs);
2195 /* satisfy the output constraints */
2196 tcg_regset_set(allocated_regs, s->reserved_regs);
2197 for(k = 0; k < nb_oargs; k++) {
2198 i = def->sorted_args[k];
2199 arg = args[i];
2200 arg_ct = &def->args_ct[i];
2201 ts = &s->temps[arg];
2202 if (arg_ct->ct & TCG_CT_ALIAS) {
2203 reg = new_args[arg_ct->alias_index];
2204 } else {
2205 /* if fixed register, we try to use it */
2206 reg = ts->reg;
2207 if (ts->fixed_reg &&
2208 tcg_regset_test_reg(arg_ct->u.regs, reg)) {
2209 goto oarg_end;
2211 reg = tcg_reg_alloc(s, arg_ct->u.regs, allocated_regs);
2213 tcg_regset_set_reg(allocated_regs, reg);
2214 /* if a fixed register is used, then a move will be done afterwards */
2215 if (!ts->fixed_reg) {
2216 if (ts->val_type == TEMP_VAL_REG) {
2217 s->reg_to_temp[ts->reg] = -1;
2219 ts->val_type = TEMP_VAL_REG;
2220 ts->reg = reg;
2221 /* temp value is modified, so the value kept in memory is
2222 potentially not the same */
2223 ts->mem_coherent = 0;
2224 s->reg_to_temp[reg] = arg;
2226 oarg_end:
2227 new_args[i] = reg;
2231 /* emit instruction */
2232 tcg_out_op(s, opc, new_args, const_args);
2234 /* move the outputs in the correct register if needed */
2235 for(i = 0; i < nb_oargs; i++) {
2236 ts = &s->temps[args[i]];
2237 reg = new_args[i];
2238 if (ts->fixed_reg && ts->reg != reg) {
2239 tcg_out_mov(s, ts->type, ts->reg, reg);
2241 if (NEED_SYNC_ARG(i)) {
2242 tcg_reg_sync(s, reg);
2244 if (IS_DEAD_ARG(i)) {
2245 temp_dead(s, args[i]);
2250 #ifdef TCG_TARGET_STACK_GROWSUP
2251 #define STACK_DIR(x) (-(x))
2252 #else
2253 #define STACK_DIR(x) (x)
2254 #endif
2256 static int tcg_reg_alloc_call(TCGContext *s, const TCGOpDef *def,
2257 TCGOpcode opc, const TCGArg *args,
2258 uint16_t dead_args, uint8_t sync_args)
2260 int nb_iargs, nb_oargs, flags, nb_regs, i, reg, nb_params;
2261 TCGArg arg, func_arg;
2262 TCGTemp *ts;
2263 intptr_t stack_offset;
2264 size_t call_stack_size;
2265 uintptr_t func_addr;
2266 int const_func_arg, allocate_args;
2267 TCGRegSet allocated_regs;
2268 const TCGArgConstraint *arg_ct;
2270 arg = *args++;
2272 nb_oargs = arg >> 16;
2273 nb_iargs = arg & 0xffff;
2274 nb_params = nb_iargs - 1;
2276 flags = args[nb_oargs + nb_iargs];
2278 nb_regs = ARRAY_SIZE(tcg_target_call_iarg_regs);
2279 if (nb_regs > nb_params)
2280 nb_regs = nb_params;
2282 /* assign stack slots first */
2283 call_stack_size = (nb_params - nb_regs) * sizeof(tcg_target_long);
2284 call_stack_size = (call_stack_size + TCG_TARGET_STACK_ALIGN - 1) &
2285 ~(TCG_TARGET_STACK_ALIGN - 1);
2286 allocate_args = (call_stack_size > TCG_STATIC_CALL_ARGS_SIZE);
2287 if (allocate_args) {
2288 /* XXX: if more than TCG_STATIC_CALL_ARGS_SIZE is needed,
2289 preallocate call stack */
2290 tcg_abort();
2293 stack_offset = TCG_TARGET_CALL_STACK_OFFSET;
2294 for(i = nb_regs; i < nb_params; i++) {
2295 arg = args[nb_oargs + i];
2296 #ifdef TCG_TARGET_STACK_GROWSUP
2297 stack_offset -= sizeof(tcg_target_long);
2298 #endif
2299 if (arg != TCG_CALL_DUMMY_ARG) {
2300 ts = &s->temps[arg];
2301 if (ts->val_type == TEMP_VAL_REG) {
2302 tcg_out_st(s, ts->type, ts->reg, TCG_REG_CALL_STACK, stack_offset);
2303 } else if (ts->val_type == TEMP_VAL_MEM) {
2304 reg = tcg_reg_alloc(s, tcg_target_available_regs[ts->type],
2305 s->reserved_regs);
2306 /* XXX: not correct if reading values from the stack */
2307 tcg_out_ld(s, ts->type, reg, ts->mem_reg, ts->mem_offset);
2308 tcg_out_st(s, ts->type, reg, TCG_REG_CALL_STACK, stack_offset);
2309 } else if (ts->val_type == TEMP_VAL_CONST) {
2310 reg = tcg_reg_alloc(s, tcg_target_available_regs[ts->type],
2311 s->reserved_regs);
2312 /* XXX: sign extend may be needed on some targets */
2313 tcg_out_movi(s, ts->type, reg, ts->val);
2314 tcg_out_st(s, ts->type, reg, TCG_REG_CALL_STACK, stack_offset);
2315 } else {
2316 tcg_abort();
2319 #ifndef TCG_TARGET_STACK_GROWSUP
2320 stack_offset += sizeof(tcg_target_long);
2321 #endif
2324 /* assign input registers */
2325 tcg_regset_set(allocated_regs, s->reserved_regs);
2326 for(i = 0; i < nb_regs; i++) {
2327 arg = args[nb_oargs + i];
2328 if (arg != TCG_CALL_DUMMY_ARG) {
2329 ts = &s->temps[arg];
2330 reg = tcg_target_call_iarg_regs[i];
2331 tcg_reg_free(s, reg);
2332 if (ts->val_type == TEMP_VAL_REG) {
2333 if (ts->reg != reg) {
2334 tcg_out_mov(s, ts->type, reg, ts->reg);
2336 } else if (ts->val_type == TEMP_VAL_MEM) {
2337 tcg_out_ld(s, ts->type, reg, ts->mem_reg, ts->mem_offset);
2338 } else if (ts->val_type == TEMP_VAL_CONST) {
2339 /* XXX: sign extend ? */
2340 tcg_out_movi(s, ts->type, reg, ts->val);
2341 } else {
2342 tcg_abort();
2344 tcg_regset_set_reg(allocated_regs, reg);
2348 /* assign function address */
2349 func_arg = args[nb_oargs + nb_iargs - 1];
2350 arg_ct = &def->args_ct[0];
2351 ts = &s->temps[func_arg];
2352 func_addr = ts->val;
2353 const_func_arg = 0;
2354 if (ts->val_type == TEMP_VAL_MEM) {
2355 reg = tcg_reg_alloc(s, arg_ct->u.regs, allocated_regs);
2356 tcg_out_ld(s, ts->type, reg, ts->mem_reg, ts->mem_offset);
2357 func_arg = reg;
2358 tcg_regset_set_reg(allocated_regs, reg);
2359 } else if (ts->val_type == TEMP_VAL_REG) {
2360 reg = ts->reg;
2361 if (!tcg_regset_test_reg(arg_ct->u.regs, reg)) {
2362 reg = tcg_reg_alloc(s, arg_ct->u.regs, allocated_regs);
2363 tcg_out_mov(s, ts->type, reg, ts->reg);
2365 func_arg = reg;
2366 tcg_regset_set_reg(allocated_regs, reg);
2367 } else if (ts->val_type == TEMP_VAL_CONST) {
2368 if (tcg_target_const_match(func_addr, arg_ct)) {
2369 const_func_arg = 1;
2370 func_arg = func_addr;
2371 } else {
2372 reg = tcg_reg_alloc(s, arg_ct->u.regs, allocated_regs);
2373 tcg_out_movi(s, ts->type, reg, func_addr);
2374 func_arg = reg;
2375 tcg_regset_set_reg(allocated_regs, reg);
2377 } else {
2378 tcg_abort();
2382 /* mark dead temporaries and free the associated registers */
2383 for(i = nb_oargs; i < nb_iargs + nb_oargs; i++) {
2384 if (IS_DEAD_ARG(i)) {
2385 temp_dead(s, args[i]);
2389 /* clobber call registers */
2390 for(reg = 0; reg < TCG_TARGET_NB_REGS; reg++) {
2391 if (tcg_regset_test_reg(tcg_target_call_clobber_regs, reg)) {
2392 tcg_reg_free(s, reg);
2396 /* Save globals if they might be written by the helper, sync them if
2397 they might be read. */
2398 if (flags & TCG_CALL_NO_READ_GLOBALS) {
2399 /* Nothing to do */
2400 } else if (flags & TCG_CALL_NO_WRITE_GLOBALS) {
2401 sync_globals(s, allocated_regs);
2402 } else {
2403 save_globals(s, allocated_regs);
2406 tcg_out_op(s, opc, &func_arg, &const_func_arg);
2408 /* assign output registers and emit moves if needed */
2409 for(i = 0; i < nb_oargs; i++) {
2410 arg = args[i];
2411 ts = &s->temps[arg];
2412 reg = tcg_target_call_oarg_regs[i];
2413 assert(s->reg_to_temp[reg] == -1);
2414 if (ts->fixed_reg) {
2415 if (ts->reg != reg) {
2416 tcg_out_mov(s, ts->type, ts->reg, reg);
2418 } else {
2419 if (ts->val_type == TEMP_VAL_REG) {
2420 s->reg_to_temp[ts->reg] = -1;
2422 ts->val_type = TEMP_VAL_REG;
2423 ts->reg = reg;
2424 ts->mem_coherent = 0;
2425 s->reg_to_temp[reg] = arg;
2426 if (NEED_SYNC_ARG(i)) {
2427 tcg_reg_sync(s, reg);
2429 if (IS_DEAD_ARG(i)) {
2430 temp_dead(s, args[i]);
2435 return nb_iargs + nb_oargs + def->nb_cargs + 1;
2438 #ifdef CONFIG_PROFILER
2440 static int64_t tcg_table_op_count[NB_OPS];
2442 static void dump_op_count(void)
2444 int i;
2445 FILE *f;
2446 f = fopen("/tmp/op.log", "w");
2447 for(i = INDEX_op_end; i < NB_OPS; i++) {
2448 fprintf(f, "%s %" PRId64 "\n", tcg_op_defs[i].name, tcg_table_op_count[i]);
2450 fclose(f);
2452 #endif
2455 static inline int tcg_gen_code_common(TCGContext *s, uint8_t *gen_code_buf,
2456 long search_pc)
2458 TCGOpcode opc;
2459 int op_index;
2460 const TCGOpDef *def;
2461 const TCGArg *args;
2463 #ifdef DEBUG_DISAS
2464 if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP))) {
2465 qemu_log("OP:\n");
2466 tcg_dump_ops(s);
2467 qemu_log("\n");
2469 #endif
2471 #ifdef CONFIG_PROFILER
2472 s->opt_time -= profile_getclock();
2473 #endif
2475 #ifdef USE_TCG_OPTIMIZATIONS
2476 s->gen_opparam_ptr =
2477 tcg_optimize(s, s->gen_opc_ptr, s->gen_opparam_buf, tcg_op_defs);
2478 #endif
2480 #ifdef CONFIG_PROFILER
2481 s->opt_time += profile_getclock();
2482 s->la_time -= profile_getclock();
2483 #endif
2485 tcg_liveness_analysis(s);
2487 #ifdef CONFIG_PROFILER
2488 s->la_time += profile_getclock();
2489 #endif
2491 #ifdef DEBUG_DISAS
2492 if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_OPT))) {
2493 qemu_log("OP after optimization and liveness analysis:\n");
2494 tcg_dump_ops(s);
2495 qemu_log("\n");
2497 #endif
2499 tcg_reg_alloc_start(s);
2501 s->code_buf = gen_code_buf;
2502 s->code_ptr = gen_code_buf;
2504 tcg_out_tb_init(s);
2506 args = s->gen_opparam_buf;
2507 op_index = 0;
2509 for(;;) {
2510 opc = s->gen_opc_buf[op_index];
2511 #ifdef CONFIG_PROFILER
2512 tcg_table_op_count[opc]++;
2513 #endif
2514 def = &tcg_op_defs[opc];
2515 #if 0
2516 printf("%s: %d %d %d\n", def->name,
2517 def->nb_oargs, def->nb_iargs, def->nb_cargs);
2518 // dump_regs(s);
2519 #endif
2520 switch(opc) {
2521 case INDEX_op_mov_i32:
2522 case INDEX_op_mov_i64:
2523 tcg_reg_alloc_mov(s, def, args, s->op_dead_args[op_index],
2524 s->op_sync_args[op_index]);
2525 break;
2526 case INDEX_op_movi_i32:
2527 case INDEX_op_movi_i64:
2528 tcg_reg_alloc_movi(s, args, s->op_dead_args[op_index],
2529 s->op_sync_args[op_index]);
2530 break;
2531 case INDEX_op_debug_insn_start:
2532 /* debug instruction */
2533 break;
2534 case INDEX_op_nop:
2535 case INDEX_op_nop1:
2536 case INDEX_op_nop2:
2537 case INDEX_op_nop3:
2538 break;
2539 case INDEX_op_nopn:
2540 args += args[0];
2541 goto next;
2542 case INDEX_op_discard:
2543 temp_dead(s, args[0]);
2544 break;
2545 case INDEX_op_set_label:
2546 tcg_reg_alloc_bb_end(s, s->reserved_regs);
2547 tcg_out_label(s, args[0], s->code_ptr);
2548 break;
2549 case INDEX_op_call:
2550 args += tcg_reg_alloc_call(s, def, opc, args,
2551 s->op_dead_args[op_index],
2552 s->op_sync_args[op_index]);
2553 goto next;
2554 case INDEX_op_end:
2555 goto the_end;
2556 default:
2557 /* Sanity check that we've not introduced any unhandled opcodes. */
2558 if (def->flags & TCG_OPF_NOT_PRESENT) {
2559 tcg_abort();
2561 /* Note: in order to speed up the code, it would be much
2562 faster to have specialized register allocator functions for
2563 some common argument patterns */
2564 tcg_reg_alloc_op(s, def, opc, args, s->op_dead_args[op_index],
2565 s->op_sync_args[op_index]);
2566 break;
2568 args += def->nb_args;
2569 next:
2570 if (search_pc >= 0 && search_pc < s->code_ptr - gen_code_buf) {
2571 return op_index;
2573 op_index++;
2574 #ifndef NDEBUG
2575 check_regs(s);
2576 #endif
2578 the_end:
2579 /* Generate TB finalization at the end of block */
2580 tcg_out_tb_finalize(s);
2581 return -1;
2584 int tcg_gen_code(TCGContext *s, uint8_t *gen_code_buf)
2586 #ifdef CONFIG_PROFILER
2588 int n;
2589 n = (s->gen_opc_ptr - s->gen_opc_buf);
2590 s->op_count += n;
2591 if (n > s->op_count_max)
2592 s->op_count_max = n;
2594 s->temp_count += s->nb_temps;
2595 if (s->nb_temps > s->temp_count_max)
2596 s->temp_count_max = s->nb_temps;
2598 #endif
2600 tcg_gen_code_common(s, gen_code_buf, -1);
2602 /* flush instruction cache */
2603 flush_icache_range((uintptr_t)gen_code_buf, (uintptr_t)s->code_ptr);
2605 return s->code_ptr - gen_code_buf;
2608 /* Return the index of the micro operation such as the pc after is <
2609 offset bytes from the start of the TB. The contents of gen_code_buf must
2610 not be changed, though writing the same values is ok.
2611 Return -1 if not found. */
2612 int tcg_gen_code_search_pc(TCGContext *s, uint8_t *gen_code_buf, long offset)
2614 return tcg_gen_code_common(s, gen_code_buf, offset);
2617 #ifdef CONFIG_PROFILER
2618 void tcg_dump_info(FILE *f, fprintf_function cpu_fprintf)
2620 TCGContext *s = &tcg_ctx;
2621 int64_t tot;
2623 tot = s->interm_time + s->code_time;
2624 cpu_fprintf(f, "JIT cycles %" PRId64 " (%0.3f s at 2.4 GHz)\n",
2625 tot, tot / 2.4e9);
2626 cpu_fprintf(f, "translated TBs %" PRId64 " (aborted=%" PRId64 " %0.1f%%)\n",
2627 s->tb_count,
2628 s->tb_count1 - s->tb_count,
2629 s->tb_count1 ? (double)(s->tb_count1 - s->tb_count) / s->tb_count1 * 100.0 : 0);
2630 cpu_fprintf(f, "avg ops/TB %0.1f max=%d\n",
2631 s->tb_count ? (double)s->op_count / s->tb_count : 0, s->op_count_max);
2632 cpu_fprintf(f, "deleted ops/TB %0.2f\n",
2633 s->tb_count ?
2634 (double)s->del_op_count / s->tb_count : 0);
2635 cpu_fprintf(f, "avg temps/TB %0.2f max=%d\n",
2636 s->tb_count ?
2637 (double)s->temp_count / s->tb_count : 0,
2638 s->temp_count_max);
2640 cpu_fprintf(f, "cycles/op %0.1f\n",
2641 s->op_count ? (double)tot / s->op_count : 0);
2642 cpu_fprintf(f, "cycles/in byte %0.1f\n",
2643 s->code_in_len ? (double)tot / s->code_in_len : 0);
2644 cpu_fprintf(f, "cycles/out byte %0.1f\n",
2645 s->code_out_len ? (double)tot / s->code_out_len : 0);
2646 if (tot == 0)
2647 tot = 1;
2648 cpu_fprintf(f, " gen_interm time %0.1f%%\n",
2649 (double)s->interm_time / tot * 100.0);
2650 cpu_fprintf(f, " gen_code time %0.1f%%\n",
2651 (double)s->code_time / tot * 100.0);
2652 cpu_fprintf(f, "optim./code time %0.1f%%\n",
2653 (double)s->opt_time / (s->code_time ? s->code_time : 1)
2654 * 100.0);
2655 cpu_fprintf(f, "liveness/code time %0.1f%%\n",
2656 (double)s->la_time / (s->code_time ? s->code_time : 1) * 100.0);
2657 cpu_fprintf(f, "cpu_restore count %" PRId64 "\n",
2658 s->restore_count);
2659 cpu_fprintf(f, " avg cycles %0.1f\n",
2660 s->restore_count ? (double)s->restore_time / s->restore_count : 0);
2662 dump_op_count();
2664 #else
2665 void tcg_dump_info(FILE *f, fprintf_function cpu_fprintf)
2667 cpu_fprintf(f, "[TCG profiler not compiled]\n");
2669 #endif
2671 #ifdef ELF_HOST_MACHINE
2672 /* In order to use this feature, the backend needs to do three things:
2674 (1) Define ELF_HOST_MACHINE to indicate both what value to
2675 put into the ELF image and to indicate support for the feature.
2677 (2) Define tcg_register_jit. This should create a buffer containing
2678 the contents of a .debug_frame section that describes the post-
2679 prologue unwind info for the tcg machine.
2681 (3) Call tcg_register_jit_int, with the constructed .debug_frame.
2684 /* Begin GDB interface. THE FOLLOWING MUST MATCH GDB DOCS. */
2685 typedef enum {
2686 JIT_NOACTION = 0,
2687 JIT_REGISTER_FN,
2688 JIT_UNREGISTER_FN
2689 } jit_actions_t;
2691 struct jit_code_entry {
2692 struct jit_code_entry *next_entry;
2693 struct jit_code_entry *prev_entry;
2694 const void *symfile_addr;
2695 uint64_t symfile_size;
2698 struct jit_descriptor {
2699 uint32_t version;
2700 uint32_t action_flag;
2701 struct jit_code_entry *relevant_entry;
2702 struct jit_code_entry *first_entry;
2705 void __jit_debug_register_code(void) __attribute__((noinline));
2706 void __jit_debug_register_code(void)
2708 asm("");
2711 /* Must statically initialize the version, because GDB may check
2712 the version before we can set it. */
2713 struct jit_descriptor __jit_debug_descriptor = { 1, 0, 0, 0 };
2715 /* End GDB interface. */
2717 static int find_string(const char *strtab, const char *str)
2719 const char *p = strtab + 1;
2721 while (1) {
2722 if (strcmp(p, str) == 0) {
2723 return p - strtab;
2725 p += strlen(p) + 1;
2729 static void tcg_register_jit_int(void *buf_ptr, size_t buf_size,
2730 void *debug_frame, size_t debug_frame_size)
2732 struct __attribute__((packed)) DebugInfo {
2733 uint32_t len;
2734 uint16_t version;
2735 uint32_t abbrev;
2736 uint8_t ptr_size;
2737 uint8_t cu_die;
2738 uint16_t cu_lang;
2739 uintptr_t cu_low_pc;
2740 uintptr_t cu_high_pc;
2741 uint8_t fn_die;
2742 char fn_name[16];
2743 uintptr_t fn_low_pc;
2744 uintptr_t fn_high_pc;
2745 uint8_t cu_eoc;
2748 struct ElfImage {
2749 ElfW(Ehdr) ehdr;
2750 ElfW(Phdr) phdr;
2751 ElfW(Shdr) shdr[7];
2752 ElfW(Sym) sym[2];
2753 struct DebugInfo di;
2754 uint8_t da[24];
2755 char str[80];
2758 struct ElfImage *img;
2760 static const struct ElfImage img_template = {
2761 .ehdr = {
2762 .e_ident[EI_MAG0] = ELFMAG0,
2763 .e_ident[EI_MAG1] = ELFMAG1,
2764 .e_ident[EI_MAG2] = ELFMAG2,
2765 .e_ident[EI_MAG3] = ELFMAG3,
2766 .e_ident[EI_CLASS] = ELF_CLASS,
2767 .e_ident[EI_DATA] = ELF_DATA,
2768 .e_ident[EI_VERSION] = EV_CURRENT,
2769 .e_type = ET_EXEC,
2770 .e_machine = ELF_HOST_MACHINE,
2771 .e_version = EV_CURRENT,
2772 .e_phoff = offsetof(struct ElfImage, phdr),
2773 .e_shoff = offsetof(struct ElfImage, shdr),
2774 .e_ehsize = sizeof(ElfW(Shdr)),
2775 .e_phentsize = sizeof(ElfW(Phdr)),
2776 .e_phnum = 1,
2777 .e_shentsize = sizeof(ElfW(Shdr)),
2778 .e_shnum = ARRAY_SIZE(img->shdr),
2779 .e_shstrndx = ARRAY_SIZE(img->shdr) - 1,
2780 #ifdef ELF_HOST_FLAGS
2781 .e_flags = ELF_HOST_FLAGS,
2782 #endif
2783 #ifdef ELF_OSABI
2784 .e_ident[EI_OSABI] = ELF_OSABI,
2785 #endif
2787 .phdr = {
2788 .p_type = PT_LOAD,
2789 .p_flags = PF_X,
2791 .shdr = {
2792 [0] = { .sh_type = SHT_NULL },
2793 /* Trick: The contents of code_gen_buffer are not present in
2794 this fake ELF file; that got allocated elsewhere. Therefore
2795 we mark .text as SHT_NOBITS (similar to .bss) so that readers
2796 will not look for contents. We can record any address. */
2797 [1] = { /* .text */
2798 .sh_type = SHT_NOBITS,
2799 .sh_flags = SHF_EXECINSTR | SHF_ALLOC,
2801 [2] = { /* .debug_info */
2802 .sh_type = SHT_PROGBITS,
2803 .sh_offset = offsetof(struct ElfImage, di),
2804 .sh_size = sizeof(struct DebugInfo),
2806 [3] = { /* .debug_abbrev */
2807 .sh_type = SHT_PROGBITS,
2808 .sh_offset = offsetof(struct ElfImage, da),
2809 .sh_size = sizeof(img->da),
2811 [4] = { /* .debug_frame */
2812 .sh_type = SHT_PROGBITS,
2813 .sh_offset = sizeof(struct ElfImage),
2815 [5] = { /* .symtab */
2816 .sh_type = SHT_SYMTAB,
2817 .sh_offset = offsetof(struct ElfImage, sym),
2818 .sh_size = sizeof(img->sym),
2819 .sh_info = 1,
2820 .sh_link = ARRAY_SIZE(img->shdr) - 1,
2821 .sh_entsize = sizeof(ElfW(Sym)),
2823 [6] = { /* .strtab */
2824 .sh_type = SHT_STRTAB,
2825 .sh_offset = offsetof(struct ElfImage, str),
2826 .sh_size = sizeof(img->str),
2829 .sym = {
2830 [1] = { /* code_gen_buffer */
2831 .st_info = ELF_ST_INFO(STB_GLOBAL, STT_FUNC),
2832 .st_shndx = 1,
2835 .di = {
2836 .len = sizeof(struct DebugInfo) - 4,
2837 .version = 2,
2838 .ptr_size = sizeof(void *),
2839 .cu_die = 1,
2840 .cu_lang = 0x8001, /* DW_LANG_Mips_Assembler */
2841 .fn_die = 2,
2842 .fn_name = "code_gen_buffer"
2844 .da = {
2845 1, /* abbrev number (the cu) */
2846 0x11, 1, /* DW_TAG_compile_unit, has children */
2847 0x13, 0x5, /* DW_AT_language, DW_FORM_data2 */
2848 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */
2849 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */
2850 0, 0, /* end of abbrev */
2851 2, /* abbrev number (the fn) */
2852 0x2e, 0, /* DW_TAG_subprogram, no children */
2853 0x3, 0x8, /* DW_AT_name, DW_FORM_string */
2854 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */
2855 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */
2856 0, 0, /* end of abbrev */
2857 0 /* no more abbrev */
2859 .str = "\0" ".text\0" ".debug_info\0" ".debug_abbrev\0"
2860 ".debug_frame\0" ".symtab\0" ".strtab\0" "code_gen_buffer",
2863 /* We only need a single jit entry; statically allocate it. */
2864 static struct jit_code_entry one_entry;
2866 uintptr_t buf = (uintptr_t)buf_ptr;
2867 size_t img_size = sizeof(struct ElfImage) + debug_frame_size;
2869 img = g_malloc(img_size);
2870 *img = img_template;
2871 memcpy(img + 1, debug_frame, debug_frame_size);
2873 img->phdr.p_vaddr = buf;
2874 img->phdr.p_paddr = buf;
2875 img->phdr.p_memsz = buf_size;
2877 img->shdr[1].sh_name = find_string(img->str, ".text");
2878 img->shdr[1].sh_addr = buf;
2879 img->shdr[1].sh_size = buf_size;
2881 img->shdr[2].sh_name = find_string(img->str, ".debug_info");
2882 img->shdr[3].sh_name = find_string(img->str, ".debug_abbrev");
2884 img->shdr[4].sh_name = find_string(img->str, ".debug_frame");
2885 img->shdr[4].sh_size = debug_frame_size;
2887 img->shdr[5].sh_name = find_string(img->str, ".symtab");
2888 img->shdr[6].sh_name = find_string(img->str, ".strtab");
2890 img->sym[1].st_name = find_string(img->str, "code_gen_buffer");
2891 img->sym[1].st_value = buf;
2892 img->sym[1].st_size = buf_size;
2894 img->di.cu_low_pc = buf;
2895 img->di.cu_high_pc = buf + buf_size;
2896 img->di.fn_low_pc = buf;
2897 img->di.fn_high_pc = buf + buf_size;
2899 #ifdef DEBUG_JIT
2900 /* Enable this block to be able to debug the ELF image file creation.
2901 One can use readelf, objdump, or other inspection utilities. */
2903 FILE *f = fopen("/tmp/qemu.jit", "w+b");
2904 if (f) {
2905 if (fwrite(img, img_size, 1, f) != img_size) {
2906 /* Avoid stupid unused return value warning for fwrite. */
2908 fclose(f);
2911 #endif
2913 one_entry.symfile_addr = img;
2914 one_entry.symfile_size = img_size;
2916 __jit_debug_descriptor.action_flag = JIT_REGISTER_FN;
2917 __jit_debug_descriptor.relevant_entry = &one_entry;
2918 __jit_debug_descriptor.first_entry = &one_entry;
2919 __jit_debug_register_code();
2921 #else
2922 /* No support for the feature. Provide the entry point expected by exec.c,
2923 and implement the internal function we declared earlier. */
2925 static void tcg_register_jit_int(void *buf, size_t size,
2926 void *debug_frame, size_t debug_frame_size)
2930 void tcg_register_jit(void *buf, size_t buf_size)
2933 #endif /* ELF_HOST_MACHINE */