2 * Tiny Code Generator for QEMU
4 * Copyright (c) 2008 Fabrice Bellard
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
25 /* define it to use liveness analysis (better code) */
26 #define USE_LIVENESS_ANALYSIS
30 #if !defined(CONFIG_DEBUG_TCG) && !defined(NDEBUG)
31 /* define it to suppress various consistency checks (faster) */
47 #include "qemu-common.h"
48 #include "cache-utils.h"
49 #include "host-utils.h"
50 #include "qemu-timer.h"
52 /* Note: the long term plan is to reduce the dependencies on the QEMU
53 CPU definitions. Currently they are used for qemu_ld/st
55 #define NO_CPU_IO_DEFS
61 #if defined(CONFIG_USE_GUEST_BASE) && !defined(TCG_TARGET_HAS_GUEST_BASE)
62 #error GUEST_BASE not supported on this host.
65 static void tcg_target_init(TCGContext
*s
);
66 static void tcg_target_qemu_prologue(TCGContext
*s
);
67 static void patch_reloc(uint8_t *code_ptr
, int type
,
68 tcg_target_long value
, tcg_target_long addend
);
70 static TCGOpDef tcg_op_defs
[] = {
71 #define DEF(s, oargs, iargs, cargs, flags) { #s, oargs, iargs, cargs, iargs + oargs + cargs, flags },
76 static TCGRegSet tcg_target_available_regs
[2];
77 static TCGRegSet tcg_target_call_clobber_regs
;
79 /* XXX: move that inside the context */
80 uint16_t *gen_opc_ptr
;
81 TCGArg
*gen_opparam_ptr
;
83 static inline void tcg_out8(TCGContext
*s
, uint8_t v
)
88 static inline void tcg_out16(TCGContext
*s
, uint16_t v
)
90 *(uint16_t *)s
->code_ptr
= v
;
94 static inline void tcg_out32(TCGContext
*s
, uint32_t v
)
96 *(uint32_t *)s
->code_ptr
= v
;
100 /* label relocation processing */
102 static void tcg_out_reloc(TCGContext
*s
, uint8_t *code_ptr
, int type
,
103 int label_index
, long addend
)
108 l
= &s
->labels
[label_index
];
110 /* FIXME: This may break relocations on RISC targets that
111 modify instruction fields in place. The caller may not have
112 written the initial value. */
113 patch_reloc(code_ptr
, type
, l
->u
.value
, addend
);
115 /* add a new relocation entry */
116 r
= tcg_malloc(sizeof(TCGRelocation
));
120 r
->next
= l
->u
.first_reloc
;
121 l
->u
.first_reloc
= r
;
125 static void tcg_out_label(TCGContext
*s
, int label_index
,
126 tcg_target_long value
)
131 l
= &s
->labels
[label_index
];
134 r
= l
->u
.first_reloc
;
136 patch_reloc(r
->ptr
, r
->type
, value
, r
->addend
);
143 int gen_new_label(void)
145 TCGContext
*s
= &tcg_ctx
;
149 if (s
->nb_labels
>= TCG_MAX_LABELS
)
151 idx
= s
->nb_labels
++;
154 l
->u
.first_reloc
= NULL
;
158 #include "tcg-target.c"
160 /* pool based memory allocation */
161 void *tcg_malloc_internal(TCGContext
*s
, int size
)
166 if (size
> TCG_POOL_CHUNK_SIZE
) {
167 /* big malloc: insert a new pool (XXX: could optimize) */
168 p
= qemu_malloc(sizeof(TCGPool
) + size
);
171 s
->pool_current
->next
= p
;
174 p
->next
= s
->pool_current
;
184 pool_size
= TCG_POOL_CHUNK_SIZE
;
185 p
= qemu_malloc(sizeof(TCGPool
) + pool_size
);
189 s
->pool_current
->next
= p
;
198 s
->pool_cur
= p
->data
+ size
;
199 s
->pool_end
= p
->data
+ p
->size
;
/* Reset the pool allocator bookkeeping of context 's': the current
   allocation cursor (pool_cur), the end-of-chunk marker (pool_end) and
   the current chunk pointer (pool_current) are all set to NULL.
   NOTE(review): nothing is freed in the visible statements; presumably
   existing chunks are kept for reuse by the next allocation - confirm
   against tcg_malloc_internal. */
203 void tcg_pool_reset(TCGContext
*s
)
205 s
->pool_cur
= s
->pool_end
= NULL
;
206 s
->pool_current
= NULL
;
209 void tcg_context_init(TCGContext
*s
)
211 int op
, total_args
, n
;
213 TCGArgConstraint
*args_ct
;
216 memset(s
, 0, sizeof(*s
));
217 s
->temps
= s
->static_temps
;
220 /* Count total number of arguments and allocate the corresponding
223 for(op
= 0; op
< NB_OPS
; op
++) {
224 def
= &tcg_op_defs
[op
];
225 n
= def
->nb_iargs
+ def
->nb_oargs
;
229 args_ct
= qemu_malloc(sizeof(TCGArgConstraint
) * total_args
);
230 sorted_args
= qemu_malloc(sizeof(int) * total_args
);
232 for(op
= 0; op
< NB_OPS
; op
++) {
233 def
= &tcg_op_defs
[op
];
234 def
->args_ct
= args_ct
;
235 def
->sorted_args
= sorted_args
;
236 n
= def
->nb_iargs
+ def
->nb_oargs
;
/* Emit the target prologue/epilogue into the code_gen_prologue buffer.
   The context's code_buf and code_ptr are pointed at that buffer, the
   target hook tcg_target_qemu_prologue() is invoked, and the instruction
   cache is then flushed over the address range [code_buf, code_ptr). */
244 void tcg_prologue_init(TCGContext
*s
)
246 /* init global prologue and epilogue */
247 s
->code_buf
= code_gen_prologue
;
248 s
->code_ptr
= s
->code_buf
;
249 tcg_target_qemu_prologue(s
);
/* NOTE(review): assumes tcg_target_qemu_prologue() advanced s->code_ptr
   past the emitted code, so the range below covers exactly what was
   written - confirm in the target backend. */
250 flush_icache_range((unsigned long)s
->code_buf
,
251 (unsigned long)s
->code_ptr
);
254 void tcg_set_frame(TCGContext
*s
, int reg
,
255 tcg_target_long start
, tcg_target_long size
)
257 s
->frame_start
= start
;
258 s
->frame_end
= start
+ size
;
262 void tcg_func_start(TCGContext
*s
)
266 s
->nb_temps
= s
->nb_globals
;
267 for(i
= 0; i
< (TCG_TYPE_COUNT
* 2); i
++)
268 s
->first_free_temp
[i
] = -1;
269 s
->labels
= tcg_malloc(sizeof(TCGLabel
) * TCG_MAX_LABELS
);
271 s
->current_frame_offset
= s
->frame_start
;
273 gen_opc_ptr
= gen_opc_buf
;
274 gen_opparam_ptr
= gen_opparam_buf
;
277 static inline void tcg_temp_alloc(TCGContext
*s
, int n
)
279 if (n
> TCG_MAX_TEMPS
)
283 static inline int tcg_global_reg_new_internal(TCGType type
, int reg
,
286 TCGContext
*s
= &tcg_ctx
;
290 #if TCG_TARGET_REG_BITS == 32
291 if (type
!= TCG_TYPE_I32
)
294 if (tcg_regset_test_reg(s
->reserved_regs
, reg
))
297 tcg_temp_alloc(s
, s
->nb_globals
+ 1);
298 ts
= &s
->temps
[s
->nb_globals
];
299 ts
->base_type
= type
;
305 tcg_regset_set_reg(s
->reserved_regs
, reg
);
/* Create a 32-bit global for host register 'reg' with debug name 'name'.
   Delegates to tcg_global_reg_new_internal() with TCG_TYPE_I32 and wraps
   the returned index as a TCGv_i32 via MAKE_TCGV_I32. */
309 TCGv_i32
tcg_global_reg_new_i32(int reg
, const char *name
)
313 idx
= tcg_global_reg_new_internal(TCG_TYPE_I32
, reg
, name
);
314 return MAKE_TCGV_I32(idx
);
/* 64-bit counterpart of tcg_global_reg_new_i32: delegates to
   tcg_global_reg_new_internal() with TCG_TYPE_I64 and wraps the returned
   index as a TCGv_i64 via MAKE_TCGV_I64. */
317 TCGv_i64
tcg_global_reg_new_i64(int reg
, const char *name
)
321 idx
= tcg_global_reg_new_internal(TCG_TYPE_I64
, reg
, name
);
322 return MAKE_TCGV_I64(idx
);
325 static inline int tcg_global_mem_new_internal(TCGType type
, int reg
,
326 tcg_target_long offset
,
329 TCGContext
*s
= &tcg_ctx
;
334 #if TCG_TARGET_REG_BITS == 32
335 if (type
== TCG_TYPE_I64
) {
337 tcg_temp_alloc(s
, s
->nb_globals
+ 2);
338 ts
= &s
->temps
[s
->nb_globals
];
339 ts
->base_type
= type
;
340 ts
->type
= TCG_TYPE_I32
;
342 ts
->mem_allocated
= 1;
344 #ifdef TCG_TARGET_WORDS_BIGENDIAN
345 ts
->mem_offset
= offset
+ 4;
347 ts
->mem_offset
= offset
;
349 pstrcpy(buf
, sizeof(buf
), name
);
350 pstrcat(buf
, sizeof(buf
), "_0");
351 ts
->name
= strdup(buf
);
354 ts
->base_type
= type
;
355 ts
->type
= TCG_TYPE_I32
;
357 ts
->mem_allocated
= 1;
359 #ifdef TCG_TARGET_WORDS_BIGENDIAN
360 ts
->mem_offset
= offset
;
362 ts
->mem_offset
= offset
+ 4;
364 pstrcpy(buf
, sizeof(buf
), name
);
365 pstrcat(buf
, sizeof(buf
), "_1");
366 ts
->name
= strdup(buf
);
372 tcg_temp_alloc(s
, s
->nb_globals
+ 1);
373 ts
= &s
->temps
[s
->nb_globals
];
374 ts
->base_type
= type
;
377 ts
->mem_allocated
= 1;
379 ts
->mem_offset
= offset
;
386 TCGv_i32
tcg_global_mem_new_i32(int reg
, tcg_target_long offset
,
391 idx
= tcg_global_mem_new_internal(TCG_TYPE_I32
, reg
, offset
, name
);
392 return MAKE_TCGV_I32(idx
);
395 TCGv_i64
tcg_global_mem_new_i64(int reg
, tcg_target_long offset
,
400 idx
= tcg_global_mem_new_internal(TCG_TYPE_I64
, reg
, offset
, name
);
401 return MAKE_TCGV_I64(idx
);
404 static inline int tcg_temp_new_internal(TCGType type
, int temp_local
)
406 TCGContext
*s
= &tcg_ctx
;
413 idx
= s
->first_free_temp
[k
];
415 /* There is already an available temp with the
418 s
->first_free_temp
[k
] = ts
->next_free_temp
;
419 ts
->temp_allocated
= 1;
420 assert(ts
->temp_local
== temp_local
);
423 #if TCG_TARGET_REG_BITS == 32
424 if (type
== TCG_TYPE_I64
) {
425 tcg_temp_alloc(s
, s
->nb_temps
+ 2);
426 ts
= &s
->temps
[s
->nb_temps
];
427 ts
->base_type
= type
;
428 ts
->type
= TCG_TYPE_I32
;
429 ts
->temp_allocated
= 1;
430 ts
->temp_local
= temp_local
;
433 ts
->base_type
= TCG_TYPE_I32
;
434 ts
->type
= TCG_TYPE_I32
;
435 ts
->temp_allocated
= 1;
436 ts
->temp_local
= temp_local
;
442 tcg_temp_alloc(s
, s
->nb_temps
+ 1);
443 ts
= &s
->temps
[s
->nb_temps
];
444 ts
->base_type
= type
;
446 ts
->temp_allocated
= 1;
447 ts
->temp_local
= temp_local
;
453 #if defined(CONFIG_DEBUG_TCG)
/* Allocate a 32-bit temporary. 'temp_local' is forwarded unchanged to
   tcg_temp_new_internal() together with TCG_TYPE_I32; the resulting
   temp index is returned wrapped as a TCGv_i32. */
459 TCGv_i32
tcg_temp_new_internal_i32(int temp_local
)
463 idx
= tcg_temp_new_internal(TCG_TYPE_I32
, temp_local
);
464 return MAKE_TCGV_I32(idx
);
/* Allocate a 64-bit temporary. 'temp_local' is forwarded unchanged to
   tcg_temp_new_internal() together with TCG_TYPE_I64; the resulting
   temp index is returned wrapped as a TCGv_i64. */
467 TCGv_i64
tcg_temp_new_internal_i64(int temp_local
)
471 idx
= tcg_temp_new_internal(TCG_TYPE_I64
, temp_local
);
472 return MAKE_TCGV_I64(idx
);
475 static inline void tcg_temp_free_internal(int idx
)
477 TCGContext
*s
= &tcg_ctx
;
481 #if defined(CONFIG_DEBUG_TCG)
483 if (s
->temps_in_use
< 0) {
484 fprintf(stderr
, "More temporaries freed than allocated!\n");
488 assert(idx
>= s
->nb_globals
&& idx
< s
->nb_temps
);
490 assert(ts
->temp_allocated
!= 0);
491 ts
->temp_allocated
= 0;
495 ts
->next_free_temp
= s
->first_free_temp
[k
];
496 s
->first_free_temp
[k
] = idx
;
/* Release the 32-bit temporary 'arg': its index is extracted with
   GET_TCGV_I32 and handed to tcg_temp_free_internal(). */
499 void tcg_temp_free_i32(TCGv_i32 arg
)
501 tcg_temp_free_internal(GET_TCGV_I32(arg
));
/* Release the 64-bit temporary 'arg': its index is extracted with
   GET_TCGV_I64 and handed to tcg_temp_free_internal(). */
504 void tcg_temp_free_i64(TCGv_i64 arg
)
506 tcg_temp_free_internal(GET_TCGV_I64(arg
));
509 TCGv_i32
tcg_const_i32(int32_t val
)
512 t0
= tcg_temp_new_i32();
513 tcg_gen_movi_i32(t0
, val
);
517 TCGv_i64
tcg_const_i64(int64_t val
)
520 t0
= tcg_temp_new_i64();
521 tcg_gen_movi_i64(t0
, val
);
525 TCGv_i32
tcg_const_local_i32(int32_t val
)
528 t0
= tcg_temp_local_new_i32();
529 tcg_gen_movi_i32(t0
, val
);
533 TCGv_i64
tcg_const_local_i64(int64_t val
)
536 t0
= tcg_temp_local_new_i64();
537 tcg_gen_movi_i64(t0
, val
);
541 #if defined(CONFIG_DEBUG_TCG)
542 void tcg_clear_temp_count(void)
544 TCGContext
*s
= &tcg_ctx
;
548 int tcg_check_temp_count(void)
550 TCGContext
*s
= &tcg_ctx
;
551 if (s
->temps_in_use
) {
552 /* Clear the count so that we don't give another
553 * warning immediately next time around.
562 void tcg_register_helper(void *func
, const char *name
)
564 TCGContext
*s
= &tcg_ctx
;
566 if ((s
->nb_helpers
+ 1) > s
->allocated_helpers
) {
567 n
= s
->allocated_helpers
;
573 s
->helpers
= realloc(s
->helpers
, n
* sizeof(TCGHelperInfo
));
574 s
->allocated_helpers
= n
;
576 s
->helpers
[s
->nb_helpers
].func
= (tcg_target_ulong
)func
;
577 s
->helpers
[s
->nb_helpers
].name
= name
;
581 /* Note: we convert the 64 bit args to 32 bit and do some alignment
582 and endian swap. Maybe it would be better to do the alignment
583 and endian swap in tcg_reg_alloc_call(). */
584 void tcg_gen_callN(TCGContext
*s
, TCGv_ptr func
, unsigned int flags
,
585 int sizemask
, TCGArg ret
, int nargs
, TCGArg
*args
)
587 #if defined(TCG_TARGET_I386) && TCG_TARGET_REG_BITS < 64
595 #if defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64
596 for (i
= 0; i
< nargs
; ++i
) {
597 int is_64bit
= sizemask
& (1 << (i
+1)*2);
598 int is_signed
= sizemask
& (2 << (i
+1)*2);
600 TCGv_i64 temp
= tcg_temp_new_i64();
601 TCGv_i64 orig
= MAKE_TCGV_I64(args
[i
]);
603 tcg_gen_ext32s_i64(temp
, orig
);
605 tcg_gen_ext32u_i64(temp
, orig
);
607 args
[i
] = GET_TCGV_I64(temp
);
610 #endif /* TCG_TARGET_EXTEND_ARGS */
612 *gen_opc_ptr
++ = INDEX_op_call
;
613 nparam
= gen_opparam_ptr
++;
614 #if defined(TCG_TARGET_I386) && TCG_TARGET_REG_BITS < 64
615 call_type
= (flags
& TCG_CALL_TYPE_MASK
);
617 if (ret
!= TCG_CALL_DUMMY_ARG
) {
618 #if TCG_TARGET_REG_BITS < 64
620 #ifdef TCG_TARGET_WORDS_BIGENDIAN
621 *gen_opparam_ptr
++ = ret
+ 1;
622 *gen_opparam_ptr
++ = ret
;
624 *gen_opparam_ptr
++ = ret
;
625 *gen_opparam_ptr
++ = ret
+ 1;
631 *gen_opparam_ptr
++ = ret
;
638 for (i
= 0; i
< nargs
; i
++) {
639 #if TCG_TARGET_REG_BITS < 64
640 int is_64bit
= sizemask
& (1 << (i
+1)*2);
642 #ifdef TCG_TARGET_I386
643 /* REGPARM case: if the third parameter is 64 bit, it is
644 allocated on the stack */
645 if (i
== 2 && call_type
== TCG_CALL_TYPE_REGPARM
) {
646 call_type
= TCG_CALL_TYPE_REGPARM_2
;
647 flags
= (flags
& ~TCG_CALL_TYPE_MASK
) | call_type
;
650 #ifdef TCG_TARGET_CALL_ALIGN_ARGS
651 /* some targets want aligned 64 bit args */
653 *gen_opparam_ptr
++ = TCG_CALL_DUMMY_ARG
;
657 /* If stack grows up, then we will be placing successive
658 arguments at lower addresses, which means we need to
659 reverse the order compared to how we would normally
660 treat either big or little-endian. For those arguments
661 that will wind up in registers, this still works for
662 HPPA (the only current STACK_GROWSUP target) since the
663 argument registers are *also* allocated in decreasing
664 order. If another such target is added, this logic may
665 have to get more complicated to differentiate between
666 stack arguments and register arguments. */
667 #if defined(TCG_TARGET_WORDS_BIGENDIAN) != defined(TCG_TARGET_STACK_GROWSUP)
668 *gen_opparam_ptr
++ = args
[i
] + 1;
669 *gen_opparam_ptr
++ = args
[i
];
671 *gen_opparam_ptr
++ = args
[i
];
672 *gen_opparam_ptr
++ = args
[i
] + 1;
677 #endif /* TCG_TARGET_REG_BITS < 64 */
679 *gen_opparam_ptr
++ = args
[i
];
682 *gen_opparam_ptr
++ = GET_TCGV_PTR(func
);
684 *gen_opparam_ptr
++ = flags
;
686 *nparam
= (nb_rets
<< 16) | (real_args
+ 1);
688 /* total parameters, needed to go backward in the instruction stream */
689 *gen_opparam_ptr
++ = 1 + nb_rets
+ real_args
+ 3;
691 #if defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64
692 for (i
= 0; i
< nargs
; ++i
) {
693 int is_64bit
= sizemask
& (1 << (i
+1)*2);
695 TCGv_i64 temp
= MAKE_TCGV_I64(args
[i
]);
696 tcg_temp_free_i64(temp
);
699 #endif /* TCG_TARGET_EXTEND_ARGS */
702 #if TCG_TARGET_REG_BITS == 32
703 void tcg_gen_shifti_i64(TCGv_i64 ret
, TCGv_i64 arg1
,
704 int c
, int right
, int arith
)
707 tcg_gen_mov_i32(TCGV_LOW(ret
), TCGV_LOW(arg1
));
708 tcg_gen_mov_i32(TCGV_HIGH(ret
), TCGV_HIGH(arg1
));
709 } else if (c
>= 32) {
713 tcg_gen_sari_i32(TCGV_LOW(ret
), TCGV_HIGH(arg1
), c
);
714 tcg_gen_sari_i32(TCGV_HIGH(ret
), TCGV_HIGH(arg1
), 31);
716 tcg_gen_shri_i32(TCGV_LOW(ret
), TCGV_HIGH(arg1
), c
);
717 tcg_gen_movi_i32(TCGV_HIGH(ret
), 0);
720 tcg_gen_shli_i32(TCGV_HIGH(ret
), TCGV_LOW(arg1
), c
);
721 tcg_gen_movi_i32(TCGV_LOW(ret
), 0);
726 t0
= tcg_temp_new_i32();
727 t1
= tcg_temp_new_i32();
729 tcg_gen_shli_i32(t0
, TCGV_HIGH(arg1
), 32 - c
);
731 tcg_gen_sari_i32(t1
, TCGV_HIGH(arg1
), c
);
733 tcg_gen_shri_i32(t1
, TCGV_HIGH(arg1
), c
);
734 tcg_gen_shri_i32(TCGV_LOW(ret
), TCGV_LOW(arg1
), c
);
735 tcg_gen_or_i32(TCGV_LOW(ret
), TCGV_LOW(ret
), t0
);
736 tcg_gen_mov_i32(TCGV_HIGH(ret
), t1
);
738 tcg_gen_shri_i32(t0
, TCGV_LOW(arg1
), 32 - c
);
739 /* Note: ret can be the same as arg1, so we use t1 */
740 tcg_gen_shli_i32(t1
, TCGV_LOW(arg1
), c
);
741 tcg_gen_shli_i32(TCGV_HIGH(ret
), TCGV_HIGH(arg1
), c
);
742 tcg_gen_or_i32(TCGV_HIGH(ret
), TCGV_HIGH(ret
), t0
);
743 tcg_gen_mov_i32(TCGV_LOW(ret
), t1
);
745 tcg_temp_free_i32(t0
);
746 tcg_temp_free_i32(t1
);
752 static void tcg_reg_alloc_start(TCGContext
*s
)
756 for(i
= 0; i
< s
->nb_globals
; i
++) {
759 ts
->val_type
= TEMP_VAL_REG
;
761 ts
->val_type
= TEMP_VAL_MEM
;
764 for(i
= s
->nb_globals
; i
< s
->nb_temps
; i
++) {
766 ts
->val_type
= TEMP_VAL_DEAD
;
767 ts
->mem_allocated
= 0;
770 for(i
= 0; i
< TCG_TARGET_NB_REGS
; i
++) {
771 s
->reg_to_temp
[i
] = -1;
775 static char *tcg_get_arg_str_idx(TCGContext
*s
, char *buf
, int buf_size
,
781 if (idx
< s
->nb_globals
) {
782 pstrcpy(buf
, buf_size
, ts
->name
);
785 snprintf(buf
, buf_size
, "loc%d", idx
- s
->nb_globals
);
787 snprintf(buf
, buf_size
, "tmp%d", idx
- s
->nb_globals
);
/* Write a printable name for the 32-bit TCG value 'arg' into 'buf'
   (capacity 'buf_size'). Thin wrapper: converts 'arg' to its index with
   GET_TCGV_I32 and returns the result of tcg_get_arg_str_idx(). */
792 char *tcg_get_arg_str_i32(TCGContext
*s
, char *buf
, int buf_size
, TCGv_i32 arg
)
794 return tcg_get_arg_str_idx(s
, buf
, buf_size
, GET_TCGV_I32(arg
));
/* Write a printable name for the 64-bit TCG value 'arg' into 'buf'
   (capacity 'buf_size'). Thin wrapper: converts 'arg' to its index with
   GET_TCGV_I64 and returns the result of tcg_get_arg_str_idx(). */
797 char *tcg_get_arg_str_i64(TCGContext
*s
, char *buf
, int buf_size
, TCGv_i64 arg
)
799 return tcg_get_arg_str_idx(s
, buf
, buf_size
, GET_TCGV_I64(arg
));
802 static int helper_cmp(const void *p1
, const void *p2
)
804 const TCGHelperInfo
*th1
= p1
;
805 const TCGHelperInfo
*th2
= p2
;
806 if (th1
->func
< th2
->func
)
808 else if (th1
->func
== th2
->func
)
814 /* find helper definition (Note: A hash table would be better) */
815 static TCGHelperInfo
*tcg_find_helper(TCGContext
*s
, tcg_target_ulong val
)
821 if (unlikely(!s
->helpers_sorted
)) {
822 qsort(s
->helpers
, s
->nb_helpers
, sizeof(TCGHelperInfo
),
824 s
->helpers_sorted
= 1;
829 m_max
= s
->nb_helpers
- 1;
830 while (m_min
<= m_max
) {
831 m
= (m_min
+ m_max
) >> 1;
845 static const char * const cond_name
[] =
847 [TCG_COND_EQ
] = "eq",
848 [TCG_COND_NE
] = "ne",
849 [TCG_COND_LT
] = "lt",
850 [TCG_COND_GE
] = "ge",
851 [TCG_COND_LE
] = "le",
852 [TCG_COND_GT
] = "gt",
853 [TCG_COND_LTU
] = "ltu",
854 [TCG_COND_GEU
] = "geu",
855 [TCG_COND_LEU
] = "leu",
856 [TCG_COND_GTU
] = "gtu"
859 void tcg_dump_ops(TCGContext
*s
, FILE *outfile
)
861 const uint16_t *opc_ptr
;
865 int i
, k
, nb_oargs
, nb_iargs
, nb_cargs
, first_insn
;
870 opc_ptr
= gen_opc_buf
;
871 args
= gen_opparam_buf
;
872 while (opc_ptr
< gen_opc_ptr
) {
874 def
= &tcg_op_defs
[c
];
875 if (c
== INDEX_op_debug_insn_start
) {
877 #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS
878 pc
= ((uint64_t)args
[1] << 32) | args
[0];
883 fprintf(outfile
, "\n");
884 fprintf(outfile
, " ---- 0x%" PRIx64
, pc
);
886 nb_oargs
= def
->nb_oargs
;
887 nb_iargs
= def
->nb_iargs
;
888 nb_cargs
= def
->nb_cargs
;
889 } else if (c
== INDEX_op_call
) {
892 /* variable number of arguments */
894 nb_oargs
= arg
>> 16;
895 nb_iargs
= arg
& 0xffff;
896 nb_cargs
= def
->nb_cargs
;
898 fprintf(outfile
, " %s ", def
->name
);
901 fprintf(outfile
, "%s",
902 tcg_get_arg_str_idx(s
, buf
, sizeof(buf
), args
[nb_oargs
+ nb_iargs
- 1]));
904 fprintf(outfile
, ",$0x%" TCG_PRIlx
,
905 args
[nb_oargs
+ nb_iargs
]);
907 fprintf(outfile
, ",$%d", nb_oargs
);
908 for(i
= 0; i
< nb_oargs
; i
++) {
909 fprintf(outfile
, ",");
910 fprintf(outfile
, "%s",
911 tcg_get_arg_str_idx(s
, buf
, sizeof(buf
), args
[i
]));
913 for(i
= 0; i
< (nb_iargs
- 1); i
++) {
914 fprintf(outfile
, ",");
915 if (args
[nb_oargs
+ i
] == TCG_CALL_DUMMY_ARG
) {
916 fprintf(outfile
, "<dummy>");
918 fprintf(outfile
, "%s",
919 tcg_get_arg_str_idx(s
, buf
, sizeof(buf
), args
[nb_oargs
+ i
]));
922 } else if (c
== INDEX_op_movi_i32
923 #if TCG_TARGET_REG_BITS == 64
924 || c
== INDEX_op_movi_i64
927 tcg_target_ulong val
;
930 nb_oargs
= def
->nb_oargs
;
931 nb_iargs
= def
->nb_iargs
;
932 nb_cargs
= def
->nb_cargs
;
933 fprintf(outfile
, " %s %s,$", def
->name
,
934 tcg_get_arg_str_idx(s
, buf
, sizeof(buf
), args
[0]));
936 th
= tcg_find_helper(s
, val
);
938 fprintf(outfile
, "%s", th
->name
);
940 if (c
== INDEX_op_movi_i32
)
941 fprintf(outfile
, "0x%x", (uint32_t)val
);
943 fprintf(outfile
, "0x%" PRIx64
, (uint64_t)val
);
946 fprintf(outfile
, " %s ", def
->name
);
947 if (c
== INDEX_op_nopn
) {
948 /* variable number of arguments */
953 nb_oargs
= def
->nb_oargs
;
954 nb_iargs
= def
->nb_iargs
;
955 nb_cargs
= def
->nb_cargs
;
959 for(i
= 0; i
< nb_oargs
; i
++) {
961 fprintf(outfile
, ",");
962 fprintf(outfile
, "%s",
963 tcg_get_arg_str_idx(s
, buf
, sizeof(buf
), args
[k
++]));
965 for(i
= 0; i
< nb_iargs
; i
++) {
967 fprintf(outfile
, ",");
968 fprintf(outfile
, "%s",
969 tcg_get_arg_str_idx(s
, buf
, sizeof(buf
), args
[k
++]));
972 case INDEX_op_brcond_i32
:
973 #if TCG_TARGET_REG_BITS == 32
974 case INDEX_op_brcond2_i32
:
975 #elif TCG_TARGET_REG_BITS == 64
976 case INDEX_op_brcond_i64
:
978 case INDEX_op_setcond_i32
:
979 #if TCG_TARGET_REG_BITS == 32
980 case INDEX_op_setcond2_i32
:
981 #elif TCG_TARGET_REG_BITS == 64
982 case INDEX_op_setcond_i64
:
984 if (args
[k
] < ARRAY_SIZE(cond_name
) && cond_name
[args
[k
]])
985 fprintf(outfile
, ",%s", cond_name
[args
[k
++]]);
987 fprintf(outfile
, ",$0x%" TCG_PRIlx
, args
[k
++]);
994 for(; i
< nb_cargs
; i
++) {
996 fprintf(outfile
, ",");
998 fprintf(outfile
, "$0x%" TCG_PRIlx
, arg
);
1001 fprintf(outfile
, "\n");
1002 args
+= nb_iargs
+ nb_oargs
+ nb_cargs
;
1006 /* we give more priority to constraints with fewer registers */
1007 static int get_constraint_priority(const TCGOpDef
*def
, int k
)
1009 const TCGArgConstraint
*arg_ct
;
1012 arg_ct
= &def
->args_ct
[k
];
1013 if (arg_ct
->ct
& TCG_CT_ALIAS
) {
1014 /* an alias is equivalent to a single register */
1017 if (!(arg_ct
->ct
& TCG_CT_REG
))
1020 for(i
= 0; i
< TCG_TARGET_NB_REGS
; i
++) {
1021 if (tcg_regset_test_reg(arg_ct
->u
.regs
, i
))
1025 return TCG_TARGET_NB_REGS
- n
+ 1;
1028 /* sort from highest priority to lowest */
1029 static void sort_constraints(TCGOpDef
*def
, int start
, int n
)
1031 int i
, j
, p1
, p2
, tmp
;
1033 for(i
= 0; i
< n
; i
++)
1034 def
->sorted_args
[start
+ i
] = start
+ i
;
1037 for(i
= 0; i
< n
- 1; i
++) {
1038 for(j
= i
+ 1; j
< n
; j
++) {
1039 p1
= get_constraint_priority(def
, def
->sorted_args
[start
+ i
]);
1040 p2
= get_constraint_priority(def
, def
->sorted_args
[start
+ j
]);
1042 tmp
= def
->sorted_args
[start
+ i
];
1043 def
->sorted_args
[start
+ i
] = def
->sorted_args
[start
+ j
];
1044 def
->sorted_args
[start
+ j
] = tmp
;
1050 void tcg_add_target_add_op_defs(const TCGTargetOpDef
*tdefs
)
1058 if (tdefs
->op
== (TCGOpcode
)-1)
1061 assert((unsigned)op
< NB_OPS
);
1062 def
= &tcg_op_defs
[op
];
1063 #if defined(CONFIG_DEBUG_TCG)
1064 /* Duplicate entry in op definitions? */
1068 nb_args
= def
->nb_iargs
+ def
->nb_oargs
;
1069 for(i
= 0; i
< nb_args
; i
++) {
1070 ct_str
= tdefs
->args_ct_str
[i
];
1071 /* Incomplete TCGTargetOpDef entry? */
1072 assert(ct_str
!= NULL
);
1073 tcg_regset_clear(def
->args_ct
[i
].u
.regs
);
1074 def
->args_ct
[i
].ct
= 0;
1075 if (ct_str
[0] >= '0' && ct_str
[0] <= '9') {
1077 oarg
= ct_str
[0] - '0';
1078 assert(oarg
< def
->nb_oargs
);
1079 assert(def
->args_ct
[oarg
].ct
& TCG_CT_REG
);
1080 /* TCG_CT_ALIAS is for the output arguments. The input
1081 argument is tagged with TCG_CT_IALIAS. */
1082 def
->args_ct
[i
] = def
->args_ct
[oarg
];
1083 def
->args_ct
[oarg
].ct
= TCG_CT_ALIAS
;
1084 def
->args_ct
[oarg
].alias_index
= i
;
1085 def
->args_ct
[i
].ct
|= TCG_CT_IALIAS
;
1086 def
->args_ct
[i
].alias_index
= oarg
;
1089 if (*ct_str
== '\0')
1093 def
->args_ct
[i
].ct
|= TCG_CT_CONST
;
1097 if (target_parse_constraint(&def
->args_ct
[i
], &ct_str
) < 0) {
1098 fprintf(stderr
, "Invalid constraint '%s' for arg %d of operation '%s'\n",
1099 ct_str
, i
, def
->name
);
1107 /* TCGTargetOpDef entry with too much information? */
1108 assert(i
== TCG_MAX_OP_ARGS
|| tdefs
->args_ct_str
[i
] == NULL
);
1110 /* sort the constraints (XXX: this is just a heuristic) */
1111 sort_constraints(def
, 0, def
->nb_oargs
);
1112 sort_constraints(def
, def
->nb_oargs
, def
->nb_iargs
);
1118 printf("%s: sorted=", def
->name
);
1119 for(i
= 0; i
< def
->nb_oargs
+ def
->nb_iargs
; i
++)
1120 printf(" %d", def
->sorted_args
[i
]);
1127 #if defined(CONFIG_DEBUG_TCG)
1129 for (op
= 0; op
< ARRAY_SIZE(tcg_op_defs
); op
++) {
1130 if (op
< INDEX_op_call
|| op
== INDEX_op_debug_insn_start
) {
1131 /* Wrong entry in op definitions? */
1132 if (tcg_op_defs
[op
].used
) {
1133 fprintf(stderr
, "Invalid op definition for %s\n",
1134 tcg_op_defs
[op
].name
);
1138 /* Missing entry in op definitions? */
1139 if (!tcg_op_defs
[op
].used
) {
1140 fprintf(stderr
, "Missing op definition for %s\n",
1141 tcg_op_defs
[op
].name
);
1152 #ifdef USE_LIVENESS_ANALYSIS
1154 /* set a nop for an operation using 'nb_args' */
1155 static inline void tcg_set_nop(TCGContext
*s
, uint16_t *opc_ptr
,
1156 TCGArg
*args
, int nb_args
)
1159 *opc_ptr
= INDEX_op_nop
;
1161 *opc_ptr
= INDEX_op_nopn
;
1163 args
[nb_args
- 1] = nb_args
;
1167 /* liveness analysis: end of function: globals are live, temps are
1169 /* XXX: at this stage, not used as there would be little gains because
1170 most TBs end with a conditional jump. */
1171 static inline void tcg_la_func_end(TCGContext
*s
, uint8_t *dead_temps
)
/* entries [0, nb_globals): flag 0, i.e. every global is marked live */
1173 memset(dead_temps
, 0, s
->nb_globals
);
/* entries [nb_globals, nb_temps): flag 1, i.e. every remaining temp is
   marked dead */
1174 memset(dead_temps
+ s
->nb_globals
, 1, s
->nb_temps
- s
->nb_globals
);
1177 /* liveness analysis: end of basic block: globals are live, temps are
1178 dead, local temps are live. */
1179 static inline void tcg_la_bb_end(TCGContext
*s
, uint8_t *dead_temps
)
1184 memset(dead_temps
, 0, s
->nb_globals
);
1185 ts
= &s
->temps
[s
->nb_globals
];
1186 for(i
= s
->nb_globals
; i
< s
->nb_temps
; i
++) {
1195 /* Liveness analysis : update the opc_dead_args array to tell if a
1196 given input argument is dead. Instructions updating dead
1197 temporaries are removed. */
1198 static void tcg_liveness_analysis(TCGContext
*s
)
1200 int i
, op_index
, nb_args
, nb_iargs
, nb_oargs
, arg
, nb_ops
;
1203 const TCGOpDef
*def
;
1204 uint8_t *dead_temps
;
1205 unsigned int dead_args
;
1207 gen_opc_ptr
++; /* skip end */
1209 nb_ops
= gen_opc_ptr
- gen_opc_buf
;
1211 s
->op_dead_args
= tcg_malloc(nb_ops
* sizeof(uint16_t));
1213 dead_temps
= tcg_malloc(s
->nb_temps
);
1214 memset(dead_temps
, 1, s
->nb_temps
);
1216 args
= gen_opparam_ptr
;
1217 op_index
= nb_ops
- 1;
1218 while (op_index
>= 0) {
1219 op
= gen_opc_buf
[op_index
];
1220 def
= &tcg_op_defs
[op
];
1228 nb_iargs
= args
[0] & 0xffff;
1229 nb_oargs
= args
[0] >> 16;
1231 call_flags
= args
[nb_oargs
+ nb_iargs
];
1233 /* pure functions can be removed if their result is not
1235 if (call_flags
& TCG_CALL_PURE
) {
1236 for(i
= 0; i
< nb_oargs
; i
++) {
1238 if (!dead_temps
[arg
])
1239 goto do_not_remove_call
;
1241 tcg_set_nop(s
, gen_opc_buf
+ op_index
,
1246 /* output args are dead */
1248 for(i
= 0; i
< nb_oargs
; i
++) {
1250 if (dead_temps
[arg
]) {
1251 dead_args
|= (1 << i
);
1253 dead_temps
[arg
] = 1;
1256 if (!(call_flags
& TCG_CALL_CONST
)) {
1257 /* globals are live (they may be used by the call) */
1258 memset(dead_temps
, 0, s
->nb_globals
);
1261 /* input args are live */
1262 for(i
= nb_oargs
; i
< nb_iargs
+ nb_oargs
; i
++) {
1264 if (arg
!= TCG_CALL_DUMMY_ARG
) {
1265 if (dead_temps
[arg
]) {
1266 dead_args
|= (1 << i
);
1268 dead_temps
[arg
] = 0;
1271 s
->op_dead_args
[op_index
] = dead_args
;
1276 case INDEX_op_set_label
:
1278 /* mark end of basic block */
1279 tcg_la_bb_end(s
, dead_temps
);
1281 case INDEX_op_debug_insn_start
:
1282 args
-= def
->nb_args
;
1288 case INDEX_op_discard
:
1290 /* mark the temporary as dead */
1291 dead_temps
[args
[0]] = 1;
1295 /* XXX: optimize by hardcoding common cases (e.g. triadic ops) */
1297 args
-= def
->nb_args
;
1298 nb_iargs
= def
->nb_iargs
;
1299 nb_oargs
= def
->nb_oargs
;
1301 /* Test if the operation can be removed because all
1302 its outputs are dead. We assume that nb_oargs == 0
1303 implies side effects */
1304 if (!(def
->flags
& TCG_OPF_SIDE_EFFECTS
) && nb_oargs
!= 0) {
1305 for(i
= 0; i
< nb_oargs
; i
++) {
1307 if (!dead_temps
[arg
])
1310 tcg_set_nop(s
, gen_opc_buf
+ op_index
, args
, def
->nb_args
);
1311 #ifdef CONFIG_PROFILER
1317 /* output args are dead */
1319 for(i
= 0; i
< nb_oargs
; i
++) {
1321 if (dead_temps
[arg
]) {
1322 dead_args
|= (1 << i
);
1324 dead_temps
[arg
] = 1;
1327 /* if end of basic block, update */
1328 if (def
->flags
& TCG_OPF_BB_END
) {
1329 tcg_la_bb_end(s
, dead_temps
);
1330 } else if (def
->flags
& TCG_OPF_CALL_CLOBBER
) {
1331 /* globals are live */
1332 memset(dead_temps
, 0, s
->nb_globals
);
1335 /* input args are live */
1336 for(i
= nb_oargs
; i
< nb_oargs
+ nb_iargs
; i
++) {
1338 if (dead_temps
[arg
]) {
1339 dead_args
|= (1 << i
);
1341 dead_temps
[arg
] = 0;
1343 s
->op_dead_args
[op_index
] = dead_args
;
1350 if (args
!= gen_opparam_buf
)
1354 /* dummy liveness analysis */
1355 static void tcg_liveness_analysis(TCGContext
*s
)
1358 nb_ops
= gen_opc_ptr
- gen_opc_buf
;
1360 s
->op_dead_args
= tcg_malloc(nb_ops
* sizeof(uint16_t));
1361 memset(s
->op_dead_args
, 0, nb_ops
* sizeof(uint16_t));
1366 static void dump_regs(TCGContext
*s
)
1372 for(i
= 0; i
< s
->nb_temps
; i
++) {
1374 printf(" %10s: ", tcg_get_arg_str_idx(s
, buf
, sizeof(buf
), i
));
1375 switch(ts
->val_type
) {
1377 printf("%s", tcg_target_reg_names
[ts
->reg
]);
1380 printf("%d(%s)", (int)ts
->mem_offset
, tcg_target_reg_names
[ts
->mem_reg
]);
1382 case TEMP_VAL_CONST
:
1383 printf("$0x%" TCG_PRIlx
, ts
->val
);
1395 for(i
= 0; i
< TCG_TARGET_NB_REGS
; i
++) {
1396 if (s
->reg_to_temp
[i
] >= 0) {
1398 tcg_target_reg_names
[i
],
1399 tcg_get_arg_str_idx(s
, buf
, sizeof(buf
), s
->reg_to_temp
[i
]));
1404 static void check_regs(TCGContext
*s
)
1410 for(reg
= 0; reg
< TCG_TARGET_NB_REGS
; reg
++) {
1411 k
= s
->reg_to_temp
[reg
];
1414 if (ts
->val_type
!= TEMP_VAL_REG
||
1416 printf("Inconsistency for register %s:\n",
1417 tcg_target_reg_names
[reg
]);
1422 for(k
= 0; k
< s
->nb_temps
; k
++) {
1424 if (ts
->val_type
== TEMP_VAL_REG
&&
1426 s
->reg_to_temp
[ts
->reg
] != k
) {
1427 printf("Inconsistency for temp %s:\n",
1428 tcg_get_arg_str_idx(s
, buf
, sizeof(buf
), k
));
1430 printf("reg state:\n");
1438 static void temp_allocate_frame(TCGContext
*s
, int temp
)
1441 ts
= &s
->temps
[temp
];
1442 #ifndef __sparc_v9__ /* Sparc64 stack is accessed with offset of 2047 */
1443 s
->current_frame_offset
= (s
->current_frame_offset
+
1444 (tcg_target_long
)sizeof(tcg_target_long
) - 1) &
1445 ~(sizeof(tcg_target_long
) - 1);
1447 if (s
->current_frame_offset
+ (tcg_target_long
)sizeof(tcg_target_long
) >
1451 ts
->mem_offset
= s
->current_frame_offset
;
1452 ts
->mem_reg
= s
->frame_reg
;
1453 ts
->mem_allocated
= 1;
1454 s
->current_frame_offset
+= (tcg_target_long
)sizeof(tcg_target_long
);
1457 /* free register 'reg' by spilling the corresponding temporary if necessary */
1458 static void tcg_reg_free(TCGContext
*s
, int reg
)
1463 temp
= s
->reg_to_temp
[reg
];
1465 ts
= &s
->temps
[temp
];
1466 assert(ts
->val_type
== TEMP_VAL_REG
);
1467 if (!ts
->mem_coherent
) {
1468 if (!ts
->mem_allocated
)
1469 temp_allocate_frame(s
, temp
);
1470 tcg_out_st(s
, ts
->type
, reg
, ts
->mem_reg
, ts
->mem_offset
);
1472 ts
->val_type
= TEMP_VAL_MEM
;
1473 s
->reg_to_temp
[reg
] = -1;
1477 /* Allocate a register belonging to reg1 & ~reg2 */
1478 static int tcg_reg_alloc(TCGContext
*s
, TCGRegSet reg1
, TCGRegSet reg2
)
1483 tcg_regset_andnot(reg_ct
, reg1
, reg2
);
1485 /* first try free registers */
1486 for(i
= 0; i
< ARRAY_SIZE(tcg_target_reg_alloc_order
); i
++) {
1487 reg
= tcg_target_reg_alloc_order
[i
];
1488 if (tcg_regset_test_reg(reg_ct
, reg
) && s
->reg_to_temp
[reg
] == -1)
1492 /* XXX: do better spill choice */
1493 for(i
= 0; i
< ARRAY_SIZE(tcg_target_reg_alloc_order
); i
++) {
1494 reg
= tcg_target_reg_alloc_order
[i
];
1495 if (tcg_regset_test_reg(reg_ct
, reg
)) {
1496 tcg_reg_free(s
, reg
);
1504 /* save a temporary to memory. 'allocated_regs' is used in case a
1505 temporary register needs to be allocated to store a constant. */
1506 static void temp_save(TCGContext
*s
, int temp
, TCGRegSet allocated_regs
)
1511 ts
= &s
->temps
[temp
];
1512 if (!ts
->fixed_reg
) {
1513 switch(ts
->val_type
) {
1515 tcg_reg_free(s
, ts
->reg
);
1518 ts
->val_type
= TEMP_VAL_MEM
;
1520 case TEMP_VAL_CONST
:
1521 reg
= tcg_reg_alloc(s
, tcg_target_available_regs
[ts
->type
],
1523 if (!ts
->mem_allocated
)
1524 temp_allocate_frame(s
, temp
);
1525 tcg_out_movi(s
, ts
->type
, reg
, ts
->val
);
1526 tcg_out_st(s
, ts
->type
, reg
, ts
->mem_reg
, ts
->mem_offset
);
1527 ts
->val_type
= TEMP_VAL_MEM
;
1537 /* save globals to their canonical location and assume they can be
1538 modified by the following code. 'allocated_regs' is used in case a
1539 temporary register needs to be allocated to store a constant. */
1540 static void save_globals(TCGContext
*s
, TCGRegSet allocated_regs
)
/* globals occupy temp indices [0, nb_globals); each one is passed to
   temp_save() with 'allocated_regs' forwarded unchanged */
1544 for(i
= 0; i
< s
->nb_globals
; i
++) {
1545 temp_save(s
, i
, allocated_regs
);
1549 /* at the end of a basic block, we assume all temporaries are dead and
1550 all globals are stored at their canonical location. */
/* Walks the non-global temps, indices s->nb_globals up to
   s->nb_temps - 1.  A temp with temp_local set is written back with
   temp_save(); the other visible path clears the reg_to_temp[] entry
   of a temp held in a register and marks the temp TEMP_VAL_DEAD.
   After the loop, save_globals() is called with the same
   'allocated_regs'.
   NOTE(review): the line that assigns 'ts' and the construct that
   separates the two paths are not visible in this excerpt. */
1551 static void tcg_reg_alloc_bb_end(TCGContext
*s
, TCGRegSet allocated_regs
)
1556 for(i
= s
->nb_globals
; i
< s
->nb_temps
; i
++) {
1558 if (ts
->temp_local
) {
1559 temp_save(s
, i
, allocated_regs
);
1561 if (ts
->val_type
== TEMP_VAL_REG
) {
1562 s
->reg_to_temp
[ts
->reg
] = -1;
1564 ts
->val_type
= TEMP_VAL_DEAD
;
1568 save_globals(s
, allocated_regs
);
/* Evaluates to 1 when bit 'n' of 'dead_args' is set, else 0.  The macro
   reads a variable named 'dead_args' from the scope where it is used;
   it is not passed as a macro argument. */
1571 #define IS_DEAD_ARG(n) ((dead_args >> (n)) & 1)
/* Register allocation for a move-immediate whose destination temp is
   args[0].  When the destination has fixed_reg set, the constant is
   emitted straight away with tcg_out_movi() into ots->reg.  Otherwise
   no instruction is emitted: a register mapping held by the
   destination is dropped from reg_to_temp[] and the temp is marked
   TEMP_VAL_CONST.
   NOTE(review): the assignment of 'val' is not visible in this
   excerpt, and the comment opened on the "for fixed registers" line
   has lost its closing line here. */
1573 static void tcg_reg_alloc_movi(TCGContext
*s
, const TCGArg
*args
)
1576 tcg_target_ulong val
;
1578 ots
= &s
->temps
[args
[0]];
1581 if (ots
->fixed_reg
) {
1582 /* for fixed registers, we do not do any constant
1584 tcg_out_movi(s
, ots
->type
, ots
->reg
, val
);
1586 /* The movi is not explicitly generated here */
1587 if (ots
->val_type
== TEMP_VAL_REG
)
1588 s
->reg_to_temp
[ots
->reg
] = -1;
1589 ots
->val_type
= TEMP_VAL_CONST
;
/* Register allocation for a temp-to-temp move: args[0] is the
   destination temp (ots), args[1] the source temp (ts), and the
   register constraint is taken from def->args_ct[0].
   The code branches on where the source currently lives:
     - TEMP_VAL_REG: if the source is dead after this op
       (IS_DEAD_ARG(1)) and neither temp has fixed_reg set, no move is
       emitted and the source is marked TEMP_VAL_DEAD; otherwise
       tcg_out_mov() is emitted when the chosen register differs from
       ts->reg.
     - TEMP_VAL_MEM: the value is loaded with tcg_out_ld().
     - TEMP_VAL_CONST: a fixed_reg destination gets tcg_out_movi();
       any other destination just becomes TEMP_VAL_CONST.
   The visible tail records the destination as living in 'reg'
   (reg_to_temp[reg] = args[0], TEMP_VAL_REG) with mem_coherent
   cleared.
   NOTE(review): the 'args' parameter line, several assignments to
   'reg', and the else/return lines that separate these paths are not
   visible in this excerpt. */
1594 static void tcg_reg_alloc_mov(TCGContext
*s
, const TCGOpDef
*def
,
1596 unsigned int dead_args
)
1600 const TCGArgConstraint
*arg_ct
;
1602 ots
= &s
->temps
[args
[0]];
1603 ts
= &s
->temps
[args
[1]];
1604 arg_ct
= &def
->args_ct
[0];
1606 /* XXX: always mark arg dead if IS_DEAD_ARG(1) */
1607 if (ts
->val_type
== TEMP_VAL_REG
) {
1608 if (IS_DEAD_ARG(1) && !ts
->fixed_reg
&& !ots
->fixed_reg
) {
1609 /* the mov can be suppressed */
1610 if (ots
->val_type
== TEMP_VAL_REG
)
1611 s
->reg_to_temp
[ots
->reg
] = -1;
1613 s
->reg_to_temp
[reg
] = -1;
1614 ts
->val_type
= TEMP_VAL_DEAD
;
1616 if (ots
->val_type
== TEMP_VAL_REG
) {
1619 reg
= tcg_reg_alloc(s
, arg_ct
->u
.regs
, s
->reserved_regs
);
1621 if (ts
->reg
!= reg
) {
1622 tcg_out_mov(s
, ots
->type
, reg
, ts
->reg
);
1625 } else if (ts
->val_type
== TEMP_VAL_MEM
) {
1626 if (ots
->val_type
== TEMP_VAL_REG
) {
1629 reg
= tcg_reg_alloc(s
, arg_ct
->u
.regs
, s
->reserved_regs
);
1631 tcg_out_ld(s
, ts
->type
, reg
, ts
->mem_reg
, ts
->mem_offset
);
1632 } else if (ts
->val_type
== TEMP_VAL_CONST
) {
1633 if (ots
->fixed_reg
) {
1635 tcg_out_movi(s
, ots
->type
, reg
, ts
->val
);
1637 /* propagate constant */
1638 if (ots
->val_type
== TEMP_VAL_REG
)
1639 s
->reg_to_temp
[ots
->reg
] = -1;
1640 ots
->val_type
= TEMP_VAL_CONST
;
1647 s
->reg_to_temp
[reg
] = args
[0];
1649 ots
->val_type
= TEMP_VAL_REG
;
1650 ots
->mem_coherent
= 0;
/* Generic register allocation for one op, followed by its emission.
   Visible phases, in order:
     1. Copy the def->nb_cargs constant arguments from 'args' into
        'new_args' unchanged.
     2. Inputs, visited in def->sorted_args order: a TEMP_VAL_MEM temp
        is loaded into a register; a TEMP_VAL_CONST temp is either
        passed as a constant (when tcg_target_const_match() accepts
        it) or materialised with tcg_out_movi(); a register that does
        not satisfy the constraint, or an aliased input that must be
        preserved, is copied with tcg_out_mov().
     3. If def->flags has TCG_OPF_BB_END, tcg_reg_alloc_bb_end() is
        called.  The other visible path marks dead inputs, frees the
        call-clobbered registers and saves globals when
        TCG_OPF_CALL_CLOBBER is set, then chooses output registers.
     4. tcg_out_op() emits the instruction.
     5. Outputs that belong to a fixed_reg temp are moved into ts->reg
        when it differs from the register used.
   NOTE(review): the 'args' parameter line, the assignments to 'arg',
   new_args[] and const_args[], and the else/label lines (including
   the allocate_in_reg label targeted by the gotos) are not visible in
   this excerpt. */
1653 static void tcg_reg_alloc_op(TCGContext
*s
,
1654 const TCGOpDef
*def
, TCGOpcode opc
,
1656 unsigned int dead_args
)
1658 TCGRegSet allocated_regs
;
1659 int i
, k
, nb_iargs
, nb_oargs
, reg
;
1661 const TCGArgConstraint
*arg_ct
;
1663 TCGArg new_args
[TCG_MAX_OP_ARGS
];
1664 int const_args
[TCG_MAX_OP_ARGS
];
1666 nb_oargs
= def
->nb_oargs
;
1667 nb_iargs
= def
->nb_iargs
;
1669 /* copy constants */
1670 memcpy(new_args
+ nb_oargs
+ nb_iargs
,
1671 args
+ nb_oargs
+ nb_iargs
,
1672 sizeof(TCGArg
) * def
->nb_cargs
);
1674 /* satisfy input constraints */
/* allocated_regs starts as the reserved set and gains each register
   chosen for an input, so later inputs cannot be given the same one. */
1675 tcg_regset_set(allocated_regs
, s
->reserved_regs
);
1676 for(k
= 0; k
< nb_iargs
; k
++) {
1677 i
= def
->sorted_args
[nb_oargs
+ k
];
1679 arg_ct
= &def
->args_ct
[i
];
1680 ts
= &s
->temps
[arg
];
1681 if (ts
->val_type
== TEMP_VAL_MEM
) {
1682 reg
= tcg_reg_alloc(s
, arg_ct
->u
.regs
, allocated_regs
);
1683 tcg_out_ld(s
, ts
->type
, reg
, ts
->mem_reg
, ts
->mem_offset
);
1684 ts
->val_type
= TEMP_VAL_REG
;
/* the register was just loaded from the memory slot, so both agree */
1686 ts
->mem_coherent
= 1;
1687 s
->reg_to_temp
[reg
] = arg
;
1688 } else if (ts
->val_type
== TEMP_VAL_CONST
) {
1689 if (tcg_target_const_match(ts
->val
, arg_ct
)) {
1690 /* constant is OK for instruction */
1692 new_args
[i
] = ts
->val
;
1695 /* need to move to a register */
1696 reg
= tcg_reg_alloc(s
, arg_ct
->u
.regs
, allocated_regs
);
1697 tcg_out_movi(s
, ts
->type
, reg
, ts
->val
);
1698 ts
->val_type
= TEMP_VAL_REG
;
1700 ts
->mem_coherent
= 0;
1701 s
->reg_to_temp
[reg
] = arg
;
1704 assert(ts
->val_type
== TEMP_VAL_REG
);
1705 if (arg_ct
->ct
& TCG_CT_IALIAS
) {
1706 if (ts
->fixed_reg
) {
1707 /* if fixed register, we must allocate a new register
1708 if the alias is not the same register */
1709 if (arg
!= args
[arg_ct
->alias_index
])
1710 goto allocate_in_reg
;
1712 /* if the input is aliased to an output and if it is
1713 not dead after the instruction, we must allocate
1714 a new register and move it */
1715 if (!IS_DEAD_ARG(i
)) {
1716 goto allocate_in_reg
;
1721 if (tcg_regset_test_reg(arg_ct
->u
.regs
, reg
)) {
1722 /* nothing to do : the constraint is satisfied */
1725 /* allocate a new register matching the constraint
1726 and move the temporary register into it */
1727 reg
= tcg_reg_alloc(s
, arg_ct
->u
.regs
, allocated_regs
);
1728 tcg_out_mov(s
, ts
->type
, reg
, ts
->reg
);
1732 tcg_regset_set_reg(allocated_regs
, reg
);
1736 if (def
->flags
& TCG_OPF_BB_END
) {
1737 tcg_reg_alloc_bb_end(s
, allocated_regs
);
1739 /* mark dead temporaries and free the associated registers */
1740 for(i
= nb_oargs
; i
< nb_oargs
+ nb_iargs
; i
++) {
1742 if (IS_DEAD_ARG(i
)) {
1743 ts
= &s
->temps
[arg
];
1744 if (!ts
->fixed_reg
) {
1745 if (ts
->val_type
== TEMP_VAL_REG
)
1746 s
->reg_to_temp
[ts
->reg
] = -1;
1747 ts
->val_type
= TEMP_VAL_DEAD
;
1752 if (def
->flags
& TCG_OPF_CALL_CLOBBER
) {
1753 /* XXX: permit generic clobber register list ? */
1754 for(reg
= 0; reg
< TCG_TARGET_NB_REGS
; reg
++) {
1755 if (tcg_regset_test_reg(tcg_target_call_clobber_regs
, reg
)) {
1756 tcg_reg_free(s
, reg
);
1759 /* XXX: for load/store we could do that only for the slow path
1760 (i.e. when a memory callback is called) */
1762 /* store globals and free associated registers (we assume the insn
1763 can modify any global. */
1764 save_globals(s
, allocated_regs
);
1767 /* satisfy the output constraints */
/* allocated_regs is reset to the reserved set before outputs are
   assigned, so it no longer contains the input registers */
1768 tcg_regset_set(allocated_regs
, s
->reserved_regs
);
1769 for(k
= 0; k
< nb_oargs
; k
++) {
1770 i
= def
->sorted_args
[k
];
1772 arg_ct
= &def
->args_ct
[i
];
1773 ts
= &s
->temps
[arg
];
1774 if (arg_ct
->ct
& TCG_CT_ALIAS
) {
/* an aliased output reuses the register chosen for its paired input */
1775 reg
= new_args
[arg_ct
->alias_index
];
1777 /* if fixed register, we try to use it */
1779 if (ts
->fixed_reg
&&
1780 tcg_regset_test_reg(arg_ct
->u
.regs
, reg
)) {
1783 reg
= tcg_reg_alloc(s
, arg_ct
->u
.regs
, allocated_regs
);
1785 tcg_regset_set_reg(allocated_regs
, reg
);
1786 /* if a fixed register is used, then a move will be done afterwards */
1787 if (!ts
->fixed_reg
) {
1788 if (ts
->val_type
== TEMP_VAL_REG
)
1789 s
->reg_to_temp
[ts
->reg
] = -1;
1790 if (IS_DEAD_ARG(i
)) {
1791 ts
->val_type
= TEMP_VAL_DEAD
;
1793 ts
->val_type
= TEMP_VAL_REG
;
1795 /* temp value is modified, so the value kept in memory is
1796 potentially not the same */
1797 ts
->mem_coherent
= 0;
1798 s
->reg_to_temp
[reg
] = arg
;
1806 /* emit instruction */
1807 tcg_out_op(s
, opc
, new_args
, const_args
);
1809 /* move the outputs in the correct register if needed */
1810 for(i
= 0; i
< nb_oargs
; i
++) {
1811 ts
= &s
->temps
[args
[i
]];
1813 if (ts
->fixed_reg
&& ts
->reg
!= reg
) {
1814 tcg_out_mov(s
, ts
->type
, ts
->reg
, reg
);
/* Two definitions of STACK_DIR(x) are visible: one that negates x,
   placed right after the TCG_TARGET_STACK_GROWSUP test, and one that
   yields x unchanged.
   NOTE(review): the #else/#endif lines that would select between them
   are not visible in this excerpt. */
1819 #ifdef TCG_TARGET_STACK_GROWSUP
1820 #define STACK_DIR(x) (-(x))
1822 #define STACK_DIR(x) (x)
/* Register allocation and emission for a call op.
   The output and input counts are unpacked from 'arg' (nb_oargs =
   arg >> 16, nb_iargs = arg & 0xffff).  The last input is the
   function address, so nb_params = nb_iargs - 1, and the call flags
   are read from args[nb_oargs + nb_iargs].
   Visible phases, in order:
     1. Parameters beyond the first nb_regs are stored to stack slots
        relative to TCG_REG_CALL_STACK, starting at
        TCG_TARGET_CALL_STACK_OFFSET.
     2. The first nb_regs parameters are placed in
        tcg_target_call_iarg_regs[], after freeing each register.
     3. The function address is passed as a constant when
        tcg_target_const_match() accepts it, otherwise it is brought
        into a register that satisfies def->args_ct[0].
     4. Dead inputs are marked, call-clobbered registers are freed,
        and globals are saved unless 'flags' has TCG_CALL_CONST.
     5. tcg_out_op() emits the call, then each output is bound to
        tcg_target_call_oarg_regs[i] (or moved into its fixed
        register).
   Returns nb_iargs + nb_oargs + def->nb_cargs + 1, which the visible
   caller adds to its 'args' pointer.
   NOTE(review): the line that loads 'arg', the body of the
   allocate_args branch, several assignments to 'arg', 'reg',
   'func_arg' and 'const_func_arg', and the else lines are not visible
   in this excerpt. */
1825 static int tcg_reg_alloc_call(TCGContext
*s
, const TCGOpDef
*def
,
1826 TCGOpcode opc
, const TCGArg
*args
,
1827 unsigned int dead_args
)
1829 int nb_iargs
, nb_oargs
, flags
, nb_regs
, i
, reg
, nb_params
;
1830 TCGArg arg
, func_arg
;
1832 tcg_target_long stack_offset
, call_stack_size
, func_addr
;
1833 int const_func_arg
, allocate_args
;
1834 TCGRegSet allocated_regs
;
1835 const TCGArgConstraint
*arg_ct
;
1839 nb_oargs
= arg
>> 16;
1840 nb_iargs
= arg
& 0xffff;
1841 nb_params
= nb_iargs
- 1;
1843 flags
= args
[nb_oargs
+ nb_iargs
];
/* never use more argument registers than there are parameters */
1845 nb_regs
= tcg_target_get_call_iarg_regs_count(flags
);
1846 if (nb_regs
> nb_params
)
1847 nb_regs
= nb_params
;
1849 /* assign stack slots first */
/* one tcg_target_long per stack parameter, rounded up to a multiple of
   TCG_TARGET_STACK_ALIGN (the mask form assumes a power of two) */
1850 call_stack_size
= (nb_params
- nb_regs
) * sizeof(tcg_target_long
);
1851 call_stack_size
= (call_stack_size
+ TCG_TARGET_STACK_ALIGN
- 1) &
1852 ~(TCG_TARGET_STACK_ALIGN
- 1);
1853 allocate_args
= (call_stack_size
> TCG_STATIC_CALL_ARGS_SIZE
);
1854 if (allocate_args
) {
1855 /* XXX: if more than TCG_STATIC_CALL_ARGS_SIZE is needed,
1856 preallocate call stack */
1860 stack_offset
= TCG_TARGET_CALL_STACK_OFFSET
;
1861 for(i
= nb_regs
; i
< nb_params
; i
++) {
1862 arg
= args
[nb_oargs
+ i
];
1863 #ifdef TCG_TARGET_STACK_GROWSUP
1864 stack_offset
-= sizeof(tcg_target_long
);
1866 if (arg
!= TCG_CALL_DUMMY_ARG
) {
1867 ts
= &s
->temps
[arg
];
1868 if (ts
->val_type
== TEMP_VAL_REG
) {
1869 tcg_out_st(s
, ts
->type
, ts
->reg
, TCG_REG_CALL_STACK
, stack_offset
);
1870 } else if (ts
->val_type
== TEMP_VAL_MEM
) {
1871 reg
= tcg_reg_alloc(s
, tcg_target_available_regs
[ts
->type
],
1873 /* XXX: not correct if reading values from the stack */
1874 tcg_out_ld(s
, ts
->type
, reg
, ts
->mem_reg
, ts
->mem_offset
);
1875 tcg_out_st(s
, ts
->type
, reg
, TCG_REG_CALL_STACK
, stack_offset
);
1876 } else if (ts
->val_type
== TEMP_VAL_CONST
) {
1877 reg
= tcg_reg_alloc(s
, tcg_target_available_regs
[ts
->type
],
1879 /* XXX: sign extend may be needed on some targets */
1880 tcg_out_movi(s
, ts
->type
, reg
, ts
->val
);
1881 tcg_out_st(s
, ts
->type
, reg
, TCG_REG_CALL_STACK
, stack_offset
);
1886 #ifndef TCG_TARGET_STACK_GROWSUP
1887 stack_offset
+= sizeof(tcg_target_long
);
1891 /* assign input registers */
1892 tcg_regset_set(allocated_regs
, s
->reserved_regs
);
1893 for(i
= 0; i
< nb_regs
; i
++) {
1894 arg
= args
[nb_oargs
+ i
];
1895 if (arg
!= TCG_CALL_DUMMY_ARG
) {
1896 ts
= &s
->temps
[arg
];
1897 reg
= tcg_target_call_iarg_regs
[i
];
/* release whatever currently occupies the argument register */
1898 tcg_reg_free(s
, reg
);
1899 if (ts
->val_type
== TEMP_VAL_REG
) {
1900 if (ts
->reg
!= reg
) {
1901 tcg_out_mov(s
, ts
->type
, reg
, ts
->reg
);
1903 } else if (ts
->val_type
== TEMP_VAL_MEM
) {
1904 tcg_out_ld(s
, ts
->type
, reg
, ts
->mem_reg
, ts
->mem_offset
);
1905 } else if (ts
->val_type
== TEMP_VAL_CONST
) {
1906 /* XXX: sign extend ? */
1907 tcg_out_movi(s
, ts
->type
, reg
, ts
->val
);
1911 tcg_regset_set_reg(allocated_regs
, reg
);
1915 /* assign function address */
1916 func_arg
= args
[nb_oargs
+ nb_iargs
- 1];
1917 arg_ct
= &def
->args_ct
[0];
1918 ts
= &s
->temps
[func_arg
];
1919 func_addr
= ts
->val
;
1921 if (ts
->val_type
== TEMP_VAL_MEM
) {
1922 reg
= tcg_reg_alloc(s
, arg_ct
->u
.regs
, allocated_regs
);
1923 tcg_out_ld(s
, ts
->type
, reg
, ts
->mem_reg
, ts
->mem_offset
);
1925 tcg_regset_set_reg(allocated_regs
, reg
);
1926 } else if (ts
->val_type
== TEMP_VAL_REG
) {
1928 if (!tcg_regset_test_reg(arg_ct
->u
.regs
, reg
)) {
1929 reg
= tcg_reg_alloc(s
, arg_ct
->u
.regs
, allocated_regs
);
1930 tcg_out_mov(s
, ts
->type
, reg
, ts
->reg
);
1933 tcg_regset_set_reg(allocated_regs
, reg
);
1934 } else if (ts
->val_type
== TEMP_VAL_CONST
) {
1935 if (tcg_target_const_match(func_addr
, arg_ct
)) {
1937 func_arg
= func_addr
;
1939 reg
= tcg_reg_alloc(s
, arg_ct
->u
.regs
, allocated_regs
);
1940 tcg_out_movi(s
, ts
->type
, reg
, func_addr
);
1942 tcg_regset_set_reg(allocated_regs
, reg
);
1949 /* mark dead temporaries and free the associated registers */
1950 for(i
= nb_oargs
; i
< nb_iargs
+ nb_oargs
; i
++) {
1952 if (IS_DEAD_ARG(i
)) {
1953 ts
= &s
->temps
[arg
];
1954 if (!ts
->fixed_reg
) {
1955 if (ts
->val_type
== TEMP_VAL_REG
)
1956 s
->reg_to_temp
[ts
->reg
] = -1;
1957 ts
->val_type
= TEMP_VAL_DEAD
;
1962 /* clobber call registers */
1963 for(reg
= 0; reg
< TCG_TARGET_NB_REGS
; reg
++) {
1964 if (tcg_regset_test_reg(tcg_target_call_clobber_regs
, reg
)) {
1965 tcg_reg_free(s
, reg
);
1969 /* store globals and free associated registers (we assume the call
1970 can modify any global. */
1971 if (!(flags
& TCG_CALL_CONST
)) {
1972 save_globals(s
, allocated_regs
);
1975 tcg_out_op(s
, opc
, &func_arg
, &const_func_arg
);
1977 /* assign output registers and emit moves if needed */
1978 for(i
= 0; i
< nb_oargs
; i
++) {
1980 ts
= &s
->temps
[arg
];
1981 reg
= tcg_target_call_oarg_regs
[i
];
/* the return register is expected to have no temp mapped to it here */
1982 assert(s
->reg_to_temp
[reg
] == -1);
1983 if (ts
->fixed_reg
) {
1984 if (ts
->reg
!= reg
) {
1985 tcg_out_mov(s
, ts
->type
, ts
->reg
, reg
);
1988 if (ts
->val_type
== TEMP_VAL_REG
)
1989 s
->reg_to_temp
[ts
->reg
] = -1;
1990 if (IS_DEAD_ARG(i
)) {
1991 ts
->val_type
= TEMP_VAL_DEAD
;
1993 ts
->val_type
= TEMP_VAL_REG
;
1995 ts
->mem_coherent
= 0;
1996 s
->reg_to_temp
[reg
] = arg
;
2001 return nb_iargs
+ nb_oargs
+ def
->nb_cargs
+ 1;
/* Profiler-only section (CONFIG_PROFILER): tcg_table_op_count[] has
   one 64-bit counter per opcode, and dump_op_count() writes them to
   the fixed path /tmp/op.log, one "<name> <count>" line per opcode
   from INDEX_op_end up to NB_OPS - 1.
   NOTE(review): no check of the fopen() result and no fclose() call
   are visible in this excerpt. */
2004 #ifdef CONFIG_PROFILER
2006 static int64_t tcg_table_op_count
[NB_OPS
];
2008 static void dump_op_count(void)
2012 f
= fopen("/tmp/op.log", "w");
2013 for(i
= INDEX_op_end
; i
< NB_OPS
; i
++) {
2014 fprintf(f
, "%s %" PRId64
"\n", tcg_op_defs
[i
].name
, tcg_table_op_count
[i
]);
/* Shared code-generation driver behind tcg_gen_code() and
   tcg_gen_code_search_pc().
   Visible sequence: optionally dump the ops when CPU_LOG_TB_OP
   logging is enabled; run tcg_liveness_analysis(), timed into
   s->la_time in profiler builds; optionally dump the ops again under
   CPU_LOG_TB_OP_OPT; call tcg_reg_alloc_start(); point s->code_buf
   and s->code_ptr at gen_code_buf; then dispatch on each opcode read
   from gen_opc_buf[]:
     - mov_i32 / mov_i64   -> tcg_reg_alloc_mov()
     - movi_i32 / movi_i64 -> tcg_reg_alloc_movi()
     - discard             -> mark the temp args[0] dead
     - set_label           -> tcg_reg_alloc_bb_end() then tcg_out_label()
     - the call path advances 'args' by the value returned from
       tcg_reg_alloc_call()
     - the remaining path goes to tcg_reg_alloc_op()
   'args' is then advanced by def->nb_args, and 'search_pc' is compared
   with the number of bytes emitted so far.
   NOTE(review): the third parameter line, the loop and switch
   headers, the break/return lines, the preprocessor guard around the
   printf, and the value returned are not visible in this excerpt. */
2021 static inline int tcg_gen_code_common(TCGContext
*s
, uint8_t *gen_code_buf
,
2026 const TCGOpDef
*def
;
2027 unsigned int dead_args
;
2031 if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP
))) {
2033 tcg_dump_ops(s
, logfile
);
2038 #ifdef CONFIG_PROFILER
2039 s
->la_time
-= profile_getclock();
2041 tcg_liveness_analysis(s
);
2042 #ifdef CONFIG_PROFILER
2043 s
->la_time
+= profile_getclock();
2047 if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_OPT
))) {
2048 qemu_log("OP after liveness analysis:\n");
2049 tcg_dump_ops(s
, logfile
);
2054 tcg_reg_alloc_start(s
);
2056 s
->code_buf
= gen_code_buf
;
2057 s
->code_ptr
= gen_code_buf
;
2059 args
= gen_opparam_buf
;
2063 opc
= gen_opc_buf
[op_index
];
2064 #ifdef CONFIG_PROFILER
2065 tcg_table_op_count
[opc
]++;
2067 def
= &tcg_op_defs
[opc
];
2069 printf("%s: %d %d %d\n", def
->name
,
2070 def
->nb_oargs
, def
->nb_iargs
, def
->nb_cargs
);
2074 case INDEX_op_mov_i32
:
2075 #if TCG_TARGET_REG_BITS == 64
2076 case INDEX_op_mov_i64
:
2078 dead_args
= s
->op_dead_args
[op_index
];
2079 tcg_reg_alloc_mov(s
, def
, args
, dead_args
);
2081 case INDEX_op_movi_i32
:
2082 #if TCG_TARGET_REG_BITS == 64
2083 case INDEX_op_movi_i64
:
2085 tcg_reg_alloc_movi(s
, args
);
2087 case INDEX_op_debug_insn_start
:
2088 /* debug instruction */
2098 case INDEX_op_discard
:
2101 ts
= &s
->temps
[args
[0]];
2102 /* mark the temporary as dead */
2103 if (!ts
->fixed_reg
) {
2104 if (ts
->val_type
== TEMP_VAL_REG
)
2105 s
->reg_to_temp
[ts
->reg
] = -1;
2106 ts
->val_type
= TEMP_VAL_DEAD
;
2110 case INDEX_op_set_label
:
2111 tcg_reg_alloc_bb_end(s
, s
->reserved_regs
);
2112 tcg_out_label(s
, args
[0], (long)s
->code_ptr
);
2115 dead_args
= s
->op_dead_args
[op_index
];
2116 args
+= tcg_reg_alloc_call(s
, def
, opc
, args
, dead_args
);
2121 /* Note: in order to speed up the code, it would be much
2122 faster to have specialized register allocator functions for
2123 some common argument patterns */
2124 dead_args
= s
->op_dead_args
[op_index
];
2125 tcg_reg_alloc_op(s
, def
, opc
, args
, dead_args
);
2128 args
+= def
->nb_args
;
2130 if (search_pc
>= 0 && search_pc
< s
->code_ptr
- gen_code_buf
) {
/* Generates host code for the current op stream into gen_code_buf.
   In profiler builds it first updates statistics: n is the number of
   ops (gen_opc_ptr - gen_opc_buf) and feeds op_count_max, while
   s->nb_temps feeds temp_count and temp_count_max.
   It then runs tcg_gen_code_common() with -1 as the search offset,
   flushes the instruction cache over [gen_code_buf, s->code_ptr), and
   returns the number of bytes emitted (s->code_ptr - gen_code_buf).
   NOTE(review): the declaration of 'n' and the other profiler lines
   in the gaps are not visible in this excerpt. */
2142 int tcg_gen_code(TCGContext
*s
, uint8_t *gen_code_buf
)
2144 #ifdef CONFIG_PROFILER
2147 n
= (gen_opc_ptr
- gen_opc_buf
);
2149 if (n
> s
->op_count_max
)
2150 s
->op_count_max
= n
;
2152 s
->temp_count
+= s
->nb_temps
;
2153 if (s
->nb_temps
> s
->temp_count_max
)
2154 s
->temp_count_max
= s
->nb_temps
;
2158 tcg_gen_code_common(s
, gen_code_buf
, -1);
2160 /* flush instruction cache */
2161 flush_icache_range((unsigned long)gen_code_buf
,
2162 (unsigned long)s
->code_ptr
);
2163 return s
->code_ptr
- gen_code_buf
;
2166 /* Return the index of the micro operation such that the pc after it is <
2167 offset bytes from the start of the TB. The contents of gen_code_buf must
2168 not be changed, though writing the same values is ok.
2169 Return -1 if not found. */
/* Thin wrapper: passes 'offset' as the third argument of
   tcg_gen_code_common() and returns its result unchanged. */
2170 int tcg_gen_code_search_pc(TCGContext
*s
, uint8_t *gen_code_buf
, long offset
)
2172 return tcg_gen_code_common(s
, gen_code_buf
, offset
);
/* Profiler build of tcg_dump_info(): prints the counters held in the
   global tcg_ctx through the supplied cpu_fprintf callback.
   'tot' is s->interm_time + s->code_time and is the numerator for the
   cycles-per-op and cycles-per-byte figures.  Where the guard is
   visible, a ratio is printed as 0 when its divisor is zero (the
   "x ? ... : 0" form); the liveness percentage substitutes 1 for a
   zero code_time.
   NOTE(review): several argument lines, the declaration of 'tot', and
   any zero check on 'tot' before the two "time" percentages are not
   visible in this excerpt. */
2175 #ifdef CONFIG_PROFILER
2176 void tcg_dump_info(FILE *f
, fprintf_function cpu_fprintf
)
2178 TCGContext
*s
= &tcg_ctx
;
2181 tot
= s
->interm_time
+ s
->code_time
;
2182 cpu_fprintf(f
, "JIT cycles %" PRId64
" (%0.3f s at 2.4 GHz)\n",
2184 cpu_fprintf(f
, "translated TBs %" PRId64
" (aborted=%" PRId64
" %0.1f%%)\n",
2186 s
->tb_count1
- s
->tb_count
,
2187 s
->tb_count1
? (double)(s
->tb_count1
- s
->tb_count
) / s
->tb_count1
* 100.0 : 0);
2188 cpu_fprintf(f
, "avg ops/TB %0.1f max=%d\n",
2189 s
->tb_count
? (double)s
->op_count
/ s
->tb_count
: 0, s
->op_count_max
);
2190 cpu_fprintf(f
, "deleted ops/TB %0.2f\n",
2192 (double)s
->del_op_count
/ s
->tb_count
: 0);
2193 cpu_fprintf(f
, "avg temps/TB %0.2f max=%d\n",
2195 (double)s
->temp_count
/ s
->tb_count
: 0,
2198 cpu_fprintf(f
, "cycles/op %0.1f\n",
2199 s
->op_count
? (double)tot
/ s
->op_count
: 0);
2200 cpu_fprintf(f
, "cycles/in byte %0.1f\n",
2201 s
->code_in_len
? (double)tot
/ s
->code_in_len
: 0);
2202 cpu_fprintf(f
, "cycles/out byte %0.1f\n",
2203 s
->code_out_len
? (double)tot
/ s
->code_out_len
: 0);
2206 cpu_fprintf(f
, " gen_interm time %0.1f%%\n",
2207 (double)s
->interm_time
/ tot
* 100.0);
2208 cpu_fprintf(f
, " gen_code time %0.1f%%\n",
2209 (double)s
->code_time
/ tot
* 100.0);
2210 cpu_fprintf(f
, "liveness/code time %0.1f%%\n",
2211 (double)s
->la_time
/ (s
->code_time
? s
->code_time
: 1) * 100.0);
2212 cpu_fprintf(f
, "cpu_restore count %" PRId64
"\n",
2214 cpu_fprintf(f
, " avg cycles %0.1f\n",
2215 s
->restore_count
? (double)s
->restore_time
/ s
->restore_count
: 0);
2220 void tcg_dump_info(FILE *f
, fprintf_function cpu_fprintf
)
2222 cpu_fprintf(f
, "[TCG profiler not compiled]\n");