tcg: Remove TCG_TARGET_HAS_GUEST_BASE define
[qemu/kevin.git] / tcg / tcg.c
bloba171f784a4f01f060d3b30f2148d5253cd4c24ea
1 /*
2 * Tiny Code Generator for QEMU
4 * Copyright (c) 2008 Fabrice Bellard
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
25 /* define it to use liveness analysis (better code) */
26 #define USE_LIVENESS_ANALYSIS
27 #define USE_TCG_OPTIMIZATIONS
29 #include "config.h"
31 /* Define to dump the ELF file used to communicate with GDB. */
32 #undef DEBUG_JIT
34 #if !defined(CONFIG_DEBUG_TCG) && !defined(NDEBUG)
35 /* define it to suppress various consistency checks (faster) */
36 #define NDEBUG
37 #endif
39 #include "qemu-common.h"
40 #include "cache-utils.h"
41 #include "host-utils.h"
42 #include "qemu-timer.h"
44 /* Note: the long term plan is to reduce the dependencies on the QEMU
45 CPU definitions. Currently they are used for qemu_ld/st
46 instructions */
47 #define NO_CPU_IO_DEFS
48 #include "cpu.h"
50 #include "tcg-op.h"
52 #if TCG_TARGET_REG_BITS == 64
53 # define ELF_CLASS ELFCLASS64
54 #else
55 # define ELF_CLASS ELFCLASS32
56 #endif
57 #ifdef HOST_WORDS_BIGENDIAN
58 # define ELF_DATA ELFDATA2MSB
59 #else
60 # define ELF_DATA ELFDATA2LSB
61 #endif
63 #include "elf.h"
65 /* Forward declarations for functions declared in tcg-target.c and used here. */
66 static void tcg_target_init(TCGContext *s);
67 static void tcg_target_qemu_prologue(TCGContext *s);
68 static void patch_reloc(uint8_t *code_ptr, int type,
69 tcg_target_long value, tcg_target_long addend);
71 static void tcg_register_jit_int(void *buf, size_t size,
72 void *debug_frame, size_t debug_frame_size)
73 __attribute__((unused));
75 /* Forward declarations for functions declared and used in tcg-target.c. */
76 static int target_parse_constraint(TCGArgConstraint *ct, const char **pct_str);
77 static void tcg_out_ld(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg1,
78 tcg_target_long arg2);
79 static void tcg_out_mov(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg);
80 static void tcg_out_movi(TCGContext *s, TCGType type,
81 TCGReg ret, tcg_target_long arg);
82 static void tcg_out_op(TCGContext *s, TCGOpcode opc, const TCGArg *args,
83 const int *const_args);
84 static void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg, TCGReg arg1,
85 tcg_target_long arg2);
86 static int tcg_target_const_match(tcg_target_long val,
87 const TCGArgConstraint *arg_ct);
/* Table of op definitions.  Each DEF() entry pulled in from tcg-opc.h
   expands to one initializer: the stringified op name, the output, input
   and constant argument counts, the sum of those three counts, and the
   op flags. */
89 TCGOpDef tcg_op_defs[] = {
90 #define DEF(s, oargs, iargs, cargs, flags) { #s, oargs, iargs, cargs, iargs + oargs + cargs, flags },
91 #include "tcg-opc.h"
92 #undef DEF
/* Number of entries in tcg_op_defs. */
94 const size_t tcg_op_defs_max = ARRAY_SIZE(tcg_op_defs);
96 static TCGRegSet tcg_target_available_regs[2];
97 static TCGRegSet tcg_target_call_clobber_regs;
99 /* XXX: move that inside the context */
100 uint16_t *gen_opc_ptr;
101 TCGArg *gen_opparam_ptr;
103 static inline void tcg_out8(TCGContext *s, uint8_t v)
105 *s->code_ptr++ = v;
108 static inline void tcg_out16(TCGContext *s, uint16_t v)
110 *(uint16_t *)s->code_ptr = v;
111 s->code_ptr += 2;
114 static inline void tcg_out32(TCGContext *s, uint32_t v)
116 *(uint32_t *)s->code_ptr = v;
117 s->code_ptr += 4;
120 /* label relocation processing */
122 static void tcg_out_reloc(TCGContext *s, uint8_t *code_ptr, int type,
123 int label_index, long addend)
125 TCGLabel *l;
126 TCGRelocation *r;
128 l = &s->labels[label_index];
129 if (l->has_value) {
130 /* FIXME: This may break relocations on RISC targets that
131 modify instruction fields in place. The caller may not have
132 written the initial value. */
133 patch_reloc(code_ptr, type, l->u.value, addend);
134 } else {
135 /* add a new relocation entry */
136 r = tcg_malloc(sizeof(TCGRelocation));
137 r->type = type;
138 r->ptr = code_ptr;
139 r->addend = addend;
140 r->next = l->u.first_reloc;
141 l->u.first_reloc = r;
145 static void tcg_out_label(TCGContext *s, int label_index, void *ptr)
147 TCGLabel *l;
148 TCGRelocation *r;
149 tcg_target_long value = (tcg_target_long)ptr;
151 l = &s->labels[label_index];
152 if (l->has_value)
153 tcg_abort();
154 r = l->u.first_reloc;
155 while (r != NULL) {
156 patch_reloc(r->ptr, r->type, value, r->addend);
157 r = r->next;
159 l->has_value = 1;
160 l->u.value = value;
163 int gen_new_label(void)
165 TCGContext *s = &tcg_ctx;
166 int idx;
167 TCGLabel *l;
169 if (s->nb_labels >= TCG_MAX_LABELS)
170 tcg_abort();
171 idx = s->nb_labels++;
172 l = &s->labels[idx];
173 l->has_value = 0;
174 l->u.first_reloc = NULL;
175 return idx;
178 #include "tcg-target.c"
180 /* pool based memory allocation */
181 void *tcg_malloc_internal(TCGContext *s, int size)
183 TCGPool *p;
184 int pool_size;
186 if (size > TCG_POOL_CHUNK_SIZE) {
187 /* big malloc: insert a new pool (XXX: could optimize) */
188 p = g_malloc(sizeof(TCGPool) + size);
189 p->size = size;
190 p->next = s->pool_first_large;
191 s->pool_first_large = p;
192 return p->data;
193 } else {
194 p = s->pool_current;
195 if (!p) {
196 p = s->pool_first;
197 if (!p)
198 goto new_pool;
199 } else {
200 if (!p->next) {
201 new_pool:
202 pool_size = TCG_POOL_CHUNK_SIZE;
203 p = g_malloc(sizeof(TCGPool) + pool_size);
204 p->size = pool_size;
205 p->next = NULL;
206 if (s->pool_current)
207 s->pool_current->next = p;
208 else
209 s->pool_first = p;
210 } else {
211 p = p->next;
215 s->pool_current = p;
216 s->pool_cur = p->data + size;
217 s->pool_end = p->data + p->size;
218 return p->data;
221 void tcg_pool_reset(TCGContext *s)
223 TCGPool *p, *t;
224 for (p = s->pool_first_large; p; p = t) {
225 t = p->next;
226 g_free(p);
228 s->pool_first_large = NULL;
229 s->pool_cur = s->pool_end = NULL;
230 s->pool_current = NULL;
233 void tcg_context_init(TCGContext *s)
235 int op, total_args, n;
236 TCGOpDef *def;
237 TCGArgConstraint *args_ct;
238 int *sorted_args;
240 memset(s, 0, sizeof(*s));
241 s->nb_globals = 0;
243 /* Count total number of arguments and allocate the corresponding
244 space */
245 total_args = 0;
246 for(op = 0; op < NB_OPS; op++) {
247 def = &tcg_op_defs[op];
248 n = def->nb_iargs + def->nb_oargs;
249 total_args += n;
252 args_ct = g_malloc(sizeof(TCGArgConstraint) * total_args);
253 sorted_args = g_malloc(sizeof(int) * total_args);
255 for(op = 0; op < NB_OPS; op++) {
256 def = &tcg_op_defs[op];
257 def->args_ct = args_ct;
258 def->sorted_args = sorted_args;
259 n = def->nb_iargs + def->nb_oargs;
260 sorted_args += n;
261 args_ct += n;
264 tcg_target_init(s);
267 void tcg_prologue_init(TCGContext *s)
269 /* init global prologue and epilogue */
270 s->code_buf = code_gen_prologue;
271 s->code_ptr = s->code_buf;
272 tcg_target_qemu_prologue(s);
273 flush_icache_range((tcg_target_ulong)s->code_buf,
274 (tcg_target_ulong)s->code_ptr);
277 void tcg_set_frame(TCGContext *s, int reg,
278 tcg_target_long start, tcg_target_long size)
280 s->frame_start = start;
281 s->frame_end = start + size;
282 s->frame_reg = reg;
285 void tcg_func_start(TCGContext *s)
287 int i;
288 tcg_pool_reset(s);
289 s->nb_temps = s->nb_globals;
290 for(i = 0; i < (TCG_TYPE_COUNT * 2); i++)
291 s->first_free_temp[i] = -1;
292 s->labels = tcg_malloc(sizeof(TCGLabel) * TCG_MAX_LABELS);
293 s->nb_labels = 0;
294 s->current_frame_offset = s->frame_start;
296 #ifdef CONFIG_DEBUG_TCG
297 s->goto_tb_issue_mask = 0;
298 #endif
300 gen_opc_ptr = gen_opc_buf;
301 gen_opparam_ptr = gen_opparam_buf;
304 static inline void tcg_temp_alloc(TCGContext *s, int n)
306 if (n > TCG_MAX_TEMPS)
307 tcg_abort();
310 static inline int tcg_global_reg_new_internal(TCGType type, int reg,
311 const char *name)
313 TCGContext *s = &tcg_ctx;
314 TCGTemp *ts;
315 int idx;
317 #if TCG_TARGET_REG_BITS == 32
318 if (type != TCG_TYPE_I32)
319 tcg_abort();
320 #endif
321 if (tcg_regset_test_reg(s->reserved_regs, reg))
322 tcg_abort();
323 idx = s->nb_globals;
324 tcg_temp_alloc(s, s->nb_globals + 1);
325 ts = &s->temps[s->nb_globals];
326 ts->base_type = type;
327 ts->type = type;
328 ts->fixed_reg = 1;
329 ts->reg = reg;
330 ts->name = name;
331 s->nb_globals++;
332 tcg_regset_set_reg(s->reserved_regs, reg);
333 return idx;
336 TCGv_i32 tcg_global_reg_new_i32(int reg, const char *name)
338 int idx;
340 idx = tcg_global_reg_new_internal(TCG_TYPE_I32, reg, name);
341 return MAKE_TCGV_I32(idx);
344 TCGv_i64 tcg_global_reg_new_i64(int reg, const char *name)
346 int idx;
348 idx = tcg_global_reg_new_internal(TCG_TYPE_I64, reg, name);
349 return MAKE_TCGV_I64(idx);
352 static inline int tcg_global_mem_new_internal(TCGType type, int reg,
353 tcg_target_long offset,
354 const char *name)
356 TCGContext *s = &tcg_ctx;
357 TCGTemp *ts;
358 int idx;
360 idx = s->nb_globals;
361 #if TCG_TARGET_REG_BITS == 32
362 if (type == TCG_TYPE_I64) {
363 char buf[64];
364 tcg_temp_alloc(s, s->nb_globals + 2);
365 ts = &s->temps[s->nb_globals];
366 ts->base_type = type;
367 ts->type = TCG_TYPE_I32;
368 ts->fixed_reg = 0;
369 ts->mem_allocated = 1;
370 ts->mem_reg = reg;
371 #ifdef TCG_TARGET_WORDS_BIGENDIAN
372 ts->mem_offset = offset + 4;
373 #else
374 ts->mem_offset = offset;
375 #endif
376 pstrcpy(buf, sizeof(buf), name);
377 pstrcat(buf, sizeof(buf), "_0");
378 ts->name = strdup(buf);
379 ts++;
381 ts->base_type = type;
382 ts->type = TCG_TYPE_I32;
383 ts->fixed_reg = 0;
384 ts->mem_allocated = 1;
385 ts->mem_reg = reg;
386 #ifdef TCG_TARGET_WORDS_BIGENDIAN
387 ts->mem_offset = offset;
388 #else
389 ts->mem_offset = offset + 4;
390 #endif
391 pstrcpy(buf, sizeof(buf), name);
392 pstrcat(buf, sizeof(buf), "_1");
393 ts->name = strdup(buf);
395 s->nb_globals += 2;
396 } else
397 #endif
399 tcg_temp_alloc(s, s->nb_globals + 1);
400 ts = &s->temps[s->nb_globals];
401 ts->base_type = type;
402 ts->type = type;
403 ts->fixed_reg = 0;
404 ts->mem_allocated = 1;
405 ts->mem_reg = reg;
406 ts->mem_offset = offset;
407 ts->name = name;
408 s->nb_globals++;
410 return idx;
413 TCGv_i32 tcg_global_mem_new_i32(int reg, tcg_target_long offset,
414 const char *name)
416 int idx;
418 idx = tcg_global_mem_new_internal(TCG_TYPE_I32, reg, offset, name);
419 return MAKE_TCGV_I32(idx);
422 TCGv_i64 tcg_global_mem_new_i64(int reg, tcg_target_long offset,
423 const char *name)
425 int idx;
427 idx = tcg_global_mem_new_internal(TCG_TYPE_I64, reg, offset, name);
428 return MAKE_TCGV_I64(idx);
431 static inline int tcg_temp_new_internal(TCGType type, int temp_local)
433 TCGContext *s = &tcg_ctx;
434 TCGTemp *ts;
435 int idx, k;
437 k = type;
438 if (temp_local)
439 k += TCG_TYPE_COUNT;
440 idx = s->first_free_temp[k];
441 if (idx != -1) {
442 /* There is already an available temp with the
443 right type */
444 ts = &s->temps[idx];
445 s->first_free_temp[k] = ts->next_free_temp;
446 ts->temp_allocated = 1;
447 assert(ts->temp_local == temp_local);
448 } else {
449 idx = s->nb_temps;
450 #if TCG_TARGET_REG_BITS == 32
451 if (type == TCG_TYPE_I64) {
452 tcg_temp_alloc(s, s->nb_temps + 2);
453 ts = &s->temps[s->nb_temps];
454 ts->base_type = type;
455 ts->type = TCG_TYPE_I32;
456 ts->temp_allocated = 1;
457 ts->temp_local = temp_local;
458 ts->name = NULL;
459 ts++;
460 ts->base_type = TCG_TYPE_I32;
461 ts->type = TCG_TYPE_I32;
462 ts->temp_allocated = 1;
463 ts->temp_local = temp_local;
464 ts->name = NULL;
465 s->nb_temps += 2;
466 } else
467 #endif
469 tcg_temp_alloc(s, s->nb_temps + 1);
470 ts = &s->temps[s->nb_temps];
471 ts->base_type = type;
472 ts->type = type;
473 ts->temp_allocated = 1;
474 ts->temp_local = temp_local;
475 ts->name = NULL;
476 s->nb_temps++;
480 #if defined(CONFIG_DEBUG_TCG)
481 s->temps_in_use++;
482 #endif
483 return idx;
486 TCGv_i32 tcg_temp_new_internal_i32(int temp_local)
488 int idx;
490 idx = tcg_temp_new_internal(TCG_TYPE_I32, temp_local);
491 return MAKE_TCGV_I32(idx);
494 TCGv_i64 tcg_temp_new_internal_i64(int temp_local)
496 int idx;
498 idx = tcg_temp_new_internal(TCG_TYPE_I64, temp_local);
499 return MAKE_TCGV_I64(idx);
502 static inline void tcg_temp_free_internal(int idx)
504 TCGContext *s = &tcg_ctx;
505 TCGTemp *ts;
506 int k;
508 #if defined(CONFIG_DEBUG_TCG)
509 s->temps_in_use--;
510 if (s->temps_in_use < 0) {
511 fprintf(stderr, "More temporaries freed than allocated!\n");
513 #endif
515 assert(idx >= s->nb_globals && idx < s->nb_temps);
516 ts = &s->temps[idx];
517 assert(ts->temp_allocated != 0);
518 ts->temp_allocated = 0;
519 k = ts->base_type;
520 if (ts->temp_local)
521 k += TCG_TYPE_COUNT;
522 ts->next_free_temp = s->first_free_temp[k];
523 s->first_free_temp[k] = idx;
526 void tcg_temp_free_i32(TCGv_i32 arg)
528 tcg_temp_free_internal(GET_TCGV_I32(arg));
531 void tcg_temp_free_i64(TCGv_i64 arg)
533 tcg_temp_free_internal(GET_TCGV_I64(arg));
536 TCGv_i32 tcg_const_i32(int32_t val)
538 TCGv_i32 t0;
539 t0 = tcg_temp_new_i32();
540 tcg_gen_movi_i32(t0, val);
541 return t0;
544 TCGv_i64 tcg_const_i64(int64_t val)
546 TCGv_i64 t0;
547 t0 = tcg_temp_new_i64();
548 tcg_gen_movi_i64(t0, val);
549 return t0;
552 TCGv_i32 tcg_const_local_i32(int32_t val)
554 TCGv_i32 t0;
555 t0 = tcg_temp_local_new_i32();
556 tcg_gen_movi_i32(t0, val);
557 return t0;
560 TCGv_i64 tcg_const_local_i64(int64_t val)
562 TCGv_i64 t0;
563 t0 = tcg_temp_local_new_i64();
564 tcg_gen_movi_i64(t0, val);
565 return t0;
568 #if defined(CONFIG_DEBUG_TCG)
569 void tcg_clear_temp_count(void)
571 TCGContext *s = &tcg_ctx;
572 s->temps_in_use = 0;
575 int tcg_check_temp_count(void)
577 TCGContext *s = &tcg_ctx;
578 if (s->temps_in_use) {
579 /* Clear the count so that we don't give another
580 * warning immediately next time around.
582 s->temps_in_use = 0;
583 return 1;
585 return 0;
587 #endif
589 void tcg_register_helper(void *func, const char *name)
591 TCGContext *s = &tcg_ctx;
592 int n;
593 if ((s->nb_helpers + 1) > s->allocated_helpers) {
594 n = s->allocated_helpers;
595 if (n == 0) {
596 n = 4;
597 } else {
598 n *= 2;
600 s->helpers = realloc(s->helpers, n * sizeof(TCGHelperInfo));
601 s->allocated_helpers = n;
603 s->helpers[s->nb_helpers].func = (tcg_target_ulong)func;
604 s->helpers[s->nb_helpers].name = name;
605 s->nb_helpers++;
/* Emit an INDEX_op_call op into the opcode stream (gen_opc_ptr) and its
   parameters into the parameter stream (gen_opparam_ptr).

   s:        unused in the visible body.
   func:     temp holding the function to call.
   flags:    call flags, stored verbatim as a parameter.
   sizemask: bit 0 is tested for a 64-bit return value (hosts narrower
             than 64 bits only); for argument i, bit (i+1)*2 is tested
             for "is 64-bit" and bit (i+1)*2+1 for "is signed".
   ret:      return temp, or TCG_CALL_DUMMY_ARG for none.
   nargs/args: the argument temps; args[] may be overwritten when
             TCG_TARGET_EXTEND_ARGS is in effect.

   Parameter words written, in order: a header word (filled in last),
   the return temp(s), the argument temps, func, flags, and finally the
   total number of words. */
608 /* Note: we convert the 64 bit args to 32 bit and do some alignment
609 and endian swap. Maybe it would be better to do the alignment
610 and endian swap in tcg_reg_alloc_call(). */
611 void tcg_gen_callN(TCGContext *s, TCGv_ptr func, unsigned int flags,
612 int sizemask, TCGArg ret, int nargs, TCGArg *args)
614 int i;
615 int real_args;
616 int nb_rets;
617 TCGArg *nparam;
/* On 64-bit hosts that define TCG_TARGET_EXTEND_ARGS, replace every
   argument not marked 64-bit with a fresh 64-bit temp holding its sign-
   or zero-extension. */
619 #if defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64
620 for (i = 0; i < nargs; ++i) {
621 int is_64bit = sizemask & (1 << (i+1)*2);
622 int is_signed = sizemask & (2 << (i+1)*2);
623 if (!is_64bit) {
624 TCGv_i64 temp = tcg_temp_new_i64();
625 TCGv_i64 orig = MAKE_TCGV_I64(args[i]);
626 if (is_signed) {
627 tcg_gen_ext32s_i64(temp, orig);
628 } else {
629 tcg_gen_ext32u_i64(temp, orig);
631 args[i] = GET_TCGV_I64(temp);
634 #endif /* TCG_TARGET_EXTEND_ARGS */
/* Reserve the header word; it is filled in once the counts are known. */
636 *gen_opc_ptr++ = INDEX_op_call;
637 nparam = gen_opparam_ptr++;
638 if (ret != TCG_CALL_DUMMY_ARG) {
639 #if TCG_TARGET_REG_BITS < 64
/* 64-bit return value on a narrower host: emit ret and ret + 1, in the
   order selected by TCG_TARGET_WORDS_BIGENDIAN. */
640 if (sizemask & 1) {
641 #ifdef TCG_TARGET_WORDS_BIGENDIAN
642 *gen_opparam_ptr++ = ret + 1;
643 *gen_opparam_ptr++ = ret;
644 #else
645 *gen_opparam_ptr++ = ret;
646 *gen_opparam_ptr++ = ret + 1;
647 #endif
648 nb_rets = 2;
649 } else
650 #endif
652 *gen_opparam_ptr++ = ret;
653 nb_rets = 1;
655 } else {
656 nb_rets = 0;
/* real_args counts the parameter words emitted for arguments, including
   any TCG_CALL_DUMMY_ARG padding. */
658 real_args = 0;
659 for (i = 0; i < nargs; i++) {
660 #if TCG_TARGET_REG_BITS < 64
661 int is_64bit = sizemask & (1 << (i+1)*2);
662 if (is_64bit) {
663 #ifdef TCG_TARGET_CALL_ALIGN_ARGS
664 /* some targets want aligned 64 bit args */
665 if (real_args & 1) {
666 *gen_opparam_ptr++ = TCG_CALL_DUMMY_ARG;
667 real_args++;
669 #endif
670 /* If stack grows up, then we will be placing successive
671 arguments at lower addresses, which means we need to
672 reverse the order compared to how we would normally
673 treat either big or little-endian. For those arguments
674 that will wind up in registers, this still works for
675 HPPA (the only current STACK_GROWSUP target) since the
676 argument registers are *also* allocated in decreasing
677 order. If another such target is added, this logic may
678 have to get more complicated to differentiate between
679 stack arguments and register arguments. */
680 #if defined(TCG_TARGET_WORDS_BIGENDIAN) != defined(TCG_TARGET_STACK_GROWSUP)
681 *gen_opparam_ptr++ = args[i] + 1;
682 *gen_opparam_ptr++ = args[i];
683 #else
684 *gen_opparam_ptr++ = args[i];
685 *gen_opparam_ptr++ = args[i] + 1;
686 #endif
687 real_args += 2;
688 continue;
690 #endif /* TCG_TARGET_REG_BITS < 64 */
692 *gen_opparam_ptr++ = args[i];
693 real_args++;
695 *gen_opparam_ptr++ = GET_TCGV_PTR(func);
697 *gen_opparam_ptr++ = flags;
/* Header: output count in the upper 16 bits; input count in the low
   bits, where the "+ 1" accounts for the func word emitted above. */
699 *nparam = (nb_rets << 16) | (real_args + 1);
701 /* total parameters, needed to go backward in the instruction stream */
/* 1 header word + returns + arguments + 3 (func, flags, this word). */
702 *gen_opparam_ptr++ = 1 + nb_rets + real_args + 3;
/* Free the extension temps that the first loop stored into args[]. */
704 #if defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64
705 for (i = 0; i < nargs; ++i) {
706 int is_64bit = sizemask & (1 << (i+1)*2);
707 if (!is_64bit) {
708 TCGv_i64 temp = MAKE_TCGV_I64(args[i]);
709 tcg_temp_free_i64(temp);
712 #endif /* TCG_TARGET_EXTEND_ARGS */
715 #if TCG_TARGET_REG_BITS == 32
716 void tcg_gen_shifti_i64(TCGv_i64 ret, TCGv_i64 arg1,
717 int c, int right, int arith)
719 if (c == 0) {
720 tcg_gen_mov_i32(TCGV_LOW(ret), TCGV_LOW(arg1));
721 tcg_gen_mov_i32(TCGV_HIGH(ret), TCGV_HIGH(arg1));
722 } else if (c >= 32) {
723 c -= 32;
724 if (right) {
725 if (arith) {
726 tcg_gen_sari_i32(TCGV_LOW(ret), TCGV_HIGH(arg1), c);
727 tcg_gen_sari_i32(TCGV_HIGH(ret), TCGV_HIGH(arg1), 31);
728 } else {
729 tcg_gen_shri_i32(TCGV_LOW(ret), TCGV_HIGH(arg1), c);
730 tcg_gen_movi_i32(TCGV_HIGH(ret), 0);
732 } else {
733 tcg_gen_shli_i32(TCGV_HIGH(ret), TCGV_LOW(arg1), c);
734 tcg_gen_movi_i32(TCGV_LOW(ret), 0);
736 } else {
737 TCGv_i32 t0, t1;
739 t0 = tcg_temp_new_i32();
740 t1 = tcg_temp_new_i32();
741 if (right) {
742 tcg_gen_shli_i32(t0, TCGV_HIGH(arg1), 32 - c);
743 if (arith)
744 tcg_gen_sari_i32(t1, TCGV_HIGH(arg1), c);
745 else
746 tcg_gen_shri_i32(t1, TCGV_HIGH(arg1), c);
747 tcg_gen_shri_i32(TCGV_LOW(ret), TCGV_LOW(arg1), c);
748 tcg_gen_or_i32(TCGV_LOW(ret), TCGV_LOW(ret), t0);
749 tcg_gen_mov_i32(TCGV_HIGH(ret), t1);
750 } else {
751 tcg_gen_shri_i32(t0, TCGV_LOW(arg1), 32 - c);
752 /* Note: ret can be the same as arg1, so we use t1 */
753 tcg_gen_shli_i32(t1, TCGV_LOW(arg1), c);
754 tcg_gen_shli_i32(TCGV_HIGH(ret), TCGV_HIGH(arg1), c);
755 tcg_gen_or_i32(TCGV_HIGH(ret), TCGV_HIGH(ret), t0);
756 tcg_gen_mov_i32(TCGV_LOW(ret), t1);
758 tcg_temp_free_i32(t0);
759 tcg_temp_free_i32(t1);
762 #endif
765 static void tcg_reg_alloc_start(TCGContext *s)
767 int i;
768 TCGTemp *ts;
769 for(i = 0; i < s->nb_globals; i++) {
770 ts = &s->temps[i];
771 if (ts->fixed_reg) {
772 ts->val_type = TEMP_VAL_REG;
773 } else {
774 ts->val_type = TEMP_VAL_MEM;
777 for(i = s->nb_globals; i < s->nb_temps; i++) {
778 ts = &s->temps[i];
779 ts->val_type = TEMP_VAL_DEAD;
780 ts->mem_allocated = 0;
781 ts->fixed_reg = 0;
783 for(i = 0; i < TCG_TARGET_NB_REGS; i++) {
784 s->reg_to_temp[i] = -1;
788 static char *tcg_get_arg_str_idx(TCGContext *s, char *buf, int buf_size,
789 int idx)
791 TCGTemp *ts;
793 assert(idx >= 0 && idx < s->nb_temps);
794 ts = &s->temps[idx];
795 assert(ts);
796 if (idx < s->nb_globals) {
797 pstrcpy(buf, buf_size, ts->name);
798 } else {
799 if (ts->temp_local)
800 snprintf(buf, buf_size, "loc%d", idx - s->nb_globals);
801 else
802 snprintf(buf, buf_size, "tmp%d", idx - s->nb_globals);
804 return buf;
807 char *tcg_get_arg_str_i32(TCGContext *s, char *buf, int buf_size, TCGv_i32 arg)
809 return tcg_get_arg_str_idx(s, buf, buf_size, GET_TCGV_I32(arg));
812 char *tcg_get_arg_str_i64(TCGContext *s, char *buf, int buf_size, TCGv_i64 arg)
814 return tcg_get_arg_str_idx(s, buf, buf_size, GET_TCGV_I64(arg));
817 static int helper_cmp(const void *p1, const void *p2)
819 const TCGHelperInfo *th1 = p1;
820 const TCGHelperInfo *th2 = p2;
821 if (th1->func < th2->func)
822 return -1;
823 else if (th1->func == th2->func)
824 return 0;
825 else
826 return 1;
829 /* find helper definition (Note: A hash table would be better) */
830 static TCGHelperInfo *tcg_find_helper(TCGContext *s, tcg_target_ulong val)
832 int m, m_min, m_max;
833 TCGHelperInfo *th;
834 tcg_target_ulong v;
836 if (unlikely(!s->helpers_sorted)) {
837 qsort(s->helpers, s->nb_helpers, sizeof(TCGHelperInfo),
838 helper_cmp);
839 s->helpers_sorted = 1;
842 /* binary search */
843 m_min = 0;
844 m_max = s->nb_helpers - 1;
845 while (m_min <= m_max) {
846 m = (m_min + m_max) >> 1;
847 th = &s->helpers[m];
848 v = th->func;
849 if (v == val)
850 return th;
851 else if (val < v) {
852 m_max = m - 1;
853 } else {
854 m_min = m + 1;
857 return NULL;
/* Printable names of the TCG_COND_* condition codes, indexed by the
   condition value.  Entries not listed here are NULL; tcg_dump_ops()
   checks both the index range and for NULL before using a name. */
860 static const char * const cond_name[] =
862 [TCG_COND_NEVER] = "never",
863 [TCG_COND_ALWAYS] = "always",
864 [TCG_COND_EQ] = "eq",
865 [TCG_COND_NE] = "ne",
866 [TCG_COND_LT] = "lt",
867 [TCG_COND_GE] = "ge",
868 [TCG_COND_LE] = "le",
869 [TCG_COND_GT] = "gt",
870 [TCG_COND_LTU] = "ltu",
871 [TCG_COND_GEU] = "geu",
872 [TCG_COND_LEU] = "leu",
873 [TCG_COND_GTU] = "gtu"
/* Write a textual listing of the generated ops to the QEMU log.

   Walks the opcode buffer from gen_opc_buf up to gen_opc_ptr, with a
   parallel cursor into gen_opparam_buf, and prints one line per op via
   qemu_log().  Temps are named with tcg_get_arg_str_idx(); constant
   arguments are printed as "$0x..." hex values. */
876 void tcg_dump_ops(TCGContext *s)
878 const uint16_t *opc_ptr;
879 const TCGArg *args;
880 TCGArg arg;
881 TCGOpcode c;
882 int i, k, nb_oargs, nb_iargs, nb_cargs, first_insn;
883 const TCGOpDef *def;
884 char buf[128];
886 first_insn = 1;
887 opc_ptr = gen_opc_buf;
888 args = gen_opparam_buf;
889 while (opc_ptr < gen_opc_ptr) {
890 c = *opc_ptr++;
891 def = &tcg_op_defs[c];
/* debug_insn_start: print a " ---- 0x<pc>" marker, preceded by a newline
   for every marker but the first.  The pc is assembled from two
   parameter words when TARGET_LONG_BITS exceeds TCG_TARGET_REG_BITS. */
892 if (c == INDEX_op_debug_insn_start) {
893 uint64_t pc;
894 #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS
895 pc = ((uint64_t)args[1] << 32) | args[0];
896 #else
897 pc = args[0];
898 #endif
899 if (!first_insn) {
900 qemu_log("\n");
902 qemu_log(" ---- 0x%" PRIx64, pc);
903 first_insn = 0;
904 nb_oargs = def->nb_oargs;
905 nb_iargs = def->nb_iargs;
906 nb_cargs = def->nb_cargs;
/* call: the first parameter word carries the output count in its upper
   16 bits and the input count in its low 16 bits.  The last input is
   printed first as the function; the word after the inputs is printed
   as the flags. */
907 } else if (c == INDEX_op_call) {
908 TCGArg arg;
910 /* variable number of arguments */
911 arg = *args++;
912 nb_oargs = arg >> 16;
913 nb_iargs = arg & 0xffff;
914 nb_cargs = def->nb_cargs;
916 qemu_log(" %s ", def->name);
918 /* function name */
919 qemu_log("%s",
920 tcg_get_arg_str_idx(s, buf, sizeof(buf),
921 args[nb_oargs + nb_iargs - 1]));
922 /* flags */
923 qemu_log(",$0x%" TCG_PRIlx, args[nb_oargs + nb_iargs]);
924 /* nb out args */
925 qemu_log(",$%d", nb_oargs);
926 for(i = 0; i < nb_oargs; i++) {
927 qemu_log(",");
928 qemu_log("%s", tcg_get_arg_str_idx(s, buf, sizeof(buf),
929 args[i]));
/* Inputs other than the function itself; padding slots are shown as
   "<dummy>". */
931 for(i = 0; i < (nb_iargs - 1); i++) {
932 qemu_log(",");
933 if (args[nb_oargs + i] == TCG_CALL_DUMMY_ARG) {
934 qemu_log("<dummy>");
935 } else {
936 qemu_log("%s", tcg_get_arg_str_idx(s, buf, sizeof(buf),
937 args[nb_oargs + i]));
/* movi: if the constant equals the address of a registered helper,
   print the helper's name instead of the number. */
940 } else if (c == INDEX_op_movi_i32 || c == INDEX_op_movi_i64) {
941 tcg_target_ulong val;
942 TCGHelperInfo *th;
944 nb_oargs = def->nb_oargs;
945 nb_iargs = def->nb_iargs;
946 nb_cargs = def->nb_cargs;
947 qemu_log(" %s %s,$", def->name,
948 tcg_get_arg_str_idx(s, buf, sizeof(buf), args[0]));
949 val = args[1];
950 th = tcg_find_helper(s, val);
951 if (th) {
952 qemu_log("%s", th->name);
953 } else {
954 if (c == INDEX_op_movi_i32) {
955 qemu_log("0x%x", (uint32_t)val);
956 } else {
957 qemu_log("0x%" PRIx64 , (uint64_t)val);
/* Every other op: outputs, then inputs, then constant arguments, comma
   separated; k indexes the next parameter word to print. */
960 } else {
961 qemu_log(" %s ", def->name);
962 if (c == INDEX_op_nopn) {
963 /* variable number of arguments */
964 nb_cargs = *args;
965 nb_oargs = 0;
966 nb_iargs = 0;
967 } else {
968 nb_oargs = def->nb_oargs;
969 nb_iargs = def->nb_iargs;
970 nb_cargs = def->nb_cargs;
973 k = 0;
974 for(i = 0; i < nb_oargs; i++) {
975 if (k != 0) {
976 qemu_log(",");
978 qemu_log("%s", tcg_get_arg_str_idx(s, buf, sizeof(buf),
979 args[k++]));
981 for(i = 0; i < nb_iargs; i++) {
982 if (k != 0) {
983 qemu_log(",");
985 qemu_log("%s", tcg_get_arg_str_idx(s, buf, sizeof(buf),
986 args[k++]));
/* For the conditional ops the first constant argument is a condition
   code: print its name from cond_name when known, else fall back to
   hex.  i = 1 then makes the loop below skip that argument. */
988 switch (c) {
989 case INDEX_op_brcond_i32:
990 case INDEX_op_setcond_i32:
991 case INDEX_op_movcond_i32:
992 case INDEX_op_brcond2_i32:
993 case INDEX_op_setcond2_i32:
994 case INDEX_op_brcond_i64:
995 case INDEX_op_setcond_i64:
996 case INDEX_op_movcond_i64:
997 if (args[k] < ARRAY_SIZE(cond_name) && cond_name[args[k]]) {
998 qemu_log(",%s", cond_name[args[k++]]);
999 } else {
1000 qemu_log(",$0x%" TCG_PRIlx, args[k++]);
1002 i = 1;
1003 break;
1004 default:
1005 i = 0;
1006 break;
1008 for(; i < nb_cargs; i++) {
1009 if (k != 0) {
1010 qemu_log(",");
1012 arg = args[k++];
1013 qemu_log("$0x%" TCG_PRIlx, arg);
/* End of this op's line; advance the parameter cursor past its words. */
1016 qemu_log("\n");
1017 args += nb_iargs + nb_oargs + nb_cargs;
1021 /* we give more priority to constraints with fewer registers */
1022 static int get_constraint_priority(const TCGOpDef *def, int k)
1024 const TCGArgConstraint *arg_ct;
1026 int i, n;
1027 arg_ct = &def->args_ct[k];
1028 if (arg_ct->ct & TCG_CT_ALIAS) {
1029 /* an alias is equivalent to a single register */
1030 n = 1;
1031 } else {
1032 if (!(arg_ct->ct & TCG_CT_REG))
1033 return 0;
1034 n = 0;
1035 for(i = 0; i < TCG_TARGET_NB_REGS; i++) {
1036 if (tcg_regset_test_reg(arg_ct->u.regs, i))
1037 n++;
1040 return TCG_TARGET_NB_REGS - n + 1;
1043 /* sort from highest priority to lowest */
1044 static void sort_constraints(TCGOpDef *def, int start, int n)
1046 int i, j, p1, p2, tmp;
1048 for(i = 0; i < n; i++)
1049 def->sorted_args[start + i] = start + i;
1050 if (n <= 1)
1051 return;
1052 for(i = 0; i < n - 1; i++) {
1053 for(j = i + 1; j < n; j++) {
1054 p1 = get_constraint_priority(def, def->sorted_args[start + i]);
1055 p2 = get_constraint_priority(def, def->sorted_args[start + j]);
1056 if (p1 < p2) {
1057 tmp = def->sorted_args[start + i];
1058 def->sorted_args[start + i] = def->sorted_args[start + j];
1059 def->sorted_args[start + j] = tmp;
/* Install the target's argument constraints into tcg_op_defs.

   'tdefs' is an array of entries terminated by one whose op is
   (TCGOpcode)-1.  For each entry, the constraint string of every input
   and output argument is parsed into def->args_ct[], and the output and
   input arguments are then sorted by constraint priority.

   A constraint string starting with a digit makes the argument an alias
   of that output argument.  Otherwise 'i' adds TCG_CT_CONST and every
   other character is handed to target_parse_constraint(); an invalid
   constraint prints a message and exits.

   With CONFIG_DEBUG_TCG the table is cross-checked afterwards and the
   function aborts on a missing or unexpected definition. */
1065 void tcg_add_target_add_op_defs(const TCGTargetOpDef *tdefs)
1067 TCGOpcode op;
1068 TCGOpDef *def;
1069 const char *ct_str;
1070 int i, nb_args;
1072 for(;;) {
1073 if (tdefs->op == (TCGOpcode)-1)
1074 break;
1075 op = tdefs->op;
1076 assert((unsigned)op < NB_OPS);
1077 def = &tcg_op_defs[op];
1078 #if defined(CONFIG_DEBUG_TCG)
1079 /* Duplicate entry in op definitions? */
1080 assert(!def->used);
1081 def->used = 1;
1082 #endif
1083 nb_args = def->nb_iargs + def->nb_oargs;
1084 for(i = 0; i < nb_args; i++) {
1085 ct_str = tdefs->args_ct_str[i];
1086 /* Incomplete TCGTargetOpDef entry? */
1087 assert(ct_str != NULL);
1088 tcg_regset_clear(def->args_ct[i].u.regs);
1089 def->args_ct[i].ct = 0;
/* Leading digit: this argument must share a register with output
   argument 'oarg'.  It inherits that output's constraint, and the two
   are cross-linked through alias_index. */
1090 if (ct_str[0] >= '0' && ct_str[0] <= '9') {
1091 int oarg;
1092 oarg = ct_str[0] - '0';
1093 assert(oarg < def->nb_oargs);
1094 assert(def->args_ct[oarg].ct & TCG_CT_REG);
1095 /* TCG_CT_ALIAS is for the output arguments. The input
1096 argument is tagged with TCG_CT_IALIAS. */
1097 def->args_ct[i] = def->args_ct[oarg];
1098 def->args_ct[oarg].ct = TCG_CT_ALIAS;
1099 def->args_ct[oarg].alias_index = i;
1100 def->args_ct[i].ct |= TCG_CT_IALIAS;
1101 def->args_ct[i].alias_index = oarg;
1102 } else {
/* Consume the constraint string until its terminating NUL. */
1103 for(;;) {
1104 if (*ct_str == '\0')
1105 break;
1106 switch(*ct_str) {
1107 case 'i':
1108 def->args_ct[i].ct |= TCG_CT_CONST;
1109 ct_str++;
1110 break;
1111 default:
1112 if (target_parse_constraint(&def->args_ct[i], &ct_str) < 0) {
1113 fprintf(stderr, "Invalid constraint '%s' for arg %d of operation '%s'\n",
1114 ct_str, i, def->name);
1115 exit(1);
1122 /* TCGTargetOpDef entry with too much information? */
1123 assert(i == TCG_MAX_OP_ARGS || tdefs->args_ct_str[i] == NULL);
1125 /* sort the constraints (XXX: this is just a heuristic) */
1126 sort_constraints(def, 0, def->nb_oargs);
1127 sort_constraints(def, def->nb_oargs, def->nb_iargs);
1129 #if 0
1131 int i;
1133 printf("%s: sorted=", def->name);
1134 for(i = 0; i < def->nb_oargs + def->nb_iargs; i++)
1135 printf(" %d", def->sorted_args[i]);
1136 printf("\n");
1138 #endif
1139 tdefs++;
/* Debug cross-check; 'i' is reused as an error flag.  Ops before
   INDEX_op_call, debug_insn_start and ops flagged TCG_OPF_NOT_PRESENT
   must not have been given a definition; every other op must have. */
1142 #if defined(CONFIG_DEBUG_TCG)
1143 i = 0;
1144 for (op = 0; op < ARRAY_SIZE(tcg_op_defs); op++) {
1145 const TCGOpDef *def = &tcg_op_defs[op];
1146 if (op < INDEX_op_call
1147 || op == INDEX_op_debug_insn_start
1148 || (def->flags & TCG_OPF_NOT_PRESENT)) {
1149 /* Wrong entry in op definitions? */
1150 if (def->used) {
1151 fprintf(stderr, "Invalid op definition for %s\n", def->name);
1152 i = 1;
1154 } else {
1155 /* Missing entry in op definitions? */
1156 if (!def->used) {
1157 fprintf(stderr, "Missing op definition for %s\n", def->name);
1158 i = 1;
1162 if (i == 1) {
1163 tcg_abort();
1165 #endif
1168 #ifdef USE_LIVENESS_ANALYSIS
1170 /* set a nop for an operation using 'nb_args' */
1171 static inline void tcg_set_nop(TCGContext *s, uint16_t *opc_ptr,
1172 TCGArg *args, int nb_args)
1174 if (nb_args == 0) {
1175 *opc_ptr = INDEX_op_nop;
1176 } else {
1177 *opc_ptr = INDEX_op_nopn;
1178 args[0] = nb_args;
1179 args[nb_args - 1] = nb_args;
1183 /* liveness analysis: end of function: globals are live, temps are
1184 dead. */
1185 /* XXX: at this stage, not used as there would be little gains because
1186 most TBs end with a conditional jump. */
1187 static inline void tcg_la_func_end(TCGContext *s, uint8_t *dead_temps)
1189 memset(dead_temps, 0, s->nb_globals);
1190 memset(dead_temps + s->nb_globals, 1, s->nb_temps - s->nb_globals);
1193 /* liveness analysis: end of basic block: globals are live, temps are
1194 dead, local temps are live. */
1195 static inline void tcg_la_bb_end(TCGContext *s, uint8_t *dead_temps)
1197 int i;
1198 TCGTemp *ts;
1200 memset(dead_temps, 0, s->nb_globals);
1201 ts = &s->temps[s->nb_globals];
1202 for(i = s->nb_globals; i < s->nb_temps; i++) {
1203 if (ts->temp_local)
1204 dead_temps[i] = 0;
1205 else
1206 dead_temps[i] = 1;
1207 ts++;
/* Overview: the opcode stream is scanned from the last op back to the
   first while 'dead_temps' tracks, per temp, whether its value is unused
   by any later op.  For each op kept, a bitmask of dead arguments is
   stored in s->op_dead_args[op_index]; ops whose outputs are all dead
   (and that are allowed to be dropped) are replaced through tcg_set_nop.
   NOTE(review): the table is allocated with sizeof(uint16_t) per op while
   'dead_args' is an unsigned int built from 1 << i -- presumably entries
   are 16 bits wide, so argument indexes >= 16 would not fit; confirm
   against the op_dead_args declaration. */
1211 /* Liveness analysis : update the opc_dead_args array to tell if a
1212 given input arguments is dead. Instructions updating dead
1213 temporaries are removed. */
1214 static void tcg_liveness_analysis(TCGContext *s)
1216 int i, op_index, nb_args, nb_iargs, nb_oargs, arg, nb_ops;
1217 TCGOpcode op;
1218 TCGArg *args;
1219 const TCGOpDef *def;
1220 uint8_t *dead_temps;
1221 unsigned int dead_args;
1223 gen_opc_ptr++; /* skip end */
1225 nb_ops = gen_opc_ptr - gen_opc_buf;
1227 s->op_dead_args = tcg_malloc(nb_ops * sizeof(uint16_t));
/* every temp starts out dead (nonzero entry == dead) */
1229 dead_temps = tcg_malloc(s->nb_temps);
1230 memset(dead_temps, 1, s->nb_temps);
/* 'args' starts at the end of the parameter stream and is moved
   backwards by each op's argument count */
1232 args = gen_opparam_ptr;
1233 op_index = nb_ops - 1;
1234 while (op_index >= 0) {
1235 op = gen_opc_buf[op_index];
1236 def = &tcg_op_defs[op];
1237 switch(op) {
1238 case INDEX_op_call:
1240 int call_flags;
/* the word just before 'args' holds the call's total argument-word
   count; after stepping back, args[0] packs nb_oargs (high 16 bits)
   and nb_iargs (low 16 bits), and the flags word follows the
   output and input arguments */
1242 nb_args = args[-1];
1243 args -= nb_args;
1244 nb_iargs = args[0] & 0xffff;
1245 nb_oargs = args[0] >> 16;
1246 args++;
1247 call_flags = args[nb_oargs + nb_iargs];
1249 /* pure functions can be removed if their result is not
1250 used */
1251 if (call_flags & TCG_CALL_PURE) {
1252 for(i = 0; i < nb_oargs; i++) {
1253 arg = args[i];
1254 if (!dead_temps[arg])
1255 goto do_not_remove_call;
1257 tcg_set_nop(s, gen_opc_buf + op_index,
1258 args - 1, nb_args);
1259 } else {
1260 do_not_remove_call:
1262 /* output args are dead */
1263 dead_args = 0;
1264 for(i = 0; i < nb_oargs; i++) {
1265 arg = args[i];
1266 if (dead_temps[arg]) {
1267 dead_args |= (1 << i);
1269 dead_temps[arg] = 1;
1272 if (!(call_flags & TCG_CALL_CONST)) {
1273 /* globals are live (they may be used by the call) */
1274 memset(dead_temps, 0, s->nb_globals);
1277 /* input args are live */
1278 for(i = nb_oargs; i < nb_iargs + nb_oargs; i++) {
1279 arg = args[i];
1280 if (arg != TCG_CALL_DUMMY_ARG) {
1281 if (dead_temps[arg]) {
1282 dead_args |= (1 << i);
1284 dead_temps[arg] = 0;
/* bit i is set when args[i] was found dead at this op */
1287 s->op_dead_args[op_index] = dead_args;
1289 args--;
1291 break;
1292 case INDEX_op_debug_insn_start:
1293 args -= def->nb_args;
1294 break;
1295 case INDEX_op_nopn:
1296 nb_args = args[-1];
1297 args -= nb_args;
1298 break;
1299 case INDEX_op_discard:
1300 args--;
1301 /* mark the temporary as dead */
1302 dead_temps[args[0]] = 1;
1303 break;
1304 case INDEX_op_end:
1305 break;
1306 /* XXX: optimize by hardcoding common cases (e.g. triadic ops) */
1307 default:
1308 args -= def->nb_args;
1309 nb_iargs = def->nb_iargs;
1310 nb_oargs = def->nb_oargs;
1312 /* Test if the operation can be removed because all
1313 its outputs are dead. We assume that nb_oargs == 0
1314 implies side effects */
1315 if (!(def->flags & TCG_OPF_SIDE_EFFECTS) && nb_oargs != 0) {
1316 for(i = 0; i < nb_oargs; i++) {
1317 arg = args[i];
1318 if (!dead_temps[arg])
1319 goto do_not_remove;
1321 tcg_set_nop(s, gen_opc_buf + op_index, args, def->nb_args);
1322 #ifdef CONFIG_PROFILER
1323 s->del_op_count++;
1324 #endif
1325 } else {
1326 do_not_remove:
1328 /* output args are dead */
1329 dead_args = 0;
1330 for(i = 0; i < nb_oargs; i++) {
1331 arg = args[i];
1332 if (dead_temps[arg]) {
1333 dead_args |= (1 << i);
1335 dead_temps[arg] = 1;
1338 /* if end of basic block, update */
1339 if (def->flags & TCG_OPF_BB_END) {
1340 tcg_la_bb_end(s, dead_temps);
1341 } else if (def->flags & TCG_OPF_CALL_CLOBBER) {
1342 /* globals are live */
1343 memset(dead_temps, 0, s->nb_globals);
1346 /* input args are live */
1347 for(i = nb_oargs; i < nb_oargs + nb_iargs; i++) {
1348 arg = args[i];
1349 if (dead_temps[arg]) {
1350 dead_args |= (1 << i);
1352 dead_temps[arg] = 0;
1354 s->op_dead_args[op_index] = dead_args;
1356 break;
1358 op_index--;
/* consistency check: once every op has been visited, 'args' must be
   back at the start of the parameter buffer */
1361 if (args != gen_opparam_buf)
1362 tcg_abort();
1364 #else
1365 /* dummy liveness analysis */
1366 static void tcg_liveness_analysis(TCGContext *s)
1368 int nb_ops;
1369 nb_ops = gen_opc_ptr - gen_opc_buf;
1371 s->op_dead_args = tcg_malloc(nb_ops * sizeof(uint16_t));
1372 memset(s->op_dead_args, 0, nb_ops * sizeof(uint16_t));
1374 #endif
1376 #ifndef NDEBUG
1377 static void dump_regs(TCGContext *s)
1379 TCGTemp *ts;
1380 int i;
1381 char buf[64];
1383 for(i = 0; i < s->nb_temps; i++) {
1384 ts = &s->temps[i];
1385 printf(" %10s: ", tcg_get_arg_str_idx(s, buf, sizeof(buf), i));
1386 switch(ts->val_type) {
1387 case TEMP_VAL_REG:
1388 printf("%s", tcg_target_reg_names[ts->reg]);
1389 break;
1390 case TEMP_VAL_MEM:
1391 printf("%d(%s)", (int)ts->mem_offset, tcg_target_reg_names[ts->mem_reg]);
1392 break;
1393 case TEMP_VAL_CONST:
1394 printf("$0x%" TCG_PRIlx, ts->val);
1395 break;
1396 case TEMP_VAL_DEAD:
1397 printf("D");
1398 break;
1399 default:
1400 printf("???");
1401 break;
1403 printf("\n");
1406 for(i = 0; i < TCG_TARGET_NB_REGS; i++) {
1407 if (s->reg_to_temp[i] >= 0) {
1408 printf("%s: %s\n",
1409 tcg_target_reg_names[i],
1410 tcg_get_arg_str_idx(s, buf, sizeof(buf), s->reg_to_temp[i]));
/* Debug consistency check between s->reg_to_temp[] and the temp table.
   First pass: every register mapped to a temp must refer to a temp that
   is in TEMP_VAL_REG state and names that same register.  Second pass:
   every non-fixed temp in TEMP_VAL_REG state must be the temp recorded
   for its register.  On any mismatch a message and the register state
   are printed and tcg_abort() is called. */
1415 static void check_regs(TCGContext *s)
1417 int reg, k;
1418 TCGTemp *ts;
1419 char buf[64];
1421 for(reg = 0; reg < TCG_TARGET_NB_REGS; reg++) {
1422 k = s->reg_to_temp[reg];
1423 if (k >= 0) {
1424 ts = &s->temps[k];
1425 if (ts->val_type != TEMP_VAL_REG ||
1426 ts->reg != reg) {
1427 printf("Inconsistency for register %s:\n",
1428 tcg_target_reg_names[reg]);
1429 goto fail;
1433 for(k = 0; k < s->nb_temps; k++) {
1434 ts = &s->temps[k];
1435 if (ts->val_type == TEMP_VAL_REG &&
1436 !ts->fixed_reg &&
1437 s->reg_to_temp[ts->reg] != k) {
1438 printf("Inconsistency for temp %s:\n",
1439 tcg_get_arg_str_idx(s, buf, sizeof(buf), k));
/* shared failure tail; also the target of the goto in the first loop */
1440 fail:
1441 printf("reg state:\n");
1442 dump_regs(s);
1443 tcg_abort();
1447 #endif
1449 static void temp_allocate_frame(TCGContext *s, int temp)
1451 TCGTemp *ts;
1452 ts = &s->temps[temp];
1453 #if !(defined(__sparc__) && TCG_TARGET_REG_BITS == 64)
1454 /* Sparc64 stack is accessed with offset of 2047 */
1455 s->current_frame_offset = (s->current_frame_offset +
1456 (tcg_target_long)sizeof(tcg_target_long) - 1) &
1457 ~(sizeof(tcg_target_long) - 1);
1458 #endif
1459 if (s->current_frame_offset + (tcg_target_long)sizeof(tcg_target_long) >
1460 s->frame_end) {
1461 tcg_abort();
1463 ts->mem_offset = s->current_frame_offset;
1464 ts->mem_reg = s->frame_reg;
1465 ts->mem_allocated = 1;
1466 s->current_frame_offset += (tcg_target_long)sizeof(tcg_target_long);
1469 /* free register 'reg' by spilling the corresponding temporary if necessary */
1470 static void tcg_reg_free(TCGContext *s, int reg)
1472 TCGTemp *ts;
1473 int temp;
1475 temp = s->reg_to_temp[reg];
1476 if (temp != -1) {
1477 ts = &s->temps[temp];
1478 assert(ts->val_type == TEMP_VAL_REG);
1479 if (!ts->mem_coherent) {
1480 if (!ts->mem_allocated)
1481 temp_allocate_frame(s, temp);
1482 tcg_out_st(s, ts->type, reg, ts->mem_reg, ts->mem_offset);
1484 ts->val_type = TEMP_VAL_MEM;
1485 s->reg_to_temp[reg] = -1;
1489 /* Allocate a register belonging to reg1 & ~reg2 */
1490 static int tcg_reg_alloc(TCGContext *s, TCGRegSet reg1, TCGRegSet reg2)
1492 int i, reg;
1493 TCGRegSet reg_ct;
1495 tcg_regset_andnot(reg_ct, reg1, reg2);
1497 /* first try free registers */
1498 for(i = 0; i < ARRAY_SIZE(tcg_target_reg_alloc_order); i++) {
1499 reg = tcg_target_reg_alloc_order[i];
1500 if (tcg_regset_test_reg(reg_ct, reg) && s->reg_to_temp[reg] == -1)
1501 return reg;
1504 /* XXX: do better spill choice */
1505 for(i = 0; i < ARRAY_SIZE(tcg_target_reg_alloc_order); i++) {
1506 reg = tcg_target_reg_alloc_order[i];
1507 if (tcg_regset_test_reg(reg_ct, reg)) {
1508 tcg_reg_free(s, reg);
1509 return reg;
1513 tcg_abort();
1516 /* save a temporary to memory. 'allocated_regs' is used in case a
1517 temporary registers needs to be allocated to store a constant. */
1518 static void temp_save(TCGContext *s, int temp, TCGRegSet allocated_regs)
1520 TCGTemp *ts;
1521 int reg;
1523 ts = &s->temps[temp];
1524 if (!ts->fixed_reg) {
1525 switch(ts->val_type) {
1526 case TEMP_VAL_REG:
1527 tcg_reg_free(s, ts->reg);
1528 break;
1529 case TEMP_VAL_DEAD:
1530 ts->val_type = TEMP_VAL_MEM;
1531 break;
1532 case TEMP_VAL_CONST:
1533 reg = tcg_reg_alloc(s, tcg_target_available_regs[ts->type],
1534 allocated_regs);
1535 if (!ts->mem_allocated)
1536 temp_allocate_frame(s, temp);
1537 tcg_out_movi(s, ts->type, reg, ts->val);
1538 tcg_out_st(s, ts->type, reg, ts->mem_reg, ts->mem_offset);
1539 ts->val_type = TEMP_VAL_MEM;
1540 break;
1541 case TEMP_VAL_MEM:
1542 break;
1543 default:
1544 tcg_abort();
1549 /* save globals to their canonical location and assume they can be
1550 modified be the following code. 'allocated_regs' is used in case a
1551 temporary registers needs to be allocated to store a constant. */
1552 static void save_globals(TCGContext *s, TCGRegSet allocated_regs)
1554 int i;
1556 for(i = 0; i < s->nb_globals; i++) {
1557 temp_save(s, i, allocated_regs);
1561 /* at the end of a basic block, we assume all temporaries are dead and
1562 all globals are stored at their canonical location. */
1563 static void tcg_reg_alloc_bb_end(TCGContext *s, TCGRegSet allocated_regs)
1565 TCGTemp *ts;
1566 int i;
1568 for(i = s->nb_globals; i < s->nb_temps; i++) {
1569 ts = &s->temps[i];
1570 if (ts->temp_local) {
1571 temp_save(s, i, allocated_regs);
1572 } else {
1573 if (ts->val_type == TEMP_VAL_REG) {
1574 s->reg_to_temp[ts->reg] = -1;
1576 ts->val_type = TEMP_VAL_DEAD;
1580 save_globals(s, allocated_regs);
/* Evaluates to 1 when bit n of 'dead_args' is set, else 0.  The macro
   refers to an identifier named 'dead_args' that must be in scope where
   it is used. */
1583 #define IS_DEAD_ARG(n) ((dead_args >> (n)) & 1)
1585 static void tcg_reg_alloc_movi(TCGContext *s, const TCGArg *args)
1587 TCGTemp *ots;
1588 tcg_target_ulong val;
1590 ots = &s->temps[args[0]];
1591 val = args[1];
1593 if (ots->fixed_reg) {
1594 /* for fixed registers, we do not do any constant
1595 propagation */
1596 tcg_out_movi(s, ots->type, ots->reg, val);
1597 } else {
1598 /* The movi is not explicitly generated here */
1599 if (ots->val_type == TEMP_VAL_REG)
1600 s->reg_to_temp[ots->reg] = -1;
1601 ots->val_type = TEMP_VAL_CONST;
1602 ots->val = val;
/* Register allocation for a mov op: args[0] is the destination temp
   ('ots'), args[1] the source temp ('ts').  The source may be in a
   register, in memory, or a constant; any other state aborts.  Bit 1 of
   'dead_args' tells whether the source is dead after this op. */
1606 static void tcg_reg_alloc_mov(TCGContext *s, const TCGOpDef *def,
1607 const TCGArg *args,
1608 unsigned int dead_args)
1610 TCGTemp *ts, *ots;
1611 int reg;
1612 const TCGArgConstraint *arg_ct;
1614 ots = &s->temps[args[0]];
1615 ts = &s->temps[args[1]];
1616 arg_ct = &def->args_ct[0];
1618 /* XXX: always mark arg dead if IS_DEAD_ARG(1) */
1619 if (ts->val_type == TEMP_VAL_REG) {
1620 if (IS_DEAD_ARG(1) && !ts->fixed_reg && !ots->fixed_reg) {
1621 /* the mov can be suppressed */
/* the destination takes over the source's register (bound at the end of
   the function) and the source becomes dead */
1622 if (ots->val_type == TEMP_VAL_REG)
1623 s->reg_to_temp[ots->reg] = -1;
1624 reg = ts->reg;
1625 s->reg_to_temp[reg] = -1;
1626 ts->val_type = TEMP_VAL_DEAD;
1627 } else {
1628 if (ots->val_type == TEMP_VAL_REG) {
1629 reg = ots->reg;
1630 } else {
1631 reg = tcg_reg_alloc(s, arg_ct->u.regs, s->reserved_regs);
1633 if (ts->reg != reg) {
1634 tcg_out_mov(s, ots->type, reg, ts->reg);
1637 } else if (ts->val_type == TEMP_VAL_MEM) {
/* source is in memory: load it into the destination's register */
1638 if (ots->val_type == TEMP_VAL_REG) {
1639 reg = ots->reg;
1640 } else {
1641 reg = tcg_reg_alloc(s, arg_ct->u.regs, s->reserved_regs);
1643 tcg_out_ld(s, ts->type, reg, ts->mem_reg, ts->mem_offset);
1644 } else if (ts->val_type == TEMP_VAL_CONST) {
1645 if (ots->fixed_reg) {
1646 reg = ots->reg;
1647 tcg_out_movi(s, ots->type, reg, ts->val);
1648 } else {
1649 /* propagate constant */
1650 if (ots->val_type == TEMP_VAL_REG)
1651 s->reg_to_temp[ots->reg] = -1;
1652 ots->val_type = TEMP_VAL_CONST;
1653 ots->val = ts->val;
1654 return;
1656 } else {
1657 tcg_abort();
/* common tail for every path except constant propagation: bind 'reg' to
   the destination temp and mark its memory copy as not coherent */
1659 s->reg_to_temp[reg] = args[0];
1660 ots->reg = reg;
1661 ots->val_type = TEMP_VAL_REG;
1662 ots->mem_coherent = 0;
/* Generic register allocation for one op.  Steps, in order:
   1. copy the constant arguments into new_args;
   2. bring each input (visited in def->sorted_args order) into a register
      satisfying its constraint, or pass it as a constant when
      tcg_target_const_match() accepts it;
   3. at a basic-block end call tcg_reg_alloc_bb_end(); otherwise free dead
      inputs and, for TCG_OPF_CALL_CLOBBER ops, free the call-clobbered
      registers and save globals;
   4. choose a register for each output;
   5. emit the op with tcg_out_op();
   6. copy results into fixed registers where the output temp is fixed.
   NOTE(review): const_args[] is only written for input argument indexes
   in this function; confirm that backends never read the entries for
   output indexes. */
1665 static void tcg_reg_alloc_op(TCGContext *s,
1666 const TCGOpDef *def, TCGOpcode opc,
1667 const TCGArg *args,
1668 unsigned int dead_args)
1670 TCGRegSet allocated_regs;
1671 int i, k, nb_iargs, nb_oargs, reg;
1672 TCGArg arg;
1673 const TCGArgConstraint *arg_ct;
1674 TCGTemp *ts;
1675 TCGArg new_args[TCG_MAX_OP_ARGS];
1676 int const_args[TCG_MAX_OP_ARGS];
1678 nb_oargs = def->nb_oargs;
1679 nb_iargs = def->nb_iargs;
1681 /* copy constants */
1682 memcpy(new_args + nb_oargs + nb_iargs,
1683 args + nb_oargs + nb_iargs,
1684 sizeof(TCGArg) * def->nb_cargs);
1686 /* satisfy input constraints */
1687 tcg_regset_set(allocated_regs, s->reserved_regs);
1688 for(k = 0; k < nb_iargs; k++) {
1689 i = def->sorted_args[nb_oargs + k];
1690 arg = args[i];
1691 arg_ct = &def->args_ct[i];
1692 ts = &s->temps[arg];
1693 if (ts->val_type == TEMP_VAL_MEM) {
/* load from the temp's memory slot; register and memory now agree */
1694 reg = tcg_reg_alloc(s, arg_ct->u.regs, allocated_regs);
1695 tcg_out_ld(s, ts->type, reg, ts->mem_reg, ts->mem_offset);
1696 ts->val_type = TEMP_VAL_REG;
1697 ts->reg = reg;
1698 ts->mem_coherent = 1;
1699 s->reg_to_temp[reg] = arg;
1700 } else if (ts->val_type == TEMP_VAL_CONST) {
1701 if (tcg_target_const_match(ts->val, arg_ct)) {
1702 /* constant is OK for instruction */
1703 const_args[i] = 1;
1704 new_args[i] = ts->val;
1705 goto iarg_end;
1706 } else {
1707 /* need to move to a register */
1708 reg = tcg_reg_alloc(s, arg_ct->u.regs, allocated_regs);
1709 tcg_out_movi(s, ts->type, reg, ts->val);
1710 ts->val_type = TEMP_VAL_REG;
1711 ts->reg = reg;
1712 ts->mem_coherent = 0;
1713 s->reg_to_temp[reg] = arg;
1716 assert(ts->val_type == TEMP_VAL_REG);
1717 if (arg_ct->ct & TCG_CT_IALIAS) {
1718 if (ts->fixed_reg) {
1719 /* if fixed register, we must allocate a new register
1720 if the alias is not the same register */
1721 if (arg != args[arg_ct->alias_index])
1722 goto allocate_in_reg;
1723 } else {
1724 /* if the input is aliased to an output and if it is
1725 not dead after the instruction, we must allocate
1726 a new register and move it */
1727 if (!IS_DEAD_ARG(i)) {
1728 goto allocate_in_reg;
1732 reg = ts->reg;
1733 if (tcg_regset_test_reg(arg_ct->u.regs, reg)) {
1734 /* nothing to do : the constraint is satisfied */
1735 } else {
1736 allocate_in_reg:
1737 /* allocate a new register matching the constraint
1738 and move the temporary register into it */
1739 reg = tcg_reg_alloc(s, arg_ct->u.regs, allocated_regs);
1740 tcg_out_mov(s, ts->type, reg, ts->reg);
1742 new_args[i] = reg;
1743 const_args[i] = 0;
1744 tcg_regset_set_reg(allocated_regs, reg);
1745 iarg_end: ;
1748 if (def->flags & TCG_OPF_BB_END) {
1749 tcg_reg_alloc_bb_end(s, allocated_regs);
1750 } else {
1751 /* mark dead temporaries and free the associated registers */
1752 for(i = nb_oargs; i < nb_oargs + nb_iargs; i++) {
1753 arg = args[i];
1754 if (IS_DEAD_ARG(i)) {
1755 ts = &s->temps[arg];
1756 if (!ts->fixed_reg) {
1757 if (ts->val_type == TEMP_VAL_REG)
1758 s->reg_to_temp[ts->reg] = -1;
1759 ts->val_type = TEMP_VAL_DEAD;
1764 if (def->flags & TCG_OPF_CALL_CLOBBER) {
1765 /* XXX: permit generic clobber register list ? */
1766 for(reg = 0; reg < TCG_TARGET_NB_REGS; reg++) {
1767 if (tcg_regset_test_reg(tcg_target_call_clobber_regs, reg)) {
1768 tcg_reg_free(s, reg);
1771 /* XXX: for load/store we could do that only for the slow path
1772 (i.e. when a memory callback is called) */
1774 /* store globals and free associated registers (we assume the insn
1775 can modify any global. */
1776 save_globals(s, allocated_regs);
1779 /* satisfy the output constraints */
/* the allocated set is reset to the reserved registers before outputs
   are assigned */
1780 tcg_regset_set(allocated_regs, s->reserved_regs);
1781 for(k = 0; k < nb_oargs; k++) {
1782 i = def->sorted_args[k];
1783 arg = args[i];
1784 arg_ct = &def->args_ct[i];
1785 ts = &s->temps[arg];
1786 if (arg_ct->ct & TCG_CT_ALIAS) {
/* aliased output: reuse whatever was chosen for the aliased input */
1787 reg = new_args[arg_ct->alias_index];
1788 } else {
1789 /* if fixed register, we try to use it */
1790 reg = ts->reg;
1791 if (ts->fixed_reg &&
1792 tcg_regset_test_reg(arg_ct->u.regs, reg)) {
1793 goto oarg_end;
1795 reg = tcg_reg_alloc(s, arg_ct->u.regs, allocated_regs);
1797 tcg_regset_set_reg(allocated_regs, reg);
1798 /* if a fixed register is used, then a move will be done afterwards */
1799 if (!ts->fixed_reg) {
1800 if (ts->val_type == TEMP_VAL_REG)
1801 s->reg_to_temp[ts->reg] = -1;
1802 if (IS_DEAD_ARG(i)) {
1803 ts->val_type = TEMP_VAL_DEAD;
1804 } else {
1805 ts->val_type = TEMP_VAL_REG;
1806 ts->reg = reg;
1807 /* temp value is modified, so the value kept in memory is
1808 potentially not the same */
1809 ts->mem_coherent = 0;
1810 s->reg_to_temp[reg] = arg;
1813 oarg_end:
1814 new_args[i] = reg;
1818 /* emit instruction */
1819 tcg_out_op(s, opc, new_args, const_args);
1821 /* move the outputs in the correct register if needed */
1822 for(i = 0; i < nb_oargs; i++) {
1823 ts = &s->temps[args[i]];
1824 reg = new_args[i];
1825 if (ts->fixed_reg && ts->reg != reg) {
1826 tcg_out_mov(s, ts->type, ts->reg, reg);
/* STACK_DIR(x) expands to -(x) when TCG_TARGET_STACK_GROWSUP is defined
   and to (x) otherwise. */
1831 #ifdef TCG_TARGET_STACK_GROWSUP
1832 #define STACK_DIR(x) (-(x))
1833 #else
1834 #define STACK_DIR(x) (x)
1835 #endif
/* Register allocation and code emission for a call op.
   Argument layout read here: the first word packs nb_oargs (high 16 bits)
   and nb_iargs (low 16 bits); then come the outputs, the inputs (the last
   input is the function address, hence nb_params = nb_iargs - 1), and a
   flags word.
   Parameters beyond the available argument registers are stored to the
   call stack first, then the register parameters are loaded, the function
   address is prepared, dead inputs are released, call-clobbered registers
   are freed, globals are saved unless the call is TCG_CALL_CONST, the
   call is emitted, and finally the outputs are bound to
   tcg_target_call_oarg_regs[].
   Returns the number of argument words consumed by this op:
   nb_iargs + nb_oargs + def->nb_cargs + 1. */
1837 static int tcg_reg_alloc_call(TCGContext *s, const TCGOpDef *def,
1838 TCGOpcode opc, const TCGArg *args,
1839 unsigned int dead_args)
1841 int nb_iargs, nb_oargs, flags, nb_regs, i, reg, nb_params;
1842 TCGArg arg, func_arg;
1843 TCGTemp *ts;
1844 tcg_target_long stack_offset, call_stack_size, func_addr;
1845 int const_func_arg, allocate_args;
1846 TCGRegSet allocated_regs;
1847 const TCGArgConstraint *arg_ct;
1849 arg = *args++;
1851 nb_oargs = arg >> 16;
1852 nb_iargs = arg & 0xffff;
1853 nb_params = nb_iargs - 1;
1855 flags = args[nb_oargs + nb_iargs];
/* number of parameters passed in registers: at most the size of
   tcg_target_call_iarg_regs */
1857 nb_regs = ARRAY_SIZE(tcg_target_call_iarg_regs);
1858 if (nb_regs > nb_params)
1859 nb_regs = nb_params;
1861 /* assign stack slots first */
1862 call_stack_size = (nb_params - nb_regs) * sizeof(tcg_target_long);
1863 call_stack_size = (call_stack_size + TCG_TARGET_STACK_ALIGN - 1) &
1864 ~(TCG_TARGET_STACK_ALIGN - 1);
1865 allocate_args = (call_stack_size > TCG_STATIC_CALL_ARGS_SIZE);
1866 if (allocate_args) {
1867 /* XXX: if more than TCG_STATIC_CALL_ARGS_SIZE is needed,
1868 preallocate call stack */
1869 tcg_abort();
1872 stack_offset = TCG_TARGET_CALL_STACK_OFFSET;
1873 for(i = nb_regs; i < nb_params; i++) {
1874 arg = args[nb_oargs + i];
1875 #ifdef TCG_TARGET_STACK_GROWSUP
1876 stack_offset -= sizeof(tcg_target_long);
1877 #endif
1878 if (arg != TCG_CALL_DUMMY_ARG) {
1879 ts = &s->temps[arg];
1880 if (ts->val_type == TEMP_VAL_REG) {
1881 tcg_out_st(s, ts->type, ts->reg, TCG_REG_CALL_STACK, stack_offset);
1882 } else if (ts->val_type == TEMP_VAL_MEM) {
1883 reg = tcg_reg_alloc(s, tcg_target_available_regs[ts->type],
1884 s->reserved_regs);
1885 /* XXX: not correct if reading values from the stack */
1886 tcg_out_ld(s, ts->type, reg, ts->mem_reg, ts->mem_offset);
1887 tcg_out_st(s, ts->type, reg, TCG_REG_CALL_STACK, stack_offset);
1888 } else if (ts->val_type == TEMP_VAL_CONST) {
1889 reg = tcg_reg_alloc(s, tcg_target_available_regs[ts->type],
1890 s->reserved_regs);
1891 /* XXX: sign extend may be needed on some targets */
1892 tcg_out_movi(s, ts->type, reg, ts->val);
1893 tcg_out_st(s, ts->type, reg, TCG_REG_CALL_STACK, stack_offset);
1894 } else {
1895 tcg_abort();
1898 #ifndef TCG_TARGET_STACK_GROWSUP
1899 stack_offset += sizeof(tcg_target_long);
1900 #endif
1903 /* assign input registers */
1904 tcg_regset_set(allocated_regs, s->reserved_regs);
1905 for(i = 0; i < nb_regs; i++) {
1906 arg = args[nb_oargs + i];
1907 if (arg != TCG_CALL_DUMMY_ARG) {
1908 ts = &s->temps[arg];
1909 reg = tcg_target_call_iarg_regs[i];
/* whatever temp currently occupies the argument register is spilled */
1910 tcg_reg_free(s, reg);
1911 if (ts->val_type == TEMP_VAL_REG) {
1912 if (ts->reg != reg) {
1913 tcg_out_mov(s, ts->type, reg, ts->reg);
1915 } else if (ts->val_type == TEMP_VAL_MEM) {
1916 tcg_out_ld(s, ts->type, reg, ts->mem_reg, ts->mem_offset);
1917 } else if (ts->val_type == TEMP_VAL_CONST) {
1918 /* XXX: sign extend ? */
1919 tcg_out_movi(s, ts->type, reg, ts->val);
1920 } else {
1921 tcg_abort();
1923 tcg_regset_set_reg(allocated_regs, reg);
1927 /* assign function address */
/* the function address is the last input argument; it is passed to the
   backend either as a constant (const_func_arg = 1) or in a register */
1928 func_arg = args[nb_oargs + nb_iargs - 1];
1929 arg_ct = &def->args_ct[0];
1930 ts = &s->temps[func_arg];
1931 func_addr = ts->val;
1932 const_func_arg = 0;
1933 if (ts->val_type == TEMP_VAL_MEM) {
1934 reg = tcg_reg_alloc(s, arg_ct->u.regs, allocated_regs);
1935 tcg_out_ld(s, ts->type, reg, ts->mem_reg, ts->mem_offset);
1936 func_arg = reg;
1937 tcg_regset_set_reg(allocated_regs, reg);
1938 } else if (ts->val_type == TEMP_VAL_REG) {
1939 reg = ts->reg;
1940 if (!tcg_regset_test_reg(arg_ct->u.regs, reg)) {
1941 reg = tcg_reg_alloc(s, arg_ct->u.regs, allocated_regs);
1942 tcg_out_mov(s, ts->type, reg, ts->reg);
1944 func_arg = reg;
1945 tcg_regset_set_reg(allocated_regs, reg);
1946 } else if (ts->val_type == TEMP_VAL_CONST) {
1947 if (tcg_target_const_match(func_addr, arg_ct)) {
1948 const_func_arg = 1;
1949 func_arg = func_addr;
1950 } else {
1951 reg = tcg_reg_alloc(s, arg_ct->u.regs, allocated_regs);
1952 tcg_out_movi(s, ts->type, reg, func_addr);
1953 func_arg = reg;
1954 tcg_regset_set_reg(allocated_regs, reg);
1956 } else {
1957 tcg_abort();
1961 /* mark dead temporaries and free the associated registers */
1962 for(i = nb_oargs; i < nb_iargs + nb_oargs; i++) {
1963 arg = args[i];
1964 if (IS_DEAD_ARG(i)) {
1965 ts = &s->temps[arg];
1966 if (!ts->fixed_reg) {
1967 if (ts->val_type == TEMP_VAL_REG)
1968 s->reg_to_temp[ts->reg] = -1;
1969 ts->val_type = TEMP_VAL_DEAD;
1974 /* clobber call registers */
1975 for(reg = 0; reg < TCG_TARGET_NB_REGS; reg++) {
1976 if (tcg_regset_test_reg(tcg_target_call_clobber_regs, reg)) {
1977 tcg_reg_free(s, reg);
1981 /* store globals and free associated registers (we assume the call
1982 can modify any global. */
1983 if (!(flags & TCG_CALL_CONST)) {
1984 save_globals(s, allocated_regs);
1987 tcg_out_op(s, opc, &func_arg, &const_func_arg);
1989 /* assign output registers and emit moves if needed */
1990 for(i = 0; i < nb_oargs; i++) {
1991 arg = args[i];
1992 ts = &s->temps[arg];
1993 reg = tcg_target_call_oarg_regs[i];
1994 assert(s->reg_to_temp[reg] == -1);
1995 if (ts->fixed_reg) {
1996 if (ts->reg != reg) {
1997 tcg_out_mov(s, ts->type, ts->reg, reg);
1999 } else {
2000 if (ts->val_type == TEMP_VAL_REG)
2001 s->reg_to_temp[ts->reg] = -1;
2002 if (IS_DEAD_ARG(i)) {
2003 ts->val_type = TEMP_VAL_DEAD;
2004 } else {
2005 ts->val_type = TEMP_VAL_REG;
2006 ts->reg = reg;
2007 ts->mem_coherent = 0;
2008 s->reg_to_temp[reg] = arg;
2013 return nb_iargs + nb_oargs + def->nb_cargs + 1;
2016 #ifdef CONFIG_PROFILER
2018 static int64_t tcg_table_op_count[NB_OPS];
2020 static void dump_op_count(void)
2022 int i;
2023 FILE *f;
2024 f = fopen("/tmp/op.log", "w");
2025 for(i = INDEX_op_end; i < NB_OPS; i++) {
2026 fprintf(f, "%s %" PRId64 "\n", tcg_op_defs[i].name, tcg_table_op_count[i]);
2028 fclose(f);
2030 #endif
/* Shared code-generation driver.  Runs tcg_optimize() (when
   USE_TCG_OPTIMIZATIONS is defined) and tcg_liveness_analysis(), then
   walks the opcode buffer from the start, dispatching each op to the
   matching register-allocation/emission routine and writing host code
   starting at gen_code_buf.
   search_pc: when >= 0, the function returns the index of the first op
   after which the emitted code size exceeds search_pc bytes.
   Returns -1 when INDEX_op_end is reached without that happening. */
2033 static inline int tcg_gen_code_common(TCGContext *s, uint8_t *gen_code_buf,
2034 long search_pc)
2036 TCGOpcode opc;
2037 int op_index;
2038 const TCGOpDef *def;
2039 unsigned int dead_args;
2040 const TCGArg *args;
2042 #ifdef DEBUG_DISAS
2043 if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP))) {
2044 qemu_log("OP:\n");
2045 tcg_dump_ops(s);
2046 qemu_log("\n");
2048 #endif
2050 #ifdef CONFIG_PROFILER
2051 s->opt_time -= profile_getclock();
2052 #endif
2054 #ifdef USE_TCG_OPTIMIZATIONS
2055 gen_opparam_ptr =
2056 tcg_optimize(s, gen_opc_ptr, gen_opparam_buf, tcg_op_defs);
2057 #endif
2059 #ifdef CONFIG_PROFILER
2060 s->opt_time += profile_getclock();
2061 s->la_time -= profile_getclock();
2062 #endif
2064 tcg_liveness_analysis(s);
2066 #ifdef CONFIG_PROFILER
2067 s->la_time += profile_getclock();
2068 #endif
2070 #ifdef DEBUG_DISAS
2071 if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_OPT))) {
2072 qemu_log("OP after optimization and liveness analysis:\n");
2073 tcg_dump_ops(s);
2074 qemu_log("\n");
2076 #endif
2078 tcg_reg_alloc_start(s);
2080 s->code_buf = gen_code_buf;
2081 s->code_ptr = gen_code_buf;
2083 args = gen_opparam_buf;
2084 op_index = 0;
/* main loop: one iteration per op; left via the_end or the search_pc
   early return */
2086 for(;;) {
2087 opc = gen_opc_buf[op_index];
2088 #ifdef CONFIG_PROFILER
2089 tcg_table_op_count[opc]++;
2090 #endif
2091 def = &tcg_op_defs[opc];
2092 #if 0
2093 printf("%s: %d %d %d\n", def->name,
2094 def->nb_oargs, def->nb_iargs, def->nb_cargs);
2095 // dump_regs(s);
2096 #endif
2097 switch(opc) {
2098 case INDEX_op_mov_i32:
2099 case INDEX_op_mov_i64:
2100 dead_args = s->op_dead_args[op_index];
2101 tcg_reg_alloc_mov(s, def, args, dead_args);
2102 break;
2103 case INDEX_op_movi_i32:
2104 case INDEX_op_movi_i64:
2105 tcg_reg_alloc_movi(s, args);
2106 break;
2107 case INDEX_op_debug_insn_start:
2108 /* debug instruction */
2109 break;
2110 case INDEX_op_nop:
2111 case INDEX_op_nop1:
2112 case INDEX_op_nop2:
2113 case INDEX_op_nop3:
2114 break;
2115 case INDEX_op_nopn:
/* variable-length nop: its first word is its own length in words */
2116 args += args[0];
2117 goto next;
2118 case INDEX_op_discard:
2120 TCGTemp *ts;
2121 ts = &s->temps[args[0]];
2122 /* mark the temporary as dead */
2123 if (!ts->fixed_reg) {
2124 if (ts->val_type == TEMP_VAL_REG)
2125 s->reg_to_temp[ts->reg] = -1;
2126 ts->val_type = TEMP_VAL_DEAD;
2129 break;
2130 case INDEX_op_set_label:
2131 tcg_reg_alloc_bb_end(s, s->reserved_regs);
2132 tcg_out_label(s, args[0], s->code_ptr);
2133 break;
2134 case INDEX_op_call:
2135 dead_args = s->op_dead_args[op_index];
/* tcg_reg_alloc_call() returns how many argument words it consumed */
2136 args += tcg_reg_alloc_call(s, def, opc, args, dead_args);
2137 goto next;
2138 case INDEX_op_end:
2139 goto the_end;
2140 default:
2141 /* Sanity check that we've not introduced any unhandled opcodes. */
2142 if (def->flags & TCG_OPF_NOT_PRESENT) {
2143 tcg_abort();
2145 /* Note: in order to speed up the code, it would be much
2146 faster to have specialized register allocator functions for
2147 some common argument patterns */
2148 dead_args = s->op_dead_args[op_index];
2149 tcg_reg_alloc_op(s, def, opc, args, dead_args);
2150 break;
2152 args += def->nb_args;
2153 next:
/* stop as soon as the code emitted so far extends past search_pc */
2154 if (search_pc >= 0 && search_pc < s->code_ptr - gen_code_buf) {
2155 return op_index;
2157 op_index++;
2158 #ifndef NDEBUG
2159 check_regs(s);
2160 #endif
2162 the_end:
2163 return -1;
2166 int tcg_gen_code(TCGContext *s, uint8_t *gen_code_buf)
2168 #ifdef CONFIG_PROFILER
2170 int n;
2171 n = (gen_opc_ptr - gen_opc_buf);
2172 s->op_count += n;
2173 if (n > s->op_count_max)
2174 s->op_count_max = n;
2176 s->temp_count += s->nb_temps;
2177 if (s->nb_temps > s->temp_count_max)
2178 s->temp_count_max = s->nb_temps;
2180 #endif
2182 tcg_gen_code_common(s, gen_code_buf, -1);
2184 /* flush instruction cache */
2185 flush_icache_range((tcg_target_ulong)gen_code_buf,
2186 (tcg_target_ulong)s->code_ptr);
2188 return s->code_ptr - gen_code_buf;
2191 /* Return the index of the micro operation such as the pc after is <
2192 offset bytes from the start of the TB. The contents of gen_code_buf must
2193 not be changed, though writing the same values is ok.
2194 Return -1 if not found. */
2195 int tcg_gen_code_search_pc(TCGContext *s, uint8_t *gen_code_buf, long offset)
2197 return tcg_gen_code_common(s, gen_code_buf, offset);
2200 #ifdef CONFIG_PROFILER
2201 void tcg_dump_info(FILE *f, fprintf_function cpu_fprintf)
2203 TCGContext *s = &tcg_ctx;
2204 int64_t tot;
2206 tot = s->interm_time + s->code_time;
2207 cpu_fprintf(f, "JIT cycles %" PRId64 " (%0.3f s at 2.4 GHz)\n",
2208 tot, tot / 2.4e9);
2209 cpu_fprintf(f, "translated TBs %" PRId64 " (aborted=%" PRId64 " %0.1f%%)\n",
2210 s->tb_count,
2211 s->tb_count1 - s->tb_count,
2212 s->tb_count1 ? (double)(s->tb_count1 - s->tb_count) / s->tb_count1 * 100.0 : 0);
2213 cpu_fprintf(f, "avg ops/TB %0.1f max=%d\n",
2214 s->tb_count ? (double)s->op_count / s->tb_count : 0, s->op_count_max);
2215 cpu_fprintf(f, "deleted ops/TB %0.2f\n",
2216 s->tb_count ?
2217 (double)s->del_op_count / s->tb_count : 0);
2218 cpu_fprintf(f, "avg temps/TB %0.2f max=%d\n",
2219 s->tb_count ?
2220 (double)s->temp_count / s->tb_count : 0,
2221 s->temp_count_max);
2223 cpu_fprintf(f, "cycles/op %0.1f\n",
2224 s->op_count ? (double)tot / s->op_count : 0);
2225 cpu_fprintf(f, "cycles/in byte %0.1f\n",
2226 s->code_in_len ? (double)tot / s->code_in_len : 0);
2227 cpu_fprintf(f, "cycles/out byte %0.1f\n",
2228 s->code_out_len ? (double)tot / s->code_out_len : 0);
2229 if (tot == 0)
2230 tot = 1;
2231 cpu_fprintf(f, " gen_interm time %0.1f%%\n",
2232 (double)s->interm_time / tot * 100.0);
2233 cpu_fprintf(f, " gen_code time %0.1f%%\n",
2234 (double)s->code_time / tot * 100.0);
2235 cpu_fprintf(f, "optim./code time %0.1f%%\n",
2236 (double)s->opt_time / (s->code_time ? s->code_time : 1)
2237 * 100.0);
2238 cpu_fprintf(f, "liveness/code time %0.1f%%\n",
2239 (double)s->la_time / (s->code_time ? s->code_time : 1) * 100.0);
2240 cpu_fprintf(f, "cpu_restore count %" PRId64 "\n",
2241 s->restore_count);
2242 cpu_fprintf(f, " avg cycles %0.1f\n",
2243 s->restore_count ? (double)s->restore_time / s->restore_count : 0);
2245 dump_op_count();
2247 #else
2248 void tcg_dump_info(FILE *f, fprintf_function cpu_fprintf)
2250 cpu_fprintf(f, "[TCG profiler not compiled]\n");
2252 #endif
2254 #ifdef ELF_HOST_MACHINE
2255 /* In order to use this feature, the backend needs to do three things:
2257 (1) Define ELF_HOST_MACHINE to indicate both what value to
2258 put into the ELF image and to indicate support for the feature.
2260 (2) Define tcg_register_jit. This should create a buffer containing
2261 the contents of a .debug_frame section that describes the post-
2262 prologue unwind info for the tcg machine.
2264 (3) Call tcg_register_jit_int, with the constructed .debug_frame.
2267 /* Begin GDB interface. THE FOLLOWING MUST MATCH GDB DOCS. */
/* NOTE(review): presumably these are the values stored in
   jit_descriptor.action_flag -- confirm against the GDB JIT interface
   documentation. */
2268 typedef enum {
2269 JIT_NOACTION = 0,
2270 JIT_REGISTER_FN,
2271 JIT_UNREGISTER_FN
2272 } jit_actions_t;
/* One node of a doubly linked list (next_entry/prev_entry) describing a
   symbol file by address and size. */
2274 struct jit_code_entry {
2275 struct jit_code_entry *next_entry;
2276 struct jit_code_entry *prev_entry;
2277 const void *symfile_addr;
2278 uint64_t symfile_size;
/* Descriptor holding the interface version, an action flag, and pointers
   to the relevant and first jit_code_entry. */
2281 struct jit_descriptor {
2282 uint32_t version;
2283 uint32_t action_flag;
2284 struct jit_code_entry *relevant_entry;
2285 struct jit_code_entry *first_entry;
/* Deliberately empty, never-inlined function (the body is an empty asm
   statement).  NOTE(review): presumably the debugger places a breakpoint
   on it to be notified of registrations -- confirm against the GDB docs. */
2288 void __jit_debug_register_code(void) __attribute__((noinline));
2289 void __jit_debug_register_code(void)
2291 asm("");
2294 /* Must statically initialize the version, because GDB may check
2295 the version before we can set it. */
/* initializer order follows the struct: version = 1, remaining fields 0 */
2296 struct jit_descriptor __jit_debug_descriptor = { 1, 0, 0, 0 };
2298 /* End GDB interface. */
/* Return the byte offset of 'str' inside 'strtab', a table of consecutive
   NUL-terminated strings.  The scan starts at offset 1 and stops only on
   an exact match, so 'str' must be present in the table. */
static int find_string(const char *strtab, const char *str)
{
    const char *entry;

    for (entry = strtab + 1; strcmp(entry, str) != 0;
         entry += strlen(entry) + 1) {
        /* step over this entry and its terminating NUL */
    }
    return entry - strtab;
}
2312 static void tcg_register_jit_int(void *buf_ptr, size_t buf_size,
2313 void *debug_frame, size_t debug_frame_size)
2315 struct __attribute__((packed)) DebugInfo {
2316 uint32_t len;
2317 uint16_t version;
2318 uint32_t abbrev;
2319 uint8_t ptr_size;
2320 uint8_t cu_die;
2321 uint16_t cu_lang;
2322 uintptr_t cu_low_pc;
2323 uintptr_t cu_high_pc;
2324 uint8_t fn_die;
2325 char fn_name[16];
2326 uintptr_t fn_low_pc;
2327 uintptr_t fn_high_pc;
2328 uint8_t cu_eoc;
2331 struct ElfImage {
2332 ElfW(Ehdr) ehdr;
2333 ElfW(Phdr) phdr;
2334 ElfW(Shdr) shdr[7];
2335 ElfW(Sym) sym[2];
2336 struct DebugInfo di;
2337 uint8_t da[24];
2338 char str[80];
2341 struct ElfImage *img;
2343 static const struct ElfImage img_template = {
2344 .ehdr = {
2345 .e_ident[EI_MAG0] = ELFMAG0,
2346 .e_ident[EI_MAG1] = ELFMAG1,
2347 .e_ident[EI_MAG2] = ELFMAG2,
2348 .e_ident[EI_MAG3] = ELFMAG3,
2349 .e_ident[EI_CLASS] = ELF_CLASS,
2350 .e_ident[EI_DATA] = ELF_DATA,
2351 .e_ident[EI_VERSION] = EV_CURRENT,
2352 .e_type = ET_EXEC,
2353 .e_machine = ELF_HOST_MACHINE,
2354 .e_version = EV_CURRENT,
2355 .e_phoff = offsetof(struct ElfImage, phdr),
2356 .e_shoff = offsetof(struct ElfImage, shdr),
2357 .e_ehsize = sizeof(ElfW(Shdr)),
2358 .e_phentsize = sizeof(ElfW(Phdr)),
2359 .e_phnum = 1,
2360 .e_shentsize = sizeof(ElfW(Shdr)),
2361 .e_shnum = ARRAY_SIZE(img->shdr),
2362 .e_shstrndx = ARRAY_SIZE(img->shdr) - 1,
2363 #ifdef ELF_HOST_FLAGS
2364 .e_flags = ELF_HOST_FLAGS,
2365 #endif
2366 #ifdef ELF_OSABI
2367 .e_ident[EI_OSABI] = ELF_OSABI,
2368 #endif
2370 .phdr = {
2371 .p_type = PT_LOAD,
2372 .p_flags = PF_X,
2374 .shdr = {
2375 [0] = { .sh_type = SHT_NULL },
2376 /* Trick: The contents of code_gen_buffer are not present in
2377 this fake ELF file; that got allocated elsewhere. Therefore
2378 we mark .text as SHT_NOBITS (similar to .bss) so that readers
2379 will not look for contents. We can record any address. */
2380 [1] = { /* .text */
2381 .sh_type = SHT_NOBITS,
2382 .sh_flags = SHF_EXECINSTR | SHF_ALLOC,
2384 [2] = { /* .debug_info */
2385 .sh_type = SHT_PROGBITS,
2386 .sh_offset = offsetof(struct ElfImage, di),
2387 .sh_size = sizeof(struct DebugInfo),
2389 [3] = { /* .debug_abbrev */
2390 .sh_type = SHT_PROGBITS,
2391 .sh_offset = offsetof(struct ElfImage, da),
2392 .sh_size = sizeof(img->da),
2394 [4] = { /* .debug_frame */
2395 .sh_type = SHT_PROGBITS,
2396 .sh_offset = sizeof(struct ElfImage),
2398 [5] = { /* .symtab */
2399 .sh_type = SHT_SYMTAB,
2400 .sh_offset = offsetof(struct ElfImage, sym),
2401 .sh_size = sizeof(img->sym),
2402 .sh_info = 1,
2403 .sh_link = ARRAY_SIZE(img->shdr) - 1,
2404 .sh_entsize = sizeof(ElfW(Sym)),
2406 [6] = { /* .strtab */
2407 .sh_type = SHT_STRTAB,
2408 .sh_offset = offsetof(struct ElfImage, str),
2409 .sh_size = sizeof(img->str),
2412 .sym = {
2413 [1] = { /* code_gen_buffer */
2414 .st_info = ELF_ST_INFO(STB_GLOBAL, STT_FUNC),
2415 .st_shndx = 1,
2418 .di = {
2419 .len = sizeof(struct DebugInfo) - 4,
2420 .version = 2,
2421 .ptr_size = sizeof(void *),
2422 .cu_die = 1,
2423 .cu_lang = 0x8001, /* DW_LANG_Mips_Assembler */
2424 .fn_die = 2,
2425 .fn_name = "code_gen_buffer"
2427 .da = {
2428 1, /* abbrev number (the cu) */
2429 0x11, 1, /* DW_TAG_compile_unit, has children */
2430 0x13, 0x5, /* DW_AT_language, DW_FORM_data2 */
2431 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */
2432 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */
2433 0, 0, /* end of abbrev */
2434 2, /* abbrev number (the fn) */
2435 0x2e, 0, /* DW_TAG_subprogram, no children */
2436 0x3, 0x8, /* DW_AT_name, DW_FORM_string */
2437 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */
2438 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */
2439 0, 0, /* end of abbrev */
2440 0 /* no more abbrev */
2442 .str = "\0" ".text\0" ".debug_info\0" ".debug_abbrev\0"
2443 ".debug_frame\0" ".symtab\0" ".strtab\0" "code_gen_buffer",
2446 /* We only need a single jit entry; statically allocate it. */
2447 static struct jit_code_entry one_entry;
2449 uintptr_t buf = (uintptr_t)buf_ptr;
2450 size_t img_size = sizeof(struct ElfImage) + debug_frame_size;
2452 img = g_malloc(img_size);
2453 *img = img_template;
2454 memcpy(img + 1, debug_frame, debug_frame_size);
2456 img->phdr.p_vaddr = buf;
2457 img->phdr.p_paddr = buf;
2458 img->phdr.p_memsz = buf_size;
2460 img->shdr[1].sh_name = find_string(img->str, ".text");
2461 img->shdr[1].sh_addr = buf;
2462 img->shdr[1].sh_size = buf_size;
2464 img->shdr[2].sh_name = find_string(img->str, ".debug_info");
2465 img->shdr[3].sh_name = find_string(img->str, ".debug_abbrev");
2467 img->shdr[4].sh_name = find_string(img->str, ".debug_frame");
2468 img->shdr[4].sh_size = debug_frame_size;
2470 img->shdr[5].sh_name = find_string(img->str, ".symtab");
2471 img->shdr[6].sh_name = find_string(img->str, ".strtab");
2473 img->sym[1].st_name = find_string(img->str, "code_gen_buffer");
2474 img->sym[1].st_value = buf;
2475 img->sym[1].st_size = buf_size;
2477 img->di.cu_low_pc = buf;
2478 img->di.cu_high_pc = buf_size;
2479 img->di.fn_low_pc = buf;
2480 img->di.fn_high_pc = buf_size;
2482 #ifdef DEBUG_JIT
2483 /* Enable this block to be able to debug the ELF image file creation.
2484 One can use readelf, objdump, or other inspection utilities. */
2486 FILE *f = fopen("/tmp/qemu.jit", "w+b");
2487 if (f) {
2488 if (fwrite(img, img_size, 1, f) != img_size) {
2489 /* Avoid stupid unused return value warning for fwrite. */
2491 fclose(f);
2494 #endif
2496 one_entry.symfile_addr = img;
2497 one_entry.symfile_size = img_size;
2499 __jit_debug_descriptor.action_flag = JIT_REGISTER_FN;
2500 __jit_debug_descriptor.relevant_entry = &one_entry;
2501 __jit_debug_descriptor.first_entry = &one_entry;
2502 __jit_debug_register_code();
2504 #else
2505 /* No support for the feature. Provide the entry point expected by exec.c,
2506 and implement the internal function we declared earlier. */
/* Fallback variant of the internal registration function declared earlier
   in the file.  It is compiled in the #else branch of the conditional that
   is closed by "#endif / * ELF_HOST_MACHINE * /", i.e. when the JIT debug
   feature is not supported on this host.  It keeps the four-argument
   shape (buffer pointer and size, debug frame pointer and size) so that
   callers build unchanged in either configuration.
   NOTE(review): the function body is not visible in this extract;
   presumably it is empty -- confirm against the original file.  */
2508 static void tcg_register_jit_int(void *buf, size_t size,
2509 void *debug_frame, size_t debug_frame_size)
/* Entry point that exec.c expects to exist.  This is the variant built
   when the JIT debug feature is unsupported (the #else branch); it takes
   the code buffer pointer and its size.
   NOTE(review): the function body is not visible in this extract;
   presumably it is empty -- confirm against the original file.  */
2513 void tcg_register_jit(void *buf, size_t buf_size)
2516 #endif /* ELF_HOST_MACHINE */