/*
 * Tiny Code Generator for QEMU
 *
 * Copyright (c) 2008 Fabrice Bellard
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
#include "tcg-be-null.h"
#ifdef CONFIG_DEBUG_TCG
static const char * const tcg_target_reg_names[TCG_TARGET_NB_REGS] = {
    "%g0", "%g1", "%g2", "%g3", "%g4", "%g5", "%g6", "%g7",
    "%o0", "%o1", "%o2", "%o3", "%o4", "%o5", "%o6", "%o7",
    "%l0", "%l1", "%l2", "%l3", "%l4", "%l5", "%l6", "%l7",
    "%i0", "%i1", "%i2", "%i3", "%i4", "%i5", "%i6", "%i7",
};
#endif
/* Note that sparcv8plus can only hold 64 bit quantities in %g and %o
   registers.  These are saved manually by the kernel in full 64-bit
   slots.  The %i and %l registers are saved by the register window
   mechanism, which only allocates space for 32 bits.  Given that this
   window spill/fill can happen on any signal, we must consider the
   high bits of the %i and %l registers garbage at all times.  */
#if SPARC64
# define ALL_64  0xffffffffu
#else
# define ALL_64  0xffffu
#endif
/* Define some temporary registers.  T2 is used for constant generation.  */
#define TCG_REG_T1  TCG_REG_G1
#define TCG_REG_T2  TCG_REG_O7

#ifndef CONFIG_SOFTMMU
# define TCG_GUEST_BASE_REG TCG_REG_I5
#endif
static const int tcg_target_reg_alloc_order[] = {
    TCG_REG_L0, TCG_REG_L1, TCG_REG_L2, TCG_REG_L3,
    TCG_REG_L4, TCG_REG_L5, TCG_REG_L6, TCG_REG_L7,

    TCG_REG_I0, TCG_REG_I1, TCG_REG_I2, TCG_REG_I3,
    TCG_REG_I4, TCG_REG_I5,

    TCG_REG_G2, TCG_REG_G3, TCG_REG_G4, TCG_REG_G5,

    TCG_REG_O0, TCG_REG_O1, TCG_REG_O2, TCG_REG_O3,
    TCG_REG_O4, TCG_REG_O5,
};

static const int tcg_target_call_iarg_regs[6] = {
    TCG_REG_O0, TCG_REG_O1, TCG_REG_O2,
    TCG_REG_O3, TCG_REG_O4, TCG_REG_O5,
};

static const int tcg_target_call_oarg_regs[] = {
    TCG_REG_O0, TCG_REG_O1, TCG_REG_O2, TCG_REG_O3,
};
#define INSN_OP(x)  ((x) << 30)
#define INSN_OP2(x) ((x) << 22)
#define INSN_OP3(x) ((x) << 19)
#define INSN_OPF(x) ((x) << 5)
#define INSN_RD(x)  ((x) << 25)
#define INSN_RS1(x) ((x) << 14)
#define INSN_RS2(x) (x)
#define INSN_ASI(x) ((x) << 5)

#define INSN_IMM10(x) ((1 << 13) | ((x) & 0x3ff))
#define INSN_IMM11(x) ((1 << 13) | ((x) & 0x7ff))
#define INSN_IMM13(x) ((1 << 13) | ((x) & 0x1fff))
#define INSN_OFF16(x) ((((x) >> 2) & 0x3fff) | ((((x) >> 16) & 3) << 20))
#define INSN_OFF19(x) (((x) >> 2) & 0x07ffff)
#define INSN_COND(x) ((x) << 25)
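
/*
 * Added illustration (not from the original source): a format-3
 * arithmetic instruction is assembled by OR-ing these field macros
 * together.  For example, "add %o0, %o1, %o2" would be emitted as
 *
 *   tcg_out32(s, ARITH_ADD | INSN_RD(TCG_REG_O2)
 *                | INSN_RS1(TCG_REG_O0) | INSN_RS2(TCG_REG_O1));
 *
 * with op in bits 31:30, rd in 29:25, op3 in 24:19, rs1 in 18:14 and
 * rs2 in 4:0; the IMM13 form instead sets bit 13 and the immediate.
 */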
#define BA  (INSN_OP(0) | INSN_COND(COND_A) | INSN_OP2(0x2))

#define MOVCC_ICC  (1 << 18)
#define MOVCC_XCC  (1 << 18 | 1 << 12)

#define BPCC_XCC   (2 << 20)
#define BPCC_PT    (1 << 19)
#define BPCC_A     (1 << 29)

#define BPR_PT     BPCC_PT
#define ARITH_ADD   (INSN_OP(2) | INSN_OP3(0x00))
#define ARITH_ADDCC (INSN_OP(2) | INSN_OP3(0x10))
#define ARITH_AND   (INSN_OP(2) | INSN_OP3(0x01))
#define ARITH_ANDN  (INSN_OP(2) | INSN_OP3(0x05))
#define ARITH_OR    (INSN_OP(2) | INSN_OP3(0x02))
#define ARITH_ORCC  (INSN_OP(2) | INSN_OP3(0x12))
#define ARITH_ORN   (INSN_OP(2) | INSN_OP3(0x06))
#define ARITH_XOR   (INSN_OP(2) | INSN_OP3(0x03))
#define ARITH_SUB   (INSN_OP(2) | INSN_OP3(0x04))
#define ARITH_SUBCC (INSN_OP(2) | INSN_OP3(0x14))
#define ARITH_ADDC  (INSN_OP(2) | INSN_OP3(0x08))
#define ARITH_SUBC  (INSN_OP(2) | INSN_OP3(0x0c))
#define ARITH_UMUL  (INSN_OP(2) | INSN_OP3(0x0a))
#define ARITH_SMUL  (INSN_OP(2) | INSN_OP3(0x0b))
#define ARITH_UDIV  (INSN_OP(2) | INSN_OP3(0x0e))
#define ARITH_SDIV  (INSN_OP(2) | INSN_OP3(0x0f))
#define ARITH_MULX  (INSN_OP(2) | INSN_OP3(0x09))
#define ARITH_UDIVX (INSN_OP(2) | INSN_OP3(0x0d))
#define ARITH_SDIVX (INSN_OP(2) | INSN_OP3(0x2d))
#define ARITH_MOVCC (INSN_OP(2) | INSN_OP3(0x2c))
#define ARITH_MOVR  (INSN_OP(2) | INSN_OP3(0x2f))

#define ARITH_ADDXC   (INSN_OP(2) | INSN_OP3(0x36) | INSN_OPF(0x11))
#define ARITH_UMULXHI (INSN_OP(2) | INSN_OP3(0x36) | INSN_OPF(0x16))

#define SHIFT_SLL  (INSN_OP(2) | INSN_OP3(0x25))
#define SHIFT_SRL  (INSN_OP(2) | INSN_OP3(0x26))
#define SHIFT_SRA  (INSN_OP(2) | INSN_OP3(0x27))

#define SHIFT_SLLX (INSN_OP(2) | INSN_OP3(0x25) | (1 << 12))
#define SHIFT_SRLX (INSN_OP(2) | INSN_OP3(0x26) | (1 << 12))
#define SHIFT_SRAX (INSN_OP(2) | INSN_OP3(0x27) | (1 << 12))

#define RDY     (INSN_OP(2) | INSN_OP3(0x28) | INSN_RS1(0))
#define WRY     (INSN_OP(2) | INSN_OP3(0x30) | INSN_RD(0))
#define JMPL    (INSN_OP(2) | INSN_OP3(0x38))
#define RETURN  (INSN_OP(2) | INSN_OP3(0x39))
#define SAVE    (INSN_OP(2) | INSN_OP3(0x3c))
#define RESTORE (INSN_OP(2) | INSN_OP3(0x3d))
#define SETHI   (INSN_OP(0) | INSN_OP2(0x4))
#define CALL    INSN_OP(1)
#define LDUB    (INSN_OP(3) | INSN_OP3(0x01))
#define LDSB    (INSN_OP(3) | INSN_OP3(0x09))
#define LDUH    (INSN_OP(3) | INSN_OP3(0x02))
#define LDSH    (INSN_OP(3) | INSN_OP3(0x0a))
#define LDUW    (INSN_OP(3) | INSN_OP3(0x00))
#define LDSW    (INSN_OP(3) | INSN_OP3(0x08))
#define LDX     (INSN_OP(3) | INSN_OP3(0x0b))
#define STB     (INSN_OP(3) | INSN_OP3(0x05))
#define STH     (INSN_OP(3) | INSN_OP3(0x06))
#define STW     (INSN_OP(3) | INSN_OP3(0x04))
#define STX     (INSN_OP(3) | INSN_OP3(0x0e))
#define LDUBA   (INSN_OP(3) | INSN_OP3(0x11))
#define LDSBA   (INSN_OP(3) | INSN_OP3(0x19))
#define LDUHA   (INSN_OP(3) | INSN_OP3(0x12))
#define LDSHA   (INSN_OP(3) | INSN_OP3(0x1a))
#define LDUWA   (INSN_OP(3) | INSN_OP3(0x10))
#define LDSWA   (INSN_OP(3) | INSN_OP3(0x18))
#define LDXA    (INSN_OP(3) | INSN_OP3(0x1b))
#define STBA    (INSN_OP(3) | INSN_OP3(0x15))
#define STHA    (INSN_OP(3) | INSN_OP3(0x16))
#define STWA    (INSN_OP(3) | INSN_OP3(0x14))
#define STXA    (INSN_OP(3) | INSN_OP3(0x1e))

#define MEMBAR  (INSN_OP(2) | INSN_OP3(0x28) | INSN_RS1(15) | (1 << 13))
#ifndef ASI_PRIMARY_LITTLE
#define ASI_PRIMARY_LITTLE 0x88
#endif

#define LDUH_LE (LDUHA | INSN_ASI(ASI_PRIMARY_LITTLE))
#define LDSH_LE (LDSHA | INSN_ASI(ASI_PRIMARY_LITTLE))
#define LDUW_LE (LDUWA | INSN_ASI(ASI_PRIMARY_LITTLE))
#define LDSW_LE (LDSWA | INSN_ASI(ASI_PRIMARY_LITTLE))
#define LDX_LE  (LDXA  | INSN_ASI(ASI_PRIMARY_LITTLE))

#define STH_LE  (STHA  | INSN_ASI(ASI_PRIMARY_LITTLE))
#define STW_LE  (STWA  | INSN_ASI(ASI_PRIMARY_LITTLE))
#define STX_LE  (STXA  | INSN_ASI(ASI_PRIMARY_LITTLE))
#ifndef use_vis3_instructions
bool use_vis3_instructions;
#endif

static inline int check_fit_i64(int64_t val, unsigned int bits)
{
    return val == sextract64(val, 0, bits);
}

static inline int check_fit_i32(int32_t val, unsigned int bits)
{
    return val == sextract32(val, 0, bits);
}

#define check_fit_tl    check_fit_i64
#if SPARC64
# define check_fit_ptr  check_fit_i64
#else
# define check_fit_ptr  check_fit_i32
#endif
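
/*
 * Added note: the check_fit helpers ask whether VAL survives a round
 * trip through a BITS-wide signed field.  E.g. check_fit_i32(4095, 13)
 * is true (13-bit immediates span -4096..4095), while
 * check_fit_i32(4096, 13) is false.
 */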
static void patch_reloc(tcg_insn_unit *code_ptr, int type,
                        intptr_t value, intptr_t addend)
{
    uint32_t insn;

    tcg_debug_assert(addend == 0);
    value = tcg_ptr_byte_diff((tcg_insn_unit *)value, code_ptr);

    switch (type) {
    case R_SPARC_WDISP16:
        if (!check_fit_ptr(value >> 2, 16)) {
            tcg_abort();
        }
        insn = *code_ptr;
        insn &= ~INSN_OFF16(-1);
        insn |= INSN_OFF16(value);
        *code_ptr = insn;
        break;
    case R_SPARC_WDISP19:
        if (!check_fit_ptr(value >> 2, 19)) {
            tcg_abort();
        }
        insn = *code_ptr;
        insn &= ~INSN_OFF19(-1);
        insn |= INSN_OFF19(value);
        *code_ptr = insn;
        break;
    default:
        tcg_abort();
    }
}
/* parse target specific constraints */
static const char *target_parse_constraint(TCGArgConstraint *ct,
                                           const char *ct_str, TCGType type)
{
    switch (*ct_str++) {
    case 'r':
        ct->ct |= TCG_CT_REG;
        tcg_regset_set32(ct->u.regs, 0, 0xffffffff);
        break;
    case 'R':
        ct->ct |= TCG_CT_REG;
        tcg_regset_set32(ct->u.regs, 0, ALL_64);
        break;
    case 'A': /* qemu_ld/st address constraint */
        ct->ct |= TCG_CT_REG;
        tcg_regset_set32(ct->u.regs, 0,
                         TARGET_LONG_BITS == 64 ? ALL_64 : 0xffffffff);
    reserve_helpers:
        tcg_regset_reset_reg(ct->u.regs, TCG_REG_O0);
        tcg_regset_reset_reg(ct->u.regs, TCG_REG_O1);
        tcg_regset_reset_reg(ct->u.regs, TCG_REG_O2);
        break;
    case 's': /* qemu_st data 32-bit constraint */
        ct->ct |= TCG_CT_REG;
        tcg_regset_set32(ct->u.regs, 0, 0xffffffff);
        goto reserve_helpers;
    case 'S': /* qemu_st data 64-bit constraint */
        ct->ct |= TCG_CT_REG;
        tcg_regset_set32(ct->u.regs, 0, ALL_64);
        goto reserve_helpers;
    case 'I':
        ct->ct |= TCG_CT_CONST_S11;
        break;
    case 'J':
        ct->ct |= TCG_CT_CONST_S13;
        break;
    case 'Z':
        ct->ct |= TCG_CT_CONST_ZERO;
        break;
    default:
        return NULL;
    }
    return ct_str;
}
/* test if a constant matches the constraint */
static inline int tcg_target_const_match(tcg_target_long val, TCGType type,
                                         const TCGArgConstraint *arg_ct)
{
    int ct = arg_ct->ct;

    if (ct & TCG_CT_CONST) {
        return 1;
    }

    if (type == TCG_TYPE_I32) {
        val = (int32_t)val;
    }

    if ((ct & TCG_CT_CONST_ZERO) && val == 0) {
        return 1;
    } else if ((ct & TCG_CT_CONST_S11) && check_fit_tl(val, 11)) {
        return 1;
    } else if ((ct & TCG_CT_CONST_S13) && check_fit_tl(val, 13)) {
        return 1;
    }
    return 0;
}
static inline void tcg_out_arith(TCGContext *s, TCGReg rd, TCGReg rs1,
                                 TCGReg rs2, int op)
{
    tcg_out32(s, op | INSN_RD(rd) | INSN_RS1(rs1) | INSN_RS2(rs2));
}
static inline void tcg_out_arithi(TCGContext *s, TCGReg rd, TCGReg rs1,
                                  int32_t offset, int op)
{
    tcg_out32(s, op | INSN_RD(rd) | INSN_RS1(rs1) | INSN_IMM13(offset));
}
static void tcg_out_arithc(TCGContext *s, TCGReg rd, TCGReg rs1,
                           int32_t val2, int val2const, int op)
{
    tcg_out32(s, op | INSN_RD(rd) | INSN_RS1(rs1)
              | (val2const ? INSN_IMM13(val2) : INSN_RS2(val2)));
}
static inline void tcg_out_mov(TCGContext *s, TCGType type,
                               TCGReg ret, TCGReg arg)
{
    if (ret != arg) {
        tcg_out_arith(s, ret, arg, TCG_REG_G0, ARITH_OR);
    }
}
static inline void tcg_out_sethi(TCGContext *s, TCGReg ret, uint32_t arg)
{
    tcg_out32(s, SETHI | INSN_RD(ret) | ((arg & 0xfffffc00) >> 10));
}
static inline void tcg_out_movi_imm13(TCGContext *s, TCGReg ret, int32_t arg)
{
    tcg_out_arithi(s, ret, TCG_REG_G0, arg, ARITH_OR);
}
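
/*
 * Added note: SPARC has no dedicated register-move or load-immediate
 * instruction; "or %g0, arg, ret" serves for both, since %g0 always
 * reads as zero.  tcg_out_mov() above relies on the same idiom.
 */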
static void tcg_out_movi(TCGContext *s, TCGType type,
                         TCGReg ret, tcg_target_long arg)
{
    tcg_target_long hi, lo = (int32_t)arg;

    /* Make sure we test 32-bit constants for imm13 properly.  */
    if (type == TCG_TYPE_I32) {
        arg = lo;
    }

    /* A 13-bit constant sign-extended to 64-bits.  */
    if (check_fit_tl(arg, 13)) {
        tcg_out_movi_imm13(s, ret, arg);
        return;
    }

    /* A 32-bit constant, or 32-bit zero-extended to 64-bits.  */
    if (type == TCG_TYPE_I32 || arg == (uint32_t)arg) {
        tcg_out_sethi(s, ret, arg);
        if (arg & 0x3ff) {
            tcg_out_arithi(s, ret, ret, arg & 0x3ff, ARITH_OR);
        }
        return;
    }

    /* A 32-bit constant sign-extended to 64-bits.  */
    if (arg == lo) {
        tcg_out_sethi(s, ret, ~arg);
        tcg_out_arithi(s, ret, ret, (arg & 0x3ff) | -0x400, ARITH_XOR);
        return;
    }

    /* A 64-bit constant decomposed into 2 32-bit pieces.  */
    if (check_fit_i32(lo, 13)) {
        hi = (arg - lo) >> 32;
        tcg_out_movi(s, TCG_TYPE_I32, ret, hi);
        tcg_out_arithi(s, ret, ret, 32, SHIFT_SLLX);
        tcg_out_arithi(s, ret, ret, lo, ARITH_ADD);
    } else {
        hi = arg >> 32;
        tcg_out_movi(s, TCG_TYPE_I32, ret, hi);
        tcg_out_movi(s, TCG_TYPE_I32, TCG_REG_T2, lo);
        tcg_out_arithi(s, ret, ret, 32, SHIFT_SLLX);
        tcg_out_arith(s, ret, ret, TCG_REG_T2, ARITH_OR);
    }
}
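
/*
 * Added worked example (illustrative): moving 0x123456789abcdef0 into
 * RET takes the final branch above and emits roughly
 *
 *   sethi %hi(0x12345678), %ret    ! high 32 bits
 *   or    %ret, 0x278, %ret
 *   sethi %hi(0x9abcdef0), %t2     ! low 32 bits into the temp
 *   or    %t2, 0x2f0, %t2
 *   sllx  %ret, 32, %ret
 *   or    %ret, %t2, %ret
 */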
static inline void tcg_out_ldst_rr(TCGContext *s, TCGReg data, TCGReg a1,
                                   TCGReg a2, int op)
{
    tcg_out32(s, op | INSN_RD(data) | INSN_RS1(a1) | INSN_RS2(a2));
}
static void tcg_out_ldst(TCGContext *s, TCGReg ret, TCGReg addr,
                         intptr_t offset, int op)
{
    if (check_fit_ptr(offset, 13)) {
        tcg_out32(s, op | INSN_RD(ret) | INSN_RS1(addr) |
                  INSN_IMM13(offset));
    } else {
        tcg_out_movi(s, TCG_TYPE_PTR, TCG_REG_T1, offset);
        tcg_out_ldst_rr(s, ret, addr, TCG_REG_T1, op);
    }
}
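
/*
 * Added note: 13 bits is the reach of the signed immediate in SPARC
 * load/store encodings, so larger displacements are first materialized
 * in T1 and the register+register addressing form is used instead.
 */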
static inline void tcg_out_ld(TCGContext *s, TCGType type, TCGReg ret,
                              TCGReg arg1, intptr_t arg2)
{
    tcg_out_ldst(s, ret, arg1, arg2, (type == TCG_TYPE_I32 ? LDUW : LDX));
}

static inline void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg,
                              TCGReg arg1, intptr_t arg2)
{
    tcg_out_ldst(s, arg, arg1, arg2, (type == TCG_TYPE_I32 ? STW : STX));
}
static inline bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val,
                               TCGReg base, intptr_t ofs)
{
    if (val == 0) {
        tcg_out_st(s, type, TCG_REG_G0, base, ofs);
        return true;
    }
    return false;
}
static void tcg_out_ld_ptr(TCGContext *s, TCGReg ret, uintptr_t arg)
{
    tcg_out_movi(s, TCG_TYPE_PTR, ret, arg & ~0x3ff);
    tcg_out_ld(s, TCG_TYPE_PTR, ret, ret, arg & 0x3ff);
}
static inline void tcg_out_sety(TCGContext *s, TCGReg rs)
{
    tcg_out32(s, WRY | INSN_RS1(TCG_REG_G0) | INSN_RS2(rs));
}

static inline void tcg_out_rdy(TCGContext *s, TCGReg rd)
{
    tcg_out32(s, RDY | INSN_RD(rd));
}
static void tcg_out_div32(TCGContext *s, TCGReg rd, TCGReg rs1,
                          int32_t val2, int val2const, int uns)
{
    /* Load Y with the sign/zero extension of RS1 to 64-bits.  */
    if (uns) {
        tcg_out_sety(s, TCG_REG_G0);
    } else {
        tcg_out_arithi(s, TCG_REG_T1, rs1, 31, SHIFT_SRA);
        tcg_out_sety(s, TCG_REG_T1);
    }

    tcg_out_arithc(s, rd, rs1, val2, val2const,
                   uns ? ARITH_UDIV : ARITH_SDIV);
}
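
/*
 * Added note: the 32-bit UDIV/SDIV instructions divide the 64-bit
 * quantity Y:rs1 by the second operand, which is why Y is seeded with
 * zeroes (unsigned) or with the sign bits of rs1 (signed) beforehand.
 */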
static inline void tcg_out_nop(TCGContext *s)
{
    tcg_out_sethi(s, TCG_REG_G0, 0);
}
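
/*
 * Added note: "sethi 0, %g0" (0x01000000) is the architecturally
 * defined SPARC nop encoding, hence the reuse of tcg_out_sethi here.
 */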
static const uint8_t tcg_cond_to_bcond[] = {
    [TCG_COND_EQ] = COND_E,
    [TCG_COND_NE] = COND_NE,
    [TCG_COND_LT] = COND_L,
    [TCG_COND_GE] = COND_GE,
    [TCG_COND_LE] = COND_LE,
    [TCG_COND_GT] = COND_G,
    [TCG_COND_LTU] = COND_CS,
    [TCG_COND_GEU] = COND_CC,
    [TCG_COND_LEU] = COND_LEU,
    [TCG_COND_GTU] = COND_GU,
};

static const uint8_t tcg_cond_to_rcond[] = {
    [TCG_COND_EQ] = RCOND_Z,
    [TCG_COND_NE] = RCOND_NZ,
    [TCG_COND_LT] = RCOND_LZ,
    [TCG_COND_GT] = RCOND_GZ,
    [TCG_COND_LE] = RCOND_LEZ,
    [TCG_COND_GE] = RCOND_GEZ
};
static void tcg_out_bpcc0(TCGContext *s, int scond, int flags, int off19)
{
    tcg_out32(s, INSN_OP(0) | INSN_OP2(1) | INSN_COND(scond) | flags | off19);
}
static void tcg_out_bpcc(TCGContext *s, int scond, int flags, TCGLabel *l)
{
    int off19;

    if (l->has_value) {
        off19 = INSN_OFF19(tcg_pcrel_diff(s, l->u.value_ptr));
    } else {
        /* Make sure to preserve destinations during retranslation.  */
        off19 = *s->code_ptr & INSN_OFF19(-1);
        tcg_out_reloc(s, s->code_ptr, R_SPARC_WDISP19, l, 0);
    }
    tcg_out_bpcc0(s, scond, flags, off19);
}
static void tcg_out_cmp(TCGContext *s, TCGReg c1, int32_t c2, int c2const)
{
    tcg_out_arithc(s, TCG_REG_G0, c1, c2, c2const, ARITH_SUBCC);
}
static void tcg_out_brcond_i32(TCGContext *s, TCGCond cond, TCGReg arg1,
                               int32_t arg2, int const_arg2, TCGLabel *l)
{
    tcg_out_cmp(s, arg1, arg2, const_arg2);
    tcg_out_bpcc(s, tcg_cond_to_bcond[cond], BPCC_ICC | BPCC_PT, l);
    tcg_out_nop(s);
}
static void tcg_out_movcc(TCGContext *s, TCGCond cond, int cc, TCGReg ret,
                          int32_t v1, int v1const)
{
    tcg_out32(s, ARITH_MOVCC | cc | INSN_RD(ret)
              | INSN_RS1(tcg_cond_to_bcond[cond])
              | (v1const ? INSN_IMM11(v1) : INSN_RS2(v1)));
}
static void tcg_out_movcond_i32(TCGContext *s, TCGCond cond, TCGReg ret,
                                TCGReg c1, int32_t c2, int c2const,
                                int32_t v1, int v1const)
{
    tcg_out_cmp(s, c1, c2, c2const);
    tcg_out_movcc(s, cond, MOVCC_ICC, ret, v1, v1const);
}
static void tcg_out_brcond_i64(TCGContext *s, TCGCond cond, TCGReg arg1,
                               int32_t arg2, int const_arg2, TCGLabel *l)
{
    /* For 64-bit signed comparisons vs zero, we can avoid the compare.  */
    if (arg2 == 0 && !is_unsigned_cond(cond)) {
        int off16;

        if (l->has_value) {
            off16 = INSN_OFF16(tcg_pcrel_diff(s, l->u.value_ptr));
        } else {
            /* Make sure to preserve destinations during retranslation.  */
            off16 = *s->code_ptr & INSN_OFF16(-1);
            tcg_out_reloc(s, s->code_ptr, R_SPARC_WDISP16, l, 0);
        }
        tcg_out32(s, INSN_OP(0) | INSN_OP2(3) | BPR_PT | INSN_RS1(arg1)
                  | INSN_COND(tcg_cond_to_rcond[cond]) | off16);
    } else {
        tcg_out_cmp(s, arg1, arg2, const_arg2);
        tcg_out_bpcc(s, tcg_cond_to_bcond[cond], BPCC_XCC | BPCC_PT, l);
    }
    tcg_out_nop(s);
}
static void tcg_out_movr(TCGContext *s, TCGCond cond, TCGReg ret, TCGReg c1,
                         int32_t v1, int v1const)
{
    tcg_out32(s, ARITH_MOVR | INSN_RD(ret) | INSN_RS1(c1)
              | (tcg_cond_to_rcond[cond] << 10)
              | (v1const ? INSN_IMM10(v1) : INSN_RS2(v1)));
}
static void tcg_out_movcond_i64(TCGContext *s, TCGCond cond, TCGReg ret,
                                TCGReg c1, int32_t c2, int c2const,
                                int32_t v1, int v1const)
{
    /* For 64-bit signed comparisons vs zero, we can avoid the compare.
       Note that the immediate range is one bit smaller, so we must check
       for that as well.  */
    if (c2 == 0 && !is_unsigned_cond(cond)
        && (!v1const || check_fit_i32(v1, 10))) {
        tcg_out_movr(s, cond, ret, c1, v1, v1const);
    } else {
        tcg_out_cmp(s, c1, c2, c2const);
        tcg_out_movcc(s, cond, MOVCC_XCC, ret, v1, v1const);
    }
}
static void tcg_out_setcond_i32(TCGContext *s, TCGCond cond, TCGReg ret,
                                TCGReg c1, int32_t c2, int c2const)
{
    /* For 32-bit comparisons, we can play games with ADDC/SUBC.  */
    switch (cond) {
    case TCG_COND_LTU:
    case TCG_COND_GEU:
        /* The result of the comparison is in the carry bit.  */
        break;

    case TCG_COND_EQ:
    case TCG_COND_NE:
        /* For equality, we can transform to inequality vs zero.  */
        if (c2 != 0) {
            tcg_out_arithc(s, TCG_REG_T1, c1, c2, c2const, ARITH_XOR);
            c2 = TCG_REG_T1;
        } else {
            c2 = c1;
        }
        c1 = TCG_REG_G0, c2const = 0;
        cond = (cond == TCG_COND_EQ ? TCG_COND_GEU : TCG_COND_LTU);
        break;

    case TCG_COND_GTU:
    case TCG_COND_LEU:
        /* If we don't need to load a constant into a register, we can
           swap the operands on GTU/LEU.  There's no benefit to loading
           the constant into a temporary register.  */
        if (!c2const || c2 == 0) {
            TCGReg t = c1;
            c1 = c2;
            c2 = t;
            c2const = 0;
            cond = tcg_swap_cond(cond);
            break;
        }
        /* FALLTHRU */

    default:
        tcg_out_cmp(s, c1, c2, c2const);
        tcg_out_movi_imm13(s, ret, 0);
        tcg_out_movcc(s, cond, MOVCC_ICC, ret, 1, 1);
        return;
    }

    tcg_out_cmp(s, c1, c2, c2const);
    if (cond == TCG_COND_LTU) {
        tcg_out_arithi(s, ret, TCG_REG_G0, 0, ARITH_ADDC);
    } else {
        tcg_out_arithi(s, ret, TCG_REG_G0, -1, ARITH_SUBC);
    }
}
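
/*
 * Added note on the carry trick above: after "subcc c1, c2, %g0" the
 * carry flag holds the unsigned c1 < c2 result, so
 *   addc %g0, 0, ret    ; ret = C     (LTU)
 *   subc %g0, -1, ret   ; ret = 1 - C (GEU)
 * produce the 0/1 setcond result without a conditional move.
 */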
static void tcg_out_setcond_i64(TCGContext *s, TCGCond cond, TCGReg ret,
                                TCGReg c1, int32_t c2, int c2const)
{
    if (use_vis3_instructions) {
        switch (cond) {
        case TCG_COND_NE:
            if (c2 != 0) {
                break;
            }
            c2 = c1, c2const = 0, c1 = TCG_REG_G0;
            /* FALLTHRU */
        case TCG_COND_LTU:
            tcg_out_cmp(s, c1, c2, c2const);
            tcg_out_arith(s, ret, TCG_REG_G0, TCG_REG_G0, ARITH_ADDXC);
            return;
        default:
            break;
        }
    }

    /* For 64-bit signed comparisons vs zero, we can avoid the compare
       if the input does not overlap the output.  */
    if (c2 == 0 && !is_unsigned_cond(cond) && c1 != ret) {
        tcg_out_movi_imm13(s, ret, 0);
        tcg_out_movr(s, cond, ret, c1, 1, 1);
    } else {
        tcg_out_cmp(s, c1, c2, c2const);
        tcg_out_movi_imm13(s, ret, 0);
        tcg_out_movcc(s, cond, MOVCC_XCC, ret, 1, 1);
    }
}
static void tcg_out_addsub2_i32(TCGContext *s, TCGReg rl, TCGReg rh,
                                TCGReg al, TCGReg ah, int32_t bl, int blconst,
                                int32_t bh, int bhconst, int opl, int oph)
{
    TCGReg tmp = TCG_REG_T1;

    /* Note that the low parts are fully consumed before tmp is set.  */
    if (rl != ah && (bhconst || rl != bh)) {
        tmp = rl;
    }

    tcg_out_arithc(s, tmp, al, bl, blconst, opl);
    tcg_out_arithc(s, rh, ah, bh, bhconst, oph);
    tcg_out_mov(s, TCG_TYPE_I32, rl, tmp);
}
static void tcg_out_addsub2_i64(TCGContext *s, TCGReg rl, TCGReg rh,
                                TCGReg al, TCGReg ah, int32_t bl, int blconst,
                                int32_t bh, int bhconst, bool is_sub)
{
    TCGReg tmp = TCG_REG_T1;

    /* Note that the low parts are fully consumed before tmp is set.  */
    if (rl != ah && (bhconst || rl != bh)) {
        tmp = rl;
    }

    tcg_out_arithc(s, tmp, al, bl, blconst, is_sub ? ARITH_SUBCC : ARITH_ADDCC);

    if (use_vis3_instructions && !is_sub) {
        /* Note that ADDXC doesn't accept immediates.  */
        if (bhconst && bh != 0) {
            tcg_out_movi(s, TCG_TYPE_I64, TCG_REG_T2, bh);
            bh = TCG_REG_T2;
        }
        tcg_out_arith(s, rh, ah, bh, ARITH_ADDXC);
    } else if (bh == TCG_REG_G0) {
        /* If we have a zero, we can perform the operation in two insns,
           with the arithmetic first, and a conditional move into place.  */
        if (rh == ah) {
            tcg_out_arithi(s, TCG_REG_T2, ah, 1,
                           is_sub ? ARITH_SUB : ARITH_ADD);
            tcg_out_movcc(s, TCG_COND_LTU, MOVCC_XCC, rh, TCG_REG_T2, 0);
        } else {
            tcg_out_arithi(s, rh, ah, 1, is_sub ? ARITH_SUB : ARITH_ADD);
            tcg_out_movcc(s, TCG_COND_GEU, MOVCC_XCC, rh, ah, 0);
        }
    } else {
        /* Otherwise adjust BH as if there is carry into T2 ... */
        if (bhconst) {
            tcg_out_movi(s, TCG_TYPE_I64, TCG_REG_T2, bh + (is_sub ? -1 : 1));
        } else {
            tcg_out_arithi(s, TCG_REG_T2, bh, 1,
                           is_sub ? ARITH_SUB : ARITH_ADD);
        }
        /* ... smoosh T2 back to original BH if carry is clear ... */
        tcg_out_movcc(s, TCG_COND_GEU, MOVCC_XCC, TCG_REG_T2, bh, bhconst);
        /* ... and finally perform the arithmetic with the new operand.  */
        tcg_out_arith(s, rh, ah, TCG_REG_T2, is_sub ? ARITH_SUB : ARITH_ADD);
    }

    tcg_out_mov(s, TCG_TYPE_I64, rl, tmp);
}
static void tcg_out_call_nodelay(TCGContext *s, tcg_insn_unit *dest)
{
    ptrdiff_t disp = tcg_pcrel_diff(s, dest);

    if (disp == (int32_t)disp) {
        tcg_out32(s, CALL | (uint32_t)disp >> 2);
    } else {
        uintptr_t desti = (uintptr_t)dest;
        tcg_out_movi(s, TCG_TYPE_PTR, TCG_REG_T1, desti & ~0xfff);
        tcg_out_arithi(s, TCG_REG_O7, TCG_REG_T1, desti & 0xfff, JMPL);
    }
}
static void tcg_out_call(TCGContext *s, tcg_insn_unit *dest)
{
    tcg_out_call_nodelay(s, dest);
    tcg_out_nop(s);
}
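
/*
 * Added note: CALL carries a 30-bit word displacement, so any target
 * within +/-2GB is reached in one insn; farther targets take the
 * T1 + JMPL path, which writes the return address into %o7 just as
 * CALL does.
 */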
static void tcg_out_mb(TCGContext *s, TCGArg a0)
{
    /* Note that the TCG memory order constants mirror the Sparc MEMBAR.  */
    tcg_out32(s, MEMBAR | (a0 & TCG_MO_ALL));
}
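
/*
 * Added note: TCG_MO_LD_LD/ST_LD/LD_ST/ST_ST occupy the same bit
 * positions as MEMBAR's #LoadLoad/#StoreLoad/#LoadStore/#StoreStore
 * mmask bits, so the TCG barrier mask can be passed through unchanged.
 */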
#ifdef CONFIG_SOFTMMU
static tcg_insn_unit *qemu_ld_trampoline[16];
static tcg_insn_unit *qemu_st_trampoline[16];
static void emit_extend(TCGContext *s, TCGReg r, int op)
{
    /* Emit zero extend of 8, 16 or 32 bit data as
     * required by the MO_* value op; do nothing for 64 bit.
     */
    switch (op & MO_SIZE) {
    case MO_8:
        tcg_out_arithi(s, r, r, 0xff, ARITH_AND);
        break;
    case MO_16:
        tcg_out_arithi(s, r, r, 16, SHIFT_SLL);
        tcg_out_arithi(s, r, r, 16, SHIFT_SRL);
        break;
    case MO_32:
        if (SPARC64) {
            tcg_out_arith(s, r, r, 0, SHIFT_SRL);
        }
        break;
    case MO_64:
        break;
    }
}
static void build_trampolines(TCGContext *s)
{
    static void * const qemu_ld_helpers[16] = {
        [MO_UB]   = helper_ret_ldub_mmu,
        [MO_SB]   = helper_ret_ldsb_mmu,
        [MO_LEUW] = helper_le_lduw_mmu,
        [MO_LESW] = helper_le_ldsw_mmu,
        [MO_LEUL] = helper_le_ldul_mmu,
        [MO_LEQ]  = helper_le_ldq_mmu,
        [MO_BEUW] = helper_be_lduw_mmu,
        [MO_BESW] = helper_be_ldsw_mmu,
        [MO_BEUL] = helper_be_ldul_mmu,
        [MO_BEQ]  = helper_be_ldq_mmu,
    };
    static void * const qemu_st_helpers[16] = {
        [MO_UB]   = helper_ret_stb_mmu,
        [MO_LEUW] = helper_le_stw_mmu,
        [MO_LEUL] = helper_le_stl_mmu,
        [MO_LEQ]  = helper_le_stq_mmu,
        [MO_BEUW] = helper_be_stw_mmu,
        [MO_BEUL] = helper_be_stl_mmu,
        [MO_BEQ]  = helper_be_stq_mmu,
    };

    int i;
    TCGReg ra;

    for (i = 0; i < 16; ++i) {
        if (qemu_ld_helpers[i] == NULL) {
            continue;
        }

        /* May as well align the trampoline.  */
        while ((uintptr_t)s->code_ptr & 15) {
            tcg_out_nop(s);
        }
        qemu_ld_trampoline[i] = s->code_ptr;

        if (SPARC64 || TARGET_LONG_BITS == 32) {
            ra = TCG_REG_O3;
        } else {
            /* Install the high part of the address.  */
            tcg_out_arithi(s, TCG_REG_O1, TCG_REG_O2, 32, SHIFT_SRLX);
            ra = TCG_REG_O4;
        }

        /* Set the retaddr operand.  */
        tcg_out_mov(s, TCG_TYPE_PTR, ra, TCG_REG_O7);
        /* Set the env operand.  */
        tcg_out_mov(s, TCG_TYPE_PTR, TCG_REG_O0, TCG_AREG0);
        /* Tail call.  */
        tcg_out_call_nodelay(s, qemu_ld_helpers[i]);
        tcg_out_mov(s, TCG_TYPE_PTR, TCG_REG_O7, ra);
    }

    for (i = 0; i < 16; ++i) {
        if (qemu_st_helpers[i] == NULL) {
            continue;
        }

        /* May as well align the trampoline.  */
        while ((uintptr_t)s->code_ptr & 15) {
            tcg_out_nop(s);
        }
        qemu_st_trampoline[i] = s->code_ptr;

        if (SPARC64) {
            emit_extend(s, TCG_REG_O2, i);
            ra = TCG_REG_O4;
        } else {
            ra = TCG_REG_O1;
            if (TARGET_LONG_BITS == 64) {
                /* Install the high part of the address.  */
                tcg_out_arithi(s, ra, ra + 1, 32, SHIFT_SRLX);
                ra += 2;
            } else {
                ra += 1;
            }
            if ((i & MO_SIZE) == MO_64) {
                /* Install the high part of the data.  */
                tcg_out_arithi(s, ra, ra + 1, 32, SHIFT_SRLX);
                ra += 2;
            } else {
                emit_extend(s, ra, i);
                ra += 1;
            }
            /* Skip the oi argument.  */
            ra += 1;
        }

        /* Set the retaddr operand.  */
        if (ra >= TCG_REG_O6) {
            tcg_out_st(s, TCG_TYPE_PTR, TCG_REG_O7, TCG_REG_CALL_STACK,
                       TCG_TARGET_CALL_STACK_OFFSET);
            ra = TCG_REG_G1;
        }
        tcg_out_mov(s, TCG_TYPE_PTR, ra, TCG_REG_O7);
        /* Set the env operand.  */
        tcg_out_mov(s, TCG_TYPE_PTR, TCG_REG_O0, TCG_AREG0);
        /* Tail call.  */
        tcg_out_call_nodelay(s, qemu_st_helpers[i]);
        tcg_out_mov(s, TCG_TYPE_PTR, TCG_REG_O7, ra);
    }
}
/* Generate global QEMU prologue and epilogue code */
static void tcg_target_qemu_prologue(TCGContext *s)
{
    int tmp_buf_size, frame_size;

    /* The TCG temp buffer is at the top of the frame, immediately
       below the frame pointer.  */
    tmp_buf_size = CPU_TEMP_BUF_NLONGS * (int)sizeof(long);
    tcg_set_frame(s, TCG_REG_I6, TCG_TARGET_STACK_BIAS - tmp_buf_size,
                  tmp_buf_size);

    /* TCG_TARGET_CALL_STACK_OFFSET includes the stack bias, but is
       otherwise the minimal frame usable by callees.  */
    frame_size = TCG_TARGET_CALL_STACK_OFFSET - TCG_TARGET_STACK_BIAS;
    frame_size += TCG_STATIC_CALL_ARGS_SIZE + tmp_buf_size;
    frame_size += TCG_TARGET_STACK_ALIGN - 1;
    frame_size &= -TCG_TARGET_STACK_ALIGN;
    tcg_out32(s, SAVE | INSN_RD(TCG_REG_O6) | INSN_RS1(TCG_REG_O6) |
              INSN_IMM13(-frame_size));

#ifndef CONFIG_SOFTMMU
    if (guest_base != 0) {
        tcg_out_movi(s, TCG_TYPE_PTR, TCG_GUEST_BASE_REG, guest_base);
        tcg_regset_set_reg(s->reserved_regs, TCG_GUEST_BASE_REG);
    }
#endif

    tcg_out_arithi(s, TCG_REG_G0, TCG_REG_I1, 0, JMPL);
    /* delay slot */
    tcg_out_nop(s);

    /* No epilogue required.  We issue ret + restore directly in the TB.  */

#ifdef CONFIG_SOFTMMU
    build_trampolines(s);
#endif
}
#if defined(CONFIG_SOFTMMU)
/* Perform the TLB load and compare.

   Inputs:
   ADDRLO and ADDRHI contain the possible two parts of the address.

   MEM_INDEX and S_BITS are the memory context and log2 size of the load.

   WHICH is the offset into the CPUTLBEntry structure of the slot to read.
   This should be offsetof addr_read or addr_write.

   The result of the TLB comparison is in %[ix]cc.  The sanitized address
   is in the returned register, maybe %o0.  The TLB addend is in %o1.  */
static TCGReg tcg_out_tlb_load(TCGContext *s, TCGReg addr, int mem_index,
                               TCGMemOp opc, int which)
{
    const TCGReg r0 = TCG_REG_O0;
    const TCGReg r1 = TCG_REG_O1;
    const TCGReg r2 = TCG_REG_O2;
    unsigned s_bits = opc & MO_SIZE;
    unsigned a_bits = get_alignment_bits(opc);
    int tlb_ofs;

    /* Shift the page number down.  */
    tcg_out_arithi(s, r1, addr, TARGET_PAGE_BITS, SHIFT_SRL);

    /* Mask out the page offset, except for the required alignment.
       We don't support unaligned accesses.  */
    if (a_bits < s_bits) {
        a_bits = s_bits;
    }
    tcg_out_movi(s, TCG_TYPE_TL, TCG_REG_T1,
                 TARGET_PAGE_MASK | ((1 << a_bits) - 1));

    /* Mask the tlb index.  */
    tcg_out_arithi(s, r1, r1, CPU_TLB_SIZE - 1, ARITH_AND);

    /* Mask page, part 2.  */
    tcg_out_arith(s, r0, addr, TCG_REG_T1, ARITH_AND);

    /* Shift the tlb index into place.  */
    tcg_out_arithi(s, r1, r1, CPU_TLB_ENTRY_BITS, SHIFT_SLL);

    /* Relative to the current ENV.  */
    tcg_out_arith(s, r1, TCG_AREG0, r1, ARITH_ADD);

    /* Find a base address that can load both tlb comparator and addend.  */
    tlb_ofs = offsetof(CPUArchState, tlb_table[mem_index][0]);
    if (!check_fit_ptr(tlb_ofs + sizeof(CPUTLBEntry), 13)) {
        if (tlb_ofs & ~0x3ff) {
            tcg_out_movi(s, TCG_TYPE_PTR, TCG_REG_T1, tlb_ofs & ~0x3ff);
            tcg_out_arith(s, r1, r1, TCG_REG_T1, ARITH_ADD);
        }
        tlb_ofs &= 0x3ff;
    }

    /* Load the tlb comparator and the addend.  */
    tcg_out_ld(s, TCG_TYPE_TL, r2, r1, tlb_ofs + which);
    tcg_out_ld(s, TCG_TYPE_PTR, r1, r1, tlb_ofs+offsetof(CPUTLBEntry, addend));

    /* subcc arg0, arg2, %g0 */
    tcg_out_cmp(s, r0, r2, 0);

    /* If the guest address must be zero-extended, do so now.  */
    if (SPARC64 && TARGET_LONG_BITS == 32) {
        tcg_out_arithi(s, r0, addr, 0, SHIFT_SRL);
        return r0;
    }
    return addr;
}
#endif /* CONFIG_SOFTMMU */
static const int qemu_ld_opc[16] = {
    [MO_UB]   = LDUB,
    [MO_SB]   = LDSB,

    [MO_BEUW] = LDUH,
    [MO_BESW] = LDSH,
    [MO_BEUL] = LDUW,
    [MO_BESL] = LDSW,
    [MO_BEQ]  = LDX,

    [MO_LEUW] = LDUH_LE,
    [MO_LESW] = LDSH_LE,
    [MO_LEUL] = LDUW_LE,
    [MO_LESL] = LDSW_LE,
    [MO_LEQ]  = LDX_LE,
};

static const int qemu_st_opc[16] = {
    [MO_UB]   = STB,

    [MO_BEUW] = STH,
    [MO_BEUL] = STW,
    [MO_BEQ]  = STX,

    [MO_LEUW] = STH_LE,
    [MO_LEUL] = STW_LE,
    [MO_LEQ]  = STX_LE,
};
static void tcg_out_qemu_ld(TCGContext *s, TCGReg data, TCGReg addr,
                            TCGMemOpIdx oi, bool is_64)
{
    TCGMemOp memop = get_memop(oi);
#ifdef CONFIG_SOFTMMU
    unsigned memi = get_mmuidx(oi);
    TCGReg addrz, param;
    tcg_insn_unit *func;
    tcg_insn_unit *label_ptr;

    addrz = tcg_out_tlb_load(s, addr, memi, memop,
                             offsetof(CPUTLBEntry, addr_read));

    /* The fast path is exactly one insn.  Thus we can perform the
       entire TLB Hit in the (annulled) delay slot of the branch
       over the TLB Miss case.  */

    /* beq,a,pt %[xi]cc, label0 */
    label_ptr = s->code_ptr;
    tcg_out_bpcc0(s, COND_E, BPCC_A | BPCC_PT
                  | (TARGET_LONG_BITS == 64 ? BPCC_XCC : BPCC_ICC), 0);
    /* delay slot */
    tcg_out_ldst_rr(s, data, addrz, TCG_REG_O1,
                    qemu_ld_opc[memop & (MO_BSWAP | MO_SSIZE)]);

    /* TLB Miss.  */

    param = TCG_REG_O1;
    if (!SPARC64 && TARGET_LONG_BITS == 64) {
        /* Skip the high-part; we'll perform the extract in the trampoline.  */
        param++;
    }
    tcg_out_mov(s, TCG_TYPE_REG, param++, addrz);

    /* We use the helpers to extend SB and SW data, leaving the case
       of SL needing explicit extending below.  */
    if ((memop & MO_SSIZE) == MO_SL) {
        func = qemu_ld_trampoline[memop & (MO_BSWAP | MO_SIZE)];
    } else {
        func = qemu_ld_trampoline[memop & (MO_BSWAP | MO_SSIZE)];
    }
    tcg_debug_assert(func != NULL);
    tcg_out_call_nodelay(s, func);
    /* delay slot */
    tcg_out_movi(s, TCG_TYPE_I32, param, oi);

    /* Recall that all of the helpers return 64-bit results.
       Which complicates things for sparcv8plus.  */
    if (SPARC64) {
        /* We let the helper sign-extend SB and SW, but leave SL for here.  */
        if (is_64 && (memop & MO_SSIZE) == MO_SL) {
            tcg_out_arithi(s, data, TCG_REG_O0, 0, SHIFT_SRA);
        } else {
            tcg_out_mov(s, TCG_TYPE_REG, data, TCG_REG_O0);
        }
    } else {
        if ((memop & MO_SIZE) == MO_64) {
            tcg_out_arithi(s, TCG_REG_O0, TCG_REG_O0, 32, SHIFT_SLLX);
            tcg_out_arithi(s, TCG_REG_O1, TCG_REG_O1, 0, SHIFT_SRL);
            tcg_out_arith(s, data, TCG_REG_O0, TCG_REG_O1, ARITH_OR);
        } else if (is_64) {
            /* Re-extend from 32-bit rather than reassembling when we
               know the high register must be an extension.  */
            tcg_out_arithi(s, data, TCG_REG_O1, 0,
                           memop & MO_SIGN ? SHIFT_SRA : SHIFT_SRL);
        } else {
            tcg_out_mov(s, TCG_TYPE_I32, data, TCG_REG_O1);
        }
    }

    *label_ptr |= INSN_OFF19(tcg_ptr_byte_diff(s->code_ptr, label_ptr));
#else
    if (SPARC64 && TARGET_LONG_BITS == 32) {
        tcg_out_arithi(s, TCG_REG_T1, addr, 0, SHIFT_SRL);
        addr = TCG_REG_T1;
    }
    tcg_out_ldst_rr(s, data, addr,
                    (guest_base ? TCG_GUEST_BASE_REG : TCG_REG_G0),
                    qemu_ld_opc[memop & (MO_BSWAP | MO_SSIZE)]);
#endif /* CONFIG_SOFTMMU */
}
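
/*
 * Added note: because "beq,a" annuls its delay slot when the branch
 * falls through, the single fast-path memory access placed in that
 * slot executes only on a TLB hit; the miss path never observes it.
 */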
static void tcg_out_qemu_st(TCGContext *s, TCGReg data, TCGReg addr,
                            TCGMemOpIdx oi)
{
    TCGMemOp memop = get_memop(oi);
#ifdef CONFIG_SOFTMMU
    unsigned memi = get_mmuidx(oi);
    TCGReg addrz, param;
    tcg_insn_unit *func;
    tcg_insn_unit *label_ptr;

    addrz = tcg_out_tlb_load(s, addr, memi, memop,
                             offsetof(CPUTLBEntry, addr_write));

    /* The fast path is exactly one insn.  Thus we can perform the entire
       TLB Hit in the (annulled) delay slot of the branch over TLB Miss.  */
    /* beq,a,pt %[xi]cc, label0 */
    label_ptr = s->code_ptr;
    tcg_out_bpcc0(s, COND_E, BPCC_A | BPCC_PT
                  | (TARGET_LONG_BITS == 64 ? BPCC_XCC : BPCC_ICC), 0);
    /* delay slot */
    tcg_out_ldst_rr(s, data, addrz, TCG_REG_O1,
                    qemu_st_opc[memop & (MO_BSWAP | MO_SIZE)]);

    /* TLB Miss.  */

    param = TCG_REG_O1;
    if (!SPARC64 && TARGET_LONG_BITS == 64) {
        /* Skip the high-part; we'll perform the extract in the trampoline.  */
        param++;
    }
    tcg_out_mov(s, TCG_TYPE_REG, param++, addrz);
    if (!SPARC64 && (memop & MO_SIZE) == MO_64) {
        /* Skip the high-part; we'll perform the extract in the trampoline.  */
        param++;
    }
    tcg_out_mov(s, TCG_TYPE_REG, param++, data);

    func = qemu_st_trampoline[memop & (MO_BSWAP | MO_SIZE)];
    tcg_debug_assert(func != NULL);
    tcg_out_call_nodelay(s, func);
    /* delay slot */
    tcg_out_movi(s, TCG_TYPE_I32, param, oi);

    *label_ptr |= INSN_OFF19(tcg_ptr_byte_diff(s->code_ptr, label_ptr));
#else
    if (SPARC64 && TARGET_LONG_BITS == 32) {
        tcg_out_arithi(s, TCG_REG_T1, addr, 0, SHIFT_SRL);
        addr = TCG_REG_T1;
    }
    tcg_out_ldst_rr(s, data, addr,
                    (guest_base ? TCG_GUEST_BASE_REG : TCG_REG_G0),
                    qemu_st_opc[memop & (MO_BSWAP | MO_SIZE)]);
#endif /* CONFIG_SOFTMMU */
}
static void tcg_out_op(TCGContext *s, TCGOpcode opc,
                       const TCGArg args[TCG_MAX_OP_ARGS],
                       const int const_args[TCG_MAX_OP_ARGS])
{
    TCGArg a0, a1, a2;
    int c, c2;

    /* Hoist the loads of the most common arguments.  */
    a0 = args[0];
    a1 = args[1];
    a2 = args[2];
    c2 = const_args[2];

    switch (opc) {
    case INDEX_op_exit_tb:
        if (check_fit_ptr(a0, 13)) {
            tcg_out_arithi(s, TCG_REG_G0, TCG_REG_I7, 8, RETURN);
            tcg_out_movi_imm13(s, TCG_REG_O0, a0);
        } else {
            tcg_out_movi(s, TCG_TYPE_PTR, TCG_REG_I0, a0 & ~0x3ff);
            tcg_out_arithi(s, TCG_REG_G0, TCG_REG_I7, 8, RETURN);
            tcg_out_arithi(s, TCG_REG_O0, TCG_REG_O0, a0 & 0x3ff, ARITH_OR);
        }
        break;
    case INDEX_op_goto_tb:
        if (s->tb_jmp_insn_offset) {
            /* direct jump method */
            s->tb_jmp_insn_offset[a0] = tcg_current_code_size(s);
            /* Make sure to preserve links during retranslation.  */
            tcg_out32(s, CALL | (*s->code_ptr & ~INSN_OP(-1)));
        } else {
            /* indirect jump method */
            tcg_out_ld_ptr(s, TCG_REG_T1,
                           (uintptr_t)(s->tb_jmp_target_addr + a0));
            tcg_out_arithi(s, TCG_REG_G0, TCG_REG_T1, 0, JMPL);
        }
        tcg_out_nop(s);
        s->tb_jmp_reset_offset[a0] = tcg_current_code_size(s);
        break;
    case INDEX_op_br:
        tcg_out_bpcc(s, COND_A, BPCC_PT, arg_label(a0));
        tcg_out_nop(s);
        break;
#define OP_32_64(x)                             \
        glue(glue(case INDEX_op_, x), _i32):    \
        glue(glue(case INDEX_op_, x), _i64)
    OP_32_64(ld8u):
        tcg_out_ldst(s, a0, a1, a2, LDUB);
        break;
    OP_32_64(ld8s):
        tcg_out_ldst(s, a0, a1, a2, LDSB);
        break;
    OP_32_64(ld16u):
        tcg_out_ldst(s, a0, a1, a2, LDUH);
        break;
    OP_32_64(ld16s):
        tcg_out_ldst(s, a0, a1, a2, LDSH);
        break;
    case INDEX_op_ld_i32:
    case INDEX_op_ld32u_i64:
        tcg_out_ldst(s, a0, a1, a2, LDUW);
        break;
    OP_32_64(st8):
        tcg_out_ldst(s, a0, a1, a2, STB);
        break;
    OP_32_64(st16):
        tcg_out_ldst(s, a0, a1, a2, STH);
        break;
    case INDEX_op_st_i32:
    case INDEX_op_st32_i64:
        tcg_out_ldst(s, a0, a1, a2, STW);
        break;
    case INDEX_op_shl_i32:
        c = SHIFT_SLL;
    do_shift32:
        /* Limit immediate shift count lest we create an illegal insn.  */
        tcg_out_arithc(s, a0, a1, a2 & 31, c2, c);
        break;
    case INDEX_op_shr_i32:
        c = SHIFT_SRL;
        goto do_shift32;
    case INDEX_op_sar_i32:
        c = SHIFT_SRA;
        goto do_shift32;
    case INDEX_op_mul_i32:
        c = ARITH_UMUL;
        goto gen_arith;

    case INDEX_op_div_i32:
        tcg_out_div32(s, a0, a1, a2, c2, 0);
        break;
    case INDEX_op_divu_i32:
        tcg_out_div32(s, a0, a1, a2, c2, 1);
        break;
    case INDEX_op_brcond_i32:
        tcg_out_brcond_i32(s, a2, a0, a1, const_args[1], arg_label(args[3]));
        break;
    case INDEX_op_setcond_i32:
        tcg_out_setcond_i32(s, args[3], a0, a1, a2, c2);
        break;
    case INDEX_op_movcond_i32:
        tcg_out_movcond_i32(s, args[5], a0, a1, a2, c2, args[3], const_args[3]);
        break;
    case INDEX_op_add2_i32:
        tcg_out_addsub2_i32(s, args[0], args[1], args[2], args[3],
                            args[4], const_args[4], args[5], const_args[5],
                            ARITH_ADDCC, ARITH_ADDC);
        break;
    case INDEX_op_sub2_i32:
        tcg_out_addsub2_i32(s, args[0], args[1], args[2], args[3],
                            args[4], const_args[4], args[5], const_args[5],
                            ARITH_SUBCC, ARITH_SUBC);
        break;
    case INDEX_op_mulu2_i32:
        c = ARITH_UMUL;
        goto do_mul2;
    case INDEX_op_muls2_i32:
        c = ARITH_SMUL;
    do_mul2:
        /* The 32-bit multiply insns produce a full 64-bit result.  If the
           destination register can hold it, we can avoid the slower RDY.  */
        tcg_out_arithc(s, a0, a2, args[3], const_args[3], c);
        if (SPARC64 || a0 <= TCG_REG_O7) {
            tcg_out_arithi(s, a1, a0, 32, SHIFT_SRLX);
        } else {
            tcg_out_rdy(s, a1);
        }
        break;
    case INDEX_op_qemu_ld_i32:
        tcg_out_qemu_ld(s, a0, a1, a2, false);
        break;
    case INDEX_op_qemu_ld_i64:
        tcg_out_qemu_ld(s, a0, a1, a2, true);
        break;
    case INDEX_op_qemu_st_i32:
    case INDEX_op_qemu_st_i64:
        tcg_out_qemu_st(s, a0, a1, a2);
        break;
    case INDEX_op_ld32s_i64:
        tcg_out_ldst(s, a0, a1, a2, LDSW);
        break;
    case INDEX_op_ld_i64:
        tcg_out_ldst(s, a0, a1, a2, LDX);
        break;
    case INDEX_op_st_i64:
        tcg_out_ldst(s, a0, a1, a2, STX);
        break;
    case INDEX_op_shl_i64:
        c = SHIFT_SLLX;
    do_shift64:
        /* Limit immediate shift count lest we create an illegal insn.  */
        tcg_out_arithc(s, a0, a1, a2 & 63, c2, c);
        break;
    case INDEX_op_shr_i64:
        c = SHIFT_SRLX;
        goto do_shift64;
    case INDEX_op_sar_i64:
        c = SHIFT_SRAX;
        goto do_shift64;
    case INDEX_op_mul_i64:
        c = ARITH_MULX;
        goto gen_arith;
    case INDEX_op_div_i64:
        c = ARITH_SDIVX;
        goto gen_arith;
    case INDEX_op_divu_i64:
        c = ARITH_UDIVX;
        goto gen_arith;
    case INDEX_op_ext_i32_i64:
    case INDEX_op_ext32s_i64:
        tcg_out_arithi(s, a0, a1, 0, SHIFT_SRA);
        break;
    case INDEX_op_extu_i32_i64:
    case INDEX_op_ext32u_i64:
        tcg_out_arithi(s, a0, a1, 0, SHIFT_SRL);
        break;
    case INDEX_op_extrl_i64_i32:
        tcg_out_mov(s, TCG_TYPE_I32, a0, a1);
        break;
    case INDEX_op_extrh_i64_i32:
        tcg_out_arithi(s, a0, a1, 32, SHIFT_SRLX);
        break;
    case INDEX_op_brcond_i64:
        tcg_out_brcond_i64(s, a2, a0, a1, const_args[1], arg_label(args[3]));
        break;
    case INDEX_op_setcond_i64:
        tcg_out_setcond_i64(s, args[3], a0, a1, a2, c2);
        break;
    case INDEX_op_movcond_i64:
        tcg_out_movcond_i64(s, args[5], a0, a1, a2, c2, args[3], const_args[3]);
        break;
    case INDEX_op_add2_i64:
        tcg_out_addsub2_i64(s, args[0], args[1], args[2], args[3], args[4],
                            const_args[4], args[5], const_args[5], false);
        break;
    case INDEX_op_sub2_i64:
        tcg_out_addsub2_i64(s, args[0], args[1], args[2], args[3], args[4],
                            const_args[4], args[5], const_args[5], true);
        break;
    case INDEX_op_muluh_i64:
        tcg_out_arith(s, args[0], args[1], args[2], ARITH_UMULXHI);
        break;
    gen_arith:
        tcg_out_arithc(s, a0, a1, a2, c2, c);
        break;

    gen_arith1:
        tcg_out_arithc(s, a0, TCG_REG_G0, a1, const_args[1], c);
        break;
    case INDEX_op_mov_i32:  /* Always emitted via tcg_out_mov.  */
    case INDEX_op_mov_i64:
    case INDEX_op_movi_i32: /* Always emitted via tcg_out_movi.  */
    case INDEX_op_movi_i64:
    case INDEX_op_call:     /* Always emitted via tcg_out_call.  */
    default:
        tcg_abort();
    }
}
static const TCGTargetOpDef sparc_op_defs[] = {
    { INDEX_op_exit_tb, { } },
    { INDEX_op_goto_tb, { } },
    { INDEX_op_br, { } },

    { INDEX_op_ld8u_i32, { "r", "r" } },
    { INDEX_op_ld8s_i32, { "r", "r" } },
    { INDEX_op_ld16u_i32, { "r", "r" } },
    { INDEX_op_ld16s_i32, { "r", "r" } },
    { INDEX_op_ld_i32, { "r", "r" } },
    { INDEX_op_st8_i32, { "rZ", "r" } },
    { INDEX_op_st16_i32, { "rZ", "r" } },
    { INDEX_op_st_i32, { "rZ", "r" } },

    { INDEX_op_add_i32, { "r", "rZ", "rJ" } },
    { INDEX_op_mul_i32, { "r", "rZ", "rJ" } },
    { INDEX_op_div_i32, { "r", "rZ", "rJ" } },
    { INDEX_op_divu_i32, { "r", "rZ", "rJ" } },
    { INDEX_op_sub_i32, { "r", "rZ", "rJ" } },
    { INDEX_op_and_i32, { "r", "rZ", "rJ" } },
    { INDEX_op_andc_i32, { "r", "rZ", "rJ" } },
    { INDEX_op_or_i32, { "r", "rZ", "rJ" } },
    { INDEX_op_orc_i32, { "r", "rZ", "rJ" } },
    { INDEX_op_xor_i32, { "r", "rZ", "rJ" } },

    { INDEX_op_shl_i32, { "r", "rZ", "rJ" } },
    { INDEX_op_shr_i32, { "r", "rZ", "rJ" } },
    { INDEX_op_sar_i32, { "r", "rZ", "rJ" } },

    { INDEX_op_neg_i32, { "r", "rJ" } },
    { INDEX_op_not_i32, { "r", "rJ" } },

    { INDEX_op_brcond_i32, { "rZ", "rJ" } },
    { INDEX_op_setcond_i32, { "r", "rZ", "rJ" } },
    { INDEX_op_movcond_i32, { "r", "rZ", "rJ", "rI", "0" } },

    { INDEX_op_add2_i32, { "r", "r", "rZ", "rZ", "rJ", "rJ" } },
    { INDEX_op_sub2_i32, { "r", "r", "rZ", "rZ", "rJ", "rJ" } },
    { INDEX_op_mulu2_i32, { "r", "r", "rZ", "rJ" } },
    { INDEX_op_muls2_i32, { "r", "r", "rZ", "rJ" } },

    { INDEX_op_ld8u_i64, { "R", "r" } },
    { INDEX_op_ld8s_i64, { "R", "r" } },
    { INDEX_op_ld16u_i64, { "R", "r" } },
    { INDEX_op_ld16s_i64, { "R", "r" } },
    { INDEX_op_ld32u_i64, { "R", "r" } },
    { INDEX_op_ld32s_i64, { "R", "r" } },
    { INDEX_op_ld_i64, { "R", "r" } },
    { INDEX_op_st8_i64, { "RZ", "r" } },
    { INDEX_op_st16_i64, { "RZ", "r" } },
    { INDEX_op_st32_i64, { "RZ", "r" } },
    { INDEX_op_st_i64, { "RZ", "r" } },

    { INDEX_op_add_i64, { "R", "RZ", "RJ" } },
    { INDEX_op_mul_i64, { "R", "RZ", "RJ" } },
    { INDEX_op_div_i64, { "R", "RZ", "RJ" } },
    { INDEX_op_divu_i64, { "R", "RZ", "RJ" } },
    { INDEX_op_sub_i64, { "R", "RZ", "RJ" } },
    { INDEX_op_and_i64, { "R", "RZ", "RJ" } },
    { INDEX_op_andc_i64, { "R", "RZ", "RJ" } },
    { INDEX_op_or_i64, { "R", "RZ", "RJ" } },
    { INDEX_op_orc_i64, { "R", "RZ", "RJ" } },
    { INDEX_op_xor_i64, { "R", "RZ", "RJ" } },

    { INDEX_op_shl_i64, { "R", "RZ", "RJ" } },
    { INDEX_op_shr_i64, { "R", "RZ", "RJ" } },
    { INDEX_op_sar_i64, { "R", "RZ", "RJ" } },

    { INDEX_op_neg_i64, { "R", "RJ" } },
    { INDEX_op_not_i64, { "R", "RJ" } },

    { INDEX_op_ext32s_i64, { "R", "R" } },
    { INDEX_op_ext32u_i64, { "R", "R" } },
    { INDEX_op_ext_i32_i64, { "R", "r" } },
    { INDEX_op_extu_i32_i64, { "R", "r" } },
    { INDEX_op_extrl_i64_i32, { "r", "R" } },
    { INDEX_op_extrh_i64_i32, { "r", "R" } },

    { INDEX_op_brcond_i64, { "RZ", "RJ" } },
    { INDEX_op_setcond_i64, { "R", "RZ", "RJ" } },
    { INDEX_op_movcond_i64, { "R", "RZ", "RJ", "RI", "0" } },

    { INDEX_op_add2_i64, { "R", "R", "RZ", "RZ", "RJ", "RI" } },
    { INDEX_op_sub2_i64, { "R", "R", "RZ", "RZ", "RJ", "RI" } },
    { INDEX_op_muluh_i64, { "R", "RZ", "RZ" } },

    { INDEX_op_qemu_ld_i32, { "r", "A" } },
    { INDEX_op_qemu_ld_i64, { "R", "A" } },
    { INDEX_op_qemu_st_i32, { "sZ", "A" } },
    { INDEX_op_qemu_st_i64, { "SZ", "A" } },

    { INDEX_op_mb, { } },
};
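
/*
 * Added note: in the constraint strings above, "r"/"R" select the
 * 32-bit-safe vs. full 64-bit register sets (see ALL_64), "Z" admits
 * the constant zero (encoded as %g0), and "J"/"I" admit 13-bit/11-bit
 * signed immediates, per target_parse_constraint() above.
 */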
static const TCGTargetOpDef *tcg_target_op_def(TCGOpcode op)
{
    int i, n = ARRAY_SIZE(sparc_op_defs);

    for (i = 0; i < n; ++i) {
        if (sparc_op_defs[i].op == op) {
            return &sparc_op_defs[i];
        }
    }
    return NULL;
}
static void tcg_target_init(TCGContext *s)
{
    /* Only probe for the platform and capabilities if we haven't already
       determined maximum values at compile time.  */
#ifndef use_vis3_instructions
    {
        unsigned long hwcap = qemu_getauxval(AT_HWCAP);
        use_vis3_instructions = (hwcap & HWCAP_SPARC_VIS3) != 0;
    }
#endif

    tcg_regset_set32(tcg_target_available_regs[TCG_TYPE_I32], 0, 0xffffffff);
    tcg_regset_set32(tcg_target_available_regs[TCG_TYPE_I64], 0, ALL_64);

    tcg_regset_set32(tcg_target_call_clobber_regs, 0,
                     (1 << TCG_REG_G1) |
                     (1 << TCG_REG_G2) |
                     (1 << TCG_REG_G3) |
                     (1 << TCG_REG_G4) |
                     (1 << TCG_REG_G5) |
                     (1 << TCG_REG_G6) |
                     (1 << TCG_REG_G7) |
                     (1 << TCG_REG_O0) |
                     (1 << TCG_REG_O1) |
                     (1 << TCG_REG_O2) |
                     (1 << TCG_REG_O3) |
                     (1 << TCG_REG_O4) |
                     (1 << TCG_REG_O5) |
                     (1 << TCG_REG_O7));

    tcg_regset_clear(s->reserved_regs);
    tcg_regset_set_reg(s->reserved_regs, TCG_REG_G0); /* zero */
    tcg_regset_set_reg(s->reserved_regs, TCG_REG_G6); /* reserved for os */
    tcg_regset_set_reg(s->reserved_regs, TCG_REG_G7); /* thread pointer */
    tcg_regset_set_reg(s->reserved_regs, TCG_REG_I6); /* frame pointer */
    tcg_regset_set_reg(s->reserved_regs, TCG_REG_I7); /* return address */
    tcg_regset_set_reg(s->reserved_regs, TCG_REG_O6); /* stack pointer */
    tcg_regset_set_reg(s->reserved_regs, TCG_REG_T1); /* for internal use */
    tcg_regset_set_reg(s->reserved_regs, TCG_REG_T2); /* for internal use */
}
#if SPARC64
# define ELF_HOST_MACHINE  EM_SPARCV9
#else
# define ELF_HOST_MACHINE  EM_SPARC32PLUS
# define ELF_HOST_FLAGS    EF_SPARC_32PLUS
#endif
typedef struct {
    DebugFrameHeader h;
    uint8_t fde_def_cfa[SPARC64 ? 4 : 2];
    uint8_t fde_win_save;
    uint8_t fde_ret_save[3];
} DebugFrame;
static const DebugFrame debug_frame = {
    .h.cie.len = sizeof(DebugFrameCIE)-4, /* length after .len member */
    .h.cie.id = -1,
    .h.cie.version = 1,
    .h.cie.code_align = 1,
    .h.cie.data_align = -sizeof(void *) & 0x7f,
    .h.cie.return_column = 15,            /* o7 */

    /* Total FDE size does not include the "len" member.  */
    .h.fde.len = sizeof(DebugFrame) - offsetof(DebugFrame, h.fde.cie_offset),

    .fde_def_cfa = {
#if SPARC64
        12, 30,                         /* DW_CFA_def_cfa i6, 2047 */
        (2047 & 0x7f) | 0x80, (2047 >> 7)
#else
        13, 30                          /* DW_CFA_def_cfa_register i6 */
#endif
    },
    .fde_win_save = 0x2d,               /* DW_CFA_GNU_window_save */
    .fde_ret_save = { 9, 15, 31 },      /* DW_CFA_register o7, i7 */
};
void tcg_register_jit(void *buf, size_t buf_size)
{
    tcg_register_jit_int(buf, buf_size, &debug_frame, sizeof(debug_frame));
}
void tb_set_jmp_target1(uintptr_t jmp_addr, uintptr_t addr)
{
    uint32_t *ptr = (uint32_t *)jmp_addr;
    uintptr_t disp = addr - jmp_addr;

    /* We can reach the entire address space for 32-bit.  For 64-bit
       the code_gen_buffer can't be larger than 2GB.  */
    tcg_debug_assert(disp == (int32_t)disp);

    atomic_set(ptr, deposit32(CALL, 0, 30, disp >> 2));
    flush_icache_range(jmp_addr, jmp_addr + 4);
}