4 * Copyright (c) 2003 Fabrice Bellard
5 * Copyright (c) 2005-2007 CodeSourcery
6 * Copyright (c) 2007 OpenedHand, Ltd.
8 * This library is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License as published by the Free Software Foundation; either
11 * version 2 of the License, or (at your option) any later version.
13 * This library is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 * Lesser General Public License for more details.
18 * You should have received a copy of the GNU Lesser General Public
19 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
37 #define ENABLE_ARCH_5J 0
38 #define ENABLE_ARCH_6 arm_feature(env, ARM_FEATURE_V6)
39 #define ENABLE_ARCH_6K arm_feature(env, ARM_FEATURE_V6K)
40 #define ENABLE_ARCH_6T2 arm_feature(env, ARM_FEATURE_THUMB2)
41 #define ENABLE_ARCH_7 arm_feature(env, ARM_FEATURE_V7)
43 #define ARCH(x) do { if (!ENABLE_ARCH_##x) goto illegal_op; } while(0)
45 /* internal defines */
46 typedef struct DisasContext
{
49 /* Nonzero if this instruction has been conditionally skipped. */
51 /* The label that will be jumped to when the instruction is skipped. */
53 /* Thumb-2 conditional execution bits. */
56 struct TranslationBlock
*tb
;
57 int singlestep_enabled
;
59 #if !defined(CONFIG_USER_ONLY)
64 #if defined(CONFIG_USER_ONLY)
/* Read the `user` member of the translation context that s points to.
   The argument is parenthesized so that any pointer-valued expression
   (e.g. `ctx + 1` or `cond ? a : b`) expands correctly.  */
#define IS_USER(s) ((s)->user)
70 /* These instructions trap after executing, so defer them until after the
71 conditional execution state has been updated. */
75 static TCGv_ptr cpu_env
;
76 /* We reuse the same 64-bit temporaries for efficiency. */
77 static TCGv_i64 cpu_V0
, cpu_V1
, cpu_M0
;
78 static TCGv_i32 cpu_R
[16];
79 static TCGv_i32 cpu_exclusive_addr
;
80 static TCGv_i32 cpu_exclusive_val
;
81 static TCGv_i32 cpu_exclusive_high
;
82 #ifdef CONFIG_USER_ONLY
83 static TCGv_i32 cpu_exclusive_test
;
84 static TCGv_i32 cpu_exclusive_info
;
87 /* FIXME: These should be removed. */
88 static TCGv cpu_F0s
, cpu_F1s
;
89 static TCGv_i64 cpu_F0d
, cpu_F1d
;
91 #include "gen-icount.h"
/* Printable names of the sixteen core registers, in register-number order
   (index 15 is the program counter).  Both the strings and the pointer
   table are read-only.  */
static const char * const regnames[] =
    { "r0", "r1", "r2", "r3", "r4", "r5", "r6", "r7",
      "r8", "r9", "r10", "r11", "r12", "r13", "r14", "pc" };
97 /* initialize TCG globals. */
98 void arm_translate_init(void)
102 cpu_env
= tcg_global_reg_new_ptr(TCG_AREG0
, "env");
104 for (i
= 0; i
< 16; i
++) {
105 cpu_R
[i
] = tcg_global_mem_new_i32(TCG_AREG0
,
106 offsetof(CPUState
, regs
[i
]),
109 cpu_exclusive_addr
= tcg_global_mem_new_i32(TCG_AREG0
,
110 offsetof(CPUState
, exclusive_addr
), "exclusive_addr");
111 cpu_exclusive_val
= tcg_global_mem_new_i32(TCG_AREG0
,
112 offsetof(CPUState
, exclusive_val
), "exclusive_val");
113 cpu_exclusive_high
= tcg_global_mem_new_i32(TCG_AREG0
,
114 offsetof(CPUState
, exclusive_high
), "exclusive_high");
115 #ifdef CONFIG_USER_ONLY
116 cpu_exclusive_test
= tcg_global_mem_new_i32(TCG_AREG0
,
117 offsetof(CPUState
, exclusive_test
), "exclusive_test");
118 cpu_exclusive_info
= tcg_global_mem_new_i32(TCG_AREG0
,
119 offsetof(CPUState
, exclusive_info
), "exclusive_info");
126 static int num_temps
;
128 /* Allocate a temporary variable. */
129 static TCGv_i32
new_tmp(void)
132 return tcg_temp_new_i32();
135 /* Release a temporary variable. */
136 static void dead_tmp(TCGv tmp
)
142 static inline TCGv
load_cpu_offset(int offset
)
144 TCGv tmp
= new_tmp();
145 tcg_gen_ld_i32(tmp
, cpu_env
, offset
);
149 #define load_cpu_field(name) load_cpu_offset(offsetof(CPUState, name))
151 static inline void store_cpu_offset(TCGv var
, int offset
)
153 tcg_gen_st_i32(var
, cpu_env
, offset
);
157 #define store_cpu_field(var, name) \
158 store_cpu_offset(var, offsetof(CPUState, name))
160 /* Set a variable to the value of a CPU register. */
161 static void load_reg_var(DisasContext
*s
, TCGv var
, int reg
)
165 /* normally, since we updated PC, we need only to add one insn */
167 addr
= (long)s
->pc
+ 2;
169 addr
= (long)s
->pc
+ 4;
170 tcg_gen_movi_i32(var
, addr
);
172 tcg_gen_mov_i32(var
, cpu_R
[reg
]);
176 /* Create a new temporary and set it to the value of a CPU register. */
177 static inline TCGv
load_reg(DisasContext
*s
, int reg
)
179 TCGv tmp
= new_tmp();
180 load_reg_var(s
, tmp
, reg
);
184 /* Set a CPU register. The source must be a temporary and will be
186 static void store_reg(DisasContext
*s
, int reg
, TCGv var
)
189 tcg_gen_andi_i32(var
, var
, ~1);
190 s
->is_jmp
= DISAS_JUMP
;
192 tcg_gen_mov_i32(cpu_R
[reg
], var
);
196 /* Value extensions. */
197 #define gen_uxtb(var) tcg_gen_ext8u_i32(var, var)
198 #define gen_uxth(var) tcg_gen_ext16u_i32(var, var)
199 #define gen_sxtb(var) tcg_gen_ext8s_i32(var, var)
200 #define gen_sxth(var) tcg_gen_ext16s_i32(var, var)
202 #define gen_sxtb16(var) gen_helper_sxtb16(var, var)
203 #define gen_uxtb16(var) gen_helper_uxtb16(var, var)
206 static inline void gen_set_cpsr(TCGv var
, uint32_t mask
)
208 TCGv tmp_mask
= tcg_const_i32(mask
);
209 gen_helper_cpsr_write(var
, tmp_mask
);
210 tcg_temp_free_i32(tmp_mask
);
212 /* Set NZCV flags from the high 4 bits of var. */
213 #define gen_set_nzcv(var) gen_set_cpsr(var, CPSR_NZCV)
215 static void gen_exception(int excp
)
217 TCGv tmp
= new_tmp();
218 tcg_gen_movi_i32(tmp
, excp
);
219 gen_helper_exception(tmp
);
223 static void gen_smul_dual(TCGv a
, TCGv b
)
225 TCGv tmp1
= new_tmp();
226 TCGv tmp2
= new_tmp();
227 tcg_gen_ext16s_i32(tmp1
, a
);
228 tcg_gen_ext16s_i32(tmp2
, b
);
229 tcg_gen_mul_i32(tmp1
, tmp1
, tmp2
);
231 tcg_gen_sari_i32(a
, a
, 16);
232 tcg_gen_sari_i32(b
, b
, 16);
233 tcg_gen_mul_i32(b
, b
, a
);
234 tcg_gen_mov_i32(a
, tmp1
);
238 /* Byteswap each halfword. */
239 static void gen_rev16(TCGv var
)
241 TCGv tmp
= new_tmp();
242 tcg_gen_shri_i32(tmp
, var
, 8);
243 tcg_gen_andi_i32(tmp
, tmp
, 0x00ff00ff);
244 tcg_gen_shli_i32(var
, var
, 8);
245 tcg_gen_andi_i32(var
, var
, 0xff00ff00);
246 tcg_gen_or_i32(var
, var
, tmp
);
250 /* Byteswap low halfword and sign extend. */
251 static void gen_revsh(TCGv var
)
253 tcg_gen_ext16u_i32(var
, var
);
254 tcg_gen_bswap16_i32(var
, var
);
255 tcg_gen_ext16s_i32(var
, var
);
258 /* Unsigned bitfield extract. */
259 static void gen_ubfx(TCGv var
, int shift
, uint32_t mask
)
262 tcg_gen_shri_i32(var
, var
, shift
);
263 tcg_gen_andi_i32(var
, var
, mask
);
266 /* Signed bitfield extract. */
267 static void gen_sbfx(TCGv var
, int shift
, int width
)
272 tcg_gen_sari_i32(var
, var
, shift
);
273 if (shift
+ width
< 32) {
274 signbit
= 1u << (width
- 1);
275 tcg_gen_andi_i32(var
, var
, (1u << width
) - 1);
276 tcg_gen_xori_i32(var
, var
, signbit
);
277 tcg_gen_subi_i32(var
, var
, signbit
);
281 /* Bitfield insertion. Insert val into base. Clobbers base and val. */
282 static void gen_bfi(TCGv dest
, TCGv base
, TCGv val
, int shift
, uint32_t mask
)
284 tcg_gen_andi_i32(val
, val
, mask
);
285 tcg_gen_shli_i32(val
, val
, shift
);
286 tcg_gen_andi_i32(base
, base
, ~(mask
<< shift
));
287 tcg_gen_or_i32(dest
, base
, val
);
290 /* Return (b << 32) + a. Mark inputs as dead */
291 static TCGv_i64
gen_addq_msw(TCGv_i64 a
, TCGv b
)
293 TCGv_i64 tmp64
= tcg_temp_new_i64();
295 tcg_gen_extu_i32_i64(tmp64
, b
);
297 tcg_gen_shli_i64(tmp64
, tmp64
, 32);
298 tcg_gen_add_i64(a
, tmp64
, a
);
300 tcg_temp_free_i64(tmp64
);
304 /* Return (b << 32) - a. Mark inputs as dead. */
305 static TCGv_i64
gen_subq_msw(TCGv_i64 a
, TCGv b
)
307 TCGv_i64 tmp64
= tcg_temp_new_i64();
309 tcg_gen_extu_i32_i64(tmp64
, b
);
311 tcg_gen_shli_i64(tmp64
, tmp64
, 32);
312 tcg_gen_sub_i64(a
, tmp64
, a
);
314 tcg_temp_free_i64(tmp64
);
318 /* FIXME: Most targets have native widening multiplication.
319 It would be good to use that instead of a full wide multiply. */
320 /* 32x32->64 multiply. Marks inputs as dead. */
321 static TCGv_i64
gen_mulu_i64_i32(TCGv a
, TCGv b
)
323 TCGv_i64 tmp1
= tcg_temp_new_i64();
324 TCGv_i64 tmp2
= tcg_temp_new_i64();
326 tcg_gen_extu_i32_i64(tmp1
, a
);
328 tcg_gen_extu_i32_i64(tmp2
, b
);
330 tcg_gen_mul_i64(tmp1
, tmp1
, tmp2
);
331 tcg_temp_free_i64(tmp2
);
335 static TCGv_i64
gen_muls_i64_i32(TCGv a
, TCGv b
)
337 TCGv_i64 tmp1
= tcg_temp_new_i64();
338 TCGv_i64 tmp2
= tcg_temp_new_i64();
340 tcg_gen_ext_i32_i64(tmp1
, a
);
342 tcg_gen_ext_i32_i64(tmp2
, b
);
344 tcg_gen_mul_i64(tmp1
, tmp1
, tmp2
);
345 tcg_temp_free_i64(tmp2
);
349 /* Swap low and high halfwords. */
350 static void gen_swap_half(TCGv var
)
352 TCGv tmp
= new_tmp();
353 tcg_gen_shri_i32(tmp
, var
, 16);
354 tcg_gen_shli_i32(var
, var
, 16);
355 tcg_gen_or_i32(var
, var
, tmp
);
359 /* Dual 16-bit add. Result placed in t0 and t1 is marked as dead.
360 tmp = (t0 ^ t1) & 0x8000;
363 t0 = (t0 + t1) ^ tmp;
366 static void gen_add16(TCGv t0
, TCGv t1
)
368 TCGv tmp
= new_tmp();
369 tcg_gen_xor_i32(tmp
, t0
, t1
);
370 tcg_gen_andi_i32(tmp
, tmp
, 0x8000);
371 tcg_gen_andi_i32(t0
, t0
, ~0x8000);
372 tcg_gen_andi_i32(t1
, t1
, ~0x8000);
373 tcg_gen_add_i32(t0
, t0
, t1
);
374 tcg_gen_xor_i32(t0
, t0
, tmp
);
379 #define gen_set_CF(var) tcg_gen_st_i32(var, cpu_env, offsetof(CPUState, CF))
381 /* Set CF to the top bit of var. */
382 static void gen_set_CF_bit31(TCGv var
)
384 TCGv tmp
= new_tmp();
385 tcg_gen_shri_i32(tmp
, var
, 31);
390 /* Set N and Z flags from var. */
391 static inline void gen_logic_CC(TCGv var
)
393 tcg_gen_st_i32(var
, cpu_env
, offsetof(CPUState
, NF
));
394 tcg_gen_st_i32(var
, cpu_env
, offsetof(CPUState
, ZF
));
398 static void gen_adc(TCGv t0
, TCGv t1
)
401 tcg_gen_add_i32(t0
, t0
, t1
);
402 tmp
= load_cpu_field(CF
);
403 tcg_gen_add_i32(t0
, t0
, tmp
);
407 /* dest = T0 + T1 + CF. */
408 static void gen_add_carry(TCGv dest
, TCGv t0
, TCGv t1
)
411 tcg_gen_add_i32(dest
, t0
, t1
);
412 tmp
= load_cpu_field(CF
);
413 tcg_gen_add_i32(dest
, dest
, tmp
);
417 /* dest = T0 - T1 + CF - 1. */
418 static void gen_sub_carry(TCGv dest
, TCGv t0
, TCGv t1
)
421 tcg_gen_sub_i32(dest
, t0
, t1
);
422 tmp
= load_cpu_field(CF
);
423 tcg_gen_add_i32(dest
, dest
, tmp
);
424 tcg_gen_subi_i32(dest
, dest
, 1);
428 /* FIXME: Implement this natively. */
429 #define tcg_gen_abs_i32(t0, t1) gen_helper_abs(t0, t1)
431 static void shifter_out_im(TCGv var
, int shift
)
433 TCGv tmp
= new_tmp();
435 tcg_gen_andi_i32(tmp
, var
, 1);
437 tcg_gen_shri_i32(tmp
, var
, shift
);
439 tcg_gen_andi_i32(tmp
, tmp
, 1);
445 /* Shift by immediate. Includes special handling for shift == 0. */
446 static inline void gen_arm_shift_im(TCGv var
, int shiftop
, int shift
, int flags
)
452 shifter_out_im(var
, 32 - shift
);
453 tcg_gen_shli_i32(var
, var
, shift
);
459 tcg_gen_shri_i32(var
, var
, 31);
462 tcg_gen_movi_i32(var
, 0);
465 shifter_out_im(var
, shift
- 1);
466 tcg_gen_shri_i32(var
, var
, shift
);
473 shifter_out_im(var
, shift
- 1);
476 tcg_gen_sari_i32(var
, var
, shift
);
478 case 3: /* ROR/RRX */
481 shifter_out_im(var
, shift
- 1);
482 tcg_gen_rotri_i32(var
, var
, shift
); break;
484 TCGv tmp
= load_cpu_field(CF
);
486 shifter_out_im(var
, 0);
487 tcg_gen_shri_i32(var
, var
, 1);
488 tcg_gen_shli_i32(tmp
, tmp
, 31);
489 tcg_gen_or_i32(var
, var
, tmp
);
495 static inline void gen_arm_shift_reg(TCGv var
, int shiftop
,
496 TCGv shift
, int flags
)
500 case 0: gen_helper_shl_cc(var
, var
, shift
); break;
501 case 1: gen_helper_shr_cc(var
, var
, shift
); break;
502 case 2: gen_helper_sar_cc(var
, var
, shift
); break;
503 case 3: gen_helper_ror_cc(var
, var
, shift
); break;
507 case 0: gen_helper_shl(var
, var
, shift
); break;
508 case 1: gen_helper_shr(var
, var
, shift
); break;
509 case 2: gen_helper_sar(var
, var
, shift
); break;
510 case 3: tcg_gen_andi_i32(shift
, shift
, 0x1f);
511 tcg_gen_rotr_i32(var
, var
, shift
); break;
517 #define PAS_OP(pfx) \
519 case 0: gen_pas_helper(glue(pfx,add16)); break; \
520 case 1: gen_pas_helper(glue(pfx,addsubx)); break; \
521 case 2: gen_pas_helper(glue(pfx,subaddx)); break; \
522 case 3: gen_pas_helper(glue(pfx,sub16)); break; \
523 case 4: gen_pas_helper(glue(pfx,add8)); break; \
524 case 7: gen_pas_helper(glue(pfx,sub8)); break; \
526 static void gen_arm_parallel_addsub(int op1
, int op2
, TCGv a
, TCGv b
)
531 #define gen_pas_helper(name) glue(gen_helper_,name)(a, a, b, tmp)
533 tmp
= tcg_temp_new_ptr();
534 tcg_gen_addi_ptr(tmp
, cpu_env
, offsetof(CPUState
, GE
));
536 tcg_temp_free_ptr(tmp
);
539 tmp
= tcg_temp_new_ptr();
540 tcg_gen_addi_ptr(tmp
, cpu_env
, offsetof(CPUState
, GE
));
542 tcg_temp_free_ptr(tmp
);
544 #undef gen_pas_helper
545 #define gen_pas_helper(name) glue(gen_helper_,name)(a, a, b)
558 #undef gen_pas_helper
563 /* For unknown reasons Arm and Thumb-2 use arbitrarily different encodings. */
564 #define PAS_OP(pfx) \
566 case 0: gen_pas_helper(glue(pfx,add8)); break; \
567 case 1: gen_pas_helper(glue(pfx,add16)); break; \
568 case 2: gen_pas_helper(glue(pfx,addsubx)); break; \
569 case 4: gen_pas_helper(glue(pfx,sub8)); break; \
570 case 5: gen_pas_helper(glue(pfx,sub16)); break; \
571 case 6: gen_pas_helper(glue(pfx,subaddx)); break; \
573 static void gen_thumb2_parallel_addsub(int op1
, int op2
, TCGv a
, TCGv b
)
578 #define gen_pas_helper(name) glue(gen_helper_,name)(a, a, b, tmp)
580 tmp
= tcg_temp_new_ptr();
581 tcg_gen_addi_ptr(tmp
, cpu_env
, offsetof(CPUState
, GE
));
583 tcg_temp_free_ptr(tmp
);
586 tmp
= tcg_temp_new_ptr();
587 tcg_gen_addi_ptr(tmp
, cpu_env
, offsetof(CPUState
, GE
));
589 tcg_temp_free_ptr(tmp
);
591 #undef gen_pas_helper
592 #define gen_pas_helper(name) glue(gen_helper_,name)(a, a, b)
605 #undef gen_pas_helper
610 static void gen_test_cc(int cc
, int label
)
618 tmp
= load_cpu_field(ZF
);
619 tcg_gen_brcondi_i32(TCG_COND_EQ
, tmp
, 0, label
);
622 tmp
= load_cpu_field(ZF
);
623 tcg_gen_brcondi_i32(TCG_COND_NE
, tmp
, 0, label
);
626 tmp
= load_cpu_field(CF
);
627 tcg_gen_brcondi_i32(TCG_COND_NE
, tmp
, 0, label
);
630 tmp
= load_cpu_field(CF
);
631 tcg_gen_brcondi_i32(TCG_COND_EQ
, tmp
, 0, label
);
634 tmp
= load_cpu_field(NF
);
635 tcg_gen_brcondi_i32(TCG_COND_LT
, tmp
, 0, label
);
638 tmp
= load_cpu_field(NF
);
639 tcg_gen_brcondi_i32(TCG_COND_GE
, tmp
, 0, label
);
642 tmp
= load_cpu_field(VF
);
643 tcg_gen_brcondi_i32(TCG_COND_LT
, tmp
, 0, label
);
646 tmp
= load_cpu_field(VF
);
647 tcg_gen_brcondi_i32(TCG_COND_GE
, tmp
, 0, label
);
649 case 8: /* hi: C && !Z */
650 inv
= gen_new_label();
651 tmp
= load_cpu_field(CF
);
652 tcg_gen_brcondi_i32(TCG_COND_EQ
, tmp
, 0, inv
);
654 tmp
= load_cpu_field(ZF
);
655 tcg_gen_brcondi_i32(TCG_COND_NE
, tmp
, 0, label
);
658 case 9: /* ls: !C || Z */
659 tmp
= load_cpu_field(CF
);
660 tcg_gen_brcondi_i32(TCG_COND_EQ
, tmp
, 0, label
);
662 tmp
= load_cpu_field(ZF
);
663 tcg_gen_brcondi_i32(TCG_COND_EQ
, tmp
, 0, label
);
665 case 10: /* ge: N == V -> N ^ V == 0 */
666 tmp
= load_cpu_field(VF
);
667 tmp2
= load_cpu_field(NF
);
668 tcg_gen_xor_i32(tmp
, tmp
, tmp2
);
670 tcg_gen_brcondi_i32(TCG_COND_GE
, tmp
, 0, label
);
672 case 11: /* lt: N != V -> N ^ V != 0 */
673 tmp
= load_cpu_field(VF
);
674 tmp2
= load_cpu_field(NF
);
675 tcg_gen_xor_i32(tmp
, tmp
, tmp2
);
677 tcg_gen_brcondi_i32(TCG_COND_LT
, tmp
, 0, label
);
679 case 12: /* gt: !Z && N == V */
680 inv
= gen_new_label();
681 tmp
= load_cpu_field(ZF
);
682 tcg_gen_brcondi_i32(TCG_COND_EQ
, tmp
, 0, inv
);
684 tmp
= load_cpu_field(VF
);
685 tmp2
= load_cpu_field(NF
);
686 tcg_gen_xor_i32(tmp
, tmp
, tmp2
);
688 tcg_gen_brcondi_i32(TCG_COND_GE
, tmp
, 0, label
);
691 case 13: /* le: Z || N != V */
692 tmp
= load_cpu_field(ZF
);
693 tcg_gen_brcondi_i32(TCG_COND_EQ
, tmp
, 0, label
);
695 tmp
= load_cpu_field(VF
);
696 tmp2
= load_cpu_field(NF
);
697 tcg_gen_xor_i32(tmp
, tmp
, tmp2
);
699 tcg_gen_brcondi_i32(TCG_COND_LT
, tmp
, 0, label
);
702 fprintf(stderr
, "Bad condition code 0x%x\n", cc
);
708 static const uint8_t table_logic_cc
[16] = {
727 /* Set PC and Thumb state from an immediate address. */
728 static inline void gen_bx_im(DisasContext
*s
, uint32_t addr
)
732 s
->is_jmp
= DISAS_UPDATE
;
733 if (s
->thumb
!= (addr
& 1)) {
735 tcg_gen_movi_i32(tmp
, addr
& 1);
736 tcg_gen_st_i32(tmp
, cpu_env
, offsetof(CPUState
, thumb
));
739 tcg_gen_movi_i32(cpu_R
[15], addr
& ~1);
742 /* Set PC and Thumb state from var. var is marked as dead. */
743 static inline void gen_bx(DisasContext
*s
, TCGv var
)
745 s
->is_jmp
= DISAS_UPDATE
;
746 tcg_gen_andi_i32(cpu_R
[15], var
, ~1);
747 tcg_gen_andi_i32(var
, var
, 1);
748 store_cpu_field(var
, thumb
);
751 /* Variant of store_reg which uses branch&exchange logic when storing
752 to r15 in ARM architecture v7 and above. The source must be a temporary
753 and will be marked as dead. */
754 static inline void store_reg_bx(CPUState
*env
, DisasContext
*s
,
757 if (reg
== 15 && ENABLE_ARCH_7
) {
760 store_reg(s
, reg
, var
);
764 static inline TCGv
gen_ld8s(TCGv addr
, int index
)
766 TCGv tmp
= new_tmp();
767 tcg_gen_qemu_ld8s(tmp
, addr
, index
);
770 static inline TCGv
gen_ld8u(TCGv addr
, int index
)
772 TCGv tmp
= new_tmp();
773 tcg_gen_qemu_ld8u(tmp
, addr
, index
);
776 static inline TCGv
gen_ld16s(TCGv addr
, int index
)
778 TCGv tmp
= new_tmp();
779 tcg_gen_qemu_ld16s(tmp
, addr
, index
);
782 static inline TCGv
gen_ld16u(TCGv addr
, int index
)
784 TCGv tmp
= new_tmp();
785 tcg_gen_qemu_ld16u(tmp
, addr
, index
);
788 static inline TCGv
gen_ld32(TCGv addr
, int index
)
790 TCGv tmp
= new_tmp();
791 tcg_gen_qemu_ld32u(tmp
, addr
, index
);
794 static inline TCGv_i64
gen_ld64(TCGv addr
, int index
)
796 TCGv_i64 tmp
= tcg_temp_new_i64();
797 tcg_gen_qemu_ld64(tmp
, addr
, index
);
800 static inline void gen_st8(TCGv val
, TCGv addr
, int index
)
802 tcg_gen_qemu_st8(val
, addr
, index
);
805 static inline void gen_st16(TCGv val
, TCGv addr
, int index
)
807 tcg_gen_qemu_st16(val
, addr
, index
);
810 static inline void gen_st32(TCGv val
, TCGv addr
, int index
)
812 tcg_gen_qemu_st32(val
, addr
, index
);
815 static inline void gen_st64(TCGv_i64 val
, TCGv addr
, int index
)
817 tcg_gen_qemu_st64(val
, addr
, index
);
818 tcg_temp_free_i64(val
);
821 static inline void gen_set_pc_im(uint32_t val
)
823 tcg_gen_movi_i32(cpu_R
[15], val
);
826 /* Force a TB lookup after an instruction that changes the CPU state. */
827 static inline void gen_lookup_tb(DisasContext
*s
)
829 tcg_gen_movi_i32(cpu_R
[15], s
->pc
& ~1);
830 s
->is_jmp
= DISAS_UPDATE
;
833 static inline void gen_add_data_offset(DisasContext
*s
, unsigned int insn
,
836 int val
, rm
, shift
, shiftop
;
839 if (!(insn
& (1 << 25))) {
842 if (!(insn
& (1 << 23)))
845 tcg_gen_addi_i32(var
, var
, val
);
849 shift
= (insn
>> 7) & 0x1f;
850 shiftop
= (insn
>> 5) & 3;
851 offset
= load_reg(s
, rm
);
852 gen_arm_shift_im(offset
, shiftop
, shift
, 0);
853 if (!(insn
& (1 << 23)))
854 tcg_gen_sub_i32(var
, var
, offset
);
856 tcg_gen_add_i32(var
, var
, offset
);
861 static inline void gen_add_datah_offset(DisasContext
*s
, unsigned int insn
,
867 if (insn
& (1 << 22)) {
869 val
= (insn
& 0xf) | ((insn
>> 4) & 0xf0);
870 if (!(insn
& (1 << 23)))
874 tcg_gen_addi_i32(var
, var
, val
);
878 tcg_gen_addi_i32(var
, var
, extra
);
880 offset
= load_reg(s
, rm
);
881 if (!(insn
& (1 << 23)))
882 tcg_gen_sub_i32(var
, var
, offset
);
884 tcg_gen_add_i32(var
, var
, offset
);
889 #define VFP_OP2(name) \
890 static inline void gen_vfp_##name(int dp) \
893 gen_helper_vfp_##name##d(cpu_F0d, cpu_F0d, cpu_F1d, cpu_env); \
895 gen_helper_vfp_##name##s(cpu_F0s, cpu_F0s, cpu_F1s, cpu_env); \
905 static inline void gen_vfp_abs(int dp
)
908 gen_helper_vfp_absd(cpu_F0d
, cpu_F0d
);
910 gen_helper_vfp_abss(cpu_F0s
, cpu_F0s
);
913 static inline void gen_vfp_neg(int dp
)
916 gen_helper_vfp_negd(cpu_F0d
, cpu_F0d
);
918 gen_helper_vfp_negs(cpu_F0s
, cpu_F0s
);
921 static inline void gen_vfp_sqrt(int dp
)
924 gen_helper_vfp_sqrtd(cpu_F0d
, cpu_F0d
, cpu_env
);
926 gen_helper_vfp_sqrts(cpu_F0s
, cpu_F0s
, cpu_env
);
929 static inline void gen_vfp_cmp(int dp
)
932 gen_helper_vfp_cmpd(cpu_F0d
, cpu_F1d
, cpu_env
);
934 gen_helper_vfp_cmps(cpu_F0s
, cpu_F1s
, cpu_env
);
937 static inline void gen_vfp_cmpe(int dp
)
940 gen_helper_vfp_cmped(cpu_F0d
, cpu_F1d
, cpu_env
);
942 gen_helper_vfp_cmpes(cpu_F0s
, cpu_F1s
, cpu_env
);
945 static inline void gen_vfp_F1_ld0(int dp
)
948 tcg_gen_movi_i64(cpu_F1d
, 0);
950 tcg_gen_movi_i32(cpu_F1s
, 0);
953 static inline void gen_vfp_uito(int dp
)
956 gen_helper_vfp_uitod(cpu_F0d
, cpu_F0s
, cpu_env
);
958 gen_helper_vfp_uitos(cpu_F0s
, cpu_F0s
, cpu_env
);
961 static inline void gen_vfp_sito(int dp
)
964 gen_helper_vfp_sitod(cpu_F0d
, cpu_F0s
, cpu_env
);
966 gen_helper_vfp_sitos(cpu_F0s
, cpu_F0s
, cpu_env
);
969 static inline void gen_vfp_toui(int dp
)
972 gen_helper_vfp_touid(cpu_F0s
, cpu_F0d
, cpu_env
);
974 gen_helper_vfp_touis(cpu_F0s
, cpu_F0s
, cpu_env
);
977 static inline void gen_vfp_touiz(int dp
)
980 gen_helper_vfp_touizd(cpu_F0s
, cpu_F0d
, cpu_env
);
982 gen_helper_vfp_touizs(cpu_F0s
, cpu_F0s
, cpu_env
);
985 static inline void gen_vfp_tosi(int dp
)
988 gen_helper_vfp_tosid(cpu_F0s
, cpu_F0d
, cpu_env
);
990 gen_helper_vfp_tosis(cpu_F0s
, cpu_F0s
, cpu_env
);
993 static inline void gen_vfp_tosiz(int dp
)
996 gen_helper_vfp_tosizd(cpu_F0s
, cpu_F0d
, cpu_env
);
998 gen_helper_vfp_tosizs(cpu_F0s
, cpu_F0s
, cpu_env
);
1001 #define VFP_GEN_FIX(name) \
1002 static inline void gen_vfp_##name(int dp, int shift) \
1004 TCGv tmp_shift = tcg_const_i32(shift); \
1006 gen_helper_vfp_##name##d(cpu_F0d, cpu_F0d, tmp_shift, cpu_env);\
1008 gen_helper_vfp_##name##s(cpu_F0s, cpu_F0s, tmp_shift, cpu_env);\
1009 tcg_temp_free_i32(tmp_shift); \
1021 static inline void gen_vfp_ld(DisasContext
*s
, int dp
, TCGv addr
)
1024 tcg_gen_qemu_ld64(cpu_F0d
, addr
, IS_USER(s
));
1026 tcg_gen_qemu_ld32u(cpu_F0s
, addr
, IS_USER(s
));
1029 static inline void gen_vfp_st(DisasContext
*s
, int dp
, TCGv addr
)
1032 tcg_gen_qemu_st64(cpu_F0d
, addr
, IS_USER(s
));
1034 tcg_gen_qemu_st32(cpu_F0s
, addr
, IS_USER(s
));
1038 vfp_reg_offset (int dp
, int reg
)
1041 return offsetof(CPUARMState
, vfp
.regs
[reg
]);
1043 return offsetof(CPUARMState
, vfp
.regs
[reg
>> 1])
1044 + offsetof(CPU_DoubleU
, l
.upper
);
1046 return offsetof(CPUARMState
, vfp
.regs
[reg
>> 1])
1047 + offsetof(CPU_DoubleU
, l
.lower
);
1051 /* Return the offset of a 32-bit piece of a NEON register.
1052 zero is the least significant end of the register. */
1054 neon_reg_offset (int reg
, int n
)
1058 return vfp_reg_offset(0, sreg
);
1061 static TCGv
neon_load_reg(int reg
, int pass
)
1063 TCGv tmp
= new_tmp();
1064 tcg_gen_ld_i32(tmp
, cpu_env
, neon_reg_offset(reg
, pass
));
1068 static void neon_store_reg(int reg
, int pass
, TCGv var
)
1070 tcg_gen_st_i32(var
, cpu_env
, neon_reg_offset(reg
, pass
));
1074 static inline void neon_load_reg64(TCGv_i64 var
, int reg
)
1076 tcg_gen_ld_i64(var
, cpu_env
, vfp_reg_offset(1, reg
));
1079 static inline void neon_store_reg64(TCGv_i64 var
, int reg
)
1081 tcg_gen_st_i64(var
, cpu_env
, vfp_reg_offset(1, reg
));
1084 #define tcg_gen_ld_f32 tcg_gen_ld_i32
1085 #define tcg_gen_ld_f64 tcg_gen_ld_i64
1086 #define tcg_gen_st_f32 tcg_gen_st_i32
1087 #define tcg_gen_st_f64 tcg_gen_st_i64
1089 static inline void gen_mov_F0_vreg(int dp
, int reg
)
1092 tcg_gen_ld_f64(cpu_F0d
, cpu_env
, vfp_reg_offset(dp
, reg
));
1094 tcg_gen_ld_f32(cpu_F0s
, cpu_env
, vfp_reg_offset(dp
, reg
));
1097 static inline void gen_mov_F1_vreg(int dp
, int reg
)
1100 tcg_gen_ld_f64(cpu_F1d
, cpu_env
, vfp_reg_offset(dp
, reg
));
1102 tcg_gen_ld_f32(cpu_F1s
, cpu_env
, vfp_reg_offset(dp
, reg
));
1105 static inline void gen_mov_vreg_F0(int dp
, int reg
)
1108 tcg_gen_st_f64(cpu_F0d
, cpu_env
, vfp_reg_offset(dp
, reg
));
1110 tcg_gen_st_f32(cpu_F0s
, cpu_env
, vfp_reg_offset(dp
, reg
));
1113 #define ARM_CP_RW_BIT (1 << 20)
1115 static inline void iwmmxt_load_reg(TCGv_i64 var
, int reg
)
1117 tcg_gen_ld_i64(var
, cpu_env
, offsetof(CPUState
, iwmmxt
.regs
[reg
]));
1120 static inline void iwmmxt_store_reg(TCGv_i64 var
, int reg
)
1122 tcg_gen_st_i64(var
, cpu_env
, offsetof(CPUState
, iwmmxt
.regs
[reg
]));
1125 static inline TCGv
iwmmxt_load_creg(int reg
)
1127 TCGv var
= new_tmp();
1128 tcg_gen_ld_i32(var
, cpu_env
, offsetof(CPUState
, iwmmxt
.cregs
[reg
]));
1132 static inline void iwmmxt_store_creg(int reg
, TCGv var
)
1134 tcg_gen_st_i32(var
, cpu_env
, offsetof(CPUState
, iwmmxt
.cregs
[reg
]));
1138 static inline void gen_op_iwmmxt_movq_wRn_M0(int rn
)
1140 iwmmxt_store_reg(cpu_M0
, rn
);
1143 static inline void gen_op_iwmmxt_movq_M0_wRn(int rn
)
1145 iwmmxt_load_reg(cpu_M0
, rn
);
1148 static inline void gen_op_iwmmxt_orq_M0_wRn(int rn
)
1150 iwmmxt_load_reg(cpu_V1
, rn
);
1151 tcg_gen_or_i64(cpu_M0
, cpu_M0
, cpu_V1
);
1154 static inline void gen_op_iwmmxt_andq_M0_wRn(int rn
)
1156 iwmmxt_load_reg(cpu_V1
, rn
);
1157 tcg_gen_and_i64(cpu_M0
, cpu_M0
, cpu_V1
);
1160 static inline void gen_op_iwmmxt_xorq_M0_wRn(int rn
)
1162 iwmmxt_load_reg(cpu_V1
, rn
);
1163 tcg_gen_xor_i64(cpu_M0
, cpu_M0
, cpu_V1
);
1166 #define IWMMXT_OP(name) \
1167 static inline void gen_op_iwmmxt_##name##_M0_wRn(int rn) \
1169 iwmmxt_load_reg(cpu_V1, rn); \
1170 gen_helper_iwmmxt_##name(cpu_M0, cpu_M0, cpu_V1); \
1173 #define IWMMXT_OP_ENV(name) \
1174 static inline void gen_op_iwmmxt_##name##_M0_wRn(int rn) \
1176 iwmmxt_load_reg(cpu_V1, rn); \
1177 gen_helper_iwmmxt_##name(cpu_M0, cpu_env, cpu_M0, cpu_V1); \
1180 #define IWMMXT_OP_ENV_SIZE(name) \
1181 IWMMXT_OP_ENV(name##b) \
1182 IWMMXT_OP_ENV(name##w) \
1183 IWMMXT_OP_ENV(name##l)
1185 #define IWMMXT_OP_ENV1(name) \
1186 static inline void gen_op_iwmmxt_##name##_M0(void) \
1188 gen_helper_iwmmxt_##name(cpu_M0, cpu_env, cpu_M0); \
1202 IWMMXT_OP_ENV_SIZE(unpackl
)
1203 IWMMXT_OP_ENV_SIZE(unpackh
)
1205 IWMMXT_OP_ENV1(unpacklub
)
1206 IWMMXT_OP_ENV1(unpackluw
)
1207 IWMMXT_OP_ENV1(unpacklul
)
1208 IWMMXT_OP_ENV1(unpackhub
)
1209 IWMMXT_OP_ENV1(unpackhuw
)
1210 IWMMXT_OP_ENV1(unpackhul
)
1211 IWMMXT_OP_ENV1(unpacklsb
)
1212 IWMMXT_OP_ENV1(unpacklsw
)
1213 IWMMXT_OP_ENV1(unpacklsl
)
1214 IWMMXT_OP_ENV1(unpackhsb
)
1215 IWMMXT_OP_ENV1(unpackhsw
)
1216 IWMMXT_OP_ENV1(unpackhsl
)
1218 IWMMXT_OP_ENV_SIZE(cmpeq
)
1219 IWMMXT_OP_ENV_SIZE(cmpgtu
)
1220 IWMMXT_OP_ENV_SIZE(cmpgts
)
1222 IWMMXT_OP_ENV_SIZE(mins
)
1223 IWMMXT_OP_ENV_SIZE(minu
)
1224 IWMMXT_OP_ENV_SIZE(maxs
)
1225 IWMMXT_OP_ENV_SIZE(maxu
)
1227 IWMMXT_OP_ENV_SIZE(subn
)
1228 IWMMXT_OP_ENV_SIZE(addn
)
1229 IWMMXT_OP_ENV_SIZE(subu
)
1230 IWMMXT_OP_ENV_SIZE(addu
)
1231 IWMMXT_OP_ENV_SIZE(subs
)
1232 IWMMXT_OP_ENV_SIZE(adds
)
1234 IWMMXT_OP_ENV(avgb0
)
1235 IWMMXT_OP_ENV(avgb1
)
1236 IWMMXT_OP_ENV(avgw0
)
1237 IWMMXT_OP_ENV(avgw1
)
1241 IWMMXT_OP_ENV(packuw
)
1242 IWMMXT_OP_ENV(packul
)
1243 IWMMXT_OP_ENV(packuq
)
1244 IWMMXT_OP_ENV(packsw
)
1245 IWMMXT_OP_ENV(packsl
)
1246 IWMMXT_OP_ENV(packsq
)
1248 static void gen_op_iwmmxt_set_mup(void)
1251 tmp
= load_cpu_field(iwmmxt
.cregs
[ARM_IWMMXT_wCon
]);
1252 tcg_gen_ori_i32(tmp
, tmp
, 2);
1253 store_cpu_field(tmp
, iwmmxt
.cregs
[ARM_IWMMXT_wCon
]);
1256 static void gen_op_iwmmxt_set_cup(void)
1259 tmp
= load_cpu_field(iwmmxt
.cregs
[ARM_IWMMXT_wCon
]);
1260 tcg_gen_ori_i32(tmp
, tmp
, 1);
1261 store_cpu_field(tmp
, iwmmxt
.cregs
[ARM_IWMMXT_wCon
]);
1264 static void gen_op_iwmmxt_setpsr_nz(void)
1266 TCGv tmp
= new_tmp();
1267 gen_helper_iwmmxt_setpsr_nz(tmp
, cpu_M0
);
1268 store_cpu_field(tmp
, iwmmxt
.cregs
[ARM_IWMMXT_wCASF
]);
1271 static inline void gen_op_iwmmxt_addl_M0_wRn(int rn
)
1273 iwmmxt_load_reg(cpu_V1
, rn
);
1274 tcg_gen_ext32u_i64(cpu_V1
, cpu_V1
);
1275 tcg_gen_add_i64(cpu_M0
, cpu_M0
, cpu_V1
);
1278 static inline int gen_iwmmxt_address(DisasContext
*s
, uint32_t insn
, TCGv dest
)
1284 rd
= (insn
>> 16) & 0xf;
1285 tmp
= load_reg(s
, rd
);
1287 offset
= (insn
& 0xff) << ((insn
>> 7) & 2);
1288 if (insn
& (1 << 24)) {
1290 if (insn
& (1 << 23))
1291 tcg_gen_addi_i32(tmp
, tmp
, offset
);
1293 tcg_gen_addi_i32(tmp
, tmp
, -offset
);
1294 tcg_gen_mov_i32(dest
, tmp
);
1295 if (insn
& (1 << 21))
1296 store_reg(s
, rd
, tmp
);
1299 } else if (insn
& (1 << 21)) {
1301 tcg_gen_mov_i32(dest
, tmp
);
1302 if (insn
& (1 << 23))
1303 tcg_gen_addi_i32(tmp
, tmp
, offset
);
1305 tcg_gen_addi_i32(tmp
, tmp
, -offset
);
1306 store_reg(s
, rd
, tmp
);
1307 } else if (!(insn
& (1 << 23)))
1312 static inline int gen_iwmmxt_shift(uint32_t insn
, uint32_t mask
, TCGv dest
)
1314 int rd
= (insn
>> 0) & 0xf;
1317 if (insn
& (1 << 8)) {
1318 if (rd
< ARM_IWMMXT_wCGR0
|| rd
> ARM_IWMMXT_wCGR3
) {
1321 tmp
= iwmmxt_load_creg(rd
);
1325 iwmmxt_load_reg(cpu_V0
, rd
);
1326 tcg_gen_trunc_i64_i32(tmp
, cpu_V0
);
1328 tcg_gen_andi_i32(tmp
, tmp
, mask
);
1329 tcg_gen_mov_i32(dest
, tmp
);
1334 /* Disassemble an iwMMXt instruction. Returns nonzero if an error occurred
1335 (i.e. an undefined instruction). */
1336 static int disas_iwmmxt_insn(CPUState
*env
, DisasContext
*s
, uint32_t insn
)
1339 int rdhi
, rdlo
, rd0
, rd1
, i
;
1341 TCGv tmp
, tmp2
, tmp3
;
1343 if ((insn
& 0x0e000e00) == 0x0c000000) {
1344 if ((insn
& 0x0fe00ff0) == 0x0c400000) {
1346 rdlo
= (insn
>> 12) & 0xf;
1347 rdhi
= (insn
>> 16) & 0xf;
1348 if (insn
& ARM_CP_RW_BIT
) { /* TMRRC */
1349 iwmmxt_load_reg(cpu_V0
, wrd
);
1350 tcg_gen_trunc_i64_i32(cpu_R
[rdlo
], cpu_V0
);
1351 tcg_gen_shri_i64(cpu_V0
, cpu_V0
, 32);
1352 tcg_gen_trunc_i64_i32(cpu_R
[rdhi
], cpu_V0
);
1353 } else { /* TMCRR */
1354 tcg_gen_concat_i32_i64(cpu_V0
, cpu_R
[rdlo
], cpu_R
[rdhi
]);
1355 iwmmxt_store_reg(cpu_V0
, wrd
);
1356 gen_op_iwmmxt_set_mup();
1361 wrd
= (insn
>> 12) & 0xf;
1363 if (gen_iwmmxt_address(s
, insn
, addr
)) {
1367 if (insn
& ARM_CP_RW_BIT
) {
1368 if ((insn
>> 28) == 0xf) { /* WLDRW wCx */
1370 tcg_gen_qemu_ld32u(tmp
, addr
, IS_USER(s
));
1371 iwmmxt_store_creg(wrd
, tmp
);
1374 if (insn
& (1 << 8)) {
1375 if (insn
& (1 << 22)) { /* WLDRD */
1376 tcg_gen_qemu_ld64(cpu_M0
, addr
, IS_USER(s
));
1378 } else { /* WLDRW wRd */
1379 tmp
= gen_ld32(addr
, IS_USER(s
));
1382 if (insn
& (1 << 22)) { /* WLDRH */
1383 tmp
= gen_ld16u(addr
, IS_USER(s
));
1384 } else { /* WLDRB */
1385 tmp
= gen_ld8u(addr
, IS_USER(s
));
1389 tcg_gen_extu_i32_i64(cpu_M0
, tmp
);
1392 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1395 if ((insn
>> 28) == 0xf) { /* WSTRW wCx */
1396 tmp
= iwmmxt_load_creg(wrd
);
1397 gen_st32(tmp
, addr
, IS_USER(s
));
1399 gen_op_iwmmxt_movq_M0_wRn(wrd
);
1401 if (insn
& (1 << 8)) {
1402 if (insn
& (1 << 22)) { /* WSTRD */
1404 tcg_gen_qemu_st64(cpu_M0
, addr
, IS_USER(s
));
1405 } else { /* WSTRW wRd */
1406 tcg_gen_trunc_i64_i32(tmp
, cpu_M0
);
1407 gen_st32(tmp
, addr
, IS_USER(s
));
1410 if (insn
& (1 << 22)) { /* WSTRH */
1411 tcg_gen_trunc_i64_i32(tmp
, cpu_M0
);
1412 gen_st16(tmp
, addr
, IS_USER(s
));
1413 } else { /* WSTRB */
1414 tcg_gen_trunc_i64_i32(tmp
, cpu_M0
);
1415 gen_st8(tmp
, addr
, IS_USER(s
));
1424 if ((insn
& 0x0f000000) != 0x0e000000)
1427 switch (((insn
>> 12) & 0xf00) | ((insn
>> 4) & 0xff)) {
1428 case 0x000: /* WOR */
1429 wrd
= (insn
>> 12) & 0xf;
1430 rd0
= (insn
>> 0) & 0xf;
1431 rd1
= (insn
>> 16) & 0xf;
1432 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1433 gen_op_iwmmxt_orq_M0_wRn(rd1
);
1434 gen_op_iwmmxt_setpsr_nz();
1435 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1436 gen_op_iwmmxt_set_mup();
1437 gen_op_iwmmxt_set_cup();
1439 case 0x011: /* TMCR */
1442 rd
= (insn
>> 12) & 0xf;
1443 wrd
= (insn
>> 16) & 0xf;
1445 case ARM_IWMMXT_wCID
:
1446 case ARM_IWMMXT_wCASF
:
1448 case ARM_IWMMXT_wCon
:
1449 gen_op_iwmmxt_set_cup();
1451 case ARM_IWMMXT_wCSSF
:
1452 tmp
= iwmmxt_load_creg(wrd
);
1453 tmp2
= load_reg(s
, rd
);
1454 tcg_gen_andc_i32(tmp
, tmp
, tmp2
);
1456 iwmmxt_store_creg(wrd
, tmp
);
1458 case ARM_IWMMXT_wCGR0
:
1459 case ARM_IWMMXT_wCGR1
:
1460 case ARM_IWMMXT_wCGR2
:
1461 case ARM_IWMMXT_wCGR3
:
1462 gen_op_iwmmxt_set_cup();
1463 tmp
= load_reg(s
, rd
);
1464 iwmmxt_store_creg(wrd
, tmp
);
1470 case 0x100: /* WXOR */
1471 wrd
= (insn
>> 12) & 0xf;
1472 rd0
= (insn
>> 0) & 0xf;
1473 rd1
= (insn
>> 16) & 0xf;
1474 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1475 gen_op_iwmmxt_xorq_M0_wRn(rd1
);
1476 gen_op_iwmmxt_setpsr_nz();
1477 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1478 gen_op_iwmmxt_set_mup();
1479 gen_op_iwmmxt_set_cup();
1481 case 0x111: /* TMRC */
1484 rd
= (insn
>> 12) & 0xf;
1485 wrd
= (insn
>> 16) & 0xf;
1486 tmp
= iwmmxt_load_creg(wrd
);
1487 store_reg(s
, rd
, tmp
);
1489 case 0x300: /* WANDN */
1490 wrd
= (insn
>> 12) & 0xf;
1491 rd0
= (insn
>> 0) & 0xf;
1492 rd1
= (insn
>> 16) & 0xf;
1493 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1494 tcg_gen_neg_i64(cpu_M0
, cpu_M0
);
1495 gen_op_iwmmxt_andq_M0_wRn(rd1
);
1496 gen_op_iwmmxt_setpsr_nz();
1497 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1498 gen_op_iwmmxt_set_mup();
1499 gen_op_iwmmxt_set_cup();
1501 case 0x200: /* WAND */
1502 wrd
= (insn
>> 12) & 0xf;
1503 rd0
= (insn
>> 0) & 0xf;
1504 rd1
= (insn
>> 16) & 0xf;
1505 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1506 gen_op_iwmmxt_andq_M0_wRn(rd1
);
1507 gen_op_iwmmxt_setpsr_nz();
1508 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1509 gen_op_iwmmxt_set_mup();
1510 gen_op_iwmmxt_set_cup();
1512 case 0x810: case 0xa10: /* WMADD */
1513 wrd
= (insn
>> 12) & 0xf;
1514 rd0
= (insn
>> 0) & 0xf;
1515 rd1
= (insn
>> 16) & 0xf;
1516 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1517 if (insn
& (1 << 21))
1518 gen_op_iwmmxt_maddsq_M0_wRn(rd1
);
1520 gen_op_iwmmxt_madduq_M0_wRn(rd1
);
1521 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1522 gen_op_iwmmxt_set_mup();
1524 case 0x10e: case 0x50e: case 0x90e: case 0xd0e: /* WUNPCKIL */
1525 wrd
= (insn
>> 12) & 0xf;
1526 rd0
= (insn
>> 16) & 0xf;
1527 rd1
= (insn
>> 0) & 0xf;
1528 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1529 switch ((insn
>> 22) & 3) {
1531 gen_op_iwmmxt_unpacklb_M0_wRn(rd1
);
1534 gen_op_iwmmxt_unpacklw_M0_wRn(rd1
);
1537 gen_op_iwmmxt_unpackll_M0_wRn(rd1
);
1542 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1543 gen_op_iwmmxt_set_mup();
1544 gen_op_iwmmxt_set_cup();
1546 case 0x10c: case 0x50c: case 0x90c: case 0xd0c: /* WUNPCKIH */
1547 wrd
= (insn
>> 12) & 0xf;
1548 rd0
= (insn
>> 16) & 0xf;
1549 rd1
= (insn
>> 0) & 0xf;
1550 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1551 switch ((insn
>> 22) & 3) {
1553 gen_op_iwmmxt_unpackhb_M0_wRn(rd1
);
1556 gen_op_iwmmxt_unpackhw_M0_wRn(rd1
);
1559 gen_op_iwmmxt_unpackhl_M0_wRn(rd1
);
1564 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1565 gen_op_iwmmxt_set_mup();
1566 gen_op_iwmmxt_set_cup();
1568 case 0x012: case 0x112: case 0x412: case 0x512: /* WSAD */
1569 wrd
= (insn
>> 12) & 0xf;
1570 rd0
= (insn
>> 16) & 0xf;
1571 rd1
= (insn
>> 0) & 0xf;
1572 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1573 if (insn
& (1 << 22))
1574 gen_op_iwmmxt_sadw_M0_wRn(rd1
);
1576 gen_op_iwmmxt_sadb_M0_wRn(rd1
);
1577 if (!(insn
& (1 << 20)))
1578 gen_op_iwmmxt_addl_M0_wRn(wrd
);
1579 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1580 gen_op_iwmmxt_set_mup();
1582 case 0x010: case 0x110: case 0x210: case 0x310: /* WMUL */
1583 wrd
= (insn
>> 12) & 0xf;
1584 rd0
= (insn
>> 16) & 0xf;
1585 rd1
= (insn
>> 0) & 0xf;
1586 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1587 if (insn
& (1 << 21)) {
1588 if (insn
& (1 << 20))
1589 gen_op_iwmmxt_mulshw_M0_wRn(rd1
);
1591 gen_op_iwmmxt_mulslw_M0_wRn(rd1
);
1593 if (insn
& (1 << 20))
1594 gen_op_iwmmxt_muluhw_M0_wRn(rd1
);
1596 gen_op_iwmmxt_mululw_M0_wRn(rd1
);
1598 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1599 gen_op_iwmmxt_set_mup();
1601 case 0x410: case 0x510: case 0x610: case 0x710: /* WMAC */
1602 wrd
= (insn
>> 12) & 0xf;
1603 rd0
= (insn
>> 16) & 0xf;
1604 rd1
= (insn
>> 0) & 0xf;
1605 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1606 if (insn
& (1 << 21))
1607 gen_op_iwmmxt_macsw_M0_wRn(rd1
);
1609 gen_op_iwmmxt_macuw_M0_wRn(rd1
);
1610 if (!(insn
& (1 << 20))) {
1611 iwmmxt_load_reg(cpu_V1
, wrd
);
1612 tcg_gen_add_i64(cpu_M0
, cpu_M0
, cpu_V1
);
1614 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1615 gen_op_iwmmxt_set_mup();
1617 case 0x006: case 0x406: case 0x806: case 0xc06: /* WCMPEQ */
1618 wrd
= (insn
>> 12) & 0xf;
1619 rd0
= (insn
>> 16) & 0xf;
1620 rd1
= (insn
>> 0) & 0xf;
1621 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1622 switch ((insn
>> 22) & 3) {
1624 gen_op_iwmmxt_cmpeqb_M0_wRn(rd1
);
1627 gen_op_iwmmxt_cmpeqw_M0_wRn(rd1
);
1630 gen_op_iwmmxt_cmpeql_M0_wRn(rd1
);
1635 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1636 gen_op_iwmmxt_set_mup();
1637 gen_op_iwmmxt_set_cup();
1639 case 0x800: case 0x900: case 0xc00: case 0xd00: /* WAVG2 */
1640 wrd
= (insn
>> 12) & 0xf;
1641 rd0
= (insn
>> 16) & 0xf;
1642 rd1
= (insn
>> 0) & 0xf;
1643 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1644 if (insn
& (1 << 22)) {
1645 if (insn
& (1 << 20))
1646 gen_op_iwmmxt_avgw1_M0_wRn(rd1
);
1648 gen_op_iwmmxt_avgw0_M0_wRn(rd1
);
1650 if (insn
& (1 << 20))
1651 gen_op_iwmmxt_avgb1_M0_wRn(rd1
);
1653 gen_op_iwmmxt_avgb0_M0_wRn(rd1
);
1655 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1656 gen_op_iwmmxt_set_mup();
1657 gen_op_iwmmxt_set_cup();
1659 case 0x802: case 0x902: case 0xa02: case 0xb02: /* WALIGNR */
1660 wrd
= (insn
>> 12) & 0xf;
1661 rd0
= (insn
>> 16) & 0xf;
1662 rd1
= (insn
>> 0) & 0xf;
1663 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1664 tmp
= iwmmxt_load_creg(ARM_IWMMXT_wCGR0
+ ((insn
>> 20) & 3));
1665 tcg_gen_andi_i32(tmp
, tmp
, 7);
1666 iwmmxt_load_reg(cpu_V1
, rd1
);
1667 gen_helper_iwmmxt_align(cpu_M0
, cpu_M0
, cpu_V1
, tmp
);
1669 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1670 gen_op_iwmmxt_set_mup();
1672 case 0x601: case 0x605: case 0x609: case 0x60d: /* TINSR */
1673 if (((insn
>> 6) & 3) == 3)
1675 rd
= (insn
>> 12) & 0xf;
1676 wrd
= (insn
>> 16) & 0xf;
1677 tmp
= load_reg(s
, rd
);
1678 gen_op_iwmmxt_movq_M0_wRn(wrd
);
1679 switch ((insn
>> 6) & 3) {
1681 tmp2
= tcg_const_i32(0xff);
1682 tmp3
= tcg_const_i32((insn
& 7) << 3);
1685 tmp2
= tcg_const_i32(0xffff);
1686 tmp3
= tcg_const_i32((insn
& 3) << 4);
1689 tmp2
= tcg_const_i32(0xffffffff);
1690 tmp3
= tcg_const_i32((insn
& 1) << 5);
1696 gen_helper_iwmmxt_insr(cpu_M0
, cpu_M0
, tmp
, tmp2
, tmp3
);
1697 tcg_temp_free(tmp3
);
1698 tcg_temp_free(tmp2
);
1700 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1701 gen_op_iwmmxt_set_mup();
1703 case 0x107: case 0x507: case 0x907: case 0xd07: /* TEXTRM */
1704 rd
= (insn
>> 12) & 0xf;
1705 wrd
= (insn
>> 16) & 0xf;
1706 if (rd
== 15 || ((insn
>> 22) & 3) == 3)
1708 gen_op_iwmmxt_movq_M0_wRn(wrd
);
1710 switch ((insn
>> 22) & 3) {
1712 tcg_gen_shri_i64(cpu_M0
, cpu_M0
, (insn
& 7) << 3);
1713 tcg_gen_trunc_i64_i32(tmp
, cpu_M0
);
1715 tcg_gen_ext8s_i32(tmp
, tmp
);
1717 tcg_gen_andi_i32(tmp
, tmp
, 0xff);
1721 tcg_gen_shri_i64(cpu_M0
, cpu_M0
, (insn
& 3) << 4);
1722 tcg_gen_trunc_i64_i32(tmp
, cpu_M0
);
1724 tcg_gen_ext16s_i32(tmp
, tmp
);
1726 tcg_gen_andi_i32(tmp
, tmp
, 0xffff);
1730 tcg_gen_shri_i64(cpu_M0
, cpu_M0
, (insn
& 1) << 5);
1731 tcg_gen_trunc_i64_i32(tmp
, cpu_M0
);
1734 store_reg(s
, rd
, tmp
);
1736 case 0x117: case 0x517: case 0x917: case 0xd17: /* TEXTRC */
1737 if ((insn
& 0x000ff008) != 0x0003f000 || ((insn
>> 22) & 3) == 3)
1739 tmp
= iwmmxt_load_creg(ARM_IWMMXT_wCASF
);
1740 switch ((insn
>> 22) & 3) {
1742 tcg_gen_shri_i32(tmp
, tmp
, ((insn
& 7) << 2) + 0);
1745 tcg_gen_shri_i32(tmp
, tmp
, ((insn
& 3) << 3) + 4);
1748 tcg_gen_shri_i32(tmp
, tmp
, ((insn
& 1) << 4) + 12);
1751 tcg_gen_shli_i32(tmp
, tmp
, 28);
1755 case 0x401: case 0x405: case 0x409: case 0x40d: /* TBCST */
1756 if (((insn
>> 6) & 3) == 3)
1758 rd
= (insn
>> 12) & 0xf;
1759 wrd
= (insn
>> 16) & 0xf;
1760 tmp
= load_reg(s
, rd
);
1761 switch ((insn
>> 6) & 3) {
1763 gen_helper_iwmmxt_bcstb(cpu_M0
, tmp
);
1766 gen_helper_iwmmxt_bcstw(cpu_M0
, tmp
);
1769 gen_helper_iwmmxt_bcstl(cpu_M0
, tmp
);
1773 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1774 gen_op_iwmmxt_set_mup();
1776 case 0x113: case 0x513: case 0x913: case 0xd13: /* TANDC */
1777 if ((insn
& 0x000ff00f) != 0x0003f000 || ((insn
>> 22) & 3) == 3)
1779 tmp
= iwmmxt_load_creg(ARM_IWMMXT_wCASF
);
1781 tcg_gen_mov_i32(tmp2
, tmp
);
1782 switch ((insn
>> 22) & 3) {
1784 for (i
= 0; i
< 7; i
++) {
1785 tcg_gen_shli_i32(tmp2
, tmp2
, 4);
1786 tcg_gen_and_i32(tmp
, tmp
, tmp2
);
1790 for (i
= 0; i
< 3; i
++) {
1791 tcg_gen_shli_i32(tmp2
, tmp2
, 8);
1792 tcg_gen_and_i32(tmp
, tmp
, tmp2
);
1796 tcg_gen_shli_i32(tmp2
, tmp2
, 16);
1797 tcg_gen_and_i32(tmp
, tmp
, tmp2
);
1804 case 0x01c: case 0x41c: case 0x81c: case 0xc1c: /* WACC */
1805 wrd
= (insn
>> 12) & 0xf;
1806 rd0
= (insn
>> 16) & 0xf;
1807 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1808 switch ((insn
>> 22) & 3) {
1810 gen_helper_iwmmxt_addcb(cpu_M0
, cpu_M0
);
1813 gen_helper_iwmmxt_addcw(cpu_M0
, cpu_M0
);
1816 gen_helper_iwmmxt_addcl(cpu_M0
, cpu_M0
);
1821 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1822 gen_op_iwmmxt_set_mup();
1824 case 0x115: case 0x515: case 0x915: case 0xd15: /* TORC */
1825 if ((insn
& 0x000ff00f) != 0x0003f000 || ((insn
>> 22) & 3) == 3)
1827 tmp
= iwmmxt_load_creg(ARM_IWMMXT_wCASF
);
1829 tcg_gen_mov_i32(tmp2
, tmp
);
1830 switch ((insn
>> 22) & 3) {
1832 for (i
= 0; i
< 7; i
++) {
1833 tcg_gen_shli_i32(tmp2
, tmp2
, 4);
1834 tcg_gen_or_i32(tmp
, tmp
, tmp2
);
1838 for (i
= 0; i
< 3; i
++) {
1839 tcg_gen_shli_i32(tmp2
, tmp2
, 8);
1840 tcg_gen_or_i32(tmp
, tmp
, tmp2
);
1844 tcg_gen_shli_i32(tmp2
, tmp2
, 16);
1845 tcg_gen_or_i32(tmp
, tmp
, tmp2
);
1852 case 0x103: case 0x503: case 0x903: case 0xd03: /* TMOVMSK */
1853 rd
= (insn
>> 12) & 0xf;
1854 rd0
= (insn
>> 16) & 0xf;
1855 if ((insn
& 0xf) != 0 || ((insn
>> 22) & 3) == 3)
1857 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1859 switch ((insn
>> 22) & 3) {
1861 gen_helper_iwmmxt_msbb(tmp
, cpu_M0
);
1864 gen_helper_iwmmxt_msbw(tmp
, cpu_M0
);
1867 gen_helper_iwmmxt_msbl(tmp
, cpu_M0
);
1870 store_reg(s
, rd
, tmp
);
1872 case 0x106: case 0x306: case 0x506: case 0x706: /* WCMPGT */
1873 case 0x906: case 0xb06: case 0xd06: case 0xf06:
1874 wrd
= (insn
>> 12) & 0xf;
1875 rd0
= (insn
>> 16) & 0xf;
1876 rd1
= (insn
>> 0) & 0xf;
1877 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1878 switch ((insn
>> 22) & 3) {
1880 if (insn
& (1 << 21))
1881 gen_op_iwmmxt_cmpgtsb_M0_wRn(rd1
);
1883 gen_op_iwmmxt_cmpgtub_M0_wRn(rd1
);
1886 if (insn
& (1 << 21))
1887 gen_op_iwmmxt_cmpgtsw_M0_wRn(rd1
);
1889 gen_op_iwmmxt_cmpgtuw_M0_wRn(rd1
);
1892 if (insn
& (1 << 21))
1893 gen_op_iwmmxt_cmpgtsl_M0_wRn(rd1
);
1895 gen_op_iwmmxt_cmpgtul_M0_wRn(rd1
);
1900 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1901 gen_op_iwmmxt_set_mup();
1902 gen_op_iwmmxt_set_cup();
1904 case 0x00e: case 0x20e: case 0x40e: case 0x60e: /* WUNPCKEL */
1905 case 0x80e: case 0xa0e: case 0xc0e: case 0xe0e:
1906 wrd
= (insn
>> 12) & 0xf;
1907 rd0
= (insn
>> 16) & 0xf;
1908 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1909 switch ((insn
>> 22) & 3) {
1911 if (insn
& (1 << 21))
1912 gen_op_iwmmxt_unpacklsb_M0();
1914 gen_op_iwmmxt_unpacklub_M0();
1917 if (insn
& (1 << 21))
1918 gen_op_iwmmxt_unpacklsw_M0();
1920 gen_op_iwmmxt_unpackluw_M0();
1923 if (insn
& (1 << 21))
1924 gen_op_iwmmxt_unpacklsl_M0();
1926 gen_op_iwmmxt_unpacklul_M0();
1931 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1932 gen_op_iwmmxt_set_mup();
1933 gen_op_iwmmxt_set_cup();
1935 case 0x00c: case 0x20c: case 0x40c: case 0x60c: /* WUNPCKEH */
1936 case 0x80c: case 0xa0c: case 0xc0c: case 0xe0c:
1937 wrd
= (insn
>> 12) & 0xf;
1938 rd0
= (insn
>> 16) & 0xf;
1939 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1940 switch ((insn
>> 22) & 3) {
1942 if (insn
& (1 << 21))
1943 gen_op_iwmmxt_unpackhsb_M0();
1945 gen_op_iwmmxt_unpackhub_M0();
1948 if (insn
& (1 << 21))
1949 gen_op_iwmmxt_unpackhsw_M0();
1951 gen_op_iwmmxt_unpackhuw_M0();
1954 if (insn
& (1 << 21))
1955 gen_op_iwmmxt_unpackhsl_M0();
1957 gen_op_iwmmxt_unpackhul_M0();
1962 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1963 gen_op_iwmmxt_set_mup();
1964 gen_op_iwmmxt_set_cup();
1966 case 0x204: case 0x604: case 0xa04: case 0xe04: /* WSRL */
1967 case 0x214: case 0x614: case 0xa14: case 0xe14:
1968 if (((insn
>> 22) & 3) == 0)
1970 wrd
= (insn
>> 12) & 0xf;
1971 rd0
= (insn
>> 16) & 0xf;
1972 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1974 if (gen_iwmmxt_shift(insn
, 0xff, tmp
)) {
1978 switch ((insn
>> 22) & 3) {
1980 gen_helper_iwmmxt_srlw(cpu_M0
, cpu_env
, cpu_M0
, tmp
);
1983 gen_helper_iwmmxt_srll(cpu_M0
, cpu_env
, cpu_M0
, tmp
);
1986 gen_helper_iwmmxt_srlq(cpu_M0
, cpu_env
, cpu_M0
, tmp
);
1990 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1991 gen_op_iwmmxt_set_mup();
1992 gen_op_iwmmxt_set_cup();
1994 case 0x004: case 0x404: case 0x804: case 0xc04: /* WSRA */
1995 case 0x014: case 0x414: case 0x814: case 0xc14:
1996 if (((insn
>> 22) & 3) == 0)
1998 wrd
= (insn
>> 12) & 0xf;
1999 rd0
= (insn
>> 16) & 0xf;
2000 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2002 if (gen_iwmmxt_shift(insn
, 0xff, tmp
)) {
2006 switch ((insn
>> 22) & 3) {
2008 gen_helper_iwmmxt_sraw(cpu_M0
, cpu_env
, cpu_M0
, tmp
);
2011 gen_helper_iwmmxt_sral(cpu_M0
, cpu_env
, cpu_M0
, tmp
);
2014 gen_helper_iwmmxt_sraq(cpu_M0
, cpu_env
, cpu_M0
, tmp
);
2018 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2019 gen_op_iwmmxt_set_mup();
2020 gen_op_iwmmxt_set_cup();
2022 case 0x104: case 0x504: case 0x904: case 0xd04: /* WSLL */
2023 case 0x114: case 0x514: case 0x914: case 0xd14:
2024 if (((insn
>> 22) & 3) == 0)
2026 wrd
= (insn
>> 12) & 0xf;
2027 rd0
= (insn
>> 16) & 0xf;
2028 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2030 if (gen_iwmmxt_shift(insn
, 0xff, tmp
)) {
2034 switch ((insn
>> 22) & 3) {
2036 gen_helper_iwmmxt_sllw(cpu_M0
, cpu_env
, cpu_M0
, tmp
);
2039 gen_helper_iwmmxt_slll(cpu_M0
, cpu_env
, cpu_M0
, tmp
);
2042 gen_helper_iwmmxt_sllq(cpu_M0
, cpu_env
, cpu_M0
, tmp
);
2046 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2047 gen_op_iwmmxt_set_mup();
2048 gen_op_iwmmxt_set_cup();
2050 case 0x304: case 0x704: case 0xb04: case 0xf04: /* WROR */
2051 case 0x314: case 0x714: case 0xb14: case 0xf14:
2052 if (((insn
>> 22) & 3) == 0)
2054 wrd
= (insn
>> 12) & 0xf;
2055 rd0
= (insn
>> 16) & 0xf;
2056 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2058 switch ((insn
>> 22) & 3) {
2060 if (gen_iwmmxt_shift(insn
, 0xf, tmp
)) {
2064 gen_helper_iwmmxt_rorw(cpu_M0
, cpu_env
, cpu_M0
, tmp
);
2067 if (gen_iwmmxt_shift(insn
, 0x1f, tmp
)) {
2071 gen_helper_iwmmxt_rorl(cpu_M0
, cpu_env
, cpu_M0
, tmp
);
2074 if (gen_iwmmxt_shift(insn
, 0x3f, tmp
)) {
2078 gen_helper_iwmmxt_rorq(cpu_M0
, cpu_env
, cpu_M0
, tmp
);
2082 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2083 gen_op_iwmmxt_set_mup();
2084 gen_op_iwmmxt_set_cup();
2086 case 0x116: case 0x316: case 0x516: case 0x716: /* WMIN */
2087 case 0x916: case 0xb16: case 0xd16: case 0xf16:
2088 wrd
= (insn
>> 12) & 0xf;
2089 rd0
= (insn
>> 16) & 0xf;
2090 rd1
= (insn
>> 0) & 0xf;
2091 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2092 switch ((insn
>> 22) & 3) {
2094 if (insn
& (1 << 21))
2095 gen_op_iwmmxt_minsb_M0_wRn(rd1
);
2097 gen_op_iwmmxt_minub_M0_wRn(rd1
);
2100 if (insn
& (1 << 21))
2101 gen_op_iwmmxt_minsw_M0_wRn(rd1
);
2103 gen_op_iwmmxt_minuw_M0_wRn(rd1
);
2106 if (insn
& (1 << 21))
2107 gen_op_iwmmxt_minsl_M0_wRn(rd1
);
2109 gen_op_iwmmxt_minul_M0_wRn(rd1
);
2114 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2115 gen_op_iwmmxt_set_mup();
2117 case 0x016: case 0x216: case 0x416: case 0x616: /* WMAX */
2118 case 0x816: case 0xa16: case 0xc16: case 0xe16:
2119 wrd
= (insn
>> 12) & 0xf;
2120 rd0
= (insn
>> 16) & 0xf;
2121 rd1
= (insn
>> 0) & 0xf;
2122 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2123 switch ((insn
>> 22) & 3) {
2125 if (insn
& (1 << 21))
2126 gen_op_iwmmxt_maxsb_M0_wRn(rd1
);
2128 gen_op_iwmmxt_maxub_M0_wRn(rd1
);
2131 if (insn
& (1 << 21))
2132 gen_op_iwmmxt_maxsw_M0_wRn(rd1
);
2134 gen_op_iwmmxt_maxuw_M0_wRn(rd1
);
2137 if (insn
& (1 << 21))
2138 gen_op_iwmmxt_maxsl_M0_wRn(rd1
);
2140 gen_op_iwmmxt_maxul_M0_wRn(rd1
);
2145 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2146 gen_op_iwmmxt_set_mup();
2148 case 0x002: case 0x102: case 0x202: case 0x302: /* WALIGNI */
2149 case 0x402: case 0x502: case 0x602: case 0x702:
2150 wrd
= (insn
>> 12) & 0xf;
2151 rd0
= (insn
>> 16) & 0xf;
2152 rd1
= (insn
>> 0) & 0xf;
2153 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2154 tmp
= tcg_const_i32((insn
>> 20) & 3);
2155 iwmmxt_load_reg(cpu_V1
, rd1
);
2156 gen_helper_iwmmxt_align(cpu_M0
, cpu_M0
, cpu_V1
, tmp
);
2158 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2159 gen_op_iwmmxt_set_mup();
2161 case 0x01a: case 0x11a: case 0x21a: case 0x31a: /* WSUB */
2162 case 0x41a: case 0x51a: case 0x61a: case 0x71a:
2163 case 0x81a: case 0x91a: case 0xa1a: case 0xb1a:
2164 case 0xc1a: case 0xd1a: case 0xe1a: case 0xf1a:
2165 wrd
= (insn
>> 12) & 0xf;
2166 rd0
= (insn
>> 16) & 0xf;
2167 rd1
= (insn
>> 0) & 0xf;
2168 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2169 switch ((insn
>> 20) & 0xf) {
2171 gen_op_iwmmxt_subnb_M0_wRn(rd1
);
2174 gen_op_iwmmxt_subub_M0_wRn(rd1
);
2177 gen_op_iwmmxt_subsb_M0_wRn(rd1
);
2180 gen_op_iwmmxt_subnw_M0_wRn(rd1
);
2183 gen_op_iwmmxt_subuw_M0_wRn(rd1
);
2186 gen_op_iwmmxt_subsw_M0_wRn(rd1
);
2189 gen_op_iwmmxt_subnl_M0_wRn(rd1
);
2192 gen_op_iwmmxt_subul_M0_wRn(rd1
);
2195 gen_op_iwmmxt_subsl_M0_wRn(rd1
);
2200 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2201 gen_op_iwmmxt_set_mup();
2202 gen_op_iwmmxt_set_cup();
2204 case 0x01e: case 0x11e: case 0x21e: case 0x31e: /* WSHUFH */
2205 case 0x41e: case 0x51e: case 0x61e: case 0x71e:
2206 case 0x81e: case 0x91e: case 0xa1e: case 0xb1e:
2207 case 0xc1e: case 0xd1e: case 0xe1e: case 0xf1e:
2208 wrd
= (insn
>> 12) & 0xf;
2209 rd0
= (insn
>> 16) & 0xf;
2210 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2211 tmp
= tcg_const_i32(((insn
>> 16) & 0xf0) | (insn
& 0x0f));
2212 gen_helper_iwmmxt_shufh(cpu_M0
, cpu_env
, cpu_M0
, tmp
);
2214 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2215 gen_op_iwmmxt_set_mup();
2216 gen_op_iwmmxt_set_cup();
2218 case 0x018: case 0x118: case 0x218: case 0x318: /* WADD */
2219 case 0x418: case 0x518: case 0x618: case 0x718:
2220 case 0x818: case 0x918: case 0xa18: case 0xb18:
2221 case 0xc18: case 0xd18: case 0xe18: case 0xf18:
2222 wrd
= (insn
>> 12) & 0xf;
2223 rd0
= (insn
>> 16) & 0xf;
2224 rd1
= (insn
>> 0) & 0xf;
2225 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2226 switch ((insn
>> 20) & 0xf) {
2228 gen_op_iwmmxt_addnb_M0_wRn(rd1
);
2231 gen_op_iwmmxt_addub_M0_wRn(rd1
);
2234 gen_op_iwmmxt_addsb_M0_wRn(rd1
);
2237 gen_op_iwmmxt_addnw_M0_wRn(rd1
);
2240 gen_op_iwmmxt_adduw_M0_wRn(rd1
);
2243 gen_op_iwmmxt_addsw_M0_wRn(rd1
);
2246 gen_op_iwmmxt_addnl_M0_wRn(rd1
);
2249 gen_op_iwmmxt_addul_M0_wRn(rd1
);
2252 gen_op_iwmmxt_addsl_M0_wRn(rd1
);
2257 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2258 gen_op_iwmmxt_set_mup();
2259 gen_op_iwmmxt_set_cup();
2261 case 0x008: case 0x108: case 0x208: case 0x308: /* WPACK */
2262 case 0x408: case 0x508: case 0x608: case 0x708:
2263 case 0x808: case 0x908: case 0xa08: case 0xb08:
2264 case 0xc08: case 0xd08: case 0xe08: case 0xf08:
2265 if (!(insn
& (1 << 20)) || ((insn
>> 22) & 3) == 0)
2267 wrd
= (insn
>> 12) & 0xf;
2268 rd0
= (insn
>> 16) & 0xf;
2269 rd1
= (insn
>> 0) & 0xf;
2270 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2271 switch ((insn
>> 22) & 3) {
2273 if (insn
& (1 << 21))
2274 gen_op_iwmmxt_packsw_M0_wRn(rd1
);
2276 gen_op_iwmmxt_packuw_M0_wRn(rd1
);
2279 if (insn
& (1 << 21))
2280 gen_op_iwmmxt_packsl_M0_wRn(rd1
);
2282 gen_op_iwmmxt_packul_M0_wRn(rd1
);
2285 if (insn
& (1 << 21))
2286 gen_op_iwmmxt_packsq_M0_wRn(rd1
);
2288 gen_op_iwmmxt_packuq_M0_wRn(rd1
);
2291 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2292 gen_op_iwmmxt_set_mup();
2293 gen_op_iwmmxt_set_cup();
2295 case 0x201: case 0x203: case 0x205: case 0x207:
2296 case 0x209: case 0x20b: case 0x20d: case 0x20f:
2297 case 0x211: case 0x213: case 0x215: case 0x217:
2298 case 0x219: case 0x21b: case 0x21d: case 0x21f:
2299 wrd
= (insn
>> 5) & 0xf;
2300 rd0
= (insn
>> 12) & 0xf;
2301 rd1
= (insn
>> 0) & 0xf;
2302 if (rd0
== 0xf || rd1
== 0xf)
2304 gen_op_iwmmxt_movq_M0_wRn(wrd
);
2305 tmp
= load_reg(s
, rd0
);
2306 tmp2
= load_reg(s
, rd1
);
2307 switch ((insn
>> 16) & 0xf) {
2308 case 0x0: /* TMIA */
2309 gen_helper_iwmmxt_muladdsl(cpu_M0
, cpu_M0
, tmp
, tmp2
);
2311 case 0x8: /* TMIAPH */
2312 gen_helper_iwmmxt_muladdsw(cpu_M0
, cpu_M0
, tmp
, tmp2
);
2314 case 0xc: case 0xd: case 0xe: case 0xf: /* TMIAxy */
2315 if (insn
& (1 << 16))
2316 tcg_gen_shri_i32(tmp
, tmp
, 16);
2317 if (insn
& (1 << 17))
2318 tcg_gen_shri_i32(tmp2
, tmp2
, 16);
2319 gen_helper_iwmmxt_muladdswl(cpu_M0
, cpu_M0
, tmp
, tmp2
);
2328 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2329 gen_op_iwmmxt_set_mup();
2338 /* Disassemble an XScale DSP instruction. Returns nonzero if an error occurred
2339 (i.e. an undefined instruction). */
/* Two encoding classes are recognised below, each by a mask/value test on
   insn: the multiply-with-internal-accumulate format and the internal
   accumulator access format.
   NOTE(review): this listing omits several original lines (declarations of
   tmp/tmp2, the rd1 assignment, some case labels, else/return statements),
   so the exact control flow must be confirmed against the full file. */
2340 static int disas_dsp_insn(CPUState
*env
, DisasContext
*s
, uint32_t insn
)
2342 int acc
, rd0
, rd1
, rdhi
, rdlo
;
2345 if ((insn
& 0x0ff00f10) == 0x0e200010) {
2346 /* Multiply with Internal Accumulate Format */
/* rd0 is taken from bits [15:12] and the accumulator index from
   bits [7:5] of the instruction word. */
2347 rd0
= (insn
>> 12) & 0xf;
2349 acc
= (insn
>> 5) & 7;
2354 tmp
= load_reg(s
, rd0
);
2355 tmp2
= load_reg(s
, rd1
);
/* Bits [19:16] select the multiply variant.  Every variant calls a helper
   with cpu_M0 as both the first and second argument, followed by the two
   loaded register values. */
2356 switch ((insn
>> 16) & 0xf) {
2358 gen_helper_iwmmxt_muladdsl(cpu_M0
, cpu_M0
, tmp
, tmp2
);
2360 case 0x8: /* MIAPH */
2361 gen_helper_iwmmxt_muladdsw(cpu_M0
, cpu_M0
, tmp
, tmp2
);
2363 case 0xc: /* MIABB */
2364 case 0xd: /* MIABT */
2365 case 0xe: /* MIATB */
2366 case 0xf: /* MIATT */
/* Bit 16 shifts the first operand and bit 17 the second operand right by
   16, so the helper finds that operand's upper halfword in its low bits. */
2367 if (insn
& (1 << 16))
2368 tcg_gen_shri_i32(tmp
, tmp
, 16);
2369 if (insn
& (1 << 17))
2370 tcg_gen_shri_i32(tmp2
, tmp2
, 16);
2371 gen_helper_iwmmxt_muladdswl(cpu_M0
, cpu_M0
, tmp
, tmp2
);
/* Hand cpu_M0 to the register selected by acc. */
2379 gen_op_iwmmxt_movq_wRn_M0(acc
);
2383 if ((insn
& 0x0fe00ff8) == 0x0c400000) {
2384 /* Internal Accumulator Access Format */
/* rdhi is bits [19:16], rdlo is bits [15:12]. */
2385 rdhi
= (insn
>> 16) & 0xf;
2386 rdlo
= (insn
>> 12) & 0xf;
2392 if (insn
& ARM_CP_RW_BIT
) { /* MRA */
/* Read direction: the low 32 bits of the accumulator value go to rdlo,
   the value shifted right by 32 goes to rdhi. */
2393 iwmmxt_load_reg(cpu_V0
, acc
);
2394 tcg_gen_trunc_i64_i32(cpu_R
[rdlo
], cpu_V0
);
2395 tcg_gen_shri_i64(cpu_V0
, cpu_V0
, 32);
2396 tcg_gen_trunc_i64_i32(cpu_R
[rdhi
], cpu_V0
);
/* (1 << (40 - 32)) - 1 == 0xff: only bits [39:32] of the accumulator are
   kept in rdhi. */
2397 tcg_gen_andi_i32(cpu_R
[rdhi
], cpu_R
[rdhi
], (1 << (40 - 32)) - 1);
/* NOTE(review): the branch separating the two directions is not visible in
   this listing; the next two calls presumably form the opposite
   (register-to-accumulator) path: rdlo and rdhi are combined into cpu_V0,
   which is then stored to acc. */
2399 tcg_gen_concat_i32_i64(cpu_V0
, cpu_R
[rdlo
], cpu_R
[rdhi
]);
2400 iwmmxt_store_reg(cpu_V0
, acc
);
2408 /* Disassemble system coprocessor instruction. Return nonzero if
2409 instruction is not defined. */
/* The access is forwarded to a per-coprocessor helper; the raw instruction
   word is passed to that helper as a constant operand.
   NOTE(review): the declarations of tmp/tmp2, the else keyword and the
   return statements are not present in this listing. */
2410 static int disas_cp_insn(CPUState
*env
, DisasContext
*s
, uint32_t insn
)
/* rd is bits [15:12]; cp (index into env->cp[]) is bits [11:8]. */
2413 uint32_t rd
= (insn
>> 12) & 0xf;
2414 uint32_t cp
= (insn
>> 8) & 0xf;
2419 if (insn
& ARM_CP_RW_BIT
) {
/* Read direction: env->cp[cp].cp_read is checked for being set before any
   code is generated. */
2420 if (!env
->cp
[cp
].cp_read
)
/* Set the PC to s->pc before calling the helper. */
2422 gen_set_pc_im(s
->pc
);
2424 tmp2
= tcg_const_i32(insn
);
2425 gen_helper_get_cp(tmp
, cpu_env
, tmp2
);
2426 tcg_temp_free(tmp2
);
2427 store_reg(s
, rd
, tmp
);
/* Write direction: same sequence, guarded by env->cp[cp].cp_write, with the
   value of rd handed to the set helper. */
2429 if (!env
->cp
[cp
].cp_write
)
2431 gen_set_pc_im(s
->pc
);
2432 tmp
= load_reg(s
, rd
);
2433 tmp2
= tcg_const_i32(insn
);
2434 gen_helper_set_cp(cpu_env
, tmp2
, tmp
);
2435 tcg_temp_free(tmp2
);
/* Classify a cp15 access by its encoding fields.  disas_cp15_insn calls
   this as "IS_USER(s) && !cp15_user_ok(insn)", i.e. the result decides
   whether a user-mode access is acceptable.
   NOTE(review): the return statements and at least one enclosing condition
   are missing from this listing; presumably each matching test returns
   nonzero and everything else returns zero -- confirm against the full
   file. */
2441 static int cp15_user_ok(uint32_t insn
)
/* cpn is bits [19:16] and cpm is bits [3:0]. */
2443 int cpn
= (insn
>> 16) & 0xf;
2444 int cpm
= insn
& 0xf;
/* op packs bits [7:5] into its low three bits and bits [23:21] into its
   bits [5:3]. */
2445 int op
= ((insn
>> 5) & 7) | ((insn
>> 18) & 0x38);
2447 if (cpn
== 13 && cpm
== 0) {
/* For cpn 13 / cpm 0: op 2 matches in either direction, op 3 only when
   ARM_CP_RW_BIT is set. */
2449 if (op
== 2 || (op
== 3 && (insn
& ARM_CP_RW_BIT
)))
2453 /* ISB, DSB, DMB. */
2454 if ((cpm
== 5 && op
== 4)
2455 || (cpm
== 10 && (op
== 4 || op
== 5)))
/* Handle cp15 accesses that target the cp15.c13_tls1 / c13_tls2 / c13_tls3
   CPU fields.  Only considered when the CPU has ARM_FEATURE_V6K and the
   encoding has cpn == 13 and cpm == 0.  The caller (disas_cp15_insn) tests
   the result as a boolean.
   NOTE(review): the statements that pick one of the three fields
   (presumably a switch on op) and all return statements are missing from
   this listing. */
2461 static int cp15_tls_load_store(CPUState
*env
, DisasContext
*s
, uint32_t insn
, uint32_t rd
)
/* Same field layout as in cp15_user_ok: cpn = bits [19:16],
   cpm = bits [3:0], op = bits [7:5] combined with bits [23:21]. */
2464 int cpn
= (insn
>> 16) & 0xf;
2465 int cpm
= insn
& 0xf;
2466 int op
= ((insn
>> 5) & 7) | ((insn
>> 18) & 0x38);
2468 if (!arm_feature(env
, ARM_FEATURE_V6K
))
2471 if (!(cpn
== 13 && cpm
== 0))
2474 if (insn
& ARM_CP_RW_BIT
) {
/* Read direction: one of the three fields is loaded into tmp and then
   written to register rd. */
2477 tmp
= load_cpu_field(cp15
.c13_tls1
);
2480 tmp
= load_cpu_field(cp15
.c13_tls2
);
2483 tmp
= load_cpu_field(cp15
.c13_tls3
);
2488 store_reg(s
, rd
, tmp
);
/* Write direction: register rd is loaded into tmp and stored to one of the
   three fields. */
2491 tmp
= load_reg(s
, rd
);
2494 store_cpu_field(tmp
, cp15
.c13_tls1
);
2497 store_cpu_field(tmp
, cp15
.c13_tls2
);
2500 store_cpu_field(tmp
, cp15
.c13_tls3
);
2510 /* Disassemble system coprocessor (cp15) instruction. Return nonzero if
2511 instruction is not defined. */
/* NOTE(review): declarations, return statements, else keywords and closing
   braces are missing from this listing; the comments added below describe
   only the statements that are visible. */
2512 static int disas_cp15_insn(CPUState
*env
, DisasContext
*s
, uint32_t insn
)
2517 /* M profile cores use memory mapped registers instead of cp15. */
2518 if (arm_feature(env
, ARM_FEATURE_M
))
/* Encodings with bit 25 clear are handled separately, split further on
   bit 20. */
2521 if ((insn
& (1 << 25)) == 0) {
2522 if (insn
& (1 << 20)) {
2526 /* mcrr. Used for block cache operations, so implement as no-op. */
2529 if ((insn
& (1 << 4)) == 0) {
/* In user mode only encodings accepted by cp15_user_ok() pass this test. */
2533 if (IS_USER(s
) && !cp15_user_ok(insn
)) {
/* Two fixed encodings (compared after masking with 0x0fff0fff) are treated
   as wait-for-interrupt: the PC is set to s->pc and the translation state
   is marked DISAS_WFI. */
2536 if ((insn
& 0x0fff0fff) == 0x0e070f90
2537 || (insn
& 0x0fff0fff) == 0x0e070f58) {
2538 /* Wait for interrupt. */
2539 gen_set_pc_im(s
->pc
);
2540 s
->is_jmp
= DISAS_WFI
;
/* rd is bits [15:12]. */
2543 rd
= (insn
>> 12) & 0xf;
/* cp15_tls_load_store() gets the first chance to handle the access. */
2545 if (cp15_tls_load_store(env
, s
, insn
, rd
))
/* The raw instruction word is passed to the cp15 helpers as a constant. */
2548 tmp2
= tcg_const_i32(insn
);
2549 if (insn
& ARM_CP_RW_BIT
) {
2551 gen_helper_get_cp15(tmp
, cpu_env
, tmp2
);
2552 /* If the destination register is r15 then sets condition codes. */
2554 store_reg(s
, rd
, tmp
);
2558 tmp
= load_reg(s
, rd
);
2559 gen_helper_set_cp15(cpu_env
, tmp2
, tmp
);
2561 /* Normally we would always end the TB here, but Linux
2562 * arch/arm/mach-pxa/sleep.S expects two instructions following
2563 * an MMU enable to execute from cache. Imitate this behaviour. */
2564 if (!arm_feature(env
, ARM_FEATURE_XSCALE
) ||
2565 (insn
& 0x0fff0fff) != 0x0e010f10)
2568 tcg_temp_free_i32(tmp2
);
/* Helpers for extracting VFP register numbers from an instruction word.
   VFP_REG_SHR(x, n) shifts x right by n when n is positive and left by -n
   otherwise; this lets VFP_SREG be used with bigbit == 0 (see VFP_SREG_M),
   where "bigbit - 1" is negative. */
2572 #define VFP_REG_SHR(x, n) (((n) > 0) ? (x) >> (n) : (x) << -(n))
/* VFP_SREG builds a 5-bit number: the four instruction bits starting at
   bigbit become bits [4:1] and the single bit at smallbit becomes bit 0. */
2573 #define VFP_SREG(insn, bigbit, smallbit) \
2574 ((VFP_REG_SHR(insn, bigbit - 1) & 0x1e) | (((insn) >> (smallbit)) & 1))
/* VFP_DREG assigns to reg.  With ARM_FEATURE_VFP3 the four bits at bigbit
   form bits [3:0] and the bit at smallbit becomes bit 4; otherwise only the
   four bits at bigbit are used.  The expansion refers to a variable named
   env from the surrounding scope.  The _D, _N and _M wrappers that follow
   fix the bit positions to (12, 22), (16, 7) and (0, 5) respectively.
   NOTE(review): some lines of this macro (the else branch, the action taken
   when the smallbit test fires without VFP3, and the closing "while (0)")
   are missing from this listing.  Also note that the test
   "insn & (1 << (smallbit))" uses insn without parentheses, unlike the
   other uses in this macro. */
2575 #define VFP_DREG(reg, insn, bigbit, smallbit) do { \
2576 if (arm_feature(env, ARM_FEATURE_VFP3)) { \
2577 reg = (((insn) >> (bigbit)) & 0x0f) \
2578 | (((insn) >> ((smallbit) - 4)) & 0x10); \
2580 if (insn & (1 << (smallbit))) \
2582 reg = ((insn) >> (bigbit)) & 0x0f; \
2585 #define VFP_SREG_D(insn) VFP_SREG(insn, 12, 22)
2586 #define VFP_DREG_D(reg, insn) VFP_DREG(reg, insn, 12, 22)
2587 #define VFP_SREG_N(insn) VFP_SREG(insn, 16, 7)
2588 #define VFP_DREG_N(reg, insn) VFP_DREG(reg, insn, 16, 7)
2589 #define VFP_SREG_M(insn) VFP_SREG(insn, 0, 5)
2590 #define VFP_DREG_M(reg, insn) VFP_DREG(reg, insn, 0, 5)
2592 /* Move between integer and VFP cores. */
/* gen_vfp_mrs: obtain a temporary from new_tmp() and emit a 32-bit move of
   cpu_F0s into it.  Callers assign the result (e.g. "tmp = gen_vfp_mrs();").
   NOTE(review): the return statement is not present in this listing;
   presumably the new temporary is returned. */
2593 static TCGv
gen_vfp_mrs(void)
2595 TCGv tmp
= new_tmp();
2596 tcg_gen_mov_i32(tmp
, cpu_F0s
);
/* Emit a 32-bit move of tmp into cpu_F0s (the opposite direction of
   gen_vfp_mrs).
   NOTE(review): whether tmp is released afterwards is not visible in this
   listing. */
2600 static void gen_vfp_msr(TCGv tmp
)
2602 tcg_gen_mov_i32(cpu_F0s
, tmp
);
/* Return nonzero when bit 30 of env->vfp.xregs[ARM_VFP_FPEXC] is set, zero
   otherwise.  The FPEXC write path in disas_vfp_insn masks with the same
   "1 << 30" and calls it the EN bit.
   NOTE(review): the line carrying the storage class and return type is not
   present in this listing. */
2607 vfp_enabled(CPUState
* env
)
2609 return ((env
->vfp
.xregs
[ARM_VFP_FPEXC
] & (1 << 30)) != 0);
/* Replicate one byte of var into all four byte lanes of var, in place.
   var is shifted right by shift and zero-extended from 8 bits, then OR-ed
   with itself shifted left by 8 and again by 16.
   NOTE(review): lines are missing from this listing around the first shift
   and after the last OR (any guard on shift and the release of tmp are not
   visible). */
2612 static void gen_neon_dup_u8(TCGv var
, int shift
)
2614 TCGv tmp
= new_tmp();
2616 tcg_gen_shri_i32(var
, var
, shift
);
2617 tcg_gen_ext8u_i32(var
, var
);
/* After this pair the low 16 bits hold the byte twice. */
2618 tcg_gen_shli_i32(tmp
, var
, 8);
2619 tcg_gen_or_i32(var
, var
, tmp
);
/* After this pair all 32 bits hold the byte four times. */
2620 tcg_gen_shli_i32(tmp
, var
, 16);
2621 tcg_gen_or_i32(var
, var
, tmp
);
/* Copy the low halfword of var into both halves of var, in place: var is
   zero-extended from 16 bits and OR-ed with itself shifted left by 16.
   NOTE(review): the release of tmp is not visible in this listing. */
2625 static void gen_neon_dup_low16(TCGv var
)
2627 TCGv tmp
= new_tmp();
2628 tcg_gen_ext16u_i32(var
, var
);
2629 tcg_gen_shli_i32(tmp
, var
, 16);
2630 tcg_gen_or_i32(var
, var
, tmp
);
/* Copy the high halfword of var into both halves of var, in place: the low
   16 bits are cleared with the 0xffff0000 mask and the result is OR-ed with
   itself shifted right by 16.
   NOTE(review): the release of tmp is not visible in this listing. */
2634 static void gen_neon_dup_high16(TCGv var
)
2636 TCGv tmp
= new_tmp();
2637 tcg_gen_andi_i32(var
, var
, 0xffff0000);
2638 tcg_gen_shri_i32(tmp
, var
, 16);
2639 tcg_gen_or_i32(var
, var
, tmp
);
2643 /* Disassemble a VFP instruction. Returns nonzero if an error occurred
2644 (ie. an undefined instruction). */
2645 static int disas_vfp_insn(CPUState
* env
, DisasContext
*s
, uint32_t insn
)
2647 uint32_t rd
, rn
, rm
, op
, i
, n
, offset
, delta_d
, delta_m
, bank_mask
;
2653 if (!arm_feature(env
, ARM_FEATURE_VFP
))
2656 if (!vfp_enabled(env
)) {
2657 /* VFP disabled. Only allow fmxr/fmrx to/from some control regs. */
2658 if ((insn
& 0x0fe00fff) != 0x0ee00a10)
2660 rn
= (insn
>> 16) & 0xf;
2661 if (rn
!= ARM_VFP_FPSID
&& rn
!= ARM_VFP_FPEXC
2662 && rn
!= ARM_VFP_MVFR1
&& rn
!= ARM_VFP_MVFR0
)
2665 dp
= ((insn
& 0xf00) == 0xb00);
2666 switch ((insn
>> 24) & 0xf) {
2668 if (insn
& (1 << 4)) {
2669 /* single register transfer */
2670 rd
= (insn
>> 12) & 0xf;
2675 VFP_DREG_N(rn
, insn
);
2678 if (insn
& 0x00c00060
2679 && !arm_feature(env
, ARM_FEATURE_NEON
))
2682 pass
= (insn
>> 21) & 1;
2683 if (insn
& (1 << 22)) {
2685 offset
= ((insn
>> 5) & 3) * 8;
2686 } else if (insn
& (1 << 5)) {
2688 offset
= (insn
& (1 << 6)) ? 16 : 0;
2693 if (insn
& ARM_CP_RW_BIT
) {
2695 tmp
= neon_load_reg(rn
, pass
);
2699 tcg_gen_shri_i32(tmp
, tmp
, offset
);
2700 if (insn
& (1 << 23))
2706 if (insn
& (1 << 23)) {
2708 tcg_gen_shri_i32(tmp
, tmp
, 16);
2714 tcg_gen_sari_i32(tmp
, tmp
, 16);
2723 store_reg(s
, rd
, tmp
);
2726 tmp
= load_reg(s
, rd
);
2727 if (insn
& (1 << 23)) {
2730 gen_neon_dup_u8(tmp
, 0);
2731 } else if (size
== 1) {
2732 gen_neon_dup_low16(tmp
);
2734 for (n
= 0; n
<= pass
* 2; n
++) {
2736 tcg_gen_mov_i32(tmp2
, tmp
);
2737 neon_store_reg(rn
, n
, tmp2
);
2739 neon_store_reg(rn
, n
, tmp
);
2744 tmp2
= neon_load_reg(rn
, pass
);
2745 gen_bfi(tmp
, tmp2
, tmp
, offset
, 0xff);
2749 tmp2
= neon_load_reg(rn
, pass
);
2750 gen_bfi(tmp
, tmp2
, tmp
, offset
, 0xffff);
2756 neon_store_reg(rn
, pass
, tmp
);
2760 if ((insn
& 0x6f) != 0x00)
2762 rn
= VFP_SREG_N(insn
);
2763 if (insn
& ARM_CP_RW_BIT
) {
2765 if (insn
& (1 << 21)) {
2766 /* system register */
2771 /* VFP2 allows access to FPSID from userspace.
2772 VFP3 restricts all id registers to privileged
2775 && arm_feature(env
, ARM_FEATURE_VFP3
))
2777 tmp
= load_cpu_field(vfp
.xregs
[rn
]);
2782 tmp
= load_cpu_field(vfp
.xregs
[rn
]);
2784 case ARM_VFP_FPINST
:
2785 case ARM_VFP_FPINST2
:
2786 /* Not present in VFP3. */
2788 || arm_feature(env
, ARM_FEATURE_VFP3
))
2790 tmp
= load_cpu_field(vfp
.xregs
[rn
]);
2794 tmp
= load_cpu_field(vfp
.xregs
[ARM_VFP_FPSCR
]);
2795 tcg_gen_andi_i32(tmp
, tmp
, 0xf0000000);
2798 gen_helper_vfp_get_fpscr(tmp
, cpu_env
);
2804 || !arm_feature(env
, ARM_FEATURE_VFP3
))
2806 tmp
= load_cpu_field(vfp
.xregs
[rn
]);
2812 gen_mov_F0_vreg(0, rn
);
2813 tmp
= gen_vfp_mrs();
2816 /* Set the 4 flag bits in the CPSR. */
2820 store_reg(s
, rd
, tmp
);
2824 tmp
= load_reg(s
, rd
);
2825 if (insn
& (1 << 21)) {
2827 /* system register */
2832 /* Writes are ignored. */
2835 gen_helper_vfp_set_fpscr(cpu_env
, tmp
);
2842 /* TODO: VFP subarchitecture support.
2843 * For now, keep the EN bit only */
2844 tcg_gen_andi_i32(tmp
, tmp
, 1 << 30);
2845 store_cpu_field(tmp
, vfp
.xregs
[rn
]);
2848 case ARM_VFP_FPINST
:
2849 case ARM_VFP_FPINST2
:
2850 store_cpu_field(tmp
, vfp
.xregs
[rn
]);
2857 gen_mov_vreg_F0(0, rn
);
2862 /* data processing */
2863 /* The opcode is in bits 23, 21, 20 and 6. */
2864 op
= ((insn
>> 20) & 8) | ((insn
>> 19) & 6) | ((insn
>> 6) & 1);
2868 rn
= ((insn
>> 15) & 0x1e) | ((insn
>> 7) & 1);
2870 /* rn is register number */
2871 VFP_DREG_N(rn
, insn
);
2874 if (op
== 15 && (rn
== 15 || ((rn
& 0x1c) == 0x18))) {
2875 /* Integer or single precision destination. */
2876 rd
= VFP_SREG_D(insn
);
2878 VFP_DREG_D(rd
, insn
);
2881 (((rn
& 0x1c) == 0x10) || ((rn
& 0x14) == 0x14))) {
2882 /* VCVT from int is always from S reg regardless of dp bit.
2883 * VCVT with immediate frac_bits has same format as SREG_M
2885 rm
= VFP_SREG_M(insn
);
2887 VFP_DREG_M(rm
, insn
);
2890 rn
= VFP_SREG_N(insn
);
2891 if (op
== 15 && rn
== 15) {
2892 /* Double precision destination. */
2893 VFP_DREG_D(rd
, insn
);
2895 rd
= VFP_SREG_D(insn
);
2897 /* NB that we implicitly rely on the encoding for the frac_bits
2898 * in VCVT of fixed to float being the same as that of an SREG_M
2900 rm
= VFP_SREG_M(insn
);
2903 veclen
= env
->vfp
.vec_len
;
2904 if (op
== 15 && rn
> 3)
2907 /* Shut up compiler warnings. */
2918 /* Figure out what type of vector operation this is. */
2919 if ((rd
& bank_mask
) == 0) {
2924 delta_d
= (env
->vfp
.vec_stride
>> 1) + 1;
2926 delta_d
= env
->vfp
.vec_stride
+ 1;
2928 if ((rm
& bank_mask
) == 0) {
2929 /* mixed scalar/vector */
2938 /* Load the initial operands. */
2943 /* Integer source */
2944 gen_mov_F0_vreg(0, rm
);
2949 gen_mov_F0_vreg(dp
, rd
);
2950 gen_mov_F1_vreg(dp
, rm
);
2954 /* Compare with zero */
2955 gen_mov_F0_vreg(dp
, rd
);
2966 /* Source and destination the same. */
2967 gen_mov_F0_vreg(dp
, rd
);
2970 /* One source operand. */
2971 gen_mov_F0_vreg(dp
, rm
);
2975 /* Two source operands. */
2976 gen_mov_F0_vreg(dp
, rn
);
2977 gen_mov_F1_vreg(dp
, rm
);
2981 /* Perform the calculation. */
2983 case 0: /* mac: fd + (fn * fm) */
2985 gen_mov_F1_vreg(dp
, rd
);
2988 case 1: /* nmac: fd - (fn * fm) */
2991 gen_mov_F1_vreg(dp
, rd
);
2994 case 2: /* msc: -fd + (fn * fm) */
2996 gen_mov_F1_vreg(dp
, rd
);
2999 case 3: /* nmsc: -fd - (fn * fm) */
3002 gen_mov_F1_vreg(dp
, rd
);
3005 case 4: /* mul: fn * fm */
3008 case 5: /* nmul: -(fn * fm) */
3012 case 6: /* add: fn + fm */
3015 case 7: /* sub: fn - fm */
3018 case 8: /* div: fn / fm */
3021 case 14: /* fconst */
3022 if (!arm_feature(env
, ARM_FEATURE_VFP3
))
3025 n
= (insn
<< 12) & 0x80000000;
3026 i
= ((insn
>> 12) & 0x70) | (insn
& 0xf);
3033 tcg_gen_movi_i64(cpu_F0d
, ((uint64_t)n
) << 32);
3040 tcg_gen_movi_i32(cpu_F0s
, n
);
3043 case 15: /* extension space */
3057 case 4: /* vcvtb.f32.f16 */
3058 if (!arm_feature(env
, ARM_FEATURE_VFP_FP16
))
3060 tmp
= gen_vfp_mrs();
3061 tcg_gen_ext16u_i32(tmp
, tmp
);
3062 gen_helper_vfp_fcvt_f16_to_f32(cpu_F0s
, tmp
, cpu_env
);
3065 case 5: /* vcvtt.f32.f16 */
3066 if (!arm_feature(env
, ARM_FEATURE_VFP_FP16
))
3068 tmp
= gen_vfp_mrs();
3069 tcg_gen_shri_i32(tmp
, tmp
, 16);
3070 gen_helper_vfp_fcvt_f16_to_f32(cpu_F0s
, tmp
, cpu_env
);
3073 case 6: /* vcvtb.f16.f32 */
3074 if (!arm_feature(env
, ARM_FEATURE_VFP_FP16
))
3077 gen_helper_vfp_fcvt_f32_to_f16(tmp
, cpu_F0s
, cpu_env
);
3078 gen_mov_F0_vreg(0, rd
);
3079 tmp2
= gen_vfp_mrs();
3080 tcg_gen_andi_i32(tmp2
, tmp2
, 0xffff0000);
3081 tcg_gen_or_i32(tmp
, tmp
, tmp2
);
3085 case 7: /* vcvtt.f16.f32 */
3086 if (!arm_feature(env
, ARM_FEATURE_VFP_FP16
))
3089 gen_helper_vfp_fcvt_f32_to_f16(tmp
, cpu_F0s
, cpu_env
);
3090 tcg_gen_shli_i32(tmp
, tmp
, 16);
3091 gen_mov_F0_vreg(0, rd
);
3092 tmp2
= gen_vfp_mrs();
3093 tcg_gen_ext16u_i32(tmp2
, tmp2
);
3094 tcg_gen_or_i32(tmp
, tmp
, tmp2
);
3107 case 11: /* cmpez */
3111 case 15: /* single<->double conversion */
3113 gen_helper_vfp_fcvtsd(cpu_F0s
, cpu_F0d
, cpu_env
);
3115 gen_helper_vfp_fcvtds(cpu_F0d
, cpu_F0s
, cpu_env
);
3117 case 16: /* fuito */
3120 case 17: /* fsito */
3123 case 20: /* fshto */
3124 if (!arm_feature(env
, ARM_FEATURE_VFP3
))
3126 gen_vfp_shto(dp
, 16 - rm
);
3128 case 21: /* fslto */
3129 if (!arm_feature(env
, ARM_FEATURE_VFP3
))
3131 gen_vfp_slto(dp
, 32 - rm
);
3133 case 22: /* fuhto */
3134 if (!arm_feature(env
, ARM_FEATURE_VFP3
))
3136 gen_vfp_uhto(dp
, 16 - rm
);
3138 case 23: /* fulto */
3139 if (!arm_feature(env
, ARM_FEATURE_VFP3
))
3141 gen_vfp_ulto(dp
, 32 - rm
);
3143 case 24: /* ftoui */
3146 case 25: /* ftouiz */
3149 case 26: /* ftosi */
3152 case 27: /* ftosiz */
3155 case 28: /* ftosh */
3156 if (!arm_feature(env
, ARM_FEATURE_VFP3
))
3158 gen_vfp_tosh(dp
, 16 - rm
);
3160 case 29: /* ftosl */
3161 if (!arm_feature(env
, ARM_FEATURE_VFP3
))
3163 gen_vfp_tosl(dp
, 32 - rm
);
3165 case 30: /* ftouh */
3166 if (!arm_feature(env
, ARM_FEATURE_VFP3
))
3168 gen_vfp_touh(dp
, 16 - rm
);
3170 case 31: /* ftoul */
3171 if (!arm_feature(env
, ARM_FEATURE_VFP3
))
3173 gen_vfp_toul(dp
, 32 - rm
);
3175 default: /* undefined */
3176 printf ("rn:%d\n", rn
);
3180 default: /* undefined */
3181 printf ("op:%d\n", op
);
3185 /* Write back the result. */
3186 if (op
== 15 && (rn
>= 8 && rn
<= 11))
3187 ; /* Comparison, do nothing. */
3188 else if (op
== 15 && dp
&& ((rn
& 0x1c) == 0x18))
3189 /* VCVT double to int: always integer result. */
3190 gen_mov_vreg_F0(0, rd
);
3191 else if (op
== 15 && rn
== 15)
3193 gen_mov_vreg_F0(!dp
, rd
);
3195 gen_mov_vreg_F0(dp
, rd
);
3197 /* break out of the loop if we have finished */
3201 if (op
== 15 && delta_m
== 0) {
3202 /* single source one-many */
3204 rd
= ((rd
+ delta_d
) & (bank_mask
- 1))
3206 gen_mov_vreg_F0(dp
, rd
);
3210 /* Setup the next operands. */
3212 rd
= ((rd
+ delta_d
) & (bank_mask
- 1))
3216 /* One source operand. */
3217 rm
= ((rm
+ delta_m
) & (bank_mask
- 1))
3219 gen_mov_F0_vreg(dp
, rm
);
3221 /* Two source operands. */
3222 rn
= ((rn
+ delta_d
) & (bank_mask
- 1))
3224 gen_mov_F0_vreg(dp
, rn
);
3226 rm
= ((rm
+ delta_m
) & (bank_mask
- 1))
3228 gen_mov_F1_vreg(dp
, rm
);
3236 if (dp
&& (insn
& 0x03e00000) == 0x00400000) {
3237 /* two-register transfer */
3238 rn
= (insn
>> 16) & 0xf;
3239 rd
= (insn
>> 12) & 0xf;
3241 VFP_DREG_M(rm
, insn
);
3243 rm
= VFP_SREG_M(insn
);
3246 if (insn
& ARM_CP_RW_BIT
) {
3249 gen_mov_F0_vreg(0, rm
* 2);
3250 tmp
= gen_vfp_mrs();
3251 store_reg(s
, rd
, tmp
);
3252 gen_mov_F0_vreg(0, rm
* 2 + 1);
3253 tmp
= gen_vfp_mrs();
3254 store_reg(s
, rn
, tmp
);
3256 gen_mov_F0_vreg(0, rm
);
3257 tmp
= gen_vfp_mrs();
3258 store_reg(s
, rn
, tmp
);
3259 gen_mov_F0_vreg(0, rm
+ 1);
3260 tmp
= gen_vfp_mrs();
3261 store_reg(s
, rd
, tmp
);
3266 tmp
= load_reg(s
, rd
);
3268 gen_mov_vreg_F0(0, rm
* 2);
3269 tmp
= load_reg(s
, rn
);
3271 gen_mov_vreg_F0(0, rm
* 2 + 1);
3273 tmp
= load_reg(s
, rn
);
3275 gen_mov_vreg_F0(0, rm
);
3276 tmp
= load_reg(s
, rd
);
3278 gen_mov_vreg_F0(0, rm
+ 1);
3283 rn
= (insn
>> 16) & 0xf;
3285 VFP_DREG_D(rd
, insn
);
3287 rd
= VFP_SREG_D(insn
);
3288 if (s
->thumb
&& rn
== 15) {
3290 tcg_gen_movi_i32(addr
, s
->pc
& ~2);
3292 addr
= load_reg(s
, rn
);
3294 if ((insn
& 0x01200000) == 0x01000000) {
3295 /* Single load/store */
3296 offset
= (insn
& 0xff) << 2;
3297 if ((insn
& (1 << 23)) == 0)
3299 tcg_gen_addi_i32(addr
, addr
, offset
);
3300 if (insn
& (1 << 20)) {
3301 gen_vfp_ld(s
, dp
, addr
);
3302 gen_mov_vreg_F0(dp
, rd
);
3304 gen_mov_F0_vreg(dp
, rd
);
3305 gen_vfp_st(s
, dp
, addr
);
3309 /* load/store multiple */
3311 n
= (insn
>> 1) & 0x7f;
3315 if (insn
& (1 << 24)) /* pre-decrement */
3316 tcg_gen_addi_i32(addr
, addr
, -((insn
& 0xff) << 2));
3322 for (i
= 0; i
< n
; i
++) {
3323 if (insn
& ARM_CP_RW_BIT
) {
3325 gen_vfp_ld(s
, dp
, addr
);
3326 gen_mov_vreg_F0(dp
, rd
+ i
);
3329 gen_mov_F0_vreg(dp
, rd
+ i
);
3330 gen_vfp_st(s
, dp
, addr
);
3332 tcg_gen_addi_i32(addr
, addr
, offset
);
3334 if (insn
& (1 << 21)) {
3336 if (insn
& (1 << 24))
3337 offset
= -offset
* n
;
3338 else if (dp
&& (insn
& 1))
3344 tcg_gen_addi_i32(addr
, addr
, offset
);
3345 store_reg(s
, rn
, addr
);
3353 /* Should never happen. */
/* Emit the exit from the current translation block towards guest address
 * `dest`.  When `dest` and this TB's own pc agree after masking with
 * TARGET_PAGE_MASK (i.e. same guest page), the PC is set to `dest` and the
 * TB exits with the value (long)tb + n.  The other visible path only sets
 * the PC to `dest`.
 * NOTE(review): the statement that assigns `tb` is not visible in this
 * listing -- presumably it is taken from `s`; confirm. */
3359 static inline void gen_goto_tb(DisasContext
*s
, int n
, uint32_t dest
)
3361 TranslationBlock
*tb
;
3364 if ((tb
->pc
& TARGET_PAGE_MASK
) == (dest
& TARGET_PAGE_MASK
)) {
3366 gen_set_pc_im(dest
);
3367 tcg_gen_exit_tb((long)tb
+ n
);
3369 gen_set_pc_im(dest
);
/* Generate a jump to guest address `dest`.  The single-step case
 * (s->singlestep_enabled, marked unlikely) is handled separately, as the
 * comment inside it explains.  The other visible path goes through
 * gen_goto_tb(s, 0, dest) and records DISAS_TB_JUMP in s->is_jmp. */
3374 static inline void gen_jmp (DisasContext
*s
, uint32_t dest
)
3376 if (unlikely(s
->singlestep_enabled
)) {
3377 /* An indirect jump so that we still trigger the debug exception. */
3382 gen_goto_tb(s
, 0, dest
);
3383 s
->is_jmp
= DISAS_TB_JUMP
;
/* Halfword multiply: the product is left in t0 (t0 = t0 * t1).
 * The arithmetic right shifts by 16 replace an operand with its upper
 * halfword, sign-extended.
 * NOTE(review): the conditions guarding the two shifts are not visible in
 * this listing -- presumably `x` selects the shift of t0 and `y` that of
 * t1; confirm. */
3387 static inline void gen_mulxy(TCGv t0
, TCGv t1
, int x
, int y
)
3390 tcg_gen_sari_i32(t0
, t0
, 16);
3394 tcg_gen_sari_i32(t1
, t1
, 16);
3397 tcg_gen_mul_i32(t0
, t0
, t1
);
3400 /* Return the mask of PSR bits set by a MSR instruction. */
/* Bits 0..3 of `flags` are tested one at a time; what each bit contributes
 * to the mask is not visible in this listing.  The accumulated mask then
 * has CPSR_RESERVED cleared, and CPSR_E | CPSR_GE cleared when the CPU
 * lacks ARM_FEATURE_V6.  A further adjustment is gated on the absence of
 * ARM_FEATURE_THUMB2; its body, and the code under the two trailing
 * "Mask out ..." comments, is likewise not shown here. */
3401 static uint32_t msr_mask(CPUState
*env
, DisasContext
*s
, int flags
, int spsr
) {
3405 if (flags
& (1 << 0))
3407 if (flags
& (1 << 1))
3409 if (flags
& (1 << 2))
3411 if (flags
& (1 << 3))
3414 /* Mask out undefined bits. */
3415 mask
&= ~CPSR_RESERVED
;
3416 if (!arm_feature(env
, ARM_FEATURE_V6
))
3417 mask
&= ~(CPSR_E
| CPSR_GE
);
3418 if (!arm_feature(env
, ARM_FEATURE_THUMB2
))
3420 /* Mask out execution state bits. */
3423 /* Mask out privileged bits. */
3429 /* Returns nonzero if access to the PSR is not permitted. Marks t0 as dead. */
/* Two update paths are visible.  The saved-PSR path is a read-modify-write
 * of the `spsr` CPU field: bits outside `mask` are kept from the stored
 * value and bits inside `mask` are taken from t0.  The other path passes
 * t0 and `mask` to gen_set_cpsr().
 * NOTE(review): the test that chooses between the two paths is not visible
 * in this listing -- presumably the `spsr` argument; confirm. */
3430 static int gen_set_psr(DisasContext
*s
, uint32_t mask
, int spsr
, TCGv t0
)
3434 /* ??? This is also undefined in system mode. */
3438 tmp
= load_cpu_field(spsr
);
3439 tcg_gen_andi_i32(tmp
, tmp
, ~mask
);
3440 tcg_gen_andi_i32(t0
, t0
, mask
);
3441 tcg_gen_or_i32(tmp
, tmp
, t0
);
3442 store_cpu_field(tmp
, spsr
);
3444 gen_set_cpsr(t0
, mask
);
3451 /* Returns nonzero if access to the PSR is not permitted. */
/* Immediate form: moves the constant `val` into `tmp` and forwards to
 * gen_set_psr() with the same `mask` and `spsr`; the return value is
 * whatever gen_set_psr() returns. */
3452 static int gen_set_psr_im(DisasContext
*s
, uint32_t mask
, int spsr
, uint32_t val
)
3456 tcg_gen_movi_i32(tmp
, val
);
3457 return gen_set_psr(s
, mask
, spsr
, tmp
);
3460 /* Generate an old-style exception return. Marks pc as dead. */
/* Visible sequence: write `pc` to r15, load the `spsr` CPU field and copy
 * it into the CPSR with an all-ones mask (0xffffffff), then set
 * s->is_jmp to DISAS_UPDATE. */
3461 static void gen_exception_return(DisasContext
*s
, TCGv pc
)
3464 store_reg(s
, 15, pc
);
3465 tmp
= load_cpu_field(spsr
);
3466 gen_set_cpsr(tmp
, 0xffffffff);
3468 s
->is_jmp
= DISAS_UPDATE
;
3471 /* Generate a v6 exception return. Marks both values as dead. */
/* Visible sequence: copy `cpsr` into the CPSR with an all-ones mask
 * (0xffffffff), write `pc` to r15, then set s->is_jmp to DISAS_UPDATE.
 * Unlike gen_exception_return() the new CPSR value is supplied by the
 * caller rather than read from the spsr field. */
3472 static void gen_rfe(DisasContext
*s
, TCGv pc
, TCGv cpsr
)
3474 gen_set_cpsr(cpsr
, 0xffffffff);
3476 store_reg(s
, 15, pc
);
3477 s
->is_jmp
= DISAS_UPDATE
;
/* Write the translator's conditional-execution state back to the CPU.
 * Nothing is emitted when s->condexec_mask is zero.  Otherwise the value
 * (condexec_cond << 4) | (condexec_mask >> 1) is stored into the
 * condexec_bits CPU field through a fresh temporary. */
3481 gen_set_condexec (DisasContext
*s
)
3483 if (s
->condexec_mask
) {
3484 uint32_t val
= (s
->condexec_cond
<< 4) | (s
->condexec_mask
>> 1);
3485 TCGv tmp
= new_tmp();
3486 tcg_gen_movi_i32(tmp
, val
);
3487 store_cpu_field(tmp
, condexec_bits
);
/* Handle a hint instruction identified by `val`.  The one action visible
 * here sets the PC to s->pc and sets s->is_jmp to DISAS_WFI.
 * NOTE(review): which value of `val` selects that action is not visible in
 * this listing; per the TODO below, SEV and WFE are not implemented. */
3491 static void gen_nop_hint(DisasContext
*s
, int val
)
3495 gen_set_pc_im(s
->pc
);
3496 s
->is_jmp
= DISAS_WFI
;
3500 /* TODO: Implement SEV and WFE. May help SMP performance. */
/* Argument-list shorthand: expands to "cpu_V0, cpu_V0, cpu_V1", as used in
 * calls such as tcg_gen_add_i64(CPU_V001). */
3506 #define CPU_V001 cpu_V0, cpu_V0, cpu_V1
/* Element-wise add, result in t0 (t0 = t0 + t1).  Cases 0 and 1 use the
 * u8 / u16 NEON add helpers; case 2 is a plain 32-bit add.
 * NOTE(review): the switch expression and the return statements are not
 * visible in this listing -- presumably the switch is on `size`.  Callers
 * in this file test the int result, so it appears to act as a status. */
3508 static inline int gen_neon_add(int size
, TCGv t0
, TCGv t1
)
3511 case 0: gen_helper_neon_add_u8(t0
, t0
, t1
); break;
3512 case 1: gen_helper_neon_add_u16(t0
, t0
, t1
); break;
3513 case 2: tcg_gen_add_i32(t0
, t0
, t1
); break;
/* Element-wise reverse subtract, result in t0 (t0 = t1 - t0): note the
 * swapped operand order in every case.  Cases 0 and 1 use the u8 / u16
 * NEON sub helpers; case 2 is a plain 32-bit subtract.
 * NOTE(review): the switch expression is not visible in this listing --
 * presumably `size`. */
3519 static inline void gen_neon_rsb(int size
, TCGv t0
, TCGv t1
)
3522 case 0: gen_helper_neon_sub_u8(t0
, t1
, t0
); break;
3523 case 1: gen_helper_neon_sub_u16(t0
, t1
, t0
); break;
3524 case 2: tcg_gen_sub_i32(t0
, t1
, t0
); break;
3529 /* 32-bit pairwise ops end up the same as the elementwise versions. */
/* These aliases let the GEN_NEON_INTEGER_OP* macros paste a "_s32"/"_u32"
 * suffix onto pmax/pmin and the saturating add/sub names. */
3530 #define gen_helper_neon_pmax_s32 gen_helper_neon_max_s32
3531 #define gen_helper_neon_pmax_u32 gen_helper_neon_max_u32
3532 #define gen_helper_neon_pmin_s32 gen_helper_neon_min_s32
3533 #define gen_helper_neon_pmin_u32 gen_helper_neon_min_u32
3535 /* FIXME: This is wrong. They set the wrong overflow bit. */
/* The second macro parameter `e` is accepted and dropped: the generic
 * saturate helpers are invoked with (a, b, c) only. */
3536 #define gen_helper_neon_qadd_s32(a, e, b, c) gen_helper_add_saturate(a, b, c)
3537 #define gen_helper_neon_qadd_u32(a, e, b, c) gen_helper_add_usaturate(a, b, c)
3538 #define gen_helper_neon_qsub_s32(a, e, b, c) gen_helper_sub_saturate(a, b, c)
3539 #define gen_helper_neon_qsub_u32(a, e, b, c) gen_helper_sub_usaturate(a, b, c)
/* Dispatch on (size << 1) | u to gen_helper_neon_<name>_{s8,u8,s16,u16,
 * s32,u32}, passing cpu_env as the second argument.  Relies on the
 * caller's locals tmp, tmp2, size and u; the result overwrites tmp.  Any
 * other selector makes the ENCLOSING function return 1.
 * NOTE(review): the case labels are not visible in this listing. */
3541 #define GEN_NEON_INTEGER_OP_ENV(name) do { \
3542 switch ((size << 1) | u) { \
3544 gen_helper_neon_##name##_s8(tmp, cpu_env, tmp, tmp2); \
3547 gen_helper_neon_##name##_u8(tmp, cpu_env, tmp, tmp2); \
3550 gen_helper_neon_##name##_s16(tmp, cpu_env, tmp, tmp2); \
3553 gen_helper_neon_##name##_u16(tmp, cpu_env, tmp, tmp2); \
3556 gen_helper_neon_##name##_s32(tmp, cpu_env, tmp, tmp2); \
3559 gen_helper_neon_##name##_u32(tmp, cpu_env, tmp, tmp2); \
3561 default: return 1; \
/* Same dispatch as GEN_NEON_INTEGER_OP_ENV but for helpers that do not
 * take cpu_env: selects gen_helper_neon_<name>_{s8,u8,s16,u16,s32,u32} on
 * (size << 1) | u, using the caller's tmp, tmp2, size and u, and makes the
 * ENCLOSING function return 1 for any other selector.
 * NOTE(review): the case labels are not visible in this listing. */
3564 #define GEN_NEON_INTEGER_OP(name) do { \
3565 switch ((size << 1) | u) { \
3567 gen_helper_neon_##name##_s8(tmp, tmp, tmp2); \
3570 gen_helper_neon_##name##_u8(tmp, tmp, tmp2); \
3573 gen_helper_neon_##name##_s16(tmp, tmp, tmp2); \
3576 gen_helper_neon_##name##_u16(tmp, tmp, tmp2); \
3579 gen_helper_neon_##name##_s32(tmp, tmp, tmp2); \
3582 gen_helper_neon_##name##_u32(tmp, tmp, tmp2); \
3584 default: return 1; \
/* Load 32 bits from the CPU state slot vfp.scratch[scratch] into a newly
 * allocated temporary (presumably the value returned; the return statement
 * is not visible in this listing). */
3587 static TCGv
neon_load_scratch(int scratch
)
3589 TCGv tmp
= new_tmp();
3590 tcg_gen_ld_i32(tmp
, cpu_env
, offsetof(CPUARMState
, vfp
.scratch
[scratch
]));
/* Store the 32-bit value `var` into the CPU state slot
 * vfp.scratch[scratch]; counterpart of neon_load_scratch(). */
3594 static void neon_store_scratch(int scratch
, TCGv var
)
3596 tcg_gen_st_i32(var
, cpu_env
, offsetof(CPUARMState
, vfp
.scratch
[scratch
]));
/* Fetch a scalar operand into a 32-bit temporary.  Two load forms are
 * visible: word (reg & 1) of register (reg >> 1), and word
 * ((reg >> 1) & 1) of register (reg >> 2).  The latter is followed by
 * duplicating either the low or the high halfword.
 * NOTE(review): the conditions choosing between these forms are not
 * visible in this listing -- presumably `size` and the low bit of `reg`;
 * confirm. */
3600 static inline TCGv
neon_get_scalar(int size
, int reg
)
3604 tmp
= neon_load_reg(reg
>> 1, reg
& 1);
3606 tmp
= neon_load_reg(reg
>> 2, (reg
>> 1) & 1);
3608 gen_neon_dup_low16(tmp
);
3610 gen_neon_dup_high16(tmp
);
/* De-interleave the bytes of two 32-bit values.  With t0 = {a0,a1,a2,a3}
 * and t1 = {b0,b1,b2,b3} (byte 0 listed first), the shift/mask sequence
 * below produces
 *   t0 <- {a0,a2,b0,b2}   (even-numbered bytes, assembled in rd)
 *   t1 <- {a1,a3,b1,b3}   (odd-numbered bytes, assembled in rm)
 * Both inputs are fully read before either is overwritten: t1 is written
 * by the second-to-last op and t0 by the last. */
3616 static void gen_neon_unzip_u8(TCGv t0
, TCGv t1
)
3624 tcg_gen_andi_i32(rd
, t0
, 0xff);
3625 tcg_gen_shri_i32(tmp
, t0
, 8);
3626 tcg_gen_andi_i32(tmp
, tmp
, 0xff00);
3627 tcg_gen_or_i32(rd
, rd
, tmp
);
3628 tcg_gen_shli_i32(tmp
, t1
, 16);
3629 tcg_gen_andi_i32(tmp
, tmp
, 0xff0000);
3630 tcg_gen_or_i32(rd
, rd
, tmp
);
3631 tcg_gen_shli_i32(tmp
, t1
, 8);
3632 tcg_gen_andi_i32(tmp
, tmp
, 0xff000000);
3633 tcg_gen_or_i32(rd
, rd
, tmp
);
3635 tcg_gen_shri_i32(rm
, t0
, 8);
3636 tcg_gen_andi_i32(rm
, rm
, 0xff);
3637 tcg_gen_shri_i32(tmp
, t0
, 16);
3638 tcg_gen_andi_i32(tmp
, tmp
, 0xff00);
3639 tcg_gen_or_i32(rm
, rm
, tmp
);
3640 tcg_gen_shli_i32(tmp
, t1
, 8);
3641 tcg_gen_andi_i32(tmp
, tmp
, 0xff0000);
3642 tcg_gen_or_i32(rm
, rm
, tmp
);
3643 tcg_gen_andi_i32(tmp
, t1
, 0xff000000);
3644 tcg_gen_or_i32(t1
, rm
, tmp
);
3645 tcg_gen_mov_i32(t0
, rd
);
/* Interleave the bytes of two 32-bit values (one word step of a byte-wise
 * zip).  With t0 = {a0,a1,a2,a3} and t1 = {b0,b1,b2,b3}, byte 0 listed
 * first:
 *   t0 <- {a0,b0,a1,b1}   (assembled in rd)
 *   t1 <- {a2,b2,a3,b3}   (assembled in rm)
 * Both inputs are fully read before either is overwritten.
 *
 * Fix: bytes 2 and 3 of rd were formed with shifts of 16 and 24, which
 * moved byte 0 of each input into place a second time and yielded
 * {a0,b0,a0,b0}.  Shifts of 8 and 16 select a1 and b1, mirroring the way
 * rm is assembled from a2/b2/a3/b3. */
3652 static void gen_neon_zip_u8(TCGv t0
, TCGv t1
)
3660 tcg_gen_andi_i32(rd
, t0
, 0xff);
3661 tcg_gen_shli_i32(tmp
, t1
, 8);
3662 tcg_gen_andi_i32(tmp
, tmp
, 0xff00);
3663 tcg_gen_or_i32(rd
, rd
, tmp
);
/* a1: byte 1 of t0 moves up one byte into byte 2 of rd. */
3664 tcg_gen_shli_i32(tmp
, t0
, 8);
3665 tcg_gen_andi_i32(tmp
, tmp
, 0xff0000);
3666 tcg_gen_or_i32(rd
, rd
, tmp
);
/* b1: byte 1 of t1 moves up two bytes into byte 3 of rd. */
3667 tcg_gen_shli_i32(tmp
, t1
, 16);
3668 tcg_gen_andi_i32(tmp
, tmp
, 0xff000000);
3669 tcg_gen_or_i32(rd
, rd
, tmp
);
3671 tcg_gen_andi_i32(rm
, t1
, 0xff000000);
3672 tcg_gen_shri_i32(tmp
, t0
, 8);
3673 tcg_gen_andi_i32(tmp
, tmp
, 0xff0000);
3674 tcg_gen_or_i32(rm
, rm
, tmp
);
3675 tcg_gen_shri_i32(tmp
, t1
, 8);
3676 tcg_gen_andi_i32(tmp
, tmp
, 0xff00);
3677 tcg_gen_or_i32(rm
, rm
, tmp
);
3678 tcg_gen_shri_i32(tmp
, t0
, 16);
3679 tcg_gen_andi_i32(tmp
, tmp
, 0xff);
3680 tcg_gen_or_i32(t1
, rm
, tmp
);
3681 tcg_gen_mov_i32(t0
, rd
);
/* Interleave the halfwords of two 32-bit values.  With t0 = {a0,a1} and
 * t1 = {b0,b1} (low halfword listed first):
 *   t0 <- {a0,b0}   (assembled in tmp, copied to t0 last)
 *   t1 <- {a1,b1}
 * t0 is still read after t1 has been modified, which is why the new t0 is
 * held in tmp until the end. */
3688 static void gen_neon_zip_u16(TCGv t0
, TCGv t1
)
3695 tcg_gen_andi_i32(tmp
, t0
, 0xffff);
3696 tcg_gen_shli_i32(tmp2
, t1
, 16);
3697 tcg_gen_or_i32(tmp
, tmp
, tmp2
);
3698 tcg_gen_andi_i32(t1
, t1
, 0xffff0000);
3699 tcg_gen_shri_i32(tmp2
, t0
, 16);
3700 tcg_gen_or_i32(t1
, t1
, tmp2
);
3701 tcg_gen_mov_i32(t0
, tmp
);
/* Run the per-word unzip step on register `reg` and park the results in
 * scratch slots starting at index `tmp`.  Each iteration loads words n and
 * n + 1 of `reg`, shuffles them (bytes for case 0, halfwords for case 1,
 * untouched for case 2) and stores them to scratch[tmp + n] and
 * scratch[tmp + n + 1].
 * NOTE(review): the switch expression is not visible in this listing --
 * presumably `size`.
 * NOTE(review): the loop advances n by 2 while n < q + 1, so if q is only
 * ever 0 or 1 the body runs for n == 0 alone -- confirm that is what the
 * quad-register case needs. */
3707 static void gen_neon_unzip(int reg
, int q
, int tmp
, int size
)
3712 for (n
= 0; n
< q
+ 1; n
+= 2) {
3713 t0
= neon_load_reg(reg
, n
);
3714 t1
= neon_load_reg(reg
, n
+ 1);
3716 case 0: gen_neon_unzip_u8(t0
, t1
); break;
3717 case 1: gen_neon_zip_u16(t0
, t1
); break; /* zip and unzip are the same. */
3718 case 2: /* no-op */; break;
3721 neon_store_scratch(tmp
+ n
, t0
);
3722 neon_store_scratch(tmp
+ n
+ 1, t1
);
/* Byte-wise transpose step on two 32-bit values.  With
 * t0 = {a0,a1,a2,a3} and t1 = {b0,b1,b2,b3} (byte 0 listed first):
 *   t0 <- {b0,a0,b2,a2}   (assembled in rd, copied to t0 last)
 *   t1 <- {b1,a1,b3,a3}
 * t0 is still read after t1 has been modified, hence the separate rd. */
3726 static void gen_neon_trn_u8(TCGv t0
, TCGv t1
)
3733 tcg_gen_shli_i32(rd
, t0
, 8);
3734 tcg_gen_andi_i32(rd
, rd
, 0xff00ff00);
3735 tcg_gen_andi_i32(tmp
, t1
, 0x00ff00ff);
3736 tcg_gen_or_i32(rd
, rd
, tmp
);
3738 tcg_gen_shri_i32(t1
, t1
, 8);
3739 tcg_gen_andi_i32(t1
, t1
, 0x00ff00ff);
3740 tcg_gen_andi_i32(tmp
, t0
, 0xff00ff00);
3741 tcg_gen_or_i32(t1
, t1
, tmp
);
3742 tcg_gen_mov_i32(t0
, rd
);
/* Halfword-wise transpose step on two 32-bit values.  With t0 = {a0,a1}
 * and t1 = {b0,b1} (low halfword listed first):
 *   t0 <- {b0,a0}   (assembled in rd, copied to t0 last)
 *   t1 <- {b1,a1}
 * t0 is still read after t1 has been modified, hence the separate rd. */
3748 static void gen_neon_trn_u16(TCGv t0
, TCGv t1
)
3755 tcg_gen_shli_i32(rd
, t0
, 16);
3756 tcg_gen_andi_i32(tmp
, t1
, 0xffff);
3757 tcg_gen_or_i32(rd
, rd
, tmp
);
3758 tcg_gen_shri_i32(t1
, t1
, 16);
3759 tcg_gen_andi_i32(tmp
, t0
, 0xffff0000);
3760 tcg_gen_or_i32(t1
, t1
, tmp
);
3761 tcg_gen_mov_i32(t0
, rd
);
3772 } neon_ls_element_type
[11] = {
3786 /* Translate a NEON load/store element instruction. Return nonzero if the
3787 instruction is invalid. */
/* Overview of what is visible below:
 *  - rd comes from VFP_DREG_D, rn from insn bits 19:16, and `load` from
 *    insn bit 21.
 *  - Bit 23 clear: "load/store all elements".  op (bits 11:8) indexes
 *    neon_ls_element_type[] for nregs / interleave / spacing, size is
 *    bits 7:6, and the per-element address step is
 *    (1 << size) * interleave.
 *  - Otherwise either "load single element to all lanes" (the loaded value
 *    is replicated and written to both words of rd) or "single element",
 *    which inserts into / extracts from one lane using `shift` and `pass`.
 *  - The tail updates the base register rn.
 * NOTE(review): many conditions, declarations and else-branches are not
 * visible in this listing, so the exact guards on each path should be
 * confirmed against the complete source. */
3788 static int disas_neon_ls_insn(CPUState
* env
, DisasContext
*s
, uint32_t insn
)
3807 if (!vfp_enabled(env
))
3809 VFP_DREG_D(rd
, insn
);
3810 rn
= (insn
>> 16) & 0xf;
3812 load
= (insn
& (1 << 21)) != 0;
3814 if ((insn
& (1 << 23)) == 0) {
3815 /* Load store all elements. */
3816 op
= (insn
>> 8) & 0xf;
3817 size
= (insn
>> 6) & 3;
3820 nregs
= neon_ls_element_type
[op
].nregs
;
3821 interleave
= neon_ls_element_type
[op
].interleave
;
3822 spacing
= neon_ls_element_type
[op
].spacing
;
3823 if (size
== 3 && (interleave
| spacing
) != 1)
3825 load_reg_var(s
, addr
, rn
);
3826 stride
= (1 << size
) * interleave
;
3827 for (reg
= 0; reg
< nregs
; reg
++) {
/* For the interleaved layouts the address is recomputed from rn for each
 * register rather than carried over from the previous iteration. */
3828 if (interleave
> 2 || (interleave
== 2 && nregs
== 2)) {
3829 load_reg_var(s
, addr
, rn
);
3830 tcg_gen_addi_i32(addr
, addr
, (1 << size
) * reg
);
3831 } else if (interleave
== 2 && nregs
== 4 && reg
== 2) {
3832 load_reg_var(s
, addr
, rn
);
3833 tcg_gen_addi_i32(addr
, addr
, 1 << size
);
3837 tmp64
= gen_ld64(addr
, IS_USER(s
));
3838 neon_store_reg64(tmp64
, rd
);
3839 tcg_temp_free_i64(tmp64
);
3841 tmp64
= tcg_temp_new_i64();
3842 neon_load_reg64(tmp64
, rd
);
3843 gen_st64(tmp64
, addr
, IS_USER(s
));
3845 tcg_gen_addi_i32(addr
, addr
, stride
);
3847 for (pass
= 0; pass
< 2; pass
++) {
3850 tmp
= gen_ld32(addr
, IS_USER(s
));
3851 neon_store_reg(rd
, pass
, tmp
);
3853 tmp
= neon_load_reg(rd
, pass
);
3854 gen_st32(tmp
, addr
, IS_USER(s
));
3856 tcg_gen_addi_i32(addr
, addr
, stride
);
3857 } else if (size
== 1) {
3859 tmp
= gen_ld16u(addr
, IS_USER(s
));
3860 tcg_gen_addi_i32(addr
, addr
, stride
);
3861 tmp2
= gen_ld16u(addr
, IS_USER(s
));
3862 tcg_gen_addi_i32(addr
, addr
, stride
);
3863 tcg_gen_shli_i32(tmp2
, tmp2
, 16);
3864 tcg_gen_or_i32(tmp
, tmp
, tmp2
);
3866 neon_store_reg(rd
, pass
, tmp
);
3868 tmp
= neon_load_reg(rd
, pass
);
3870 tcg_gen_shri_i32(tmp2
, tmp
, 16);
3871 gen_st16(tmp
, addr
, IS_USER(s
));
3872 tcg_gen_addi_i32(addr
, addr
, stride
);
3873 gen_st16(tmp2
, addr
, IS_USER(s
));
3874 tcg_gen_addi_i32(addr
, addr
, stride
);
3876 } else /* size == 0 */ {
3879 for (n
= 0; n
< 4; n
++) {
3880 tmp
= gen_ld8u(addr
, IS_USER(s
));
3881 tcg_gen_addi_i32(addr
, addr
, stride
);
3885 tcg_gen_shli_i32(tmp
, tmp
, n
* 8);
3886 tcg_gen_or_i32(tmp2
, tmp2
, tmp
);
3890 neon_store_reg(rd
, pass
, tmp2
);
3892 tmp2
= neon_load_reg(rd
, pass
);
3893 for (n
= 0; n
< 4; n
++) {
3896 tcg_gen_mov_i32(tmp
, tmp2
);
3898 tcg_gen_shri_i32(tmp
, tmp2
, n
* 8);
3900 gen_st8(tmp
, addr
, IS_USER(s
));
3901 tcg_gen_addi_i32(addr
, addr
, stride
);
3912 size
= (insn
>> 10) & 3;
3914 /* Load single element to all lanes. */
3917 size
= (insn
>> 6) & 3;
3918 nregs
= ((insn
>> 8) & 3) + 1;
3919 stride
= (insn
& (1 << 5)) ? 2 : 1;
3920 load_reg_var(s
, addr
, rn
);
3921 for (reg
= 0; reg
< nregs
; reg
++) {
3924 tmp
= gen_ld8u(addr
, IS_USER(s
));
3925 gen_neon_dup_u8(tmp
, 0);
3928 tmp
= gen_ld16u(addr
, IS_USER(s
));
3929 gen_neon_dup_low16(tmp
);
3932 tmp
= gen_ld32(addr
, IS_USER(s
));
3936 default: /* Avoid compiler warnings. */
3939 tcg_gen_addi_i32(addr
, addr
, 1 << size
);
3941 tcg_gen_mov_i32(tmp2
, tmp
);
3942 neon_store_reg(rd
, 0, tmp2
);
3943 neon_store_reg(rd
, 1, tmp
);
3946 stride
= (1 << size
) * nregs
;
3948 /* Single element. */
3949 pass
= (insn
>> 7) & 1;
3952 shift
= ((insn
>> 5) & 3) * 8;
3956 shift
= ((insn
>> 6) & 1) * 16;
3957 stride
= (insn
& (1 << 5)) ? 2 : 1;
3961 stride
= (insn
& (1 << 6)) ? 2 : 1;
3966 nregs
= ((insn
>> 8) & 3) + 1;
3967 load_reg_var(s
, addr
, rn
);
3968 for (reg
= 0; reg
< nregs
; reg
++) {
3972 tmp
= gen_ld8u(addr
, IS_USER(s
));
3975 tmp
= gen_ld16u(addr
, IS_USER(s
));
3978 tmp
= gen_ld32(addr
, IS_USER(s
));
3980 default: /* Avoid compiler warnings. */
3984 tmp2
= neon_load_reg(rd
, pass
);
3985 gen_bfi(tmp
, tmp2
, tmp
, shift
, size
? 0xffff : 0xff);
3988 neon_store_reg(rd
, pass
, tmp
);
3989 } else { /* Store */
3990 tmp
= neon_load_reg(rd
, pass
);
3992 tcg_gen_shri_i32(tmp
, tmp
, shift
);
3995 gen_st8(tmp
, addr
, IS_USER(s
));
3998 gen_st16(tmp
, addr
, IS_USER(s
));
4001 gen_st32(tmp
, addr
, IS_USER(s
));
4006 tcg_gen_addi_i32(addr
, addr
, 1 << size
);
4008 stride
= nregs
* (1 << size
);
/* Base-register update: rn is reloaded, advanced either by the constant
 * `stride` or by the value of register rm, and written back to rn.  The
 * tests choosing between the two are not visible in this listing. */
4015 base
= load_reg(s
, rn
);
4017 tcg_gen_addi_i32(base
, base
, stride
);
4020 index
= load_reg(s
, rm
);
4021 tcg_gen_add_i32(base
, base
, index
);
4024 store_reg(s
, rn
, base
);
4029 /* Bitwise select. dest = c ? t : f. Clobbers T and F. */
/* Computed per bit as (t & c) | (f & ~c).  The two masked intermediates
 * are written back into t and f themselves, which is why both are
 * clobbered; c is only read. */
4030 static void gen_neon_bsl(TCGv dest
, TCGv t
, TCGv f
, TCGv c
)
4032 tcg_gen_and_i32(t
, t
, c
);
4033 tcg_gen_andc_i32(f
, f
, c
);
4034 tcg_gen_or_i32(dest
, t
, f
);
/* Narrow the 64-bit value `src` into the 32-bit `dest`.  Cases 0 and 1 go
 * through the narrow_u8 / narrow_u16 helpers; case 2 truncates to 32 bits.
 * NOTE(review): the switch expression is not visible in this listing --
 * presumably `size`. */
4037 static inline void gen_neon_narrow(int size
, TCGv dest
, TCGv_i64 src
)
4040 case 0: gen_helper_neon_narrow_u8(dest
, src
); break;
4041 case 1: gen_helper_neon_narrow_u16(dest
, src
); break;
4042 case 2: tcg_gen_trunc_i64_i32(dest
, src
); break;
/* Signed saturating narrow of the 64-bit `src` into the 32-bit `dest`,
 * via the narrow_sat_s8 / s16 / s32 helpers for cases 0 / 1 / 2.  The
 * helpers also receive cpu_env (presumably so they can record that
 * saturation occurred -- confirm against the helper definitions).
 * NOTE(review): the switch expression is not visible in this listing --
 * presumably `size`. */
4047 static inline void gen_neon_narrow_sats(int size
, TCGv dest
, TCGv_i64 src
)
4050 case 0: gen_helper_neon_narrow_sat_s8(dest
, cpu_env
, src
); break;
4051 case 1: gen_helper_neon_narrow_sat_s16(dest
, cpu_env
, src
); break;
4052 case 2: gen_helper_neon_narrow_sat_s32(dest
, cpu_env
, src
); break;
/* Unsigned saturating narrow of the 64-bit `src` into the 32-bit `dest`,
 * via the narrow_sat_u8 / u16 / u32 helpers for cases 0 / 1 / 2.  The
 * helpers also receive cpu_env (presumably so they can record that
 * saturation occurred -- confirm against the helper definitions).
 * NOTE(review): the switch expression is not visible in this listing --
 * presumably `size`. */
4057 static inline void gen_neon_narrow_satu(int size
, TCGv dest
, TCGv_i64 src
)
4060 case 0: gen_helper_neon_narrow_sat_u8(dest
, cpu_env
, src
); break;
4061 case 1: gen_helper_neon_narrow_sat_u16(dest
, cpu_env
, src
); break;
4062 case 2: gen_helper_neon_narrow_sat_u32(dest
, cpu_env
, src
); break;
/* Shift `var` in place by the (register) amount `shift`, ahead of a
 * narrowing step.  Four helper groups are emitted, each with a 16-bit
 * (case 1) and a 32-bit (case 2) variant, in this order:
 *   1. rounding shift, unsigned   (rshl_u16 / rshl_u32)
 *   2. rounding shift, signed     (rshl_s16 / rshl_s32)
 *   3. plain shift, unsigned      (shl_u16  / shl_u32)
 *   4. plain shift, signed        (shl_s16  / shl_s32)
 * Callers pass two further int arguments after `shift` (q and u at the
 * call sites in this file) which select the group; the remaining
 * parameters and the selecting conditions are not visible in this listing.
 *
 * Fix: group 3 previously called the rounding helpers rshl_u16/rshl_u32,
 * duplicating group 1, so the unsigned non-rounding case rounded its
 * result.  It now uses shl_u16/shl_u32, matching group 4 and the 64-bit
 * sequence in the caller (rshl_u64, rshl_s64, shl_u64, shl_s64). */
4067 static inline void gen_neon_shift_narrow(int size
, TCGv var
, TCGv shift
,
4073 case 1: gen_helper_neon_rshl_u16(var
, var
, shift
); break;
4074 case 2: gen_helper_neon_rshl_u32(var
, var
, shift
); break;
4079 case 1: gen_helper_neon_rshl_s16(var
, var
, shift
); break;
4080 case 2: gen_helper_neon_rshl_s32(var
, var
, shift
); break;
/* Plain (non-rounding) unsigned shift. */
4087 case 1: gen_helper_neon_shl_u16(var
, var
, shift
); break;
4088 case 2: gen_helper_neon_shl_u32(var
, var
, shift
); break;
4093 case 1: gen_helper_neon_shl_s16(var
, var
, shift
); break;
4094 case 2: gen_helper_neon_shl_s32(var
, var
, shift
); break;
/* Widen the 32-bit `src` into the 64-bit `dest`.  The first group uses the
 * unsigned helpers (widen_u8 / widen_u16) and zero-extension for case 2;
 * the second group uses the signed helpers (widen_s8 / widen_s16) and
 * sign-extension for case 2.
 * NOTE(review): the test choosing between the groups and the switch
 * expressions are not visible in this listing -- presumably `u` and
 * `size` respectively; confirm. */
4101 static inline void gen_neon_widen(TCGv_i64 dest
, TCGv src
, int size
, int u
)
4105 case 0: gen_helper_neon_widen_u8(dest
, src
); break;
4106 case 1: gen_helper_neon_widen_u16(dest
, src
); break;
4107 case 2: tcg_gen_extu_i32_i64(dest
, src
); break;
4112 case 0: gen_helper_neon_widen_s8(dest
, src
); break;
4113 case 1: gen_helper_neon_widen_s16(dest
, src
); break;
4114 case 2: tcg_gen_ext_i32_i64(dest
, src
); break;
/* Long add on the shared 64-bit temporaries: every case is called with
 * CPU_V001, i.e. the arguments cpu_V0, cpu_V0, cpu_V1.  Cases 0 and 1 use
 * the addl_u16 / addl_u32 helpers; case 2 is a plain 64-bit add.
 * NOTE(review): the switch expression is not visible in this listing --
 * presumably `size`. */
4121 static inline void gen_neon_addl(int size
)
4124 case 0: gen_helper_neon_addl_u16(CPU_V001
); break;
4125 case 1: gen_helper_neon_addl_u32(CPU_V001
); break;
4126 case 2: tcg_gen_add_i64(CPU_V001
); break;
/* Long subtract on the shared 64-bit temporaries: every case is called
 * with CPU_V001, i.e. the arguments cpu_V0, cpu_V0, cpu_V1.  Cases 0 and 1
 * use the subl_u16 / subl_u32 helpers; case 2 is a plain 64-bit subtract.
 * NOTE(review): the switch expression is not visible in this listing --
 * presumably `size`. */
4131 static inline void gen_neon_subl(int size
)
4134 case 0: gen_helper_neon_subl_u16(CPU_V001
); break;
4135 case 1: gen_helper_neon_subl_u32(CPU_V001
); break;
4136 case 2: tcg_gen_sub_i64(CPU_V001
); break;
/* Negate the 64-bit value `var` in place, using the negl_u16 / negl_u32 /
 * negl_u64 helpers for cases 0 / 1 / 2.
 * NOTE(review): the switch expression is not visible in this listing --
 * presumably `size`. */
4141 static inline void gen_neon_negl(TCGv_i64 var
, int size
)
4144 case 0: gen_helper_neon_negl_u16(var
, var
); break;
4145 case 1: gen_helper_neon_negl_u32(var
, var
); break;
4146 case 2: gen_helper_neon_negl_u64(var
, var
); break;
/* Saturating long add, result in op0 (op0 = op0 + op1), through the
 * addl_saturate_s32 / s64 helpers, which also receive cpu_env.  Only cases
 * 1 and 2 are visible; there is no case 0 helper call in this listing.
 * NOTE(review): the switch expression is not visible in this listing --
 * presumably `size`. */
4151 static inline void gen_neon_addl_saturate(TCGv_i64 op0
, TCGv_i64 op1
, int size
)
4154 case 1: gen_helper_neon_addl_saturate_s32(op0
, cpu_env
, op0
, op1
); break;
4155 case 2: gen_helper_neon_addl_saturate_s64(op0
, cpu_env
, op0
, op1
); break;
/* Widening multiply of the 32-bit operands a and b into the 64-bit `dest`,
 * dispatched on (size << 1) | u.  Selectors 0..3 call the mull_s8 /
 * mull_u8 / mull_s16 / mull_u16 helpers.  The two remaining visible paths
 * compute the product with gen_muls_i64_i32() (signed) or
 * gen_mulu_i64_i32() (unsigned) and copy the result into `dest`.
 * NOTE(review): the case labels for those two paths are not visible in
 * this listing -- presumably selectors 4 and 5. */
4160 static inline void gen_neon_mull(TCGv_i64 dest
, TCGv a
, TCGv b
, int size
, int u
)
4164 switch ((size
<< 1) | u
) {
4165 case 0: gen_helper_neon_mull_s8(dest
, a
, b
); break;
4166 case 1: gen_helper_neon_mull_u8(dest
, a
, b
); break;
4167 case 2: gen_helper_neon_mull_s16(dest
, a
, b
); break;
4168 case 3: gen_helper_neon_mull_u16(dest
, a
, b
); break;
4170 tmp
= gen_muls_i64_i32(a
, b
);
4171 tcg_gen_mov_i64(dest
, tmp
);
4174 tmp
= gen_mulu_i64_i32(a
, b
);
4175 tcg_gen_mov_i64(dest
, tmp
);
4181 /* Translate a NEON data processing instruction. Return nonzero if the
4182 instruction is invalid.
4183 We process data in a mixture of 32-bit and 64-bit chunks.
4184 Mostly we use 32-bit chunks so we can use normal scalar instructions. */
4186 static int disas_neon_data_insn(CPUState
* env
, DisasContext
*s
, uint32_t insn
)
4199 TCGv tmp
, tmp2
, tmp3
, tmp4
, tmp5
;
4202 if (!vfp_enabled(env
))
4204 q
= (insn
& (1 << 6)) != 0;
4205 u
= (insn
>> 24) & 1;
4206 VFP_DREG_D(rd
, insn
);
4207 VFP_DREG_N(rn
, insn
);
4208 VFP_DREG_M(rm
, insn
);
4209 size
= (insn
>> 20) & 3;
4210 if ((insn
& (1 << 23)) == 0) {
4211 /* Three register same length. */
4212 op
= ((insn
>> 7) & 0x1e) | ((insn
>> 4) & 1);
4213 if (size
== 3 && (op
== 1 || op
== 5 || op
== 8 || op
== 9
4214 || op
== 10 || op
== 11 || op
== 16)) {
4215 /* 64-bit element instructions. */
4216 for (pass
= 0; pass
< (q
? 2 : 1); pass
++) {
4217 neon_load_reg64(cpu_V0
, rn
+ pass
);
4218 neon_load_reg64(cpu_V1
, rm
+ pass
);
4222 gen_helper_neon_add_saturate_u64(CPU_V001
);
4224 gen_helper_neon_add_saturate_s64(CPU_V001
);
4229 gen_helper_neon_sub_saturate_u64(CPU_V001
);
4231 gen_helper_neon_sub_saturate_s64(CPU_V001
);
4236 gen_helper_neon_shl_u64(cpu_V0
, cpu_V1
, cpu_V0
);
4238 gen_helper_neon_shl_s64(cpu_V0
, cpu_V1
, cpu_V0
);
4243 gen_helper_neon_qshl_u64(cpu_V0
, cpu_env
,
4246 gen_helper_neon_qshl_s64(cpu_V0
, cpu_env
,
4250 case 10: /* VRSHL */
4252 gen_helper_neon_rshl_u64(cpu_V0
, cpu_V1
, cpu_V0
);
4254 gen_helper_neon_rshl_s64(cpu_V0
, cpu_V1
, cpu_V0
);
4257 case 11: /* VQRSHL */
4259 gen_helper_neon_qrshl_u64(cpu_V0
, cpu_env
,
4262 gen_helper_neon_qrshl_s64(cpu_V0
, cpu_env
,
4268 tcg_gen_sub_i64(CPU_V001
);
4270 tcg_gen_add_i64(CPU_V001
);
4276 neon_store_reg64(cpu_V0
, rd
+ pass
);
4283 case 10: /* VRSHL */
4284 case 11: /* VQRSHL */
4287 /* Shift instruction operands are reversed. */
4294 case 20: /* VPMAX */
4295 case 21: /* VPMIN */
4296 case 23: /* VPADD */
4299 case 26: /* VPADD (float) */
4300 pairwise
= (u
&& size
< 2);
4302 case 30: /* VPMIN/VPMAX (float) */
4310 for (pass
= 0; pass
< (q
? 4 : 2); pass
++) {
4319 tmp
= neon_load_reg(rn
, n
);
4320 tmp2
= neon_load_reg(rn
, n
+ 1);
4322 tmp
= neon_load_reg(rm
, n
);
4323 tmp2
= neon_load_reg(rm
, n
+ 1);
4327 tmp
= neon_load_reg(rn
, pass
);
4328 tmp2
= neon_load_reg(rm
, pass
);
4332 GEN_NEON_INTEGER_OP(hadd
);
4335 GEN_NEON_INTEGER_OP_ENV(qadd
);
4337 case 2: /* VRHADD */
4338 GEN_NEON_INTEGER_OP(rhadd
);
4340 case 3: /* Logic ops. */
4341 switch ((u
<< 2) | size
) {
4343 tcg_gen_and_i32(tmp
, tmp
, tmp2
);
4346 tcg_gen_andc_i32(tmp
, tmp
, tmp2
);
4349 tcg_gen_or_i32(tmp
, tmp
, tmp2
);
4352 tcg_gen_orc_i32(tmp
, tmp
, tmp2
);
4355 tcg_gen_xor_i32(tmp
, tmp
, tmp2
);
4358 tmp3
= neon_load_reg(rd
, pass
);
4359 gen_neon_bsl(tmp
, tmp
, tmp2
, tmp3
);
4363 tmp3
= neon_load_reg(rd
, pass
);
4364 gen_neon_bsl(tmp
, tmp
, tmp3
, tmp2
);
4368 tmp3
= neon_load_reg(rd
, pass
);
4369 gen_neon_bsl(tmp
, tmp3
, tmp
, tmp2
);
4375 GEN_NEON_INTEGER_OP(hsub
);
4378 GEN_NEON_INTEGER_OP_ENV(qsub
);
4381 GEN_NEON_INTEGER_OP(cgt
);
4384 GEN_NEON_INTEGER_OP(cge
);
4387 GEN_NEON_INTEGER_OP(shl
);
4390 GEN_NEON_INTEGER_OP_ENV(qshl
);
4392 case 10: /* VRSHL */
4393 GEN_NEON_INTEGER_OP(rshl
);
4395 case 11: /* VQRSHL */
4396 GEN_NEON_INTEGER_OP_ENV(qrshl
);
4399 GEN_NEON_INTEGER_OP(max
);
4402 GEN_NEON_INTEGER_OP(min
);
4405 GEN_NEON_INTEGER_OP(abd
);
4408 GEN_NEON_INTEGER_OP(abd
);
4410 tmp2
= neon_load_reg(rd
, pass
);
4411 gen_neon_add(size
, tmp
, tmp2
);
4414 if (!u
) { /* VADD */
4415 if (gen_neon_add(size
, tmp
, tmp2
))
4419 case 0: gen_helper_neon_sub_u8(tmp
, tmp
, tmp2
); break;
4420 case 1: gen_helper_neon_sub_u16(tmp
, tmp
, tmp2
); break;
4421 case 2: tcg_gen_sub_i32(tmp
, tmp
, tmp2
); break;
4427 if (!u
) { /* VTST */
4429 case 0: gen_helper_neon_tst_u8(tmp
, tmp
, tmp2
); break;
4430 case 1: gen_helper_neon_tst_u16(tmp
, tmp
, tmp2
); break;
4431 case 2: gen_helper_neon_tst_u32(tmp
, tmp
, tmp2
); break;
4436 case 0: gen_helper_neon_ceq_u8(tmp
, tmp
, tmp2
); break;
4437 case 1: gen_helper_neon_ceq_u16(tmp
, tmp
, tmp2
); break;
4438 case 2: gen_helper_neon_ceq_u32(tmp
, tmp
, tmp2
); break;
4443 case 18: /* Multiply. */
4445 case 0: gen_helper_neon_mul_u8(tmp
, tmp
, tmp2
); break;
4446 case 1: gen_helper_neon_mul_u16(tmp
, tmp
, tmp2
); break;
4447 case 2: tcg_gen_mul_i32(tmp
, tmp
, tmp2
); break;
4451 tmp2
= neon_load_reg(rd
, pass
);
4453 gen_neon_rsb(size
, tmp
, tmp2
);
4455 gen_neon_add(size
, tmp
, tmp2
);
4459 if (u
) { /* polynomial */
4460 gen_helper_neon_mul_p8(tmp
, tmp
, tmp2
);
4461 } else { /* Integer */
4463 case 0: gen_helper_neon_mul_u8(tmp
, tmp
, tmp2
); break;
4464 case 1: gen_helper_neon_mul_u16(tmp
, tmp
, tmp2
); break;
4465 case 2: tcg_gen_mul_i32(tmp
, tmp
, tmp2
); break;
4470 case 20: /* VPMAX */
4471 GEN_NEON_INTEGER_OP(pmax
);
4473 case 21: /* VPMIN */
4474 GEN_NEON_INTEGER_OP(pmin
);
4476 case 22: /* Multiply high. */
4477 if (!u
) { /* VQDMULH */
4479 case 1: gen_helper_neon_qdmulh_s16(tmp
, cpu_env
, tmp
, tmp2
); break;
4480 case 2: gen_helper_neon_qdmulh_s32(tmp
, cpu_env
, tmp
, tmp2
); break;
4483 } else { /* VQRDMULH */
4485 case 1: gen_helper_neon_qrdmulh_s16(tmp
, cpu_env
, tmp
, tmp2
); break;
4486 case 2: gen_helper_neon_qrdmulh_s32(tmp
, cpu_env
, tmp
, tmp2
); break;
4491 case 23: /* VPADD */
4495 case 0: gen_helper_neon_padd_u8(tmp
, tmp
, tmp2
); break;
4496 case 1: gen_helper_neon_padd_u16(tmp
, tmp
, tmp2
); break;
4497 case 2: tcg_gen_add_i32(tmp
, tmp
, tmp2
); break;
4501 case 26: /* Floating point arithmetic. */
4502 switch ((u
<< 2) | size
) {
4504 gen_helper_neon_add_f32(tmp
, tmp
, tmp2
);
4507 gen_helper_neon_sub_f32(tmp
, tmp
, tmp2
);
4510 gen_helper_neon_add_f32(tmp
, tmp
, tmp2
);
4513 gen_helper_neon_abd_f32(tmp
, tmp
, tmp2
);
4519 case 27: /* Float multiply. */
4520 gen_helper_neon_mul_f32(tmp
, tmp
, tmp2
);
4523 tmp2
= neon_load_reg(rd
, pass
);
4525 gen_helper_neon_add_f32(tmp
, tmp
, tmp2
);
4527 gen_helper_neon_sub_f32(tmp
, tmp2
, tmp
);
4531 case 28: /* Float compare. */
4533 gen_helper_neon_ceq_f32(tmp
, tmp
, tmp2
);
4536 gen_helper_neon_cge_f32(tmp
, tmp
, tmp2
);
4538 gen_helper_neon_cgt_f32(tmp
, tmp
, tmp2
);
4541 case 29: /* Float compare absolute. */
4545 gen_helper_neon_acge_f32(tmp
, tmp
, tmp2
);
4547 gen_helper_neon_acgt_f32(tmp
, tmp
, tmp2
);
4549 case 30: /* Float min/max. */
4551 gen_helper_neon_max_f32(tmp
, tmp
, tmp2
);
4553 gen_helper_neon_min_f32(tmp
, tmp
, tmp2
);
4557 gen_helper_recps_f32(tmp
, tmp
, tmp2
, cpu_env
);
4559 gen_helper_rsqrts_f32(tmp
, tmp
, tmp2
, cpu_env
);
4566 /* Save the result. For elementwise operations we can put it
4567 straight into the destination register. For pairwise operations
4568 we have to be careful to avoid clobbering the source operands. */
4569 if (pairwise
&& rd
== rm
) {
4570 neon_store_scratch(pass
, tmp
);
4572 neon_store_reg(rd
, pass
, tmp
);
4576 if (pairwise
&& rd
== rm
) {
4577 for (pass
= 0; pass
< (q
? 4 : 2); pass
++) {
4578 tmp
= neon_load_scratch(pass
);
4579 neon_store_reg(rd
, pass
, tmp
);
4582 /* End of 3 register same size operations. */
4583 } else if (insn
& (1 << 4)) {
4584 if ((insn
& 0x00380080) != 0) {
4585 /* Two registers and shift. */
4586 op
= (insn
>> 8) & 0xf;
4587 if (insn
& (1 << 7)) {
4592 while ((insn
& (1 << (size
+ 19))) == 0)
4595 shift
= (insn
>> 16) & ((1 << (3 + size
)) - 1);
4596 /* To avoid excessive duplication of ops we implement shift
4597 by immediate using the variable shift operations. */
4599 /* Shift by immediate:
4600 VSHR, VSRA, VRSHR, VRSRA, VSRI, VSHL, VQSHL, VQSHLU. */
4601 /* Right shifts are encoded as N - shift, where N is the
4602 element size in bits. */
4604 shift
= shift
- (1 << (size
+ 3));
4612 imm
= (uint8_t) shift
;
4617 imm
= (uint16_t) shift
;
4628 for (pass
= 0; pass
< count
; pass
++) {
4630 neon_load_reg64(cpu_V0
, rm
+ pass
);
4631 tcg_gen_movi_i64(cpu_V1
, imm
);
4636 gen_helper_neon_shl_u64(cpu_V0
, cpu_V0
, cpu_V1
);
4638 gen_helper_neon_shl_s64(cpu_V0
, cpu_V0
, cpu_V1
);
4643 gen_helper_neon_rshl_u64(cpu_V0
, cpu_V0
, cpu_V1
);
4645 gen_helper_neon_rshl_s64(cpu_V0
, cpu_V0
, cpu_V1
);
4650 gen_helper_neon_shl_u64(cpu_V0
, cpu_V0
, cpu_V1
);
4652 case 5: /* VSHL, VSLI */
4653 gen_helper_neon_shl_u64(cpu_V0
, cpu_V0
, cpu_V1
);
4655 case 6: /* VQSHLU */
4657 gen_helper_neon_qshlu_s64(cpu_V0
, cpu_env
,
4665 gen_helper_neon_qshl_u64(cpu_V0
, cpu_env
,
4668 gen_helper_neon_qshl_s64(cpu_V0
, cpu_env
,
4673 if (op
== 1 || op
== 3) {
4675 neon_load_reg64(cpu_V0
, rd
+ pass
);
4676 tcg_gen_add_i64(cpu_V0
, cpu_V0
, cpu_V1
);
4677 } else if (op
== 4 || (op
== 5 && u
)) {
4679 cpu_abort(env
, "VS[LR]I.64 not implemented");
4681 neon_store_reg64(cpu_V0
, rd
+ pass
);
4682 } else { /* size < 3 */
4683 /* Operands in T0 and T1. */
4684 tmp
= neon_load_reg(rm
, pass
);
4686 tcg_gen_movi_i32(tmp2
, imm
);
4690 GEN_NEON_INTEGER_OP(shl
);
4694 GEN_NEON_INTEGER_OP(rshl
);
4699 GEN_NEON_INTEGER_OP(shl
);
4701 case 5: /* VSHL, VSLI */
4703 case 0: gen_helper_neon_shl_u8(tmp
, tmp
, tmp2
); break;
4704 case 1: gen_helper_neon_shl_u16(tmp
, tmp
, tmp2
); break;
4705 case 2: gen_helper_neon_shl_u32(tmp
, tmp
, tmp2
); break;
4709 case 6: /* VQSHLU */
4715 gen_helper_neon_qshlu_s8(tmp
, cpu_env
,
4719 gen_helper_neon_qshlu_s16(tmp
, cpu_env
,
4723 gen_helper_neon_qshlu_s32(tmp
, cpu_env
,
4731 GEN_NEON_INTEGER_OP_ENV(qshl
);
4736 if (op
== 1 || op
== 3) {
4738 tmp2
= neon_load_reg(rd
, pass
);
4739 gen_neon_add(size
, tmp2
, tmp
);
4741 } else if (op
== 4 || (op
== 5 && u
)) {
4746 mask
= 0xff >> -shift
;
4748 mask
= (uint8_t)(0xff << shift
);
4754 mask
= 0xffff >> -shift
;
4756 mask
= (uint16_t)(0xffff << shift
);
4760 if (shift
< -31 || shift
> 31) {
4764 mask
= 0xffffffffu
>> -shift
;
4766 mask
= 0xffffffffu
<< shift
;
4772 tmp2
= neon_load_reg(rd
, pass
);
4773 tcg_gen_andi_i32(tmp
, tmp
, mask
);
4774 tcg_gen_andi_i32(tmp2
, tmp2
, ~mask
);
4775 tcg_gen_or_i32(tmp
, tmp
, tmp2
);
4778 neon_store_reg(rd
, pass
, tmp
);
4781 } else if (op
< 10) {
4782 /* Shift by immediate and narrow:
4783 VSHRN, VRSHRN, VQSHRN, VQRSHRN. */
4784 shift
= shift
- (1 << (size
+ 3));
4788 imm
= (uint16_t)shift
;
4790 tmp2
= tcg_const_i32(imm
);
4791 TCGV_UNUSED_I64(tmp64
);
4794 imm
= (uint32_t)shift
;
4795 tmp2
= tcg_const_i32(imm
);
4796 TCGV_UNUSED_I64(tmp64
);
4799 tmp64
= tcg_const_i64(shift
);
4806 for (pass
= 0; pass
< 2; pass
++) {
4808 neon_load_reg64(cpu_V0
, rm
+ pass
);
4811 gen_helper_neon_rshl_u64(cpu_V0
, cpu_V0
, tmp64
);
4813 gen_helper_neon_rshl_s64(cpu_V0
, cpu_V0
, tmp64
);
4816 gen_helper_neon_shl_u64(cpu_V0
, cpu_V0
, tmp64
);
4818 gen_helper_neon_shl_s64(cpu_V0
, cpu_V0
, tmp64
);
4821 tmp
= neon_load_reg(rm
+ pass
, 0);
4822 gen_neon_shift_narrow(size
, tmp
, tmp2
, q
, u
);
4823 tmp3
= neon_load_reg(rm
+ pass
, 1);
4824 gen_neon_shift_narrow(size
, tmp3
, tmp2
, q
, u
);
4825 tcg_gen_concat_i32_i64(cpu_V0
, tmp
, tmp3
);
4830 if (op
== 8 && !u
) {
4831 gen_neon_narrow(size
- 1, tmp
, cpu_V0
);
4834 gen_neon_narrow_sats(size
- 1, tmp
, cpu_V0
);
4836 gen_neon_narrow_satu(size
- 1, tmp
, cpu_V0
);
4838 neon_store_reg(rd
, pass
, tmp
);
4841 tcg_temp_free_i64(tmp64
);
4845 } else if (op
== 10) {
4849 tmp
= neon_load_reg(rm
, 0);
4850 tmp2
= neon_load_reg(rm
, 1);
4851 for (pass
= 0; pass
< 2; pass
++) {
4855 gen_neon_widen(cpu_V0
, tmp
, size
, u
);
4858 /* The shift is less than the width of the source
4859 type, so we can just shift the whole register. */
4860 tcg_gen_shli_i64(cpu_V0
, cpu_V0
, shift
);
4861 if (size
< 2 || !u
) {
4864 imm
= (0xffu
>> (8 - shift
));
4867 imm
= 0xffff >> (16 - shift
);
4869 imm64
= imm
| (((uint64_t)imm
) << 32);
4870 tcg_gen_andi_i64(cpu_V0
, cpu_V0
, imm64
);
4873 neon_store_reg64(cpu_V0
, rd
+ pass
);
4875 } else if (op
>= 14) {
4876 /* VCVT fixed-point. */
4877 /* We have already masked out the must-be-1 top bit of imm6,
4878 * hence this 32-shift where the ARM ARM has 64-imm6.
4881 for (pass
= 0; pass
< (q
? 4 : 2); pass
++) {
4882 tcg_gen_ld_f32(cpu_F0s
, cpu_env
, neon_reg_offset(rm
, pass
));
4885 gen_vfp_ulto(0, shift
);
4887 gen_vfp_slto(0, shift
);
4890 gen_vfp_toul(0, shift
);
4892 gen_vfp_tosl(0, shift
);
4894 tcg_gen_st_f32(cpu_F0s
, cpu_env
, neon_reg_offset(rd
, pass
));
4899 } else { /* (insn & 0x00380080) == 0 */
4902 op
= (insn
>> 8) & 0xf;
4903 /* One register and immediate. */
4904 imm
= (u
<< 7) | ((insn
>> 12) & 0x70) | (insn
& 0xf);
4905 invert
= (insn
& (1 << 5)) != 0;
4923 imm
= (imm
<< 8) | (imm
<< 24);
4926 imm
= (imm
<< 8) | 0xff;
4929 imm
= (imm
<< 16) | 0xffff;
4932 imm
|= (imm
<< 8) | (imm
<< 16) | (imm
<< 24);
4937 imm
= ((imm
& 0x80) << 24) | ((imm
& 0x3f) << 19)
4938 | ((imm
& 0x40) ? (0x1f << 25) : (1 << 30));
4944 for (pass
= 0; pass
< (q
? 4 : 2); pass
++) {
4945 if (op
& 1 && op
< 12) {
4946 tmp
= neon_load_reg(rd
, pass
);
4948 /* The immediate value has already been inverted, so
4950 tcg_gen_andi_i32(tmp
, tmp
, imm
);
4952 tcg_gen_ori_i32(tmp
, tmp
, imm
);
4957 if (op
== 14 && invert
) {
4960 for (n
= 0; n
< 4; n
++) {
4961 if (imm
& (1 << (n
+ (pass
& 1) * 4)))
4962 val
|= 0xff << (n
* 8);
4964 tcg_gen_movi_i32(tmp
, val
);
4966 tcg_gen_movi_i32(tmp
, imm
);
4969 neon_store_reg(rd
, pass
, tmp
);
4972 } else { /* (insn & 0x00800010 == 0x00800000) */
4974 op
= (insn
>> 8) & 0xf;
4975 if ((insn
& (1 << 6)) == 0) {
4976 /* Three registers of different lengths. */
4980 /* prewiden, src1_wide, src2_wide */
4981 static const int neon_3reg_wide
[16][3] = {
4982 {1, 0, 0}, /* VADDL */
4983 {1, 1, 0}, /* VADDW */
4984 {1, 0, 0}, /* VSUBL */
4985 {1, 1, 0}, /* VSUBW */
4986 {0, 1, 1}, /* VADDHN */
4987 {0, 0, 0}, /* VABAL */
4988 {0, 1, 1}, /* VSUBHN */
4989 {0, 0, 0}, /* VABDL */
4990 {0, 0, 0}, /* VMLAL */
4991 {0, 0, 0}, /* VQDMLAL */
4992 {0, 0, 0}, /* VMLSL */
4993 {0, 0, 0}, /* VQDMLSL */
4994 {0, 0, 0}, /* Integer VMULL */
4995 {0, 0, 0}, /* VQDMULL */
4996 {0, 0, 0} /* Polynomial VMULL */
4999 prewiden
= neon_3reg_wide
[op
][0];
5000 src1_wide
= neon_3reg_wide
[op
][1];
5001 src2_wide
= neon_3reg_wide
[op
][2];
5003 if (size
== 0 && (op
== 9 || op
== 11 || op
== 13))
5006 /* Avoid overlapping operands. Wide source operands are
5007 always aligned so will never overlap with wide
5008 destinations in problematic ways. */
5009 if (rd
== rm
&& !src2_wide
) {
5010 tmp
= neon_load_reg(rm
, 1);
5011 neon_store_scratch(2, tmp
);
5012 } else if (rd
== rn
&& !src1_wide
) {
5013 tmp
= neon_load_reg(rn
, 1);
5014 neon_store_scratch(2, tmp
);
5017 for (pass
= 0; pass
< 2; pass
++) {
5019 neon_load_reg64(cpu_V0
, rn
+ pass
);
5022 if (pass
== 1 && rd
== rn
) {
5023 tmp
= neon_load_scratch(2);
5025 tmp
= neon_load_reg(rn
, pass
);
5028 gen_neon_widen(cpu_V0
, tmp
, size
, u
);
5032 neon_load_reg64(cpu_V1
, rm
+ pass
);
5035 if (pass
== 1 && rd
== rm
) {
5036 tmp2
= neon_load_scratch(2);
5038 tmp2
= neon_load_reg(rm
, pass
);
5041 gen_neon_widen(cpu_V1
, tmp2
, size
, u
);
5045 case 0: case 1: case 4: /* VADDL, VADDW, VADDHN, VRADDHN */
5046 gen_neon_addl(size
);
5048 case 2: case 3: case 6: /* VSUBL, VSUBW, VSUBHN, VRSUBHN */
5049 gen_neon_subl(size
);
5051 case 5: case 7: /* VABAL, VABDL */
5052 switch ((size
<< 1) | u
) {
5054 gen_helper_neon_abdl_s16(cpu_V0
, tmp
, tmp2
);
5057 gen_helper_neon_abdl_u16(cpu_V0
, tmp
, tmp2
);
5060 gen_helper_neon_abdl_s32(cpu_V0
, tmp
, tmp2
);
5063 gen_helper_neon_abdl_u32(cpu_V0
, tmp
, tmp2
);
5066 gen_helper_neon_abdl_s64(cpu_V0
, tmp
, tmp2
);
5069 gen_helper_neon_abdl_u64(cpu_V0
, tmp
, tmp2
);
5076 case 8: case 9: case 10: case 11: case 12: case 13:
5077 /* VMLAL, VQDMLAL, VMLSL, VQDMLSL, VMULL, VQDMULL */
5078 gen_neon_mull(cpu_V0
, tmp
, tmp2
, size
, u
);
5082 case 14: /* Polynomial VMULL */
5083 cpu_abort(env
, "Polynomial VMULL not implemented");
5085 default: /* 15 is RESERVED. */
5088 if (op
== 5 || op
== 13 || (op
>= 8 && op
<= 11)) {
5090 if (op
== 10 || op
== 11) {
5091 gen_neon_negl(cpu_V0
, size
);
5095 neon_load_reg64(cpu_V1
, rd
+ pass
);
5099 case 5: case 8: case 10: /* VABAL, VMLAL, VMLSL */
5100 gen_neon_addl(size
);
5102 case 9: case 11: /* VQDMLAL, VQDMLSL */
5103 gen_neon_addl_saturate(cpu_V0
, cpu_V0
, size
);
5104 gen_neon_addl_saturate(cpu_V0
, cpu_V1
, size
);
5107 case 13: /* VQDMULL */
5108 gen_neon_addl_saturate(cpu_V0
, cpu_V0
, size
);
5113 neon_store_reg64(cpu_V0
, rd
+ pass
);
5114 } else if (op
== 4 || op
== 6) {
5115 /* Narrowing operation. */
5120 gen_helper_neon_narrow_high_u8(tmp
, cpu_V0
);
5123 gen_helper_neon_narrow_high_u16(tmp
, cpu_V0
);
5126 tcg_gen_shri_i64(cpu_V0
, cpu_V0
, 32);
5127 tcg_gen_trunc_i64_i32(tmp
, cpu_V0
);
5134 gen_helper_neon_narrow_round_high_u8(tmp
, cpu_V0
);
5137 gen_helper_neon_narrow_round_high_u16(tmp
, cpu_V0
);
5140 tcg_gen_addi_i64(cpu_V0
, cpu_V0
, 1u << 31);
5141 tcg_gen_shri_i64(cpu_V0
, cpu_V0
, 32);
5142 tcg_gen_trunc_i64_i32(tmp
, cpu_V0
);
5150 neon_store_reg(rd
, 0, tmp3
);
5151 neon_store_reg(rd
, 1, tmp
);
5154 /* Write back the result. */
5155 neon_store_reg64(cpu_V0
, rd
+ pass
);
5159 /* Two registers and a scalar. */
5161 case 0: /* Integer VMLA scalar */
5162 case 1: /* Float VMLA scalar */
5163 case 4: /* Integer VMLS scalar */
5164 case 5: /* Floating point VMLS scalar */
5165 case 8: /* Integer VMUL scalar */
5166 case 9: /* Floating point VMUL scalar */
5167 case 12: /* VQDMULH scalar */
5168 case 13: /* VQRDMULH scalar */
5169 tmp
= neon_get_scalar(size
, rm
);
5170 neon_store_scratch(0, tmp
);
5171 for (pass
= 0; pass
< (u
? 4 : 2); pass
++) {
5172 tmp
= neon_load_scratch(0);
5173 tmp2
= neon_load_reg(rn
, pass
);
5176 gen_helper_neon_qdmulh_s16(tmp
, cpu_env
, tmp
, tmp2
);
5178 gen_helper_neon_qdmulh_s32(tmp
, cpu_env
, tmp
, tmp2
);
5180 } else if (op
== 13) {
5182 gen_helper_neon_qrdmulh_s16(tmp
, cpu_env
, tmp
, tmp2
);
5184 gen_helper_neon_qrdmulh_s32(tmp
, cpu_env
, tmp
, tmp2
);
5186 } else if (op
& 1) {
5187 gen_helper_neon_mul_f32(tmp
, tmp
, tmp2
);
5190 case 0: gen_helper_neon_mul_u8(tmp
, tmp
, tmp2
); break;
5191 case 1: gen_helper_neon_mul_u16(tmp
, tmp
, tmp2
); break;
5192 case 2: tcg_gen_mul_i32(tmp
, tmp
, tmp2
); break;
5199 tmp2
= neon_load_reg(rd
, pass
);
5202 gen_neon_add(size
, tmp
, tmp2
);
5205 gen_helper_neon_add_f32(tmp
, tmp
, tmp2
);
5208 gen_neon_rsb(size
, tmp
, tmp2
);
5211 gen_helper_neon_sub_f32(tmp
, tmp2
, tmp
);
5218 neon_store_reg(rd
, pass
, tmp
);
5221 case 2: /* VMLAL sclar */
5222 case 3: /* VQDMLAL scalar */
5223 case 6: /* VMLSL scalar */
5224 case 7: /* VQDMLSL scalar */
5225 case 10: /* VMULL scalar */
5226 case 11: /* VQDMULL scalar */
5227 if (size
== 0 && (op
== 3 || op
== 7 || op
== 11))
5230 tmp2
= neon_get_scalar(size
, rm
);
5231 tmp3
= neon_load_reg(rn
, 1);
5233 for (pass
= 0; pass
< 2; pass
++) {
5235 tmp
= neon_load_reg(rn
, 0);
5239 gen_neon_mull(cpu_V0
, tmp
, tmp2
, size
, u
);
5241 if (op
== 6 || op
== 7) {
5242 gen_neon_negl(cpu_V0
, size
);
5245 neon_load_reg64(cpu_V1
, rd
+ pass
);
5249 gen_neon_addl(size
);
5252 gen_neon_addl_saturate(cpu_V0
, cpu_V0
, size
);
5253 gen_neon_addl_saturate(cpu_V0
, cpu_V1
, size
);
5259 gen_neon_addl_saturate(cpu_V0
, cpu_V0
, size
);
5264 neon_store_reg64(cpu_V0
, rd
+ pass
);
5270 default: /* 14 and 15 are RESERVED */
5274 } else { /* size == 3 */
5277 imm
= (insn
>> 8) & 0xf;
5283 neon_load_reg64(cpu_V0
, rn
);
5285 neon_load_reg64(cpu_V1
, rn
+ 1);
5287 } else if (imm
== 8) {
5288 neon_load_reg64(cpu_V0
, rn
+ 1);
5290 neon_load_reg64(cpu_V1
, rm
);
5293 tmp64
= tcg_temp_new_i64();
5295 neon_load_reg64(cpu_V0
, rn
);
5296 neon_load_reg64(tmp64
, rn
+ 1);
5298 neon_load_reg64(cpu_V0
, rn
+ 1);
5299 neon_load_reg64(tmp64
, rm
);
5301 tcg_gen_shri_i64(cpu_V0
, cpu_V0
, (imm
& 7) * 8);
5302 tcg_gen_shli_i64(cpu_V1
, tmp64
, 64 - ((imm
& 7) * 8));
5303 tcg_gen_or_i64(cpu_V0
, cpu_V0
, cpu_V1
);
5305 neon_load_reg64(cpu_V1
, rm
);
5307 neon_load_reg64(cpu_V1
, rm
+ 1);
5310 tcg_gen_shli_i64(cpu_V1
, cpu_V1
, 64 - (imm
* 8));
5311 tcg_gen_shri_i64(tmp64
, tmp64
, imm
* 8);
5312 tcg_gen_or_i64(cpu_V1
, cpu_V1
, tmp64
);
5313 tcg_temp_free_i64(tmp64
);
5316 neon_load_reg64(cpu_V0
, rn
);
5317 tcg_gen_shri_i64(cpu_V0
, cpu_V0
, imm
* 8);
5318 neon_load_reg64(cpu_V1
, rm
);
5319 tcg_gen_shli_i64(cpu_V1
, cpu_V1
, 64 - (imm
* 8));
5320 tcg_gen_or_i64(cpu_V0
, cpu_V0
, cpu_V1
);
5322 neon_store_reg64(cpu_V0
, rd
);
5324 neon_store_reg64(cpu_V1
, rd
+ 1);
5326 } else if ((insn
& (1 << 11)) == 0) {
5327 /* Two register misc. */
5328 op
= ((insn
>> 12) & 0x30) | ((insn
>> 7) & 0xf);
5329 size
= (insn
>> 18) & 3;
5331 case 0: /* VREV64 */
5334 for (pass
= 0; pass
< (q
? 2 : 1); pass
++) {
5335 tmp
= neon_load_reg(rm
, pass
* 2);
5336 tmp2
= neon_load_reg(rm
, pass
* 2 + 1);
5338 case 0: tcg_gen_bswap32_i32(tmp
, tmp
); break;
5339 case 1: gen_swap_half(tmp
); break;
5340 case 2: /* no-op */ break;
5343 neon_store_reg(rd
, pass
* 2 + 1, tmp
);
5345 neon_store_reg(rd
, pass
* 2, tmp2
);
5348 case 0: tcg_gen_bswap32_i32(tmp2
, tmp2
); break;
5349 case 1: gen_swap_half(tmp2
); break;
5352 neon_store_reg(rd
, pass
* 2, tmp2
);
5356 case 4: case 5: /* VPADDL */
5357 case 12: case 13: /* VPADAL */
5360 for (pass
= 0; pass
< q
+ 1; pass
++) {
5361 tmp
= neon_load_reg(rm
, pass
* 2);
5362 gen_neon_widen(cpu_V0
, tmp
, size
, op
& 1);
5363 tmp
= neon_load_reg(rm
, pass
* 2 + 1);
5364 gen_neon_widen(cpu_V1
, tmp
, size
, op
& 1);
5366 case 0: gen_helper_neon_paddl_u16(CPU_V001
); break;
5367 case 1: gen_helper_neon_paddl_u32(CPU_V001
); break;
5368 case 2: tcg_gen_add_i64(CPU_V001
); break;
5373 neon_load_reg64(cpu_V1
, rd
+ pass
);
5374 gen_neon_addl(size
);
5376 neon_store_reg64(cpu_V0
, rd
+ pass
);
5381 for (n
= 0; n
< (q
? 4 : 2); n
+= 2) {
5382 tmp
= neon_load_reg(rm
, n
);
5383 tmp2
= neon_load_reg(rd
, n
+ 1);
5384 neon_store_reg(rm
, n
, tmp2
);
5385 neon_store_reg(rd
, n
+ 1, tmp
);
5393 Rd A3 A2 A1 A0 B2 B0 A2 A0
5394 Rm B3 B2 B1 B0 B3 B1 A3 A1
5398 gen_neon_unzip(rd
, q
, 0, size
);
5399 gen_neon_unzip(rm
, q
, 4, size
);
5401 static int unzip_order_q
[8] =
5402 {0, 2, 4, 6, 1, 3, 5, 7};
5403 for (n
= 0; n
< 8; n
++) {
5404 int reg
= (n
< 4) ? rd
: rm
;
5405 tmp
= neon_load_scratch(unzip_order_q
[n
]);
5406 neon_store_reg(reg
, n
% 4, tmp
);
5409 static int unzip_order
[4] =
5411 for (n
= 0; n
< 4; n
++) {
5412 int reg
= (n
< 2) ? rd
: rm
;
5413 tmp
= neon_load_scratch(unzip_order
[n
]);
5414 neon_store_reg(reg
, n
% 2, tmp
);
5420 Rd A3 A2 A1 A0 B1 A1 B0 A0
5421 Rm B3 B2 B1 B0 B3 A3 B2 A2
5425 count
= (q
? 4 : 2);
5426 for (n
= 0; n
< count
; n
++) {
5427 tmp
= neon_load_reg(rd
, n
);
5428 tmp2
= neon_load_reg(rd
, n
);
5430 case 0: gen_neon_zip_u8(tmp
, tmp2
); break;
5431 case 1: gen_neon_zip_u16(tmp
, tmp2
); break;
5432 case 2: /* no-op */; break;
5435 neon_store_scratch(n
* 2, tmp
);
5436 neon_store_scratch(n
* 2 + 1, tmp2
);
5438 for (n
= 0; n
< count
* 2; n
++) {
5439 int reg
= (n
< count
) ? rd
: rm
;
5440 tmp
= neon_load_scratch(n
);
5441 neon_store_reg(reg
, n
% count
, tmp
);
5444 case 36: case 37: /* VMOVN, VQMOVUN, VQMOVN */
5448 for (pass
= 0; pass
< 2; pass
++) {
5449 neon_load_reg64(cpu_V0
, rm
+ pass
);
5451 if (op
== 36 && q
== 0) {
5452 gen_neon_narrow(size
, tmp
, cpu_V0
);
5454 gen_neon_narrow_satu(size
, tmp
, cpu_V0
);
5456 gen_neon_narrow_sats(size
, tmp
, cpu_V0
);
5461 neon_store_reg(rd
, 0, tmp2
);
5462 neon_store_reg(rd
, 1, tmp
);
5466 case 38: /* VSHLL */
5469 tmp
= neon_load_reg(rm
, 0);
5470 tmp2
= neon_load_reg(rm
, 1);
5471 for (pass
= 0; pass
< 2; pass
++) {
5474 gen_neon_widen(cpu_V0
, tmp
, size
, 1);
5475 tcg_gen_shli_i64(cpu_V0
, cpu_V0
, 8 << size
);
5476 neon_store_reg64(cpu_V0
, rd
+ pass
);
5479 case 44: /* VCVT.F16.F32 */
5480 if (!arm_feature(env
, ARM_FEATURE_VFP_FP16
))
5484 tcg_gen_ld_f32(cpu_F0s
, cpu_env
, neon_reg_offset(rm
, 0));
5485 gen_helper_vfp_fcvt_f32_to_f16(tmp
, cpu_F0s
, cpu_env
);
5486 tcg_gen_ld_f32(cpu_F0s
, cpu_env
, neon_reg_offset(rm
, 1));
5487 gen_helper_vfp_fcvt_f32_to_f16(tmp2
, cpu_F0s
, cpu_env
);
5488 tcg_gen_shli_i32(tmp2
, tmp2
, 16);
5489 tcg_gen_or_i32(tmp2
, tmp2
, tmp
);
5490 tcg_gen_ld_f32(cpu_F0s
, cpu_env
, neon_reg_offset(rm
, 2));
5491 gen_helper_vfp_fcvt_f32_to_f16(tmp
, cpu_F0s
, cpu_env
);
5492 tcg_gen_ld_f32(cpu_F0s
, cpu_env
, neon_reg_offset(rm
, 3));
5493 neon_store_reg(rd
, 0, tmp2
);
5495 gen_helper_vfp_fcvt_f32_to_f16(tmp2
, cpu_F0s
, cpu_env
);
5496 tcg_gen_shli_i32(tmp2
, tmp2
, 16);
5497 tcg_gen_or_i32(tmp2
, tmp2
, tmp
);
5498 neon_store_reg(rd
, 1, tmp2
);
5501 case 46: /* VCVT.F32.F16 */
5502 if (!arm_feature(env
, ARM_FEATURE_VFP_FP16
))
5505 tmp
= neon_load_reg(rm
, 0);
5506 tmp2
= neon_load_reg(rm
, 1);
5507 tcg_gen_ext16u_i32(tmp3
, tmp
);
5508 gen_helper_vfp_fcvt_f16_to_f32(cpu_F0s
, tmp3
, cpu_env
);
5509 tcg_gen_st_f32(cpu_F0s
, cpu_env
, neon_reg_offset(rd
, 0));
5510 tcg_gen_shri_i32(tmp3
, tmp
, 16);
5511 gen_helper_vfp_fcvt_f16_to_f32(cpu_F0s
, tmp3
, cpu_env
);
5512 tcg_gen_st_f32(cpu_F0s
, cpu_env
, neon_reg_offset(rd
, 1));
5514 tcg_gen_ext16u_i32(tmp3
, tmp2
);
5515 gen_helper_vfp_fcvt_f16_to_f32(cpu_F0s
, tmp3
, cpu_env
);
5516 tcg_gen_st_f32(cpu_F0s
, cpu_env
, neon_reg_offset(rd
, 2));
5517 tcg_gen_shri_i32(tmp3
, tmp2
, 16);
5518 gen_helper_vfp_fcvt_f16_to_f32(cpu_F0s
, tmp3
, cpu_env
);
5519 tcg_gen_st_f32(cpu_F0s
, cpu_env
, neon_reg_offset(rd
, 3));
5525 for (pass
= 0; pass
< (q
? 4 : 2); pass
++) {
5526 if (op
== 30 || op
== 31 || op
>= 58) {
5527 tcg_gen_ld_f32(cpu_F0s
, cpu_env
,
5528 neon_reg_offset(rm
, pass
));
5531 tmp
= neon_load_reg(rm
, pass
);
5534 case 1: /* VREV32 */
5536 case 0: tcg_gen_bswap32_i32(tmp
, tmp
); break;
5537 case 1: gen_swap_half(tmp
); break;
5541 case 2: /* VREV16 */
5548 case 0: gen_helper_neon_cls_s8(tmp
, tmp
); break;
5549 case 1: gen_helper_neon_cls_s16(tmp
, tmp
); break;
5550 case 2: gen_helper_neon_cls_s32(tmp
, tmp
); break;
5556 case 0: gen_helper_neon_clz_u8(tmp
, tmp
); break;
5557 case 1: gen_helper_neon_clz_u16(tmp
, tmp
); break;
5558 case 2: gen_helper_clz(tmp
, tmp
); break;
5565 gen_helper_neon_cnt_u8(tmp
, tmp
);
5570 tcg_gen_not_i32(tmp
, tmp
);
5572 case 14: /* VQABS */
5574 case 0: gen_helper_neon_qabs_s8(tmp
, cpu_env
, tmp
); break;
5575 case 1: gen_helper_neon_qabs_s16(tmp
, cpu_env
, tmp
); break;
5576 case 2: gen_helper_neon_qabs_s32(tmp
, cpu_env
, tmp
); break;
5580 case 15: /* VQNEG */
5582 case 0: gen_helper_neon_qneg_s8(tmp
, cpu_env
, tmp
); break;
5583 case 1: gen_helper_neon_qneg_s16(tmp
, cpu_env
, tmp
); break;
5584 case 2: gen_helper_neon_qneg_s32(tmp
, cpu_env
, tmp
); break;
5588 case 16: case 19: /* VCGT #0, VCLE #0 */
5589 tmp2
= tcg_const_i32(0);
5591 case 0: gen_helper_neon_cgt_s8(tmp
, tmp
, tmp2
); break;
5592 case 1: gen_helper_neon_cgt_s16(tmp
, tmp
, tmp2
); break;
5593 case 2: gen_helper_neon_cgt_s32(tmp
, tmp
, tmp2
); break;
5596 tcg_temp_free(tmp2
);
5598 tcg_gen_not_i32(tmp
, tmp
);
5600 case 17: case 20: /* VCGE #0, VCLT #0 */
5601 tmp2
= tcg_const_i32(0);
5603 case 0: gen_helper_neon_cge_s8(tmp
, tmp
, tmp2
); break;
5604 case 1: gen_helper_neon_cge_s16(tmp
, tmp
, tmp2
); break;
5605 case 2: gen_helper_neon_cge_s32(tmp
, tmp
, tmp2
); break;
5608 tcg_temp_free(tmp2
);
5610 tcg_gen_not_i32(tmp
, tmp
);
5612 case 18: /* VCEQ #0 */
5613 tmp2
= tcg_const_i32(0);
5615 case 0: gen_helper_neon_ceq_u8(tmp
, tmp
, tmp2
); break;
5616 case 1: gen_helper_neon_ceq_u16(tmp
, tmp
, tmp2
); break;
5617 case 2: gen_helper_neon_ceq_u32(tmp
, tmp
, tmp2
); break;
5620 tcg_temp_free(tmp2
);
5624 case 0: gen_helper_neon_abs_s8(tmp
, tmp
); break;
5625 case 1: gen_helper_neon_abs_s16(tmp
, tmp
); break;
5626 case 2: tcg_gen_abs_i32(tmp
, tmp
); break;
5633 tmp2
= tcg_const_i32(0);
5634 gen_neon_rsb(size
, tmp
, tmp2
);
5635 tcg_temp_free(tmp2
);
5637 case 24: case 27: /* Float VCGT #0, Float VCLE #0 */
5638 tmp2
= tcg_const_i32(0);
5639 gen_helper_neon_cgt_f32(tmp
, tmp
, tmp2
);
5640 tcg_temp_free(tmp2
);
5642 tcg_gen_not_i32(tmp
, tmp
);
5644 case 25: case 28: /* Float VCGE #0, Float VCLT #0 */
5645 tmp2
= tcg_const_i32(0);
5646 gen_helper_neon_cge_f32(tmp
, tmp
, tmp2
);
5647 tcg_temp_free(tmp2
);
5649 tcg_gen_not_i32(tmp
, tmp
);
5651 case 26: /* Float VCEQ #0 */
5652 tmp2
= tcg_const_i32(0);
5653 gen_helper_neon_ceq_f32(tmp
, tmp
, tmp2
);
5654 tcg_temp_free(tmp2
);
5656 case 30: /* Float VABS */
5659 case 31: /* Float VNEG */
5663 tmp2
= neon_load_reg(rd
, pass
);
5664 neon_store_reg(rm
, pass
, tmp2
);
5667 tmp2
= neon_load_reg(rd
, pass
);
5669 case 0: gen_neon_trn_u8(tmp
, tmp2
); break;
5670 case 1: gen_neon_trn_u16(tmp
, tmp2
); break;
5674 neon_store_reg(rm
, pass
, tmp2
);
5676 case 56: /* Integer VRECPE */
5677 gen_helper_recpe_u32(tmp
, tmp
, cpu_env
);
5679 case 57: /* Integer VRSQRTE */
5680 gen_helper_rsqrte_u32(tmp
, tmp
, cpu_env
);
5682 case 58: /* Float VRECPE */
5683 gen_helper_recpe_f32(cpu_F0s
, cpu_F0s
, cpu_env
);
5685 case 59: /* Float VRSQRTE */
5686 gen_helper_rsqrte_f32(cpu_F0s
, cpu_F0s
, cpu_env
);
5688 case 60: /* VCVT.F32.S32 */
5691 case 61: /* VCVT.F32.U32 */
5694 case 62: /* VCVT.S32.F32 */
5697 case 63: /* VCVT.U32.F32 */
5701 /* Reserved: 21, 29, 39-56 */
5704 if (op
== 30 || op
== 31 || op
>= 58) {
5705 tcg_gen_st_f32(cpu_F0s
, cpu_env
,
5706 neon_reg_offset(rd
, pass
));
5708 neon_store_reg(rd
, pass
, tmp
);
5713 } else if ((insn
& (1 << 10)) == 0) {
5715 n
= ((insn
>> 5) & 0x18) + 8;
5716 if (insn
& (1 << 6)) {
5717 tmp
= neon_load_reg(rd
, 0);
5720 tcg_gen_movi_i32(tmp
, 0);
5722 tmp2
= neon_load_reg(rm
, 0);
5723 tmp4
= tcg_const_i32(rn
);
5724 tmp5
= tcg_const_i32(n
);
5725 gen_helper_neon_tbl(tmp2
, tmp2
, tmp
, tmp4
, tmp5
);
5727 if (insn
& (1 << 6)) {
5728 tmp
= neon_load_reg(rd
, 1);
5731 tcg_gen_movi_i32(tmp
, 0);
5733 tmp3
= neon_load_reg(rm
, 1);
5734 gen_helper_neon_tbl(tmp3
, tmp3
, tmp
, tmp4
, tmp5
);
5735 tcg_temp_free_i32(tmp5
);
5736 tcg_temp_free_i32(tmp4
);
5737 neon_store_reg(rd
, 0, tmp2
);
5738 neon_store_reg(rd
, 1, tmp3
);
5740 } else if ((insn
& 0x380) == 0) {
5742 if (insn
& (1 << 19)) {
5743 tmp
= neon_load_reg(rm
, 1);
5745 tmp
= neon_load_reg(rm
, 0);
5747 if (insn
& (1 << 16)) {
5748 gen_neon_dup_u8(tmp
, ((insn
>> 17) & 3) * 8);
5749 } else if (insn
& (1 << 17)) {
5750 if ((insn
>> 18) & 1)
5751 gen_neon_dup_high16(tmp
);
5753 gen_neon_dup_low16(tmp
);
5755 for (pass
= 0; pass
< (q
? 4 : 2); pass
++) {
5757 tcg_gen_mov_i32(tmp2
, tmp
);
5758 neon_store_reg(rd
, pass
, tmp2
);
/* Translate a coprocessor 14 register read whose destination is ARM
   register rt.
   Fields decoded from insn: crn = bits [19:16], crm = bits [3:0],
   op1 = bits [23:21], op2 = bits [7:5], rt = bits [15:12].
   Two registers are handled, both only when the CPU has
   ARM_FEATURE_THUMB2EE: the teecr CPU field (op1=6, crn=0, crm=0, op2=0)
   and the teehbr CPU field (op1=6, crn=1, crm=0, op2=0).
   NOTE(review): the return statements and the declaration of tmp are not
   visible in this listing; presumably a nonzero return means the
   instruction was rejected -- confirm against the caller. */
5769 static int disas_cp14_read(CPUState
* env
, DisasContext
*s
, uint32_t insn
)
/* Decode the register-selection fields of the instruction word. */
5771 int crn
= (insn
>> 16) & 0xf;
5772 int crm
= insn
& 0xf;
5773 int op1
= (insn
>> 21) & 7;
5774 int op2
= (insn
>> 5) & 7;
5775 int rt
= (insn
>> 12) & 0xf;
5778 if (arm_feature(env
, ARM_FEATURE_THUMB2EE
)) {
/* teecr: copy the CPU field into register rt. */
5779 if (op1
== 6 && crn
== 0 && crm
== 0 && op2
== 0) {
5783 tmp
= load_cpu_field(teecr
);
5784 store_reg(s
, rt
, tmp
);
/* teehbr: copy the CPU field into register rt. */
5787 if (op1
== 6 && crn
== 1 && crm
== 0 && op2
== 0) {
/* Extra check for user mode when bit 0 of env->teecr is set; the action
   taken when it is true is not visible in this listing. */
5789 if (IS_USER(s
) && (env
->teecr
& 1))
5791 tmp
= load_cpu_field(teehbr
);
5792 store_reg(s
, rt
, tmp
);
/* Report an unrecognised op1/crn/crm/op2 combination on stderr. */
5796 fprintf(stderr
, "Unknown cp14 read op1:%d crn:%d crm:%d op2:%d\n",
5797 op1
, crn
, crm
, op2
);
/* Translate a coprocessor 14 register write whose source is ARM
   register rt.
   Fields decoded from insn: crn = bits [19:16], crm = bits [3:0],
   op1 = bits [23:21], op2 = bits [7:5], rt = bits [15:12].
   Two registers are handled, both only when the CPU has
   ARM_FEATURE_THUMB2EE: teecr (op1=6, crn=0, crm=0, op2=0), written
   through gen_helper_set_teecr, and teehbr (op1=6, crn=1, crm=0, op2=0),
   written with store_cpu_field.
   NOTE(review): the return statements and the declaration of tmp are not
   visible in this listing; presumably a nonzero return means the
   instruction was rejected -- confirm against the caller. */
5801 static int disas_cp14_write(CPUState
* env
, DisasContext
*s
, uint32_t insn
)
/* Decode the register-selection fields of the instruction word. */
5803 int crn
= (insn
>> 16) & 0xf;
5804 int crm
= insn
& 0xf;
5805 int op1
= (insn
>> 21) & 7;
5806 int op2
= (insn
>> 5) & 7;
5807 int rt
= (insn
>> 12) & 0xf;
5810 if (arm_feature(env
, ARM_FEATURE_THUMB2EE
)) {
/* teecr: the value of rt is handed to a helper rather than stored
   directly. */
5811 if (op1
== 6 && crn
== 0 && crm
== 0 && op2
== 0) {
5815 tmp
= load_reg(s
, rt
);
5816 gen_helper_set_teecr(cpu_env
, tmp
);
/* teehbr: the value of rt is stored straight into the CPU field. */
5820 if (op1
== 6 && crn
== 1 && crm
== 0 && op2
== 0) {
/* Extra check for user mode when bit 0 of env->teecr is set; the action
   taken when it is true is not visible in this listing. */
5822 if (IS_USER(s
) && (env
->teecr
& 1))
5824 tmp
= load_reg(s
, rt
);
5825 store_cpu_field(tmp
, teehbr
);
/* Report an unrecognised op1/crn/crm/op2 combination on stderr. */
5829 fprintf(stderr
, "Unknown cp14 write op1:%d crn:%d crm:%d op2:%d\n",
5830 op1
, crn
, crm
, op2
);
/* Route a coprocessor instruction to the matching decoder.
   cpnum is taken from insn bits [11:8].  The decoders called below are
   disas_iwmmxt_insn / disas_dsp_insn (chosen by CPU feature),
   disas_vfp_insn, disas_cp14_read / disas_cp14_write, disas_cp15_insn and,
   last, disas_cp_insn; the result of whichever call is made is returned
   unchanged.
   NOTE(review): the switch/case labels that map cpnum to each call are not
   visible in this listing. */
5834 static int disas_coproc_insn(CPUState
* env
, DisasContext
*s
, uint32_t insn
)
5838 cpnum
= (insn
>> 8) & 0xf;
/* XScale only: test the cpnum bit of c15_cpar after inverting its low 14
   bits, i.e. for coprocessors 0-13 the test is true when that bit is
   clear.  The action taken when it is true is not visible in this
   listing. */
5839 if (arm_feature(env
, ARM_FEATURE_XSCALE
)
5840 && ((env
->cp15
.c15_cpar
^ 0x3fff) & (1 << cpnum
)))
/* The iWMMXt decoder is tried before the XScale DSP decoder. */
5846 if (arm_feature(env
, ARM_FEATURE_IWMMXT
)) {
5847 return disas_iwmmxt_insn(env
, s
, insn
);
5848 } else if (arm_feature(env
, ARM_FEATURE_XSCALE
)) {
5849 return disas_dsp_insn(env
, s
, insn
);
5854 return disas_vfp_insn (env
, s
, insn
);
5856 /* Coprocessors 7-15 are architecturally reserved by ARM.
5857 Unfortunately Intel decided to ignore this. */
5858 if (arm_feature(env
, ARM_FEATURE_XSCALE
))
/* Bit 20 of insn selects the cp14 read decoder; the write decoder is the
   other call. */
5860 if (insn
& (1 << 20))
5861 return disas_cp14_read(env
, s
, insn
);
5863 return disas_cp14_write(env
, s
, insn
);
5865 return disas_cp15_insn (env
, s
, insn
);
5868 /* Unknown coprocessor. See if the board has hooked it. */
5869 return disas_cp_insn (env
, s
, insn
);
5874 /* Store a 64-bit value to a register pair. Clobbers val. */
/* The low 32 bits of val go to register rlow; val is then shifted right by
   32 in place (this is the clobber) and its new low 32 bits go to register
   rhigh.
   NOTE(review): the declaration and allocation of tmp are not visible in
   this listing. */
5875 static void gen_storeq_reg(DisasContext
*s
, int rlow
, int rhigh
, TCGv_i64 val
)
/* Low word -> rlow. */
5879 tcg_gen_trunc_i64_i32(tmp
, val
);
5880 store_reg(s
, rlow
, tmp
);
/* High word -> rhigh; the shift below modifies val itself. */
5882 tcg_gen_shri_i64(val
, val
, 32);
5883 tcg_gen_trunc_i64_i32(tmp
, val
);
5884 store_reg(s
, rhigh
, tmp
);
5887 /* Load a 32-bit value from a register and perform a 64-bit accumulate. */
/* Emits ops for: val += value of register rlow, widened to 64 bits with
   tcg_gen_extu_i32_i64 (the unsigned extension op).  val is updated in
   place and the 64-bit temporary is freed before returning.
   NOTE(review): the local declarations and the release of tmp2 are not
   visible in this listing. */
5888 static void gen_addq_lo(DisasContext
*s
, TCGv_i64 val
, int rlow
)
5893 /* Load value and extend to 64 bits. */
5894 tmp
= tcg_temp_new_i64();
5895 tmp2
= load_reg(s
, rlow
);
5896 tcg_gen_extu_i32_i64(tmp
, tmp2
);
/* Accumulate into val, then release the 64-bit temporary. */
5898 tcg_gen_add_i64(val
, val
, tmp
);
5899 tcg_temp_free_i64(tmp
);
5902 /* Load and add a 64-bit value from a register pair. */
/* Emits ops for: val += the 64-bit value formed from registers rlow and
   rhigh (passed to tcg_gen_concat_i32_i64 in that order).  val is updated
   in place and the 64-bit temporary is freed before returning.
   NOTE(review): the local declarations and the release of tmpl/tmph are
   not visible in this listing. */
5903 static void gen_addq(DisasContext
*s
, TCGv_i64 val
, int rlow
, int rhigh
)
5909 /* Load 64-bit value rhigh:rlow. */
5910 tmpl
= load_reg(s
, rlow
);
5911 tmph
= load_reg(s
, rhigh
);
5912 tmp
= tcg_temp_new_i64();
5913 tcg_gen_concat_i32_i64(tmp
, tmpl
, tmph
);
/* Accumulate into val, then release the 64-bit temporary. */
5916 tcg_gen_add_i64(val
, val
, tmp
);
5917 tcg_temp_free_i64(tmp
);
5920 /* Set N and Z flags from a 64-bit value. */
/* Allocates a fresh temporary with new_tmp() and passes it, together with
   val, to gen_helper_logicq_cc.
   NOTE(review): the statements that consume and release tmp are not
   visible in this listing. */
5921 static void gen_logicq_cc(TCGv_i64 val
)
5923 TCGv tmp
= new_tmp();
5924 gen_helper_logicq_cc(tmp
, val
);
5929 /* Load/Store exclusive instructions are implemented by remembering
5930 the value/address loaded, and seeing if these are the same
5931 when the store is performed. This should be sufficient to implement
5932 the architecturally mandated semantics, and avoids having to monitor other stores.
5935 In system emulation mode only one CPU will be running at once, so
5936 this sequence is effectively atomic. In user emulation mode we
5937 throw an exception and handle the atomic operation elsewhere. */
/* gen_load_exclusive: emit ops for a load-exclusive from addr.
   The loaded value is copied to cpu_exclusive_val and written to register
   rt; on the path that also loads addr + 4, that word is copied to
   cpu_exclusive_high and written to register rt2.  Finally addr is
   recorded in cpu_exclusive_addr.
   NOTE(review): the code that uses size to choose between the 8-, 16- and
   32-bit loads, and the condition guarding the addr + 4 load, are not
   visible in this listing. */
5938 static void gen_load_exclusive(DisasContext
*s
, int rt
, int rt2
,
5939 TCGv addr
, int size
)
/* One of these loads is used, by access width (byte / halfword / word). */
5945 tmp
= gen_ld8u(addr
, IS_USER(s
));
5948 tmp
= gen_ld16u(addr
, IS_USER(s
));
5952 tmp
= gen_ld32(addr
, IS_USER(s
));
/* Remember the loaded value, then deliver it to rt. */
5957 tcg_gen_mov_i32(cpu_exclusive_val
, tmp
);
5958 store_reg(s
, rt
, tmp
);
/* Second word: load from addr + 4 through a scratch address so that addr
   itself is left unchanged. */
5960 TCGv tmp2
= new_tmp();
5961 tcg_gen_addi_i32(tmp2
, addr
, 4);
5962 tmp
= gen_ld32(tmp2
, IS_USER(s
));
5964 tcg_gen_mov_i32(cpu_exclusive_high
, tmp
);
5965 store_reg(s
, rt2
, tmp
);
/* Remember the address for the matching store-exclusive. */
5967 tcg_gen_mov_i32(cpu_exclusive_addr
, addr
);
/* Emit an op that sets cpu_exclusive_addr to -1.  The same value is written
   at the end of the branch-based gen_store_exclusive; presumably it marks
   "no exclusive access outstanding" -- confirm.  The parameter s is not
   used by the visible statement. */
5970 static void gen_clrex(DisasContext
*s
)
5972 tcg_gen_movi_i32(cpu_exclusive_addr
, -1);
5975 #ifdef CONFIG_USER_ONLY
/* CONFIG_USER_ONLY variant of store-exclusive: no comparison or store is
   generated here.  The address and the operands are recorded in
   cpu_exclusive_test / cpu_exclusive_info and EXCP_STREX is raised, so the
   operation is completed by whatever handles that exception (not part of
   this block). */
5976 static void gen_store_exclusive(DisasContext
*s
, int rd
, int rt
, int rt2
,
5977 TCGv addr
, int size
)
5979 tcg_gen_mov_i32(cpu_exclusive_test
, addr
);
/* Pack the operands into one word: size in the low bits, rd from bit 4,
   rt from bit 8, rt2 from bit 12. */
5980 tcg_gen_movi_i32(cpu_exclusive_info
,
5981 size
| (rd
<< 4) | (rt
<< 8) | (rt2
<< 12));
/* Raise the exception with the PC set to s->pc - 4 (presumably the address
   of this instruction -- confirm), and mark the instruction as a jump. */
5982 gen_set_condexec(s
);
5983 gen_set_pc_im(s
->pc
- 4);
5984 gen_exception(EXCP_STREX
);
5985 s
->is_jmp
= DISAS_JUMP
;
/* Second definition of gen_store_exclusive (presumably the non
   CONFIG_USER_ONLY branch -- the #else line is not visible in this
   listing).  It implements the check with generated branches.
   Visible sequence of generated ops:
     - branch to fail_label unless addr equals cpu_exclusive_addr;
     - reload memory at addr (gen_ld8u / gen_ld16u / gen_ld32; the code that
       picks one by size is not visible) and branch to fail_label unless the
       value equals cpu_exclusive_val;
     - on one path, also reload addr + 4 through a scratch address and
       branch to fail_label unless it equals cpu_exclusive_high;
     - store register rt to addr (gen_st8 / gen_st16 / gen_st32) and, on one
       path, register rt2 to addr + 4; this second store advances addr
       itself by 4;
     - success path: register rd is set to 0, then jump to done_label;
     - fail_label: register rd is set to 1;
     - done_label: cpu_exclusive_addr is reset to -1 on both paths.
   NOTE(review): the pseudo-code comment that follows the signature is not
   terminated in this listing, so no further comments are inserted below
   it. */
5988 static void gen_store_exclusive(DisasContext
*s
, int rd
, int rt
, int rt2
,
5989 TCGv addr
, int size
)
5995 /* if (env->exclusive_addr == addr && env->exclusive_val == [addr]) {
6001 fail_label
= gen_new_label();
6002 done_label
= gen_new_label();
6003 tcg_gen_brcond_i32(TCG_COND_NE
, addr
, cpu_exclusive_addr
, fail_label
);
6006 tmp
= gen_ld8u(addr
, IS_USER(s
));
6009 tmp
= gen_ld16u(addr
, IS_USER(s
));
6013 tmp
= gen_ld32(addr
, IS_USER(s
));
6018 tcg_gen_brcond_i32(TCG_COND_NE
, tmp
, cpu_exclusive_val
, fail_label
);
6021 TCGv tmp2
= new_tmp();
6022 tcg_gen_addi_i32(tmp2
, addr
, 4);
6023 tmp
= gen_ld32(tmp2
, IS_USER(s
));
6025 tcg_gen_brcond_i32(TCG_COND_NE
, tmp
, cpu_exclusive_high
, fail_label
);
6028 tmp
= load_reg(s
, rt
);
6031 gen_st8(tmp
, addr
, IS_USER(s
));
6034 gen_st16(tmp
, addr
, IS_USER(s
));
6038 gen_st32(tmp
, addr
, IS_USER(s
));
6044 tcg_gen_addi_i32(addr
, addr
, 4);
6045 tmp
= load_reg(s
, rt2
);
6046 gen_st32(tmp
, addr
, IS_USER(s
));
6048 tcg_gen_movi_i32(cpu_R
[rd
], 0);
6049 tcg_gen_br(done_label
);
6050 gen_set_label(fail_label
);
6051 tcg_gen_movi_i32(cpu_R
[rd
], 1);
6052 gen_set_label(done_label
);
6053 tcg_gen_movi_i32(cpu_exclusive_addr
, -1);
6057 static void disas_arm_insn(CPUState
* env
, DisasContext
*s
)
6059 unsigned int cond
, insn
, val
, op1
, i
, shift
, rm
, rs
, rn
, rd
, sh
;
6066 insn
= ldl_code(s
->pc
);
6069 /* M variants do not implement ARM mode. */
6074 /* Unconditional instructions. */
6075 if (((insn
>> 25) & 7) == 1) {
6076 /* NEON Data processing. */
6077 if (!arm_feature(env
, ARM_FEATURE_NEON
))
6080 if (disas_neon_data_insn(env
, s
, insn
))
6084 if ((insn
& 0x0f100000) == 0x04000000) {
6085 /* NEON load/store. */
6086 if (!arm_feature(env
, ARM_FEATURE_NEON
))
6089 if (disas_neon_ls_insn(env
, s
, insn
))
6093 if ((insn
& 0x0d70f000) == 0x0550f000)
6095 else if ((insn
& 0x0ffffdff) == 0x01010000) {
6098 if (insn
& (1 << 9)) {
6099 /* BE8 mode not implemented. */
6103 } else if ((insn
& 0x0fffff00) == 0x057ff000) {
6104 switch ((insn
>> 4) & 0xf) {
6113 /* We don't emulate caches so these are a no-op. */
6118 } else if ((insn
& 0x0e5fffe0) == 0x084d0500) {
6124 op1
= (insn
& 0x1f);
6125 if (op1
== (env
->uncached_cpsr
& CPSR_M
)) {
6126 addr
= load_reg(s
, 13);
6129 tmp
= tcg_const_i32(op1
);
6130 gen_helper_get_r13_banked(addr
, cpu_env
, tmp
);
6131 tcg_temp_free_i32(tmp
);
6133 i
= (insn
>> 23) & 3;
6135 case 0: offset
= -4; break; /* DA */
6136 case 1: offset
= 0; break; /* IA */
6137 case 2: offset
= -8; break; /* DB */
6138 case 3: offset
= 4; break; /* IB */
6142 tcg_gen_addi_i32(addr
, addr
, offset
);
6143 tmp
= load_reg(s
, 14);
6144 gen_st32(tmp
, addr
, 0);
6145 tmp
= load_cpu_field(spsr
);
6146 tcg_gen_addi_i32(addr
, addr
, 4);
6147 gen_st32(tmp
, addr
, 0);
6148 if (insn
& (1 << 21)) {
6149 /* Base writeback. */
6151 case 0: offset
= -8; break;
6152 case 1: offset
= 4; break;
6153 case 2: offset
= -4; break;
6154 case 3: offset
= 0; break;
6158 tcg_gen_addi_i32(addr
, addr
, offset
);
6159 if (op1
== (env
->uncached_cpsr
& CPSR_M
)) {
6160 store_reg(s
, 13, addr
);
6162 tmp
= tcg_const_i32(op1
);
6163 gen_helper_set_r13_banked(cpu_env
, tmp
, addr
);
6164 tcg_temp_free_i32(tmp
);
6171 } else if ((insn
& 0x0e50ffe0) == 0x08100a00) {
6177 rn
= (insn
>> 16) & 0xf;
6178 addr
= load_reg(s
, rn
);
6179 i
= (insn
>> 23) & 3;
6181 case 0: offset
= -4; break; /* DA */
6182 case 1: offset
= 0; break; /* IA */
6183 case 2: offset
= -8; break; /* DB */
6184 case 3: offset
= 4; break; /* IB */
6188 tcg_gen_addi_i32(addr
, addr
, offset
);
6189 /* Load PC into tmp and CPSR into tmp2. */
6190 tmp
= gen_ld32(addr
, 0);
6191 tcg_gen_addi_i32(addr
, addr
, 4);
6192 tmp2
= gen_ld32(addr
, 0);
6193 if (insn
& (1 << 21)) {
6194 /* Base writeback. */
6196 case 0: offset
= -8; break;
6197 case 1: offset
= 4; break;
6198 case 2: offset
= -4; break;
6199 case 3: offset
= 0; break;
6203 tcg_gen_addi_i32(addr
, addr
, offset
);
6204 store_reg(s
, rn
, addr
);
6208 gen_rfe(s
, tmp
, tmp2
);
6210 } else if ((insn
& 0x0e000000) == 0x0a000000) {
6211 /* branch link and change to thumb (blx <offset>) */
6214 val
= (uint32_t)s
->pc
;
6216 tcg_gen_movi_i32(tmp
, val
);
6217 store_reg(s
, 14, tmp
);
6218 /* Sign-extend the 24-bit offset */
6219 offset
= (((int32_t)insn
) << 8) >> 8;
6220 /* offset * 4 + bit24 * 2 + (thumb bit) */
6221 val
+= (offset
<< 2) | ((insn
>> 23) & 2) | 1;
6222 /* pipeline offset */
6226 } else if ((insn
& 0x0e000f00) == 0x0c000100) {
6227 if (arm_feature(env
, ARM_FEATURE_IWMMXT
)) {
6228 /* iWMMXt register transfer. */
6229 if (env
->cp15
.c15_cpar
& (1 << 1))
6230 if (!disas_iwmmxt_insn(env
, s
, insn
))
6233 } else if ((insn
& 0x0fe00000) == 0x0c400000) {
6234 /* Coprocessor double register transfer. */
6235 } else if ((insn
& 0x0f000010) == 0x0e000010) {
6236 /* Additional coprocessor register transfer. */
6237 } else if ((insn
& 0x0ff10020) == 0x01000000) {
6240 /* cps (privileged) */
6244 if (insn
& (1 << 19)) {
6245 if (insn
& (1 << 8))
6247 if (insn
& (1 << 7))
6249 if (insn
& (1 << 6))
6251 if (insn
& (1 << 18))
6254 if (insn
& (1 << 17)) {
6256 val
|= (insn
& 0x1f);
6259 gen_set_psr_im(s
, mask
, 0, val
);
6266 /* if not always execute, we generate a conditional jump to
6268 s
->condlabel
= gen_new_label();
6269 gen_test_cc(cond
^ 1, s
->condlabel
);
6272 if ((insn
& 0x0f900000) == 0x03000000) {
6273 if ((insn
& (1 << 21)) == 0) {
6275 rd
= (insn
>> 12) & 0xf;
6276 val
= ((insn
>> 4) & 0xf000) | (insn
& 0xfff);
6277 if ((insn
& (1 << 22)) == 0) {
6280 tcg_gen_movi_i32(tmp
, val
);
6283 tmp
= load_reg(s
, rd
);
6284 tcg_gen_ext16u_i32(tmp
, tmp
);
6285 tcg_gen_ori_i32(tmp
, tmp
, val
<< 16);
6287 store_reg(s
, rd
, tmp
);
6289 if (((insn
>> 12) & 0xf) != 0xf)
6291 if (((insn
>> 16) & 0xf) == 0) {
6292 gen_nop_hint(s
, insn
& 0xff);
6294 /* CPSR = immediate */
6296 shift
= ((insn
>> 8) & 0xf) * 2;
6298 val
= (val
>> shift
) | (val
<< (32 - shift
));
6299 i
= ((insn
& (1 << 22)) != 0);
6300 if (gen_set_psr_im(s
, msr_mask(env
, s
, (insn
>> 16) & 0xf, i
), i
, val
))
6304 } else if ((insn
& 0x0f900000) == 0x01000000
6305 && (insn
& 0x00000090) != 0x00000090) {
6306 /* miscellaneous instructions */
6307 op1
= (insn
>> 21) & 3;
6308 sh
= (insn
>> 4) & 0xf;
6311 case 0x0: /* move program status register */
6314 tmp
= load_reg(s
, rm
);
6315 i
= ((op1
& 2) != 0);
6316 if (gen_set_psr(s
, msr_mask(env
, s
, (insn
>> 16) & 0xf, i
), i
, tmp
))
6320 rd
= (insn
>> 12) & 0xf;
6324 tmp
= load_cpu_field(spsr
);
6327 gen_helper_cpsr_read(tmp
);
6329 store_reg(s
, rd
, tmp
);
6334 /* branch/exchange thumb (bx). */
6335 tmp
= load_reg(s
, rm
);
6337 } else if (op1
== 3) {
6339 rd
= (insn
>> 12) & 0xf;
6340 tmp
= load_reg(s
, rm
);
6341 gen_helper_clz(tmp
, tmp
);
6342 store_reg(s
, rd
, tmp
);
6350 /* Trivial implementation equivalent to bx. */
6351 tmp
= load_reg(s
, rm
);
6361 /* branch link/exchange thumb (blx) */
6362 tmp
= load_reg(s
, rm
);
6364 tcg_gen_movi_i32(tmp2
, s
->pc
);
6365 store_reg(s
, 14, tmp2
);
6368 case 0x5: /* saturating add/subtract */
6369 rd
= (insn
>> 12) & 0xf;
6370 rn
= (insn
>> 16) & 0xf;
6371 tmp
= load_reg(s
, rm
);
6372 tmp2
= load_reg(s
, rn
);
6374 gen_helper_double_saturate(tmp2
, tmp2
);
6376 gen_helper_sub_saturate(tmp
, tmp
, tmp2
);
6378 gen_helper_add_saturate(tmp
, tmp
, tmp2
);
6380 store_reg(s
, rd
, tmp
);
6383 /* SMC instruction (op1 == 3)
6384 and undefined instructions (op1 == 0 || op1 == 2)
6390 gen_set_condexec(s
);
6391 gen_set_pc_im(s
->pc
- 4);
6392 gen_exception(EXCP_BKPT
);
6393 s
->is_jmp
= DISAS_JUMP
;
6395 case 0x8: /* signed multiply */
6399 rs
= (insn
>> 8) & 0xf;
6400 rn
= (insn
>> 12) & 0xf;
6401 rd
= (insn
>> 16) & 0xf;
6403 /* (32 * 16) >> 16 */
6404 tmp
= load_reg(s
, rm
);
6405 tmp2
= load_reg(s
, rs
);
6407 tcg_gen_sari_i32(tmp2
, tmp2
, 16);
6410 tmp64
= gen_muls_i64_i32(tmp
, tmp2
);
6411 tcg_gen_shri_i64(tmp64
, tmp64
, 16);
6413 tcg_gen_trunc_i64_i32(tmp
, tmp64
);
6414 tcg_temp_free_i64(tmp64
);
6415 if ((sh
& 2) == 0) {
6416 tmp2
= load_reg(s
, rn
);
6417 gen_helper_add_setq(tmp
, tmp
, tmp2
);
6420 store_reg(s
, rd
, tmp
);
6423 tmp
= load_reg(s
, rm
);
6424 tmp2
= load_reg(s
, rs
);
6425 gen_mulxy(tmp
, tmp2
, sh
& 2, sh
& 4);
6428 tmp64
= tcg_temp_new_i64();
6429 tcg_gen_ext_i32_i64(tmp64
, tmp
);
6431 gen_addq(s
, tmp64
, rn
, rd
);
6432 gen_storeq_reg(s
, rn
, rd
, tmp64
);
6433 tcg_temp_free_i64(tmp64
);
6436 tmp2
= load_reg(s
, rn
);
6437 gen_helper_add_setq(tmp
, tmp
, tmp2
);
6440 store_reg(s
, rd
, tmp
);
6447 } else if (((insn
& 0x0e000000) == 0 &&
6448 (insn
& 0x00000090) != 0x90) ||
6449 ((insn
& 0x0e000000) == (1 << 25))) {
6450 int set_cc
, logic_cc
, shiftop
;
6452 op1
= (insn
>> 21) & 0xf;
6453 set_cc
= (insn
>> 20) & 1;
6454 logic_cc
= table_logic_cc
[op1
] & set_cc
;
6456 /* data processing instruction */
6457 if (insn
& (1 << 25)) {
6458 /* immediate operand */
6460 shift
= ((insn
>> 8) & 0xf) * 2;
6462 val
= (val
>> shift
) | (val
<< (32 - shift
));
6465 tcg_gen_movi_i32(tmp2
, val
);
6466 if (logic_cc
&& shift
) {
6467 gen_set_CF_bit31(tmp2
);
6472 tmp2
= load_reg(s
, rm
);
6473 shiftop
= (insn
>> 5) & 3;
6474 if (!(insn
& (1 << 4))) {
6475 shift
= (insn
>> 7) & 0x1f;
6476 gen_arm_shift_im(tmp2
, shiftop
, shift
, logic_cc
);
6478 rs
= (insn
>> 8) & 0xf;
6479 tmp
= load_reg(s
, rs
);
6480 gen_arm_shift_reg(tmp2
, shiftop
, tmp
, logic_cc
);
6483 if (op1
!= 0x0f && op1
!= 0x0d) {
6484 rn
= (insn
>> 16) & 0xf;
6485 tmp
= load_reg(s
, rn
);
6489 rd
= (insn
>> 12) & 0xf;
6492 tcg_gen_and_i32(tmp
, tmp
, tmp2
);
6496 store_reg_bx(env
, s
, rd
, tmp
);
6499 tcg_gen_xor_i32(tmp
, tmp
, tmp2
);
6503 store_reg_bx(env
, s
, rd
, tmp
);
6506 if (set_cc
&& rd
== 15) {
6507 /* SUBS r15, ... is used for exception return. */
6511 gen_helper_sub_cc(tmp
, tmp
, tmp2
);
6512 gen_exception_return(s
, tmp
);
6515 gen_helper_sub_cc(tmp
, tmp
, tmp2
);
6517 tcg_gen_sub_i32(tmp
, tmp
, tmp2
);
6519 store_reg_bx(env
, s
, rd
, tmp
);
6524 gen_helper_sub_cc(tmp
, tmp2
, tmp
);
6526 tcg_gen_sub_i32(tmp
, tmp2
, tmp
);
6528 store_reg_bx(env
, s
, rd
, tmp
);
6532 gen_helper_add_cc(tmp
, tmp
, tmp2
);
6534 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
6536 store_reg_bx(env
, s
, rd
, tmp
);
6540 gen_helper_adc_cc(tmp
, tmp
, tmp2
);
6542 gen_add_carry(tmp
, tmp
, tmp2
);
6544 store_reg_bx(env
, s
, rd
, tmp
);
6548 gen_helper_sbc_cc(tmp
, tmp
, tmp2
);
6550 gen_sub_carry(tmp
, tmp
, tmp2
);
6552 store_reg_bx(env
, s
, rd
, tmp
);
6556 gen_helper_sbc_cc(tmp
, tmp2
, tmp
);
6558 gen_sub_carry(tmp
, tmp2
, tmp
);
6560 store_reg_bx(env
, s
, rd
, tmp
);
6564 tcg_gen_and_i32(tmp
, tmp
, tmp2
);
6571 tcg_gen_xor_i32(tmp
, tmp
, tmp2
);
6578 gen_helper_sub_cc(tmp
, tmp
, tmp2
);
6584 gen_helper_add_cc(tmp
, tmp
, tmp2
);
6589 tcg_gen_or_i32(tmp
, tmp
, tmp2
);
6593 store_reg_bx(env
, s
, rd
, tmp
);
6596 if (logic_cc
&& rd
== 15) {
6597 /* MOVS r15, ... is used for exception return. */
6601 gen_exception_return(s
, tmp2
);
6606 store_reg_bx(env
, s
, rd
, tmp2
);
6610 tcg_gen_andc_i32(tmp
, tmp
, tmp2
);
6614 store_reg_bx(env
, s
, rd
, tmp
);
6618 tcg_gen_not_i32(tmp2
, tmp2
);
6622 store_reg_bx(env
, s
, rd
, tmp2
);
6625 if (op1
!= 0x0f && op1
!= 0x0d) {
6629 /* other instructions */
6630 op1
= (insn
>> 24) & 0xf;
6634 /* multiplies, extra load/stores */
6635 sh
= (insn
>> 5) & 3;
6638 rd
= (insn
>> 16) & 0xf;
6639 rn
= (insn
>> 12) & 0xf;
6640 rs
= (insn
>> 8) & 0xf;
6642 op1
= (insn
>> 20) & 0xf;
6644 case 0: case 1: case 2: case 3: case 6:
6646 tmp
= load_reg(s
, rs
);
6647 tmp2
= load_reg(s
, rm
);
6648 tcg_gen_mul_i32(tmp
, tmp
, tmp2
);
6650 if (insn
& (1 << 22)) {
6651 /* Subtract (mls) */
6653 tmp2
= load_reg(s
, rn
);
6654 tcg_gen_sub_i32(tmp
, tmp2
, tmp
);
6656 } else if (insn
& (1 << 21)) {
6658 tmp2
= load_reg(s
, rn
);
6659 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
6662 if (insn
& (1 << 20))
6664 store_reg(s
, rd
, tmp
);
6667 /* 64 bit mul double accumulate (UMAAL) */
6669 tmp
= load_reg(s
, rs
);
6670 tmp2
= load_reg(s
, rm
);
6671 tmp64
= gen_mulu_i64_i32(tmp
, tmp2
);
6672 gen_addq_lo(s
, tmp64
, rn
);
6673 gen_addq_lo(s
, tmp64
, rd
);
6674 gen_storeq_reg(s
, rn
, rd
, tmp64
);
6675 tcg_temp_free_i64(tmp64
);
6677 case 8: case 9: case 10: case 11:
6678 case 12: case 13: case 14: case 15:
6679 /* 64 bit mul: UMULL, UMLAL, SMULL, SMLAL. */
6680 tmp
= load_reg(s
, rs
);
6681 tmp2
= load_reg(s
, rm
);
6682 if (insn
& (1 << 22)) {
6683 tmp64
= gen_muls_i64_i32(tmp
, tmp2
);
6685 tmp64
= gen_mulu_i64_i32(tmp
, tmp2
);
6687 if (insn
& (1 << 21)) { /* mult accumulate */
6688 gen_addq(s
, tmp64
, rn
, rd
);
6690 if (insn
& (1 << 20)) {
6691 gen_logicq_cc(tmp64
);
6693 gen_storeq_reg(s
, rn
, rd
, tmp64
);
6694 tcg_temp_free_i64(tmp64
);
6700 rn
= (insn
>> 16) & 0xf;
6701 rd
= (insn
>> 12) & 0xf;
6702 if (insn
& (1 << 23)) {
6703 /* load/store exclusive */
6704 op1
= (insn
>> 21) & 0x3;
6709 addr
= tcg_temp_local_new_i32();
6710 load_reg_var(s
, addr
, rn
);
6711 if (insn
& (1 << 20)) {
6714 gen_load_exclusive(s
, rd
, 15, addr
, 2);
6716 case 1: /* ldrexd */
6717 gen_load_exclusive(s
, rd
, rd
+ 1, addr
, 3);
6719 case 2: /* ldrexb */
6720 gen_load_exclusive(s
, rd
, 15, addr
, 0);
6722 case 3: /* ldrexh */
6723 gen_load_exclusive(s
, rd
, 15, addr
, 1);
6732 gen_store_exclusive(s
, rd
, rm
, 15, addr
, 2);
6734 case 1: /* strexd */
6735 gen_store_exclusive(s
, rd
, rm
, rm
+ 1, addr
, 3);
6737 case 2: /* strexb */
6738 gen_store_exclusive(s
, rd
, rm
, 15, addr
, 0);
6740 case 3: /* strexh */
6741 gen_store_exclusive(s
, rd
, rm
, 15, addr
, 1);
6747 tcg_temp_free(addr
);
6749 /* SWP instruction */
6752 /* ??? This is not really atomic. However we know
6753 we never have multiple CPUs running in parallel,
6754 so it is good enough. */
6755 addr
= load_reg(s
, rn
);
6756 tmp
= load_reg(s
, rm
);
6757 if (insn
& (1 << 22)) {
6758 tmp2
= gen_ld8u(addr
, IS_USER(s
));
6759 gen_st8(tmp
, addr
, IS_USER(s
));
6761 tmp2
= gen_ld32(addr
, IS_USER(s
));
6762 gen_st32(tmp
, addr
, IS_USER(s
));
6765 store_reg(s
, rd
, tmp2
);
6771 /* Misc load/store */
6772 rn
= (insn
>> 16) & 0xf;
6773 rd
= (insn
>> 12) & 0xf;
6774 addr
= load_reg(s
, rn
);
6775 if (insn
& (1 << 24))
6776 gen_add_datah_offset(s
, insn
, 0, addr
);
6778 if (insn
& (1 << 20)) {
6782 tmp
= gen_ld16u(addr
, IS_USER(s
));
6785 tmp
= gen_ld8s(addr
, IS_USER(s
));
6789 tmp
= gen_ld16s(addr
, IS_USER(s
));
6793 } else if (sh
& 2) {
6797 tmp
= load_reg(s
, rd
);
6798 gen_st32(tmp
, addr
, IS_USER(s
));
6799 tcg_gen_addi_i32(addr
, addr
, 4);
6800 tmp
= load_reg(s
, rd
+ 1);
6801 gen_st32(tmp
, addr
, IS_USER(s
));
6805 tmp
= gen_ld32(addr
, IS_USER(s
));
6806 store_reg(s
, rd
, tmp
);
6807 tcg_gen_addi_i32(addr
, addr
, 4);
6808 tmp
= gen_ld32(addr
, IS_USER(s
));
6812 address_offset
= -4;
6815 tmp
= load_reg(s
, rd
);
6816 gen_st16(tmp
, addr
, IS_USER(s
));
6819 /* Perform base writeback before the loaded value to
6820 ensure correct behavior with overlapping index registers.
6821 ldrd with base writeback is undefined if the
6822 destination and index registers overlap. */
6823 if (!(insn
& (1 << 24))) {
6824 gen_add_datah_offset(s
, insn
, address_offset
, addr
);
6825 store_reg(s
, rn
, addr
);
6826 } else if (insn
& (1 << 21)) {
6828 tcg_gen_addi_i32(addr
, addr
, address_offset
);
6829 store_reg(s
, rn
, addr
);
6834 /* Complete the load. */
6835 store_reg(s
, rd
, tmp
);
6844 if (insn
& (1 << 4)) {
6846 /* Armv6 Media instructions. */
6848 rn
= (insn
>> 16) & 0xf;
6849 rd
= (insn
>> 12) & 0xf;
6850 rs
= (insn
>> 8) & 0xf;
6851 switch ((insn
>> 23) & 3) {
6852 case 0: /* Parallel add/subtract. */
6853 op1
= (insn
>> 20) & 7;
6854 tmp
= load_reg(s
, rn
);
6855 tmp2
= load_reg(s
, rm
);
6856 sh
= (insn
>> 5) & 7;
6857 if ((op1
& 3) == 0 || sh
== 5 || sh
== 6)
6859 gen_arm_parallel_addsub(op1
, sh
, tmp
, tmp2
);
6861 store_reg(s
, rd
, tmp
);
6864 if ((insn
& 0x00700020) == 0) {
6865 /* Halfword pack. */
6866 tmp
= load_reg(s
, rn
);
6867 tmp2
= load_reg(s
, rm
);
6868 shift
= (insn
>> 7) & 0x1f;
6869 if (insn
& (1 << 6)) {
6873 tcg_gen_sari_i32(tmp2
, tmp2
, shift
);
6874 tcg_gen_andi_i32(tmp
, tmp
, 0xffff0000);
6875 tcg_gen_ext16u_i32(tmp2
, tmp2
);
6879 tcg_gen_shli_i32(tmp2
, tmp2
, shift
);
6880 tcg_gen_ext16u_i32(tmp
, tmp
);
6881 tcg_gen_andi_i32(tmp2
, tmp2
, 0xffff0000);
6883 tcg_gen_or_i32(tmp
, tmp
, tmp2
);
6885 store_reg(s
, rd
, tmp
);
6886 } else if ((insn
& 0x00200020) == 0x00200000) {
6888 tmp
= load_reg(s
, rm
);
6889 shift
= (insn
>> 7) & 0x1f;
6890 if (insn
& (1 << 6)) {
6893 tcg_gen_sari_i32(tmp
, tmp
, shift
);
6895 tcg_gen_shli_i32(tmp
, tmp
, shift
);
6897 sh
= (insn
>> 16) & 0x1f;
6899 tmp2
= tcg_const_i32(sh
);
6900 if (insn
& (1 << 22))
6901 gen_helper_usat(tmp
, tmp
, tmp2
);
6903 gen_helper_ssat(tmp
, tmp
, tmp2
);
6904 tcg_temp_free_i32(tmp2
);
6906 store_reg(s
, rd
, tmp
);
6907 } else if ((insn
& 0x00300fe0) == 0x00200f20) {
6909 tmp
= load_reg(s
, rm
);
6910 sh
= (insn
>> 16) & 0x1f;
6912 tmp2
= tcg_const_i32(sh
);
6913 if (insn
& (1 << 22))
6914 gen_helper_usat16(tmp
, tmp
, tmp2
);
6916 gen_helper_ssat16(tmp
, tmp
, tmp2
);
6917 tcg_temp_free_i32(tmp2
);
6919 store_reg(s
, rd
, tmp
);
6920 } else if ((insn
& 0x00700fe0) == 0x00000fa0) {
6922 tmp
= load_reg(s
, rn
);
6923 tmp2
= load_reg(s
, rm
);
6925 tcg_gen_ld_i32(tmp3
, cpu_env
, offsetof(CPUState
, GE
));
6926 gen_helper_sel_flags(tmp
, tmp3
, tmp
, tmp2
);
6929 store_reg(s
, rd
, tmp
);
6930 } else if ((insn
& 0x000003e0) == 0x00000060) {
6931 tmp
= load_reg(s
, rm
);
6932 shift
= (insn
>> 10) & 3;
6933 /* ??? In many cases it's not neccessary to do a
6934 rotate, a shift is sufficient. */
6936 tcg_gen_rotri_i32(tmp
, tmp
, shift
* 8);
6937 op1
= (insn
>> 20) & 7;
6939 case 0: gen_sxtb16(tmp
); break;
6940 case 2: gen_sxtb(tmp
); break;
6941 case 3: gen_sxth(tmp
); break;
6942 case 4: gen_uxtb16(tmp
); break;
6943 case 6: gen_uxtb(tmp
); break;
6944 case 7: gen_uxth(tmp
); break;
6945 default: goto illegal_op
;
6948 tmp2
= load_reg(s
, rn
);
6949 if ((op1
& 3) == 0) {
6950 gen_add16(tmp
, tmp2
);
6952 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
6956 store_reg(s
, rd
, tmp
);
6957 } else if ((insn
& 0x003f0f60) == 0x003f0f20) {
6959 tmp
= load_reg(s
, rm
);
6960 if (insn
& (1 << 22)) {
6961 if (insn
& (1 << 7)) {
6965 gen_helper_rbit(tmp
, tmp
);
6968 if (insn
& (1 << 7))
6971 tcg_gen_bswap32_i32(tmp
, tmp
);
6973 store_reg(s
, rd
, tmp
);
6978 case 2: /* Multiplies (Type 3). */
6979 tmp
= load_reg(s
, rm
);
6980 tmp2
= load_reg(s
, rs
);
6981 if (insn
& (1 << 20)) {
6982 /* Signed multiply most significant [accumulate].
6983 (SMMUL, SMMLA, SMMLS) */
6984 tmp64
= gen_muls_i64_i32(tmp
, tmp2
);
6987 tmp
= load_reg(s
, rd
);
6988 if (insn
& (1 << 6)) {
6989 tmp64
= gen_subq_msw(tmp64
, tmp
);
6991 tmp64
= gen_addq_msw(tmp64
, tmp
);
6994 if (insn
& (1 << 5)) {
6995 tcg_gen_addi_i64(tmp64
, tmp64
, 0x80000000u
);
6997 tcg_gen_shri_i64(tmp64
, tmp64
, 32);
6999 tcg_gen_trunc_i64_i32(tmp
, tmp64
);
7000 tcg_temp_free_i64(tmp64
);
7001 store_reg(s
, rn
, tmp
);
7003 if (insn
& (1 << 5))
7004 gen_swap_half(tmp2
);
7005 gen_smul_dual(tmp
, tmp2
);
7006 /* This addition cannot overflow. */
7007 if (insn
& (1 << 6)) {
7008 tcg_gen_sub_i32(tmp
, tmp
, tmp2
);
7010 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
7013 if (insn
& (1 << 22)) {
7014 /* smlald, smlsld */
7015 tmp64
= tcg_temp_new_i64();
7016 tcg_gen_ext_i32_i64(tmp64
, tmp
);
7018 gen_addq(s
, tmp64
, rd
, rn
);
7019 gen_storeq_reg(s
, rd
, rn
, tmp64
);
7020 tcg_temp_free_i64(tmp64
);
7022 /* smuad, smusd, smlad, smlsd */
7025 tmp2
= load_reg(s
, rd
);
7026 gen_helper_add_setq(tmp
, tmp
, tmp2
);
7029 store_reg(s
, rn
, tmp
);
7034 op1
= ((insn
>> 17) & 0x38) | ((insn
>> 5) & 7);
7036 case 0: /* Unsigned sum of absolute differences. */
7038 tmp
= load_reg(s
, rm
);
7039 tmp2
= load_reg(s
, rs
);
7040 gen_helper_usad8(tmp
, tmp
, tmp2
);
7043 tmp2
= load_reg(s
, rd
);
7044 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
7047 store_reg(s
, rn
, tmp
);
7049 case 0x20: case 0x24: case 0x28: case 0x2c:
7050 /* Bitfield insert/clear. */
7052 shift
= (insn
>> 7) & 0x1f;
7053 i
= (insn
>> 16) & 0x1f;
7057 tcg_gen_movi_i32(tmp
, 0);
7059 tmp
= load_reg(s
, rm
);
7062 tmp2
= load_reg(s
, rd
);
7063 gen_bfi(tmp
, tmp2
, tmp
, shift
, (1u << i
) - 1);
7066 store_reg(s
, rd
, tmp
);
7068 case 0x12: case 0x16: case 0x1a: case 0x1e: /* sbfx */
7069 case 0x32: case 0x36: case 0x3a: case 0x3e: /* ubfx */
7071 tmp
= load_reg(s
, rm
);
7072 shift
= (insn
>> 7) & 0x1f;
7073 i
= ((insn
>> 16) & 0x1f) + 1;
7078 gen_ubfx(tmp
, shift
, (1u << i
) - 1);
7080 gen_sbfx(tmp
, shift
, i
);
7083 store_reg(s
, rd
, tmp
);
7093 /* Check for undefined extension instructions
7094 * per the ARM Bible IE:
7095 * xxxx 0111 1111 xxxx xxxx xxxx 1111 xxxx
7097 sh
= (0xf << 20) | (0xf << 4);
7098 if (op1
== 0x7 && ((insn
& sh
) == sh
))
7102 /* load/store byte/word */
7103 rn
= (insn
>> 16) & 0xf;
7104 rd
= (insn
>> 12) & 0xf;
7105 tmp2
= load_reg(s
, rn
);
7106 i
= (IS_USER(s
) || (insn
& 0x01200000) == 0x00200000);
7107 if (insn
& (1 << 24))
7108 gen_add_data_offset(s
, insn
, tmp2
);
7109 if (insn
& (1 << 20)) {
7111 if (insn
& (1 << 22)) {
7112 tmp
= gen_ld8u(tmp2
, i
);
7114 tmp
= gen_ld32(tmp2
, i
);
7118 tmp
= load_reg(s
, rd
);
7119 if (insn
& (1 << 22))
7120 gen_st8(tmp
, tmp2
, i
);
7122 gen_st32(tmp
, tmp2
, i
);
7124 if (!(insn
& (1 << 24))) {
7125 gen_add_data_offset(s
, insn
, tmp2
);
7126 store_reg(s
, rn
, tmp2
);
7127 } else if (insn
& (1 << 21)) {
7128 store_reg(s
, rn
, tmp2
);
7132 if (insn
& (1 << 20)) {
7133 /* Complete the load. */
7137 store_reg(s
, rd
, tmp
);
7143 int j
, n
, user
, loaded_base
;
7145 /* load/store multiple words */
7146 /* XXX: store correct base if write back */
7148 if (insn
& (1 << 22)) {
7150 goto illegal_op
; /* only usable in supervisor mode */
7152 if ((insn
& (1 << 15)) == 0)
7155 rn
= (insn
>> 16) & 0xf;
7156 addr
= load_reg(s
, rn
);
7158 /* compute total size */
7160 TCGV_UNUSED(loaded_var
);
7163 if (insn
& (1 << i
))
7166 /* XXX: test invalid n == 0 case ? */
7167 if (insn
& (1 << 23)) {
7168 if (insn
& (1 << 24)) {
7170 tcg_gen_addi_i32(addr
, addr
, 4);
7172 /* post increment */
7175 if (insn
& (1 << 24)) {
7177 tcg_gen_addi_i32(addr
, addr
, -(n
* 4));
7179 /* post decrement */
7181 tcg_gen_addi_i32(addr
, addr
, -((n
- 1) * 4));
7186 if (insn
& (1 << i
)) {
7187 if (insn
& (1 << 20)) {
7189 tmp
= gen_ld32(addr
, IS_USER(s
));
7193 tmp2
= tcg_const_i32(i
);
7194 gen_helper_set_user_reg(tmp2
, tmp
);
7195 tcg_temp_free_i32(tmp2
);
7197 } else if (i
== rn
) {
7201 store_reg(s
, i
, tmp
);
7206 /* special case: r15 = PC + 8 */
7207 val
= (long)s
->pc
+ 4;
7209 tcg_gen_movi_i32(tmp
, val
);
7212 tmp2
= tcg_const_i32(i
);
7213 gen_helper_get_user_reg(tmp
, tmp2
);
7214 tcg_temp_free_i32(tmp2
);
7216 tmp
= load_reg(s
, i
);
7218 gen_st32(tmp
, addr
, IS_USER(s
));
7221 /* no need to add after the last transfer */
7223 tcg_gen_addi_i32(addr
, addr
, 4);
7226 if (insn
& (1 << 21)) {
7228 if (insn
& (1 << 23)) {
7229 if (insn
& (1 << 24)) {
7232 /* post increment */
7233 tcg_gen_addi_i32(addr
, addr
, 4);
7236 if (insn
& (1 << 24)) {
7239 tcg_gen_addi_i32(addr
, addr
, -((n
- 1) * 4));
7241 /* post decrement */
7242 tcg_gen_addi_i32(addr
, addr
, -(n
* 4));
7245 store_reg(s
, rn
, addr
);
7250 store_reg(s
, rn
, loaded_var
);
7252 if ((insn
& (1 << 22)) && !user
) {
7253 /* Restore CPSR from SPSR. */
7254 tmp
= load_cpu_field(spsr
);
7255 gen_set_cpsr(tmp
, 0xffffffff);
7257 s
->is_jmp
= DISAS_UPDATE
;
7266 /* branch (and link) */
7267 val
= (int32_t)s
->pc
;
7268 if (insn
& (1 << 24)) {
7270 tcg_gen_movi_i32(tmp
, val
);
7271 store_reg(s
, 14, tmp
);
7273 offset
= (((int32_t)insn
<< 8) >> 8);
7274 val
+= (offset
<< 2) + 4;
7282 if (disas_coproc_insn(env
, s
, insn
))
7287 gen_set_pc_im(s
->pc
);
7288 s
->is_jmp
= DISAS_SWI
;
7292 gen_set_condexec(s
);
7293 gen_set_pc_im(s
->pc
- 4);
7294 gen_exception(EXCP_UDEF
);
7295 s
->is_jmp
= DISAS_JUMP
;
7301 /* Return true if this is a Thumb-2 logical op. */
7303 thumb2_logic_op(int op
)
7308 /* Generate code for a Thumb-2 data processing operation. If CONDS is nonzero
7309 then set condition code flags based on the result of the operation.
7310 If SHIFTER_OUT is nonzero then set the carry flag for logical operations
7311 to the high bit of T1.
7312 Returns zero if the opcode is valid. */
7315 gen_thumb2_data_op(DisasContext
*s
, int op
, int conds
, uint32_t shifter_out
, TCGv t0
, TCGv t1
)
7322 tcg_gen_and_i32(t0
, t0
, t1
);
7326 tcg_gen_andc_i32(t0
, t0
, t1
);
7330 tcg_gen_or_i32(t0
, t0
, t1
);
7334 tcg_gen_not_i32(t1
, t1
);
7335 tcg_gen_or_i32(t0
, t0
, t1
);
7339 tcg_gen_xor_i32(t0
, t0
, t1
);
7344 gen_helper_add_cc(t0
, t0
, t1
);
7346 tcg_gen_add_i32(t0
, t0
, t1
);
7350 gen_helper_adc_cc(t0
, t0
, t1
);
7356 gen_helper_sbc_cc(t0
, t0
, t1
);
7358 gen_sub_carry(t0
, t0
, t1
);
7362 gen_helper_sub_cc(t0
, t0
, t1
);
7364 tcg_gen_sub_i32(t0
, t0
, t1
);
7368 gen_helper_sub_cc(t0
, t1
, t0
);
7370 tcg_gen_sub_i32(t0
, t1
, t0
);
7372 default: /* 5, 6, 7, 9, 12, 15. */
7378 gen_set_CF_bit31(t1
);
7383 /* Translate a 32-bit thumb instruction. Returns nonzero if the instruction
7385 static int disas_thumb2_insn(CPUState
*env
, DisasContext
*s
, uint16_t insn_hw1
)
7387 uint32_t insn
, imm
, shift
, offset
;
7388 uint32_t rd
, rn
, rm
, rs
;
7399 if (!(arm_feature(env
, ARM_FEATURE_THUMB2
)
7400 || arm_feature (env
, ARM_FEATURE_M
))) {
7401 /* Thumb-1 cores may need to treat bl and blx as a pair of
7402 16-bit instructions to get correct prefetch abort behavior. */
7404 if ((insn
& (1 << 12)) == 0) {
7405 /* Second half of blx. */
7406 offset
= ((insn
& 0x7ff) << 1);
7407 tmp
= load_reg(s
, 14);
7408 tcg_gen_addi_i32(tmp
, tmp
, offset
);
7409 tcg_gen_andi_i32(tmp
, tmp
, 0xfffffffc);
7412 tcg_gen_movi_i32(tmp2
, s
->pc
| 1);
7413 store_reg(s
, 14, tmp2
);
7417 if (insn
& (1 << 11)) {
7418 /* Second half of bl. */
7419 offset
= ((insn
& 0x7ff) << 1) | 1;
7420 tmp
= load_reg(s
, 14);
7421 tcg_gen_addi_i32(tmp
, tmp
, offset
);
7424 tcg_gen_movi_i32(tmp2
, s
->pc
| 1);
7425 store_reg(s
, 14, tmp2
);
7429 if ((s
->pc
& ~TARGET_PAGE_MASK
) == 0) {
7430 /* Instruction spans a page boundary. Implement it as two
7431 16-bit instructions in case the second half causes an
7433 offset
= ((int32_t)insn
<< 21) >> 9;
7434 tcg_gen_movi_i32(cpu_R
[14], s
->pc
+ 2 + offset
);
7437 /* Fall through to 32-bit decode. */
7440 insn
= lduw_code(s
->pc
);
7442 insn
|= (uint32_t)insn_hw1
<< 16;
7444 if ((insn
& 0xf800e800) != 0xf000e800) {
7448 rn
= (insn
>> 16) & 0xf;
7449 rs
= (insn
>> 12) & 0xf;
7450 rd
= (insn
>> 8) & 0xf;
7452 switch ((insn
>> 25) & 0xf) {
7453 case 0: case 1: case 2: case 3:
7454 /* 16-bit instructions. Should never happen. */
7457 if (insn
& (1 << 22)) {
7458 /* Other load/store, table branch. */
7459 if (insn
& 0x01200000) {
7460 /* Load/store doubleword. */
7463 tcg_gen_movi_i32(addr
, s
->pc
& ~3);
7465 addr
= load_reg(s
, rn
);
7467 offset
= (insn
& 0xff) * 4;
7468 if ((insn
& (1 << 23)) == 0)
7470 if (insn
& (1 << 24)) {
7471 tcg_gen_addi_i32(addr
, addr
, offset
);
7474 if (insn
& (1 << 20)) {
7476 tmp
= gen_ld32(addr
, IS_USER(s
));
7477 store_reg(s
, rs
, tmp
);
7478 tcg_gen_addi_i32(addr
, addr
, 4);
7479 tmp
= gen_ld32(addr
, IS_USER(s
));
7480 store_reg(s
, rd
, tmp
);
7483 tmp
= load_reg(s
, rs
);
7484 gen_st32(tmp
, addr
, IS_USER(s
));
7485 tcg_gen_addi_i32(addr
, addr
, 4);
7486 tmp
= load_reg(s
, rd
);
7487 gen_st32(tmp
, addr
, IS_USER(s
));
7489 if (insn
& (1 << 21)) {
7490 /* Base writeback. */
7493 tcg_gen_addi_i32(addr
, addr
, offset
- 4);
7494 store_reg(s
, rn
, addr
);
7498 } else if ((insn
& (1 << 23)) == 0) {
7499 /* Load/store exclusive word. */
7500 addr
= tcg_temp_local_new();
7501 load_reg_var(s
, addr
, rn
);
7502 tcg_gen_addi_i32(addr
, addr
, (insn
& 0xff) << 2);
7503 if (insn
& (1 << 20)) {
7504 gen_load_exclusive(s
, rs
, 15, addr
, 2);
7506 gen_store_exclusive(s
, rd
, rs
, 15, addr
, 2);
7508 tcg_temp_free(addr
);
7509 } else if ((insn
& (1 << 6)) == 0) {
7513 tcg_gen_movi_i32(addr
, s
->pc
);
7515 addr
= load_reg(s
, rn
);
7517 tmp
= load_reg(s
, rm
);
7518 tcg_gen_add_i32(addr
, addr
, tmp
);
7519 if (insn
& (1 << 4)) {
7521 tcg_gen_add_i32(addr
, addr
, tmp
);
7523 tmp
= gen_ld16u(addr
, IS_USER(s
));
7526 tmp
= gen_ld8u(addr
, IS_USER(s
));
7529 tcg_gen_shli_i32(tmp
, tmp
, 1);
7530 tcg_gen_addi_i32(tmp
, tmp
, s
->pc
);
7531 store_reg(s
, 15, tmp
);
7533 /* Load/store exclusive byte/halfword/doubleword. */
7535 op
= (insn
>> 4) & 0x3;
7539 addr
= tcg_temp_local_new();
7540 load_reg_var(s
, addr
, rn
);
7541 if (insn
& (1 << 20)) {
7542 gen_load_exclusive(s
, rs
, rd
, addr
, op
);
7544 gen_store_exclusive(s
, rm
, rs
, rd
, addr
, op
);
7546 tcg_temp_free(addr
);
7549 /* Load/store multiple, RFE, SRS. */
7550 if (((insn
>> 23) & 1) == ((insn
>> 24) & 1)) {
7551 /* Not available in user mode. */
7554 if (insn
& (1 << 20)) {
7556 addr
= load_reg(s
, rn
);
7557 if ((insn
& (1 << 24)) == 0)
7558 tcg_gen_addi_i32(addr
, addr
, -8);
7559 /* Load PC into tmp and CPSR into tmp2. */
7560 tmp
= gen_ld32(addr
, 0);
7561 tcg_gen_addi_i32(addr
, addr
, 4);
7562 tmp2
= gen_ld32(addr
, 0);
7563 if (insn
& (1 << 21)) {
7564 /* Base writeback. */
7565 if (insn
& (1 << 24)) {
7566 tcg_gen_addi_i32(addr
, addr
, 4);
7568 tcg_gen_addi_i32(addr
, addr
, -4);
7570 store_reg(s
, rn
, addr
);
7574 gen_rfe(s
, tmp
, tmp2
);
7578 if (op
== (env
->uncached_cpsr
& CPSR_M
)) {
7579 addr
= load_reg(s
, 13);
7582 tmp
= tcg_const_i32(op
);
7583 gen_helper_get_r13_banked(addr
, cpu_env
, tmp
);
7584 tcg_temp_free_i32(tmp
);
7586 if ((insn
& (1 << 24)) == 0) {
7587 tcg_gen_addi_i32(addr
, addr
, -8);
7589 tmp
= load_reg(s
, 14);
7590 gen_st32(tmp
, addr
, 0);
7591 tcg_gen_addi_i32(addr
, addr
, 4);
7593 gen_helper_cpsr_read(tmp
);
7594 gen_st32(tmp
, addr
, 0);
7595 if (insn
& (1 << 21)) {
7596 if ((insn
& (1 << 24)) == 0) {
7597 tcg_gen_addi_i32(addr
, addr
, -4);
7599 tcg_gen_addi_i32(addr
, addr
, 4);
7601 if (op
== (env
->uncached_cpsr
& CPSR_M
)) {
7602 store_reg(s
, 13, addr
);
7604 tmp
= tcg_const_i32(op
);
7605 gen_helper_set_r13_banked(cpu_env
, tmp
, addr
);
7606 tcg_temp_free_i32(tmp
);
7614 /* Load/store multiple. */
7615 addr
= load_reg(s
, rn
);
7617 for (i
= 0; i
< 16; i
++) {
7618 if (insn
& (1 << i
))
7621 if (insn
& (1 << 24)) {
7622 tcg_gen_addi_i32(addr
, addr
, -offset
);
7625 for (i
= 0; i
< 16; i
++) {
7626 if ((insn
& (1 << i
)) == 0)
7628 if (insn
& (1 << 20)) {
7630 tmp
= gen_ld32(addr
, IS_USER(s
));
7634 store_reg(s
, i
, tmp
);
7638 tmp
= load_reg(s
, i
);
7639 gen_st32(tmp
, addr
, IS_USER(s
));
7641 tcg_gen_addi_i32(addr
, addr
, 4);
7643 if (insn
& (1 << 21)) {
7644 /* Base register writeback. */
7645 if (insn
& (1 << 24)) {
7646 tcg_gen_addi_i32(addr
, addr
, -offset
);
7648 /* Fault if writeback register is in register list. */
7649 if (insn
& (1 << rn
))
7651 store_reg(s
, rn
, addr
);
7660 op
= (insn
>> 21) & 0xf;
7662 /* Halfword pack. */
7663 tmp
= load_reg(s
, rn
);
7664 tmp2
= load_reg(s
, rm
);
7665 shift
= ((insn
>> 10) & 0x1c) | ((insn
>> 6) & 0x3);
7666 if (insn
& (1 << 5)) {
7670 tcg_gen_sari_i32(tmp2
, tmp2
, shift
);
7671 tcg_gen_andi_i32(tmp
, tmp
, 0xffff0000);
7672 tcg_gen_ext16u_i32(tmp2
, tmp2
);
7676 tcg_gen_shli_i32(tmp2
, tmp2
, shift
);
7677 tcg_gen_ext16u_i32(tmp
, tmp
);
7678 tcg_gen_andi_i32(tmp2
, tmp2
, 0xffff0000);
7680 tcg_gen_or_i32(tmp
, tmp
, tmp2
);
7682 store_reg(s
, rd
, tmp
);
7684 /* Data processing register constant shift. */
7687 tcg_gen_movi_i32(tmp
, 0);
7689 tmp
= load_reg(s
, rn
);
7691 tmp2
= load_reg(s
, rm
);
7693 shiftop
= (insn
>> 4) & 3;
7694 shift
= ((insn
>> 6) & 3) | ((insn
>> 10) & 0x1c);
7695 conds
= (insn
& (1 << 20)) != 0;
7696 logic_cc
= (conds
&& thumb2_logic_op(op
));
7697 gen_arm_shift_im(tmp2
, shiftop
, shift
, logic_cc
);
7698 if (gen_thumb2_data_op(s
, op
, conds
, 0, tmp
, tmp2
))
7702 store_reg(s
, rd
, tmp
);
7708 case 13: /* Misc data processing. */
7709 op
= ((insn
>> 22) & 6) | ((insn
>> 7) & 1);
7710 if (op
< 4 && (insn
& 0xf000) != 0xf000)
7713 case 0: /* Register controlled shift. */
7714 tmp
= load_reg(s
, rn
);
7715 tmp2
= load_reg(s
, rm
);
7716 if ((insn
& 0x70) != 0)
7718 op
= (insn
>> 21) & 3;
7719 logic_cc
= (insn
& (1 << 20)) != 0;
7720 gen_arm_shift_reg(tmp
, op
, tmp2
, logic_cc
);
7723 store_reg_bx(env
, s
, rd
, tmp
);
7725 case 1: /* Sign/zero extend. */
7726 tmp
= load_reg(s
, rm
);
7727 shift
= (insn
>> 4) & 3;
7728 /* ??? In many cases it's not necessary to do a
7729 rotate, a shift is sufficient. */
7731 tcg_gen_rotri_i32(tmp
, tmp
, shift
* 8);
7732 op
= (insn
>> 20) & 7;
7734 case 0: gen_sxth(tmp
); break;
7735 case 1: gen_uxth(tmp
); break;
7736 case 2: gen_sxtb16(tmp
); break;
7737 case 3: gen_uxtb16(tmp
); break;
7738 case 4: gen_sxtb(tmp
); break;
7739 case 5: gen_uxtb(tmp
); break;
7740 default: goto illegal_op
;
7743 tmp2
= load_reg(s
, rn
);
7744 if ((op
>> 1) == 1) {
7745 gen_add16(tmp
, tmp2
);
7747 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
7751 store_reg(s
, rd
, tmp
);
7753 case 2: /* SIMD add/subtract. */
7754 op
= (insn
>> 20) & 7;
7755 shift
= (insn
>> 4) & 7;
7756 if ((op
& 3) == 3 || (shift
& 3) == 3)
7758 tmp
= load_reg(s
, rn
);
7759 tmp2
= load_reg(s
, rm
);
7760 gen_thumb2_parallel_addsub(op
, shift
, tmp
, tmp2
);
7762 store_reg(s
, rd
, tmp
);
7764 case 3: /* Other data processing. */
7765 op
= ((insn
>> 17) & 0x38) | ((insn
>> 4) & 7);
7767 /* Saturating add/subtract. */
7768 tmp
= load_reg(s
, rn
);
7769 tmp2
= load_reg(s
, rm
);
7771 gen_helper_double_saturate(tmp
, tmp
);
7773 gen_helper_sub_saturate(tmp
, tmp2
, tmp
);
7775 gen_helper_add_saturate(tmp
, tmp
, tmp2
);
7778 tmp
= load_reg(s
, rn
);
7780 case 0x0a: /* rbit */
7781 gen_helper_rbit(tmp
, tmp
);
7783 case 0x08: /* rev */
7784 tcg_gen_bswap32_i32(tmp
, tmp
);
7786 case 0x09: /* rev16 */
7789 case 0x0b: /* revsh */
7792 case 0x10: /* sel */
7793 tmp2
= load_reg(s
, rm
);
7795 tcg_gen_ld_i32(tmp3
, cpu_env
, offsetof(CPUState
, GE
));
7796 gen_helper_sel_flags(tmp
, tmp3
, tmp
, tmp2
);
7800 case 0x18: /* clz */
7801 gen_helper_clz(tmp
, tmp
);
7807 store_reg(s
, rd
, tmp
);
7809 case 4: case 5: /* 32-bit multiply. Sum of absolute differences. */
7810 op
= (insn
>> 4) & 0xf;
7811 tmp
= load_reg(s
, rn
);
7812 tmp2
= load_reg(s
, rm
);
7813 switch ((insn
>> 20) & 7) {
7814 case 0: /* 32 x 32 -> 32 */
7815 tcg_gen_mul_i32(tmp
, tmp
, tmp2
);
7818 tmp2
= load_reg(s
, rs
);
7820 tcg_gen_sub_i32(tmp
, tmp2
, tmp
);
7822 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
7826 case 1: /* 16 x 16 -> 32 */
7827 gen_mulxy(tmp
, tmp2
, op
& 2, op
& 1);
7830 tmp2
= load_reg(s
, rs
);
7831 gen_helper_add_setq(tmp
, tmp
, tmp2
);
7835 case 2: /* Dual multiply add. */
7836 case 4: /* Dual multiply subtract. */
7838 gen_swap_half(tmp2
);
7839 gen_smul_dual(tmp
, tmp2
);
7840 /* This addition cannot overflow. */
7841 if (insn
& (1 << 22)) {
7842 tcg_gen_sub_i32(tmp
, tmp
, tmp2
);
7844 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
7849 tmp2
= load_reg(s
, rs
);
7850 gen_helper_add_setq(tmp
, tmp
, tmp2
);
7854 case 3: /* 32 * 16 -> 32msb */
7856 tcg_gen_sari_i32(tmp2
, tmp2
, 16);
7859 tmp64
= gen_muls_i64_i32(tmp
, tmp2
);
7860 tcg_gen_shri_i64(tmp64
, tmp64
, 16);
7862 tcg_gen_trunc_i64_i32(tmp
, tmp64
);
7863 tcg_temp_free_i64(tmp64
);
7866 tmp2
= load_reg(s
, rs
);
7867 gen_helper_add_setq(tmp
, tmp
, tmp2
);
7871 case 5: case 6: /* 32 * 32 -> 32msb (SMMUL, SMMLA, SMMLS) */
7872 tmp64
= gen_muls_i64_i32(tmp
, tmp2
);
7874 tmp
= load_reg(s
, rs
);
7875 if (insn
& (1 << 20)) {
7876 tmp64
= gen_addq_msw(tmp64
, tmp
);
7878 tmp64
= gen_subq_msw(tmp64
, tmp
);
7881 if (insn
& (1 << 4)) {
7882 tcg_gen_addi_i64(tmp64
, tmp64
, 0x80000000u
);
7884 tcg_gen_shri_i64(tmp64
, tmp64
, 32);
7886 tcg_gen_trunc_i64_i32(tmp
, tmp64
);
7887 tcg_temp_free_i64(tmp64
);
7889 case 7: /* Unsigned sum of absolute differences. */
7890 gen_helper_usad8(tmp
, tmp
, tmp2
);
7893 tmp2
= load_reg(s
, rs
);
7894 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
7899 store_reg(s
, rd
, tmp
);
7901 case 6: case 7: /* 64-bit multiply, Divide. */
7902 op
= ((insn
>> 4) & 0xf) | ((insn
>> 16) & 0x70);
7903 tmp
= load_reg(s
, rn
);
7904 tmp2
= load_reg(s
, rm
);
7905 if ((op
& 0x50) == 0x10) {
7907 if (!arm_feature(env
, ARM_FEATURE_DIV
))
7910 gen_helper_udiv(tmp
, tmp
, tmp2
);
7912 gen_helper_sdiv(tmp
, tmp
, tmp2
);
7914 store_reg(s
, rd
, tmp
);
7915 } else if ((op
& 0xe) == 0xc) {
7916 /* Dual multiply accumulate long. */
7918 gen_swap_half(tmp2
);
7919 gen_smul_dual(tmp
, tmp2
);
7921 tcg_gen_sub_i32(tmp
, tmp
, tmp2
);
7923 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
7927 tmp64
= tcg_temp_new_i64();
7928 tcg_gen_ext_i32_i64(tmp64
, tmp
);
7930 gen_addq(s
, tmp64
, rs
, rd
);
7931 gen_storeq_reg(s
, rs
, rd
, tmp64
);
7932 tcg_temp_free_i64(tmp64
);
7935 /* Unsigned 64-bit multiply */
7936 tmp64
= gen_mulu_i64_i32(tmp
, tmp2
);
7940 gen_mulxy(tmp
, tmp2
, op
& 2, op
& 1);
7942 tmp64
= tcg_temp_new_i64();
7943 tcg_gen_ext_i32_i64(tmp64
, tmp
);
7946 /* Signed 64-bit multiply */
7947 tmp64
= gen_muls_i64_i32(tmp
, tmp2
);
7952 gen_addq_lo(s
, tmp64
, rs
);
7953 gen_addq_lo(s
, tmp64
, rd
);
7954 } else if (op
& 0x40) {
7955 /* 64-bit accumulate. */
7956 gen_addq(s
, tmp64
, rs
, rd
);
7958 gen_storeq_reg(s
, rs
, rd
, tmp64
);
7959 tcg_temp_free_i64(tmp64
);
7964 case 6: case 7: case 14: case 15:
7966 if (((insn
>> 24) & 3) == 3) {
7967 /* Translate into the equivalent ARM encoding. */
7968 insn
= (insn
& 0xe2ffffff) | ((insn
& (1 << 28)) >> 4);
7969 if (disas_neon_data_insn(env
, s
, insn
))
7972 if (insn
& (1 << 28))
7974 if (disas_coproc_insn (env
, s
, insn
))
7978 case 8: case 9: case 10: case 11:
7979 if (insn
& (1 << 15)) {
7980 /* Branches, misc control. */
7981 if (insn
& 0x5000) {
7982 /* Unconditional branch. */
7983 /* signextend(hw1[10:0]) -> offset[:12]. */
7984 offset
= ((int32_t)insn
<< 5) >> 9 & ~(int32_t)0xfff;
7985 /* hw1[10:0] -> offset[11:1]. */
7986 offset
|= (insn
& 0x7ff) << 1;
7987 /* (~hw2[13, 11] ^ offset[24]) -> offset[23,22]
7988 offset[24:22] already have the same value because of the
7989 sign extension above. */
7990 offset
^= ((~insn
) & (1 << 13)) << 10;
7991 offset
^= ((~insn
) & (1 << 11)) << 11;
7993 if (insn
& (1 << 14)) {
7994 /* Branch and link. */
7995 tcg_gen_movi_i32(cpu_R
[14], s
->pc
| 1);
7999 if (insn
& (1 << 12)) {
8004 offset
&= ~(uint32_t)2;
8005 gen_bx_im(s
, offset
);
8007 } else if (((insn
>> 23) & 7) == 7) {
8009 if (insn
& (1 << 13))
8012 if (insn
& (1 << 26)) {
8013 /* Secure monitor call (v6Z) */
8014 goto illegal_op
; /* not implemented. */
8016 op
= (insn
>> 20) & 7;
8018 case 0: /* msr cpsr. */
8020 tmp
= load_reg(s
, rn
);
8021 addr
= tcg_const_i32(insn
& 0xff);
8022 gen_helper_v7m_msr(cpu_env
, addr
, tmp
);
8023 tcg_temp_free_i32(addr
);
8029 case 1: /* msr spsr. */
8032 tmp
= load_reg(s
, rn
);
8034 msr_mask(env
, s
, (insn
>> 8) & 0xf, op
== 1),
8038 case 2: /* cps, nop-hint. */
8039 if (((insn
>> 8) & 7) == 0) {
8040 gen_nop_hint(s
, insn
& 0xff);
8042 /* Implemented as NOP in user mode. */
8047 if (insn
& (1 << 10)) {
8048 if (insn
& (1 << 7))
8050 if (insn
& (1 << 6))
8052 if (insn
& (1 << 5))
8054 if (insn
& (1 << 9))
8055 imm
= CPSR_A
| CPSR_I
| CPSR_F
;
8057 if (insn
& (1 << 8)) {
8059 imm
|= (insn
& 0x1f);
8062 gen_set_psr_im(s
, offset
, 0, imm
);
8065 case 3: /* Special control operations. */
8067 op
= (insn
>> 4) & 0xf;
8075 /* These execute as NOPs. */
8082 /* Trivial implementation equivalent to bx. */
8083 tmp
= load_reg(s
, rn
);
8086 case 5: /* Exception return. */
8090 if (rn
!= 14 || rd
!= 15) {
8093 tmp
= load_reg(s
, rn
);
8094 tcg_gen_subi_i32(tmp
, tmp
, insn
& 0xff);
8095 gen_exception_return(s
, tmp
);
8097 case 6: /* mrs cpsr. */
8100 addr
= tcg_const_i32(insn
& 0xff);
8101 gen_helper_v7m_mrs(tmp
, cpu_env
, addr
);
8102 tcg_temp_free_i32(addr
);
8104 gen_helper_cpsr_read(tmp
);
8106 store_reg(s
, rd
, tmp
);
8108 case 7: /* mrs spsr. */
8109 /* Not accessible in user mode. */
8110 if (IS_USER(s
) || IS_M(env
))
8112 tmp
= load_cpu_field(spsr
);
8113 store_reg(s
, rd
, tmp
);
8118 /* Conditional branch. */
8119 op
= (insn
>> 22) & 0xf;
8120 /* Generate a conditional jump to next instruction. */
8121 s
->condlabel
= gen_new_label();
8122 gen_test_cc(op
^ 1, s
->condlabel
);
8125 /* offset[11:1] = insn[10:0] */
8126 offset
= (insn
& 0x7ff) << 1;
8127 /* offset[17:12] = insn[21:16]. */
8128 offset
|= (insn
& 0x003f0000) >> 4;
8129 /* offset[31:20] = insn[26]. */
8130 offset
|= ((int32_t)((insn
<< 5) & 0x80000000)) >> 11;
8131 /* offset[18] = insn[13]. */
8132 offset
|= (insn
& (1 << 13)) << 5;
8133 /* offset[19] = insn[11]. */
8134 offset
|= (insn
& (1 << 11)) << 8;
8136 /* jump to the offset */
8137 gen_jmp(s
, s
->pc
+ offset
);
8140 /* Data processing immediate. */
8141 if (insn
& (1 << 25)) {
8142 if (insn
& (1 << 24)) {
8143 if (insn
& (1 << 20))
8145 /* Bitfield/Saturate. */
8146 op
= (insn
>> 21) & 7;
8148 shift
= ((insn
>> 6) & 3) | ((insn
>> 10) & 0x1c);
8151 tcg_gen_movi_i32(tmp
, 0);
8153 tmp
= load_reg(s
, rn
);
8156 case 2: /* Signed bitfield extract. */
8158 if (shift
+ imm
> 32)
8161 gen_sbfx(tmp
, shift
, imm
);
8163 case 6: /* Unsigned bitfield extract. */
8165 if (shift
+ imm
> 32)
8168 gen_ubfx(tmp
, shift
, (1u << imm
) - 1);
8170 case 3: /* Bitfield insert/clear. */
8173 imm
= imm
+ 1 - shift
;
8175 tmp2
= load_reg(s
, rd
);
8176 gen_bfi(tmp
, tmp2
, tmp
, shift
, (1u << imm
) - 1);
8182 default: /* Saturate. */
8185 tcg_gen_sari_i32(tmp
, tmp
, shift
);
8187 tcg_gen_shli_i32(tmp
, tmp
, shift
);
8189 tmp2
= tcg_const_i32(imm
);
8192 if ((op
& 1) && shift
== 0)
8193 gen_helper_usat16(tmp
, tmp
, tmp2
);
8195 gen_helper_usat(tmp
, tmp
, tmp2
);
8198 if ((op
& 1) && shift
== 0)
8199 gen_helper_ssat16(tmp
, tmp
, tmp2
);
8201 gen_helper_ssat(tmp
, tmp
, tmp2
);
8203 tcg_temp_free_i32(tmp2
);
8206 store_reg(s
, rd
, tmp
);
8208 imm
= ((insn
& 0x04000000) >> 15)
8209 | ((insn
& 0x7000) >> 4) | (insn
& 0xff);
8210 if (insn
& (1 << 22)) {
8211 /* 16-bit immediate. */
8212 imm
|= (insn
>> 4) & 0xf000;
8213 if (insn
& (1 << 23)) {
8215 tmp
= load_reg(s
, rd
);
8216 tcg_gen_ext16u_i32(tmp
, tmp
);
8217 tcg_gen_ori_i32(tmp
, tmp
, imm
<< 16);
8221 tcg_gen_movi_i32(tmp
, imm
);
8224 /* Add/sub 12-bit immediate. */
8226 offset
= s
->pc
& ~(uint32_t)3;
8227 if (insn
& (1 << 23))
8232 tcg_gen_movi_i32(tmp
, offset
);
8234 tmp
= load_reg(s
, rn
);
8235 if (insn
& (1 << 23))
8236 tcg_gen_subi_i32(tmp
, tmp
, imm
);
8238 tcg_gen_addi_i32(tmp
, tmp
, imm
);
8241 store_reg(s
, rd
, tmp
);
8244 int shifter_out
= 0;
8245 /* modified 12-bit immediate. */
8246 shift
= ((insn
& 0x04000000) >> 23) | ((insn
& 0x7000) >> 12);
8247 imm
= (insn
& 0xff);
8250 /* Nothing to do. */
8252 case 1: /* 00XY00XY */
8255 case 2: /* XY00XY00 */
8259 case 3: /* XYXYXYXY */
8263 default: /* Rotated constant. */
8264 shift
= (shift
<< 1) | (imm
>> 7);
8266 imm
= imm
<< (32 - shift
);
8271 tcg_gen_movi_i32(tmp2
, imm
);
8272 rn
= (insn
>> 16) & 0xf;
8275 tcg_gen_movi_i32(tmp
, 0);
8277 tmp
= load_reg(s
, rn
);
8279 op
= (insn
>> 21) & 0xf;
8280 if (gen_thumb2_data_op(s
, op
, (insn
& (1 << 20)) != 0,
8281 shifter_out
, tmp
, tmp2
))
8284 rd
= (insn
>> 8) & 0xf;
8286 store_reg(s
, rd
, tmp
);
8293 case 12: /* Load/store single data item. */
8298 if ((insn
& 0x01100000) == 0x01000000) {
8299 if (disas_neon_ls_insn(env
, s
, insn
))
8307 /* s->pc has already been incremented by 4. */
8308 imm
= s
->pc
& 0xfffffffc;
8309 if (insn
& (1 << 23))
8310 imm
+= insn
& 0xfff;
8312 imm
-= insn
& 0xfff;
8313 tcg_gen_movi_i32(addr
, imm
);
8315 addr
= load_reg(s
, rn
);
8316 if (insn
& (1 << 23)) {
8317 /* Positive offset. */
8319 tcg_gen_addi_i32(addr
, addr
, imm
);
8321 op
= (insn
>> 8) & 7;
8324 case 0: case 8: /* Shifted Register. */
8325 shift
= (insn
>> 4) & 0xf;
8328 tmp
= load_reg(s
, rm
);
8330 tcg_gen_shli_i32(tmp
, tmp
, shift
);
8331 tcg_gen_add_i32(addr
, addr
, tmp
);
8334 case 4: /* Negative offset. */
8335 tcg_gen_addi_i32(addr
, addr
, -imm
);
8337 case 6: /* User privilege. */
8338 tcg_gen_addi_i32(addr
, addr
, imm
);
8341 case 1: /* Post-decrement. */
8344 case 3: /* Post-increment. */
8348 case 5: /* Pre-decrement. */
8351 case 7: /* Pre-increment. */
8352 tcg_gen_addi_i32(addr
, addr
, imm
);
8360 op
= ((insn
>> 21) & 3) | ((insn
>> 22) & 4);
8361 if (insn
& (1 << 20)) {
8363 if (rs
== 15 && op
!= 2) {
8366 /* Memory hint. Implemented as NOP. */
8369 case 0: tmp
= gen_ld8u(addr
, user
); break;
8370 case 4: tmp
= gen_ld8s(addr
, user
); break;
8371 case 1: tmp
= gen_ld16u(addr
, user
); break;
8372 case 5: tmp
= gen_ld16s(addr
, user
); break;
8373 case 2: tmp
= gen_ld32(addr
, user
); break;
8374 default: goto illegal_op
;
8379 store_reg(s
, rs
, tmp
);
8386 tmp
= load_reg(s
, rs
);
8388 case 0: gen_st8(tmp
, addr
, user
); break;
8389 case 1: gen_st16(tmp
, addr
, user
); break;
8390 case 2: gen_st32(tmp
, addr
, user
); break;
8391 default: goto illegal_op
;
8395 tcg_gen_addi_i32(addr
, addr
, imm
);
8397 store_reg(s
, rn
, addr
);
/* Translate one Thumb instruction.
   The instruction is fetched with lduw_code(s->pc) and decoded by a switch
   on insn >> 12.  Some encodings are handed to disas_thumb2_insn.
   env: CPU state, passed on to disas_thumb2_insn.
   s:   translation context; the visible code reads s->pc and the
        condexec_mask/condexec_cond fields and writes s->condlabel,
        s->is_jmp and, for the IT instruction, the condexec fields.
   NOTE(review): this listing omits many original lines (braces, case
   labels, else branches), so the control structure shown is incomplete. */
8411 static void disas_thumb_insn(CPUState
*env
, DisasContext
*s
)
8413 uint32_t val
, insn
, op
, rm
, rn
, rd
, shift
, cond
;
/* A nonzero condexec_mask means conditional execution is active: unless
   the condition is AL (0x0e), emit a test of the inverted condition that
   jumps to a fresh condlabel. */
8420 if (s
->condexec_mask
) {
8421 cond
= s
->condexec_cond
;
8422 if (cond
!= 0x0e) { /* Skip conditional when condition is AL. */
8423 s
->condlabel
= gen_new_label();
8424 gen_test_cc(cond
^ 1, s
->condlabel
);
/* Fetch the instruction at the current PC and dispatch on insn >> 12. */
8429 insn
= lduw_code(s
->pc
);
8432 switch (insn
>> 12) {
8436 op
= (insn
>> 11) & 3;
8439 rn
= (insn
>> 3) & 7;
8440 tmp
= load_reg(s
, rn
);
8441 if (insn
& (1 << 10)) {
8444 tcg_gen_movi_i32(tmp2
, (insn
>> 6) & 7);
8447 rm
= (insn
>> 6) & 7;
8448 tmp2
= load_reg(s
, rm
);
8450 if (insn
& (1 << 9)) {
8451 if (s
->condexec_mask
)
8452 tcg_gen_sub_i32(tmp
, tmp
, tmp2
);
8454 gen_helper_sub_cc(tmp
, tmp
, tmp2
);
8456 if (s
->condexec_mask
)
8457 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
8459 gen_helper_add_cc(tmp
, tmp
, tmp2
);
8462 store_reg(s
, rd
, tmp
);
8464 /* shift immediate */
8465 rm
= (insn
>> 3) & 7;
8466 shift
= (insn
>> 6) & 0x1f;
8467 tmp
= load_reg(s
, rm
);
8468 gen_arm_shift_im(tmp
, op
, shift
, s
->condexec_mask
== 0);
8469 if (!s
->condexec_mask
)
8471 store_reg(s
, rd
, tmp
);
8475 /* arithmetic large immediate */
8476 op
= (insn
>> 11) & 3;
8477 rd
= (insn
>> 8) & 0x7;
8478 if (op
== 0) { /* mov */
8480 tcg_gen_movi_i32(tmp
, insn
& 0xff);
8481 if (!s
->condexec_mask
)
8483 store_reg(s
, rd
, tmp
);
8485 tmp
= load_reg(s
, rd
);
8487 tcg_gen_movi_i32(tmp2
, insn
& 0xff);
8490 gen_helper_sub_cc(tmp
, tmp
, tmp2
);
8495 if (s
->condexec_mask
)
8496 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
8498 gen_helper_add_cc(tmp
, tmp
, tmp2
);
8500 store_reg(s
, rd
, tmp
);
8503 if (s
->condexec_mask
)
8504 tcg_gen_sub_i32(tmp
, tmp
, tmp2
);
8506 gen_helper_sub_cc(tmp
, tmp
, tmp2
);
8508 store_reg(s
, rd
, tmp
);
8514 if (insn
& (1 << 11)) {
8515 rd
= (insn
>> 8) & 7;
8516 /* load pc-relative. Bit 1 of PC is ignored. */
8517 val
= s
->pc
+ 2 + ((insn
& 0xff) * 4);
8518 val
&= ~(uint32_t)2;
8520 tcg_gen_movi_i32(addr
, val
);
8521 tmp
= gen_ld32(addr
, IS_USER(s
));
8523 store_reg(s
, rd
, tmp
);
8526 if (insn
& (1 << 10)) {
8527 /* data processing extended or blx */
8528 rd
= (insn
& 7) | ((insn
>> 4) & 8);
8529 rm
= (insn
>> 3) & 0xf;
8530 op
= (insn
>> 8) & 3;
8533 tmp
= load_reg(s
, rd
);
8534 tmp2
= load_reg(s
, rm
);
8535 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
8537 store_reg(s
, rd
, tmp
);
8540 tmp
= load_reg(s
, rd
);
8541 tmp2
= load_reg(s
, rm
);
8542 gen_helper_sub_cc(tmp
, tmp
, tmp2
);
8546 case 2: /* mov/cpy */
8547 tmp
= load_reg(s
, rm
);
8548 store_reg(s
, rd
, tmp
);
8550 case 3:/* branch [and link] exchange thumb register */
8551 tmp
= load_reg(s
, rm
);
8552 if (insn
& (1 << 7)) {
8553 val
= (uint32_t)s
->pc
| 1;
8555 tcg_gen_movi_i32(tmp2
, val
);
8556 store_reg(s
, 14, tmp2
);
8564 /* data processing register */
8566 rm
= (insn
>> 3) & 7;
8567 op
= (insn
>> 6) & 0xf;
8568 if (op
== 2 || op
== 3 || op
== 4 || op
== 7) {
8569 /* the shift/rotate ops want the operands backwards */
8578 if (op
== 9) { /* neg */
8580 tcg_gen_movi_i32(tmp
, 0);
8581 } else if (op
!= 0xf) { /* mvn doesn't read its first operand */
8582 tmp
= load_reg(s
, rd
);
8587 tmp2
= load_reg(s
, rm
);
8590 tcg_gen_and_i32(tmp
, tmp
, tmp2
);
8591 if (!s
->condexec_mask
)
8595 tcg_gen_xor_i32(tmp
, tmp
, tmp2
);
8596 if (!s
->condexec_mask
)
8600 if (s
->condexec_mask
) {
8601 gen_helper_shl(tmp2
, tmp2
, tmp
);
8603 gen_helper_shl_cc(tmp2
, tmp2
, tmp
);
8608 if (s
->condexec_mask
) {
8609 gen_helper_shr(tmp2
, tmp2
, tmp
);
8611 gen_helper_shr_cc(tmp2
, tmp2
, tmp
);
8616 if (s
->condexec_mask
) {
8617 gen_helper_sar(tmp2
, tmp2
, tmp
);
8619 gen_helper_sar_cc(tmp2
, tmp2
, tmp
);
8624 if (s
->condexec_mask
)
8627 gen_helper_adc_cc(tmp
, tmp
, tmp2
);
8630 if (s
->condexec_mask
)
8631 gen_sub_carry(tmp
, tmp
, tmp2
);
8633 gen_helper_sbc_cc(tmp
, tmp
, tmp2
);
8636 if (s
->condexec_mask
) {
8637 tcg_gen_andi_i32(tmp
, tmp
, 0x1f);
8638 tcg_gen_rotr_i32(tmp2
, tmp2
, tmp
);
8640 gen_helper_ror_cc(tmp2
, tmp2
, tmp
);
8645 tcg_gen_and_i32(tmp
, tmp
, tmp2
);
8650 if (s
->condexec_mask
)
8651 tcg_gen_neg_i32(tmp
, tmp2
);
8653 gen_helper_sub_cc(tmp
, tmp
, tmp2
);
8656 gen_helper_sub_cc(tmp
, tmp
, tmp2
);
8660 gen_helper_add_cc(tmp
, tmp
, tmp2
);
8664 tcg_gen_or_i32(tmp
, tmp
, tmp2
);
8665 if (!s
->condexec_mask
)
8669 tcg_gen_mul_i32(tmp
, tmp
, tmp2
);
8670 if (!s
->condexec_mask
)
8674 tcg_gen_andc_i32(tmp
, tmp
, tmp2
);
8675 if (!s
->condexec_mask
)
8679 tcg_gen_not_i32(tmp2
, tmp2
);
8680 if (!s
->condexec_mask
)
8688 store_reg(s
, rm
, tmp2
);
8692 store_reg(s
, rd
, tmp
);
8702 /* load/store register offset. */
8704 rn
= (insn
>> 3) & 7;
8705 rm
= (insn
>> 6) & 7;
8706 op
= (insn
>> 9) & 7;
8707 addr
= load_reg(s
, rn
);
8708 tmp
= load_reg(s
, rm
);
8709 tcg_gen_add_i32(addr
, addr
, tmp
);
8712 if (op
< 3) /* store */
8713 tmp
= load_reg(s
, rd
);
8717 gen_st32(tmp
, addr
, IS_USER(s
));
8720 gen_st16(tmp
, addr
, IS_USER(s
));
8723 gen_st8(tmp
, addr
, IS_USER(s
));
8726 tmp
= gen_ld8s(addr
, IS_USER(s
));
8729 tmp
= gen_ld32(addr
, IS_USER(s
));
8732 tmp
= gen_ld16u(addr
, IS_USER(s
));
8735 tmp
= gen_ld8u(addr
, IS_USER(s
));
8738 tmp
= gen_ld16s(addr
, IS_USER(s
));
8741 if (op
>= 3) /* load */
8742 store_reg(s
, rd
, tmp
);
8747 /* load/store word immediate offset */
8749 rn
= (insn
>> 3) & 7;
8750 addr
= load_reg(s
, rn
);
8751 val
= (insn
>> 4) & 0x7c;
8752 tcg_gen_addi_i32(addr
, addr
, val
);
8754 if (insn
& (1 << 11)) {
8756 tmp
= gen_ld32(addr
, IS_USER(s
));
8757 store_reg(s
, rd
, tmp
);
8760 tmp
= load_reg(s
, rd
);
8761 gen_st32(tmp
, addr
, IS_USER(s
));
8767 /* load/store byte immediate offset */
8769 rn
= (insn
>> 3) & 7;
8770 addr
= load_reg(s
, rn
);
8771 val
= (insn
>> 6) & 0x1f;
8772 tcg_gen_addi_i32(addr
, addr
, val
);
8774 if (insn
& (1 << 11)) {
8776 tmp
= gen_ld8u(addr
, IS_USER(s
));
8777 store_reg(s
, rd
, tmp
);
8780 tmp
= load_reg(s
, rd
);
8781 gen_st8(tmp
, addr
, IS_USER(s
));
8787 /* load/store halfword immediate offset */
8789 rn
= (insn
>> 3) & 7;
8790 addr
= load_reg(s
, rn
);
8791 val
= (insn
>> 5) & 0x3e;
8792 tcg_gen_addi_i32(addr
, addr
, val
);
8794 if (insn
& (1 << 11)) {
8796 tmp
= gen_ld16u(addr
, IS_USER(s
));
8797 store_reg(s
, rd
, tmp
);
8800 tmp
= load_reg(s
, rd
);
8801 gen_st16(tmp
, addr
, IS_USER(s
));
8807 /* load/store from stack */
8808 rd
= (insn
>> 8) & 7;
8809 addr
= load_reg(s
, 13);
8810 val
= (insn
& 0xff) * 4;
8811 tcg_gen_addi_i32(addr
, addr
, val
);
8813 if (insn
& (1 << 11)) {
8815 tmp
= gen_ld32(addr
, IS_USER(s
));
8816 store_reg(s
, rd
, tmp
);
8819 tmp
= load_reg(s
, rd
);
8820 gen_st32(tmp
, addr
, IS_USER(s
));
8826 /* add to high reg */
8827 rd
= (insn
>> 8) & 7;
8828 if (insn
& (1 << 11)) {
8830 tmp
= load_reg(s
, 13);
8832 /* PC. bit 1 is ignored. */
8834 tcg_gen_movi_i32(tmp
, (s
->pc
+ 2) & ~(uint32_t)2);
8836 val
= (insn
& 0xff) * 4;
8837 tcg_gen_addi_i32(tmp
, tmp
, val
);
8838 store_reg(s
, rd
, tmp
);
8843 op
= (insn
>> 8) & 0xf;
8846 /* adjust stack pointer */
8847 tmp
= load_reg(s
, 13);
8848 val
= (insn
& 0x7f) * 4;
8849 if (insn
& (1 << 7))
8850 val
= -(int32_t)val
;
8851 tcg_gen_addi_i32(tmp
, tmp
, val
);
8852 store_reg(s
, 13, tmp
);
8855 case 2: /* sign/zero extend. */
8858 rm
= (insn
>> 3) & 7;
8859 tmp
= load_reg(s
, rm
);
8860 switch ((insn
>> 6) & 3) {
8861 case 0: gen_sxth(tmp
); break;
8862 case 1: gen_sxtb(tmp
); break;
8863 case 2: gen_uxth(tmp
); break;
8864 case 3: gen_uxtb(tmp
); break;
8866 store_reg(s
, rd
, tmp
);
8868 case 4: case 5: case 0xc: case 0xd:
8870 addr
= load_reg(s
, 13);
8871 if (insn
& (1 << 8))
8875 for (i
= 0; i
< 8; i
++) {
8876 if (insn
& (1 << i
))
8879 if ((insn
& (1 << 11)) == 0) {
8880 tcg_gen_addi_i32(addr
, addr
, -offset
);
8882 for (i
= 0; i
< 8; i
++) {
8883 if (insn
& (1 << i
)) {
8884 if (insn
& (1 << 11)) {
8886 tmp
= gen_ld32(addr
, IS_USER(s
));
8887 store_reg(s
, i
, tmp
);
8890 tmp
= load_reg(s
, i
);
8891 gen_st32(tmp
, addr
, IS_USER(s
));
8893 /* advance to the next address. */
8894 tcg_gen_addi_i32(addr
, addr
, 4);
8898 if (insn
& (1 << 8)) {
8899 if (insn
& (1 << 11)) {
8901 tmp
= gen_ld32(addr
, IS_USER(s
));
8902 /* don't set the pc until the rest of the instruction
8906 tmp
= load_reg(s
, 14);
8907 gen_st32(tmp
, addr
, IS_USER(s
));
8909 tcg_gen_addi_i32(addr
, addr
, 4);
8911 if ((insn
& (1 << 11)) == 0) {
8912 tcg_gen_addi_i32(addr
, addr
, -offset
);
8914 /* write back the new stack pointer */
8915 store_reg(s
, 13, addr
);
8916 /* set the new PC value */
8917 if ((insn
& 0x0900) == 0x0900)
8921 case 1: case 3: case 9: case 11: /* czb */
8923 tmp
= load_reg(s
, rm
);
8924 s
->condlabel
= gen_new_label();
8926 if (insn
& (1 << 11))
8927 tcg_gen_brcondi_i32(TCG_COND_EQ
, tmp
, 0, s
->condlabel
);
8929 tcg_gen_brcondi_i32(TCG_COND_NE
, tmp
, 0, s
->condlabel
);
8931 offset
= ((insn
& 0xf8) >> 2) | (insn
& 0x200) >> 3;
8932 val
= (uint32_t)s
->pc
+ 2;
8937 case 15: /* IT, nop-hint. */
8938 if ((insn
& 0xf) == 0) {
8939 gen_nop_hint(s
, (insn
>> 4) & 0xf);
8943 s
->condexec_cond
= (insn
>> 4) & 0xe;
8944 s
->condexec_mask
= insn
& 0x1f;
8945 /* No actual code generated for this insn, just setup state. */
8948 case 0xe: /* bkpt */
8949 gen_set_condexec(s
);
8950 gen_set_pc_im(s
->pc
- 2);
8951 gen_exception(EXCP_BKPT
);
8952 s
->is_jmp
= DISAS_JUMP
;
8957 rn
= (insn
>> 3) & 0x7;
8959 tmp
= load_reg(s
, rn
);
8960 switch ((insn
>> 6) & 3) {
8961 case 0: tcg_gen_bswap32_i32(tmp
, tmp
); break;
8962 case 1: gen_rev16(tmp
); break;
8963 case 3: gen_revsh(tmp
); break;
8964 default: goto illegal_op
;
8966 store_reg(s
, rd
, tmp
);
8974 tmp
= tcg_const_i32((insn
& (1 << 4)) != 0);
8977 addr
= tcg_const_i32(16);
8978 gen_helper_v7m_msr(cpu_env
, addr
, tmp
);
8979 tcg_temp_free_i32(addr
);
8983 addr
= tcg_const_i32(17);
8984 gen_helper_v7m_msr(cpu_env
, addr
, tmp
);
8985 tcg_temp_free_i32(addr
);
8987 tcg_temp_free_i32(tmp
);
8990 if (insn
& (1 << 4))
8991 shift
= CPSR_A
| CPSR_I
| CPSR_F
;
8994 gen_set_psr_im(s
, ((insn
& 7) << 6), 0, shift
);
9004 /* load/store multiple */
9005 rn
= (insn
>> 8) & 0x7;
9006 addr
= load_reg(s
, rn
);
9007 for (i
= 0; i
< 8; i
++) {
9008 if (insn
& (1 << i
)) {
9009 if (insn
& (1 << 11)) {
9011 tmp
= gen_ld32(addr
, IS_USER(s
));
9012 store_reg(s
, i
, tmp
);
9015 tmp
= load_reg(s
, i
);
9016 gen_st32(tmp
, addr
, IS_USER(s
));
9018 /* advance to the next address */
9019 tcg_gen_addi_i32(addr
, addr
, 4);
9022 /* Base register writeback. */
9023 if ((insn
& (1 << rn
)) == 0) {
9024 store_reg(s
, rn
, addr
);
9031 /* conditional branch or swi */
9032 cond
= (insn
>> 8) & 0xf;
9038 gen_set_condexec(s
);
9039 gen_set_pc_im(s
->pc
);
9040 s
->is_jmp
= DISAS_SWI
;
9043 /* generate a conditional jump to next instruction */
9044 s
->condlabel
= gen_new_label();
9045 gen_test_cc(cond
^ 1, s
->condlabel
);
9048 /* jump to the offset */
9049 val
= (uint32_t)s
->pc
+ 2;
9050 offset
= ((int32_t)insn
<< 24) >> 24;
9056 if (insn
& (1 << 11)) {
9057 if (disas_thumb2_insn(env
, s
, insn
))
9061 /* unconditional branch */
9062 val
= (uint32_t)s
->pc
;
9063 offset
= ((int32_t)insn
<< 21) >> 21;
9064 val
+= (offset
<< 1) + 2;
9069 if (disas_thumb2_insn(env
, s
, insn
))
/* Raise EXCP_UDEF with the PC set to s->pc - 4.
   NOTE(review): presumably the path taken when disas_thumb2_insn rejects
   a 32-bit encoding; the label is not visible in this listing. */
9075 gen_set_condexec(s
);
9076 gen_set_pc_im(s
->pc
- 4);
9077 gen_exception(EXCP_UDEF
);
9078 s
->is_jmp
= DISAS_JUMP
;
/* Raise EXCP_UDEF with the PC set to s->pc - 2.
   NOTE(review): presumably the illegal_op path for 16-bit encodings;
   the label is not visible in this listing. */
9082 gen_set_condexec(s
);
9083 gen_set_pc_im(s
->pc
- 2);
9084 gen_exception(EXCP_UDEF
);
9085 s
->is_jmp
= DISAS_JUMP
;
9088 /* Generate intermediate code in gen_opc_buf and gen_opparam_buf for
9089 basic block 'tb'. If search_pc is TRUE, also generate PC
9090 information for each intermediate instruction.
   The translation loop calls disas_thumb_insn or disas_arm_insn once per
   instruction and keeps going until dc->is_jmp is set, the opcode buffer
   is full, single-stepping is enabled, the PC reaches the next page, or
   max_insns instructions have been translated.  On completion tb->size
   and tb->icount are filled in.
   NOTE(review): this listing omits many original lines (braces, else
   branches, case labels, some declarations), so the control structure
   shown is incomplete. */
9091 static inline void gen_intermediate_code_internal(CPUState
*env
,
9092 TranslationBlock
*tb
,
9095 DisasContext dc1
, *dc
= &dc1
;
9097 uint16_t *gen_opc_end
;
9099 target_ulong pc_start
;
9100 uint32_t next_page_start
;
9104 /* generate intermediate code */
9111 gen_opc_end
= gen_opc_buf
+ OPC_MAX_SIZE
;
9113 dc
->is_jmp
= DISAS_NEXT
;
9115 dc
->singlestep_enabled
= env
->singlestep_enabled
;
/* Seed the conditional-execution state from env->condexec_bits: the low
   four bits, shifted left by one, become the mask and the bits above them
   become the condition. */
9117 dc
->thumb
= env
->thumb
;
9118 dc
->condexec_mask
= (env
->condexec_bits
& 0xf) << 1;
9119 dc
->condexec_cond
= env
->condexec_bits
>> 4;
9120 #if !defined(CONFIG_USER_ONLY)
9122 dc
->user
= ((env
->v7m
.exception
== 0) && (env
->v7m
.control
& 1));
9124 dc
->user
= (env
->uncached_cpsr
& 0x1f) == ARM_CPU_MODE_USR
;
9127 cpu_F0s
= tcg_temp_new_i32();
9128 cpu_F1s
= tcg_temp_new_i32();
9129 cpu_F0d
= tcg_temp_new_i64();
9130 cpu_F1d
= tcg_temp_new_i64();
9133 /* FIXME: cpu_M0 can probably be the same as cpu_V0. */
9134 cpu_M0
= tcg_temp_new_i64();
9135 next_page_start
= (pc_start
& TARGET_PAGE_MASK
) + TARGET_PAGE_SIZE
;
9138 max_insns
= tb
->cflags
& CF_COUNT_MASK
;
9140 max_insns
= CF_COUNT_MASK
;
9143 /* Reset the conditional execution bits immediately. This avoids
9144 complications trying to do it at the end of the block. */
9145 if (env
->condexec_bits
)
9147 TCGv tmp
= new_tmp();
9148 tcg_gen_movi_i32(tmp
, 0);
9149 store_cpu_field(tmp
, condexec_bits
);
9152 #ifdef CONFIG_USER_ONLY
9153 /* Intercept jump to the magic kernel page. */
9154 if (dc
->pc
>= 0xffff0000) {
9155 /* We always get here via a jump, so know we are not in a
9156 conditional execution block. */
9157 gen_exception(EXCP_KERNEL_TRAP
);
9158 dc
->is_jmp
= DISAS_UPDATE
;
9162 if (dc
->pc
>= 0xfffffff0 && IS_M(env
)) {
9163 /* We always get here via a jump, so know we are not in a
9164 conditional execution block. */
9165 gen_exception(EXCP_EXCEPTION_EXIT
);
9166 dc
->is_jmp
= DISAS_UPDATE
;
/* If a breakpoint is registered at the current PC, emit EXCP_DEBUG for it
   and jump to done_generating instead of translating the instruction. */
9171 if (unlikely(!QTAILQ_EMPTY(&env
->breakpoints
))) {
9172 QTAILQ_FOREACH(bp
, &env
->breakpoints
, entry
) {
9173 if (bp
->pc
== dc
->pc
) {
9174 gen_set_condexec(dc
);
9175 gen_set_pc_im(dc
->pc
);
9176 gen_exception(EXCP_DEBUG
);
9177 dc
->is_jmp
= DISAS_JUMP
;
9178 /* Advance PC so that clearing the breakpoint will
9179 invalidate this TB. */
9181 goto done_generating
;
9187 j
= gen_opc_ptr
- gen_opc_buf
;
9191 gen_opc_instr_start
[lj
++] = 0;
9193 gen_opc_pc
[lj
] = dc
->pc
;
9194 gen_opc_instr_start
[lj
] = 1;
9195 gen_opc_icount
[lj
] = num_insns
;
9198 if (num_insns
+ 1 == max_insns
&& (tb
->cflags
& CF_LAST_IO
))
/* Translate one Thumb instruction, then advance the conditional-execution
   state: bit 4 of the mask moves into the low bit of the condition and the
   mask shifts left by one.  When the mask reaches zero the condition is
   cleared as well. */
9202 disas_thumb_insn(env
, dc
);
9203 if (dc
->condexec_mask
) {
9204 dc
->condexec_cond
= (dc
->condexec_cond
& 0xe)
9205 | ((dc
->condexec_mask
>> 4) & 1);
9206 dc
->condexec_mask
= (dc
->condexec_mask
<< 1) & 0x1f;
9207 if (dc
->condexec_mask
== 0) {
9208 dc
->condexec_cond
= 0;
9212 disas_arm_insn(env
, dc
);
9215 fprintf(stderr
, "Internal resource leak before %08x\n", dc
->pc
);
9219 if (dc
->condjmp
&& !dc
->is_jmp
) {
9220 gen_set_label(dc
->condlabel
);
9223 /* Translation stops when a conditional branch is encountered.
9224 * Otherwise the subsequent code could get translated several times.
9225 * Also stop translation when a page boundary is reached. This
9226 * ensures prefetch aborts occur at the right place. */
9228 } while (!dc
->is_jmp
&& gen_opc_ptr
< gen_opc_end
&&
9229 !env
->singlestep_enabled
&&
9231 dc
->pc
< next_page_start
&&
9232 num_insns
< max_insns
);
9234 if (tb
->cflags
& CF_LAST_IO
) {
9236 /* FIXME: This can theoretically happen with self-modifying
9238 cpu_abort(env
, "IO on conditional branch instruction");
9243 /* At this stage dc->condjmp will only be set when the skipped
9244 instruction was a conditional branch or trap, and the PC has
9245 already been written. */
9246 if (unlikely(env
->singlestep_enabled
)) {
9247 /* Make sure the pc is updated, and raise a debug exception. */
9249 gen_set_condexec(dc
);
9250 if (dc
->is_jmp
== DISAS_SWI
) {
9251 gen_exception(EXCP_SWI
);
9253 gen_exception(EXCP_DEBUG
);
9255 gen_set_label(dc
->condlabel
);
9257 if (dc
->condjmp
|| !dc
->is_jmp
) {
9258 gen_set_pc_im(dc
->pc
);
9261 gen_set_condexec(dc
);
9262 if (dc
->is_jmp
== DISAS_SWI
&& !dc
->condjmp
) {
9263 gen_exception(EXCP_SWI
);
9265 /* FIXME: Single stepping a WFI insn will not halt
9267 gen_exception(EXCP_DEBUG
);
9270 /* While branches must always occur at the end of an IT block,
9271 there are a few other things that can cause us to terminate
9272 the TB in the middle of an IT block:
9273 - Exception generating instructions (bkpt, swi, undefined).
9275 - Hardware watchpoints.
9276 Hardware breakpoints have already been handled and skip this code.
9278 gen_set_condexec(dc
);
9279 switch(dc
->is_jmp
) {
9281 gen_goto_tb(dc
, 1, dc
->pc
);
9286 /* indicate that the hash table must be used to find the next TB */
9290 /* nothing more to generate */
9296 gen_exception(EXCP_SWI
);
9300 gen_set_label(dc
->condlabel
);
9301 gen_set_condexec(dc
);
9302 gen_goto_tb(dc
, 1, dc
->pc
);
9308 gen_icount_end(tb
, num_insns
);
9309 *gen_opc_ptr
= INDEX_op_end
;
9312 if (qemu_loglevel_mask(CPU_LOG_TB_IN_ASM
)) {
9313 qemu_log("----------------\n");
9314 qemu_log("IN: %s\n", lookup_symbol(pc_start
));
9315 log_target_disas(pc_start
, dc
->pc
- pc_start
, env
->thumb
);
9320 j
= gen_opc_ptr
- gen_opc_buf
;
9323 gen_opc_instr_start
[lj
++] = 0;
/* Record how far the PC advanced from pc_start and how many instructions
   were translated. */
9325 tb
->size
= dc
->pc
- pc_start
;
9326 tb
->icount
= num_insns
;
/* Translate the block tb for CPU env by calling
   gen_intermediate_code_internal with 0 as its last argument.
   NOTE(review): that argument is presumably the search_pc flag, i.e. no
   per-instruction PC information is requested; the parameter declaration
   is not visible in this listing. */
9330 void gen_intermediate_code(CPUState
*env
, TranslationBlock
*tb
)
9332 gen_intermediate_code_internal(env
, tb
, 0);
/* Translate the block tb for CPU env by calling
   gen_intermediate_code_internal with 1 as its last argument.
   NOTE(review): that argument is presumably the search_pc flag, i.e. PC
   information is also generated for each intermediate instruction; the
   parameter declaration is not visible in this listing. */
9335 void gen_intermediate_code_pc(CPUState
*env
, TranslationBlock
*tb
)
9337 gen_intermediate_code_internal(env
, tb
, 1);
/* Printable names for the 16 possible values of the low four PSR bits.
   cpu_dump_state indexes this table with psr & 0xf.  Entries made of
   question marks are values that have no name in this table. */
9340 static const char *cpu_mode_names
[16] = {
9341 "usr", "fiq", "irq", "svc", "???", "???", "???", "abt",
9342 "???", "???", "???", "und", "???", "???", "???", "sys"
/* Write a human-readable dump of the CPU state to f through cpu_fprintf:
   the general registers, the PSR with decoded flags and mode, 16 VFP
   double registers (each also shown as two singles), and the FPSCR.
   env:         CPU state to dump.
   f:           output stream handed to cpu_fprintf.
   cpu_fprintf: printf-style output callback.
   NOTE(review): the rest of the parameter list and the local declarations
   are not visible in this listing. */
9345 void cpu_dump_state(CPUState
*env
, FILE *f
, fprintf_function cpu_fprintf
,
9355 /* ??? This assumes float64 and double have the same layout.
9356 Oh well, it's only debug dumps. */
/* General registers, printed as Rnn=value. */
9365 cpu_fprintf(f
, "R%02d=%08x", i
, env
->regs
[i
]);
9367 cpu_fprintf(f
, "\n");
9369 cpu_fprintf(f
, " ");
/* PSR line: raw value, then N/Z/C/V from bits 31..28 (a dash when clear),
   T or A depending on CPSR_T, the mode name from the low four bits, and
   32 or 26 depending on bit 4. */
9371 psr
= cpsr_read(env
);
9372 cpu_fprintf(f
, "PSR=%08x %c%c%c%c %c %s%d\n",
9374 psr
& (1 << 31) ? 'N' : '-',
9375 psr
& (1 << 30) ? 'Z' : '-',
9376 psr
& (1 << 29) ? 'C' : '-',
9377 psr
& (1 << 28) ? 'V' : '-',
9378 psr
& CPSR_T
? 'T' : 'A',
9379 cpu_mode_names
[psr
& 0xf], (psr
& 0x10) ? 32 : 26);
/* VFP registers: each of the 16 entries of env->vfp.regs is printed as
   single registers 2*i and 2*i+1 and as double register i. */
9382 for (i
= 0; i
< 16; i
++) {
9383 d
.d
= env
->vfp
.regs
[i
];
9387 cpu_fprintf(f
, "s%02d=%08x(%8g) s%02d=%08x(%8g) d%02d=%08x%08x(%8g)\n",
9388 i
* 2, (int)s0
.i
, s0
.s
,
9389 i
* 2 + 1, (int)s1
.i
, s1
.s
,
9390 i
, (int)(uint32_t)d
.l
.upper
, (int)(uint32_t)d
.l
.lower
,
/* Floating-point status and control register. */
9393 cpu_fprintf(f
, "FPSCR: %08x\n", (int)env
->vfp
.xregs
[ARM_VFP_FPSCR
]);
/* Set the guest PC (env->regs[15]) to the value recorded in
   gen_opc_pc[pc_pos].  The tb, searched_pc and puc parameters are not
   used by the visible body. */
9397 void gen_pc_load(CPUState
*env
, TranslationBlock
*tb
,
9398 unsigned long searched_pc
, int pc_pos
, void *puc
)
9400 env
->regs
[15] = gen_opc_pc
[pc_pos
];