4 * Copyright (c) 2003 Fabrice Bellard
5 * Copyright (c) 2005-2007 CodeSourcery
6 * Copyright (c) 2007 OpenedHand, Ltd.
8 * This library is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License as published by the Free Software Foundation; either
11 * version 2 of the License, or (at your option) any later version.
13 * This library is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 * Lesser General Public License for more details.
18 * You should have received a copy of the GNU Lesser General Public
19 * License along with this library; if not, write to the Free Software
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston MA 02110-1301 USA
38 #define ENABLE_ARCH_5J 0
39 #define ENABLE_ARCH_6 arm_feature(env, ARM_FEATURE_V6)
40 #define ENABLE_ARCH_6K arm_feature(env, ARM_FEATURE_V6K)
41 #define ENABLE_ARCH_6T2 arm_feature(env, ARM_FEATURE_THUMB2)
42 #define ENABLE_ARCH_7 arm_feature(env, ARM_FEATURE_V7)
44 #define ARCH(x) do { if (!ENABLE_ARCH_##x) goto illegal_op; } while(0)
46 /* internal defines */
47 typedef struct DisasContext
{
50 /* Nonzero if this instruction has been conditionally skipped. */
52 /* The label that will be jumped to when the instruction is skipped. */
54 /* Thumb-2 condtional execution bits. */
57 struct TranslationBlock
*tb
;
58 int singlestep_enabled
;
60 #if !defined(CONFIG_USER_ONLY)
65 #if defined(CONFIG_USER_ONLY)
68 #define IS_USER(s) (s->user)
71 /* These instructions trap after executing, so defer them until after the
72 conditional executions state has been updated. */
76 static TCGv_ptr cpu_env
;
77 /* We reuse the same 64-bit temporaries for efficiency. */
78 static TCGv_i64 cpu_V0
, cpu_V1
, cpu_M0
;
80 /* FIXME: These should be removed. */
82 static TCGv cpu_F0s
, cpu_F1s
;
83 static TCGv_i64 cpu_F0d
, cpu_F1d
;
85 #define ICOUNT_TEMP cpu_T[0]
86 #include "gen-icount.h"
88 /* initialize TCG globals. */
89 void arm_translate_init(void)
91 cpu_env
= tcg_global_reg_new_ptr(TCG_AREG0
, "env");
93 cpu_T
[0] = tcg_global_reg_new_i32(TCG_AREG1
, "T0");
94 cpu_T
[1] = tcg_global_reg_new_i32(TCG_AREG2
, "T1");
100 /* The code generator doesn't like lots of temporaries, so maintain our own
101 cache for reuse within a function. */
103 static int num_temps
;
104 static TCGv temps
[MAX_TEMPS
];
106 /* Allocate a temporary variable. */
107 static TCGv_i32
new_tmp(void)
110 if (num_temps
== MAX_TEMPS
)
113 if (GET_TCGV_I32(temps
[num_temps
]))
114 return temps
[num_temps
++];
116 tmp
= tcg_temp_new_i32();
117 temps
[num_temps
++] = tmp
;
121 /* Release a temporary variable. */
122 static void dead_tmp(TCGv tmp
)
127 if (TCGV_EQUAL(temps
[i
], tmp
))
130 /* Shuffle this temp to the last slot. */
131 while (!TCGV_EQUAL(temps
[i
], tmp
))
133 while (i
< num_temps
) {
134 temps
[i
] = temps
[i
+ 1];
140 static inline TCGv
load_cpu_offset(int offset
)
142 TCGv tmp
= new_tmp();
143 tcg_gen_ld_i32(tmp
, cpu_env
, offset
);
147 #define load_cpu_field(name) load_cpu_offset(offsetof(CPUState, name))
149 static inline void store_cpu_offset(TCGv var
, int offset
)
151 tcg_gen_st_i32(var
, cpu_env
, offset
);
155 #define store_cpu_field(var, name) \
156 store_cpu_offset(var, offsetof(CPUState, name))
158 /* Set a variable to the value of a CPU register. */
159 static void load_reg_var(DisasContext
*s
, TCGv var
, int reg
)
163 /* normaly, since we updated PC, we need only to add one insn */
165 addr
= (long)s
->pc
+ 2;
167 addr
= (long)s
->pc
+ 4;
168 tcg_gen_movi_i32(var
, addr
);
170 tcg_gen_ld_i32(var
, cpu_env
, offsetof(CPUState
, regs
[reg
]));
174 /* Create a new temporary and set it to the value of a CPU register. */
175 static inline TCGv
load_reg(DisasContext
*s
, int reg
)
177 TCGv tmp
= new_tmp();
178 load_reg_var(s
, tmp
, reg
);
182 /* Set a CPU register. The source must be a temporary and will be
184 static void store_reg(DisasContext
*s
, int reg
, TCGv var
)
187 tcg_gen_andi_i32(var
, var
, ~1);
188 s
->is_jmp
= DISAS_JUMP
;
190 tcg_gen_st_i32(var
, cpu_env
, offsetof(CPUState
, regs
[reg
]));
195 /* Basic operations. */
196 #define gen_op_movl_T0_T1() tcg_gen_mov_i32(cpu_T[0], cpu_T[1])
197 #define gen_op_movl_T0_im(im) tcg_gen_movi_i32(cpu_T[0], im)
198 #define gen_op_movl_T1_im(im) tcg_gen_movi_i32(cpu_T[1], im)
200 #define gen_op_addl_T1_im(im) tcg_gen_addi_i32(cpu_T[1], cpu_T[1], im)
201 #define gen_op_addl_T0_T1() tcg_gen_add_i32(cpu_T[0], cpu_T[0], cpu_T[1])
202 #define gen_op_subl_T0_T1() tcg_gen_sub_i32(cpu_T[0], cpu_T[0], cpu_T[1])
203 #define gen_op_rsbl_T0_T1() tcg_gen_sub_i32(cpu_T[0], cpu_T[1], cpu_T[0])
205 #define gen_op_addl_T0_T1_cc() gen_helper_add_cc(cpu_T[0], cpu_T[0], cpu_T[1])
206 #define gen_op_adcl_T0_T1_cc() gen_helper_adc_cc(cpu_T[0], cpu_T[0], cpu_T[1])
207 #define gen_op_subl_T0_T1_cc() gen_helper_sub_cc(cpu_T[0], cpu_T[0], cpu_T[1])
208 #define gen_op_sbcl_T0_T1_cc() gen_helper_sbc_cc(cpu_T[0], cpu_T[0], cpu_T[1])
209 #define gen_op_rsbl_T0_T1_cc() gen_helper_sub_cc(cpu_T[0], cpu_T[1], cpu_T[0])
210 #define gen_op_rscl_T0_T1_cc() gen_helper_sbc_cc(cpu_T[0], cpu_T[1], cpu_T[0])
212 #define gen_op_andl_T0_T1() tcg_gen_and_i32(cpu_T[0], cpu_T[0], cpu_T[1])
213 #define gen_op_xorl_T0_T1() tcg_gen_xor_i32(cpu_T[0], cpu_T[0], cpu_T[1])
214 #define gen_op_orl_T0_T1() tcg_gen_or_i32(cpu_T[0], cpu_T[0], cpu_T[1])
215 #define gen_op_notl_T0() tcg_gen_not_i32(cpu_T[0], cpu_T[0])
216 #define gen_op_notl_T1() tcg_gen_not_i32(cpu_T[1], cpu_T[1])
217 #define gen_op_logic_T0_cc() gen_logic_CC(cpu_T[0]);
218 #define gen_op_logic_T1_cc() gen_logic_CC(cpu_T[1]);
220 #define gen_op_shll_T1_im(im) tcg_gen_shli_i32(cpu_T[1], cpu_T[1], im)
221 #define gen_op_shrl_T1_im(im) tcg_gen_shri_i32(cpu_T[1], cpu_T[1], im)
223 /* Value extensions. */
224 #define gen_uxtb(var) tcg_gen_ext8u_i32(var, var)
225 #define gen_uxth(var) tcg_gen_ext16u_i32(var, var)
226 #define gen_sxtb(var) tcg_gen_ext8s_i32(var, var)
227 #define gen_sxth(var) tcg_gen_ext16s_i32(var, var)
229 #define gen_sxtb16(var) gen_helper_sxtb16(var, var)
230 #define gen_uxtb16(var) gen_helper_uxtb16(var, var)
232 #define gen_op_mul_T0_T1() tcg_gen_mul_i32(cpu_T[0], cpu_T[0], cpu_T[1])
234 #define gen_set_cpsr(var, mask) gen_helper_cpsr_write(var, tcg_const_i32(mask))
235 /* Set NZCV flags from the high 4 bits of var. */
236 #define gen_set_nzcv(var) gen_set_cpsr(var, CPSR_NZCV)
238 static void gen_exception(int excp
)
240 TCGv tmp
= new_tmp();
241 tcg_gen_movi_i32(tmp
, excp
);
242 gen_helper_exception(tmp
);
246 static void gen_smul_dual(TCGv a
, TCGv b
)
248 TCGv tmp1
= new_tmp();
249 TCGv tmp2
= new_tmp();
250 tcg_gen_ext16s_i32(tmp1
, a
);
251 tcg_gen_ext16s_i32(tmp2
, b
);
252 tcg_gen_mul_i32(tmp1
, tmp1
, tmp2
);
254 tcg_gen_sari_i32(a
, a
, 16);
255 tcg_gen_sari_i32(b
, b
, 16);
256 tcg_gen_mul_i32(b
, b
, a
);
257 tcg_gen_mov_i32(a
, tmp1
);
261 /* Byteswap each halfword. */
262 static void gen_rev16(TCGv var
)
264 TCGv tmp
= new_tmp();
265 tcg_gen_shri_i32(tmp
, var
, 8);
266 tcg_gen_andi_i32(tmp
, tmp
, 0x00ff00ff);
267 tcg_gen_shli_i32(var
, var
, 8);
268 tcg_gen_andi_i32(var
, var
, 0xff00ff00);
269 tcg_gen_or_i32(var
, var
, tmp
);
273 /* Byteswap low halfword and sign extend. */
274 static void gen_revsh(TCGv var
)
276 TCGv tmp
= new_tmp();
277 tcg_gen_shri_i32(tmp
, var
, 8);
278 tcg_gen_andi_i32(tmp
, tmp
, 0x00ff);
279 tcg_gen_shli_i32(var
, var
, 8);
280 tcg_gen_ext8s_i32(var
, var
);
281 tcg_gen_or_i32(var
, var
, tmp
);
285 /* Unsigned bitfield extract. */
286 static void gen_ubfx(TCGv var
, int shift
, uint32_t mask
)
289 tcg_gen_shri_i32(var
, var
, shift
);
290 tcg_gen_andi_i32(var
, var
, mask
);
293 /* Signed bitfield extract. */
294 static void gen_sbfx(TCGv var
, int shift
, int width
)
299 tcg_gen_sari_i32(var
, var
, shift
);
300 if (shift
+ width
< 32) {
301 signbit
= 1u << (width
- 1);
302 tcg_gen_andi_i32(var
, var
, (1u << width
) - 1);
303 tcg_gen_xori_i32(var
, var
, signbit
);
304 tcg_gen_subi_i32(var
, var
, signbit
);
308 /* Bitfield insertion. Insert val into base. Clobbers base and val. */
309 static void gen_bfi(TCGv dest
, TCGv base
, TCGv val
, int shift
, uint32_t mask
)
311 tcg_gen_andi_i32(val
, val
, mask
);
312 tcg_gen_shli_i32(val
, val
, shift
);
313 tcg_gen_andi_i32(base
, base
, ~(mask
<< shift
));
314 tcg_gen_or_i32(dest
, base
, val
);
317 /* Round the top 32 bits of a 64-bit value. */
318 static void gen_roundqd(TCGv a
, TCGv b
)
320 tcg_gen_shri_i32(a
, a
, 31);
321 tcg_gen_add_i32(a
, a
, b
);
324 /* FIXME: Most targets have native widening multiplication.
325 It would be good to use that instead of a full wide multiply. */
326 /* 32x32->64 multiply. Marks inputs as dead. */
327 static TCGv_i64
gen_mulu_i64_i32(TCGv a
, TCGv b
)
329 TCGv_i64 tmp1
= tcg_temp_new_i64();
330 TCGv_i64 tmp2
= tcg_temp_new_i64();
332 tcg_gen_extu_i32_i64(tmp1
, a
);
334 tcg_gen_extu_i32_i64(tmp2
, b
);
336 tcg_gen_mul_i64(tmp1
, tmp1
, tmp2
);
340 static TCGv_i64
gen_muls_i64_i32(TCGv a
, TCGv b
)
342 TCGv_i64 tmp1
= tcg_temp_new_i64();
343 TCGv_i64 tmp2
= tcg_temp_new_i64();
345 tcg_gen_ext_i32_i64(tmp1
, a
);
347 tcg_gen_ext_i32_i64(tmp2
, b
);
349 tcg_gen_mul_i64(tmp1
, tmp1
, tmp2
);
353 /* Unsigned 32x32->64 multiply. */
354 static void gen_op_mull_T0_T1(void)
356 TCGv_i64 tmp1
= tcg_temp_new_i64();
357 TCGv_i64 tmp2
= tcg_temp_new_i64();
359 tcg_gen_extu_i32_i64(tmp1
, cpu_T
[0]);
360 tcg_gen_extu_i32_i64(tmp2
, cpu_T
[1]);
361 tcg_gen_mul_i64(tmp1
, tmp1
, tmp2
);
362 tcg_gen_trunc_i64_i32(cpu_T
[0], tmp1
);
363 tcg_gen_shri_i64(tmp1
, tmp1
, 32);
364 tcg_gen_trunc_i64_i32(cpu_T
[1], tmp1
);
367 /* Signed 32x32->64 multiply. */
368 static void gen_imull(TCGv a
, TCGv b
)
370 TCGv_i64 tmp1
= tcg_temp_new_i64();
371 TCGv_i64 tmp2
= tcg_temp_new_i64();
373 tcg_gen_ext_i32_i64(tmp1
, a
);
374 tcg_gen_ext_i32_i64(tmp2
, b
);
375 tcg_gen_mul_i64(tmp1
, tmp1
, tmp2
);
376 tcg_gen_trunc_i64_i32(a
, tmp1
);
377 tcg_gen_shri_i64(tmp1
, tmp1
, 32);
378 tcg_gen_trunc_i64_i32(b
, tmp1
);
381 /* Swap low and high halfwords. */
382 static void gen_swap_half(TCGv var
)
384 TCGv tmp
= new_tmp();
385 tcg_gen_shri_i32(tmp
, var
, 16);
386 tcg_gen_shli_i32(var
, var
, 16);
387 tcg_gen_or_i32(var
, var
, tmp
);
391 /* Dual 16-bit add. Result placed in t0 and t1 is marked as dead.
392 tmp = (t0 ^ t1) & 0x8000;
395 t0 = (t0 + t1) ^ tmp;
398 static void gen_add16(TCGv t0
, TCGv t1
)
400 TCGv tmp
= new_tmp();
401 tcg_gen_xor_i32(tmp
, t0
, t1
);
402 tcg_gen_andi_i32(tmp
, tmp
, 0x8000);
403 tcg_gen_andi_i32(t0
, t0
, ~0x8000);
404 tcg_gen_andi_i32(t1
, t1
, ~0x8000);
405 tcg_gen_add_i32(t0
, t0
, t1
);
406 tcg_gen_xor_i32(t0
, t0
, tmp
);
411 #define gen_set_CF(var) tcg_gen_st_i32(var, cpu_env, offsetof(CPUState, CF))
413 /* Set CF to the top bit of var. */
414 static void gen_set_CF_bit31(TCGv var
)
416 TCGv tmp
= new_tmp();
417 tcg_gen_shri_i32(tmp
, var
, 31);
422 /* Set N and Z flags from var. */
423 static inline void gen_logic_CC(TCGv var
)
425 tcg_gen_st_i32(var
, cpu_env
, offsetof(CPUState
, NF
));
426 tcg_gen_st_i32(var
, cpu_env
, offsetof(CPUState
, ZF
));
430 static void gen_adc_T0_T1(void)
434 tmp
= load_cpu_field(CF
);
435 tcg_gen_add_i32(cpu_T
[0], cpu_T
[0], tmp
);
439 /* dest = T0 - T1 + CF - 1. */
440 static void gen_sub_carry(TCGv dest
, TCGv t0
, TCGv t1
)
443 tcg_gen_sub_i32(dest
, t0
, t1
);
444 tmp
= load_cpu_field(CF
);
445 tcg_gen_add_i32(dest
, dest
, tmp
);
446 tcg_gen_subi_i32(dest
, dest
, 1);
450 #define gen_sbc_T0_T1() gen_sub_carry(cpu_T[0], cpu_T[0], cpu_T[1])
451 #define gen_rsc_T0_T1() gen_sub_carry(cpu_T[0], cpu_T[1], cpu_T[0])
453 /* T0 &= ~T1. Clobbers T1. */
454 /* FIXME: Implement bic natively. */
455 static inline void tcg_gen_bic_i32(TCGv dest
, TCGv t0
, TCGv t1
)
457 TCGv tmp
= new_tmp();
458 tcg_gen_not_i32(tmp
, t1
);
459 tcg_gen_and_i32(dest
, t0
, tmp
);
462 static inline void gen_op_bicl_T0_T1(void)
468 /* FIXME: Implement this natively. */
469 #define tcg_gen_abs_i32(t0, t1) gen_helper_abs(t0, t1)
471 /* FIXME: Implement this natively. */
472 static void tcg_gen_rori_i32(TCGv t0
, TCGv t1
, int i
)
480 tcg_gen_shri_i32(tmp
, t1
, i
);
481 tcg_gen_shli_i32(t1
, t1
, 32 - i
);
482 tcg_gen_or_i32(t0
, t1
, tmp
);
486 static void shifter_out_im(TCGv var
, int shift
)
488 TCGv tmp
= new_tmp();
490 tcg_gen_andi_i32(tmp
, var
, 1);
492 tcg_gen_shri_i32(tmp
, var
, shift
);
494 tcg_gen_andi_i32(tmp
, tmp
, 1);
500 /* Shift by immediate. Includes special handling for shift == 0. */
501 static inline void gen_arm_shift_im(TCGv var
, int shiftop
, int shift
, int flags
)
507 shifter_out_im(var
, 32 - shift
);
508 tcg_gen_shli_i32(var
, var
, shift
);
514 tcg_gen_shri_i32(var
, var
, 31);
517 tcg_gen_movi_i32(var
, 0);
520 shifter_out_im(var
, shift
- 1);
521 tcg_gen_shri_i32(var
, var
, shift
);
528 shifter_out_im(var
, shift
- 1);
531 tcg_gen_sari_i32(var
, var
, shift
);
533 case 3: /* ROR/RRX */
536 shifter_out_im(var
, shift
- 1);
537 tcg_gen_rori_i32(var
, var
, shift
); break;
539 TCGv tmp
= load_cpu_field(CF
);
541 shifter_out_im(var
, 0);
542 tcg_gen_shri_i32(var
, var
, 1);
543 tcg_gen_shli_i32(tmp
, tmp
, 31);
544 tcg_gen_or_i32(var
, var
, tmp
);
550 static inline void gen_arm_shift_reg(TCGv var
, int shiftop
,
551 TCGv shift
, int flags
)
555 case 0: gen_helper_shl_cc(var
, var
, shift
); break;
556 case 1: gen_helper_shr_cc(var
, var
, shift
); break;
557 case 2: gen_helper_sar_cc(var
, var
, shift
); break;
558 case 3: gen_helper_ror_cc(var
, var
, shift
); break;
562 case 0: gen_helper_shl(var
, var
, shift
); break;
563 case 1: gen_helper_shr(var
, var
, shift
); break;
564 case 2: gen_helper_sar(var
, var
, shift
); break;
565 case 3: gen_helper_ror(var
, var
, shift
); break;
571 #define PAS_OP(pfx) \
573 case 0: gen_pas_helper(glue(pfx,add16)); break; \
574 case 1: gen_pas_helper(glue(pfx,addsubx)); break; \
575 case 2: gen_pas_helper(glue(pfx,subaddx)); break; \
576 case 3: gen_pas_helper(glue(pfx,sub16)); break; \
577 case 4: gen_pas_helper(glue(pfx,add8)); break; \
578 case 7: gen_pas_helper(glue(pfx,sub8)); break; \
580 static void gen_arm_parallel_addsub(int op1
, int op2
, TCGv a
, TCGv b
)
585 #define gen_pas_helper(name) glue(gen_helper_,name)(a, a, b, tmp)
587 tmp
= tcg_temp_new_ptr();
588 tcg_gen_addi_ptr(tmp
, cpu_env
, offsetof(CPUState
, GE
));
592 tmp
= tcg_temp_new_ptr();
593 tcg_gen_addi_ptr(tmp
, cpu_env
, offsetof(CPUState
, GE
));
596 #undef gen_pas_helper
597 #define gen_pas_helper(name) glue(gen_helper_,name)(a, a, b)
610 #undef gen_pas_helper
615 /* For unknown reasons Arm and Thumb-2 use arbitrarily different encodings. */
616 #define PAS_OP(pfx) \
618 case 0: gen_pas_helper(glue(pfx,add8)); break; \
619 case 1: gen_pas_helper(glue(pfx,add16)); break; \
620 case 2: gen_pas_helper(glue(pfx,addsubx)); break; \
621 case 4: gen_pas_helper(glue(pfx,sub8)); break; \
622 case 5: gen_pas_helper(glue(pfx,sub16)); break; \
623 case 6: gen_pas_helper(glue(pfx,subaddx)); break; \
625 static void gen_thumb2_parallel_addsub(int op1
, int op2
, TCGv a
, TCGv b
)
630 #define gen_pas_helper(name) glue(gen_helper_,name)(a, a, b, tmp)
632 tmp
= tcg_temp_new_ptr();
633 tcg_gen_addi_ptr(tmp
, cpu_env
, offsetof(CPUState
, GE
));
637 tmp
= tcg_temp_new_ptr();
638 tcg_gen_addi_ptr(tmp
, cpu_env
, offsetof(CPUState
, GE
));
641 #undef gen_pas_helper
642 #define gen_pas_helper(name) glue(gen_helper_,name)(a, a, b)
655 #undef gen_pas_helper
660 static void gen_test_cc(int cc
, int label
)
668 tmp
= load_cpu_field(ZF
);
669 tcg_gen_brcondi_i32(TCG_COND_EQ
, tmp
, 0, label
);
672 tmp
= load_cpu_field(ZF
);
673 tcg_gen_brcondi_i32(TCG_COND_NE
, tmp
, 0, label
);
676 tmp
= load_cpu_field(CF
);
677 tcg_gen_brcondi_i32(TCG_COND_NE
, tmp
, 0, label
);
680 tmp
= load_cpu_field(CF
);
681 tcg_gen_brcondi_i32(TCG_COND_EQ
, tmp
, 0, label
);
684 tmp
= load_cpu_field(NF
);
685 tcg_gen_brcondi_i32(TCG_COND_LT
, tmp
, 0, label
);
688 tmp
= load_cpu_field(NF
);
689 tcg_gen_brcondi_i32(TCG_COND_GE
, tmp
, 0, label
);
692 tmp
= load_cpu_field(VF
);
693 tcg_gen_brcondi_i32(TCG_COND_LT
, tmp
, 0, label
);
696 tmp
= load_cpu_field(VF
);
697 tcg_gen_brcondi_i32(TCG_COND_GE
, tmp
, 0, label
);
699 case 8: /* hi: C && !Z */
700 inv
= gen_new_label();
701 tmp
= load_cpu_field(CF
);
702 tcg_gen_brcondi_i32(TCG_COND_EQ
, tmp
, 0, inv
);
704 tmp
= load_cpu_field(ZF
);
705 tcg_gen_brcondi_i32(TCG_COND_NE
, tmp
, 0, label
);
708 case 9: /* ls: !C || Z */
709 tmp
= load_cpu_field(CF
);
710 tcg_gen_brcondi_i32(TCG_COND_EQ
, tmp
, 0, label
);
712 tmp
= load_cpu_field(ZF
);
713 tcg_gen_brcondi_i32(TCG_COND_EQ
, tmp
, 0, label
);
715 case 10: /* ge: N == V -> N ^ V == 0 */
716 tmp
= load_cpu_field(VF
);
717 tmp2
= load_cpu_field(NF
);
718 tcg_gen_xor_i32(tmp
, tmp
, tmp2
);
720 tcg_gen_brcondi_i32(TCG_COND_GE
, tmp
, 0, label
);
722 case 11: /* lt: N != V -> N ^ V != 0 */
723 tmp
= load_cpu_field(VF
);
724 tmp2
= load_cpu_field(NF
);
725 tcg_gen_xor_i32(tmp
, tmp
, tmp2
);
727 tcg_gen_brcondi_i32(TCG_COND_LT
, tmp
, 0, label
);
729 case 12: /* gt: !Z && N == V */
730 inv
= gen_new_label();
731 tmp
= load_cpu_field(ZF
);
732 tcg_gen_brcondi_i32(TCG_COND_EQ
, tmp
, 0, inv
);
734 tmp
= load_cpu_field(VF
);
735 tmp2
= load_cpu_field(NF
);
736 tcg_gen_xor_i32(tmp
, tmp
, tmp2
);
738 tcg_gen_brcondi_i32(TCG_COND_GE
, tmp
, 0, label
);
741 case 13: /* le: Z || N != V */
742 tmp
= load_cpu_field(ZF
);
743 tcg_gen_brcondi_i32(TCG_COND_EQ
, tmp
, 0, label
);
745 tmp
= load_cpu_field(VF
);
746 tmp2
= load_cpu_field(NF
);
747 tcg_gen_xor_i32(tmp
, tmp
, tmp2
);
749 tcg_gen_brcondi_i32(TCG_COND_LT
, tmp
, 0, label
);
752 fprintf(stderr
, "Bad condition code 0x%x\n", cc
);
758 static const uint8_t table_logic_cc
[16] = {
777 /* Set PC and Thumb state from an immediate address. */
778 static inline void gen_bx_im(DisasContext
*s
, uint32_t addr
)
782 s
->is_jmp
= DISAS_UPDATE
;
784 if (s
->thumb
!= (addr
& 1)) {
785 tcg_gen_movi_i32(tmp
, addr
& 1);
786 tcg_gen_st_i32(tmp
, cpu_env
, offsetof(CPUState
, thumb
));
788 tcg_gen_movi_i32(tmp
, addr
& ~1);
789 tcg_gen_st_i32(tmp
, cpu_env
, offsetof(CPUState
, regs
[15]));
793 /* Set PC and Thumb state from var. var is marked as dead. */
794 static inline void gen_bx(DisasContext
*s
, TCGv var
)
798 s
->is_jmp
= DISAS_UPDATE
;
800 tcg_gen_andi_i32(tmp
, var
, 1);
801 store_cpu_field(tmp
, thumb
);
802 tcg_gen_andi_i32(var
, var
, ~1);
803 store_cpu_field(var
, regs
[15]);
806 /* TODO: This should be removed. Use gen_bx instead. */
807 static inline void gen_bx_T0(DisasContext
*s
)
809 TCGv tmp
= new_tmp();
810 tcg_gen_mov_i32(tmp
, cpu_T
[0]);
814 static inline TCGv
gen_ld8s(TCGv addr
, int index
)
816 TCGv tmp
= new_tmp();
817 tcg_gen_qemu_ld8s(tmp
, addr
, index
);
820 static inline TCGv
gen_ld8u(TCGv addr
, int index
)
822 TCGv tmp
= new_tmp();
823 tcg_gen_qemu_ld8u(tmp
, addr
, index
);
826 static inline TCGv
gen_ld16s(TCGv addr
, int index
)
828 TCGv tmp
= new_tmp();
829 tcg_gen_qemu_ld16s(tmp
, addr
, index
);
832 static inline TCGv
gen_ld16u(TCGv addr
, int index
)
834 TCGv tmp
= new_tmp();
835 tcg_gen_qemu_ld16u(tmp
, addr
, index
);
838 static inline TCGv
gen_ld32(TCGv addr
, int index
)
840 TCGv tmp
= new_tmp();
841 tcg_gen_qemu_ld32u(tmp
, addr
, index
);
844 static inline void gen_st8(TCGv val
, TCGv addr
, int index
)
846 tcg_gen_qemu_st8(val
, addr
, index
);
849 static inline void gen_st16(TCGv val
, TCGv addr
, int index
)
851 tcg_gen_qemu_st16(val
, addr
, index
);
854 static inline void gen_st32(TCGv val
, TCGv addr
, int index
)
856 tcg_gen_qemu_st32(val
, addr
, index
);
860 static inline void gen_movl_T0_reg(DisasContext
*s
, int reg
)
862 load_reg_var(s
, cpu_T
[0], reg
);
865 static inline void gen_movl_T1_reg(DisasContext
*s
, int reg
)
867 load_reg_var(s
, cpu_T
[1], reg
);
870 static inline void gen_movl_T2_reg(DisasContext
*s
, int reg
)
872 load_reg_var(s
, cpu_T
[2], reg
);
875 static inline void gen_set_pc_im(uint32_t val
)
877 TCGv tmp
= new_tmp();
878 tcg_gen_movi_i32(tmp
, val
);
879 store_cpu_field(tmp
, regs
[15]);
882 static inline void gen_movl_reg_TN(DisasContext
*s
, int reg
, int t
)
887 tcg_gen_andi_i32(tmp
, cpu_T
[t
], ~1);
891 tcg_gen_st_i32(tmp
, cpu_env
, offsetof(CPUState
, regs
[reg
]));
894 s
->is_jmp
= DISAS_JUMP
;
898 static inline void gen_movl_reg_T0(DisasContext
*s
, int reg
)
900 gen_movl_reg_TN(s
, reg
, 0);
903 static inline void gen_movl_reg_T1(DisasContext
*s
, int reg
)
905 gen_movl_reg_TN(s
, reg
, 1);
908 /* Force a TB lookup after an instruction that changes the CPU state. */
909 static inline void gen_lookup_tb(DisasContext
*s
)
911 gen_op_movl_T0_im(s
->pc
);
912 gen_movl_reg_T0(s
, 15);
913 s
->is_jmp
= DISAS_UPDATE
;
916 static inline void gen_add_data_offset(DisasContext
*s
, unsigned int insn
,
919 int val
, rm
, shift
, shiftop
;
922 if (!(insn
& (1 << 25))) {
925 if (!(insn
& (1 << 23)))
928 tcg_gen_addi_i32(var
, var
, val
);
932 shift
= (insn
>> 7) & 0x1f;
933 shiftop
= (insn
>> 5) & 3;
934 offset
= load_reg(s
, rm
);
935 gen_arm_shift_im(offset
, shiftop
, shift
, 0);
936 if (!(insn
& (1 << 23)))
937 tcg_gen_sub_i32(var
, var
, offset
);
939 tcg_gen_add_i32(var
, var
, offset
);
944 static inline void gen_add_datah_offset(DisasContext
*s
, unsigned int insn
,
950 if (insn
& (1 << 22)) {
952 val
= (insn
& 0xf) | ((insn
>> 4) & 0xf0);
953 if (!(insn
& (1 << 23)))
957 tcg_gen_addi_i32(var
, var
, val
);
961 tcg_gen_addi_i32(var
, var
, extra
);
963 offset
= load_reg(s
, rm
);
964 if (!(insn
& (1 << 23)))
965 tcg_gen_sub_i32(var
, var
, offset
);
967 tcg_gen_add_i32(var
, var
, offset
);
972 #define VFP_OP2(name) \
973 static inline void gen_vfp_##name(int dp) \
976 gen_helper_vfp_##name##d(cpu_F0d, cpu_F0d, cpu_F1d, cpu_env); \
978 gen_helper_vfp_##name##s(cpu_F0s, cpu_F0s, cpu_F1s, cpu_env); \
988 static inline void gen_vfp_abs(int dp
)
991 gen_helper_vfp_absd(cpu_F0d
, cpu_F0d
);
993 gen_helper_vfp_abss(cpu_F0s
, cpu_F0s
);
996 static inline void gen_vfp_neg(int dp
)
999 gen_helper_vfp_negd(cpu_F0d
, cpu_F0d
);
1001 gen_helper_vfp_negs(cpu_F0s
, cpu_F0s
);
1004 static inline void gen_vfp_sqrt(int dp
)
1007 gen_helper_vfp_sqrtd(cpu_F0d
, cpu_F0d
, cpu_env
);
1009 gen_helper_vfp_sqrts(cpu_F0s
, cpu_F0s
, cpu_env
);
1012 static inline void gen_vfp_cmp(int dp
)
1015 gen_helper_vfp_cmpd(cpu_F0d
, cpu_F1d
, cpu_env
);
1017 gen_helper_vfp_cmps(cpu_F0s
, cpu_F1s
, cpu_env
);
1020 static inline void gen_vfp_cmpe(int dp
)
1023 gen_helper_vfp_cmped(cpu_F0d
, cpu_F1d
, cpu_env
);
1025 gen_helper_vfp_cmpes(cpu_F0s
, cpu_F1s
, cpu_env
);
1028 static inline void gen_vfp_F1_ld0(int dp
)
1031 tcg_gen_movi_i64(cpu_F1d
, 0);
1033 tcg_gen_movi_i32(cpu_F1s
, 0);
1036 static inline void gen_vfp_uito(int dp
)
1039 gen_helper_vfp_uitod(cpu_F0d
, cpu_F0s
, cpu_env
);
1041 gen_helper_vfp_uitos(cpu_F0s
, cpu_F0s
, cpu_env
);
1044 static inline void gen_vfp_sito(int dp
)
1047 gen_helper_vfp_sitod(cpu_F0d
, cpu_F0s
, cpu_env
);
1049 gen_helper_vfp_sitos(cpu_F0s
, cpu_F0s
, cpu_env
);
1052 static inline void gen_vfp_toui(int dp
)
1055 gen_helper_vfp_touid(cpu_F0s
, cpu_F0d
, cpu_env
);
1057 gen_helper_vfp_touis(cpu_F0s
, cpu_F0s
, cpu_env
);
1060 static inline void gen_vfp_touiz(int dp
)
1063 gen_helper_vfp_touizd(cpu_F0s
, cpu_F0d
, cpu_env
);
1065 gen_helper_vfp_touizs(cpu_F0s
, cpu_F0s
, cpu_env
);
1068 static inline void gen_vfp_tosi(int dp
)
1071 gen_helper_vfp_tosid(cpu_F0s
, cpu_F0d
, cpu_env
);
1073 gen_helper_vfp_tosis(cpu_F0s
, cpu_F0s
, cpu_env
);
1076 static inline void gen_vfp_tosiz(int dp
)
1079 gen_helper_vfp_tosizd(cpu_F0s
, cpu_F0d
, cpu_env
);
1081 gen_helper_vfp_tosizs(cpu_F0s
, cpu_F0s
, cpu_env
);
1084 #define VFP_GEN_FIX(name) \
1085 static inline void gen_vfp_##name(int dp, int shift) \
1088 gen_helper_vfp_##name##d(cpu_F0d, cpu_F0d, tcg_const_i32(shift), cpu_env);\
1090 gen_helper_vfp_##name##s(cpu_F0s, cpu_F0s, tcg_const_i32(shift), cpu_env);\
1102 static inline void gen_vfp_ld(DisasContext
*s
, int dp
)
1105 tcg_gen_qemu_ld64(cpu_F0d
, cpu_T
[1], IS_USER(s
));
1107 tcg_gen_qemu_ld32u(cpu_F0s
, cpu_T
[1], IS_USER(s
));
1110 static inline void gen_vfp_st(DisasContext
*s
, int dp
)
1113 tcg_gen_qemu_st64(cpu_F0d
, cpu_T
[1], IS_USER(s
));
1115 tcg_gen_qemu_st32(cpu_F0s
, cpu_T
[1], IS_USER(s
));
1119 vfp_reg_offset (int dp
, int reg
)
1122 return offsetof(CPUARMState
, vfp
.regs
[reg
]);
1124 return offsetof(CPUARMState
, vfp
.regs
[reg
>> 1])
1125 + offsetof(CPU_DoubleU
, l
.upper
);
1127 return offsetof(CPUARMState
, vfp
.regs
[reg
>> 1])
1128 + offsetof(CPU_DoubleU
, l
.lower
);
1132 /* Return the offset of a 32-bit piece of a NEON register.
1133 zero is the least significant end of the register. */
1135 neon_reg_offset (int reg
, int n
)
1139 return vfp_reg_offset(0, sreg
);
1142 /* FIXME: Remove these. */
1143 #define neon_T0 cpu_T[0]
1144 #define neon_T1 cpu_T[1]
1145 #define NEON_GET_REG(T, reg, n) \
1146 tcg_gen_ld_i32(neon_##T, cpu_env, neon_reg_offset(reg, n))
1147 #define NEON_SET_REG(T, reg, n) \
1148 tcg_gen_st_i32(neon_##T, cpu_env, neon_reg_offset(reg, n))
1150 static TCGv
neon_load_reg(int reg
, int pass
)
1152 TCGv tmp
= new_tmp();
1153 tcg_gen_ld_i32(tmp
, cpu_env
, neon_reg_offset(reg
, pass
));
1157 static void neon_store_reg(int reg
, int pass
, TCGv var
)
1159 tcg_gen_st_i32(var
, cpu_env
, neon_reg_offset(reg
, pass
));
1163 static inline void neon_load_reg64(TCGv_i64 var
, int reg
)
1165 tcg_gen_ld_i64(var
, cpu_env
, vfp_reg_offset(1, reg
));
1168 static inline void neon_store_reg64(TCGv_i64 var
, int reg
)
1170 tcg_gen_st_i64(var
, cpu_env
, vfp_reg_offset(1, reg
));
1173 #define tcg_gen_ld_f32 tcg_gen_ld_i32
1174 #define tcg_gen_ld_f64 tcg_gen_ld_i64
1175 #define tcg_gen_st_f32 tcg_gen_st_i32
1176 #define tcg_gen_st_f64 tcg_gen_st_i64
1178 static inline void gen_mov_F0_vreg(int dp
, int reg
)
1181 tcg_gen_ld_f64(cpu_F0d
, cpu_env
, vfp_reg_offset(dp
, reg
));
1183 tcg_gen_ld_f32(cpu_F0s
, cpu_env
, vfp_reg_offset(dp
, reg
));
1186 static inline void gen_mov_F1_vreg(int dp
, int reg
)
1189 tcg_gen_ld_f64(cpu_F1d
, cpu_env
, vfp_reg_offset(dp
, reg
));
1191 tcg_gen_ld_f32(cpu_F1s
, cpu_env
, vfp_reg_offset(dp
, reg
));
1194 static inline void gen_mov_vreg_F0(int dp
, int reg
)
1197 tcg_gen_st_f64(cpu_F0d
, cpu_env
, vfp_reg_offset(dp
, reg
));
1199 tcg_gen_st_f32(cpu_F0s
, cpu_env
, vfp_reg_offset(dp
, reg
));
1202 #define ARM_CP_RW_BIT (1 << 20)
1204 static inline void iwmmxt_load_reg(TCGv_i64 var
, int reg
)
1206 tcg_gen_ld_i64(var
, cpu_env
, offsetof(CPUState
, iwmmxt
.regs
[reg
]));
1209 static inline void iwmmxt_store_reg(TCGv_i64 var
, int reg
)
1211 tcg_gen_st_i64(var
, cpu_env
, offsetof(CPUState
, iwmmxt
.regs
[reg
]));
1214 static inline void gen_op_iwmmxt_movl_wCx_T0(int reg
)
1216 tcg_gen_st_i32(cpu_T
[0], cpu_env
, offsetof(CPUState
, iwmmxt
.cregs
[reg
]));
1219 static inline void gen_op_iwmmxt_movl_T0_wCx(int reg
)
1221 tcg_gen_ld_i32(cpu_T
[0], cpu_env
, offsetof(CPUState
, iwmmxt
.cregs
[reg
]));
1224 static inline void gen_op_iwmmxt_movl_T1_wCx(int reg
)
1226 tcg_gen_ld_i32(cpu_T
[1], cpu_env
, offsetof(CPUState
, iwmmxt
.cregs
[reg
]));
1229 static inline void gen_op_iwmmxt_movq_wRn_M0(int rn
)
1231 iwmmxt_store_reg(cpu_M0
, rn
);
1234 static inline void gen_op_iwmmxt_movq_M0_wRn(int rn
)
1236 iwmmxt_load_reg(cpu_M0
, rn
);
1239 static inline void gen_op_iwmmxt_orq_M0_wRn(int rn
)
1241 iwmmxt_load_reg(cpu_V1
, rn
);
1242 tcg_gen_or_i64(cpu_M0
, cpu_M0
, cpu_V1
);
1245 static inline void gen_op_iwmmxt_andq_M0_wRn(int rn
)
1247 iwmmxt_load_reg(cpu_V1
, rn
);
1248 tcg_gen_and_i64(cpu_M0
, cpu_M0
, cpu_V1
);
1251 static inline void gen_op_iwmmxt_xorq_M0_wRn(int rn
)
1253 iwmmxt_load_reg(cpu_V1
, rn
);
1254 tcg_gen_xor_i64(cpu_M0
, cpu_M0
, cpu_V1
);
1257 #define IWMMXT_OP(name) \
1258 static inline void gen_op_iwmmxt_##name##_M0_wRn(int rn) \
1260 iwmmxt_load_reg(cpu_V1, rn); \
1261 gen_helper_iwmmxt_##name(cpu_M0, cpu_M0, cpu_V1); \
1264 #define IWMMXT_OP_ENV(name) \
1265 static inline void gen_op_iwmmxt_##name##_M0_wRn(int rn) \
1267 iwmmxt_load_reg(cpu_V1, rn); \
1268 gen_helper_iwmmxt_##name(cpu_M0, cpu_env, cpu_M0, cpu_V1); \
1271 #define IWMMXT_OP_ENV_SIZE(name) \
1272 IWMMXT_OP_ENV(name##b) \
1273 IWMMXT_OP_ENV(name##w) \
1274 IWMMXT_OP_ENV(name##l)
1276 #define IWMMXT_OP_ENV1(name) \
1277 static inline void gen_op_iwmmxt_##name##_M0(void) \
1279 gen_helper_iwmmxt_##name(cpu_M0, cpu_env, cpu_M0); \
1293 IWMMXT_OP_ENV_SIZE(unpackl
)
1294 IWMMXT_OP_ENV_SIZE(unpackh
)
1296 IWMMXT_OP_ENV1(unpacklub
)
1297 IWMMXT_OP_ENV1(unpackluw
)
1298 IWMMXT_OP_ENV1(unpacklul
)
1299 IWMMXT_OP_ENV1(unpackhub
)
1300 IWMMXT_OP_ENV1(unpackhuw
)
1301 IWMMXT_OP_ENV1(unpackhul
)
1302 IWMMXT_OP_ENV1(unpacklsb
)
1303 IWMMXT_OP_ENV1(unpacklsw
)
1304 IWMMXT_OP_ENV1(unpacklsl
)
1305 IWMMXT_OP_ENV1(unpackhsb
)
1306 IWMMXT_OP_ENV1(unpackhsw
)
1307 IWMMXT_OP_ENV1(unpackhsl
)
1309 IWMMXT_OP_ENV_SIZE(cmpeq
)
1310 IWMMXT_OP_ENV_SIZE(cmpgtu
)
1311 IWMMXT_OP_ENV_SIZE(cmpgts
)
1313 IWMMXT_OP_ENV_SIZE(mins
)
1314 IWMMXT_OP_ENV_SIZE(minu
)
1315 IWMMXT_OP_ENV_SIZE(maxs
)
1316 IWMMXT_OP_ENV_SIZE(maxu
)
1318 IWMMXT_OP_ENV_SIZE(subn
)
1319 IWMMXT_OP_ENV_SIZE(addn
)
1320 IWMMXT_OP_ENV_SIZE(subu
)
1321 IWMMXT_OP_ENV_SIZE(addu
)
1322 IWMMXT_OP_ENV_SIZE(subs
)
1323 IWMMXT_OP_ENV_SIZE(adds
)
1325 IWMMXT_OP_ENV(avgb0
)
1326 IWMMXT_OP_ENV(avgb1
)
1327 IWMMXT_OP_ENV(avgw0
)
1328 IWMMXT_OP_ENV(avgw1
)
1332 IWMMXT_OP_ENV(packuw
)
1333 IWMMXT_OP_ENV(packul
)
1334 IWMMXT_OP_ENV(packuq
)
1335 IWMMXT_OP_ENV(packsw
)
1336 IWMMXT_OP_ENV(packsl
)
1337 IWMMXT_OP_ENV(packsq
)
1339 static inline void gen_op_iwmmxt_muladdsl_M0_T0_T1(void)
1341 gen_helper_iwmmxt_muladdsl(cpu_M0
, cpu_M0
, cpu_T
[0], cpu_T
[1]);
1344 static inline void gen_op_iwmmxt_muladdsw_M0_T0_T1(void)
1346 gen_helper_iwmmxt_muladdsw(cpu_M0
, cpu_M0
, cpu_T
[0], cpu_T
[1]);
1349 static inline void gen_op_iwmmxt_muladdswl_M0_T0_T1(void)
1351 gen_helper_iwmmxt_muladdswl(cpu_M0
, cpu_M0
, cpu_T
[0], cpu_T
[1]);
1354 static inline void gen_op_iwmmxt_align_M0_T0_wRn(int rn
)
1356 iwmmxt_load_reg(cpu_V1
, rn
);
1357 gen_helper_iwmmxt_align(cpu_M0
, cpu_M0
, cpu_V1
, cpu_T
[0]);
1360 static inline void gen_op_iwmmxt_insr_M0_T0_T1(int shift
)
1362 TCGv tmp
= tcg_const_i32(shift
);
1363 gen_helper_iwmmxt_insr(cpu_M0
, cpu_M0
, cpu_T
[0], cpu_T
[1], tmp
);
1366 static inline void gen_op_iwmmxt_extrsb_T0_M0(int shift
)
1368 tcg_gen_shri_i64(cpu_M0
, cpu_M0
, shift
);
1369 tcg_gen_trunc_i64_i32(cpu_T
[0], cpu_M0
);
1370 tcg_gen_ext8s_i32(cpu_T
[0], cpu_T
[0]);
1373 static inline void gen_op_iwmmxt_extrsw_T0_M0(int shift
)
1375 tcg_gen_shri_i64(cpu_M0
, cpu_M0
, shift
);
1376 tcg_gen_trunc_i64_i32(cpu_T
[0], cpu_M0
);
1377 tcg_gen_ext16s_i32(cpu_T
[0], cpu_T
[0]);
1380 static inline void gen_op_iwmmxt_extru_T0_M0(int shift
, uint32_t mask
)
1382 tcg_gen_shri_i64(cpu_M0
, cpu_M0
, shift
);
1383 tcg_gen_trunc_i64_i32(cpu_T
[0], cpu_M0
);
1385 tcg_gen_andi_i32(cpu_T
[0], cpu_T
[0], mask
);
1388 static void gen_op_iwmmxt_set_mup(void)
1391 tmp
= load_cpu_field(iwmmxt
.cregs
[ARM_IWMMXT_wCon
]);
1392 tcg_gen_ori_i32(tmp
, tmp
, 2);
1393 store_cpu_field(tmp
, iwmmxt
.cregs
[ARM_IWMMXT_wCon
]);
1396 static void gen_op_iwmmxt_set_cup(void)
1399 tmp
= load_cpu_field(iwmmxt
.cregs
[ARM_IWMMXT_wCon
]);
1400 tcg_gen_ori_i32(tmp
, tmp
, 1);
1401 store_cpu_field(tmp
, iwmmxt
.cregs
[ARM_IWMMXT_wCon
]);
1404 static void gen_op_iwmmxt_setpsr_nz(void)
1406 TCGv tmp
= new_tmp();
1407 gen_helper_iwmmxt_setpsr_nz(tmp
, cpu_M0
);
1408 store_cpu_field(tmp
, iwmmxt
.cregs
[ARM_IWMMXT_wCASF
]);
1411 static inline void gen_op_iwmmxt_addl_M0_wRn(int rn
)
1413 iwmmxt_load_reg(cpu_V1
, rn
);
1414 tcg_gen_ext32u_i64(cpu_V1
, cpu_V1
);
1415 tcg_gen_add_i64(cpu_M0
, cpu_M0
, cpu_V1
);
1419 static void gen_iwmmxt_movl_T0_T1_wRn(int rn
)
1421 iwmmxt_load_reg(cpu_V0
, rn
);
1422 tcg_gen_trunc_i64_i32(cpu_T
[0], cpu_V0
);
1423 tcg_gen_shri_i64(cpu_V0
, cpu_V0
, 32);
1424 tcg_gen_trunc_i64_i32(cpu_T
[1], cpu_V0
);
1427 static void gen_iwmmxt_movl_wRn_T0_T1(int rn
)
1429 tcg_gen_concat_i32_i64(cpu_V0
, cpu_T
[0], cpu_T
[1]);
1430 iwmmxt_store_reg(cpu_V0
, rn
);
1433 static inline int gen_iwmmxt_address(DisasContext
*s
, uint32_t insn
)
1438 rd
= (insn
>> 16) & 0xf;
1439 gen_movl_T1_reg(s
, rd
);
1441 offset
= (insn
& 0xff) << ((insn
>> 7) & 2);
1442 if (insn
& (1 << 24)) {
1444 if (insn
& (1 << 23))
1445 gen_op_addl_T1_im(offset
);
1447 gen_op_addl_T1_im(-offset
);
1449 if (insn
& (1 << 21))
1450 gen_movl_reg_T1(s
, rd
);
1451 } else if (insn
& (1 << 21)) {
1453 if (insn
& (1 << 23))
1454 gen_op_movl_T0_im(offset
);
1456 gen_op_movl_T0_im(- offset
);
1457 gen_op_addl_T0_T1();
1458 gen_movl_reg_T0(s
, rd
);
1459 } else if (!(insn
& (1 << 23)))
1464 static inline int gen_iwmmxt_shift(uint32_t insn
, uint32_t mask
)
1466 int rd
= (insn
>> 0) & 0xf;
1468 if (insn
& (1 << 8))
1469 if (rd
< ARM_IWMMXT_wCGR0
|| rd
> ARM_IWMMXT_wCGR3
)
1472 gen_op_iwmmxt_movl_T0_wCx(rd
);
1474 gen_iwmmxt_movl_T0_T1_wRn(rd
);
1476 gen_op_movl_T1_im(mask
);
1477 gen_op_andl_T0_T1();
1481 /* Disassemble an iwMMXt instruction. Returns nonzero if an error occured
1482 (ie. an undefined instruction). */
1483 static int disas_iwmmxt_insn(CPUState
*env
, DisasContext
*s
, uint32_t insn
)
1486 int rdhi
, rdlo
, rd0
, rd1
, i
;
1489 if ((insn
& 0x0e000e00) == 0x0c000000) {
1490 if ((insn
& 0x0fe00ff0) == 0x0c400000) {
1492 rdlo
= (insn
>> 12) & 0xf;
1493 rdhi
= (insn
>> 16) & 0xf;
1494 if (insn
& ARM_CP_RW_BIT
) { /* TMRRC */
1495 gen_iwmmxt_movl_T0_T1_wRn(wrd
);
1496 gen_movl_reg_T0(s
, rdlo
);
1497 gen_movl_reg_T1(s
, rdhi
);
1498 } else { /* TMCRR */
1499 gen_movl_T0_reg(s
, rdlo
);
1500 gen_movl_T1_reg(s
, rdhi
);
1501 gen_iwmmxt_movl_wRn_T0_T1(wrd
);
1502 gen_op_iwmmxt_set_mup();
1507 wrd
= (insn
>> 12) & 0xf;
1508 if (gen_iwmmxt_address(s
, insn
))
1510 if (insn
& ARM_CP_RW_BIT
) {
1511 if ((insn
>> 28) == 0xf) { /* WLDRW wCx */
1512 tmp
= gen_ld32(cpu_T
[1], IS_USER(s
));
1513 tcg_gen_mov_i32(cpu_T
[0], tmp
);
1515 gen_op_iwmmxt_movl_wCx_T0(wrd
);
1518 if (insn
& (1 << 8)) {
1519 if (insn
& (1 << 22)) { /* WLDRD */
1520 tcg_gen_qemu_ld64(cpu_M0
, cpu_T
[1], IS_USER(s
));
1522 } else { /* WLDRW wRd */
1523 tmp
= gen_ld32(cpu_T
[1], IS_USER(s
));
1526 if (insn
& (1 << 22)) { /* WLDRH */
1527 tmp
= gen_ld16u(cpu_T
[1], IS_USER(s
));
1528 } else { /* WLDRB */
1529 tmp
= gen_ld8u(cpu_T
[1], IS_USER(s
));
1533 tcg_gen_extu_i32_i64(cpu_M0
, tmp
);
1536 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1539 if ((insn
>> 28) == 0xf) { /* WSTRW wCx */
1540 gen_op_iwmmxt_movl_T0_wCx(wrd
);
1542 tcg_gen_mov_i32(tmp
, cpu_T
[0]);
1543 gen_st32(tmp
, cpu_T
[1], IS_USER(s
));
1545 gen_op_iwmmxt_movq_M0_wRn(wrd
);
1547 if (insn
& (1 << 8)) {
1548 if (insn
& (1 << 22)) { /* WSTRD */
1550 tcg_gen_qemu_st64(cpu_M0
, cpu_T
[1], IS_USER(s
));
1551 } else { /* WSTRW wRd */
1552 tcg_gen_trunc_i64_i32(tmp
, cpu_M0
);
1553 gen_st32(tmp
, cpu_T
[1], IS_USER(s
));
1556 if (insn
& (1 << 22)) { /* WSTRH */
1557 tcg_gen_trunc_i64_i32(tmp
, cpu_M0
);
1558 gen_st16(tmp
, cpu_T
[1], IS_USER(s
));
1559 } else { /* WSTRB */
1560 tcg_gen_trunc_i64_i32(tmp
, cpu_M0
);
1561 gen_st8(tmp
, cpu_T
[1], IS_USER(s
));
1569 if ((insn
& 0x0f000000) != 0x0e000000)
1572 switch (((insn
>> 12) & 0xf00) | ((insn
>> 4) & 0xff)) {
1573 case 0x000: /* WOR */
1574 wrd
= (insn
>> 12) & 0xf;
1575 rd0
= (insn
>> 0) & 0xf;
1576 rd1
= (insn
>> 16) & 0xf;
1577 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1578 gen_op_iwmmxt_orq_M0_wRn(rd1
);
1579 gen_op_iwmmxt_setpsr_nz();
1580 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1581 gen_op_iwmmxt_set_mup();
1582 gen_op_iwmmxt_set_cup();
1584 case 0x011: /* TMCR */
1587 rd
= (insn
>> 12) & 0xf;
1588 wrd
= (insn
>> 16) & 0xf;
1590 case ARM_IWMMXT_wCID
:
1591 case ARM_IWMMXT_wCASF
:
1593 case ARM_IWMMXT_wCon
:
1594 gen_op_iwmmxt_set_cup();
1596 case ARM_IWMMXT_wCSSF
:
1597 gen_op_iwmmxt_movl_T0_wCx(wrd
);
1598 gen_movl_T1_reg(s
, rd
);
1599 gen_op_bicl_T0_T1();
1600 gen_op_iwmmxt_movl_wCx_T0(wrd
);
1602 case ARM_IWMMXT_wCGR0
:
1603 case ARM_IWMMXT_wCGR1
:
1604 case ARM_IWMMXT_wCGR2
:
1605 case ARM_IWMMXT_wCGR3
:
1606 gen_op_iwmmxt_set_cup();
1607 gen_movl_reg_T0(s
, rd
);
1608 gen_op_iwmmxt_movl_wCx_T0(wrd
);
1614 case 0x100: /* WXOR */
1615 wrd
= (insn
>> 12) & 0xf;
1616 rd0
= (insn
>> 0) & 0xf;
1617 rd1
= (insn
>> 16) & 0xf;
1618 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1619 gen_op_iwmmxt_xorq_M0_wRn(rd1
);
1620 gen_op_iwmmxt_setpsr_nz();
1621 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1622 gen_op_iwmmxt_set_mup();
1623 gen_op_iwmmxt_set_cup();
1625 case 0x111: /* TMRC */
1628 rd
= (insn
>> 12) & 0xf;
1629 wrd
= (insn
>> 16) & 0xf;
1630 gen_op_iwmmxt_movl_T0_wCx(wrd
);
1631 gen_movl_reg_T0(s
, rd
);
1633 case 0x300: /* WANDN */
1634 wrd
= (insn
>> 12) & 0xf;
1635 rd0
= (insn
>> 0) & 0xf;
1636 rd1
= (insn
>> 16) & 0xf;
1637 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1638 tcg_gen_neg_i64(cpu_M0
, cpu_M0
);
1639 gen_op_iwmmxt_andq_M0_wRn(rd1
);
1640 gen_op_iwmmxt_setpsr_nz();
1641 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1642 gen_op_iwmmxt_set_mup();
1643 gen_op_iwmmxt_set_cup();
1645 case 0x200: /* WAND */
1646 wrd
= (insn
>> 12) & 0xf;
1647 rd0
= (insn
>> 0) & 0xf;
1648 rd1
= (insn
>> 16) & 0xf;
1649 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1650 gen_op_iwmmxt_andq_M0_wRn(rd1
);
1651 gen_op_iwmmxt_setpsr_nz();
1652 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1653 gen_op_iwmmxt_set_mup();
1654 gen_op_iwmmxt_set_cup();
1656 case 0x810: case 0xa10: /* WMADD */
1657 wrd
= (insn
>> 12) & 0xf;
1658 rd0
= (insn
>> 0) & 0xf;
1659 rd1
= (insn
>> 16) & 0xf;
1660 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1661 if (insn
& (1 << 21))
1662 gen_op_iwmmxt_maddsq_M0_wRn(rd1
);
1664 gen_op_iwmmxt_madduq_M0_wRn(rd1
);
1665 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1666 gen_op_iwmmxt_set_mup();
1668 case 0x10e: case 0x50e: case 0x90e: case 0xd0e: /* WUNPCKIL */
1669 wrd
= (insn
>> 12) & 0xf;
1670 rd0
= (insn
>> 16) & 0xf;
1671 rd1
= (insn
>> 0) & 0xf;
1672 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1673 switch ((insn
>> 22) & 3) {
1675 gen_op_iwmmxt_unpacklb_M0_wRn(rd1
);
1678 gen_op_iwmmxt_unpacklw_M0_wRn(rd1
);
1681 gen_op_iwmmxt_unpackll_M0_wRn(rd1
);
1686 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1687 gen_op_iwmmxt_set_mup();
1688 gen_op_iwmmxt_set_cup();
1690 case 0x10c: case 0x50c: case 0x90c: case 0xd0c: /* WUNPCKIH */
1691 wrd
= (insn
>> 12) & 0xf;
1692 rd0
= (insn
>> 16) & 0xf;
1693 rd1
= (insn
>> 0) & 0xf;
1694 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1695 switch ((insn
>> 22) & 3) {
1697 gen_op_iwmmxt_unpackhb_M0_wRn(rd1
);
1700 gen_op_iwmmxt_unpackhw_M0_wRn(rd1
);
1703 gen_op_iwmmxt_unpackhl_M0_wRn(rd1
);
1708 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1709 gen_op_iwmmxt_set_mup();
1710 gen_op_iwmmxt_set_cup();
1712 case 0x012: case 0x112: case 0x412: case 0x512: /* WSAD */
1713 wrd
= (insn
>> 12) & 0xf;
1714 rd0
= (insn
>> 16) & 0xf;
1715 rd1
= (insn
>> 0) & 0xf;
1716 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1717 if (insn
& (1 << 22))
1718 gen_op_iwmmxt_sadw_M0_wRn(rd1
);
1720 gen_op_iwmmxt_sadb_M0_wRn(rd1
);
1721 if (!(insn
& (1 << 20)))
1722 gen_op_iwmmxt_addl_M0_wRn(wrd
);
1723 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1724 gen_op_iwmmxt_set_mup();
1726 case 0x010: case 0x110: case 0x210: case 0x310: /* WMUL */
1727 wrd
= (insn
>> 12) & 0xf;
1728 rd0
= (insn
>> 16) & 0xf;
1729 rd1
= (insn
>> 0) & 0xf;
1730 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1731 if (insn
& (1 << 21)) {
1732 if (insn
& (1 << 20))
1733 gen_op_iwmmxt_mulshw_M0_wRn(rd1
);
1735 gen_op_iwmmxt_mulslw_M0_wRn(rd1
);
1737 if (insn
& (1 << 20))
1738 gen_op_iwmmxt_muluhw_M0_wRn(rd1
);
1740 gen_op_iwmmxt_mululw_M0_wRn(rd1
);
1742 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1743 gen_op_iwmmxt_set_mup();
1745 case 0x410: case 0x510: case 0x610: case 0x710: /* WMAC */
1746 wrd
= (insn
>> 12) & 0xf;
1747 rd0
= (insn
>> 16) & 0xf;
1748 rd1
= (insn
>> 0) & 0xf;
1749 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1750 if (insn
& (1 << 21))
1751 gen_op_iwmmxt_macsw_M0_wRn(rd1
);
1753 gen_op_iwmmxt_macuw_M0_wRn(rd1
);
1754 if (!(insn
& (1 << 20))) {
1755 iwmmxt_load_reg(cpu_V1
, wrd
);
1756 tcg_gen_add_i64(cpu_M0
, cpu_M0
, cpu_V1
);
1758 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1759 gen_op_iwmmxt_set_mup();
1761 case 0x006: case 0x406: case 0x806: case 0xc06: /* WCMPEQ */
1762 wrd
= (insn
>> 12) & 0xf;
1763 rd0
= (insn
>> 16) & 0xf;
1764 rd1
= (insn
>> 0) & 0xf;
1765 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1766 switch ((insn
>> 22) & 3) {
1768 gen_op_iwmmxt_cmpeqb_M0_wRn(rd1
);
1771 gen_op_iwmmxt_cmpeqw_M0_wRn(rd1
);
1774 gen_op_iwmmxt_cmpeql_M0_wRn(rd1
);
1779 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1780 gen_op_iwmmxt_set_mup();
1781 gen_op_iwmmxt_set_cup();
1783 case 0x800: case 0x900: case 0xc00: case 0xd00: /* WAVG2 */
1784 wrd
= (insn
>> 12) & 0xf;
1785 rd0
= (insn
>> 16) & 0xf;
1786 rd1
= (insn
>> 0) & 0xf;
1787 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1788 if (insn
& (1 << 22)) {
1789 if (insn
& (1 << 20))
1790 gen_op_iwmmxt_avgw1_M0_wRn(rd1
);
1792 gen_op_iwmmxt_avgw0_M0_wRn(rd1
);
1794 if (insn
& (1 << 20))
1795 gen_op_iwmmxt_avgb1_M0_wRn(rd1
);
1797 gen_op_iwmmxt_avgb0_M0_wRn(rd1
);
1799 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1800 gen_op_iwmmxt_set_mup();
1801 gen_op_iwmmxt_set_cup();
1803 case 0x802: case 0x902: case 0xa02: case 0xb02: /* WALIGNR */
1804 wrd
= (insn
>> 12) & 0xf;
1805 rd0
= (insn
>> 16) & 0xf;
1806 rd1
= (insn
>> 0) & 0xf;
1807 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1808 gen_op_iwmmxt_movl_T0_wCx(ARM_IWMMXT_wCGR0
+ ((insn
>> 20) & 3));
1809 gen_op_movl_T1_im(7);
1810 gen_op_andl_T0_T1();
1811 gen_op_iwmmxt_align_M0_T0_wRn(rd1
);
1812 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1813 gen_op_iwmmxt_set_mup();
1815 case 0x601: case 0x605: case 0x609: case 0x60d: /* TINSR */
1816 rd
= (insn
>> 12) & 0xf;
1817 wrd
= (insn
>> 16) & 0xf;
1818 gen_movl_T0_reg(s
, rd
);
1819 gen_op_iwmmxt_movq_M0_wRn(wrd
);
1820 switch ((insn
>> 6) & 3) {
1822 gen_op_movl_T1_im(0xff);
1823 gen_op_iwmmxt_insr_M0_T0_T1((insn
& 7) << 3);
1826 gen_op_movl_T1_im(0xffff);
1827 gen_op_iwmmxt_insr_M0_T0_T1((insn
& 3) << 4);
1830 gen_op_movl_T1_im(0xffffffff);
1831 gen_op_iwmmxt_insr_M0_T0_T1((insn
& 1) << 5);
1836 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1837 gen_op_iwmmxt_set_mup();
1839 case 0x107: case 0x507: case 0x907: case 0xd07: /* TEXTRM */
1840 rd
= (insn
>> 12) & 0xf;
1841 wrd
= (insn
>> 16) & 0xf;
1844 gen_op_iwmmxt_movq_M0_wRn(wrd
);
1845 switch ((insn
>> 22) & 3) {
1848 gen_op_iwmmxt_extrsb_T0_M0((insn
& 7) << 3);
1850 gen_op_iwmmxt_extru_T0_M0((insn
& 7) << 3, 0xff);
1855 gen_op_iwmmxt_extrsw_T0_M0((insn
& 3) << 4);
1857 gen_op_iwmmxt_extru_T0_M0((insn
& 3) << 4, 0xffff);
1861 gen_op_iwmmxt_extru_T0_M0((insn
& 1) << 5, ~0u);
1866 gen_movl_reg_T0(s
, rd
);
1868 case 0x117: case 0x517: case 0x917: case 0xd17: /* TEXTRC */
1869 if ((insn
& 0x000ff008) != 0x0003f000)
1871 gen_op_iwmmxt_movl_T1_wCx(ARM_IWMMXT_wCASF
);
1872 switch ((insn
>> 22) & 3) {
1874 gen_op_shrl_T1_im(((insn
& 7) << 2) + 0);
1877 gen_op_shrl_T1_im(((insn
& 3) << 3) + 4);
1880 gen_op_shrl_T1_im(((insn
& 1) << 4) + 12);
1885 gen_op_shll_T1_im(28);
1886 gen_set_nzcv(cpu_T
[1]);
1888 case 0x401: case 0x405: case 0x409: case 0x40d: /* TBCST */
1889 rd
= (insn
>> 12) & 0xf;
1890 wrd
= (insn
>> 16) & 0xf;
1891 gen_movl_T0_reg(s
, rd
);
1892 switch ((insn
>> 6) & 3) {
1894 gen_helper_iwmmxt_bcstb(cpu_M0
, cpu_T
[0]);
1897 gen_helper_iwmmxt_bcstw(cpu_M0
, cpu_T
[0]);
1900 gen_helper_iwmmxt_bcstl(cpu_M0
, cpu_T
[0]);
1905 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1906 gen_op_iwmmxt_set_mup();
1908 case 0x113: case 0x513: case 0x913: case 0xd13: /* TANDC */
1909 if ((insn
& 0x000ff00f) != 0x0003f000)
1911 gen_op_iwmmxt_movl_T1_wCx(ARM_IWMMXT_wCASF
);
1912 switch ((insn
>> 22) & 3) {
1914 for (i
= 0; i
< 7; i
++) {
1915 gen_op_shll_T1_im(4);
1916 gen_op_andl_T0_T1();
1920 for (i
= 0; i
< 3; i
++) {
1921 gen_op_shll_T1_im(8);
1922 gen_op_andl_T0_T1();
1926 gen_op_shll_T1_im(16);
1927 gen_op_andl_T0_T1();
1932 gen_set_nzcv(cpu_T
[0]);
1934 case 0x01c: case 0x41c: case 0x81c: case 0xc1c: /* WACC */
1935 wrd
= (insn
>> 12) & 0xf;
1936 rd0
= (insn
>> 16) & 0xf;
1937 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1938 switch ((insn
>> 22) & 3) {
1940 gen_helper_iwmmxt_addcb(cpu_M0
, cpu_M0
);
1943 gen_helper_iwmmxt_addcw(cpu_M0
, cpu_M0
);
1946 gen_helper_iwmmxt_addcl(cpu_M0
, cpu_M0
);
1951 gen_op_iwmmxt_movq_wRn_M0(wrd
);
1952 gen_op_iwmmxt_set_mup();
1954 case 0x115: case 0x515: case 0x915: case 0xd15: /* TORC */
1955 if ((insn
& 0x000ff00f) != 0x0003f000)
1957 gen_op_iwmmxt_movl_T1_wCx(ARM_IWMMXT_wCASF
);
1958 switch ((insn
>> 22) & 3) {
1960 for (i
= 0; i
< 7; i
++) {
1961 gen_op_shll_T1_im(4);
1966 for (i
= 0; i
< 3; i
++) {
1967 gen_op_shll_T1_im(8);
1972 gen_op_shll_T1_im(16);
1978 gen_set_nzcv(cpu_T
[0]);
1980 case 0x103: case 0x503: case 0x903: case 0xd03: /* TMOVMSK */
1981 rd
= (insn
>> 12) & 0xf;
1982 rd0
= (insn
>> 16) & 0xf;
1983 if ((insn
& 0xf) != 0)
1985 gen_op_iwmmxt_movq_M0_wRn(rd0
);
1986 switch ((insn
>> 22) & 3) {
1988 gen_helper_iwmmxt_msbb(cpu_T
[0], cpu_M0
);
1991 gen_helper_iwmmxt_msbw(cpu_T
[0], cpu_M0
);
1994 gen_helper_iwmmxt_msbl(cpu_T
[0], cpu_M0
);
1999 gen_movl_reg_T0(s
, rd
);
2001 case 0x106: case 0x306: case 0x506: case 0x706: /* WCMPGT */
2002 case 0x906: case 0xb06: case 0xd06: case 0xf06:
2003 wrd
= (insn
>> 12) & 0xf;
2004 rd0
= (insn
>> 16) & 0xf;
2005 rd1
= (insn
>> 0) & 0xf;
2006 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2007 switch ((insn
>> 22) & 3) {
2009 if (insn
& (1 << 21))
2010 gen_op_iwmmxt_cmpgtsb_M0_wRn(rd1
);
2012 gen_op_iwmmxt_cmpgtub_M0_wRn(rd1
);
2015 if (insn
& (1 << 21))
2016 gen_op_iwmmxt_cmpgtsw_M0_wRn(rd1
);
2018 gen_op_iwmmxt_cmpgtuw_M0_wRn(rd1
);
2021 if (insn
& (1 << 21))
2022 gen_op_iwmmxt_cmpgtsl_M0_wRn(rd1
);
2024 gen_op_iwmmxt_cmpgtul_M0_wRn(rd1
);
2029 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2030 gen_op_iwmmxt_set_mup();
2031 gen_op_iwmmxt_set_cup();
2033 case 0x00e: case 0x20e: case 0x40e: case 0x60e: /* WUNPCKEL */
2034 case 0x80e: case 0xa0e: case 0xc0e: case 0xe0e:
2035 wrd
= (insn
>> 12) & 0xf;
2036 rd0
= (insn
>> 16) & 0xf;
2037 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2038 switch ((insn
>> 22) & 3) {
2040 if (insn
& (1 << 21))
2041 gen_op_iwmmxt_unpacklsb_M0();
2043 gen_op_iwmmxt_unpacklub_M0();
2046 if (insn
& (1 << 21))
2047 gen_op_iwmmxt_unpacklsw_M0();
2049 gen_op_iwmmxt_unpackluw_M0();
2052 if (insn
& (1 << 21))
2053 gen_op_iwmmxt_unpacklsl_M0();
2055 gen_op_iwmmxt_unpacklul_M0();
2060 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2061 gen_op_iwmmxt_set_mup();
2062 gen_op_iwmmxt_set_cup();
2064 case 0x00c: case 0x20c: case 0x40c: case 0x60c: /* WUNPCKEH */
2065 case 0x80c: case 0xa0c: case 0xc0c: case 0xe0c:
2066 wrd
= (insn
>> 12) & 0xf;
2067 rd0
= (insn
>> 16) & 0xf;
2068 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2069 switch ((insn
>> 22) & 3) {
2071 if (insn
& (1 << 21))
2072 gen_op_iwmmxt_unpackhsb_M0();
2074 gen_op_iwmmxt_unpackhub_M0();
2077 if (insn
& (1 << 21))
2078 gen_op_iwmmxt_unpackhsw_M0();
2080 gen_op_iwmmxt_unpackhuw_M0();
2083 if (insn
& (1 << 21))
2084 gen_op_iwmmxt_unpackhsl_M0();
2086 gen_op_iwmmxt_unpackhul_M0();
2091 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2092 gen_op_iwmmxt_set_mup();
2093 gen_op_iwmmxt_set_cup();
2095 case 0x204: case 0x604: case 0xa04: case 0xe04: /* WSRL */
2096 case 0x214: case 0x614: case 0xa14: case 0xe14:
2097 wrd
= (insn
>> 12) & 0xf;
2098 rd0
= (insn
>> 16) & 0xf;
2099 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2100 if (gen_iwmmxt_shift(insn
, 0xff))
2102 switch ((insn
>> 22) & 3) {
2106 gen_helper_iwmmxt_srlw(cpu_M0
, cpu_env
, cpu_M0
, cpu_T
[0]);
2109 gen_helper_iwmmxt_srll(cpu_M0
, cpu_env
, cpu_M0
, cpu_T
[0]);
2112 gen_helper_iwmmxt_srlq(cpu_M0
, cpu_env
, cpu_M0
, cpu_T
[0]);
2115 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2116 gen_op_iwmmxt_set_mup();
2117 gen_op_iwmmxt_set_cup();
2119 case 0x004: case 0x404: case 0x804: case 0xc04: /* WSRA */
2120 case 0x014: case 0x414: case 0x814: case 0xc14:
2121 wrd
= (insn
>> 12) & 0xf;
2122 rd0
= (insn
>> 16) & 0xf;
2123 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2124 if (gen_iwmmxt_shift(insn
, 0xff))
2126 switch ((insn
>> 22) & 3) {
2130 gen_helper_iwmmxt_sraw(cpu_M0
, cpu_env
, cpu_M0
, cpu_T
[0]);
2133 gen_helper_iwmmxt_sral(cpu_M0
, cpu_env
, cpu_M0
, cpu_T
[0]);
2136 gen_helper_iwmmxt_sraq(cpu_M0
, cpu_env
, cpu_M0
, cpu_T
[0]);
2139 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2140 gen_op_iwmmxt_set_mup();
2141 gen_op_iwmmxt_set_cup();
2143 case 0x104: case 0x504: case 0x904: case 0xd04: /* WSLL */
2144 case 0x114: case 0x514: case 0x914: case 0xd14:
2145 wrd
= (insn
>> 12) & 0xf;
2146 rd0
= (insn
>> 16) & 0xf;
2147 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2148 if (gen_iwmmxt_shift(insn
, 0xff))
2150 switch ((insn
>> 22) & 3) {
2154 gen_helper_iwmmxt_sllw(cpu_M0
, cpu_env
, cpu_M0
, cpu_T
[0]);
2157 gen_helper_iwmmxt_slll(cpu_M0
, cpu_env
, cpu_M0
, cpu_T
[0]);
2160 gen_helper_iwmmxt_sllq(cpu_M0
, cpu_env
, cpu_M0
, cpu_T
[0]);
2163 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2164 gen_op_iwmmxt_set_mup();
2165 gen_op_iwmmxt_set_cup();
2167 case 0x304: case 0x704: case 0xb04: case 0xf04: /* WROR */
2168 case 0x314: case 0x714: case 0xb14: case 0xf14:
2169 wrd
= (insn
>> 12) & 0xf;
2170 rd0
= (insn
>> 16) & 0xf;
2171 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2172 switch ((insn
>> 22) & 3) {
2176 if (gen_iwmmxt_shift(insn
, 0xf))
2178 gen_helper_iwmmxt_rorw(cpu_M0
, cpu_env
, cpu_M0
, cpu_T
[0]);
2181 if (gen_iwmmxt_shift(insn
, 0x1f))
2183 gen_helper_iwmmxt_rorl(cpu_M0
, cpu_env
, cpu_M0
, cpu_T
[0]);
2186 if (gen_iwmmxt_shift(insn
, 0x3f))
2188 gen_helper_iwmmxt_rorq(cpu_M0
, cpu_env
, cpu_M0
, cpu_T
[0]);
2191 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2192 gen_op_iwmmxt_set_mup();
2193 gen_op_iwmmxt_set_cup();
2195 case 0x116: case 0x316: case 0x516: case 0x716: /* WMIN */
2196 case 0x916: case 0xb16: case 0xd16: case 0xf16:
2197 wrd
= (insn
>> 12) & 0xf;
2198 rd0
= (insn
>> 16) & 0xf;
2199 rd1
= (insn
>> 0) & 0xf;
2200 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2201 switch ((insn
>> 22) & 3) {
2203 if (insn
& (1 << 21))
2204 gen_op_iwmmxt_minsb_M0_wRn(rd1
);
2206 gen_op_iwmmxt_minub_M0_wRn(rd1
);
2209 if (insn
& (1 << 21))
2210 gen_op_iwmmxt_minsw_M0_wRn(rd1
);
2212 gen_op_iwmmxt_minuw_M0_wRn(rd1
);
2215 if (insn
& (1 << 21))
2216 gen_op_iwmmxt_minsl_M0_wRn(rd1
);
2218 gen_op_iwmmxt_minul_M0_wRn(rd1
);
2223 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2224 gen_op_iwmmxt_set_mup();
2226 case 0x016: case 0x216: case 0x416: case 0x616: /* WMAX */
2227 case 0x816: case 0xa16: case 0xc16: case 0xe16:
2228 wrd
= (insn
>> 12) & 0xf;
2229 rd0
= (insn
>> 16) & 0xf;
2230 rd1
= (insn
>> 0) & 0xf;
2231 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2232 switch ((insn
>> 22) & 3) {
2234 if (insn
& (1 << 21))
2235 gen_op_iwmmxt_maxsb_M0_wRn(rd1
);
2237 gen_op_iwmmxt_maxub_M0_wRn(rd1
);
2240 if (insn
& (1 << 21))
2241 gen_op_iwmmxt_maxsw_M0_wRn(rd1
);
2243 gen_op_iwmmxt_maxuw_M0_wRn(rd1
);
2246 if (insn
& (1 << 21))
2247 gen_op_iwmmxt_maxsl_M0_wRn(rd1
);
2249 gen_op_iwmmxt_maxul_M0_wRn(rd1
);
2254 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2255 gen_op_iwmmxt_set_mup();
2257 case 0x002: case 0x102: case 0x202: case 0x302: /* WALIGNI */
2258 case 0x402: case 0x502: case 0x602: case 0x702:
2259 wrd
= (insn
>> 12) & 0xf;
2260 rd0
= (insn
>> 16) & 0xf;
2261 rd1
= (insn
>> 0) & 0xf;
2262 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2263 gen_op_movl_T0_im((insn
>> 20) & 3);
2264 gen_op_iwmmxt_align_M0_T0_wRn(rd1
);
2265 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2266 gen_op_iwmmxt_set_mup();
2268 case 0x01a: case 0x11a: case 0x21a: case 0x31a: /* WSUB */
2269 case 0x41a: case 0x51a: case 0x61a: case 0x71a:
2270 case 0x81a: case 0x91a: case 0xa1a: case 0xb1a:
2271 case 0xc1a: case 0xd1a: case 0xe1a: case 0xf1a:
2272 wrd
= (insn
>> 12) & 0xf;
2273 rd0
= (insn
>> 16) & 0xf;
2274 rd1
= (insn
>> 0) & 0xf;
2275 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2276 switch ((insn
>> 20) & 0xf) {
2278 gen_op_iwmmxt_subnb_M0_wRn(rd1
);
2281 gen_op_iwmmxt_subub_M0_wRn(rd1
);
2284 gen_op_iwmmxt_subsb_M0_wRn(rd1
);
2287 gen_op_iwmmxt_subnw_M0_wRn(rd1
);
2290 gen_op_iwmmxt_subuw_M0_wRn(rd1
);
2293 gen_op_iwmmxt_subsw_M0_wRn(rd1
);
2296 gen_op_iwmmxt_subnl_M0_wRn(rd1
);
2299 gen_op_iwmmxt_subul_M0_wRn(rd1
);
2302 gen_op_iwmmxt_subsl_M0_wRn(rd1
);
2307 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2308 gen_op_iwmmxt_set_mup();
2309 gen_op_iwmmxt_set_cup();
2311 case 0x01e: case 0x11e: case 0x21e: case 0x31e: /* WSHUFH */
2312 case 0x41e: case 0x51e: case 0x61e: case 0x71e:
2313 case 0x81e: case 0x91e: case 0xa1e: case 0xb1e:
2314 case 0xc1e: case 0xd1e: case 0xe1e: case 0xf1e:
2315 wrd
= (insn
>> 12) & 0xf;
2316 rd0
= (insn
>> 16) & 0xf;
2317 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2318 gen_op_movl_T0_im(((insn
>> 16) & 0xf0) | (insn
& 0x0f));
2319 gen_helper_iwmmxt_shufh(cpu_M0
, cpu_env
, cpu_M0
, cpu_T
[0]);
2320 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2321 gen_op_iwmmxt_set_mup();
2322 gen_op_iwmmxt_set_cup();
2324 case 0x018: case 0x118: case 0x218: case 0x318: /* WADD */
2325 case 0x418: case 0x518: case 0x618: case 0x718:
2326 case 0x818: case 0x918: case 0xa18: case 0xb18:
2327 case 0xc18: case 0xd18: case 0xe18: case 0xf18:
2328 wrd
= (insn
>> 12) & 0xf;
2329 rd0
= (insn
>> 16) & 0xf;
2330 rd1
= (insn
>> 0) & 0xf;
2331 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2332 switch ((insn
>> 20) & 0xf) {
2334 gen_op_iwmmxt_addnb_M0_wRn(rd1
);
2337 gen_op_iwmmxt_addub_M0_wRn(rd1
);
2340 gen_op_iwmmxt_addsb_M0_wRn(rd1
);
2343 gen_op_iwmmxt_addnw_M0_wRn(rd1
);
2346 gen_op_iwmmxt_adduw_M0_wRn(rd1
);
2349 gen_op_iwmmxt_addsw_M0_wRn(rd1
);
2352 gen_op_iwmmxt_addnl_M0_wRn(rd1
);
2355 gen_op_iwmmxt_addul_M0_wRn(rd1
);
2358 gen_op_iwmmxt_addsl_M0_wRn(rd1
);
2363 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2364 gen_op_iwmmxt_set_mup();
2365 gen_op_iwmmxt_set_cup();
2367 case 0x008: case 0x108: case 0x208: case 0x308: /* WPACK */
2368 case 0x408: case 0x508: case 0x608: case 0x708:
2369 case 0x808: case 0x908: case 0xa08: case 0xb08:
2370 case 0xc08: case 0xd08: case 0xe08: case 0xf08:
2371 wrd
= (insn
>> 12) & 0xf;
2372 rd0
= (insn
>> 16) & 0xf;
2373 rd1
= (insn
>> 0) & 0xf;
2374 gen_op_iwmmxt_movq_M0_wRn(rd0
);
2375 if (!(insn
& (1 << 20)))
2377 switch ((insn
>> 22) & 3) {
2381 if (insn
& (1 << 21))
2382 gen_op_iwmmxt_packsw_M0_wRn(rd1
);
2384 gen_op_iwmmxt_packuw_M0_wRn(rd1
);
2387 if (insn
& (1 << 21))
2388 gen_op_iwmmxt_packsl_M0_wRn(rd1
);
2390 gen_op_iwmmxt_packul_M0_wRn(rd1
);
2393 if (insn
& (1 << 21))
2394 gen_op_iwmmxt_packsq_M0_wRn(rd1
);
2396 gen_op_iwmmxt_packuq_M0_wRn(rd1
);
2399 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2400 gen_op_iwmmxt_set_mup();
2401 gen_op_iwmmxt_set_cup();
2403 case 0x201: case 0x203: case 0x205: case 0x207:
2404 case 0x209: case 0x20b: case 0x20d: case 0x20f:
2405 case 0x211: case 0x213: case 0x215: case 0x217:
2406 case 0x219: case 0x21b: case 0x21d: case 0x21f:
2407 wrd
= (insn
>> 5) & 0xf;
2408 rd0
= (insn
>> 12) & 0xf;
2409 rd1
= (insn
>> 0) & 0xf;
2410 if (rd0
== 0xf || rd1
== 0xf)
2412 gen_op_iwmmxt_movq_M0_wRn(wrd
);
2413 switch ((insn
>> 16) & 0xf) {
2414 case 0x0: /* TMIA */
2415 gen_movl_T0_reg(s
, rd0
);
2416 gen_movl_T1_reg(s
, rd1
);
2417 gen_op_iwmmxt_muladdsl_M0_T0_T1();
2419 case 0x8: /* TMIAPH */
2420 gen_movl_T0_reg(s
, rd0
);
2421 gen_movl_T1_reg(s
, rd1
);
2422 gen_op_iwmmxt_muladdsw_M0_T0_T1();
2424 case 0xc: case 0xd: case 0xe: case 0xf: /* TMIAxy */
2425 gen_movl_T1_reg(s
, rd0
);
2426 if (insn
& (1 << 16))
2427 gen_op_shrl_T1_im(16);
2428 gen_op_movl_T0_T1();
2429 gen_movl_T1_reg(s
, rd1
);
2430 if (insn
& (1 << 17))
2431 gen_op_shrl_T1_im(16);
2432 gen_op_iwmmxt_muladdswl_M0_T0_T1();
2437 gen_op_iwmmxt_movq_wRn_M0(wrd
);
2438 gen_op_iwmmxt_set_mup();
2447 /* Disassemble an XScale DSP instruction. Returns nonzero if an error occured
2448 (ie. an undefined instruction). */
2449 static int disas_dsp_insn(CPUState
*env
, DisasContext
*s
, uint32_t insn
)
2451 int acc
, rd0
, rd1
, rdhi
, rdlo
;
2453 if ((insn
& 0x0ff00f10) == 0x0e200010) {
2454 /* Multiply with Internal Accumulate Format */
2455 rd0
= (insn
>> 12) & 0xf;
2457 acc
= (insn
>> 5) & 7;
2462 switch ((insn
>> 16) & 0xf) {
2464 gen_movl_T0_reg(s
, rd0
);
2465 gen_movl_T1_reg(s
, rd1
);
2466 gen_op_iwmmxt_muladdsl_M0_T0_T1();
2468 case 0x8: /* MIAPH */
2469 gen_movl_T0_reg(s
, rd0
);
2470 gen_movl_T1_reg(s
, rd1
);
2471 gen_op_iwmmxt_muladdsw_M0_T0_T1();
2473 case 0xc: /* MIABB */
2474 case 0xd: /* MIABT */
2475 case 0xe: /* MIATB */
2476 case 0xf: /* MIATT */
2477 gen_movl_T1_reg(s
, rd0
);
2478 if (insn
& (1 << 16))
2479 gen_op_shrl_T1_im(16);
2480 gen_op_movl_T0_T1();
2481 gen_movl_T1_reg(s
, rd1
);
2482 if (insn
& (1 << 17))
2483 gen_op_shrl_T1_im(16);
2484 gen_op_iwmmxt_muladdswl_M0_T0_T1();
2490 gen_op_iwmmxt_movq_wRn_M0(acc
);
2494 if ((insn
& 0x0fe00ff8) == 0x0c400000) {
2495 /* Internal Accumulator Access Format */
2496 rdhi
= (insn
>> 16) & 0xf;
2497 rdlo
= (insn
>> 12) & 0xf;
2503 if (insn
& ARM_CP_RW_BIT
) { /* MRA */
2504 gen_iwmmxt_movl_T0_T1_wRn(acc
);
2505 gen_movl_reg_T0(s
, rdlo
);
2506 gen_op_movl_T0_im((1 << (40 - 32)) - 1);
2507 gen_op_andl_T0_T1();
2508 gen_movl_reg_T0(s
, rdhi
);
2510 gen_movl_T0_reg(s
, rdlo
);
2511 gen_movl_T1_reg(s
, rdhi
);
2512 gen_iwmmxt_movl_wRn_T0_T1(acc
);
2520 /* Disassemble system coprocessor instruction. Return nonzero if
2521 instruction is not defined. */
2522 static int disas_cp_insn(CPUState
*env
, DisasContext
*s
, uint32_t insn
)
2525 uint32_t rd
= (insn
>> 12) & 0xf;
2526 uint32_t cp
= (insn
>> 8) & 0xf;
2531 if (insn
& ARM_CP_RW_BIT
) {
2532 if (!env
->cp
[cp
].cp_read
)
2534 gen_set_pc_im(s
->pc
);
2536 gen_helper_get_cp(tmp
, cpu_env
, tcg_const_i32(insn
));
2537 store_reg(s
, rd
, tmp
);
2539 if (!env
->cp
[cp
].cp_write
)
2541 gen_set_pc_im(s
->pc
);
2542 tmp
= load_reg(s
, rd
);
2543 gen_helper_set_cp(cpu_env
, tcg_const_i32(insn
), tmp
);
2549 static int cp15_user_ok(uint32_t insn
)
2551 int cpn
= (insn
>> 16) & 0xf;
2552 int cpm
= insn
& 0xf;
2553 int op
= ((insn
>> 5) & 7) | ((insn
>> 18) & 0x38);
2555 if (cpn
== 13 && cpm
== 0) {
2557 if (op
== 2 || (op
== 3 && (insn
& ARM_CP_RW_BIT
)))
2561 /* ISB, DSB, DMB. */
2562 if ((cpm
== 5 && op
== 4)
2563 || (cpm
== 10 && (op
== 4 || op
== 5)))
2569 /* Disassemble system coprocessor (cp15) instruction. Return nonzero if
2570 instruction is not defined. */
2571 static int disas_cp15_insn(CPUState
*env
, DisasContext
*s
, uint32_t insn
)
2576 /* M profile cores use memory mapped registers instead of cp15. */
2577 if (arm_feature(env
, ARM_FEATURE_M
))
2580 if ((insn
& (1 << 25)) == 0) {
2581 if (insn
& (1 << 20)) {
2585 /* mcrr. Used for block cache operations, so implement as no-op. */
2588 if ((insn
& (1 << 4)) == 0) {
2592 if (IS_USER(s
) && !cp15_user_ok(insn
)) {
2595 if ((insn
& 0x0fff0fff) == 0x0e070f90
2596 || (insn
& 0x0fff0fff) == 0x0e070f58) {
2597 /* Wait for interrupt. */
2598 gen_set_pc_im(s
->pc
);
2599 s
->is_jmp
= DISAS_WFI
;
2602 rd
= (insn
>> 12) & 0xf;
2603 if (insn
& ARM_CP_RW_BIT
) {
2605 gen_helper_get_cp15(tmp
, cpu_env
, tcg_const_i32(insn
));
2606 /* If the destination register is r15 then sets condition codes. */
2608 store_reg(s
, rd
, tmp
);
2612 tmp
= load_reg(s
, rd
);
2613 gen_helper_set_cp15(cpu_env
, tcg_const_i32(insn
), tmp
);
2615 /* Normally we would always end the TB here, but Linux
2616 * arch/arm/mach-pxa/sleep.S expects two instructions following
2617 * an MMU enable to execute from cache. Imitate this behaviour. */
2618 if (!arm_feature(env
, ARM_FEATURE_XSCALE
) ||
2619 (insn
& 0x0fff0fff) != 0x0e010f10)
2625 #define VFP_REG_SHR(x, n) (((n) > 0) ? (x) >> (n) : (x) << -(n))
2626 #define VFP_SREG(insn, bigbit, smallbit) \
2627 ((VFP_REG_SHR(insn, bigbit - 1) & 0x1e) | (((insn) >> (smallbit)) & 1))
2628 #define VFP_DREG(reg, insn, bigbit, smallbit) do { \
2629 if (arm_feature(env, ARM_FEATURE_VFP3)) { \
2630 reg = (((insn) >> (bigbit)) & 0x0f) \
2631 | (((insn) >> ((smallbit) - 4)) & 0x10); \
2633 if (insn & (1 << (smallbit))) \
2635 reg = ((insn) >> (bigbit)) & 0x0f; \
2638 #define VFP_SREG_D(insn) VFP_SREG(insn, 12, 22)
2639 #define VFP_DREG_D(reg, insn) VFP_DREG(reg, insn, 12, 22)
2640 #define VFP_SREG_N(insn) VFP_SREG(insn, 16, 7)
2641 #define VFP_DREG_N(reg, insn) VFP_DREG(reg, insn, 16, 7)
2642 #define VFP_SREG_M(insn) VFP_SREG(insn, 0, 5)
2643 #define VFP_DREG_M(reg, insn) VFP_DREG(reg, insn, 0, 5)
2645 /* Move between integer and VFP cores. */
2646 static TCGv
gen_vfp_mrs(void)
2648 TCGv tmp
= new_tmp();
2649 tcg_gen_mov_i32(tmp
, cpu_F0s
);
2653 static void gen_vfp_msr(TCGv tmp
)
2655 tcg_gen_mov_i32(cpu_F0s
, tmp
);
2660 vfp_enabled(CPUState
* env
)
2662 return ((env
->vfp
.xregs
[ARM_VFP_FPEXC
] & (1 << 30)) != 0);
2665 static void gen_neon_dup_u8(TCGv var
, int shift
)
2667 TCGv tmp
= new_tmp();
2669 tcg_gen_shri_i32(var
, var
, shift
);
2670 tcg_gen_ext8u_i32(var
, var
);
2671 tcg_gen_shli_i32(tmp
, var
, 8);
2672 tcg_gen_or_i32(var
, var
, tmp
);
2673 tcg_gen_shli_i32(tmp
, var
, 16);
2674 tcg_gen_or_i32(var
, var
, tmp
);
2678 static void gen_neon_dup_low16(TCGv var
)
2680 TCGv tmp
= new_tmp();
2681 tcg_gen_ext16u_i32(var
, var
);
2682 tcg_gen_shli_i32(tmp
, var
, 16);
2683 tcg_gen_or_i32(var
, var
, tmp
);
2687 static void gen_neon_dup_high16(TCGv var
)
2689 TCGv tmp
= new_tmp();
2690 tcg_gen_andi_i32(var
, var
, 0xffff0000);
2691 tcg_gen_shri_i32(tmp
, var
, 16);
2692 tcg_gen_or_i32(var
, var
, tmp
);
2696 /* Disassemble a VFP instruction. Returns nonzero if an error occured
2697 (ie. an undefined instruction). */
2698 static int disas_vfp_insn(CPUState
* env
, DisasContext
*s
, uint32_t insn
)
2700 uint32_t rd
, rn
, rm
, op
, i
, n
, offset
, delta_d
, delta_m
, bank_mask
;
2705 if (!arm_feature(env
, ARM_FEATURE_VFP
))
2708 if (!vfp_enabled(env
)) {
2709 /* VFP disabled. Only allow fmxr/fmrx to/from some control regs. */
2710 if ((insn
& 0x0fe00fff) != 0x0ee00a10)
2712 rn
= (insn
>> 16) & 0xf;
2713 if (rn
!= ARM_VFP_FPSID
&& rn
!= ARM_VFP_FPEXC
2714 && rn
!= ARM_VFP_MVFR1
&& rn
!= ARM_VFP_MVFR0
)
2717 dp
= ((insn
& 0xf00) == 0xb00);
2718 switch ((insn
>> 24) & 0xf) {
2720 if (insn
& (1 << 4)) {
2721 /* single register transfer */
2722 rd
= (insn
>> 12) & 0xf;
2727 VFP_DREG_N(rn
, insn
);
2730 if (insn
& 0x00c00060
2731 && !arm_feature(env
, ARM_FEATURE_NEON
))
2734 pass
= (insn
>> 21) & 1;
2735 if (insn
& (1 << 22)) {
2737 offset
= ((insn
>> 5) & 3) * 8;
2738 } else if (insn
& (1 << 5)) {
2740 offset
= (insn
& (1 << 6)) ? 16 : 0;
2745 if (insn
& ARM_CP_RW_BIT
) {
2747 tmp
= neon_load_reg(rn
, pass
);
2751 tcg_gen_shri_i32(tmp
, tmp
, offset
);
2752 if (insn
& (1 << 23))
2758 if (insn
& (1 << 23)) {
2760 tcg_gen_shri_i32(tmp
, tmp
, 16);
2766 tcg_gen_sari_i32(tmp
, tmp
, 16);
2775 store_reg(s
, rd
, tmp
);
2778 tmp
= load_reg(s
, rd
);
2779 if (insn
& (1 << 23)) {
2782 gen_neon_dup_u8(tmp
, 0);
2783 } else if (size
== 1) {
2784 gen_neon_dup_low16(tmp
);
2786 for (n
= 0; n
<= pass
* 2; n
++) {
2788 tcg_gen_mov_i32(tmp2
, tmp
);
2789 neon_store_reg(rn
, n
, tmp2
);
2791 neon_store_reg(rn
, n
, tmp
);
2796 tmp2
= neon_load_reg(rn
, pass
);
2797 gen_bfi(tmp
, tmp2
, tmp
, offset
, 0xff);
2801 tmp2
= neon_load_reg(rn
, pass
);
2802 gen_bfi(tmp
, tmp2
, tmp
, offset
, 0xffff);
2808 neon_store_reg(rn
, pass
, tmp
);
2812 if ((insn
& 0x6f) != 0x00)
2814 rn
= VFP_SREG_N(insn
);
2815 if (insn
& ARM_CP_RW_BIT
) {
2817 if (insn
& (1 << 21)) {
2818 /* system register */
2823 /* VFP2 allows access to FSID from userspace.
2824 VFP3 restricts all id registers to privileged
2827 && arm_feature(env
, ARM_FEATURE_VFP3
))
2829 tmp
= load_cpu_field(vfp
.xregs
[rn
]);
2834 tmp
= load_cpu_field(vfp
.xregs
[rn
]);
2836 case ARM_VFP_FPINST
:
2837 case ARM_VFP_FPINST2
:
2838 /* Not present in VFP3. */
2840 || arm_feature(env
, ARM_FEATURE_VFP3
))
2842 tmp
= load_cpu_field(vfp
.xregs
[rn
]);
2846 tmp
= load_cpu_field(vfp
.xregs
[ARM_VFP_FPSCR
]);
2847 tcg_gen_andi_i32(tmp
, tmp
, 0xf0000000);
2850 gen_helper_vfp_get_fpscr(tmp
, cpu_env
);
2856 || !arm_feature(env
, ARM_FEATURE_VFP3
))
2858 tmp
= load_cpu_field(vfp
.xregs
[rn
]);
2864 gen_mov_F0_vreg(0, rn
);
2865 tmp
= gen_vfp_mrs();
2868 /* Set the 4 flag bits in the CPSR. */
2872 store_reg(s
, rd
, tmp
);
2876 tmp
= load_reg(s
, rd
);
2877 if (insn
& (1 << 21)) {
2879 /* system register */
2884 /* Writes are ignored. */
2887 gen_helper_vfp_set_fpscr(cpu_env
, tmp
);
2894 store_cpu_field(tmp
, vfp
.xregs
[rn
]);
2897 case ARM_VFP_FPINST
:
2898 case ARM_VFP_FPINST2
:
2899 store_cpu_field(tmp
, vfp
.xregs
[rn
]);
2906 gen_mov_vreg_F0(0, rn
);
2911 /* data processing */
2912 /* The opcode is in bits 23, 21, 20 and 6. */
2913 op
= ((insn
>> 20) & 8) | ((insn
>> 19) & 6) | ((insn
>> 6) & 1);
2917 rn
= ((insn
>> 15) & 0x1e) | ((insn
>> 7) & 1);
2919 /* rn is register number */
2920 VFP_DREG_N(rn
, insn
);
2923 if (op
== 15 && (rn
== 15 || rn
> 17)) {
2924 /* Integer or single precision destination. */
2925 rd
= VFP_SREG_D(insn
);
2927 VFP_DREG_D(rd
, insn
);
2930 if (op
== 15 && (rn
== 16 || rn
== 17)) {
2931 /* Integer source. */
2932 rm
= ((insn
<< 1) & 0x1e) | ((insn
>> 5) & 1);
2934 VFP_DREG_M(rm
, insn
);
2937 rn
= VFP_SREG_N(insn
);
2938 if (op
== 15 && rn
== 15) {
2939 /* Double precision destination. */
2940 VFP_DREG_D(rd
, insn
);
2942 rd
= VFP_SREG_D(insn
);
2944 rm
= VFP_SREG_M(insn
);
2947 veclen
= env
->vfp
.vec_len
;
2948 if (op
== 15 && rn
> 3)
2951 /* Shut up compiler warnings. */
2962 /* Figure out what type of vector operation this is. */
2963 if ((rd
& bank_mask
) == 0) {
2968 delta_d
= (env
->vfp
.vec_stride
>> 1) + 1;
2970 delta_d
= env
->vfp
.vec_stride
+ 1;
2972 if ((rm
& bank_mask
) == 0) {
2973 /* mixed scalar/vector */
2982 /* Load the initial operands. */
2987 /* Integer source */
2988 gen_mov_F0_vreg(0, rm
);
2993 gen_mov_F0_vreg(dp
, rd
);
2994 gen_mov_F1_vreg(dp
, rm
);
2998 /* Compare with zero */
2999 gen_mov_F0_vreg(dp
, rd
);
3010 /* Source and destination the same. */
3011 gen_mov_F0_vreg(dp
, rd
);
3014 /* One source operand. */
3015 gen_mov_F0_vreg(dp
, rm
);
3019 /* Two source operands. */
3020 gen_mov_F0_vreg(dp
, rn
);
3021 gen_mov_F1_vreg(dp
, rm
);
3025 /* Perform the calculation. */
3027 case 0: /* mac: fd + (fn * fm) */
3029 gen_mov_F1_vreg(dp
, rd
);
3032 case 1: /* nmac: fd - (fn * fm) */
3035 gen_mov_F1_vreg(dp
, rd
);
3038 case 2: /* msc: -fd + (fn * fm) */
3040 gen_mov_F1_vreg(dp
, rd
);
3043 case 3: /* nmsc: -fd - (fn * fm) */
3046 gen_mov_F1_vreg(dp
, rd
);
3049 case 4: /* mul: fn * fm */
3052 case 5: /* nmul: -(fn * fm) */
3056 case 6: /* add: fn + fm */
3059 case 7: /* sub: fn - fm */
3062 case 8: /* div: fn / fm */
3065 case 14: /* fconst */
3066 if (!arm_feature(env
, ARM_FEATURE_VFP3
))
3069 n
= (insn
<< 12) & 0x80000000;
3070 i
= ((insn
>> 12) & 0x70) | (insn
& 0xf);
3077 tcg_gen_movi_i64(cpu_F0d
, ((uint64_t)n
) << 32);
3084 tcg_gen_movi_i32(cpu_F0s
, n
);
3087 case 15: /* extension space */
3110 case 11: /* cmpez */
3114 case 15: /* single<->double conversion */
3116 gen_helper_vfp_fcvtsd(cpu_F0s
, cpu_F0d
, cpu_env
);
3118 gen_helper_vfp_fcvtds(cpu_F0d
, cpu_F0s
, cpu_env
);
3120 case 16: /* fuito */
3123 case 17: /* fsito */
3126 case 20: /* fshto */
3127 if (!arm_feature(env
, ARM_FEATURE_VFP3
))
3129 gen_vfp_shto(dp
, 16 - rm
);
3131 case 21: /* fslto */
3132 if (!arm_feature(env
, ARM_FEATURE_VFP3
))
3134 gen_vfp_slto(dp
, 32 - rm
);
3136 case 22: /* fuhto */
3137 if (!arm_feature(env
, ARM_FEATURE_VFP3
))
3139 gen_vfp_uhto(dp
, 16 - rm
);
3141 case 23: /* fulto */
3142 if (!arm_feature(env
, ARM_FEATURE_VFP3
))
3144 gen_vfp_ulto(dp
, 32 - rm
);
3146 case 24: /* ftoui */
3149 case 25: /* ftouiz */
3152 case 26: /* ftosi */
3155 case 27: /* ftosiz */
3158 case 28: /* ftosh */
3159 if (!arm_feature(env
, ARM_FEATURE_VFP3
))
3161 gen_vfp_tosh(dp
, 16 - rm
);
3163 case 29: /* ftosl */
3164 if (!arm_feature(env
, ARM_FEATURE_VFP3
))
3166 gen_vfp_tosl(dp
, 32 - rm
);
3168 case 30: /* ftouh */
3169 if (!arm_feature(env
, ARM_FEATURE_VFP3
))
3171 gen_vfp_touh(dp
, 16 - rm
);
3173 case 31: /* ftoul */
3174 if (!arm_feature(env
, ARM_FEATURE_VFP3
))
3176 gen_vfp_toul(dp
, 32 - rm
);
3178 default: /* undefined */
3179 printf ("rn:%d\n", rn
);
3183 default: /* undefined */
3184 printf ("op:%d\n", op
);
3188 /* Write back the result. */
3189 if (op
== 15 && (rn
>= 8 && rn
<= 11))
3190 ; /* Comparison, do nothing. */
3191 else if (op
== 15 && rn
> 17)
3192 /* Integer result. */
3193 gen_mov_vreg_F0(0, rd
);
3194 else if (op
== 15 && rn
== 15)
3196 gen_mov_vreg_F0(!dp
, rd
);
3198 gen_mov_vreg_F0(dp
, rd
);
3200 /* break out of the loop if we have finished */
3204 if (op
== 15 && delta_m
== 0) {
3205 /* single source one-many */
3207 rd
= ((rd
+ delta_d
) & (bank_mask
- 1))
3209 gen_mov_vreg_F0(dp
, rd
);
3213 /* Setup the next operands. */
3215 rd
= ((rd
+ delta_d
) & (bank_mask
- 1))
3219 /* One source operand. */
3220 rm
= ((rm
+ delta_m
) & (bank_mask
- 1))
3222 gen_mov_F0_vreg(dp
, rm
);
3224 /* Two source operands. */
3225 rn
= ((rn
+ delta_d
) & (bank_mask
- 1))
3227 gen_mov_F0_vreg(dp
, rn
);
3229 rm
= ((rm
+ delta_m
) & (bank_mask
- 1))
3231 gen_mov_F1_vreg(dp
, rm
);
3239 if (dp
&& (insn
& 0x03e00000) == 0x00400000) {
3240 /* two-register transfer */
3241 rn
= (insn
>> 16) & 0xf;
3242 rd
= (insn
>> 12) & 0xf;
3244 VFP_DREG_M(rm
, insn
);
3246 rm
= VFP_SREG_M(insn
);
3249 if (insn
& ARM_CP_RW_BIT
) {
3252 gen_mov_F0_vreg(0, rm
* 2);
3253 tmp
= gen_vfp_mrs();
3254 store_reg(s
, rd
, tmp
);
3255 gen_mov_F0_vreg(0, rm
* 2 + 1);
3256 tmp
= gen_vfp_mrs();
3257 store_reg(s
, rn
, tmp
);
3259 gen_mov_F0_vreg(0, rm
);
3260 tmp
= gen_vfp_mrs();
3261 store_reg(s
, rn
, tmp
);
3262 gen_mov_F0_vreg(0, rm
+ 1);
3263 tmp
= gen_vfp_mrs();
3264 store_reg(s
, rd
, tmp
);
3269 tmp
= load_reg(s
, rd
);
3271 gen_mov_vreg_F0(0, rm
* 2);
3272 tmp
= load_reg(s
, rn
);
3274 gen_mov_vreg_F0(0, rm
* 2 + 1);
3276 tmp
= load_reg(s
, rn
);
3278 gen_mov_vreg_F0(0, rm
);
3279 tmp
= load_reg(s
, rd
);
3281 gen_mov_vreg_F0(0, rm
+ 1);
3286 rn
= (insn
>> 16) & 0xf;
3288 VFP_DREG_D(rd
, insn
);
3290 rd
= VFP_SREG_D(insn
);
3291 if (s
->thumb
&& rn
== 15) {
3292 gen_op_movl_T1_im(s
->pc
& ~2);
3294 gen_movl_T1_reg(s
, rn
);
3296 if ((insn
& 0x01200000) == 0x01000000) {
3297 /* Single load/store */
3298 offset
= (insn
& 0xff) << 2;
3299 if ((insn
& (1 << 23)) == 0)
3301 gen_op_addl_T1_im(offset
);
3302 if (insn
& (1 << 20)) {
3304 gen_mov_vreg_F0(dp
, rd
);
3306 gen_mov_F0_vreg(dp
, rd
);
3310 /* load/store multiple */
3312 n
= (insn
>> 1) & 0x7f;
3316 if (insn
& (1 << 24)) /* pre-decrement */
3317 gen_op_addl_T1_im(-((insn
& 0xff) << 2));
3323 for (i
= 0; i
< n
; i
++) {
3324 if (insn
& ARM_CP_RW_BIT
) {
3327 gen_mov_vreg_F0(dp
, rd
+ i
);
3330 gen_mov_F0_vreg(dp
, rd
+ i
);
3333 gen_op_addl_T1_im(offset
);
3335 if (insn
& (1 << 21)) {
3337 if (insn
& (1 << 24))
3338 offset
= -offset
* n
;
3339 else if (dp
&& (insn
& 1))
3345 gen_op_addl_T1_im(offset
);
3346 gen_movl_reg_T1(s
, rn
);
3352 /* Should never happen. */
3358 static inline void gen_goto_tb(DisasContext
*s
, int n
, uint32_t dest
)
3360 TranslationBlock
*tb
;
3363 if ((tb
->pc
& TARGET_PAGE_MASK
) == (dest
& TARGET_PAGE_MASK
)) {
3365 gen_set_pc_im(dest
);
3366 tcg_gen_exit_tb((long)tb
+ n
);
3368 gen_set_pc_im(dest
);
3373 static inline void gen_jmp (DisasContext
*s
, uint32_t dest
)
3375 if (unlikely(s
->singlestep_enabled
)) {
3376 /* An indirect jump so that we still trigger the debug exception. */
3381 gen_goto_tb(s
, 0, dest
);
3382 s
->is_jmp
= DISAS_TB_JUMP
;
3386 static inline void gen_mulxy(TCGv t0
, TCGv t1
, int x
, int y
)
3389 tcg_gen_sari_i32(t0
, t0
, 16);
3393 tcg_gen_sari_i32(t1
, t1
, 16);
3396 tcg_gen_mul_i32(t0
, t0
, t1
);
3399 /* Return the mask of PSR bits set by a MSR instruction. */
3400 static uint32_t msr_mask(CPUState
*env
, DisasContext
*s
, int flags
, int spsr
) {
3404 if (flags
& (1 << 0))
3406 if (flags
& (1 << 1))
3408 if (flags
& (1 << 2))
3410 if (flags
& (1 << 3))
3413 /* Mask out undefined bits. */
3414 mask
&= ~CPSR_RESERVED
;
3415 if (!arm_feature(env
, ARM_FEATURE_V6
))
3416 mask
&= ~(CPSR_E
| CPSR_GE
);
3417 if (!arm_feature(env
, ARM_FEATURE_THUMB2
))
3419 /* Mask out execution state bits. */
3422 /* Mask out privileged bits. */
3428 /* Returns nonzero if access to the PSR is not permitted. */
3429 static int gen_set_psr_T0(DisasContext
*s
, uint32_t mask
, int spsr
)
3433 /* ??? This is also undefined in system mode. */
3437 tmp
= load_cpu_field(spsr
);
3438 tcg_gen_andi_i32(tmp
, tmp
, ~mask
);
3439 tcg_gen_andi_i32(cpu_T
[0], cpu_T
[0], mask
);
3440 tcg_gen_or_i32(tmp
, tmp
, cpu_T
[0]);
3441 store_cpu_field(tmp
, spsr
);
3443 gen_set_cpsr(cpu_T
[0], mask
);
3449 /* Generate an old-style exception return. */
3450 static void gen_exception_return(DisasContext
*s
)
3453 gen_movl_reg_T0(s
, 15);
3454 tmp
= load_cpu_field(spsr
);
3455 gen_set_cpsr(tmp
, 0xffffffff);
3457 s
->is_jmp
= DISAS_UPDATE
;
3460 /* Generate a v6 exception return. Marks both values as dead. */
3461 static void gen_rfe(DisasContext
*s
, TCGv pc
, TCGv cpsr
)
3463 gen_set_cpsr(cpsr
, 0xffffffff);
3465 store_reg(s
, 15, pc
);
3466 s
->is_jmp
= DISAS_UPDATE
;
3470 gen_set_condexec (DisasContext
*s
)
3472 if (s
->condexec_mask
) {
3473 uint32_t val
= (s
->condexec_cond
<< 4) | (s
->condexec_mask
>> 1);
3474 TCGv tmp
= new_tmp();
3475 tcg_gen_movi_i32(tmp
, val
);
3476 store_cpu_field(tmp
, condexec_bits
);
3480 static void gen_nop_hint(DisasContext
*s
, int val
)
3484 gen_set_pc_im(s
->pc
);
3485 s
->is_jmp
= DISAS_WFI
;
3489 /* TODO: Implement SEV and WFE. May help SMP performance. */
3495 /* These macros help make the code more readable when migrating from the
3496 old dyngen helpers. They should probably be removed when
3497 T0/T1 are removed. */
3498 #define CPU_T001 cpu_T[0], cpu_T[0], cpu_T[1]
3499 #define CPU_T0E01 cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]
3501 #define CPU_V001 cpu_V0, cpu_V0, cpu_V1
3503 static inline int gen_neon_add(int size
)
3506 case 0: gen_helper_neon_add_u8(CPU_T001
); break;
3507 case 1: gen_helper_neon_add_u16(CPU_T001
); break;
3508 case 2: gen_op_addl_T0_T1(); break;
3514 static inline void gen_neon_rsb(int size
)
3517 case 0: gen_helper_neon_sub_u8(cpu_T
[0], cpu_T
[1], cpu_T
[0]); break;
3518 case 1: gen_helper_neon_sub_u16(cpu_T
[0], cpu_T
[1], cpu_T
[0]); break;
3519 case 2: gen_op_rsbl_T0_T1(); break;
3524 /* 32-bit pairwise ops end up the same as the elementwise versions. */
3525 #define gen_helper_neon_pmax_s32 gen_helper_neon_max_s32
3526 #define gen_helper_neon_pmax_u32 gen_helper_neon_max_u32
3527 #define gen_helper_neon_pmin_s32 gen_helper_neon_min_s32
3528 #define gen_helper_neon_pmin_u32 gen_helper_neon_min_u32
3530 /* FIXME: This is wrong. They set the wrong overflow bit. */
3531 #define gen_helper_neon_qadd_s32(a, e, b, c) gen_helper_add_saturate(a, b, c)
3532 #define gen_helper_neon_qadd_u32(a, e, b, c) gen_helper_add_usaturate(a, b, c)
3533 #define gen_helper_neon_qsub_s32(a, e, b, c) gen_helper_sub_saturate(a, b, c)
3534 #define gen_helper_neon_qsub_u32(a, e, b, c) gen_helper_sub_usaturate(a, b, c)
3536 #define GEN_NEON_INTEGER_OP_ENV(name) do { \
3537 switch ((size << 1) | u) { \
3539 gen_helper_neon_##name##_s8(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]); \
3542 gen_helper_neon_##name##_u8(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]); \
3545 gen_helper_neon_##name##_s16(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]); \
3548 gen_helper_neon_##name##_u16(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]); \
3551 gen_helper_neon_##name##_s32(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]); \
3554 gen_helper_neon_##name##_u32(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]); \
3556 default: return 1; \
3559 #define GEN_NEON_INTEGER_OP(name) do { \
3560 switch ((size << 1) | u) { \
3562 gen_helper_neon_##name##_s8(cpu_T[0], cpu_T[0], cpu_T[1]); \
3565 gen_helper_neon_##name##_u8(cpu_T[0], cpu_T[0], cpu_T[1]); \
3568 gen_helper_neon_##name##_s16(cpu_T[0], cpu_T[0], cpu_T[1]); \
3571 gen_helper_neon_##name##_u16(cpu_T[0], cpu_T[0], cpu_T[1]); \
3574 gen_helper_neon_##name##_s32(cpu_T[0], cpu_T[0], cpu_T[1]); \
3577 gen_helper_neon_##name##_u32(cpu_T[0], cpu_T[0], cpu_T[1]); \
3579 default: return 1; \
3583 gen_neon_movl_scratch_T0(int scratch
)
3587 offset
= offsetof(CPUARMState
, vfp
.scratch
[scratch
]);
3588 tcg_gen_st_i32(cpu_T
[0], cpu_env
, offset
);
3592 gen_neon_movl_scratch_T1(int scratch
)
3596 offset
= offsetof(CPUARMState
, vfp
.scratch
[scratch
]);
3597 tcg_gen_st_i32(cpu_T
[1], cpu_env
, offset
);
3601 gen_neon_movl_T0_scratch(int scratch
)
3605 offset
= offsetof(CPUARMState
, vfp
.scratch
[scratch
]);
3606 tcg_gen_ld_i32(cpu_T
[0], cpu_env
, offset
);
3610 gen_neon_movl_T1_scratch(int scratch
)
3614 offset
= offsetof(CPUARMState
, vfp
.scratch
[scratch
]);
3615 tcg_gen_ld_i32(cpu_T
[1], cpu_env
, offset
);
3618 static inline void gen_neon_get_scalar(int size
, int reg
)
3621 NEON_GET_REG(T0
, reg
>> 1, reg
& 1);
3623 NEON_GET_REG(T0
, reg
>> 2, (reg
>> 1) & 1);
3625 gen_neon_dup_low16(cpu_T
[0]);
3627 gen_neon_dup_high16(cpu_T
[0]);
3631 static void gen_neon_unzip(int reg
, int q
, int tmp
, int size
)
3635 for (n
= 0; n
< q
+ 1; n
+= 2) {
3636 NEON_GET_REG(T0
, reg
, n
);
3637 NEON_GET_REG(T0
, reg
, n
+ n
);
3639 case 0: gen_helper_neon_unzip_u8(); break;
3640 case 1: gen_helper_neon_zip_u16(); break; /* zip and unzip are the same. */
3641 case 2: /* no-op */; break;
3644 gen_neon_movl_scratch_T0(tmp
+ n
);
3645 gen_neon_movl_scratch_T1(tmp
+ n
+ 1);
3653 } neon_ls_element_type
[11] = {
3667 /* Translate a NEON load/store element instruction. Return nonzero if the
3668 instruction is invalid. */
3669 static int disas_neon_ls_insn(CPUState
* env
, DisasContext
*s
, uint32_t insn
)
3685 if (!vfp_enabled(env
))
3687 VFP_DREG_D(rd
, insn
);
3688 rn
= (insn
>> 16) & 0xf;
3690 load
= (insn
& (1 << 21)) != 0;
3691 if ((insn
& (1 << 23)) == 0) {
3692 /* Load store all elements. */
3693 op
= (insn
>> 8) & 0xf;
3694 size
= (insn
>> 6) & 3;
3695 if (op
> 10 || size
== 3)
3697 nregs
= neon_ls_element_type
[op
].nregs
;
3698 interleave
= neon_ls_element_type
[op
].interleave
;
3699 gen_movl_T1_reg(s
, rn
);
3700 stride
= (1 << size
) * interleave
;
3701 for (reg
= 0; reg
< nregs
; reg
++) {
3702 if (interleave
> 2 || (interleave
== 2 && nregs
== 2)) {
3703 gen_movl_T1_reg(s
, rn
);
3704 gen_op_addl_T1_im((1 << size
) * reg
);
3705 } else if (interleave
== 2 && nregs
== 4 && reg
== 2) {
3706 gen_movl_T1_reg(s
, rn
);
3707 gen_op_addl_T1_im(1 << size
);
3709 for (pass
= 0; pass
< 2; pass
++) {
3712 tmp
= gen_ld32(cpu_T
[1], IS_USER(s
));
3713 neon_store_reg(rd
, pass
, tmp
);
3715 tmp
= neon_load_reg(rd
, pass
);
3716 gen_st32(tmp
, cpu_T
[1], IS_USER(s
));
3718 gen_op_addl_T1_im(stride
);
3719 } else if (size
== 1) {
3721 tmp
= gen_ld16u(cpu_T
[1], IS_USER(s
));
3722 gen_op_addl_T1_im(stride
);
3723 tmp2
= gen_ld16u(cpu_T
[1], IS_USER(s
));
3724 gen_op_addl_T1_im(stride
);
3725 gen_bfi(tmp
, tmp
, tmp2
, 16, 0xffff);
3727 neon_store_reg(rd
, pass
, tmp
);
3729 tmp
= neon_load_reg(rd
, pass
);
3731 tcg_gen_shri_i32(tmp2
, tmp
, 16);
3732 gen_st16(tmp
, cpu_T
[1], IS_USER(s
));
3733 gen_op_addl_T1_im(stride
);
3734 gen_st16(tmp2
, cpu_T
[1], IS_USER(s
));
3735 gen_op_addl_T1_im(stride
);
3737 } else /* size == 0 */ {
3740 for (n
= 0; n
< 4; n
++) {
3741 tmp
= gen_ld8u(cpu_T
[1], IS_USER(s
));
3742 gen_op_addl_T1_im(stride
);
3746 gen_bfi(tmp2
, tmp2
, tmp
, n
* 8, 0xff);
3750 neon_store_reg(rd
, pass
, tmp2
);
3752 tmp2
= neon_load_reg(rd
, pass
);
3753 for (n
= 0; n
< 4; n
++) {
3756 tcg_gen_mov_i32(tmp
, tmp2
);
3758 tcg_gen_shri_i32(tmp
, tmp2
, n
* 8);
3760 gen_st8(tmp
, cpu_T
[1], IS_USER(s
));
3761 gen_op_addl_T1_im(stride
);
3767 rd
+= neon_ls_element_type
[op
].spacing
;
3771 size
= (insn
>> 10) & 3;
3773 /* Load single element to all lanes. */
3776 size
= (insn
>> 6) & 3;
3777 nregs
= ((insn
>> 8) & 3) + 1;
3778 stride
= (insn
& (1 << 5)) ? 2 : 1;
3779 gen_movl_T1_reg(s
, rn
);
3780 for (reg
= 0; reg
< nregs
; reg
++) {
3783 tmp
= gen_ld8u(cpu_T
[1], IS_USER(s
));
3784 gen_neon_dup_u8(tmp
, 0);
3787 tmp
= gen_ld16u(cpu_T
[1], IS_USER(s
));
3788 gen_neon_dup_low16(tmp
);
3791 tmp
= gen_ld32(cpu_T
[0], IS_USER(s
));
3795 default: /* Avoid compiler warnings. */
3798 gen_op_addl_T1_im(1 << size
);
3800 tcg_gen_mov_i32(tmp2
, tmp
);
3801 neon_store_reg(rd
, 0, tmp2
);
3802 neon_store_reg(rd
, 1, tmp
);
3805 stride
= (1 << size
) * nregs
;
3807 /* Single element. */
3808 pass
= (insn
>> 7) & 1;
3811 shift
= ((insn
>> 5) & 3) * 8;
3815 shift
= ((insn
>> 6) & 1) * 16;
3816 stride
= (insn
& (1 << 5)) ? 2 : 1;
3820 stride
= (insn
& (1 << 6)) ? 2 : 1;
3825 nregs
= ((insn
>> 8) & 3) + 1;
3826 gen_movl_T1_reg(s
, rn
);
3827 for (reg
= 0; reg
< nregs
; reg
++) {
3831 tmp
= gen_ld8u(cpu_T
[1], IS_USER(s
));
3834 tmp
= gen_ld16u(cpu_T
[1], IS_USER(s
));
3837 tmp
= gen_ld32(cpu_T
[1], IS_USER(s
));
3839 default: /* Avoid compiler warnings. */
3843 tmp2
= neon_load_reg(rd
, pass
);
3844 gen_bfi(tmp
, tmp2
, tmp
, shift
, size
? 0xffff : 0xff);
3847 neon_store_reg(rd
, pass
, tmp
);
3848 } else { /* Store */
3849 tmp
= neon_load_reg(rd
, pass
);
3851 tcg_gen_shri_i32(tmp
, tmp
, shift
);
3854 gen_st8(tmp
, cpu_T
[1], IS_USER(s
));
3857 gen_st16(tmp
, cpu_T
[1], IS_USER(s
));
3860 gen_st32(tmp
, cpu_T
[1], IS_USER(s
));
3865 gen_op_addl_T1_im(1 << size
);
3867 stride
= nregs
* (1 << size
);
3873 base
= load_reg(s
, rn
);
3875 tcg_gen_addi_i32(base
, base
, stride
);
3878 index
= load_reg(s
, rm
);
3879 tcg_gen_add_i32(base
, base
, index
);
3882 store_reg(s
, rn
, base
);
3887 /* Bitwise select. dest = c ? t : f. Clobbers T and F. */
3888 static void gen_neon_bsl(TCGv dest
, TCGv t
, TCGv f
, TCGv c
)
3890 tcg_gen_and_i32(t
, t
, c
);
3891 tcg_gen_bic_i32(f
, f
, c
);
3892 tcg_gen_or_i32(dest
, t
, f
);
3895 static inline void gen_neon_narrow(int size
, TCGv dest
, TCGv_i64 src
)
3898 case 0: gen_helper_neon_narrow_u8(dest
, src
); break;
3899 case 1: gen_helper_neon_narrow_u16(dest
, src
); break;
3900 case 2: tcg_gen_trunc_i64_i32(dest
, src
); break;
3905 static inline void gen_neon_narrow_sats(int size
, TCGv dest
, TCGv_i64 src
)
3908 case 0: gen_helper_neon_narrow_sat_s8(dest
, cpu_env
, src
); break;
3909 case 1: gen_helper_neon_narrow_sat_s16(dest
, cpu_env
, src
); break;
3910 case 2: gen_helper_neon_narrow_sat_s32(dest
, cpu_env
, src
); break;
3915 static inline void gen_neon_narrow_satu(int size
, TCGv dest
, TCGv_i64 src
)
3918 case 0: gen_helper_neon_narrow_sat_u8(dest
, cpu_env
, src
); break;
3919 case 1: gen_helper_neon_narrow_sat_u16(dest
, cpu_env
, src
); break;
3920 case 2: gen_helper_neon_narrow_sat_u32(dest
, cpu_env
, src
); break;
3925 static inline void gen_neon_shift_narrow(int size
, TCGv var
, TCGv shift
,
3931 case 1: gen_helper_neon_rshl_u16(var
, var
, shift
); break;
3932 case 2: gen_helper_neon_rshl_u32(var
, var
, shift
); break;
3937 case 1: gen_helper_neon_rshl_s16(var
, var
, shift
); break;
3938 case 2: gen_helper_neon_rshl_s32(var
, var
, shift
); break;
3945 case 1: gen_helper_neon_rshl_u16(var
, var
, shift
); break;
3946 case 2: gen_helper_neon_rshl_u32(var
, var
, shift
); break;
3951 case 1: gen_helper_neon_shl_s16(var
, var
, shift
); break;
3952 case 2: gen_helper_neon_shl_s32(var
, var
, shift
); break;
3959 static inline void gen_neon_widen(TCGv_i64 dest
, TCGv src
, int size
, int u
)
3963 case 0: gen_helper_neon_widen_u8(dest
, src
); break;
3964 case 1: gen_helper_neon_widen_u16(dest
, src
); break;
3965 case 2: tcg_gen_extu_i32_i64(dest
, src
); break;
3970 case 0: gen_helper_neon_widen_s8(dest
, src
); break;
3971 case 1: gen_helper_neon_widen_s16(dest
, src
); break;
3972 case 2: tcg_gen_ext_i32_i64(dest
, src
); break;
3979 static inline void gen_neon_addl(int size
)
3982 case 0: gen_helper_neon_addl_u16(CPU_V001
); break;
3983 case 1: gen_helper_neon_addl_u32(CPU_V001
); break;
3984 case 2: tcg_gen_add_i64(CPU_V001
); break;
3989 static inline void gen_neon_subl(int size
)
3992 case 0: gen_helper_neon_subl_u16(CPU_V001
); break;
3993 case 1: gen_helper_neon_subl_u32(CPU_V001
); break;
3994 case 2: tcg_gen_sub_i64(CPU_V001
); break;
3999 static inline void gen_neon_negl(TCGv_i64 var
, int size
)
4002 case 0: gen_helper_neon_negl_u16(var
, var
); break;
4003 case 1: gen_helper_neon_negl_u32(var
, var
); break;
4004 case 2: gen_helper_neon_negl_u64(var
, var
); break;
4009 static inline void gen_neon_addl_saturate(TCGv_i64 op0
, TCGv_i64 op1
, int size
)
4012 case 1: gen_helper_neon_addl_saturate_s32(op0
, cpu_env
, op0
, op1
); break;
4013 case 2: gen_helper_neon_addl_saturate_s64(op0
, cpu_env
, op0
, op1
); break;
4018 static inline void gen_neon_mull(TCGv_i64 dest
, TCGv a
, TCGv b
, int size
, int u
)
4022 switch ((size
<< 1) | u
) {
4023 case 0: gen_helper_neon_mull_s8(dest
, a
, b
); break;
4024 case 1: gen_helper_neon_mull_u8(dest
, a
, b
); break;
4025 case 2: gen_helper_neon_mull_s16(dest
, a
, b
); break;
4026 case 3: gen_helper_neon_mull_u16(dest
, a
, b
); break;
4028 tmp
= gen_muls_i64_i32(a
, b
);
4029 tcg_gen_mov_i64(dest
, tmp
);
4032 tmp
= gen_mulu_i64_i32(a
, b
);
4033 tcg_gen_mov_i64(dest
, tmp
);
4043 /* Translate a NEON data processing instruction. Return nonzero if the
4044 instruction is invalid.
4045 We process data in a mixture of 32-bit and 64-bit chunks.
4046 Mostly we use 32-bit chunks so we can use normal scalar instructions. */
4048 static int disas_neon_data_insn(CPUState
* env
, DisasContext
*s
, uint32_t insn
)
4066 if (!vfp_enabled(env
))
4068 q
= (insn
& (1 << 6)) != 0;
4069 u
= (insn
>> 24) & 1;
4070 VFP_DREG_D(rd
, insn
);
4071 VFP_DREG_N(rn
, insn
);
4072 VFP_DREG_M(rm
, insn
);
4073 size
= (insn
>> 20) & 3;
4074 if ((insn
& (1 << 23)) == 0) {
4075 /* Three register same length. */
4076 op
= ((insn
>> 7) & 0x1e) | ((insn
>> 4) & 1);
4077 if (size
== 3 && (op
== 1 || op
== 5 || op
== 8 || op
== 9
4078 || op
== 10 || op
== 11 || op
== 16)) {
4079 /* 64-bit element instructions. */
4080 for (pass
= 0; pass
< (q
? 2 : 1); pass
++) {
4081 neon_load_reg64(cpu_V0
, rn
+ pass
);
4082 neon_load_reg64(cpu_V1
, rm
+ pass
);
4086 gen_helper_neon_add_saturate_u64(CPU_V001
);
4088 gen_helper_neon_add_saturate_s64(CPU_V001
);
4093 gen_helper_neon_sub_saturate_u64(CPU_V001
);
4095 gen_helper_neon_sub_saturate_s64(CPU_V001
);
4100 gen_helper_neon_shl_u64(cpu_V0
, cpu_V1
, cpu_V0
);
4102 gen_helper_neon_shl_s64(cpu_V0
, cpu_V1
, cpu_V0
);
4107 gen_helper_neon_qshl_u64(cpu_V0
, cpu_env
,
4110 gen_helper_neon_qshl_s64(cpu_V1
, cpu_env
,
4114 case 10: /* VRSHL */
4116 gen_helper_neon_rshl_u64(cpu_V0
, cpu_V1
, cpu_V0
);
4118 gen_helper_neon_rshl_s64(cpu_V0
, cpu_V1
, cpu_V0
);
4121 case 11: /* VQRSHL */
4123 gen_helper_neon_qrshl_u64(cpu_V0
, cpu_env
,
4126 gen_helper_neon_qrshl_s64(cpu_V0
, cpu_env
,
4132 tcg_gen_sub_i64(CPU_V001
);
4134 tcg_gen_add_i64(CPU_V001
);
4140 neon_store_reg64(cpu_V0
, rd
+ pass
);
4147 case 10: /* VRSHL */
4148 case 11: /* VQRSHL */
4151 /* Shift instruction operands are reversed. */
4158 case 20: /* VPMAX */
4159 case 21: /* VPMIN */
4160 case 23: /* VPADD */
4163 case 26: /* VPADD (float) */
4164 pairwise
= (u
&& size
< 2);
4166 case 30: /* VPMIN/VPMAX (float) */
4173 for (pass
= 0; pass
< (q
? 4 : 2); pass
++) {
4182 NEON_GET_REG(T0
, rn
, n
);
4183 NEON_GET_REG(T1
, rn
, n
+ 1);
4185 NEON_GET_REG(T0
, rm
, n
);
4186 NEON_GET_REG(T1
, rm
, n
+ 1);
4190 NEON_GET_REG(T0
, rn
, pass
);
4191 NEON_GET_REG(T1
, rm
, pass
);
4195 GEN_NEON_INTEGER_OP(hadd
);
4198 GEN_NEON_INTEGER_OP_ENV(qadd
);
4200 case 2: /* VRHADD */
4201 GEN_NEON_INTEGER_OP(rhadd
);
4203 case 3: /* Logic ops. */
4204 switch ((u
<< 2) | size
) {
4206 gen_op_andl_T0_T1();
4209 gen_op_bicl_T0_T1();
4219 gen_op_xorl_T0_T1();
4222 tmp
= neon_load_reg(rd
, pass
);
4223 gen_neon_bsl(cpu_T
[0], cpu_T
[0], cpu_T
[1], tmp
);
4227 tmp
= neon_load_reg(rd
, pass
);
4228 gen_neon_bsl(cpu_T
[0], cpu_T
[0], tmp
, cpu_T
[1]);
4232 tmp
= neon_load_reg(rd
, pass
);
4233 gen_neon_bsl(cpu_T
[0], tmp
, cpu_T
[0], cpu_T
[1]);
4239 GEN_NEON_INTEGER_OP(hsub
);
4242 GEN_NEON_INTEGER_OP_ENV(qsub
);
4245 GEN_NEON_INTEGER_OP(cgt
);
4248 GEN_NEON_INTEGER_OP(cge
);
4251 GEN_NEON_INTEGER_OP(shl
);
4254 GEN_NEON_INTEGER_OP_ENV(qshl
);
4256 case 10: /* VRSHL */
4257 GEN_NEON_INTEGER_OP(rshl
);
4259 case 11: /* VQRSHL */
4260 GEN_NEON_INTEGER_OP_ENV(qrshl
);
4263 GEN_NEON_INTEGER_OP(max
);
4266 GEN_NEON_INTEGER_OP(min
);
4269 GEN_NEON_INTEGER_OP(abd
);
4272 GEN_NEON_INTEGER_OP(abd
);
4273 NEON_GET_REG(T1
, rd
, pass
);
4277 if (!u
) { /* VADD */
4278 if (gen_neon_add(size
))
4282 case 0: gen_helper_neon_sub_u8(CPU_T001
); break;
4283 case 1: gen_helper_neon_sub_u16(CPU_T001
); break;
4284 case 2: gen_op_subl_T0_T1(); break;
4290 if (!u
) { /* VTST */
4292 case 0: gen_helper_neon_tst_u8(CPU_T001
); break;
4293 case 1: gen_helper_neon_tst_u16(CPU_T001
); break;
4294 case 2: gen_helper_neon_tst_u32(CPU_T001
); break;
4299 case 0: gen_helper_neon_ceq_u8(CPU_T001
); break;
4300 case 1: gen_helper_neon_ceq_u16(CPU_T001
); break;
4301 case 2: gen_helper_neon_ceq_u32(CPU_T001
); break;
4306 case 18: /* Multiply. */
4308 case 0: gen_helper_neon_mul_u8(CPU_T001
); break;
4309 case 1: gen_helper_neon_mul_u16(CPU_T001
); break;
4310 case 2: gen_op_mul_T0_T1(); break;
4313 NEON_GET_REG(T1
, rd
, pass
);
4321 if (u
) { /* polynomial */
4322 gen_helper_neon_mul_p8(CPU_T001
);
4323 } else { /* Integer */
4325 case 0: gen_helper_neon_mul_u8(CPU_T001
); break;
4326 case 1: gen_helper_neon_mul_u16(CPU_T001
); break;
4327 case 2: gen_op_mul_T0_T1(); break;
4332 case 20: /* VPMAX */
4333 GEN_NEON_INTEGER_OP(pmax
);
4335 case 21: /* VPMIN */
4336 GEN_NEON_INTEGER_OP(pmin
);
4338 case 22: /* Hultiply high. */
4339 if (!u
) { /* VQDMULH */
4341 case 1: gen_helper_neon_qdmulh_s16(CPU_T0E01
); break;
4342 case 2: gen_helper_neon_qdmulh_s32(CPU_T0E01
); break;
4345 } else { /* VQRDHMUL */
4347 case 1: gen_helper_neon_qrdmulh_s16(CPU_T0E01
); break;
4348 case 2: gen_helper_neon_qrdmulh_s32(CPU_T0E01
); break;
4353 case 23: /* VPADD */
4357 case 0: gen_helper_neon_padd_u8(CPU_T001
); break;
4358 case 1: gen_helper_neon_padd_u16(CPU_T001
); break;
4359 case 2: gen_op_addl_T0_T1(); break;
4363 case 26: /* Floating point arithnetic. */
4364 switch ((u
<< 2) | size
) {
4366 gen_helper_neon_add_f32(CPU_T001
);
4369 gen_helper_neon_sub_f32(CPU_T001
);
4372 gen_helper_neon_add_f32(CPU_T001
);
4375 gen_helper_neon_abd_f32(CPU_T001
);
4381 case 27: /* Float multiply. */
4382 gen_helper_neon_mul_f32(CPU_T001
);
4384 NEON_GET_REG(T1
, rd
, pass
);
4386 gen_helper_neon_add_f32(CPU_T001
);
4388 gen_helper_neon_sub_f32(cpu_T
[0], cpu_T
[1], cpu_T
[0]);
4392 case 28: /* Float compare. */
4394 gen_helper_neon_ceq_f32(CPU_T001
);
4397 gen_helper_neon_cge_f32(CPU_T001
);
4399 gen_helper_neon_cgt_f32(CPU_T001
);
4402 case 29: /* Float compare absolute. */
4406 gen_helper_neon_acge_f32(CPU_T001
);
4408 gen_helper_neon_acgt_f32(CPU_T001
);
4410 case 30: /* Float min/max. */
4412 gen_helper_neon_max_f32(CPU_T001
);
4414 gen_helper_neon_min_f32(CPU_T001
);
4418 gen_helper_recps_f32(cpu_T
[0], cpu_T
[0], cpu_T
[1], cpu_env
);
4420 gen_helper_rsqrts_f32(cpu_T
[0], cpu_T
[0], cpu_T
[1], cpu_env
);
4425 /* Save the result. For elementwise operations we can put it
4426 straight into the destination register. For pairwise operations
4427 we have to be careful to avoid clobbering the source operands. */
4428 if (pairwise
&& rd
== rm
) {
4429 gen_neon_movl_scratch_T0(pass
);
4431 NEON_SET_REG(T0
, rd
, pass
);
4435 if (pairwise
&& rd
== rm
) {
4436 for (pass
= 0; pass
< (q
? 4 : 2); pass
++) {
4437 gen_neon_movl_T0_scratch(pass
);
4438 NEON_SET_REG(T0
, rd
, pass
);
4441 /* End of 3 register same size operations. */
4442 } else if (insn
& (1 << 4)) {
4443 if ((insn
& 0x00380080) != 0) {
4444 /* Two registers and shift. */
4445 op
= (insn
>> 8) & 0xf;
4446 if (insn
& (1 << 7)) {
4451 while ((insn
& (1 << (size
+ 19))) == 0)
4454 shift
= (insn
>> 16) & ((1 << (3 + size
)) - 1);
4455 /* To avoid excessive dumplication of ops we implement shift
4456 by immediate using the variable shift operations. */
4458 /* Shift by immediate:
4459 VSHR, VSRA, VRSHR, VRSRA, VSRI, VSHL, VQSHL, VQSHLU. */
4460 /* Right shifts are encoded as N - shift, where N is the
4461 element size in bits. */
4463 shift
= shift
- (1 << (size
+ 3));
4471 imm
= (uint8_t) shift
;
4476 imm
= (uint16_t) shift
;
4487 for (pass
= 0; pass
< count
; pass
++) {
4489 neon_load_reg64(cpu_V0
, rm
+ pass
);
4490 tcg_gen_movi_i64(cpu_V1
, imm
);
4495 gen_helper_neon_shl_u64(cpu_V0
, cpu_V0
, cpu_V1
);
4497 gen_helper_neon_shl_s64(cpu_V0
, cpu_V0
, cpu_V1
);
4502 gen_helper_neon_rshl_u64(cpu_V0
, cpu_V0
, cpu_V1
);
4504 gen_helper_neon_rshl_s64(cpu_V0
, cpu_V0
, cpu_V1
);
4509 gen_helper_neon_shl_u64(cpu_V0
, cpu_V0
, cpu_V1
);
4511 case 5: /* VSHL, VSLI */
4512 gen_helper_neon_shl_u64(cpu_V0
, cpu_V0
, cpu_V1
);
4516 gen_helper_neon_qshl_u64(cpu_V0
, cpu_env
, cpu_V0
, cpu_V1
);
4518 gen_helper_neon_qshl_s64(cpu_V0
, cpu_env
, cpu_V0
, cpu_V1
);
4520 case 7: /* VQSHLU */
4521 gen_helper_neon_qshl_u64(cpu_V0
, cpu_env
, cpu_V0
, cpu_V1
);
4524 if (op
== 1 || op
== 3) {
4526 neon_load_reg64(cpu_V0
, rd
+ pass
);
4527 tcg_gen_add_i64(cpu_V0
, cpu_V0
, cpu_V1
);
4528 } else if (op
== 4 || (op
== 5 && u
)) {
4530 cpu_abort(env
, "VS[LR]I.64 not implemented");
4532 neon_store_reg64(cpu_V0
, rd
+ pass
);
4533 } else { /* size < 3 */
4534 /* Operands in T0 and T1. */
4535 gen_op_movl_T1_im(imm
);
4536 NEON_GET_REG(T0
, rm
, pass
);
4540 GEN_NEON_INTEGER_OP(shl
);
4544 GEN_NEON_INTEGER_OP(rshl
);
4549 GEN_NEON_INTEGER_OP(shl
);
4551 case 5: /* VSHL, VSLI */
4553 case 0: gen_helper_neon_shl_u8(CPU_T001
); break;
4554 case 1: gen_helper_neon_shl_u16(CPU_T001
); break;
4555 case 2: gen_helper_neon_shl_u32(CPU_T001
); break;
4560 GEN_NEON_INTEGER_OP_ENV(qshl
);
4562 case 7: /* VQSHLU */
4564 case 0: gen_helper_neon_qshl_u8(CPU_T0E01
); break;
4565 case 1: gen_helper_neon_qshl_u16(CPU_T0E01
); break;
4566 case 2: gen_helper_neon_qshl_u32(CPU_T0E01
); break;
4572 if (op
== 1 || op
== 3) {
4574 NEON_GET_REG(T1
, rd
, pass
);
4576 } else if (op
== 4 || (op
== 5 && u
)) {
4581 imm
= 0xff >> -shift
;
4583 imm
= (uint8_t)(0xff << shift
);
4589 imm
= 0xffff >> -shift
;
4591 imm
= (uint16_t)(0xffff << shift
);
4596 imm
= 0xffffffffu
>> -shift
;
4598 imm
= 0xffffffffu
<< shift
;
4603 tmp
= neon_load_reg(rd
, pass
);
4604 tcg_gen_andi_i32(cpu_T
[0], cpu_T
[0], imm
);
4605 tcg_gen_andi_i32(tmp
, tmp
, ~imm
);
4606 tcg_gen_or_i32(cpu_T
[0], cpu_T
[0], tmp
);
4608 NEON_SET_REG(T0
, rd
, pass
);
4611 } else if (op
< 10) {
4612 /* Shift by immediate and narrow:
4613 VSHRN, VRSHRN, VQSHRN, VQRSHRN. */
4614 shift
= shift
- (1 << (size
+ 3));
4618 imm
= (uint16_t)shift
;
4620 tmp2
= tcg_const_i32(imm
);
4621 TCGV_UNUSED_I64(tmp64
);
4624 imm
= (uint32_t)shift
;
4625 tmp2
= tcg_const_i32(imm
);
4626 TCGV_UNUSED_I64(tmp64
);
4629 tmp64
= tcg_const_i64(shift
);
4636 for (pass
= 0; pass
< 2; pass
++) {
4638 neon_load_reg64(cpu_V0
, rm
+ pass
);
4641 gen_helper_neon_rshl_u64(cpu_V0
, cpu_V0
, tmp64
);
4643 gen_helper_neon_rshl_s64(cpu_V0
, cpu_V0
, tmp64
);
4646 gen_helper_neon_shl_u64(cpu_V0
, cpu_V0
, tmp64
);
4648 gen_helper_neon_shl_s64(cpu_V0
, cpu_V0
, tmp64
);
4651 tmp
= neon_load_reg(rm
+ pass
, 0);
4652 gen_neon_shift_narrow(size
, tmp
, tmp2
, q
, u
);
4653 tmp3
= neon_load_reg(rm
+ pass
, 1);
4654 gen_neon_shift_narrow(size
, tmp3
, tmp2
, q
, u
);
4655 tcg_gen_concat_i32_i64(cpu_V0
, tmp
, tmp3
);
4660 if (op
== 8 && !u
) {
4661 gen_neon_narrow(size
- 1, tmp
, cpu_V0
);
4664 gen_neon_narrow_sats(size
- 1, tmp
, cpu_V0
);
4666 gen_neon_narrow_satu(size
- 1, tmp
, cpu_V0
);
4671 neon_store_reg(rd
, 0, tmp2
);
4672 neon_store_reg(rd
, 1, tmp
);
4675 } else if (op
== 10) {
4679 tmp
= neon_load_reg(rm
, 0);
4680 tmp2
= neon_load_reg(rm
, 1);
4681 for (pass
= 0; pass
< 2; pass
++) {
4685 gen_neon_widen(cpu_V0
, tmp
, size
, u
);
4688 /* The shift is less than the width of the source
4689 type, so we can just shift the whole register. */
4690 tcg_gen_shli_i64(cpu_V0
, cpu_V0
, shift
);
4691 if (size
< 2 || !u
) {
4694 imm
= (0xffu
>> (8 - shift
));
4697 imm
= 0xffff >> (16 - shift
);
4699 imm64
= imm
| (((uint64_t)imm
) << 32);
4700 tcg_gen_andi_i64(cpu_V0
, cpu_V0
, imm64
);
4703 neon_store_reg64(cpu_V0
, rd
+ pass
);
4705 } else if (op
== 15 || op
== 16) {
4706 /* VCVT fixed-point. */
4707 for (pass
= 0; pass
< (q
? 4 : 2); pass
++) {
4708 tcg_gen_ld_f32(cpu_F0s
, cpu_env
, neon_reg_offset(rm
, pass
));
4711 gen_vfp_ulto(0, shift
);
4713 gen_vfp_slto(0, shift
);
4716 gen_vfp_toul(0, shift
);
4718 gen_vfp_tosl(0, shift
);
4720 tcg_gen_st_f32(cpu_F0s
, cpu_env
, neon_reg_offset(rd
, pass
));
4725 } else { /* (insn & 0x00380080) == 0 */
4728 op
= (insn
>> 8) & 0xf;
4729 /* One register and immediate. */
4730 imm
= (u
<< 7) | ((insn
>> 12) & 0x70) | (insn
& 0xf);
4731 invert
= (insn
& (1 << 5)) != 0;
4749 imm
= (imm
<< 8) | (imm
<< 24);
4752 imm
= (imm
< 8) | 0xff;
4755 imm
= (imm
<< 16) | 0xffff;
4758 imm
|= (imm
<< 8) | (imm
<< 16) | (imm
<< 24);
4763 imm
= ((imm
& 0x80) << 24) | ((imm
& 0x3f) << 19)
4764 | ((imm
& 0x40) ? (0x1f << 25) : (1 << 30));
4770 if (op
!= 14 || !invert
)
4771 gen_op_movl_T1_im(imm
);
4773 for (pass
= 0; pass
< (q
? 4 : 2); pass
++) {
4774 if (op
& 1 && op
< 12) {
4775 tmp
= neon_load_reg(rd
, pass
);
4777 /* The immediate value has already been inverted, so
4779 tcg_gen_andi_i32(tmp
, tmp
, imm
);
4781 tcg_gen_ori_i32(tmp
, tmp
, imm
);
4786 if (op
== 14 && invert
) {
4789 for (n
= 0; n
< 4; n
++) {
4790 if (imm
& (1 << (n
+ (pass
& 1) * 4)))
4791 val
|= 0xff << (n
* 8);
4793 tcg_gen_movi_i32(tmp
, val
);
4795 tcg_gen_movi_i32(tmp
, imm
);
4798 neon_store_reg(rd
, pass
, tmp
);
4801 } else { /* (insn & 0x00800010 == 0x00800000) */
4803 op
= (insn
>> 8) & 0xf;
4804 if ((insn
& (1 << 6)) == 0) {
4805 /* Three registers of different lengths. */
4809 /* prewiden, src1_wide, src2_wide */
4810 static const int neon_3reg_wide
[16][3] = {
4811 {1, 0, 0}, /* VADDL */
4812 {1, 1, 0}, /* VADDW */
4813 {1, 0, 0}, /* VSUBL */
4814 {1, 1, 0}, /* VSUBW */
4815 {0, 1, 1}, /* VADDHN */
4816 {0, 0, 0}, /* VABAL */
4817 {0, 1, 1}, /* VSUBHN */
4818 {0, 0, 0}, /* VABDL */
4819 {0, 0, 0}, /* VMLAL */
4820 {0, 0, 0}, /* VQDMLAL */
4821 {0, 0, 0}, /* VMLSL */
4822 {0, 0, 0}, /* VQDMLSL */
4823 {0, 0, 0}, /* Integer VMULL */
4824 {0, 0, 0}, /* VQDMULL */
4825 {0, 0, 0} /* Polynomial VMULL */
4828 prewiden
= neon_3reg_wide
[op
][0];
4829 src1_wide
= neon_3reg_wide
[op
][1];
4830 src2_wide
= neon_3reg_wide
[op
][2];
4832 if (size
== 0 && (op
== 9 || op
== 11 || op
== 13))
4835 /* Avoid overlapping operands. Wide source operands are
4836 always aligned so will never overlap with wide
4837 destinations in problematic ways. */
4838 if (rd
== rm
&& !src2_wide
) {
4839 NEON_GET_REG(T0
, rm
, 1);
4840 gen_neon_movl_scratch_T0(2);
4841 } else if (rd
== rn
&& !src1_wide
) {
4842 NEON_GET_REG(T0
, rn
, 1);
4843 gen_neon_movl_scratch_T0(2);
4846 for (pass
= 0; pass
< 2; pass
++) {
4848 neon_load_reg64(cpu_V0
, rn
+ pass
);
4851 if (pass
== 1 && rd
== rn
) {
4852 gen_neon_movl_T0_scratch(2);
4854 tcg_gen_mov_i32(tmp
, cpu_T
[0]);
4856 tmp
= neon_load_reg(rn
, pass
);
4859 gen_neon_widen(cpu_V0
, tmp
, size
, u
);
4863 neon_load_reg64(cpu_V1
, rm
+ pass
);
4866 if (pass
== 1 && rd
== rm
) {
4867 gen_neon_movl_T0_scratch(2);
4869 tcg_gen_mov_i32(tmp2
, cpu_T
[0]);
4871 tmp2
= neon_load_reg(rm
, pass
);
4874 gen_neon_widen(cpu_V1
, tmp2
, size
, u
);
4878 case 0: case 1: case 4: /* VADDL, VADDW, VADDHN, VRADDHN */
4879 gen_neon_addl(size
);
4881 case 2: case 3: case 6: /* VSUBL, VSUBW, VSUBHL, VRSUBHL */
4882 gen_neon_subl(size
);
4884 case 5: case 7: /* VABAL, VABDL */
4885 switch ((size
<< 1) | u
) {
4887 gen_helper_neon_abdl_s16(cpu_V0
, tmp
, tmp2
);
4890 gen_helper_neon_abdl_u16(cpu_V0
, tmp
, tmp2
);
4893 gen_helper_neon_abdl_s32(cpu_V0
, tmp
, tmp2
);
4896 gen_helper_neon_abdl_u32(cpu_V0
, tmp
, tmp2
);
4899 gen_helper_neon_abdl_s64(cpu_V0
, tmp
, tmp2
);
4902 gen_helper_neon_abdl_u64(cpu_V0
, tmp
, tmp2
);
4909 case 8: case 9: case 10: case 11: case 12: case 13:
4910 /* VMLAL, VQDMLAL, VMLSL, VQDMLSL, VMULL, VQDMULL */
4911 gen_neon_mull(cpu_V0
, tmp
, tmp2
, size
, u
);
4913 case 14: /* Polynomial VMULL */
4914 cpu_abort(env
, "Polynomial VMULL not implemented");
4916 default: /* 15 is RESERVED. */
4919 if (op
== 5 || op
== 13 || (op
>= 8 && op
<= 11)) {
4921 if (op
== 10 || op
== 11) {
4922 gen_neon_negl(cpu_V0
, size
);
4926 neon_load_reg64(cpu_V1
, rd
+ pass
);
4930 case 5: case 8: case 10: /* VABAL, VMLAL, VMLSL */
4931 gen_neon_addl(size
);
4933 case 9: case 11: /* VQDMLAL, VQDMLSL */
4934 gen_neon_addl_saturate(cpu_V0
, cpu_V0
, size
);
4935 gen_neon_addl_saturate(cpu_V0
, cpu_V1
, size
);
4938 case 13: /* VQDMULL */
4939 gen_neon_addl_saturate(cpu_V0
, cpu_V0
, size
);
4944 neon_store_reg64(cpu_V0
, rd
+ pass
);
4945 } else if (op
== 4 || op
== 6) {
4946 /* Narrowing operation. */
4951 gen_helper_neon_narrow_high_u8(tmp
, cpu_V0
);
4954 gen_helper_neon_narrow_high_u16(tmp
, cpu_V0
);
4957 tcg_gen_shri_i64(cpu_V0
, cpu_V0
, 32);
4958 tcg_gen_trunc_i64_i32(tmp
, cpu_V0
);
4965 gen_helper_neon_narrow_round_high_u8(tmp
, cpu_V0
);
4968 gen_helper_neon_narrow_round_high_u16(tmp
, cpu_V0
);
4971 tcg_gen_addi_i64(cpu_V0
, cpu_V0
, 1u << 31);
4972 tcg_gen_shri_i64(cpu_V0
, cpu_V0
, 32);
4973 tcg_gen_trunc_i64_i32(tmp
, cpu_V0
);
4981 neon_store_reg(rd
, 0, tmp3
);
4982 neon_store_reg(rd
, 1, tmp
);
4985 /* Write back the result. */
4986 neon_store_reg64(cpu_V0
, rd
+ pass
);
4990 /* Two registers and a scalar. */
4992 case 0: /* Integer VMLA scalar */
4993 case 1: /* Float VMLA scalar */
4994 case 4: /* Integer VMLS scalar */
4995 case 5: /* Floating point VMLS scalar */
4996 case 8: /* Integer VMUL scalar */
4997 case 9: /* Floating point VMUL scalar */
4998 case 12: /* VQDMULH scalar */
4999 case 13: /* VQRDMULH scalar */
5000 gen_neon_get_scalar(size
, rm
);
5001 gen_neon_movl_scratch_T0(0);
5002 for (pass
= 0; pass
< (u
? 4 : 2); pass
++) {
5004 gen_neon_movl_T0_scratch(0);
5005 NEON_GET_REG(T1
, rn
, pass
);
5008 gen_helper_neon_qdmulh_s16(CPU_T0E01
);
5010 gen_helper_neon_qdmulh_s32(CPU_T0E01
);
5012 } else if (op
== 13) {
5014 gen_helper_neon_qrdmulh_s16(CPU_T0E01
);
5016 gen_helper_neon_qrdmulh_s32(CPU_T0E01
);
5018 } else if (op
& 1) {
5019 gen_helper_neon_mul_f32(CPU_T001
);
5022 case 0: gen_helper_neon_mul_u8(CPU_T001
); break;
5023 case 1: gen_helper_neon_mul_u16(CPU_T001
); break;
5024 case 2: gen_op_mul_T0_T1(); break;
5030 NEON_GET_REG(T1
, rd
, pass
);
5036 gen_helper_neon_add_f32(CPU_T001
);
5042 gen_helper_neon_sub_f32(cpu_T
[0], cpu_T
[1], cpu_T
[0]);
5048 NEON_SET_REG(T0
, rd
, pass
);
5051 case 2: /* VMLAL sclar */
5052 case 3: /* VQDMLAL scalar */
5053 case 6: /* VMLSL scalar */
5054 case 7: /* VQDMLSL scalar */
5055 case 10: /* VMULL scalar */
5056 case 11: /* VQDMULL scalar */
5057 if (size
== 0 && (op
== 3 || op
== 7 || op
== 11))
5060 gen_neon_get_scalar(size
, rm
);
5061 NEON_GET_REG(T1
, rn
, 1);
5063 for (pass
= 0; pass
< 2; pass
++) {
5065 tmp
= neon_load_reg(rn
, 0);
5068 tcg_gen_mov_i32(tmp
, cpu_T
[1]);
5071 tcg_gen_mov_i32(tmp2
, cpu_T
[0]);
5072 gen_neon_mull(cpu_V0
, tmp
, tmp2
, size
, u
);
5073 if (op
== 6 || op
== 7) {
5074 gen_neon_negl(cpu_V0
, size
);
5077 neon_load_reg64(cpu_V1
, rd
+ pass
);
5081 gen_neon_addl(size
);
5084 gen_neon_addl_saturate(cpu_V0
, cpu_V0
, size
);
5085 gen_neon_addl_saturate(cpu_V0
, cpu_V1
, size
);
5091 gen_neon_addl_saturate(cpu_V0
, cpu_V0
, size
);
5096 neon_store_reg64(cpu_V0
, rd
+ pass
);
5099 default: /* 14 and 15 are RESERVED */
5103 } else { /* size == 3 */
5106 imm
= (insn
>> 8) & 0xf;
5113 neon_load_reg64(cpu_V0
, rn
);
5115 neon_load_reg64(cpu_V1
, rn
+ 1);
5117 } else if (imm
== 8) {
5118 neon_load_reg64(cpu_V0
, rn
+ 1);
5120 neon_load_reg64(cpu_V1
, rm
);
5123 tmp64
= tcg_temp_new_i64();
5125 neon_load_reg64(cpu_V0
, rn
);
5126 neon_load_reg64(tmp64
, rn
+ 1);
5128 neon_load_reg64(cpu_V0
, rn
+ 1);
5129 neon_load_reg64(tmp64
, rm
);
5131 tcg_gen_shri_i64(cpu_V0
, cpu_V0
, (imm
& 7) * 8);
5132 tcg_gen_shli_i64(cpu_V1
, tmp64
, 64 - ((imm
& 7) * 8));
5133 tcg_gen_or_i64(cpu_V0
, cpu_V0
, cpu_V1
);
5135 neon_load_reg64(cpu_V1
, rm
);
5137 neon_load_reg64(cpu_V1
, rm
+ 1);
5140 tcg_gen_shli_i64(cpu_V1
, cpu_V1
, 64 - (imm
* 8));
5141 tcg_gen_shri_i64(tmp64
, tmp64
, imm
* 8);
5142 tcg_gen_or_i64(cpu_V1
, cpu_V1
, tmp64
);
5145 neon_load_reg64(cpu_V0
, rn
);
5146 tcg_gen_shri_i64(cpu_V0
, cpu_V0
, imm
* 8);
5147 neon_load_reg64(cpu_V1
, rm
);
5148 tcg_gen_shli_i64(cpu_V1
, cpu_V1
, 64 - (imm
* 8));
5149 tcg_gen_or_i64(cpu_V0
, cpu_V0
, cpu_V1
);
5151 neon_store_reg64(cpu_V0
, rd
);
5153 neon_store_reg64(cpu_V1
, rd
+ 1);
5155 } else if ((insn
& (1 << 11)) == 0) {
5156 /* Two register misc. */
5157 op
= ((insn
>> 12) & 0x30) | ((insn
>> 7) & 0xf);
5158 size
= (insn
>> 18) & 3;
5160 case 0: /* VREV64 */
5163 for (pass
= 0; pass
< (q
? 2 : 1); pass
++) {
5164 NEON_GET_REG(T0
, rm
, pass
* 2);
5165 NEON_GET_REG(T1
, rm
, pass
* 2 + 1);
5167 case 0: tcg_gen_bswap32_i32(cpu_T
[0], cpu_T
[0]); break;
5168 case 1: gen_swap_half(cpu_T
[0]); break;
5169 case 2: /* no-op */ break;
5172 NEON_SET_REG(T0
, rd
, pass
* 2 + 1);
5174 NEON_SET_REG(T1
, rd
, pass
* 2);
5176 gen_op_movl_T0_T1();
5178 case 0: tcg_gen_bswap32_i32(cpu_T
[0], cpu_T
[0]); break;
5179 case 1: gen_swap_half(cpu_T
[0]); break;
5182 NEON_SET_REG(T0
, rd
, pass
* 2);
5186 case 4: case 5: /* VPADDL */
5187 case 12: case 13: /* VPADAL */
5190 for (pass
= 0; pass
< q
+ 1; pass
++) {
5191 tmp
= neon_load_reg(rm
, pass
* 2);
5192 gen_neon_widen(cpu_V0
, tmp
, size
, op
& 1);
5193 tmp
= neon_load_reg(rm
, pass
* 2 + 1);
5194 gen_neon_widen(cpu_V1
, tmp
, size
, op
& 1);
5196 case 0: gen_helper_neon_paddl_u16(CPU_V001
); break;
5197 case 1: gen_helper_neon_paddl_u32(CPU_V001
); break;
5198 case 2: tcg_gen_add_i64(CPU_V001
); break;
5203 neon_load_reg64(cpu_V1
, rd
+ pass
);
5204 gen_neon_addl(size
);
5206 neon_store_reg64(cpu_V0
, rd
+ pass
);
5211 for (n
= 0; n
< (q
? 4 : 2); n
+= 2) {
5212 NEON_GET_REG(T0
, rm
, n
);
5213 NEON_GET_REG(T1
, rd
, n
+ 1);
5214 NEON_SET_REG(T1
, rm
, n
);
5215 NEON_SET_REG(T0
, rd
, n
+ 1);
5223 Rd A3 A2 A1 A0 B2 B0 A2 A0
5224 Rm B3 B2 B1 B0 B3 B1 A3 A1
5228 gen_neon_unzip(rd
, q
, 0, size
);
5229 gen_neon_unzip(rm
, q
, 4, size
);
5231 static int unzip_order_q
[8] =
5232 {0, 2, 4, 6, 1, 3, 5, 7};
5233 for (n
= 0; n
< 8; n
++) {
5234 int reg
= (n
< 4) ? rd
: rm
;
5235 gen_neon_movl_T0_scratch(unzip_order_q
[n
]);
5236 NEON_SET_REG(T0
, reg
, n
% 4);
5239 static int unzip_order
[4] =
5241 for (n
= 0; n
< 4; n
++) {
5242 int reg
= (n
< 2) ? rd
: rm
;
5243 gen_neon_movl_T0_scratch(unzip_order
[n
]);
5244 NEON_SET_REG(T0
, reg
, n
% 2);
5250 Rd A3 A2 A1 A0 B1 A1 B0 A0
5251 Rm B3 B2 B1 B0 B3 A3 B2 A2
5255 count
= (q
? 4 : 2);
5256 for (n
= 0; n
< count
; n
++) {
5257 NEON_GET_REG(T0
, rd
, n
);
5258 NEON_GET_REG(T1
, rd
, n
);
5260 case 0: gen_helper_neon_zip_u8(); break;
5261 case 1: gen_helper_neon_zip_u16(); break;
5262 case 2: /* no-op */; break;
5265 gen_neon_movl_scratch_T0(n
* 2);
5266 gen_neon_movl_scratch_T1(n
* 2 + 1);
5268 for (n
= 0; n
< count
* 2; n
++) {
5269 int reg
= (n
< count
) ? rd
: rm
;
5270 gen_neon_movl_T0_scratch(n
);
5271 NEON_SET_REG(T0
, reg
, n
% count
);
5274 case 36: case 37: /* VMOVN, VQMOVUN, VQMOVN */
5278 for (pass
= 0; pass
< 2; pass
++) {
5279 neon_load_reg64(cpu_V0
, rm
+ pass
);
5281 if (op
== 36 && q
== 0) {
5282 gen_neon_narrow(size
, tmp
, cpu_V0
);
5284 gen_neon_narrow_satu(size
, tmp
, cpu_V0
);
5286 gen_neon_narrow_sats(size
, tmp
, cpu_V0
);
5291 neon_store_reg(rd
, 0, tmp2
);
5292 neon_store_reg(rd
, 1, tmp
);
5296 case 38: /* VSHLL */
5299 tmp
= neon_load_reg(rm
, 0);
5300 tmp2
= neon_load_reg(rm
, 1);
5301 for (pass
= 0; pass
< 2; pass
++) {
5304 gen_neon_widen(cpu_V0
, tmp
, size
, 1);
5305 neon_store_reg64(cpu_V0
, rd
+ pass
);
5310 for (pass
= 0; pass
< (q
? 4 : 2); pass
++) {
5311 if (op
== 30 || op
== 31 || op
>= 58) {
5312 tcg_gen_ld_f32(cpu_F0s
, cpu_env
,
5313 neon_reg_offset(rm
, pass
));
5315 NEON_GET_REG(T0
, rm
, pass
);
5318 case 1: /* VREV32 */
5320 case 0: tcg_gen_bswap32_i32(cpu_T
[0], cpu_T
[0]); break;
5321 case 1: gen_swap_half(cpu_T
[0]); break;
5325 case 2: /* VREV16 */
5328 gen_rev16(cpu_T
[0]);
5332 case 0: gen_helper_neon_cls_s8(cpu_T
[0], cpu_T
[0]); break;
5333 case 1: gen_helper_neon_cls_s16(cpu_T
[0], cpu_T
[0]); break;
5334 case 2: gen_helper_neon_cls_s32(cpu_T
[0], cpu_T
[0]); break;
5340 case 0: gen_helper_neon_clz_u8(cpu_T
[0], cpu_T
[0]); break;
5341 case 1: gen_helper_neon_clz_u16(cpu_T
[0], cpu_T
[0]); break;
5342 case 2: gen_helper_clz(cpu_T
[0], cpu_T
[0]); break;
5349 gen_helper_neon_cnt_u8(cpu_T
[0], cpu_T
[0]);
5356 case 14: /* VQABS */
5358 case 0: gen_helper_neon_qabs_s8(cpu_T
[0], cpu_env
, cpu_T
[0]); break;
5359 case 1: gen_helper_neon_qabs_s16(cpu_T
[0], cpu_env
, cpu_T
[0]); break;
5360 case 2: gen_helper_neon_qabs_s32(cpu_T
[0], cpu_env
, cpu_T
[0]); break;
5364 case 15: /* VQNEG */
5366 case 0: gen_helper_neon_qneg_s8(cpu_T
[0], cpu_env
, cpu_T
[0]); break;
5367 case 1: gen_helper_neon_qneg_s16(cpu_T
[0], cpu_env
, cpu_T
[0]); break;
5368 case 2: gen_helper_neon_qneg_s32(cpu_T
[0], cpu_env
, cpu_T
[0]); break;
5372 case 16: case 19: /* VCGT #0, VCLE #0 */
5373 gen_op_movl_T1_im(0);
5375 case 0: gen_helper_neon_cgt_s8(CPU_T001
); break;
5376 case 1: gen_helper_neon_cgt_s16(CPU_T001
); break;
5377 case 2: gen_helper_neon_cgt_s32(CPU_T001
); break;
5383 case 17: case 20: /* VCGE #0, VCLT #0 */
5384 gen_op_movl_T1_im(0);
5386 case 0: gen_helper_neon_cge_s8(CPU_T001
); break;
5387 case 1: gen_helper_neon_cge_s16(CPU_T001
); break;
5388 case 2: gen_helper_neon_cge_s32(CPU_T001
); break;
5394 case 18: /* VCEQ #0 */
5395 gen_op_movl_T1_im(0);
5397 case 0: gen_helper_neon_ceq_u8(CPU_T001
); break;
5398 case 1: gen_helper_neon_ceq_u16(CPU_T001
); break;
5399 case 2: gen_helper_neon_ceq_u32(CPU_T001
); break;
5405 case 0: gen_helper_neon_abs_s8(cpu_T
[0], cpu_T
[0]); break;
5406 case 1: gen_helper_neon_abs_s16(cpu_T
[0], cpu_T
[0]); break;
5407 case 2: tcg_gen_abs_i32(cpu_T
[0], cpu_T
[0]); break;
5412 gen_op_movl_T1_im(0);
5417 case 24: case 27: /* Float VCGT #0, Float VCLE #0 */
5418 gen_op_movl_T1_im(0);
5419 gen_helper_neon_cgt_f32(CPU_T001
);
5423 case 25: case 28: /* Float VCGE #0, Float VCLT #0 */
5424 gen_op_movl_T1_im(0);
5425 gen_helper_neon_cge_f32(CPU_T001
);
5429 case 26: /* Float VCEQ #0 */
5430 gen_op_movl_T1_im(0);
5431 gen_helper_neon_ceq_f32(CPU_T001
);
5433 case 30: /* Float VABS */
5436 case 31: /* Float VNEG */
5440 NEON_GET_REG(T1
, rd
, pass
);
5441 NEON_SET_REG(T1
, rm
, pass
);
5444 NEON_GET_REG(T1
, rd
, pass
);
5446 case 0: gen_helper_neon_trn_u8(); break;
5447 case 1: gen_helper_neon_trn_u16(); break;
5451 NEON_SET_REG(T1
, rm
, pass
);
5453 case 56: /* Integer VRECPE */
5454 gen_helper_recpe_u32(cpu_T
[0], cpu_T
[0], cpu_env
);
5456 case 57: /* Integer VRSQRTE */
5457 gen_helper_rsqrte_u32(cpu_T
[0], cpu_T
[0], cpu_env
);
5459 case 58: /* Float VRECPE */
5460 gen_helper_recpe_f32(cpu_F0s
, cpu_F0s
, cpu_env
);
5462 case 59: /* Float VRSQRTE */
5463 gen_helper_rsqrte_f32(cpu_F0s
, cpu_F0s
, cpu_env
);
5465 case 60: /* VCVT.F32.S32 */
5468 case 61: /* VCVT.F32.U32 */
5471 case 62: /* VCVT.S32.F32 */
5474 case 63: /* VCVT.U32.F32 */
5478 /* Reserved: 21, 29, 39-56 */
5481 if (op
== 30 || op
== 31 || op
>= 58) {
5482 tcg_gen_st_f32(cpu_F0s
, cpu_env
,
5483 neon_reg_offset(rd
, pass
));
5485 NEON_SET_REG(T0
, rd
, pass
);
5490 } else if ((insn
& (1 << 10)) == 0) {
5492 n
= ((insn
>> 5) & 0x18) + 8;
5493 if (insn
& (1 << 6)) {
5494 tmp
= neon_load_reg(rd
, 0);
5497 tcg_gen_movi_i32(tmp
, 0);
5499 tmp2
= neon_load_reg(rm
, 0);
5500 gen_helper_neon_tbl(tmp2
, tmp2
, tmp
, tcg_const_i32(rn
),
5503 if (insn
& (1 << 6)) {
5504 tmp
= neon_load_reg(rd
, 1);
5507 tcg_gen_movi_i32(tmp
, 0);
5509 tmp3
= neon_load_reg(rm
, 1);
5510 gen_helper_neon_tbl(tmp3
, tmp3
, tmp
, tcg_const_i32(rn
),
5512 neon_store_reg(rd
, 0, tmp2
);
5513 neon_store_reg(rd
, 1, tmp3
);
5515 } else if ((insn
& 0x380) == 0) {
5517 if (insn
& (1 << 19)) {
5518 NEON_SET_REG(T0
, rm
, 1);
5520 NEON_SET_REG(T0
, rm
, 0);
5522 if (insn
& (1 << 16)) {
5523 gen_neon_dup_u8(cpu_T
[0], ((insn
>> 17) & 3) * 8);
5524 } else if (insn
& (1 << 17)) {
5525 if ((insn
>> 18) & 1)
5526 gen_neon_dup_high16(cpu_T
[0]);
5528 gen_neon_dup_low16(cpu_T
[0]);
5530 for (pass
= 0; pass
< (q
? 4 : 2); pass
++) {
5531 NEON_SET_REG(T0
, rd
, pass
);
5541 static int disas_cp14_read(CPUState
* env
, DisasContext
*s
, uint32_t insn
)
5543 int crn
= (insn
>> 16) & 0xf;
5544 int crm
= insn
& 0xf;
5545 int op1
= (insn
>> 21) & 7;
5546 int op2
= (insn
>> 5) & 7;
5547 int rt
= (insn
>> 12) & 0xf;
5550 if (arm_feature(env
, ARM_FEATURE_THUMB2EE
)) {
5551 if (op1
== 6 && crn
== 0 && crm
== 0 && op2
== 0) {
5555 tmp
= load_cpu_field(teecr
);
5556 store_reg(s
, rt
, tmp
);
5559 if (op1
== 6 && crn
== 1 && crm
== 0 && op2
== 0) {
5561 if (IS_USER(s
) && (env
->teecr
& 1))
5563 tmp
= load_cpu_field(teehbr
);
5564 store_reg(s
, rt
, tmp
);
5568 fprintf(stderr
, "Unknown cp14 read op1:%d crn:%d crm:%d op2:%d\n",
5569 op1
, crn
, crm
, op2
);
5573 static int disas_cp14_write(CPUState
* env
, DisasContext
*s
, uint32_t insn
)
5575 int crn
= (insn
>> 16) & 0xf;
5576 int crm
= insn
& 0xf;
5577 int op1
= (insn
>> 21) & 7;
5578 int op2
= (insn
>> 5) & 7;
5579 int rt
= (insn
>> 12) & 0xf;
5582 if (arm_feature(env
, ARM_FEATURE_THUMB2EE
)) {
5583 if (op1
== 6 && crn
== 0 && crm
== 0 && op2
== 0) {
5587 tmp
= load_reg(s
, rt
);
5588 gen_helper_set_teecr(cpu_env
, tmp
);
5592 if (op1
== 6 && crn
== 1 && crm
== 0 && op2
== 0) {
5594 if (IS_USER(s
) && (env
->teecr
& 1))
5596 tmp
= load_reg(s
, rt
);
5597 store_cpu_field(tmp
, teehbr
);
5601 fprintf(stderr
, "Unknown cp14 write op1:%d crn:%d crm:%d op2:%d\n",
5602 op1
, crn
, crm
, op2
);
5606 static int disas_coproc_insn(CPUState
* env
, DisasContext
*s
, uint32_t insn
)
5610 cpnum
= (insn
>> 8) & 0xf;
5611 if (arm_feature(env
, ARM_FEATURE_XSCALE
)
5612 && ((env
->cp15
.c15_cpar
^ 0x3fff) & (1 << cpnum
)))
5618 if (arm_feature(env
, ARM_FEATURE_IWMMXT
)) {
5619 return disas_iwmmxt_insn(env
, s
, insn
);
5620 } else if (arm_feature(env
, ARM_FEATURE_XSCALE
)) {
5621 return disas_dsp_insn(env
, s
, insn
);
5626 return disas_vfp_insn (env
, s
, insn
);
5628 /* Coprocessors 7-15 are architecturally reserved by ARM.
5629 Unfortunately Intel decided to ignore this. */
5630 if (arm_feature(env
, ARM_FEATURE_XSCALE
))
5632 if (insn
& (1 << 20))
5633 return disas_cp14_read(env
, s
, insn
);
5635 return disas_cp14_write(env
, s
, insn
);
5637 return disas_cp15_insn (env
, s
, insn
);
5640 /* Unknown coprocessor. See if the board has hooked it. */
5641 return disas_cp_insn (env
, s
, insn
);
5646 /* Store a 64-bit value to a register pair. Clobbers val. */
5647 static void gen_storeq_reg(DisasContext
*s
, int rlow
, int rhigh
, TCGv_i64 val
)
5651 tcg_gen_trunc_i64_i32(tmp
, val
);
5652 store_reg(s
, rlow
, tmp
);
5654 tcg_gen_shri_i64(val
, val
, 32);
5655 tcg_gen_trunc_i64_i32(tmp
, val
);
5656 store_reg(s
, rhigh
, tmp
);
5659 /* load a 32-bit value from a register and perform a 64-bit accumulate. */
5660 static void gen_addq_lo(DisasContext
*s
, TCGv_i64 val
, int rlow
)
5665 /* Load value and extend to 64 bits. */
5666 tmp
= tcg_temp_new_i64();
5667 tmp2
= load_reg(s
, rlow
);
5668 tcg_gen_extu_i32_i64(tmp
, tmp2
);
5670 tcg_gen_add_i64(val
, val
, tmp
);
5673 /* load and add a 64-bit value from a register pair. */
5674 static void gen_addq(DisasContext
*s
, TCGv_i64 val
, int rlow
, int rhigh
)
5680 /* Load 64-bit value rd:rn. */
5681 tmpl
= load_reg(s
, rlow
);
5682 tmph
= load_reg(s
, rhigh
);
5683 tmp
= tcg_temp_new_i64();
5684 tcg_gen_concat_i32_i64(tmp
, tmpl
, tmph
);
5687 tcg_gen_add_i64(val
, val
, tmp
);
5690 /* Set N and Z flags from a 64-bit value. */
5691 static void gen_logicq_cc(TCGv_i64 val
)
5693 TCGv tmp
= new_tmp();
5694 gen_helper_logicq_cc(tmp
, val
);
5699 static void disas_arm_insn(CPUState
* env
, DisasContext
*s
)
5701 unsigned int cond
, insn
, val
, op1
, i
, shift
, rm
, rs
, rn
, rd
, sh
;
5708 insn
= ldl_code(s
->pc
);
5711 /* M variants do not implement ARM mode. */
5716 /* Unconditional instructions. */
5717 if (((insn
>> 25) & 7) == 1) {
5718 /* NEON Data processing. */
5719 if (!arm_feature(env
, ARM_FEATURE_NEON
))
5722 if (disas_neon_data_insn(env
, s
, insn
))
5726 if ((insn
& 0x0f100000) == 0x04000000) {
5727 /* NEON load/store. */
5728 if (!arm_feature(env
, ARM_FEATURE_NEON
))
5731 if (disas_neon_ls_insn(env
, s
, insn
))
5735 if ((insn
& 0x0d70f000) == 0x0550f000)
5737 else if ((insn
& 0x0ffffdff) == 0x01010000) {
5740 if (insn
& (1 << 9)) {
5741 /* BE8 mode not implemented. */
5745 } else if ((insn
& 0x0fffff00) == 0x057ff000) {
5746 switch ((insn
>> 4) & 0xf) {
5749 gen_helper_clrex(cpu_env
);
5755 /* We don't emulate caches so these are a no-op. */
5760 } else if ((insn
& 0x0e5fffe0) == 0x084d0500) {
5766 op1
= (insn
& 0x1f);
5767 if (op1
== (env
->uncached_cpsr
& CPSR_M
)) {
5768 addr
= load_reg(s
, 13);
5771 gen_helper_get_r13_banked(addr
, cpu_env
, tcg_const_i32(op1
));
5773 i
= (insn
>> 23) & 3;
5775 case 0: offset
= -4; break; /* DA */
5776 case 1: offset
= -8; break; /* DB */
5777 case 2: offset
= 0; break; /* IA */
5778 case 3: offset
= 4; break; /* IB */
5782 tcg_gen_addi_i32(addr
, addr
, offset
);
5783 tmp
= load_reg(s
, 14);
5784 gen_st32(tmp
, addr
, 0);
5786 gen_helper_cpsr_read(tmp
);
5787 tcg_gen_addi_i32(addr
, addr
, 4);
5788 gen_st32(tmp
, addr
, 0);
5789 if (insn
& (1 << 21)) {
5790 /* Base writeback. */
5792 case 0: offset
= -8; break;
5793 case 1: offset
= -4; break;
5794 case 2: offset
= 4; break;
5795 case 3: offset
= 0; break;
5799 tcg_gen_addi_i32(addr
, tmp
, offset
);
5800 if (op1
== (env
->uncached_cpsr
& CPSR_M
)) {
5801 gen_movl_reg_T1(s
, 13);
5803 gen_helper_set_r13_banked(cpu_env
, tcg_const_i32(op1
), cpu_T
[1]);
5808 } else if ((insn
& 0x0e5fffe0) == 0x081d0a00) {
5814 rn
= (insn
>> 16) & 0xf;
5815 addr
= load_reg(s
, rn
);
5816 i
= (insn
>> 23) & 3;
5818 case 0: offset
= -4; break; /* DA */
5819 case 1: offset
= -8; break; /* DB */
5820 case 2: offset
= 0; break; /* IA */
5821 case 3: offset
= 4; break; /* IB */
5825 tcg_gen_addi_i32(addr
, addr
, offset
);
5826 /* Load PC into tmp and CPSR into tmp2. */
5827 tmp
= gen_ld32(addr
, 0);
5828 tcg_gen_addi_i32(addr
, addr
, 4);
5829 tmp2
= gen_ld32(addr
, 0);
5830 if (insn
& (1 << 21)) {
5831 /* Base writeback. */
5833 case 0: offset
= -8; break;
5834 case 1: offset
= -4; break;
5835 case 2: offset
= 4; break;
5836 case 3: offset
= 0; break;
5840 tcg_gen_addi_i32(addr
, addr
, offset
);
5841 store_reg(s
, rn
, addr
);
5845 gen_rfe(s
, tmp
, tmp2
);
5846 } else if ((insn
& 0x0e000000) == 0x0a000000) {
5847 /* branch link and change to thumb (blx <offset>) */
5850 val
= (uint32_t)s
->pc
;
5852 tcg_gen_movi_i32(tmp
, val
);
5853 store_reg(s
, 14, tmp
);
5854 /* Sign-extend the 24-bit offset */
5855 offset
= (((int32_t)insn
) << 8) >> 8;
5856 /* offset * 4 + bit24 * 2 + (thumb bit) */
5857 val
+= (offset
<< 2) | ((insn
>> 23) & 2) | 1;
5858 /* pipeline offset */
5862 } else if ((insn
& 0x0e000f00) == 0x0c000100) {
5863 if (arm_feature(env
, ARM_FEATURE_IWMMXT
)) {
5864 /* iWMMXt register transfer. */
5865 if (env
->cp15
.c15_cpar
& (1 << 1))
5866 if (!disas_iwmmxt_insn(env
, s
, insn
))
5869 } else if ((insn
& 0x0fe00000) == 0x0c400000) {
5870 /* Coprocessor double register transfer. */
5871 } else if ((insn
& 0x0f000010) == 0x0e000010) {
5872 /* Additional coprocessor register transfer. */
5873 } else if ((insn
& 0x0ff10020) == 0x01000000) {
5876 /* cps (privileged) */
5880 if (insn
& (1 << 19)) {
5881 if (insn
& (1 << 8))
5883 if (insn
& (1 << 7))
5885 if (insn
& (1 << 6))
5887 if (insn
& (1 << 18))
5890 if (insn
& (1 << 17)) {
5892 val
|= (insn
& 0x1f);
5895 gen_op_movl_T0_im(val
);
5896 gen_set_psr_T0(s
, mask
, 0);
5903 /* if not always execute, we generate a conditional jump to
5905 s
->condlabel
= gen_new_label();
5906 gen_test_cc(cond
^ 1, s
->condlabel
);
5909 if ((insn
& 0x0f900000) == 0x03000000) {
5910 if ((insn
& (1 << 21)) == 0) {
5912 rd
= (insn
>> 12) & 0xf;
5913 val
= ((insn
>> 4) & 0xf000) | (insn
& 0xfff);
5914 if ((insn
& (1 << 22)) == 0) {
5917 tcg_gen_movi_i32(tmp
, val
);
5920 tmp
= load_reg(s
, rd
);
5921 tcg_gen_ext16u_i32(tmp
, tmp
);
5922 tcg_gen_ori_i32(tmp
, tmp
, val
<< 16);
5924 store_reg(s
, rd
, tmp
);
5926 if (((insn
>> 12) & 0xf) != 0xf)
5928 if (((insn
>> 16) & 0xf) == 0) {
5929 gen_nop_hint(s
, insn
& 0xff);
5931 /* CPSR = immediate */
5933 shift
= ((insn
>> 8) & 0xf) * 2;
5935 val
= (val
>> shift
) | (val
<< (32 - shift
));
5936 gen_op_movl_T0_im(val
);
5937 i
= ((insn
& (1 << 22)) != 0);
5938 if (gen_set_psr_T0(s
, msr_mask(env
, s
, (insn
>> 16) & 0xf, i
), i
))
5942 } else if ((insn
& 0x0f900000) == 0x01000000
5943 && (insn
& 0x00000090) != 0x00000090) {
5944 /* miscellaneous instructions */
5945 op1
= (insn
>> 21) & 3;
5946 sh
= (insn
>> 4) & 0xf;
5949 case 0x0: /* move program status register */
5952 gen_movl_T0_reg(s
, rm
);
5953 i
= ((op1
& 2) != 0);
5954 if (gen_set_psr_T0(s
, msr_mask(env
, s
, (insn
>> 16) & 0xf, i
), i
))
5958 rd
= (insn
>> 12) & 0xf;
5962 tmp
= load_cpu_field(spsr
);
5965 gen_helper_cpsr_read(tmp
);
5967 store_reg(s
, rd
, tmp
);
5972 /* branch/exchange thumb (bx). */
5973 tmp
= load_reg(s
, rm
);
5975 } else if (op1
== 3) {
5977 rd
= (insn
>> 12) & 0xf;
5978 tmp
= load_reg(s
, rm
);
5979 gen_helper_clz(tmp
, tmp
);
5980 store_reg(s
, rd
, tmp
);
5988 /* Trivial implementation equivalent to bx. */
5989 tmp
= load_reg(s
, rm
);
5999 /* branch link/exchange thumb (blx) */
6000 tmp
= load_reg(s
, rm
);
6002 tcg_gen_movi_i32(tmp2
, s
->pc
);
6003 store_reg(s
, 14, tmp2
);
6006 case 0x5: /* saturating add/subtract */
6007 rd
= (insn
>> 12) & 0xf;
6008 rn
= (insn
>> 16) & 0xf;
6009 tmp
= load_reg(s
, rm
);
6010 tmp2
= load_reg(s
, rn
);
6012 gen_helper_double_saturate(tmp2
, tmp2
);
6014 gen_helper_sub_saturate(tmp
, tmp
, tmp2
);
6016 gen_helper_add_saturate(tmp
, tmp
, tmp2
);
6018 store_reg(s
, rd
, tmp
);
6021 gen_set_condexec(s
);
6022 gen_set_pc_im(s
->pc
- 4);
6023 gen_exception(EXCP_BKPT
);
6024 s
->is_jmp
= DISAS_JUMP
;
6026 case 0x8: /* signed multiply */
6030 rs
= (insn
>> 8) & 0xf;
6031 rn
= (insn
>> 12) & 0xf;
6032 rd
= (insn
>> 16) & 0xf;
6034 /* (32 * 16) >> 16 */
6035 tmp
= load_reg(s
, rm
);
6036 tmp2
= load_reg(s
, rs
);
6038 tcg_gen_sari_i32(tmp2
, tmp2
, 16);
6041 tmp64
= gen_muls_i64_i32(tmp
, tmp2
);
6042 tcg_gen_shri_i64(tmp64
, tmp64
, 16);
6044 tcg_gen_trunc_i64_i32(tmp
, tmp64
);
6045 if ((sh
& 2) == 0) {
6046 tmp2
= load_reg(s
, rn
);
6047 gen_helper_add_setq(tmp
, tmp
, tmp2
);
6050 store_reg(s
, rd
, tmp
);
6053 tmp
= load_reg(s
, rm
);
6054 tmp2
= load_reg(s
, rs
);
6055 gen_mulxy(tmp
, tmp2
, sh
& 2, sh
& 4);
6058 tmp64
= tcg_temp_new_i64();
6059 tcg_gen_ext_i32_i64(tmp64
, tmp
);
6061 gen_addq(s
, tmp64
, rn
, rd
);
6062 gen_storeq_reg(s
, rn
, rd
, tmp64
);
6065 tmp2
= load_reg(s
, rn
);
6066 gen_helper_add_setq(tmp
, tmp
, tmp2
);
6069 store_reg(s
, rd
, tmp
);
6076 } else if (((insn
& 0x0e000000) == 0 &&
6077 (insn
& 0x00000090) != 0x90) ||
6078 ((insn
& 0x0e000000) == (1 << 25))) {
6079 int set_cc
, logic_cc
, shiftop
;
6081 op1
= (insn
>> 21) & 0xf;
6082 set_cc
= (insn
>> 20) & 1;
6083 logic_cc
= table_logic_cc
[op1
] & set_cc
;
6085 /* data processing instruction */
6086 if (insn
& (1 << 25)) {
6087 /* immediate operand */
6089 shift
= ((insn
>> 8) & 0xf) * 2;
6091 val
= (val
>> shift
) | (val
<< (32 - shift
));
6092 gen_op_movl_T1_im(val
);
6093 if (logic_cc
&& shift
)
6094 gen_set_CF_bit31(cpu_T
[1]);
6098 gen_movl_T1_reg(s
, rm
);
6099 shiftop
= (insn
>> 5) & 3;
6100 if (!(insn
& (1 << 4))) {
6101 shift
= (insn
>> 7) & 0x1f;
6102 gen_arm_shift_im(cpu_T
[1], shiftop
, shift
, logic_cc
);
6104 rs
= (insn
>> 8) & 0xf;
6105 tmp
= load_reg(s
, rs
);
6106 gen_arm_shift_reg(cpu_T
[1], shiftop
, tmp
, logic_cc
);
6109 if (op1
!= 0x0f && op1
!= 0x0d) {
6110 rn
= (insn
>> 16) & 0xf;
6111 gen_movl_T0_reg(s
, rn
);
6113 rd
= (insn
>> 12) & 0xf;
6116 gen_op_andl_T0_T1();
6117 gen_movl_reg_T0(s
, rd
);
6119 gen_op_logic_T0_cc();
6122 gen_op_xorl_T0_T1();
6123 gen_movl_reg_T0(s
, rd
);
6125 gen_op_logic_T0_cc();
6128 if (set_cc
&& rd
== 15) {
6129 /* SUBS r15, ... is used for exception return. */
6132 gen_op_subl_T0_T1_cc();
6133 gen_exception_return(s
);
6136 gen_op_subl_T0_T1_cc();
6138 gen_op_subl_T0_T1();
6139 gen_movl_reg_T0(s
, rd
);
6144 gen_op_rsbl_T0_T1_cc();
6146 gen_op_rsbl_T0_T1();
6147 gen_movl_reg_T0(s
, rd
);
6151 gen_op_addl_T0_T1_cc();
6153 gen_op_addl_T0_T1();
6154 gen_movl_reg_T0(s
, rd
);
6158 gen_op_adcl_T0_T1_cc();
6161 gen_movl_reg_T0(s
, rd
);
6165 gen_op_sbcl_T0_T1_cc();
6168 gen_movl_reg_T0(s
, rd
);
6172 gen_op_rscl_T0_T1_cc();
6175 gen_movl_reg_T0(s
, rd
);
6179 gen_op_andl_T0_T1();
6180 gen_op_logic_T0_cc();
6185 gen_op_xorl_T0_T1();
6186 gen_op_logic_T0_cc();
6191 gen_op_subl_T0_T1_cc();
6196 gen_op_addl_T0_T1_cc();
6201 gen_movl_reg_T0(s
, rd
);
6203 gen_op_logic_T0_cc();
6206 if (logic_cc
&& rd
== 15) {
6207 /* MOVS r15, ... is used for exception return. */
6210 gen_op_movl_T0_T1();
6211 gen_exception_return(s
);
6213 gen_movl_reg_T1(s
, rd
);
6215 gen_op_logic_T1_cc();
6219 gen_op_bicl_T0_T1();
6220 gen_movl_reg_T0(s
, rd
);
6222 gen_op_logic_T0_cc();
6227 gen_movl_reg_T1(s
, rd
);
6229 gen_op_logic_T1_cc();
6233 /* other instructions */
6234 op1
= (insn
>> 24) & 0xf;
6238 /* multiplies, extra load/stores */
6239 sh
= (insn
>> 5) & 3;
6242 rd
= (insn
>> 16) & 0xf;
6243 rn
= (insn
>> 12) & 0xf;
6244 rs
= (insn
>> 8) & 0xf;
6246 op1
= (insn
>> 20) & 0xf;
6248 case 0: case 1: case 2: case 3: case 6:
6250 tmp
= load_reg(s
, rs
);
6251 tmp2
= load_reg(s
, rm
);
6252 tcg_gen_mul_i32(tmp
, tmp
, tmp2
);
6254 if (insn
& (1 << 22)) {
6255 /* Subtract (mls) */
6257 tmp2
= load_reg(s
, rn
);
6258 tcg_gen_sub_i32(tmp
, tmp2
, tmp
);
6260 } else if (insn
& (1 << 21)) {
6262 tmp2
= load_reg(s
, rn
);
6263 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
6266 if (insn
& (1 << 20))
6268 store_reg(s
, rd
, tmp
);
6272 tmp
= load_reg(s
, rs
);
6273 tmp2
= load_reg(s
, rm
);
6274 if (insn
& (1 << 22))
6275 tmp64
= gen_muls_i64_i32(tmp
, tmp2
);
6277 tmp64
= gen_mulu_i64_i32(tmp
, tmp2
);
6278 if (insn
& (1 << 21)) /* mult accumulate */
6279 gen_addq(s
, tmp64
, rn
, rd
);
6280 if (!(insn
& (1 << 23))) { /* double accumulate */
6282 gen_addq_lo(s
, tmp64
, rn
);
6283 gen_addq_lo(s
, tmp64
, rd
);
6285 if (insn
& (1 << 20))
6286 gen_logicq_cc(tmp64
);
6287 gen_storeq_reg(s
, rn
, rd
, tmp64
);
6291 rn
= (insn
>> 16) & 0xf;
6292 rd
= (insn
>> 12) & 0xf;
6293 if (insn
& (1 << 23)) {
6294 /* load/store exclusive */
6295 op1
= (insn
>> 21) & 0x3;
6300 gen_movl_T1_reg(s
, rn
);
6302 if (insn
& (1 << 20)) {
6303 gen_helper_mark_exclusive(cpu_env
, cpu_T
[1]);
6306 tmp
= gen_ld32(addr
, IS_USER(s
));
6308 case 1: /* ldrexd */
6309 tmp
= gen_ld32(addr
, IS_USER(s
));
6310 store_reg(s
, rd
, tmp
);
6311 tcg_gen_addi_i32(addr
, addr
, 4);
6312 tmp
= gen_ld32(addr
, IS_USER(s
));
6315 case 2: /* ldrexb */
6316 tmp
= gen_ld8u(addr
, IS_USER(s
));
6318 case 3: /* ldrexh */
6319 tmp
= gen_ld16u(addr
, IS_USER(s
));
6324 store_reg(s
, rd
, tmp
);
6326 int label
= gen_new_label();
6328 gen_helper_test_exclusive(cpu_T
[0], cpu_env
, addr
);
6329 tcg_gen_brcondi_i32(TCG_COND_NE
, cpu_T
[0],
6331 tmp
= load_reg(s
,rm
);
6334 gen_st32(tmp
, addr
, IS_USER(s
));
6336 case 1: /* strexd */
6337 gen_st32(tmp
, addr
, IS_USER(s
));
6338 tcg_gen_addi_i32(addr
, addr
, 4);
6339 tmp
= load_reg(s
, rm
+ 1);
6340 gen_st32(tmp
, addr
, IS_USER(s
));
6342 case 2: /* strexb */
6343 gen_st8(tmp
, addr
, IS_USER(s
));
6345 case 3: /* strexh */
6346 gen_st16(tmp
, addr
, IS_USER(s
));
6351 gen_set_label(label
);
6352 gen_movl_reg_T0(s
, rd
);
6355 /* SWP instruction */
6358 /* ??? This is not really atomic. However we know
6359 we never have multiple CPUs running in parallel,
6360 so it is good enough. */
6361 addr
= load_reg(s
, rn
);
6362 tmp
= load_reg(s
, rm
);
6363 if (insn
& (1 << 22)) {
6364 tmp2
= gen_ld8u(addr
, IS_USER(s
));
6365 gen_st8(tmp
, addr
, IS_USER(s
));
6367 tmp2
= gen_ld32(addr
, IS_USER(s
));
6368 gen_st32(tmp
, addr
, IS_USER(s
));
6371 store_reg(s
, rd
, tmp2
);
6377 /* Misc load/store */
6378 rn
= (insn
>> 16) & 0xf;
6379 rd
= (insn
>> 12) & 0xf;
6380 addr
= load_reg(s
, rn
);
6381 if (insn
& (1 << 24))
6382 gen_add_datah_offset(s
, insn
, 0, addr
);
6384 if (insn
& (1 << 20)) {
6388 tmp
= gen_ld16u(addr
, IS_USER(s
));
6391 tmp
= gen_ld8s(addr
, IS_USER(s
));
6395 tmp
= gen_ld16s(addr
, IS_USER(s
));
6399 } else if (sh
& 2) {
6403 tmp
= load_reg(s
, rd
);
6404 gen_st32(tmp
, addr
, IS_USER(s
));
6405 tcg_gen_addi_i32(addr
, addr
, 4);
6406 tmp
= load_reg(s
, rd
+ 1);
6407 gen_st32(tmp
, addr
, IS_USER(s
));
6411 tmp
= gen_ld32(addr
, IS_USER(s
));
6412 store_reg(s
, rd
, tmp
);
6413 tcg_gen_addi_i32(addr
, addr
, 4);
6414 tmp
= gen_ld32(addr
, IS_USER(s
));
6418 address_offset
= -4;
6421 tmp
= load_reg(s
, rd
);
6422 gen_st16(tmp
, addr
, IS_USER(s
));
6425 /* Perform base writeback before the loaded value to
6426 ensure correct behavior with overlapping index registers.
6427 ldrd with base writeback is is undefined if the
6428 destination and index registers overlap. */
6429 if (!(insn
& (1 << 24))) {
6430 gen_add_datah_offset(s
, insn
, address_offset
, addr
);
6431 store_reg(s
, rn
, addr
);
6432 } else if (insn
& (1 << 21)) {
6434 tcg_gen_addi_i32(addr
, addr
, address_offset
);
6435 store_reg(s
, rn
, addr
);
6440 /* Complete the load. */
6441 store_reg(s
, rd
, tmp
);
6450 if (insn
& (1 << 4)) {
6452 /* Armv6 Media instructions. */
6454 rn
= (insn
>> 16) & 0xf;
6455 rd
= (insn
>> 12) & 0xf;
6456 rs
= (insn
>> 8) & 0xf;
6457 switch ((insn
>> 23) & 3) {
6458 case 0: /* Parallel add/subtract. */
6459 op1
= (insn
>> 20) & 7;
6460 tmp
= load_reg(s
, rn
);
6461 tmp2
= load_reg(s
, rm
);
6462 sh
= (insn
>> 5) & 7;
6463 if ((op1
& 3) == 0 || sh
== 5 || sh
== 6)
6465 gen_arm_parallel_addsub(op1
, sh
, tmp
, tmp2
);
6467 store_reg(s
, rd
, tmp
);
6470 if ((insn
& 0x00700020) == 0) {
6471 /* Halfword pack. */
6472 tmp
= load_reg(s
, rn
);
6473 tmp2
= load_reg(s
, rm
);
6474 shift
= (insn
>> 7) & 0x1f;
6475 if (insn
& (1 << 6)) {
6479 tcg_gen_sari_i32(tmp2
, tmp2
, shift
);
6480 tcg_gen_andi_i32(tmp
, tmp
, 0xffff0000);
6481 tcg_gen_ext16u_i32(tmp2
, tmp2
);
6485 tcg_gen_shli_i32(tmp2
, tmp2
, shift
);
6486 tcg_gen_ext16u_i32(tmp
, tmp
);
6487 tcg_gen_andi_i32(tmp2
, tmp2
, 0xffff0000);
6489 tcg_gen_or_i32(tmp
, tmp
, tmp2
);
6491 store_reg(s
, rd
, tmp
);
6492 } else if ((insn
& 0x00200020) == 0x00200000) {
6494 tmp
= load_reg(s
, rm
);
6495 shift
= (insn
>> 7) & 0x1f;
6496 if (insn
& (1 << 6)) {
6499 tcg_gen_sari_i32(tmp
, tmp
, shift
);
6501 tcg_gen_shli_i32(tmp
, tmp
, shift
);
6503 sh
= (insn
>> 16) & 0x1f;
6505 if (insn
& (1 << 22))
6506 gen_helper_usat(tmp
, tmp
, tcg_const_i32(sh
));
6508 gen_helper_ssat(tmp
, tmp
, tcg_const_i32(sh
));
6510 store_reg(s
, rd
, tmp
);
6511 } else if ((insn
& 0x00300fe0) == 0x00200f20) {
6513 tmp
= load_reg(s
, rm
);
6514 sh
= (insn
>> 16) & 0x1f;
6516 if (insn
& (1 << 22))
6517 gen_helper_usat16(tmp
, tmp
, tcg_const_i32(sh
));
6519 gen_helper_ssat16(tmp
, tmp
, tcg_const_i32(sh
));
6521 store_reg(s
, rd
, tmp
);
6522 } else if ((insn
& 0x00700fe0) == 0x00000fa0) {
6524 tmp
= load_reg(s
, rn
);
6525 tmp2
= load_reg(s
, rm
);
6527 tcg_gen_ld_i32(tmp3
, cpu_env
, offsetof(CPUState
, GE
));
6528 gen_helper_sel_flags(tmp
, tmp3
, tmp
, tmp2
);
6531 store_reg(s
, rd
, tmp
);
6532 } else if ((insn
& 0x000003e0) == 0x00000060) {
6533 tmp
= load_reg(s
, rm
);
6534 shift
= (insn
>> 10) & 3;
6535 /* ??? In many cases it's not neccessary to do a
6536 rotate, a shift is sufficient. */
6538 tcg_gen_rori_i32(tmp
, tmp
, shift
* 8);
6539 op1
= (insn
>> 20) & 7;
6541 case 0: gen_sxtb16(tmp
); break;
6542 case 2: gen_sxtb(tmp
); break;
6543 case 3: gen_sxth(tmp
); break;
6544 case 4: gen_uxtb16(tmp
); break;
6545 case 6: gen_uxtb(tmp
); break;
6546 case 7: gen_uxth(tmp
); break;
6547 default: goto illegal_op
;
6550 tmp2
= load_reg(s
, rn
);
6551 if ((op1
& 3) == 0) {
6552 gen_add16(tmp
, tmp2
);
6554 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
6558 store_reg(s
, rd
, tmp
);
6559 } else if ((insn
& 0x003f0f60) == 0x003f0f20) {
6561 tmp
= load_reg(s
, rm
);
6562 if (insn
& (1 << 22)) {
6563 if (insn
& (1 << 7)) {
6567 gen_helper_rbit(tmp
, tmp
);
6570 if (insn
& (1 << 7))
6573 tcg_gen_bswap32_i32(tmp
, tmp
);
6575 store_reg(s
, rd
, tmp
);
6580 case 2: /* Multiplies (Type 3). */
6581 tmp
= load_reg(s
, rm
);
6582 tmp2
= load_reg(s
, rs
);
6583 if (insn
& (1 << 20)) {
6584 /* Signed multiply most significant [accumulate]. */
6585 tmp64
= gen_muls_i64_i32(tmp
, tmp2
);
6586 if (insn
& (1 << 5))
6587 tcg_gen_addi_i64(tmp64
, tmp64
, 0x80000000u
);
6588 tcg_gen_shri_i64(tmp64
, tmp64
, 32);
6590 tcg_gen_trunc_i64_i32(tmp
, tmp64
);
6592 tmp2
= load_reg(s
, rd
);
6593 if (insn
& (1 << 6)) {
6594 tcg_gen_sub_i32(tmp
, tmp
, tmp2
);
6596 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
6600 store_reg(s
, rn
, tmp
);
6602 if (insn
& (1 << 5))
6603 gen_swap_half(tmp2
);
6604 gen_smul_dual(tmp
, tmp2
);
6605 /* This addition cannot overflow. */
6606 if (insn
& (1 << 6)) {
6607 tcg_gen_sub_i32(tmp
, tmp
, tmp2
);
6609 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
6612 if (insn
& (1 << 22)) {
6613 /* smlald, smlsld */
6614 tmp64
= tcg_temp_new_i64();
6615 tcg_gen_ext_i32_i64(tmp64
, tmp
);
6617 gen_addq(s
, tmp64
, rd
, rn
);
6618 gen_storeq_reg(s
, rd
, rn
, tmp64
);
6620 /* smuad, smusd, smlad, smlsd */
6623 tmp2
= load_reg(s
, rd
);
6624 gen_helper_add_setq(tmp
, tmp
, tmp2
);
6627 store_reg(s
, rn
, tmp
);
6632 op1
= ((insn
>> 17) & 0x38) | ((insn
>> 5) & 7);
6634 case 0: /* Unsigned sum of absolute differences. */
6636 tmp
= load_reg(s
, rm
);
6637 tmp2
= load_reg(s
, rs
);
6638 gen_helper_usad8(tmp
, tmp
, tmp2
);
6641 tmp2
= load_reg(s
, rd
);
6642 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
6645 store_reg(s
, rn
, tmp
);
6647 case 0x20: case 0x24: case 0x28: case 0x2c:
6648 /* Bitfield insert/clear. */
6650 shift
= (insn
>> 7) & 0x1f;
6651 i
= (insn
>> 16) & 0x1f;
6655 tcg_gen_movi_i32(tmp
, 0);
6657 tmp
= load_reg(s
, rm
);
6660 tmp2
= load_reg(s
, rd
);
6661 gen_bfi(tmp
, tmp2
, tmp
, shift
, (1u << i
) - 1);
6664 store_reg(s
, rd
, tmp
);
6666 case 0x12: case 0x16: case 0x1a: case 0x1e: /* sbfx */
6667 case 0x32: case 0x36: case 0x3a: case 0x3e: /* ubfx */
6669 tmp
= load_reg(s
, rm
);
6670 shift
= (insn
>> 7) & 0x1f;
6671 i
= ((insn
>> 16) & 0x1f) + 1;
6676 gen_ubfx(tmp
, shift
, (1u << i
) - 1);
6678 gen_sbfx(tmp
, shift
, i
);
6681 store_reg(s
, rd
, tmp
);
6691 /* Check for undefined extension instructions
6692 * per the ARM Bible IE:
6693 * xxxx 0111 1111 xxxx xxxx xxxx 1111 xxxx
6695 sh
= (0xf << 20) | (0xf << 4);
6696 if (op1
== 0x7 && ((insn
& sh
) == sh
))
6700 /* load/store byte/word */
6701 rn
= (insn
>> 16) & 0xf;
6702 rd
= (insn
>> 12) & 0xf;
6703 tmp2
= load_reg(s
, rn
);
6704 i
= (IS_USER(s
) || (insn
& 0x01200000) == 0x00200000);
6705 if (insn
& (1 << 24))
6706 gen_add_data_offset(s
, insn
, tmp2
);
6707 if (insn
& (1 << 20)) {
6709 if (insn
& (1 << 22)) {
6710 tmp
= gen_ld8u(tmp2
, i
);
6712 tmp
= gen_ld32(tmp2
, i
);
6716 tmp
= load_reg(s
, rd
);
6717 if (insn
& (1 << 22))
6718 gen_st8(tmp
, tmp2
, i
);
6720 gen_st32(tmp
, tmp2
, i
);
6722 if (!(insn
& (1 << 24))) {
6723 gen_add_data_offset(s
, insn
, tmp2
);
6724 store_reg(s
, rn
, tmp2
);
6725 } else if (insn
& (1 << 21)) {
6726 store_reg(s
, rn
, tmp2
);
6730 if (insn
& (1 << 20)) {
6731 /* Complete the load. */
6735 store_reg(s
, rd
, tmp
);
6741 int j
, n
, user
, loaded_base
;
6743 /* load/store multiple words */
6744 /* XXX: store correct base if write back */
6746 if (insn
& (1 << 22)) {
6748 goto illegal_op
; /* only usable in supervisor mode */
6750 if ((insn
& (1 << 15)) == 0)
6753 rn
= (insn
>> 16) & 0xf;
6754 addr
= load_reg(s
, rn
);
6756 /* compute total size */
6758 TCGV_UNUSED(loaded_var
);
6761 if (insn
& (1 << i
))
6764 /* XXX: test invalid n == 0 case ? */
6765 if (insn
& (1 << 23)) {
6766 if (insn
& (1 << 24)) {
6768 tcg_gen_addi_i32(addr
, addr
, 4);
6770 /* post increment */
6773 if (insn
& (1 << 24)) {
6775 tcg_gen_addi_i32(addr
, addr
, -(n
* 4));
6777 /* post decrement */
6779 tcg_gen_addi_i32(addr
, addr
, -((n
- 1) * 4));
6784 if (insn
& (1 << i
)) {
6785 if (insn
& (1 << 20)) {
6787 tmp
= gen_ld32(addr
, IS_USER(s
));
6791 gen_helper_set_user_reg(tcg_const_i32(i
), tmp
);
6793 } else if (i
== rn
) {
6797 store_reg(s
, i
, tmp
);
6802 /* special case: r15 = PC + 8 */
6803 val
= (long)s
->pc
+ 4;
6805 tcg_gen_movi_i32(tmp
, val
);
6808 gen_helper_get_user_reg(tmp
, tcg_const_i32(i
));
6810 tmp
= load_reg(s
, i
);
6812 gen_st32(tmp
, addr
, IS_USER(s
));
6815 /* no need to add after the last transfer */
6817 tcg_gen_addi_i32(addr
, addr
, 4);
6820 if (insn
& (1 << 21)) {
6822 if (insn
& (1 << 23)) {
6823 if (insn
& (1 << 24)) {
6826 /* post increment */
6827 tcg_gen_addi_i32(addr
, addr
, 4);
6830 if (insn
& (1 << 24)) {
6833 tcg_gen_addi_i32(addr
, addr
, -((n
- 1) * 4));
6835 /* post decrement */
6836 tcg_gen_addi_i32(addr
, addr
, -(n
* 4));
6839 store_reg(s
, rn
, addr
);
6844 store_reg(s
, rn
, loaded_var
);
6846 if ((insn
& (1 << 22)) && !user
) {
6847 /* Restore CPSR from SPSR. */
6848 tmp
= load_cpu_field(spsr
);
6849 gen_set_cpsr(tmp
, 0xffffffff);
6851 s
->is_jmp
= DISAS_UPDATE
;
6860 /* branch (and link) */
6861 val
= (int32_t)s
->pc
;
6862 if (insn
& (1 << 24)) {
6864 tcg_gen_movi_i32(tmp
, val
);
6865 store_reg(s
, 14, tmp
);
6867 offset
= (((int32_t)insn
<< 8) >> 8);
6868 val
+= (offset
<< 2) + 4;
6876 if (disas_coproc_insn(env
, s
, insn
))
6881 gen_set_pc_im(s
->pc
);
6882 s
->is_jmp
= DISAS_SWI
;
6886 gen_set_condexec(s
);
6887 gen_set_pc_im(s
->pc
- 4);
6888 gen_exception(EXCP_UDEF
);
6889 s
->is_jmp
= DISAS_JUMP
;
6895 /* Return true if this is a Thumb-2 logical op. */
6897 thumb2_logic_op(int op
)
6902 /* Generate code for a Thumb-2 data processing operation. If CONDS is nonzero
6903 then set condition code flags based on the result of the operation.
6904 If SHIFTER_OUT is nonzero then set the carry flag for logical operations
6905 to the high bit of T1.
6906 Returns zero if the opcode is valid. */
6909 gen_thumb2_data_op(DisasContext
*s
, int op
, int conds
, uint32_t shifter_out
)
6916 gen_op_andl_T0_T1();
6920 gen_op_bicl_T0_T1();
6933 gen_op_xorl_T0_T1();
6938 gen_op_addl_T0_T1_cc();
6940 gen_op_addl_T0_T1();
6944 gen_op_adcl_T0_T1_cc();
6950 gen_op_sbcl_T0_T1_cc();
6956 gen_op_subl_T0_T1_cc();
6958 gen_op_subl_T0_T1();
6962 gen_op_rsbl_T0_T1_cc();
6964 gen_op_rsbl_T0_T1();
6966 default: /* 5, 6, 7, 9, 12, 15. */
6970 gen_op_logic_T0_cc();
6972 gen_set_CF_bit31(cpu_T
[1]);
6977 /* Translate a 32-bit thumb instruction. Returns nonzero if the instruction
6979 static int disas_thumb2_insn(CPUState
*env
, DisasContext
*s
, uint16_t insn_hw1
)
6981 uint32_t insn
, imm
, shift
, offset
;
6982 uint32_t rd
, rn
, rm
, rs
;
6993 if (!(arm_feature(env
, ARM_FEATURE_THUMB2
)
6994 || arm_feature (env
, ARM_FEATURE_M
))) {
6995 /* Thumb-1 cores may need to treat bl and blx as a pair of
6996 16-bit instructions to get correct prefetch abort behavior. */
6998 if ((insn
& (1 << 12)) == 0) {
6999 /* Second half of blx. */
7000 offset
= ((insn
& 0x7ff) << 1);
7001 tmp
= load_reg(s
, 14);
7002 tcg_gen_addi_i32(tmp
, tmp
, offset
);
7003 tcg_gen_andi_i32(tmp
, tmp
, 0xfffffffc);
7006 tcg_gen_movi_i32(tmp2
, s
->pc
| 1);
7007 store_reg(s
, 14, tmp2
);
7011 if (insn
& (1 << 11)) {
7012 /* Second half of bl. */
7013 offset
= ((insn
& 0x7ff) << 1) | 1;
7014 tmp
= load_reg(s
, 14);
7015 tcg_gen_addi_i32(tmp
, tmp
, offset
);
7018 tcg_gen_movi_i32(tmp2
, s
->pc
| 1);
7019 store_reg(s
, 14, tmp2
);
7023 if ((s
->pc
& ~TARGET_PAGE_MASK
) == 0) {
7024 /* Instruction spans a page boundary. Implement it as two
7025 16-bit instructions in case the second half causes an
7027 offset
= ((int32_t)insn
<< 21) >> 9;
7028 gen_op_movl_T0_im(s
->pc
+ 2 + offset
);
7029 gen_movl_reg_T0(s
, 14);
7032 /* Fall through to 32-bit decode. */
7035 insn
= lduw_code(s
->pc
);
7037 insn
|= (uint32_t)insn_hw1
<< 16;
7039 if ((insn
& 0xf800e800) != 0xf000e800) {
7043 rn
= (insn
>> 16) & 0xf;
7044 rs
= (insn
>> 12) & 0xf;
7045 rd
= (insn
>> 8) & 0xf;
7047 switch ((insn
>> 25) & 0xf) {
7048 case 0: case 1: case 2: case 3:
7049 /* 16-bit instructions. Should never happen. */
7052 if (insn
& (1 << 22)) {
7053 /* Other load/store, table branch. */
7054 if (insn
& 0x01200000) {
7055 /* Load/store doubleword. */
7058 tcg_gen_movi_i32(addr
, s
->pc
& ~3);
7060 addr
= load_reg(s
, rn
);
7062 offset
= (insn
& 0xff) * 4;
7063 if ((insn
& (1 << 23)) == 0)
7065 if (insn
& (1 << 24)) {
7066 tcg_gen_addi_i32(addr
, addr
, offset
);
7069 if (insn
& (1 << 20)) {
7071 tmp
= gen_ld32(addr
, IS_USER(s
));
7072 store_reg(s
, rs
, tmp
);
7073 tcg_gen_addi_i32(addr
, addr
, 4);
7074 tmp
= gen_ld32(addr
, IS_USER(s
));
7075 store_reg(s
, rd
, tmp
);
7078 tmp
= load_reg(s
, rs
);
7079 gen_st32(tmp
, addr
, IS_USER(s
));
7080 tcg_gen_addi_i32(addr
, addr
, 4);
7081 tmp
= load_reg(s
, rd
);
7082 gen_st32(tmp
, addr
, IS_USER(s
));
7084 if (insn
& (1 << 21)) {
7085 /* Base writeback. */
7088 tcg_gen_addi_i32(addr
, addr
, offset
- 4);
7089 store_reg(s
, rn
, addr
);
7093 } else if ((insn
& (1 << 23)) == 0) {
7094 /* Load/store exclusive word. */
7095 gen_movl_T1_reg(s
, rn
);
7097 if (insn
& (1 << 20)) {
7098 gen_helper_mark_exclusive(cpu_env
, cpu_T
[1]);
7099 tmp
= gen_ld32(addr
, IS_USER(s
));
7100 store_reg(s
, rd
, tmp
);
7102 int label
= gen_new_label();
7103 gen_helper_test_exclusive(cpu_T
[0], cpu_env
, addr
);
7104 tcg_gen_brcondi_i32(TCG_COND_NE
, cpu_T
[0],
7106 tmp
= load_reg(s
, rs
);
7107 gen_st32(tmp
, cpu_T
[1], IS_USER(s
));
7108 gen_set_label(label
);
7109 gen_movl_reg_T0(s
, rd
);
7111 } else if ((insn
& (1 << 6)) == 0) {
7115 tcg_gen_movi_i32(addr
, s
->pc
);
7117 addr
= load_reg(s
, rn
);
7119 tmp
= load_reg(s
, rm
);
7120 tcg_gen_add_i32(addr
, addr
, tmp
);
7121 if (insn
& (1 << 4)) {
7123 tcg_gen_add_i32(addr
, addr
, tmp
);
7125 tmp
= gen_ld16u(addr
, IS_USER(s
));
7128 tmp
= gen_ld8u(addr
, IS_USER(s
));
7131 tcg_gen_shli_i32(tmp
, tmp
, 1);
7132 tcg_gen_addi_i32(tmp
, tmp
, s
->pc
);
7133 store_reg(s
, 15, tmp
);
7135 /* Load/store exclusive byte/halfword/doubleword. */
7136 /* ??? These are not really atomic. However we know
7137 we never have multiple CPUs running in parallel,
7138 so it is good enough. */
7139 op
= (insn
>> 4) & 0x3;
7140 /* Must use a global reg for the address because we have
7141 a conditional branch in the store instruction. */
7142 gen_movl_T1_reg(s
, rn
);
7144 if (insn
& (1 << 20)) {
7145 gen_helper_mark_exclusive(cpu_env
, addr
);
7148 tmp
= gen_ld8u(addr
, IS_USER(s
));
7151 tmp
= gen_ld16u(addr
, IS_USER(s
));
7154 tmp
= gen_ld32(addr
, IS_USER(s
));
7155 tcg_gen_addi_i32(addr
, addr
, 4);
7156 tmp2
= gen_ld32(addr
, IS_USER(s
));
7157 store_reg(s
, rd
, tmp2
);
7162 store_reg(s
, rs
, tmp
);
7164 int label
= gen_new_label();
7165 /* Must use a global that is not killed by the branch. */
7166 gen_helper_test_exclusive(cpu_T
[0], cpu_env
, addr
);
7167 tcg_gen_brcondi_i32(TCG_COND_NE
, cpu_T
[0], 0, label
);
7168 tmp
= load_reg(s
, rs
);
7171 gen_st8(tmp
, addr
, IS_USER(s
));
7174 gen_st16(tmp
, addr
, IS_USER(s
));
7177 gen_st32(tmp
, addr
, IS_USER(s
));
7178 tcg_gen_addi_i32(addr
, addr
, 4);
7179 tmp
= load_reg(s
, rd
);
7180 gen_st32(tmp
, addr
, IS_USER(s
));
7185 gen_set_label(label
);
7186 gen_movl_reg_T0(s
, rm
);
7190 /* Load/store multiple, RFE, SRS. */
7191 if (((insn
>> 23) & 1) == ((insn
>> 24) & 1)) {
7192 /* Not available in user mode. */
7195 if (insn
& (1 << 20)) {
7197 addr
= load_reg(s
, rn
);
7198 if ((insn
& (1 << 24)) == 0)
7199 tcg_gen_addi_i32(addr
, addr
, -8);
7200 /* Load PC into tmp and CPSR into tmp2. */
7201 tmp
= gen_ld32(addr
, 0);
7202 tcg_gen_addi_i32(addr
, addr
, 4);
7203 tmp2
= gen_ld32(addr
, 0);
7204 if (insn
& (1 << 21)) {
7205 /* Base writeback. */
7206 if (insn
& (1 << 24)) {
7207 tcg_gen_addi_i32(addr
, addr
, 4);
7209 tcg_gen_addi_i32(addr
, addr
, -4);
7211 store_reg(s
, rn
, addr
);
7215 gen_rfe(s
, tmp
, tmp2
);
7219 if (op
== (env
->uncached_cpsr
& CPSR_M
)) {
7220 addr
= load_reg(s
, 13);
7223 gen_helper_get_r13_banked(addr
, cpu_env
, tcg_const_i32(op
));
7225 if ((insn
& (1 << 24)) == 0) {
7226 tcg_gen_addi_i32(addr
, addr
, -8);
7228 tmp
= load_reg(s
, 14);
7229 gen_st32(tmp
, addr
, 0);
7230 tcg_gen_addi_i32(addr
, addr
, 4);
7232 gen_helper_cpsr_read(tmp
);
7233 gen_st32(tmp
, addr
, 0);
7234 if (insn
& (1 << 21)) {
7235 if ((insn
& (1 << 24)) == 0) {
7236 tcg_gen_addi_i32(addr
, addr
, -4);
7238 tcg_gen_addi_i32(addr
, addr
, 4);
7240 if (op
== (env
->uncached_cpsr
& CPSR_M
)) {
7241 store_reg(s
, 13, addr
);
7243 gen_helper_set_r13_banked(cpu_env
,
7244 tcg_const_i32(op
), addr
);
7252 /* Load/store multiple. */
7253 addr
= load_reg(s
, rn
);
7255 for (i
= 0; i
< 16; i
++) {
7256 if (insn
& (1 << i
))
7259 if (insn
& (1 << 24)) {
7260 tcg_gen_addi_i32(addr
, addr
, -offset
);
7263 for (i
= 0; i
< 16; i
++) {
7264 if ((insn
& (1 << i
)) == 0)
7266 if (insn
& (1 << 20)) {
7268 tmp
= gen_ld32(addr
, IS_USER(s
));
7272 store_reg(s
, i
, tmp
);
7276 tmp
= load_reg(s
, i
);
7277 gen_st32(tmp
, addr
, IS_USER(s
));
7279 tcg_gen_addi_i32(addr
, addr
, 4);
7281 if (insn
& (1 << 21)) {
7282 /* Base register writeback. */
7283 if (insn
& (1 << 24)) {
7284 tcg_gen_addi_i32(addr
, addr
, -offset
);
7286 /* Fault if writeback register is in register list. */
7287 if (insn
& (1 << rn
))
7289 store_reg(s
, rn
, addr
);
7296 case 5: /* Data processing register constant shift. */
7298 gen_op_movl_T0_im(0);
7300 gen_movl_T0_reg(s
, rn
);
7301 gen_movl_T1_reg(s
, rm
);
7302 op
= (insn
>> 21) & 0xf;
7303 shiftop
= (insn
>> 4) & 3;
7304 shift
= ((insn
>> 6) & 3) | ((insn
>> 10) & 0x1c);
7305 conds
= (insn
& (1 << 20)) != 0;
7306 logic_cc
= (conds
&& thumb2_logic_op(op
));
7307 gen_arm_shift_im(cpu_T
[1], shiftop
, shift
, logic_cc
);
7308 if (gen_thumb2_data_op(s
, op
, conds
, 0))
7311 gen_movl_reg_T0(s
, rd
);
7313 case 13: /* Misc data processing. */
7314 op
= ((insn
>> 22) & 6) | ((insn
>> 7) & 1);
7315 if (op
< 4 && (insn
& 0xf000) != 0xf000)
7318 case 0: /* Register controlled shift. */
7319 tmp
= load_reg(s
, rn
);
7320 tmp2
= load_reg(s
, rm
);
7321 if ((insn
& 0x70) != 0)
7323 op
= (insn
>> 21) & 3;
7324 logic_cc
= (insn
& (1 << 20)) != 0;
7325 gen_arm_shift_reg(tmp
, op
, tmp2
, logic_cc
);
7328 store_reg(s
, rd
, tmp
);
7330 case 1: /* Sign/zero extend. */
7331 tmp
= load_reg(s
, rm
);
7332 shift
= (insn
>> 4) & 3;
7333 /* ??? In many cases it's not neccessary to do a
7334 rotate, a shift is sufficient. */
7336 tcg_gen_rori_i32(tmp
, tmp
, shift
* 8);
7337 op
= (insn
>> 20) & 7;
7339 case 0: gen_sxth(tmp
); break;
7340 case 1: gen_uxth(tmp
); break;
7341 case 2: gen_sxtb16(tmp
); break;
7342 case 3: gen_uxtb16(tmp
); break;
7343 case 4: gen_sxtb(tmp
); break;
7344 case 5: gen_uxtb(tmp
); break;
7345 default: goto illegal_op
;
7348 tmp2
= load_reg(s
, rn
);
7349 if ((op
>> 1) == 1) {
7350 gen_add16(tmp
, tmp2
);
7352 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
7356 store_reg(s
, rd
, tmp
);
7358 case 2: /* SIMD add/subtract. */
7359 op
= (insn
>> 20) & 7;
7360 shift
= (insn
>> 4) & 7;
7361 if ((op
& 3) == 3 || (shift
& 3) == 3)
7363 tmp
= load_reg(s
, rn
);
7364 tmp2
= load_reg(s
, rm
);
7365 gen_thumb2_parallel_addsub(op
, shift
, tmp
, tmp2
);
7367 store_reg(s
, rd
, tmp
);
7369 case 3: /* Other data processing. */
7370 op
= ((insn
>> 17) & 0x38) | ((insn
>> 4) & 7);
7372 /* Saturating add/subtract. */
7373 tmp
= load_reg(s
, rn
);
7374 tmp2
= load_reg(s
, rm
);
7376 gen_helper_double_saturate(tmp
, tmp
);
7378 gen_helper_sub_saturate(tmp
, tmp2
, tmp
);
7380 gen_helper_add_saturate(tmp
, tmp
, tmp2
);
7383 tmp
= load_reg(s
, rn
);
7385 case 0x0a: /* rbit */
7386 gen_helper_rbit(tmp
, tmp
);
7388 case 0x08: /* rev */
7389 tcg_gen_bswap32_i32(tmp
, tmp
);
7391 case 0x09: /* rev16 */
7394 case 0x0b: /* revsh */
7397 case 0x10: /* sel */
7398 tmp2
= load_reg(s
, rm
);
7400 tcg_gen_ld_i32(tmp3
, cpu_env
, offsetof(CPUState
, GE
));
7401 gen_helper_sel_flags(tmp
, tmp3
, tmp
, tmp2
);
7405 case 0x18: /* clz */
7406 gen_helper_clz(tmp
, tmp
);
7412 store_reg(s
, rd
, tmp
);
7414 case 4: case 5: /* 32-bit multiply. Sum of absolute differences. */
7415 op
= (insn
>> 4) & 0xf;
7416 tmp
= load_reg(s
, rn
);
7417 tmp2
= load_reg(s
, rm
);
7418 switch ((insn
>> 20) & 7) {
7419 case 0: /* 32 x 32 -> 32 */
7420 tcg_gen_mul_i32(tmp
, tmp
, tmp2
);
7423 tmp2
= load_reg(s
, rs
);
7425 tcg_gen_sub_i32(tmp
, tmp2
, tmp
);
7427 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
7431 case 1: /* 16 x 16 -> 32 */
7432 gen_mulxy(tmp
, tmp2
, op
& 2, op
& 1);
7435 tmp2
= load_reg(s
, rs
);
7436 gen_helper_add_setq(tmp
, tmp
, tmp2
);
7440 case 2: /* Dual multiply add. */
7441 case 4: /* Dual multiply subtract. */
7443 gen_swap_half(tmp2
);
7444 gen_smul_dual(tmp
, tmp2
);
7445 /* This addition cannot overflow. */
7446 if (insn
& (1 << 22)) {
7447 tcg_gen_sub_i32(tmp
, tmp
, tmp2
);
7449 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
7454 tmp2
= load_reg(s
, rs
);
7455 gen_helper_add_setq(tmp
, tmp
, tmp2
);
7459 case 3: /* 32 * 16 -> 32msb */
7461 tcg_gen_sari_i32(tmp2
, tmp2
, 16);
7464 tmp64
= gen_muls_i64_i32(tmp
, tmp2
);
7465 tcg_gen_shri_i64(tmp64
, tmp64
, 16);
7467 tcg_gen_trunc_i64_i32(tmp
, tmp64
);
7470 tmp2
= load_reg(s
, rs
);
7471 gen_helper_add_setq(tmp
, tmp
, tmp2
);
7475 case 5: case 6: /* 32 * 32 -> 32msb */
7476 gen_imull(tmp
, tmp2
);
7477 if (insn
& (1 << 5)) {
7478 gen_roundqd(tmp
, tmp2
);
7485 tmp2
= load_reg(s
, rs
);
7486 if (insn
& (1 << 21)) {
7487 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
7489 tcg_gen_sub_i32(tmp
, tmp2
, tmp
);
7494 case 7: /* Unsigned sum of absolute differences. */
7495 gen_helper_usad8(tmp
, tmp
, tmp2
);
7498 tmp2
= load_reg(s
, rs
);
7499 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
7504 store_reg(s
, rd
, tmp
);
7506 case 6: case 7: /* 64-bit multiply, Divide. */
7507 op
= ((insn
>> 4) & 0xf) | ((insn
>> 16) & 0x70);
7508 tmp
= load_reg(s
, rn
);
7509 tmp2
= load_reg(s
, rm
);
7510 if ((op
& 0x50) == 0x10) {
7512 if (!arm_feature(env
, ARM_FEATURE_DIV
))
7515 gen_helper_udiv(tmp
, tmp
, tmp2
);
7517 gen_helper_sdiv(tmp
, tmp
, tmp2
);
7519 store_reg(s
, rd
, tmp
);
7520 } else if ((op
& 0xe) == 0xc) {
7521 /* Dual multiply accumulate long. */
7523 gen_swap_half(tmp2
);
7524 gen_smul_dual(tmp
, tmp2
);
7526 tcg_gen_sub_i32(tmp
, tmp
, tmp2
);
7528 tcg_gen_add_i32(tmp
, tmp
, tmp2
);
7532 tmp64
= tcg_temp_new_i64();
7533 tcg_gen_ext_i32_i64(tmp64
, tmp
);
7535 gen_addq(s
, tmp64
, rs
, rd
);
7536 gen_storeq_reg(s
, rs
, rd
, tmp64
);
7539 /* Unsigned 64-bit multiply */
7540 tmp64
= gen_mulu_i64_i32(tmp
, tmp2
);
7544 gen_mulxy(tmp
, tmp2
, op
& 2, op
& 1);
7546 tmp64
= tcg_temp_new_i64();
7547 tcg_gen_ext_i32_i64(tmp64
, tmp
);
7550 /* Signed 64-bit multiply */
7551 tmp64
= gen_muls_i64_i32(tmp
, tmp2
);
7556 gen_addq_lo(s
, tmp64
, rs
);
7557 gen_addq_lo(s
, tmp64
, rd
);
7558 } else if (op
& 0x40) {
7559 /* 64-bit accumulate. */
7560 gen_addq(s
, tmp64
, rs
, rd
);
7562 gen_storeq_reg(s
, rs
, rd
, tmp64
);
7567 case 6: case 7: case 14: case 15:
7569 if (((insn
>> 24) & 3) == 3) {
7570 /* Translate into the equivalent ARM encoding. */
7571 insn
= (insn
& 0xe2ffffff) | ((insn
& (1 << 28)) >> 4);
7572 if (disas_neon_data_insn(env
, s
, insn
))
7575 if (insn
& (1 << 28))
7577 if (disas_coproc_insn (env
, s
, insn
))
7581 case 8: case 9: case 10: case 11:
7582 if (insn
& (1 << 15)) {
7583 /* Branches, misc control. */
7584 if (insn
& 0x5000) {
7585 /* Unconditional branch. */
7586 /* signextend(hw1[10:0]) -> offset[:12]. */
7587 offset
= ((int32_t)insn
<< 5) >> 9 & ~(int32_t)0xfff;
7588 /* hw1[10:0] -> offset[11:1]. */
7589 offset
|= (insn
& 0x7ff) << 1;
7590 /* (~hw2[13, 11] ^ offset[24]) -> offset[23,22]
7591 offset[24:22] already have the same value because of the
7592 sign extension above. */
7593 offset
^= ((~insn
) & (1 << 13)) << 10;
7594 offset
^= ((~insn
) & (1 << 11)) << 11;
7596 if (insn
& (1 << 14)) {
7597 /* Branch and link. */
7598 gen_op_movl_T1_im(s
->pc
| 1);
7599 gen_movl_reg_T1(s
, 14);
7603 if (insn
& (1 << 12)) {
7608 offset
&= ~(uint32_t)2;
7609 gen_bx_im(s
, offset
);
7611 } else if (((insn
>> 23) & 7) == 7) {
7613 if (insn
& (1 << 13))
7616 if (insn
& (1 << 26)) {
7617 /* Secure monitor call (v6Z) */
7618 goto illegal_op
; /* not implemented. */
7620 op
= (insn
>> 20) & 7;
7622 case 0: /* msr cpsr. */
7624 tmp
= load_reg(s
, rn
);
7625 addr
= tcg_const_i32(insn
& 0xff);
7626 gen_helper_v7m_msr(cpu_env
, addr
, tmp
);
7631 case 1: /* msr spsr. */
7634 gen_movl_T0_reg(s
, rn
);
7635 if (gen_set_psr_T0(s
,
7636 msr_mask(env
, s
, (insn
>> 8) & 0xf, op
== 1),
7640 case 2: /* cps, nop-hint. */
7641 if (((insn
>> 8) & 7) == 0) {
7642 gen_nop_hint(s
, insn
& 0xff);
7644 /* Implemented as NOP in user mode. */
7649 if (insn
& (1 << 10)) {
7650 if (insn
& (1 << 7))
7652 if (insn
& (1 << 6))
7654 if (insn
& (1 << 5))
7656 if (insn
& (1 << 9))
7657 imm
= CPSR_A
| CPSR_I
| CPSR_F
;
7659 if (insn
& (1 << 8)) {
7661 imm
|= (insn
& 0x1f);
7664 gen_op_movl_T0_im(imm
);
7665 gen_set_psr_T0(s
, offset
, 0);
7668 case 3: /* Special control operations. */
7669 op
= (insn
>> 4) & 0xf;
7672 gen_helper_clrex(cpu_env
);
7677 /* These execute as NOPs. */
7685 /* Trivial implementation equivalent to bx. */
7686 tmp
= load_reg(s
, rn
);
7689 case 5: /* Exception return. */
7690 /* Unpredictable in user mode. */
7692 case 6: /* mrs cpsr. */
7695 addr
= tcg_const_i32(insn
& 0xff);
7696 gen_helper_v7m_mrs(tmp
, cpu_env
, addr
);
7698 gen_helper_cpsr_read(tmp
);
7700 store_reg(s
, rd
, tmp
);
7702 case 7: /* mrs spsr. */
7703 /* Not accessible in user mode. */
7704 if (IS_USER(s
) || IS_M(env
))
7706 tmp
= load_cpu_field(spsr
);
7707 store_reg(s
, rd
, tmp
);
7712 /* Conditional branch. */
7713 op
= (insn
>> 22) & 0xf;
7714 /* Generate a conditional jump to next instruction. */
7715 s
->condlabel
= gen_new_label();
7716 gen_test_cc(op
^ 1, s
->condlabel
);
7719 /* offset[11:1] = insn[10:0] */
7720 offset
= (insn
& 0x7ff) << 1;
7721 /* offset[17:12] = insn[21:16]. */
7722 offset
|= (insn
& 0x003f0000) >> 4;
7723 /* offset[31:20] = insn[26]. */
7724 offset
|= ((int32_t)((insn
<< 5) & 0x80000000)) >> 11;
7725 /* offset[18] = insn[13]. */
7726 offset
|= (insn
& (1 << 13)) << 5;
7727 /* offset[19] = insn[11]. */
7728 offset
|= (insn
& (1 << 11)) << 8;
7730 /* jump to the offset */
7731 gen_jmp(s
, s
->pc
+ offset
);
7734 /* Data processing immediate. */
7735 if (insn
& (1 << 25)) {
7736 if (insn
& (1 << 24)) {
7737 if (insn
& (1 << 20))
7739 /* Bitfield/Saturate. */
7740 op
= (insn
>> 21) & 7;
7742 shift
= ((insn
>> 6) & 3) | ((insn
>> 10) & 0x1c);
7745 tcg_gen_movi_i32(tmp
, 0);
7747 tmp
= load_reg(s
, rn
);
7750 case 2: /* Signed bitfield extract. */
7752 if (shift
+ imm
> 32)
7755 gen_sbfx(tmp
, shift
, imm
);
7757 case 6: /* Unsigned bitfield extract. */
7759 if (shift
+ imm
> 32)
7762 gen_ubfx(tmp
, shift
, (1u << imm
) - 1);
7764 case 3: /* Bitfield insert/clear. */
7767 imm
= imm
+ 1 - shift
;
7769 tmp2
= load_reg(s
, rd
);
7770 gen_bfi(tmp
, tmp2
, tmp
, shift
, (1u << imm
) - 1);
7776 default: /* Saturate. */
7779 tcg_gen_sari_i32(tmp
, tmp
, shift
);
7781 tcg_gen_shli_i32(tmp
, tmp
, shift
);
7783 tmp2
= tcg_const_i32(imm
);
7786 if ((op
& 1) && shift
== 0)
7787 gen_helper_usat16(tmp
, tmp
, tmp2
);
7789 gen_helper_usat(tmp
, tmp
, tmp2
);
7792 if ((op
& 1) && shift
== 0)
7793 gen_helper_ssat16(tmp
, tmp
, tmp2
);
7795 gen_helper_ssat(tmp
, tmp
, tmp2
);
7799 store_reg(s
, rd
, tmp
);
7801 imm
= ((insn
& 0x04000000) >> 15)
7802 | ((insn
& 0x7000) >> 4) | (insn
& 0xff);
7803 if (insn
& (1 << 22)) {
7804 /* 16-bit immediate. */
7805 imm
|= (insn
>> 4) & 0xf000;
7806 if (insn
& (1 << 23)) {
7808 tmp
= load_reg(s
, rd
);
7809 tcg_gen_ext16u_i32(tmp
, tmp
);
7810 tcg_gen_ori_i32(tmp
, tmp
, imm
<< 16);
7814 tcg_gen_movi_i32(tmp
, imm
);
7817 /* Add/sub 12-bit immediate. */
7819 offset
= s
->pc
& ~(uint32_t)3;
7820 if (insn
& (1 << 23))
7825 tcg_gen_movi_i32(tmp
, offset
);
7827 tmp
= load_reg(s
, rn
);
7828 if (insn
& (1 << 23))
7829 tcg_gen_subi_i32(tmp
, tmp
, imm
);
7831 tcg_gen_addi_i32(tmp
, tmp
, imm
);
7834 store_reg(s
, rd
, tmp
);
7837 int shifter_out
= 0;
7838 /* modified 12-bit immediate. */
7839 shift
= ((insn
& 0x04000000) >> 23) | ((insn
& 0x7000) >> 12);
7840 imm
= (insn
& 0xff);
7843 /* Nothing to do. */
7845 case 1: /* 00XY00XY */
7848 case 2: /* XY00XY00 */
7852 case 3: /* XYXYXYXY */
7856 default: /* Rotated constant. */
7857 shift
= (shift
<< 1) | (imm
>> 7);
7859 imm
= imm
<< (32 - shift
);
7863 gen_op_movl_T1_im(imm
);
7864 rn
= (insn
>> 16) & 0xf;
7866 gen_op_movl_T0_im(0);
7868 gen_movl_T0_reg(s
, rn
);
7869 op
= (insn
>> 21) & 0xf;
7870 if (gen_thumb2_data_op(s
, op
, (insn
& (1 << 20)) != 0,
7873 rd
= (insn
>> 8) & 0xf;
7875 gen_movl_reg_T0(s
, rd
);
7880 case 12: /* Load/store single data item. */
7885 if ((insn
& 0x01100000) == 0x01000000) {
7886 if (disas_neon_ls_insn(env
, s
, insn
))
7894 /* s->pc has already been incremented by 4. */
7895 imm
= s
->pc
& 0xfffffffc;
7896 if (insn
& (1 << 23))
7897 imm
+= insn
& 0xfff;
7899 imm
-= insn
& 0xfff;
7900 tcg_gen_movi_i32(addr
, imm
);
7902 addr
= load_reg(s
, rn
);
7903 if (insn
& (1 << 23)) {
7904 /* Positive offset. */
7906 tcg_gen_addi_i32(addr
, addr
, imm
);
7908 op
= (insn
>> 8) & 7;
7911 case 0: case 8: /* Shifted Register. */
7912 shift
= (insn
>> 4) & 0xf;
7915 tmp
= load_reg(s
, rm
);
7917 tcg_gen_shli_i32(tmp
, tmp
, shift
);
7918 tcg_gen_add_i32(addr
, addr
, tmp
);
7921 case 4: /* Negative offset. */
7922 tcg_gen_addi_i32(addr
, addr
, -imm
);
7924 case 6: /* User privilege. */
7925 tcg_gen_addi_i32(addr
, addr
, imm
);
7928 case 1: /* Post-decrement. */
7931 case 3: /* Post-increment. */
7935 case 5: /* Pre-decrement. */
7938 case 7: /* Pre-increment. */
7939 tcg_gen_addi_i32(addr
, addr
, imm
);
7947 op
= ((insn
>> 21) & 3) | ((insn
>> 22) & 4);
7948 if (insn
& (1 << 20)) {
7950 if (rs
== 15 && op
!= 2) {
7953 /* Memory hint. Implemented as NOP. */
7956 case 0: tmp
= gen_ld8u(addr
, user
); break;
7957 case 4: tmp
= gen_ld8s(addr
, user
); break;
7958 case 1: tmp
= gen_ld16u(addr
, user
); break;
7959 case 5: tmp
= gen_ld16s(addr
, user
); break;
7960 case 2: tmp
= gen_ld32(addr
, user
); break;
7961 default: goto illegal_op
;
7966 store_reg(s
, rs
, tmp
);
7973 tmp
= load_reg(s
, rs
);
7975 case 0: gen_st8(tmp
, addr
, user
); break;
7976 case 1: gen_st16(tmp
, addr
, user
); break;
7977 case 2: gen_st32(tmp
, addr
, user
); break;
7978 default: goto illegal_op
;
7982 tcg_gen_addi_i32(addr
, addr
, imm
);
7984 store_reg(s
, rn
, addr
);
7998 static void disas_thumb_insn(CPUState
*env
, DisasContext
*s
)
8000 uint32_t val
, insn
, op
, rm
, rn
, rd
, shift
, cond
;
8007 if (s
->condexec_mask
) {
8008 cond
= s
->condexec_cond
;
8009 s
->condlabel
= gen_new_label();
8010 gen_test_cc(cond
^ 1, s
->condlabel
);
8014 insn
= lduw_code(s
->pc
);
8017 switch (insn
>> 12) {
8020 op
= (insn
>> 11) & 3;
8023 rn
= (insn
>> 3) & 7;
8024 gen_movl_T0_reg(s
, rn
);
8025 if (insn
& (1 << 10)) {
8027 gen_op_movl_T1_im((insn
>> 6) & 7);
8030 rm
= (insn
>> 6) & 7;
8031 gen_movl_T1_reg(s
, rm
);
8033 if (insn
& (1 << 9)) {
8034 if (s
->condexec_mask
)
8035 gen_op_subl_T0_T1();
8037 gen_op_subl_T0_T1_cc();
8039 if (s
->condexec_mask
)
8040 gen_op_addl_T0_T1();
8042 gen_op_addl_T0_T1_cc();
8044 gen_movl_reg_T0(s
, rd
);
8046 /* shift immediate */
8047 rm
= (insn
>> 3) & 7;
8048 shift
= (insn
>> 6) & 0x1f;
8049 tmp
= load_reg(s
, rm
);
8050 gen_arm_shift_im(tmp
, op
, shift
, s
->condexec_mask
== 0);
8051 if (!s
->condexec_mask
)
8053 store_reg(s
, rd
, tmp
);
8057 /* arithmetic large immediate */
8058 op
= (insn
>> 11) & 3;
8059 rd
= (insn
>> 8) & 0x7;
8061 gen_op_movl_T0_im(insn
& 0xff);
8063 gen_movl_T0_reg(s
, rd
);
8064 gen_op_movl_T1_im(insn
& 0xff);
8068 if (!s
->condexec_mask
)
8069 gen_op_logic_T0_cc();
8072 gen_op_subl_T0_T1_cc();
8075 if (s
->condexec_mask
)
8076 gen_op_addl_T0_T1();
8078 gen_op_addl_T0_T1_cc();
8081 if (s
->condexec_mask
)
8082 gen_op_subl_T0_T1();
8084 gen_op_subl_T0_T1_cc();
8088 gen_movl_reg_T0(s
, rd
);
8091 if (insn
& (1 << 11)) {
8092 rd
= (insn
>> 8) & 7;
8093 /* load pc-relative. Bit 1 of PC is ignored. */
8094 val
= s
->pc
+ 2 + ((insn
& 0xff) * 4);
8095 val
&= ~(uint32_t)2;
8097 tcg_gen_movi_i32(addr
, val
);
8098 tmp
= gen_ld32(addr
, IS_USER(s
));
8100 store_reg(s
, rd
, tmp
);
8103 if (insn
& (1 << 10)) {
8104 /* data processing extended or blx */
8105 rd
= (insn
& 7) | ((insn
>> 4) & 8);
8106 rm
= (insn
>> 3) & 0xf;
8107 op
= (insn
>> 8) & 3;
8110 gen_movl_T0_reg(s
, rd
);
8111 gen_movl_T1_reg(s
, rm
);
8112 gen_op_addl_T0_T1();
8113 gen_movl_reg_T0(s
, rd
);
8116 gen_movl_T0_reg(s
, rd
);
8117 gen_movl_T1_reg(s
, rm
);
8118 gen_op_subl_T0_T1_cc();
8120 case 2: /* mov/cpy */
8121 gen_movl_T0_reg(s
, rm
);
8122 gen_movl_reg_T0(s
, rd
);
8124 case 3:/* branch [and link] exchange thumb register */
8125 tmp
= load_reg(s
, rm
);
8126 if (insn
& (1 << 7)) {
8127 val
= (uint32_t)s
->pc
| 1;
8129 tcg_gen_movi_i32(tmp2
, val
);
8130 store_reg(s
, 14, tmp2
);
8138 /* data processing register */
8140 rm
= (insn
>> 3) & 7;
8141 op
= (insn
>> 6) & 0xf;
8142 if (op
== 2 || op
== 3 || op
== 4 || op
== 7) {
8143 /* the shift/rotate ops want the operands backwards */
8152 if (op
== 9) /* neg */
8153 gen_op_movl_T0_im(0);
8154 else if (op
!= 0xf) /* mvn doesn't read its first operand */
8155 gen_movl_T0_reg(s
, rd
);
8157 gen_movl_T1_reg(s
, rm
);
8160 gen_op_andl_T0_T1();
8161 if (!s
->condexec_mask
)
8162 gen_op_logic_T0_cc();
8165 gen_op_xorl_T0_T1();
8166 if (!s
->condexec_mask
)
8167 gen_op_logic_T0_cc();
8170 if (s
->condexec_mask
) {
8171 gen_helper_shl(cpu_T
[1], cpu_T
[1], cpu_T
[0]);
8173 gen_helper_shl_cc(cpu_T
[1], cpu_T
[1], cpu_T
[0]);
8174 gen_op_logic_T1_cc();
8178 if (s
->condexec_mask
) {
8179 gen_helper_shr(cpu_T
[1], cpu_T
[1], cpu_T
[0]);
8181 gen_helper_shr_cc(cpu_T
[1], cpu_T
[1], cpu_T
[0]);
8182 gen_op_logic_T1_cc();
8186 if (s
->condexec_mask
) {
8187 gen_helper_sar(cpu_T
[1], cpu_T
[1], cpu_T
[0]);
8189 gen_helper_sar_cc(cpu_T
[1], cpu_T
[1], cpu_T
[0]);
8190 gen_op_logic_T1_cc();
8194 if (s
->condexec_mask
)
8197 gen_op_adcl_T0_T1_cc();
8200 if (s
->condexec_mask
)
8203 gen_op_sbcl_T0_T1_cc();
8206 if (s
->condexec_mask
) {
8207 gen_helper_ror(cpu_T
[1], cpu_T
[1], cpu_T
[0]);
8209 gen_helper_ror_cc(cpu_T
[1], cpu_T
[1], cpu_T
[0]);
8210 gen_op_logic_T1_cc();
8214 gen_op_andl_T0_T1();
8215 gen_op_logic_T0_cc();
8219 if (s
->condexec_mask
)
8220 tcg_gen_neg_i32(cpu_T
[0], cpu_T
[1]);
8222 gen_op_subl_T0_T1_cc();
8225 gen_op_subl_T0_T1_cc();
8229 gen_op_addl_T0_T1_cc();
8234 if (!s
->condexec_mask
)
8235 gen_op_logic_T0_cc();
8238 gen_op_mull_T0_T1();
8239 if (!s
->condexec_mask
)
8240 gen_op_logic_T0_cc();
8243 gen_op_bicl_T0_T1();
8244 if (!s
->condexec_mask
)
8245 gen_op_logic_T0_cc();
8249 if (!s
->condexec_mask
)
8250 gen_op_logic_T1_cc();
8257 gen_movl_reg_T1(s
, rm
);
8259 gen_movl_reg_T0(s
, rd
);
8264 /* load/store register offset. */
8266 rn
= (insn
>> 3) & 7;
8267 rm
= (insn
>> 6) & 7;
8268 op
= (insn
>> 9) & 7;
8269 addr
= load_reg(s
, rn
);
8270 tmp
= load_reg(s
, rm
);
8271 tcg_gen_add_i32(addr
, addr
, tmp
);
8274 if (op
< 3) /* store */
8275 tmp
= load_reg(s
, rd
);
8279 gen_st32(tmp
, addr
, IS_USER(s
));
8282 gen_st16(tmp
, addr
, IS_USER(s
));
8285 gen_st8(tmp
, addr
, IS_USER(s
));
8288 tmp
= gen_ld8s(addr
, IS_USER(s
));
8291 tmp
= gen_ld32(addr
, IS_USER(s
));
8294 tmp
= gen_ld16u(addr
, IS_USER(s
));
8297 tmp
= gen_ld8u(addr
, IS_USER(s
));
8300 tmp
= gen_ld16s(addr
, IS_USER(s
));
8303 if (op
>= 3) /* load */
8304 store_reg(s
, rd
, tmp
);
8309 /* load/store word immediate offset */
8311 rn
= (insn
>> 3) & 7;
8312 addr
= load_reg(s
, rn
);
8313 val
= (insn
>> 4) & 0x7c;
8314 tcg_gen_addi_i32(addr
, addr
, val
);
8316 if (insn
& (1 << 11)) {
8318 tmp
= gen_ld32(addr
, IS_USER(s
));
8319 store_reg(s
, rd
, tmp
);
8322 tmp
= load_reg(s
, rd
);
8323 gen_st32(tmp
, addr
, IS_USER(s
));
8329 /* load/store byte immediate offset */
8331 rn
= (insn
>> 3) & 7;
8332 addr
= load_reg(s
, rn
);
8333 val
= (insn
>> 6) & 0x1f;
8334 tcg_gen_addi_i32(addr
, addr
, val
);
8336 if (insn
& (1 << 11)) {
8338 tmp
= gen_ld8u(addr
, IS_USER(s
));
8339 store_reg(s
, rd
, tmp
);
8342 tmp
= load_reg(s
, rd
);
8343 gen_st8(tmp
, addr
, IS_USER(s
));
8349 /* load/store halfword immediate offset */
8351 rn
= (insn
>> 3) & 7;
8352 addr
= load_reg(s
, rn
);
8353 val
= (insn
>> 5) & 0x3e;
8354 tcg_gen_addi_i32(addr
, addr
, val
);
8356 if (insn
& (1 << 11)) {
8358 tmp
= gen_ld16u(addr
, IS_USER(s
));
8359 store_reg(s
, rd
, tmp
);
8362 tmp
= load_reg(s
, rd
);
8363 gen_st16(tmp
, addr
, IS_USER(s
));
8369 /* load/store from stack */
8370 rd
= (insn
>> 8) & 7;
8371 addr
= load_reg(s
, 13);
8372 val
= (insn
& 0xff) * 4;
8373 tcg_gen_addi_i32(addr
, addr
, val
);
8375 if (insn
& (1 << 11)) {
8377 tmp
= gen_ld32(addr
, IS_USER(s
));
8378 store_reg(s
, rd
, tmp
);
8381 tmp
= load_reg(s
, rd
);
8382 gen_st32(tmp
, addr
, IS_USER(s
));
8388 /* add to high reg */
8389 rd
= (insn
>> 8) & 7;
8390 if (insn
& (1 << 11)) {
8392 tmp
= load_reg(s
, 13);
8394 /* PC. bit 1 is ignored. */
8396 tcg_gen_movi_i32(tmp
, (s
->pc
+ 2) & ~(uint32_t)2);
8398 val
= (insn
& 0xff) * 4;
8399 tcg_gen_addi_i32(tmp
, tmp
, val
);
8400 store_reg(s
, rd
, tmp
);
8405 op
= (insn
>> 8) & 0xf;
8408 /* adjust stack pointer */
8409 tmp
= load_reg(s
, 13);
8410 val
= (insn
& 0x7f) * 4;
8411 if (insn
& (1 << 7))
8412 val
= -(int32_t)val
;
8413 tcg_gen_addi_i32(tmp
, tmp
, val
);
8414 store_reg(s
, 13, tmp
);
8417 case 2: /* sign/zero extend. */
8420 rm
= (insn
>> 3) & 7;
8421 tmp
= load_reg(s
, rm
);
8422 switch ((insn
>> 6) & 3) {
8423 case 0: gen_sxth(tmp
); break;
8424 case 1: gen_sxtb(tmp
); break;
8425 case 2: gen_uxth(tmp
); break;
8426 case 3: gen_uxtb(tmp
); break;
8428 store_reg(s
, rd
, tmp
);
8430 case 4: case 5: case 0xc: case 0xd:
8432 addr
= load_reg(s
, 13);
8433 if (insn
& (1 << 8))
8437 for (i
= 0; i
< 8; i
++) {
8438 if (insn
& (1 << i
))
8441 if ((insn
& (1 << 11)) == 0) {
8442 tcg_gen_addi_i32(addr
, addr
, -offset
);
8444 for (i
= 0; i
< 8; i
++) {
8445 if (insn
& (1 << i
)) {
8446 if (insn
& (1 << 11)) {
8448 tmp
= gen_ld32(addr
, IS_USER(s
));
8449 store_reg(s
, i
, tmp
);
8452 tmp
= load_reg(s
, i
);
8453 gen_st32(tmp
, addr
, IS_USER(s
));
8455 /* advance to the next address. */
8456 tcg_gen_addi_i32(addr
, addr
, 4);
8460 if (insn
& (1 << 8)) {
8461 if (insn
& (1 << 11)) {
8463 tmp
= gen_ld32(addr
, IS_USER(s
));
8464 /* don't set the pc until the rest of the instruction
8468 tmp
= load_reg(s
, 14);
8469 gen_st32(tmp
, addr
, IS_USER(s
));
8471 tcg_gen_addi_i32(addr
, addr
, 4);
8473 if ((insn
& (1 << 11)) == 0) {
8474 tcg_gen_addi_i32(addr
, addr
, -offset
);
8476 /* write back the new stack pointer */
8477 store_reg(s
, 13, addr
);
8478 /* set the new PC value */
8479 if ((insn
& 0x0900) == 0x0900)
8483 case 1: case 3: case 9: case 11: /* czb */
8485 tmp
= load_reg(s
, rm
);
8486 s
->condlabel
= gen_new_label();
8488 if (insn
& (1 << 11))
8489 tcg_gen_brcondi_i32(TCG_COND_EQ
, tmp
, 0, s
->condlabel
);
8491 tcg_gen_brcondi_i32(TCG_COND_NE
, tmp
, 0, s
->condlabel
);
8493 offset
= ((insn
& 0xf8) >> 2) | (insn
& 0x200) >> 3;
8494 val
= (uint32_t)s
->pc
+ 2;
8499 case 15: /* IT, nop-hint. */
8500 if ((insn
& 0xf) == 0) {
8501 gen_nop_hint(s
, (insn
>> 4) & 0xf);
8505 s
->condexec_cond
= (insn
>> 4) & 0xe;
8506 s
->condexec_mask
= insn
& 0x1f;
8507 /* No actual code generated for this insn, just setup state. */
8510 case 0xe: /* bkpt */
8511 gen_set_condexec(s
);
8512 gen_set_pc_im(s
->pc
- 2);
8513 gen_exception(EXCP_BKPT
);
8514 s
->is_jmp
= DISAS_JUMP
;
8519 rn
= (insn
>> 3) & 0x7;
8521 tmp
= load_reg(s
, rn
);
8522 switch ((insn
>> 6) & 3) {
8523 case 0: tcg_gen_bswap32_i32(tmp
, tmp
); break;
8524 case 1: gen_rev16(tmp
); break;
8525 case 3: gen_revsh(tmp
); break;
8526 default: goto illegal_op
;
8528 store_reg(s
, rd
, tmp
);
8536 tmp
= tcg_const_i32((insn
& (1 << 4)) != 0);
8539 addr
= tcg_const_i32(16);
8540 gen_helper_v7m_msr(cpu_env
, addr
, tmp
);
8544 addr
= tcg_const_i32(17);
8545 gen_helper_v7m_msr(cpu_env
, addr
, tmp
);
8549 if (insn
& (1 << 4))
8550 shift
= CPSR_A
| CPSR_I
| CPSR_F
;
8554 val
= ((insn
& 7) << 6) & shift
;
8555 gen_op_movl_T0_im(val
);
8556 gen_set_psr_T0(s
, shift
, 0);
8566 /* load/store multiple */
8567 rn
= (insn
>> 8) & 0x7;
8568 addr
= load_reg(s
, rn
);
8569 for (i
= 0; i
< 8; i
++) {
8570 if (insn
& (1 << i
)) {
8571 if (insn
& (1 << 11)) {
8573 tmp
= gen_ld32(addr
, IS_USER(s
));
8574 store_reg(s
, i
, tmp
);
8577 tmp
= load_reg(s
, i
);
8578 gen_st32(tmp
, addr
, IS_USER(s
));
8580 /* advance to the next address */
8581 tcg_gen_addi_i32(addr
, addr
, 4);
8584 /* Base register writeback. */
8585 if ((insn
& (1 << rn
)) == 0) {
8586 store_reg(s
, rn
, addr
);
8593 /* conditional branch or swi */
8594 cond
= (insn
>> 8) & 0xf;
8600 gen_set_condexec(s
);
8601 gen_set_pc_im(s
->pc
);
8602 s
->is_jmp
= DISAS_SWI
;
8605 /* generate a conditional jump to next instruction */
8606 s
->condlabel
= gen_new_label();
8607 gen_test_cc(cond
^ 1, s
->condlabel
);
8609 gen_movl_T1_reg(s
, 15);
8611 /* jump to the offset */
8612 val
= (uint32_t)s
->pc
+ 2;
8613 offset
= ((int32_t)insn
<< 24) >> 24;
8619 if (insn
& (1 << 11)) {
8620 if (disas_thumb2_insn(env
, s
, insn
))
8624 /* unconditional branch */
8625 val
= (uint32_t)s
->pc
;
8626 offset
= ((int32_t)insn
<< 21) >> 21;
8627 val
+= (offset
<< 1) + 2;
8632 if (disas_thumb2_insn(env
, s
, insn
))
8638 gen_set_condexec(s
);
8639 gen_set_pc_im(s
->pc
- 4);
8640 gen_exception(EXCP_UDEF
);
8641 s
->is_jmp
= DISAS_JUMP
;
8645 gen_set_condexec(s
);
8646 gen_set_pc_im(s
->pc
- 2);
8647 gen_exception(EXCP_UDEF
);
8648 s
->is_jmp
= DISAS_JUMP
;
8651 /* generate intermediate code in gen_opc_buf and gen_opparam_buf for
8652 basic block 'tb'. If search_pc is TRUE, also generate PC
8653 information for each intermediate instruction. */
8654 static inline void gen_intermediate_code_internal(CPUState
*env
,
8655 TranslationBlock
*tb
,
8658 DisasContext dc1
, *dc
= &dc1
;
8660 uint16_t *gen_opc_end
;
8662 target_ulong pc_start
;
8663 uint32_t next_page_start
;
8667 /* generate intermediate code */
8669 memset(temps
, 0, sizeof(temps
));
8675 gen_opc_end
= gen_opc_buf
+ OPC_MAX_SIZE
;
8677 dc
->is_jmp
= DISAS_NEXT
;
8679 dc
->singlestep_enabled
= env
->singlestep_enabled
;
8681 dc
->thumb
= env
->thumb
;
8682 dc
->condexec_mask
= (env
->condexec_bits
& 0xf) << 1;
8683 dc
->condexec_cond
= env
->condexec_bits
>> 4;
8684 #if !defined(CONFIG_USER_ONLY)
8686 dc
->user
= ((env
->v7m
.exception
== 0) && (env
->v7m
.control
& 1));
8688 dc
->user
= (env
->uncached_cpsr
& 0x1f) == ARM_CPU_MODE_USR
;
8691 cpu_F0s
= tcg_temp_new_i32();
8692 cpu_F1s
= tcg_temp_new_i32();
8693 cpu_F0d
= tcg_temp_new_i64();
8694 cpu_F1d
= tcg_temp_new_i64();
8697 /* FIXME: cpu_M0 can probably be the same as cpu_V0. */
8698 cpu_M0
= tcg_temp_new_i64();
8699 next_page_start
= (pc_start
& TARGET_PAGE_MASK
) + TARGET_PAGE_SIZE
;
8702 max_insns
= tb
->cflags
& CF_COUNT_MASK
;
8704 max_insns
= CF_COUNT_MASK
;
8707 /* Reset the conditional execution bits immediately. This avoids
8708 complications trying to do it at the end of the block. */
8709 if (env
->condexec_bits
)
8711 TCGv tmp
= new_tmp();
8712 tcg_gen_movi_i32(tmp
, 0);
8713 store_cpu_field(tmp
, condexec_bits
);
8716 #ifdef CONFIG_USER_ONLY
8717 /* Intercept jump to the magic kernel page. */
8718 if (dc
->pc
>= 0xffff0000) {
8719 /* We always get here via a jump, so know we are not in a
8720 conditional execution block. */
8721 gen_exception(EXCP_KERNEL_TRAP
);
8722 dc
->is_jmp
= DISAS_UPDATE
;
8726 if (dc
->pc
>= 0xfffffff0 && IS_M(env
)) {
8727 /* We always get here via a jump, so know we are not in a
8728 conditional execution block. */
8729 gen_exception(EXCP_EXCEPTION_EXIT
);
8730 dc
->is_jmp
= DISAS_UPDATE
;
8735 if (unlikely(!TAILQ_EMPTY(&env
->breakpoints
))) {
8736 TAILQ_FOREACH(bp
, &env
->breakpoints
, entry
) {
8737 if (bp
->pc
== dc
->pc
) {
8738 gen_set_condexec(dc
);
8739 gen_set_pc_im(dc
->pc
);
8740 gen_exception(EXCP_DEBUG
);
8741 dc
->is_jmp
= DISAS_JUMP
;
8742 /* Advance PC so that clearing the breakpoint will
8743 invalidate this TB. */
8745 goto done_generating
;
8751 j
= gen_opc_ptr
- gen_opc_buf
;
8755 gen_opc_instr_start
[lj
++] = 0;
8757 gen_opc_pc
[lj
] = dc
->pc
;
8758 gen_opc_instr_start
[lj
] = 1;
8759 gen_opc_icount
[lj
] = num_insns
;
8762 if (num_insns
+ 1 == max_insns
&& (tb
->cflags
& CF_LAST_IO
))
8766 disas_thumb_insn(env
, dc
);
8767 if (dc
->condexec_mask
) {
8768 dc
->condexec_cond
= (dc
->condexec_cond
& 0xe)
8769 | ((dc
->condexec_mask
>> 4) & 1);
8770 dc
->condexec_mask
= (dc
->condexec_mask
<< 1) & 0x1f;
8771 if (dc
->condexec_mask
== 0) {
8772 dc
->condexec_cond
= 0;
8776 disas_arm_insn(env
, dc
);
8779 fprintf(stderr
, "Internal resource leak before %08x\n", dc
->pc
);
8783 if (dc
->condjmp
&& !dc
->is_jmp
) {
8784 gen_set_label(dc
->condlabel
);
8787 /* Translation stops when a conditional branch is encountered.
8788 * Otherwise the subsequent code could get translated several times.
8789 * Also stop translation when a page boundary is reached. This
8790 * ensures prefetch aborts occur at the right place. */
8792 } while (!dc
->is_jmp
&& gen_opc_ptr
< gen_opc_end
&&
8793 !env
->singlestep_enabled
&&
8795 dc
->pc
< next_page_start
&&
8796 num_insns
< max_insns
);
8798 if (tb
->cflags
& CF_LAST_IO
) {
8800 /* FIXME: This can theoretically happen with self-modifying
8802 cpu_abort(env
, "IO on conditional branch instruction");
8807 /* At this stage dc->condjmp will only be set when the skipped
8808 instruction was a conditional branch or trap, and the PC has
8809 already been written. */
8810 if (unlikely(env
->singlestep_enabled
)) {
8811 /* Make sure the pc is updated, and raise a debug exception. */
8813 gen_set_condexec(dc
);
8814 if (dc
->is_jmp
== DISAS_SWI
) {
8815 gen_exception(EXCP_SWI
);
8817 gen_exception(EXCP_DEBUG
);
8819 gen_set_label(dc
->condlabel
);
8821 if (dc
->condjmp
|| !dc
->is_jmp
) {
8822 gen_set_pc_im(dc
->pc
);
8825 gen_set_condexec(dc
);
8826 if (dc
->is_jmp
== DISAS_SWI
&& !dc
->condjmp
) {
8827 gen_exception(EXCP_SWI
);
8829 /* FIXME: Single stepping a WFI insn will not halt
8831 gen_exception(EXCP_DEBUG
);
8834 /* While branches must always occur at the end of an IT block,
8835 there are a few other things that can cause us to terminate
8836 the TB in the middel of an IT block:
8837 - Exception generating instructions (bkpt, swi, undefined).
8839 - Hardware watchpoints.
8840 Hardware breakpoints have already been handled and skip this code.
8842 gen_set_condexec(dc
);
8843 switch(dc
->is_jmp
) {
8845 gen_goto_tb(dc
, 1, dc
->pc
);
8850 /* indicate that the hash table must be used to find the next TB */
8854 /* nothing more to generate */
8860 gen_exception(EXCP_SWI
);
8864 gen_set_label(dc
->condlabel
);
8865 gen_set_condexec(dc
);
8866 gen_goto_tb(dc
, 1, dc
->pc
);
8872 gen_icount_end(tb
, num_insns
);
8873 *gen_opc_ptr
= INDEX_op_end
;
8876 if (qemu_loglevel_mask(CPU_LOG_TB_IN_ASM
)) {
8877 qemu_log("----------------\n");
8878 qemu_log("IN: %s\n", lookup_symbol(pc_start
));
8879 log_target_disas(pc_start
, dc
->pc
- pc_start
, env
->thumb
);
8884 j
= gen_opc_ptr
- gen_opc_buf
;
8887 gen_opc_instr_start
[lj
++] = 0;
8889 tb
->size
= dc
->pc
- pc_start
;
8890 tb
->icount
= num_insns
;
8894 void gen_intermediate_code(CPUState
*env
, TranslationBlock
*tb
)
8896 gen_intermediate_code_internal(env
, tb
, 0);
8899 void gen_intermediate_code_pc(CPUState
*env
, TranslationBlock
*tb
)
8901 gen_intermediate_code_internal(env
, tb
, 1);
8904 static const char *cpu_mode_names
[16] = {
8905 "usr", "fiq", "irq", "svc", "???", "???", "???", "abt",
8906 "???", "???", "???", "und", "???", "???", "???", "sys"
8909 void cpu_dump_state(CPUState
*env
, FILE *f
,
8910 int (*cpu_fprintf
)(FILE *f
, const char *fmt
, ...),
8920 /* ??? This assumes float64 and double have the same layout.
8921 Oh well, it's only debug dumps. */
8930 cpu_fprintf(f
, "R%02d=%08x", i
, env
->regs
[i
]);
8932 cpu_fprintf(f
, "\n");
8934 cpu_fprintf(f
, " ");
8936 psr
= cpsr_read(env
);
8937 cpu_fprintf(f
, "PSR=%08x %c%c%c%c %c %s%d\n",
8939 psr
& (1 << 31) ? 'N' : '-',
8940 psr
& (1 << 30) ? 'Z' : '-',
8941 psr
& (1 << 29) ? 'C' : '-',
8942 psr
& (1 << 28) ? 'V' : '-',
8943 psr
& CPSR_T
? 'T' : 'A',
8944 cpu_mode_names
[psr
& 0xf], (psr
& 0x10) ? 32 : 26);
8947 for (i
= 0; i
< 16; i
++) {
8948 d
.d
= env
->vfp
.regs
[i
];
8952 cpu_fprintf(f
, "s%02d=%08x(%8g) s%02d=%08x(%8g) d%02d=%08x%08x(%8g)\n",
8953 i
* 2, (int)s0
.i
, s0
.s
,
8954 i
* 2 + 1, (int)s1
.i
, s1
.s
,
8955 i
, (int)(uint32_t)d
.l
.upper
, (int)(uint32_t)d
.l
.lower
,
8958 cpu_fprintf(f
, "FPSCR: %08x\n", (int)env
->vfp
.xregs
[ARM_VFP_FPSCR
]);
8962 void gen_pc_load(CPUState
*env
, TranslationBlock
*tb
,
8963 unsigned long searched_pc
, int pc_pos
, void *puc
)
8965 env
->regs
[15] = gen_opc_pc
[pc_pos
];