x86: Filter out garbage from segment flags dump
[qemu.git] / target-arm / translate.c
blob8d494ec9248f884b36ae220ef75e6acedb665b26
1 /*
2 * ARM translation
4 * Copyright (c) 2003 Fabrice Bellard
5 * Copyright (c) 2005-2007 CodeSourcery
6 * Copyright (c) 2007 OpenedHand, Ltd.
8 * This library is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License as published by the Free Software Foundation; either
11 * version 2 of the License, or (at your option) any later version.
13 * This library is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 * Lesser General Public License for more details.
18 * You should have received a copy of the GNU Lesser General Public
19 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
21 #include <stdarg.h>
22 #include <stdlib.h>
23 #include <stdio.h>
24 #include <string.h>
25 #include <inttypes.h>
27 #include "cpu.h"
28 #include "exec-all.h"
29 #include "disas.h"
30 #include "tcg-op.h"
31 #include "qemu-log.h"
33 #include "helpers.h"
34 #define GEN_HELPER 1
35 #include "helpers.h"
37 #define ENABLE_ARCH_5J 0
38 #define ENABLE_ARCH_6 arm_feature(env, ARM_FEATURE_V6)
39 #define ENABLE_ARCH_6K arm_feature(env, ARM_FEATURE_V6K)
40 #define ENABLE_ARCH_6T2 arm_feature(env, ARM_FEATURE_THUMB2)
41 #define ENABLE_ARCH_7 arm_feature(env, ARM_FEATURE_V7)
43 #define ARCH(x) do { if (!ENABLE_ARCH_##x) goto illegal_op; } while(0)
45 /* internal defines */
46 typedef struct DisasContext {
47 target_ulong pc;
48 int is_jmp;
49 /* Nonzero if this instruction has been conditionally skipped. */
50 int condjmp;
51 /* The label that will be jumped to when the instruction is skipped. */
52 int condlabel;
53 /* Thumb-2 condtional execution bits. */
54 int condexec_mask;
55 int condexec_cond;
56 struct TranslationBlock *tb;
57 int singlestep_enabled;
58 int thumb;
59 #if !defined(CONFIG_USER_ONLY)
60 int user;
61 #endif
62 } DisasContext;
64 #if defined(CONFIG_USER_ONLY)
65 #define IS_USER(s) 1
66 #else
67 #define IS_USER(s) (s->user)
68 #endif
70 /* These instructions trap after executing, so defer them until after the
71 conditional executions state has been updated. */
72 #define DISAS_WFI 4
73 #define DISAS_SWI 5
75 static TCGv_ptr cpu_env;
76 /* We reuse the same 64-bit temporaries for efficiency. */
77 static TCGv_i64 cpu_V0, cpu_V1, cpu_M0;
78 static TCGv_i32 cpu_R[16];
79 static TCGv_i32 cpu_exclusive_addr;
80 static TCGv_i32 cpu_exclusive_val;
81 static TCGv_i32 cpu_exclusive_high;
82 #ifdef CONFIG_USER_ONLY
83 static TCGv_i32 cpu_exclusive_test;
84 static TCGv_i32 cpu_exclusive_info;
85 #endif
87 /* FIXME: These should be removed. */
88 static TCGv cpu_F0s, cpu_F1s;
89 static TCGv_i64 cpu_F0d, cpu_F1d;
91 #include "gen-icount.h"
93 static const char *regnames[] =
94 { "r0", "r1", "r2", "r3", "r4", "r5", "r6", "r7",
95 "r8", "r9", "r10", "r11", "r12", "r13", "r14", "pc" };
97 /* initialize TCG globals. */
98 void arm_translate_init(void)
100 int i;
102 cpu_env = tcg_global_reg_new_ptr(TCG_AREG0, "env");
104 for (i = 0; i < 16; i++) {
105 cpu_R[i] = tcg_global_mem_new_i32(TCG_AREG0,
106 offsetof(CPUState, regs[i]),
107 regnames[i]);
109 cpu_exclusive_addr = tcg_global_mem_new_i32(TCG_AREG0,
110 offsetof(CPUState, exclusive_addr), "exclusive_addr");
111 cpu_exclusive_val = tcg_global_mem_new_i32(TCG_AREG0,
112 offsetof(CPUState, exclusive_val), "exclusive_val");
113 cpu_exclusive_high = tcg_global_mem_new_i32(TCG_AREG0,
114 offsetof(CPUState, exclusive_high), "exclusive_high");
115 #ifdef CONFIG_USER_ONLY
116 cpu_exclusive_test = tcg_global_mem_new_i32(TCG_AREG0,
117 offsetof(CPUState, exclusive_test), "exclusive_test");
118 cpu_exclusive_info = tcg_global_mem_new_i32(TCG_AREG0,
119 offsetof(CPUState, exclusive_info), "exclusive_info");
120 #endif
122 #define GEN_HELPER 2
123 #include "helpers.h"
126 static int num_temps;
128 /* Allocate a temporary variable. */
129 static TCGv_i32 new_tmp(void)
131 num_temps++;
132 return tcg_temp_new_i32();
135 /* Release a temporary variable. */
136 static void dead_tmp(TCGv tmp)
138 tcg_temp_free(tmp);
139 num_temps--;
142 static inline TCGv load_cpu_offset(int offset)
144 TCGv tmp = new_tmp();
145 tcg_gen_ld_i32(tmp, cpu_env, offset);
146 return tmp;
149 #define load_cpu_field(name) load_cpu_offset(offsetof(CPUState, name))
151 static inline void store_cpu_offset(TCGv var, int offset)
153 tcg_gen_st_i32(var, cpu_env, offset);
154 dead_tmp(var);
157 #define store_cpu_field(var, name) \
158 store_cpu_offset(var, offsetof(CPUState, name))
160 /* Set a variable to the value of a CPU register. */
161 static void load_reg_var(DisasContext *s, TCGv var, int reg)
163 if (reg == 15) {
164 uint32_t addr;
165 /* normaly, since we updated PC, we need only to add one insn */
166 if (s->thumb)
167 addr = (long)s->pc + 2;
168 else
169 addr = (long)s->pc + 4;
170 tcg_gen_movi_i32(var, addr);
171 } else {
172 tcg_gen_mov_i32(var, cpu_R[reg]);
176 /* Create a new temporary and set it to the value of a CPU register. */
177 static inline TCGv load_reg(DisasContext *s, int reg)
179 TCGv tmp = new_tmp();
180 load_reg_var(s, tmp, reg);
181 return tmp;
184 /* Set a CPU register. The source must be a temporary and will be
185 marked as dead. */
186 static void store_reg(DisasContext *s, int reg, TCGv var)
188 if (reg == 15) {
189 tcg_gen_andi_i32(var, var, ~1);
190 s->is_jmp = DISAS_JUMP;
192 tcg_gen_mov_i32(cpu_R[reg], var);
193 dead_tmp(var);
196 /* Value extensions. */
197 #define gen_uxtb(var) tcg_gen_ext8u_i32(var, var)
198 #define gen_uxth(var) tcg_gen_ext16u_i32(var, var)
199 #define gen_sxtb(var) tcg_gen_ext8s_i32(var, var)
200 #define gen_sxth(var) tcg_gen_ext16s_i32(var, var)
202 #define gen_sxtb16(var) gen_helper_sxtb16(var, var)
203 #define gen_uxtb16(var) gen_helper_uxtb16(var, var)
206 static inline void gen_set_cpsr(TCGv var, uint32_t mask)
208 TCGv tmp_mask = tcg_const_i32(mask);
209 gen_helper_cpsr_write(var, tmp_mask);
210 tcg_temp_free_i32(tmp_mask);
212 /* Set NZCV flags from the high 4 bits of var. */
213 #define gen_set_nzcv(var) gen_set_cpsr(var, CPSR_NZCV)
215 static void gen_exception(int excp)
217 TCGv tmp = new_tmp();
218 tcg_gen_movi_i32(tmp, excp);
219 gen_helper_exception(tmp);
220 dead_tmp(tmp);
223 static void gen_smul_dual(TCGv a, TCGv b)
225 TCGv tmp1 = new_tmp();
226 TCGv tmp2 = new_tmp();
227 tcg_gen_ext16s_i32(tmp1, a);
228 tcg_gen_ext16s_i32(tmp2, b);
229 tcg_gen_mul_i32(tmp1, tmp1, tmp2);
230 dead_tmp(tmp2);
231 tcg_gen_sari_i32(a, a, 16);
232 tcg_gen_sari_i32(b, b, 16);
233 tcg_gen_mul_i32(b, b, a);
234 tcg_gen_mov_i32(a, tmp1);
235 dead_tmp(tmp1);
238 /* Byteswap each halfword. */
239 static void gen_rev16(TCGv var)
241 TCGv tmp = new_tmp();
242 tcg_gen_shri_i32(tmp, var, 8);
243 tcg_gen_andi_i32(tmp, tmp, 0x00ff00ff);
244 tcg_gen_shli_i32(var, var, 8);
245 tcg_gen_andi_i32(var, var, 0xff00ff00);
246 tcg_gen_or_i32(var, var, tmp);
247 dead_tmp(tmp);
250 /* Byteswap low halfword and sign extend. */
251 static void gen_revsh(TCGv var)
253 tcg_gen_ext16u_i32(var, var);
254 tcg_gen_bswap16_i32(var, var);
255 tcg_gen_ext16s_i32(var, var);
258 /* Unsigned bitfield extract. */
259 static void gen_ubfx(TCGv var, int shift, uint32_t mask)
261 if (shift)
262 tcg_gen_shri_i32(var, var, shift);
263 tcg_gen_andi_i32(var, var, mask);
266 /* Signed bitfield extract. */
267 static void gen_sbfx(TCGv var, int shift, int width)
269 uint32_t signbit;
271 if (shift)
272 tcg_gen_sari_i32(var, var, shift);
273 if (shift + width < 32) {
274 signbit = 1u << (width - 1);
275 tcg_gen_andi_i32(var, var, (1u << width) - 1);
276 tcg_gen_xori_i32(var, var, signbit);
277 tcg_gen_subi_i32(var, var, signbit);
281 /* Bitfield insertion. Insert val into base. Clobbers base and val. */
282 static void gen_bfi(TCGv dest, TCGv base, TCGv val, int shift, uint32_t mask)
284 tcg_gen_andi_i32(val, val, mask);
285 tcg_gen_shli_i32(val, val, shift);
286 tcg_gen_andi_i32(base, base, ~(mask << shift));
287 tcg_gen_or_i32(dest, base, val);
290 /* Round the top 32 bits of a 64-bit value. */
291 static void gen_roundqd(TCGv a, TCGv b)
293 tcg_gen_shri_i32(a, a, 31);
294 tcg_gen_add_i32(a, a, b);
297 /* FIXME: Most targets have native widening multiplication.
298 It would be good to use that instead of a full wide multiply. */
299 /* 32x32->64 multiply. Marks inputs as dead. */
300 static TCGv_i64 gen_mulu_i64_i32(TCGv a, TCGv b)
302 TCGv_i64 tmp1 = tcg_temp_new_i64();
303 TCGv_i64 tmp2 = tcg_temp_new_i64();
305 tcg_gen_extu_i32_i64(tmp1, a);
306 dead_tmp(a);
307 tcg_gen_extu_i32_i64(tmp2, b);
308 dead_tmp(b);
309 tcg_gen_mul_i64(tmp1, tmp1, tmp2);
310 tcg_temp_free_i64(tmp2);
311 return tmp1;
314 static TCGv_i64 gen_muls_i64_i32(TCGv a, TCGv b)
316 TCGv_i64 tmp1 = tcg_temp_new_i64();
317 TCGv_i64 tmp2 = tcg_temp_new_i64();
319 tcg_gen_ext_i32_i64(tmp1, a);
320 dead_tmp(a);
321 tcg_gen_ext_i32_i64(tmp2, b);
322 dead_tmp(b);
323 tcg_gen_mul_i64(tmp1, tmp1, tmp2);
324 tcg_temp_free_i64(tmp2);
325 return tmp1;
328 /* Signed 32x32->64 multiply. */
329 static void gen_imull(TCGv a, TCGv b)
331 TCGv_i64 tmp1 = tcg_temp_new_i64();
332 TCGv_i64 tmp2 = tcg_temp_new_i64();
334 tcg_gen_ext_i32_i64(tmp1, a);
335 tcg_gen_ext_i32_i64(tmp2, b);
336 tcg_gen_mul_i64(tmp1, tmp1, tmp2);
337 tcg_temp_free_i64(tmp2);
338 tcg_gen_trunc_i64_i32(a, tmp1);
339 tcg_gen_shri_i64(tmp1, tmp1, 32);
340 tcg_gen_trunc_i64_i32(b, tmp1);
341 tcg_temp_free_i64(tmp1);
344 /* Swap low and high halfwords. */
345 static void gen_swap_half(TCGv var)
347 TCGv tmp = new_tmp();
348 tcg_gen_shri_i32(tmp, var, 16);
349 tcg_gen_shli_i32(var, var, 16);
350 tcg_gen_or_i32(var, var, tmp);
351 dead_tmp(tmp);
354 /* Dual 16-bit add. Result placed in t0 and t1 is marked as dead.
355 tmp = (t0 ^ t1) & 0x8000;
356 t0 &= ~0x8000;
357 t1 &= ~0x8000;
358 t0 = (t0 + t1) ^ tmp;
361 static void gen_add16(TCGv t0, TCGv t1)
363 TCGv tmp = new_tmp();
364 tcg_gen_xor_i32(tmp, t0, t1);
365 tcg_gen_andi_i32(tmp, tmp, 0x8000);
366 tcg_gen_andi_i32(t0, t0, ~0x8000);
367 tcg_gen_andi_i32(t1, t1, ~0x8000);
368 tcg_gen_add_i32(t0, t0, t1);
369 tcg_gen_xor_i32(t0, t0, tmp);
370 dead_tmp(tmp);
371 dead_tmp(t1);
374 #define gen_set_CF(var) tcg_gen_st_i32(var, cpu_env, offsetof(CPUState, CF))
376 /* Set CF to the top bit of var. */
377 static void gen_set_CF_bit31(TCGv var)
379 TCGv tmp = new_tmp();
380 tcg_gen_shri_i32(tmp, var, 31);
381 gen_set_CF(tmp);
382 dead_tmp(tmp);
385 /* Set N and Z flags from var. */
386 static inline void gen_logic_CC(TCGv var)
388 tcg_gen_st_i32(var, cpu_env, offsetof(CPUState, NF));
389 tcg_gen_st_i32(var, cpu_env, offsetof(CPUState, ZF));
392 /* T0 += T1 + CF. */
393 static void gen_adc(TCGv t0, TCGv t1)
395 TCGv tmp;
396 tcg_gen_add_i32(t0, t0, t1);
397 tmp = load_cpu_field(CF);
398 tcg_gen_add_i32(t0, t0, tmp);
399 dead_tmp(tmp);
402 /* dest = T0 + T1 + CF. */
403 static void gen_add_carry(TCGv dest, TCGv t0, TCGv t1)
405 TCGv tmp;
406 tcg_gen_add_i32(dest, t0, t1);
407 tmp = load_cpu_field(CF);
408 tcg_gen_add_i32(dest, dest, tmp);
409 dead_tmp(tmp);
412 /* dest = T0 - T1 + CF - 1. */
413 static void gen_sub_carry(TCGv dest, TCGv t0, TCGv t1)
415 TCGv tmp;
416 tcg_gen_sub_i32(dest, t0, t1);
417 tmp = load_cpu_field(CF);
418 tcg_gen_add_i32(dest, dest, tmp);
419 tcg_gen_subi_i32(dest, dest, 1);
420 dead_tmp(tmp);
423 /* FIXME: Implement this natively. */
424 #define tcg_gen_abs_i32(t0, t1) gen_helper_abs(t0, t1)
426 static void shifter_out_im(TCGv var, int shift)
428 TCGv tmp = new_tmp();
429 if (shift == 0) {
430 tcg_gen_andi_i32(tmp, var, 1);
431 } else {
432 tcg_gen_shri_i32(tmp, var, shift);
433 if (shift != 31)
434 tcg_gen_andi_i32(tmp, tmp, 1);
436 gen_set_CF(tmp);
437 dead_tmp(tmp);
440 /* Shift by immediate. Includes special handling for shift == 0. */
441 static inline void gen_arm_shift_im(TCGv var, int shiftop, int shift, int flags)
443 switch (shiftop) {
444 case 0: /* LSL */
445 if (shift != 0) {
446 if (flags)
447 shifter_out_im(var, 32 - shift);
448 tcg_gen_shli_i32(var, var, shift);
450 break;
451 case 1: /* LSR */
452 if (shift == 0) {
453 if (flags) {
454 tcg_gen_shri_i32(var, var, 31);
455 gen_set_CF(var);
457 tcg_gen_movi_i32(var, 0);
458 } else {
459 if (flags)
460 shifter_out_im(var, shift - 1);
461 tcg_gen_shri_i32(var, var, shift);
463 break;
464 case 2: /* ASR */
465 if (shift == 0)
466 shift = 32;
467 if (flags)
468 shifter_out_im(var, shift - 1);
469 if (shift == 32)
470 shift = 31;
471 tcg_gen_sari_i32(var, var, shift);
472 break;
473 case 3: /* ROR/RRX */
474 if (shift != 0) {
475 if (flags)
476 shifter_out_im(var, shift - 1);
477 tcg_gen_rotri_i32(var, var, shift); break;
478 } else {
479 TCGv tmp = load_cpu_field(CF);
480 if (flags)
481 shifter_out_im(var, 0);
482 tcg_gen_shri_i32(var, var, 1);
483 tcg_gen_shli_i32(tmp, tmp, 31);
484 tcg_gen_or_i32(var, var, tmp);
485 dead_tmp(tmp);
490 static inline void gen_arm_shift_reg(TCGv var, int shiftop,
491 TCGv shift, int flags)
493 if (flags) {
494 switch (shiftop) {
495 case 0: gen_helper_shl_cc(var, var, shift); break;
496 case 1: gen_helper_shr_cc(var, var, shift); break;
497 case 2: gen_helper_sar_cc(var, var, shift); break;
498 case 3: gen_helper_ror_cc(var, var, shift); break;
500 } else {
501 switch (shiftop) {
502 case 0: gen_helper_shl(var, var, shift); break;
503 case 1: gen_helper_shr(var, var, shift); break;
504 case 2: gen_helper_sar(var, var, shift); break;
505 case 3: tcg_gen_andi_i32(shift, shift, 0x1f);
506 tcg_gen_rotr_i32(var, var, shift); break;
509 dead_tmp(shift);
512 #define PAS_OP(pfx) \
513 switch (op2) { \
514 case 0: gen_pas_helper(glue(pfx,add16)); break; \
515 case 1: gen_pas_helper(glue(pfx,addsubx)); break; \
516 case 2: gen_pas_helper(glue(pfx,subaddx)); break; \
517 case 3: gen_pas_helper(glue(pfx,sub16)); break; \
518 case 4: gen_pas_helper(glue(pfx,add8)); break; \
519 case 7: gen_pas_helper(glue(pfx,sub8)); break; \
521 static void gen_arm_parallel_addsub(int op1, int op2, TCGv a, TCGv b)
523 TCGv_ptr tmp;
525 switch (op1) {
526 #define gen_pas_helper(name) glue(gen_helper_,name)(a, a, b, tmp)
527 case 1:
528 tmp = tcg_temp_new_ptr();
529 tcg_gen_addi_ptr(tmp, cpu_env, offsetof(CPUState, GE));
530 PAS_OP(s)
531 tcg_temp_free_ptr(tmp);
532 break;
533 case 5:
534 tmp = tcg_temp_new_ptr();
535 tcg_gen_addi_ptr(tmp, cpu_env, offsetof(CPUState, GE));
536 PAS_OP(u)
537 tcg_temp_free_ptr(tmp);
538 break;
539 #undef gen_pas_helper
540 #define gen_pas_helper(name) glue(gen_helper_,name)(a, a, b)
541 case 2:
542 PAS_OP(q);
543 break;
544 case 3:
545 PAS_OP(sh);
546 break;
547 case 6:
548 PAS_OP(uq);
549 break;
550 case 7:
551 PAS_OP(uh);
552 break;
553 #undef gen_pas_helper
556 #undef PAS_OP
558 /* For unknown reasons Arm and Thumb-2 use arbitrarily different encodings. */
559 #define PAS_OP(pfx) \
560 switch (op1) { \
561 case 0: gen_pas_helper(glue(pfx,add8)); break; \
562 case 1: gen_pas_helper(glue(pfx,add16)); break; \
563 case 2: gen_pas_helper(glue(pfx,addsubx)); break; \
564 case 4: gen_pas_helper(glue(pfx,sub8)); break; \
565 case 5: gen_pas_helper(glue(pfx,sub16)); break; \
566 case 6: gen_pas_helper(glue(pfx,subaddx)); break; \
568 static void gen_thumb2_parallel_addsub(int op1, int op2, TCGv a, TCGv b)
570 TCGv_ptr tmp;
572 switch (op2) {
573 #define gen_pas_helper(name) glue(gen_helper_,name)(a, a, b, tmp)
574 case 0:
575 tmp = tcg_temp_new_ptr();
576 tcg_gen_addi_ptr(tmp, cpu_env, offsetof(CPUState, GE));
577 PAS_OP(s)
578 tcg_temp_free_ptr(tmp);
579 break;
580 case 4:
581 tmp = tcg_temp_new_ptr();
582 tcg_gen_addi_ptr(tmp, cpu_env, offsetof(CPUState, GE));
583 PAS_OP(u)
584 tcg_temp_free_ptr(tmp);
585 break;
586 #undef gen_pas_helper
587 #define gen_pas_helper(name) glue(gen_helper_,name)(a, a, b)
588 case 1:
589 PAS_OP(q);
590 break;
591 case 2:
592 PAS_OP(sh);
593 break;
594 case 5:
595 PAS_OP(uq);
596 break;
597 case 6:
598 PAS_OP(uh);
599 break;
600 #undef gen_pas_helper
603 #undef PAS_OP
605 static void gen_test_cc(int cc, int label)
607 TCGv tmp;
608 TCGv tmp2;
609 int inv;
611 switch (cc) {
612 case 0: /* eq: Z */
613 tmp = load_cpu_field(ZF);
614 tcg_gen_brcondi_i32(TCG_COND_EQ, tmp, 0, label);
615 break;
616 case 1: /* ne: !Z */
617 tmp = load_cpu_field(ZF);
618 tcg_gen_brcondi_i32(TCG_COND_NE, tmp, 0, label);
619 break;
620 case 2: /* cs: C */
621 tmp = load_cpu_field(CF);
622 tcg_gen_brcondi_i32(TCG_COND_NE, tmp, 0, label);
623 break;
624 case 3: /* cc: !C */
625 tmp = load_cpu_field(CF);
626 tcg_gen_brcondi_i32(TCG_COND_EQ, tmp, 0, label);
627 break;
628 case 4: /* mi: N */
629 tmp = load_cpu_field(NF);
630 tcg_gen_brcondi_i32(TCG_COND_LT, tmp, 0, label);
631 break;
632 case 5: /* pl: !N */
633 tmp = load_cpu_field(NF);
634 tcg_gen_brcondi_i32(TCG_COND_GE, tmp, 0, label);
635 break;
636 case 6: /* vs: V */
637 tmp = load_cpu_field(VF);
638 tcg_gen_brcondi_i32(TCG_COND_LT, tmp, 0, label);
639 break;
640 case 7: /* vc: !V */
641 tmp = load_cpu_field(VF);
642 tcg_gen_brcondi_i32(TCG_COND_GE, tmp, 0, label);
643 break;
644 case 8: /* hi: C && !Z */
645 inv = gen_new_label();
646 tmp = load_cpu_field(CF);
647 tcg_gen_brcondi_i32(TCG_COND_EQ, tmp, 0, inv);
648 dead_tmp(tmp);
649 tmp = load_cpu_field(ZF);
650 tcg_gen_brcondi_i32(TCG_COND_NE, tmp, 0, label);
651 gen_set_label(inv);
652 break;
653 case 9: /* ls: !C || Z */
654 tmp = load_cpu_field(CF);
655 tcg_gen_brcondi_i32(TCG_COND_EQ, tmp, 0, label);
656 dead_tmp(tmp);
657 tmp = load_cpu_field(ZF);
658 tcg_gen_brcondi_i32(TCG_COND_EQ, tmp, 0, label);
659 break;
660 case 10: /* ge: N == V -> N ^ V == 0 */
661 tmp = load_cpu_field(VF);
662 tmp2 = load_cpu_field(NF);
663 tcg_gen_xor_i32(tmp, tmp, tmp2);
664 dead_tmp(tmp2);
665 tcg_gen_brcondi_i32(TCG_COND_GE, tmp, 0, label);
666 break;
667 case 11: /* lt: N != V -> N ^ V != 0 */
668 tmp = load_cpu_field(VF);
669 tmp2 = load_cpu_field(NF);
670 tcg_gen_xor_i32(tmp, tmp, tmp2);
671 dead_tmp(tmp2);
672 tcg_gen_brcondi_i32(TCG_COND_LT, tmp, 0, label);
673 break;
674 case 12: /* gt: !Z && N == V */
675 inv = gen_new_label();
676 tmp = load_cpu_field(ZF);
677 tcg_gen_brcondi_i32(TCG_COND_EQ, tmp, 0, inv);
678 dead_tmp(tmp);
679 tmp = load_cpu_field(VF);
680 tmp2 = load_cpu_field(NF);
681 tcg_gen_xor_i32(tmp, tmp, tmp2);
682 dead_tmp(tmp2);
683 tcg_gen_brcondi_i32(TCG_COND_GE, tmp, 0, label);
684 gen_set_label(inv);
685 break;
686 case 13: /* le: Z || N != V */
687 tmp = load_cpu_field(ZF);
688 tcg_gen_brcondi_i32(TCG_COND_EQ, tmp, 0, label);
689 dead_tmp(tmp);
690 tmp = load_cpu_field(VF);
691 tmp2 = load_cpu_field(NF);
692 tcg_gen_xor_i32(tmp, tmp, tmp2);
693 dead_tmp(tmp2);
694 tcg_gen_brcondi_i32(TCG_COND_LT, tmp, 0, label);
695 break;
696 default:
697 fprintf(stderr, "Bad condition code 0x%x\n", cc);
698 abort();
700 dead_tmp(tmp);
703 static const uint8_t table_logic_cc[16] = {
704 1, /* and */
705 1, /* xor */
706 0, /* sub */
707 0, /* rsb */
708 0, /* add */
709 0, /* adc */
710 0, /* sbc */
711 0, /* rsc */
712 1, /* andl */
713 1, /* xorl */
714 0, /* cmp */
715 0, /* cmn */
716 1, /* orr */
717 1, /* mov */
718 1, /* bic */
719 1, /* mvn */
722 /* Set PC and Thumb state from an immediate address. */
723 static inline void gen_bx_im(DisasContext *s, uint32_t addr)
725 TCGv tmp;
727 s->is_jmp = DISAS_UPDATE;
728 if (s->thumb != (addr & 1)) {
729 tmp = new_tmp();
730 tcg_gen_movi_i32(tmp, addr & 1);
731 tcg_gen_st_i32(tmp, cpu_env, offsetof(CPUState, thumb));
732 dead_tmp(tmp);
734 tcg_gen_movi_i32(cpu_R[15], addr & ~1);
737 /* Set PC and Thumb state from var. var is marked as dead. */
738 static inline void gen_bx(DisasContext *s, TCGv var)
740 s->is_jmp = DISAS_UPDATE;
741 tcg_gen_andi_i32(cpu_R[15], var, ~1);
742 tcg_gen_andi_i32(var, var, 1);
743 store_cpu_field(var, thumb);
746 /* Variant of store_reg which uses branch&exchange logic when storing
747 to r15 in ARM architecture v7 and above. The source must be a temporary
748 and will be marked as dead. */
749 static inline void store_reg_bx(CPUState *env, DisasContext *s,
750 int reg, TCGv var)
752 if (reg == 15 && ENABLE_ARCH_7) {
753 gen_bx(s, var);
754 } else {
755 store_reg(s, reg, var);
759 static inline TCGv gen_ld8s(TCGv addr, int index)
761 TCGv tmp = new_tmp();
762 tcg_gen_qemu_ld8s(tmp, addr, index);
763 return tmp;
765 static inline TCGv gen_ld8u(TCGv addr, int index)
767 TCGv tmp = new_tmp();
768 tcg_gen_qemu_ld8u(tmp, addr, index);
769 return tmp;
771 static inline TCGv gen_ld16s(TCGv addr, int index)
773 TCGv tmp = new_tmp();
774 tcg_gen_qemu_ld16s(tmp, addr, index);
775 return tmp;
777 static inline TCGv gen_ld16u(TCGv addr, int index)
779 TCGv tmp = new_tmp();
780 tcg_gen_qemu_ld16u(tmp, addr, index);
781 return tmp;
783 static inline TCGv gen_ld32(TCGv addr, int index)
785 TCGv tmp = new_tmp();
786 tcg_gen_qemu_ld32u(tmp, addr, index);
787 return tmp;
789 static inline TCGv_i64 gen_ld64(TCGv addr, int index)
791 TCGv_i64 tmp = tcg_temp_new_i64();
792 tcg_gen_qemu_ld64(tmp, addr, index);
793 return tmp;
795 static inline void gen_st8(TCGv val, TCGv addr, int index)
797 tcg_gen_qemu_st8(val, addr, index);
798 dead_tmp(val);
800 static inline void gen_st16(TCGv val, TCGv addr, int index)
802 tcg_gen_qemu_st16(val, addr, index);
803 dead_tmp(val);
805 static inline void gen_st32(TCGv val, TCGv addr, int index)
807 tcg_gen_qemu_st32(val, addr, index);
808 dead_tmp(val);
810 static inline void gen_st64(TCGv_i64 val, TCGv addr, int index)
812 tcg_gen_qemu_st64(val, addr, index);
813 tcg_temp_free_i64(val);
816 static inline void gen_set_pc_im(uint32_t val)
818 tcg_gen_movi_i32(cpu_R[15], val);
821 /* Force a TB lookup after an instruction that changes the CPU state. */
822 static inline void gen_lookup_tb(DisasContext *s)
824 tcg_gen_movi_i32(cpu_R[15], s->pc & ~1);
825 s->is_jmp = DISAS_UPDATE;
828 static inline void gen_add_data_offset(DisasContext *s, unsigned int insn,
829 TCGv var)
831 int val, rm, shift, shiftop;
832 TCGv offset;
834 if (!(insn & (1 << 25))) {
835 /* immediate */
836 val = insn & 0xfff;
837 if (!(insn & (1 << 23)))
838 val = -val;
839 if (val != 0)
840 tcg_gen_addi_i32(var, var, val);
841 } else {
842 /* shift/register */
843 rm = (insn) & 0xf;
844 shift = (insn >> 7) & 0x1f;
845 shiftop = (insn >> 5) & 3;
846 offset = load_reg(s, rm);
847 gen_arm_shift_im(offset, shiftop, shift, 0);
848 if (!(insn & (1 << 23)))
849 tcg_gen_sub_i32(var, var, offset);
850 else
851 tcg_gen_add_i32(var, var, offset);
852 dead_tmp(offset);
856 static inline void gen_add_datah_offset(DisasContext *s, unsigned int insn,
857 int extra, TCGv var)
859 int val, rm;
860 TCGv offset;
862 if (insn & (1 << 22)) {
863 /* immediate */
864 val = (insn & 0xf) | ((insn >> 4) & 0xf0);
865 if (!(insn & (1 << 23)))
866 val = -val;
867 val += extra;
868 if (val != 0)
869 tcg_gen_addi_i32(var, var, val);
870 } else {
871 /* register */
872 if (extra)
873 tcg_gen_addi_i32(var, var, extra);
874 rm = (insn) & 0xf;
875 offset = load_reg(s, rm);
876 if (!(insn & (1 << 23)))
877 tcg_gen_sub_i32(var, var, offset);
878 else
879 tcg_gen_add_i32(var, var, offset);
880 dead_tmp(offset);
884 #define VFP_OP2(name) \
885 static inline void gen_vfp_##name(int dp) \
887 if (dp) \
888 gen_helper_vfp_##name##d(cpu_F0d, cpu_F0d, cpu_F1d, cpu_env); \
889 else \
890 gen_helper_vfp_##name##s(cpu_F0s, cpu_F0s, cpu_F1s, cpu_env); \
893 VFP_OP2(add)
894 VFP_OP2(sub)
895 VFP_OP2(mul)
896 VFP_OP2(div)
898 #undef VFP_OP2
900 static inline void gen_vfp_abs(int dp)
902 if (dp)
903 gen_helper_vfp_absd(cpu_F0d, cpu_F0d);
904 else
905 gen_helper_vfp_abss(cpu_F0s, cpu_F0s);
908 static inline void gen_vfp_neg(int dp)
910 if (dp)
911 gen_helper_vfp_negd(cpu_F0d, cpu_F0d);
912 else
913 gen_helper_vfp_negs(cpu_F0s, cpu_F0s);
916 static inline void gen_vfp_sqrt(int dp)
918 if (dp)
919 gen_helper_vfp_sqrtd(cpu_F0d, cpu_F0d, cpu_env);
920 else
921 gen_helper_vfp_sqrts(cpu_F0s, cpu_F0s, cpu_env);
924 static inline void gen_vfp_cmp(int dp)
926 if (dp)
927 gen_helper_vfp_cmpd(cpu_F0d, cpu_F1d, cpu_env);
928 else
929 gen_helper_vfp_cmps(cpu_F0s, cpu_F1s, cpu_env);
932 static inline void gen_vfp_cmpe(int dp)
934 if (dp)
935 gen_helper_vfp_cmped(cpu_F0d, cpu_F1d, cpu_env);
936 else
937 gen_helper_vfp_cmpes(cpu_F0s, cpu_F1s, cpu_env);
940 static inline void gen_vfp_F1_ld0(int dp)
942 if (dp)
943 tcg_gen_movi_i64(cpu_F1d, 0);
944 else
945 tcg_gen_movi_i32(cpu_F1s, 0);
948 static inline void gen_vfp_uito(int dp)
950 if (dp)
951 gen_helper_vfp_uitod(cpu_F0d, cpu_F0s, cpu_env);
952 else
953 gen_helper_vfp_uitos(cpu_F0s, cpu_F0s, cpu_env);
956 static inline void gen_vfp_sito(int dp)
958 if (dp)
959 gen_helper_vfp_sitod(cpu_F0d, cpu_F0s, cpu_env);
960 else
961 gen_helper_vfp_sitos(cpu_F0s, cpu_F0s, cpu_env);
964 static inline void gen_vfp_toui(int dp)
966 if (dp)
967 gen_helper_vfp_touid(cpu_F0s, cpu_F0d, cpu_env);
968 else
969 gen_helper_vfp_touis(cpu_F0s, cpu_F0s, cpu_env);
972 static inline void gen_vfp_touiz(int dp)
974 if (dp)
975 gen_helper_vfp_touizd(cpu_F0s, cpu_F0d, cpu_env);
976 else
977 gen_helper_vfp_touizs(cpu_F0s, cpu_F0s, cpu_env);
980 static inline void gen_vfp_tosi(int dp)
982 if (dp)
983 gen_helper_vfp_tosid(cpu_F0s, cpu_F0d, cpu_env);
984 else
985 gen_helper_vfp_tosis(cpu_F0s, cpu_F0s, cpu_env);
988 static inline void gen_vfp_tosiz(int dp)
990 if (dp)
991 gen_helper_vfp_tosizd(cpu_F0s, cpu_F0d, cpu_env);
992 else
993 gen_helper_vfp_tosizs(cpu_F0s, cpu_F0s, cpu_env);
996 #define VFP_GEN_FIX(name) \
997 static inline void gen_vfp_##name(int dp, int shift) \
999 TCGv tmp_shift = tcg_const_i32(shift); \
1000 if (dp) \
1001 gen_helper_vfp_##name##d(cpu_F0d, cpu_F0d, tmp_shift, cpu_env);\
1002 else \
1003 gen_helper_vfp_##name##s(cpu_F0s, cpu_F0s, tmp_shift, cpu_env);\
1004 tcg_temp_free_i32(tmp_shift); \
1006 VFP_GEN_FIX(tosh)
1007 VFP_GEN_FIX(tosl)
1008 VFP_GEN_FIX(touh)
1009 VFP_GEN_FIX(toul)
1010 VFP_GEN_FIX(shto)
1011 VFP_GEN_FIX(slto)
1012 VFP_GEN_FIX(uhto)
1013 VFP_GEN_FIX(ulto)
1014 #undef VFP_GEN_FIX
1016 static inline void gen_vfp_ld(DisasContext *s, int dp, TCGv addr)
1018 if (dp)
1019 tcg_gen_qemu_ld64(cpu_F0d, addr, IS_USER(s));
1020 else
1021 tcg_gen_qemu_ld32u(cpu_F0s, addr, IS_USER(s));
1024 static inline void gen_vfp_st(DisasContext *s, int dp, TCGv addr)
1026 if (dp)
1027 tcg_gen_qemu_st64(cpu_F0d, addr, IS_USER(s));
1028 else
1029 tcg_gen_qemu_st32(cpu_F0s, addr, IS_USER(s));
1032 static inline long
1033 vfp_reg_offset (int dp, int reg)
1035 if (dp)
1036 return offsetof(CPUARMState, vfp.regs[reg]);
1037 else if (reg & 1) {
1038 return offsetof(CPUARMState, vfp.regs[reg >> 1])
1039 + offsetof(CPU_DoubleU, l.upper);
1040 } else {
1041 return offsetof(CPUARMState, vfp.regs[reg >> 1])
1042 + offsetof(CPU_DoubleU, l.lower);
1046 /* Return the offset of a 32-bit piece of a NEON register.
1047 zero is the least significant end of the register. */
1048 static inline long
1049 neon_reg_offset (int reg, int n)
1051 int sreg;
1052 sreg = reg * 2 + n;
1053 return vfp_reg_offset(0, sreg);
1056 static TCGv neon_load_reg(int reg, int pass)
1058 TCGv tmp = new_tmp();
1059 tcg_gen_ld_i32(tmp, cpu_env, neon_reg_offset(reg, pass));
1060 return tmp;
1063 static void neon_store_reg(int reg, int pass, TCGv var)
1065 tcg_gen_st_i32(var, cpu_env, neon_reg_offset(reg, pass));
1066 dead_tmp(var);
1069 static inline void neon_load_reg64(TCGv_i64 var, int reg)
1071 tcg_gen_ld_i64(var, cpu_env, vfp_reg_offset(1, reg));
1074 static inline void neon_store_reg64(TCGv_i64 var, int reg)
1076 tcg_gen_st_i64(var, cpu_env, vfp_reg_offset(1, reg));
1079 #define tcg_gen_ld_f32 tcg_gen_ld_i32
1080 #define tcg_gen_ld_f64 tcg_gen_ld_i64
1081 #define tcg_gen_st_f32 tcg_gen_st_i32
1082 #define tcg_gen_st_f64 tcg_gen_st_i64
1084 static inline void gen_mov_F0_vreg(int dp, int reg)
1086 if (dp)
1087 tcg_gen_ld_f64(cpu_F0d, cpu_env, vfp_reg_offset(dp, reg));
1088 else
1089 tcg_gen_ld_f32(cpu_F0s, cpu_env, vfp_reg_offset(dp, reg));
1092 static inline void gen_mov_F1_vreg(int dp, int reg)
1094 if (dp)
1095 tcg_gen_ld_f64(cpu_F1d, cpu_env, vfp_reg_offset(dp, reg));
1096 else
1097 tcg_gen_ld_f32(cpu_F1s, cpu_env, vfp_reg_offset(dp, reg));
1100 static inline void gen_mov_vreg_F0(int dp, int reg)
1102 if (dp)
1103 tcg_gen_st_f64(cpu_F0d, cpu_env, vfp_reg_offset(dp, reg));
1104 else
1105 tcg_gen_st_f32(cpu_F0s, cpu_env, vfp_reg_offset(dp, reg));
1108 #define ARM_CP_RW_BIT (1 << 20)
1110 static inline void iwmmxt_load_reg(TCGv_i64 var, int reg)
1112 tcg_gen_ld_i64(var, cpu_env, offsetof(CPUState, iwmmxt.regs[reg]));
1115 static inline void iwmmxt_store_reg(TCGv_i64 var, int reg)
1117 tcg_gen_st_i64(var, cpu_env, offsetof(CPUState, iwmmxt.regs[reg]));
1120 static inline TCGv iwmmxt_load_creg(int reg)
1122 TCGv var = new_tmp();
1123 tcg_gen_ld_i32(var, cpu_env, offsetof(CPUState, iwmmxt.cregs[reg]));
1124 return var;
1127 static inline void iwmmxt_store_creg(int reg, TCGv var)
1129 tcg_gen_st_i32(var, cpu_env, offsetof(CPUState, iwmmxt.cregs[reg]));
1130 dead_tmp(var);
1133 static inline void gen_op_iwmmxt_movq_wRn_M0(int rn)
1135 iwmmxt_store_reg(cpu_M0, rn);
1138 static inline void gen_op_iwmmxt_movq_M0_wRn(int rn)
1140 iwmmxt_load_reg(cpu_M0, rn);
1143 static inline void gen_op_iwmmxt_orq_M0_wRn(int rn)
1145 iwmmxt_load_reg(cpu_V1, rn);
1146 tcg_gen_or_i64(cpu_M0, cpu_M0, cpu_V1);
1149 static inline void gen_op_iwmmxt_andq_M0_wRn(int rn)
1151 iwmmxt_load_reg(cpu_V1, rn);
1152 tcg_gen_and_i64(cpu_M0, cpu_M0, cpu_V1);
1155 static inline void gen_op_iwmmxt_xorq_M0_wRn(int rn)
1157 iwmmxt_load_reg(cpu_V1, rn);
1158 tcg_gen_xor_i64(cpu_M0, cpu_M0, cpu_V1);
1161 #define IWMMXT_OP(name) \
1162 static inline void gen_op_iwmmxt_##name##_M0_wRn(int rn) \
1164 iwmmxt_load_reg(cpu_V1, rn); \
1165 gen_helper_iwmmxt_##name(cpu_M0, cpu_M0, cpu_V1); \
1168 #define IWMMXT_OP_ENV(name) \
1169 static inline void gen_op_iwmmxt_##name##_M0_wRn(int rn) \
1171 iwmmxt_load_reg(cpu_V1, rn); \
1172 gen_helper_iwmmxt_##name(cpu_M0, cpu_env, cpu_M0, cpu_V1); \
1175 #define IWMMXT_OP_ENV_SIZE(name) \
1176 IWMMXT_OP_ENV(name##b) \
1177 IWMMXT_OP_ENV(name##w) \
1178 IWMMXT_OP_ENV(name##l)
1180 #define IWMMXT_OP_ENV1(name) \
1181 static inline void gen_op_iwmmxt_##name##_M0(void) \
1183 gen_helper_iwmmxt_##name(cpu_M0, cpu_env, cpu_M0); \
1186 IWMMXT_OP(maddsq)
1187 IWMMXT_OP(madduq)
1188 IWMMXT_OP(sadb)
1189 IWMMXT_OP(sadw)
1190 IWMMXT_OP(mulslw)
1191 IWMMXT_OP(mulshw)
1192 IWMMXT_OP(mululw)
1193 IWMMXT_OP(muluhw)
1194 IWMMXT_OP(macsw)
1195 IWMMXT_OP(macuw)
1197 IWMMXT_OP_ENV_SIZE(unpackl)
1198 IWMMXT_OP_ENV_SIZE(unpackh)
1200 IWMMXT_OP_ENV1(unpacklub)
1201 IWMMXT_OP_ENV1(unpackluw)
1202 IWMMXT_OP_ENV1(unpacklul)
1203 IWMMXT_OP_ENV1(unpackhub)
1204 IWMMXT_OP_ENV1(unpackhuw)
1205 IWMMXT_OP_ENV1(unpackhul)
1206 IWMMXT_OP_ENV1(unpacklsb)
1207 IWMMXT_OP_ENV1(unpacklsw)
1208 IWMMXT_OP_ENV1(unpacklsl)
1209 IWMMXT_OP_ENV1(unpackhsb)
1210 IWMMXT_OP_ENV1(unpackhsw)
1211 IWMMXT_OP_ENV1(unpackhsl)
1213 IWMMXT_OP_ENV_SIZE(cmpeq)
1214 IWMMXT_OP_ENV_SIZE(cmpgtu)
1215 IWMMXT_OP_ENV_SIZE(cmpgts)
1217 IWMMXT_OP_ENV_SIZE(mins)
1218 IWMMXT_OP_ENV_SIZE(minu)
1219 IWMMXT_OP_ENV_SIZE(maxs)
1220 IWMMXT_OP_ENV_SIZE(maxu)
1222 IWMMXT_OP_ENV_SIZE(subn)
1223 IWMMXT_OP_ENV_SIZE(addn)
1224 IWMMXT_OP_ENV_SIZE(subu)
1225 IWMMXT_OP_ENV_SIZE(addu)
1226 IWMMXT_OP_ENV_SIZE(subs)
1227 IWMMXT_OP_ENV_SIZE(adds)
1229 IWMMXT_OP_ENV(avgb0)
1230 IWMMXT_OP_ENV(avgb1)
1231 IWMMXT_OP_ENV(avgw0)
1232 IWMMXT_OP_ENV(avgw1)
1234 IWMMXT_OP(msadb)
1236 IWMMXT_OP_ENV(packuw)
1237 IWMMXT_OP_ENV(packul)
1238 IWMMXT_OP_ENV(packuq)
1239 IWMMXT_OP_ENV(packsw)
1240 IWMMXT_OP_ENV(packsl)
1241 IWMMXT_OP_ENV(packsq)
1243 static void gen_op_iwmmxt_set_mup(void)
1245 TCGv tmp;
1246 tmp = load_cpu_field(iwmmxt.cregs[ARM_IWMMXT_wCon]);
1247 tcg_gen_ori_i32(tmp, tmp, 2);
1248 store_cpu_field(tmp, iwmmxt.cregs[ARM_IWMMXT_wCon]);
1251 static void gen_op_iwmmxt_set_cup(void)
1253 TCGv tmp;
1254 tmp = load_cpu_field(iwmmxt.cregs[ARM_IWMMXT_wCon]);
1255 tcg_gen_ori_i32(tmp, tmp, 1);
1256 store_cpu_field(tmp, iwmmxt.cregs[ARM_IWMMXT_wCon]);
1259 static void gen_op_iwmmxt_setpsr_nz(void)
1261 TCGv tmp = new_tmp();
1262 gen_helper_iwmmxt_setpsr_nz(tmp, cpu_M0);
1263 store_cpu_field(tmp, iwmmxt.cregs[ARM_IWMMXT_wCASF]);
1266 static inline void gen_op_iwmmxt_addl_M0_wRn(int rn)
1268 iwmmxt_load_reg(cpu_V1, rn);
1269 tcg_gen_ext32u_i64(cpu_V1, cpu_V1);
1270 tcg_gen_add_i64(cpu_M0, cpu_M0, cpu_V1);
1273 static inline int gen_iwmmxt_address(DisasContext *s, uint32_t insn, TCGv dest)
1275 int rd;
1276 uint32_t offset;
1277 TCGv tmp;
1279 rd = (insn >> 16) & 0xf;
1280 tmp = load_reg(s, rd);
1282 offset = (insn & 0xff) << ((insn >> 7) & 2);
1283 if (insn & (1 << 24)) {
1284 /* Pre indexed */
1285 if (insn & (1 << 23))
1286 tcg_gen_addi_i32(tmp, tmp, offset);
1287 else
1288 tcg_gen_addi_i32(tmp, tmp, -offset);
1289 tcg_gen_mov_i32(dest, tmp);
1290 if (insn & (1 << 21))
1291 store_reg(s, rd, tmp);
1292 else
1293 dead_tmp(tmp);
1294 } else if (insn & (1 << 21)) {
1295 /* Post indexed */
1296 tcg_gen_mov_i32(dest, tmp);
1297 if (insn & (1 << 23))
1298 tcg_gen_addi_i32(tmp, tmp, offset);
1299 else
1300 tcg_gen_addi_i32(tmp, tmp, -offset);
1301 store_reg(s, rd, tmp);
1302 } else if (!(insn & (1 << 23)))
1303 return 1;
1304 return 0;
1307 static inline int gen_iwmmxt_shift(uint32_t insn, uint32_t mask, TCGv dest)
1309 int rd = (insn >> 0) & 0xf;
1310 TCGv tmp;
1312 if (insn & (1 << 8)) {
1313 if (rd < ARM_IWMMXT_wCGR0 || rd > ARM_IWMMXT_wCGR3) {
1314 return 1;
1315 } else {
1316 tmp = iwmmxt_load_creg(rd);
1318 } else {
1319 tmp = new_tmp();
1320 iwmmxt_load_reg(cpu_V0, rd);
1321 tcg_gen_trunc_i64_i32(tmp, cpu_V0);
1323 tcg_gen_andi_i32(tmp, tmp, mask);
1324 tcg_gen_mov_i32(dest, tmp);
1325 dead_tmp(tmp);
1326 return 0;
1329 /* Disassemble an iwMMXt instruction. Returns nonzero if an error occured
1330 (ie. an undefined instruction). */
1331 static int disas_iwmmxt_insn(CPUState *env, DisasContext *s, uint32_t insn)
1333 int rd, wrd;
1334 int rdhi, rdlo, rd0, rd1, i;
1335 TCGv addr;
1336 TCGv tmp, tmp2, tmp3;
1338 if ((insn & 0x0e000e00) == 0x0c000000) {
1339 if ((insn & 0x0fe00ff0) == 0x0c400000) {
1340 wrd = insn & 0xf;
1341 rdlo = (insn >> 12) & 0xf;
1342 rdhi = (insn >> 16) & 0xf;
1343 if (insn & ARM_CP_RW_BIT) { /* TMRRC */
1344 iwmmxt_load_reg(cpu_V0, wrd);
1345 tcg_gen_trunc_i64_i32(cpu_R[rdlo], cpu_V0);
1346 tcg_gen_shri_i64(cpu_V0, cpu_V0, 32);
1347 tcg_gen_trunc_i64_i32(cpu_R[rdhi], cpu_V0);
1348 } else { /* TMCRR */
1349 tcg_gen_concat_i32_i64(cpu_V0, cpu_R[rdlo], cpu_R[rdhi]);
1350 iwmmxt_store_reg(cpu_V0, wrd);
1351 gen_op_iwmmxt_set_mup();
1353 return 0;
1356 wrd = (insn >> 12) & 0xf;
1357 addr = new_tmp();
1358 if (gen_iwmmxt_address(s, insn, addr)) {
1359 dead_tmp(addr);
1360 return 1;
1362 if (insn & ARM_CP_RW_BIT) {
1363 if ((insn >> 28) == 0xf) { /* WLDRW wCx */
1364 tmp = new_tmp();
1365 tcg_gen_qemu_ld32u(tmp, addr, IS_USER(s));
1366 iwmmxt_store_creg(wrd, tmp);
1367 } else {
1368 i = 1;
1369 if (insn & (1 << 8)) {
1370 if (insn & (1 << 22)) { /* WLDRD */
1371 tcg_gen_qemu_ld64(cpu_M0, addr, IS_USER(s));
1372 i = 0;
1373 } else { /* WLDRW wRd */
1374 tmp = gen_ld32(addr, IS_USER(s));
1376 } else {
1377 if (insn & (1 << 22)) { /* WLDRH */
1378 tmp = gen_ld16u(addr, IS_USER(s));
1379 } else { /* WLDRB */
1380 tmp = gen_ld8u(addr, IS_USER(s));
1383 if (i) {
1384 tcg_gen_extu_i32_i64(cpu_M0, tmp);
1385 dead_tmp(tmp);
1387 gen_op_iwmmxt_movq_wRn_M0(wrd);
1389 } else {
1390 if ((insn >> 28) == 0xf) { /* WSTRW wCx */
1391 tmp = iwmmxt_load_creg(wrd);
1392 gen_st32(tmp, addr, IS_USER(s));
1393 } else {
1394 gen_op_iwmmxt_movq_M0_wRn(wrd);
1395 tmp = new_tmp();
1396 if (insn & (1 << 8)) {
1397 if (insn & (1 << 22)) { /* WSTRD */
1398 dead_tmp(tmp);
1399 tcg_gen_qemu_st64(cpu_M0, addr, IS_USER(s));
1400 } else { /* WSTRW wRd */
1401 tcg_gen_trunc_i64_i32(tmp, cpu_M0);
1402 gen_st32(tmp, addr, IS_USER(s));
1404 } else {
1405 if (insn & (1 << 22)) { /* WSTRH */
1406 tcg_gen_trunc_i64_i32(tmp, cpu_M0);
1407 gen_st16(tmp, addr, IS_USER(s));
1408 } else { /* WSTRB */
1409 tcg_gen_trunc_i64_i32(tmp, cpu_M0);
1410 gen_st8(tmp, addr, IS_USER(s));
1415 dead_tmp(addr);
1416 return 0;
1419 if ((insn & 0x0f000000) != 0x0e000000)
1420 return 1;
1422 switch (((insn >> 12) & 0xf00) | ((insn >> 4) & 0xff)) {
1423 case 0x000: /* WOR */
1424 wrd = (insn >> 12) & 0xf;
1425 rd0 = (insn >> 0) & 0xf;
1426 rd1 = (insn >> 16) & 0xf;
1427 gen_op_iwmmxt_movq_M0_wRn(rd0);
1428 gen_op_iwmmxt_orq_M0_wRn(rd1);
1429 gen_op_iwmmxt_setpsr_nz();
1430 gen_op_iwmmxt_movq_wRn_M0(wrd);
1431 gen_op_iwmmxt_set_mup();
1432 gen_op_iwmmxt_set_cup();
1433 break;
1434 case 0x011: /* TMCR */
1435 if (insn & 0xf)
1436 return 1;
1437 rd = (insn >> 12) & 0xf;
1438 wrd = (insn >> 16) & 0xf;
1439 switch (wrd) {
1440 case ARM_IWMMXT_wCID:
1441 case ARM_IWMMXT_wCASF:
1442 break;
1443 case ARM_IWMMXT_wCon:
1444 gen_op_iwmmxt_set_cup();
1445 /* Fall through. */
1446 case ARM_IWMMXT_wCSSF:
1447 tmp = iwmmxt_load_creg(wrd);
1448 tmp2 = load_reg(s, rd);
1449 tcg_gen_andc_i32(tmp, tmp, tmp2);
1450 dead_tmp(tmp2);
1451 iwmmxt_store_creg(wrd, tmp);
1452 break;
1453 case ARM_IWMMXT_wCGR0:
1454 case ARM_IWMMXT_wCGR1:
1455 case ARM_IWMMXT_wCGR2:
1456 case ARM_IWMMXT_wCGR3:
1457 gen_op_iwmmxt_set_cup();
1458 tmp = load_reg(s, rd);
1459 iwmmxt_store_creg(wrd, tmp);
1460 break;
1461 default:
1462 return 1;
1464 break;
1465 case 0x100: /* WXOR */
1466 wrd = (insn >> 12) & 0xf;
1467 rd0 = (insn >> 0) & 0xf;
1468 rd1 = (insn >> 16) & 0xf;
1469 gen_op_iwmmxt_movq_M0_wRn(rd0);
1470 gen_op_iwmmxt_xorq_M0_wRn(rd1);
1471 gen_op_iwmmxt_setpsr_nz();
1472 gen_op_iwmmxt_movq_wRn_M0(wrd);
1473 gen_op_iwmmxt_set_mup();
1474 gen_op_iwmmxt_set_cup();
1475 break;
1476 case 0x111: /* TMRC */
1477 if (insn & 0xf)
1478 return 1;
1479 rd = (insn >> 12) & 0xf;
1480 wrd = (insn >> 16) & 0xf;
1481 tmp = iwmmxt_load_creg(wrd);
1482 store_reg(s, rd, tmp);
1483 break;
1484 case 0x300: /* WANDN */
1485 wrd = (insn >> 12) & 0xf;
1486 rd0 = (insn >> 0) & 0xf;
1487 rd1 = (insn >> 16) & 0xf;
1488 gen_op_iwmmxt_movq_M0_wRn(rd0);
1489 tcg_gen_neg_i64(cpu_M0, cpu_M0);
1490 gen_op_iwmmxt_andq_M0_wRn(rd1);
1491 gen_op_iwmmxt_setpsr_nz();
1492 gen_op_iwmmxt_movq_wRn_M0(wrd);
1493 gen_op_iwmmxt_set_mup();
1494 gen_op_iwmmxt_set_cup();
1495 break;
1496 case 0x200: /* WAND */
1497 wrd = (insn >> 12) & 0xf;
1498 rd0 = (insn >> 0) & 0xf;
1499 rd1 = (insn >> 16) & 0xf;
1500 gen_op_iwmmxt_movq_M0_wRn(rd0);
1501 gen_op_iwmmxt_andq_M0_wRn(rd1);
1502 gen_op_iwmmxt_setpsr_nz();
1503 gen_op_iwmmxt_movq_wRn_M0(wrd);
1504 gen_op_iwmmxt_set_mup();
1505 gen_op_iwmmxt_set_cup();
1506 break;
1507 case 0x810: case 0xa10: /* WMADD */
1508 wrd = (insn >> 12) & 0xf;
1509 rd0 = (insn >> 0) & 0xf;
1510 rd1 = (insn >> 16) & 0xf;
1511 gen_op_iwmmxt_movq_M0_wRn(rd0);
1512 if (insn & (1 << 21))
1513 gen_op_iwmmxt_maddsq_M0_wRn(rd1);
1514 else
1515 gen_op_iwmmxt_madduq_M0_wRn(rd1);
1516 gen_op_iwmmxt_movq_wRn_M0(wrd);
1517 gen_op_iwmmxt_set_mup();
1518 break;
1519 case 0x10e: case 0x50e: case 0x90e: case 0xd0e: /* WUNPCKIL */
1520 wrd = (insn >> 12) & 0xf;
1521 rd0 = (insn >> 16) & 0xf;
1522 rd1 = (insn >> 0) & 0xf;
1523 gen_op_iwmmxt_movq_M0_wRn(rd0);
1524 switch ((insn >> 22) & 3) {
1525 case 0:
1526 gen_op_iwmmxt_unpacklb_M0_wRn(rd1);
1527 break;
1528 case 1:
1529 gen_op_iwmmxt_unpacklw_M0_wRn(rd1);
1530 break;
1531 case 2:
1532 gen_op_iwmmxt_unpackll_M0_wRn(rd1);
1533 break;
1534 case 3:
1535 return 1;
1537 gen_op_iwmmxt_movq_wRn_M0(wrd);
1538 gen_op_iwmmxt_set_mup();
1539 gen_op_iwmmxt_set_cup();
1540 break;
1541 case 0x10c: case 0x50c: case 0x90c: case 0xd0c: /* WUNPCKIH */
1542 wrd = (insn >> 12) & 0xf;
1543 rd0 = (insn >> 16) & 0xf;
1544 rd1 = (insn >> 0) & 0xf;
1545 gen_op_iwmmxt_movq_M0_wRn(rd0);
1546 switch ((insn >> 22) & 3) {
1547 case 0:
1548 gen_op_iwmmxt_unpackhb_M0_wRn(rd1);
1549 break;
1550 case 1:
1551 gen_op_iwmmxt_unpackhw_M0_wRn(rd1);
1552 break;
1553 case 2:
1554 gen_op_iwmmxt_unpackhl_M0_wRn(rd1);
1555 break;
1556 case 3:
1557 return 1;
1559 gen_op_iwmmxt_movq_wRn_M0(wrd);
1560 gen_op_iwmmxt_set_mup();
1561 gen_op_iwmmxt_set_cup();
1562 break;
1563 case 0x012: case 0x112: case 0x412: case 0x512: /* WSAD */
1564 wrd = (insn >> 12) & 0xf;
1565 rd0 = (insn >> 16) & 0xf;
1566 rd1 = (insn >> 0) & 0xf;
1567 gen_op_iwmmxt_movq_M0_wRn(rd0);
1568 if (insn & (1 << 22))
1569 gen_op_iwmmxt_sadw_M0_wRn(rd1);
1570 else
1571 gen_op_iwmmxt_sadb_M0_wRn(rd1);
1572 if (!(insn & (1 << 20)))
1573 gen_op_iwmmxt_addl_M0_wRn(wrd);
1574 gen_op_iwmmxt_movq_wRn_M0(wrd);
1575 gen_op_iwmmxt_set_mup();
1576 break;
1577 case 0x010: case 0x110: case 0x210: case 0x310: /* WMUL */
1578 wrd = (insn >> 12) & 0xf;
1579 rd0 = (insn >> 16) & 0xf;
1580 rd1 = (insn >> 0) & 0xf;
1581 gen_op_iwmmxt_movq_M0_wRn(rd0);
1582 if (insn & (1 << 21)) {
1583 if (insn & (1 << 20))
1584 gen_op_iwmmxt_mulshw_M0_wRn(rd1);
1585 else
1586 gen_op_iwmmxt_mulslw_M0_wRn(rd1);
1587 } else {
1588 if (insn & (1 << 20))
1589 gen_op_iwmmxt_muluhw_M0_wRn(rd1);
1590 else
1591 gen_op_iwmmxt_mululw_M0_wRn(rd1);
1593 gen_op_iwmmxt_movq_wRn_M0(wrd);
1594 gen_op_iwmmxt_set_mup();
1595 break;
1596 case 0x410: case 0x510: case 0x610: case 0x710: /* WMAC */
1597 wrd = (insn >> 12) & 0xf;
1598 rd0 = (insn >> 16) & 0xf;
1599 rd1 = (insn >> 0) & 0xf;
1600 gen_op_iwmmxt_movq_M0_wRn(rd0);
1601 if (insn & (1 << 21))
1602 gen_op_iwmmxt_macsw_M0_wRn(rd1);
1603 else
1604 gen_op_iwmmxt_macuw_M0_wRn(rd1);
1605 if (!(insn & (1 << 20))) {
1606 iwmmxt_load_reg(cpu_V1, wrd);
1607 tcg_gen_add_i64(cpu_M0, cpu_M0, cpu_V1);
1609 gen_op_iwmmxt_movq_wRn_M0(wrd);
1610 gen_op_iwmmxt_set_mup();
1611 break;
1612 case 0x006: case 0x406: case 0x806: case 0xc06: /* WCMPEQ */
1613 wrd = (insn >> 12) & 0xf;
1614 rd0 = (insn >> 16) & 0xf;
1615 rd1 = (insn >> 0) & 0xf;
1616 gen_op_iwmmxt_movq_M0_wRn(rd0);
1617 switch ((insn >> 22) & 3) {
1618 case 0:
1619 gen_op_iwmmxt_cmpeqb_M0_wRn(rd1);
1620 break;
1621 case 1:
1622 gen_op_iwmmxt_cmpeqw_M0_wRn(rd1);
1623 break;
1624 case 2:
1625 gen_op_iwmmxt_cmpeql_M0_wRn(rd1);
1626 break;
1627 case 3:
1628 return 1;
1630 gen_op_iwmmxt_movq_wRn_M0(wrd);
1631 gen_op_iwmmxt_set_mup();
1632 gen_op_iwmmxt_set_cup();
1633 break;
1634 case 0x800: case 0x900: case 0xc00: case 0xd00: /* WAVG2 */
1635 wrd = (insn >> 12) & 0xf;
1636 rd0 = (insn >> 16) & 0xf;
1637 rd1 = (insn >> 0) & 0xf;
1638 gen_op_iwmmxt_movq_M0_wRn(rd0);
1639 if (insn & (1 << 22)) {
1640 if (insn & (1 << 20))
1641 gen_op_iwmmxt_avgw1_M0_wRn(rd1);
1642 else
1643 gen_op_iwmmxt_avgw0_M0_wRn(rd1);
1644 } else {
1645 if (insn & (1 << 20))
1646 gen_op_iwmmxt_avgb1_M0_wRn(rd1);
1647 else
1648 gen_op_iwmmxt_avgb0_M0_wRn(rd1);
1650 gen_op_iwmmxt_movq_wRn_M0(wrd);
1651 gen_op_iwmmxt_set_mup();
1652 gen_op_iwmmxt_set_cup();
1653 break;
1654 case 0x802: case 0x902: case 0xa02: case 0xb02: /* WALIGNR */
1655 wrd = (insn >> 12) & 0xf;
1656 rd0 = (insn >> 16) & 0xf;
1657 rd1 = (insn >> 0) & 0xf;
1658 gen_op_iwmmxt_movq_M0_wRn(rd0);
1659 tmp = iwmmxt_load_creg(ARM_IWMMXT_wCGR0 + ((insn >> 20) & 3));
1660 tcg_gen_andi_i32(tmp, tmp, 7);
1661 iwmmxt_load_reg(cpu_V1, rd1);
1662 gen_helper_iwmmxt_align(cpu_M0, cpu_M0, cpu_V1, tmp);
1663 dead_tmp(tmp);
1664 gen_op_iwmmxt_movq_wRn_M0(wrd);
1665 gen_op_iwmmxt_set_mup();
1666 break;
1667 case 0x601: case 0x605: case 0x609: case 0x60d: /* TINSR */
1668 if (((insn >> 6) & 3) == 3)
1669 return 1;
1670 rd = (insn >> 12) & 0xf;
1671 wrd = (insn >> 16) & 0xf;
1672 tmp = load_reg(s, rd);
1673 gen_op_iwmmxt_movq_M0_wRn(wrd);
1674 switch ((insn >> 6) & 3) {
1675 case 0:
1676 tmp2 = tcg_const_i32(0xff);
1677 tmp3 = tcg_const_i32((insn & 7) << 3);
1678 break;
1679 case 1:
1680 tmp2 = tcg_const_i32(0xffff);
1681 tmp3 = tcg_const_i32((insn & 3) << 4);
1682 break;
1683 case 2:
1684 tmp2 = tcg_const_i32(0xffffffff);
1685 tmp3 = tcg_const_i32((insn & 1) << 5);
1686 break;
1687 default:
1688 TCGV_UNUSED(tmp2);
1689 TCGV_UNUSED(tmp3);
1691 gen_helper_iwmmxt_insr(cpu_M0, cpu_M0, tmp, tmp2, tmp3);
1692 tcg_temp_free(tmp3);
1693 tcg_temp_free(tmp2);
1694 dead_tmp(tmp);
1695 gen_op_iwmmxt_movq_wRn_M0(wrd);
1696 gen_op_iwmmxt_set_mup();
1697 break;
1698 case 0x107: case 0x507: case 0x907: case 0xd07: /* TEXTRM */
1699 rd = (insn >> 12) & 0xf;
1700 wrd = (insn >> 16) & 0xf;
1701 if (rd == 15 || ((insn >> 22) & 3) == 3)
1702 return 1;
1703 gen_op_iwmmxt_movq_M0_wRn(wrd);
1704 tmp = new_tmp();
1705 switch ((insn >> 22) & 3) {
1706 case 0:
1707 tcg_gen_shri_i64(cpu_M0, cpu_M0, (insn & 7) << 3);
1708 tcg_gen_trunc_i64_i32(tmp, cpu_M0);
1709 if (insn & 8) {
1710 tcg_gen_ext8s_i32(tmp, tmp);
1711 } else {
1712 tcg_gen_andi_i32(tmp, tmp, 0xff);
1714 break;
1715 case 1:
1716 tcg_gen_shri_i64(cpu_M0, cpu_M0, (insn & 3) << 4);
1717 tcg_gen_trunc_i64_i32(tmp, cpu_M0);
1718 if (insn & 8) {
1719 tcg_gen_ext16s_i32(tmp, tmp);
1720 } else {
1721 tcg_gen_andi_i32(tmp, tmp, 0xffff);
1723 break;
1724 case 2:
1725 tcg_gen_shri_i64(cpu_M0, cpu_M0, (insn & 1) << 5);
1726 tcg_gen_trunc_i64_i32(tmp, cpu_M0);
1727 break;
1729 store_reg(s, rd, tmp);
1730 break;
1731 case 0x117: case 0x517: case 0x917: case 0xd17: /* TEXTRC */
1732 if ((insn & 0x000ff008) != 0x0003f000 || ((insn >> 22) & 3) == 3)
1733 return 1;
1734 tmp = iwmmxt_load_creg(ARM_IWMMXT_wCASF);
1735 switch ((insn >> 22) & 3) {
1736 case 0:
1737 tcg_gen_shri_i32(tmp, tmp, ((insn & 7) << 2) + 0);
1738 break;
1739 case 1:
1740 tcg_gen_shri_i32(tmp, tmp, ((insn & 3) << 3) + 4);
1741 break;
1742 case 2:
1743 tcg_gen_shri_i32(tmp, tmp, ((insn & 1) << 4) + 12);
1744 break;
1746 tcg_gen_shli_i32(tmp, tmp, 28);
1747 gen_set_nzcv(tmp);
1748 dead_tmp(tmp);
1749 break;
1750 case 0x401: case 0x405: case 0x409: case 0x40d: /* TBCST */
1751 if (((insn >> 6) & 3) == 3)
1752 return 1;
1753 rd = (insn >> 12) & 0xf;
1754 wrd = (insn >> 16) & 0xf;
1755 tmp = load_reg(s, rd);
1756 switch ((insn >> 6) & 3) {
1757 case 0:
1758 gen_helper_iwmmxt_bcstb(cpu_M0, tmp);
1759 break;
1760 case 1:
1761 gen_helper_iwmmxt_bcstw(cpu_M0, tmp);
1762 break;
1763 case 2:
1764 gen_helper_iwmmxt_bcstl(cpu_M0, tmp);
1765 break;
1767 dead_tmp(tmp);
1768 gen_op_iwmmxt_movq_wRn_M0(wrd);
1769 gen_op_iwmmxt_set_mup();
1770 break;
1771 case 0x113: case 0x513: case 0x913: case 0xd13: /* TANDC */
1772 if ((insn & 0x000ff00f) != 0x0003f000 || ((insn >> 22) & 3) == 3)
1773 return 1;
1774 tmp = iwmmxt_load_creg(ARM_IWMMXT_wCASF);
1775 tmp2 = new_tmp();
1776 tcg_gen_mov_i32(tmp2, tmp);
1777 switch ((insn >> 22) & 3) {
1778 case 0:
1779 for (i = 0; i < 7; i ++) {
1780 tcg_gen_shli_i32(tmp2, tmp2, 4);
1781 tcg_gen_and_i32(tmp, tmp, tmp2);
1783 break;
1784 case 1:
1785 for (i = 0; i < 3; i ++) {
1786 tcg_gen_shli_i32(tmp2, tmp2, 8);
1787 tcg_gen_and_i32(tmp, tmp, tmp2);
1789 break;
1790 case 2:
1791 tcg_gen_shli_i32(tmp2, tmp2, 16);
1792 tcg_gen_and_i32(tmp, tmp, tmp2);
1793 break;
1795 gen_set_nzcv(tmp);
1796 dead_tmp(tmp2);
1797 dead_tmp(tmp);
1798 break;
1799 case 0x01c: case 0x41c: case 0x81c: case 0xc1c: /* WACC */
1800 wrd = (insn >> 12) & 0xf;
1801 rd0 = (insn >> 16) & 0xf;
1802 gen_op_iwmmxt_movq_M0_wRn(rd0);
1803 switch ((insn >> 22) & 3) {
1804 case 0:
1805 gen_helper_iwmmxt_addcb(cpu_M0, cpu_M0);
1806 break;
1807 case 1:
1808 gen_helper_iwmmxt_addcw(cpu_M0, cpu_M0);
1809 break;
1810 case 2:
1811 gen_helper_iwmmxt_addcl(cpu_M0, cpu_M0);
1812 break;
1813 case 3:
1814 return 1;
1816 gen_op_iwmmxt_movq_wRn_M0(wrd);
1817 gen_op_iwmmxt_set_mup();
1818 break;
1819 case 0x115: case 0x515: case 0x915: case 0xd15: /* TORC */
1820 if ((insn & 0x000ff00f) != 0x0003f000 || ((insn >> 22) & 3) == 3)
1821 return 1;
1822 tmp = iwmmxt_load_creg(ARM_IWMMXT_wCASF);
1823 tmp2 = new_tmp();
1824 tcg_gen_mov_i32(tmp2, tmp);
1825 switch ((insn >> 22) & 3) {
1826 case 0:
1827 for (i = 0; i < 7; i ++) {
1828 tcg_gen_shli_i32(tmp2, tmp2, 4);
1829 tcg_gen_or_i32(tmp, tmp, tmp2);
1831 break;
1832 case 1:
1833 for (i = 0; i < 3; i ++) {
1834 tcg_gen_shli_i32(tmp2, tmp2, 8);
1835 tcg_gen_or_i32(tmp, tmp, tmp2);
1837 break;
1838 case 2:
1839 tcg_gen_shli_i32(tmp2, tmp2, 16);
1840 tcg_gen_or_i32(tmp, tmp, tmp2);
1841 break;
1843 gen_set_nzcv(tmp);
1844 dead_tmp(tmp2);
1845 dead_tmp(tmp);
1846 break;
1847 case 0x103: case 0x503: case 0x903: case 0xd03: /* TMOVMSK */
1848 rd = (insn >> 12) & 0xf;
1849 rd0 = (insn >> 16) & 0xf;
1850 if ((insn & 0xf) != 0 || ((insn >> 22) & 3) == 3)
1851 return 1;
1852 gen_op_iwmmxt_movq_M0_wRn(rd0);
1853 tmp = new_tmp();
1854 switch ((insn >> 22) & 3) {
1855 case 0:
1856 gen_helper_iwmmxt_msbb(tmp, cpu_M0);
1857 break;
1858 case 1:
1859 gen_helper_iwmmxt_msbw(tmp, cpu_M0);
1860 break;
1861 case 2:
1862 gen_helper_iwmmxt_msbl(tmp, cpu_M0);
1863 break;
1865 store_reg(s, rd, tmp);
1866 break;
1867 case 0x106: case 0x306: case 0x506: case 0x706: /* WCMPGT */
1868 case 0x906: case 0xb06: case 0xd06: case 0xf06:
1869 wrd = (insn >> 12) & 0xf;
1870 rd0 = (insn >> 16) & 0xf;
1871 rd1 = (insn >> 0) & 0xf;
1872 gen_op_iwmmxt_movq_M0_wRn(rd0);
1873 switch ((insn >> 22) & 3) {
1874 case 0:
1875 if (insn & (1 << 21))
1876 gen_op_iwmmxt_cmpgtsb_M0_wRn(rd1);
1877 else
1878 gen_op_iwmmxt_cmpgtub_M0_wRn(rd1);
1879 break;
1880 case 1:
1881 if (insn & (1 << 21))
1882 gen_op_iwmmxt_cmpgtsw_M0_wRn(rd1);
1883 else
1884 gen_op_iwmmxt_cmpgtuw_M0_wRn(rd1);
1885 break;
1886 case 2:
1887 if (insn & (1 << 21))
1888 gen_op_iwmmxt_cmpgtsl_M0_wRn(rd1);
1889 else
1890 gen_op_iwmmxt_cmpgtul_M0_wRn(rd1);
1891 break;
1892 case 3:
1893 return 1;
1895 gen_op_iwmmxt_movq_wRn_M0(wrd);
1896 gen_op_iwmmxt_set_mup();
1897 gen_op_iwmmxt_set_cup();
1898 break;
1899 case 0x00e: case 0x20e: case 0x40e: case 0x60e: /* WUNPCKEL */
1900 case 0x80e: case 0xa0e: case 0xc0e: case 0xe0e:
1901 wrd = (insn >> 12) & 0xf;
1902 rd0 = (insn >> 16) & 0xf;
1903 gen_op_iwmmxt_movq_M0_wRn(rd0);
1904 switch ((insn >> 22) & 3) {
1905 case 0:
1906 if (insn & (1 << 21))
1907 gen_op_iwmmxt_unpacklsb_M0();
1908 else
1909 gen_op_iwmmxt_unpacklub_M0();
1910 break;
1911 case 1:
1912 if (insn & (1 << 21))
1913 gen_op_iwmmxt_unpacklsw_M0();
1914 else
1915 gen_op_iwmmxt_unpackluw_M0();
1916 break;
1917 case 2:
1918 if (insn & (1 << 21))
1919 gen_op_iwmmxt_unpacklsl_M0();
1920 else
1921 gen_op_iwmmxt_unpacklul_M0();
1922 break;
1923 case 3:
1924 return 1;
1926 gen_op_iwmmxt_movq_wRn_M0(wrd);
1927 gen_op_iwmmxt_set_mup();
1928 gen_op_iwmmxt_set_cup();
1929 break;
1930 case 0x00c: case 0x20c: case 0x40c: case 0x60c: /* WUNPCKEH */
1931 case 0x80c: case 0xa0c: case 0xc0c: case 0xe0c:
1932 wrd = (insn >> 12) & 0xf;
1933 rd0 = (insn >> 16) & 0xf;
1934 gen_op_iwmmxt_movq_M0_wRn(rd0);
1935 switch ((insn >> 22) & 3) {
1936 case 0:
1937 if (insn & (1 << 21))
1938 gen_op_iwmmxt_unpackhsb_M0();
1939 else
1940 gen_op_iwmmxt_unpackhub_M0();
1941 break;
1942 case 1:
1943 if (insn & (1 << 21))
1944 gen_op_iwmmxt_unpackhsw_M0();
1945 else
1946 gen_op_iwmmxt_unpackhuw_M0();
1947 break;
1948 case 2:
1949 if (insn & (1 << 21))
1950 gen_op_iwmmxt_unpackhsl_M0();
1951 else
1952 gen_op_iwmmxt_unpackhul_M0();
1953 break;
1954 case 3:
1955 return 1;
1957 gen_op_iwmmxt_movq_wRn_M0(wrd);
1958 gen_op_iwmmxt_set_mup();
1959 gen_op_iwmmxt_set_cup();
1960 break;
1961 case 0x204: case 0x604: case 0xa04: case 0xe04: /* WSRL */
1962 case 0x214: case 0x614: case 0xa14: case 0xe14:
1963 if (((insn >> 22) & 3) == 0)
1964 return 1;
1965 wrd = (insn >> 12) & 0xf;
1966 rd0 = (insn >> 16) & 0xf;
1967 gen_op_iwmmxt_movq_M0_wRn(rd0);
1968 tmp = new_tmp();
1969 if (gen_iwmmxt_shift(insn, 0xff, tmp)) {
1970 dead_tmp(tmp);
1971 return 1;
1973 switch ((insn >> 22) & 3) {
1974 case 1:
1975 gen_helper_iwmmxt_srlw(cpu_M0, cpu_env, cpu_M0, tmp);
1976 break;
1977 case 2:
1978 gen_helper_iwmmxt_srll(cpu_M0, cpu_env, cpu_M0, tmp);
1979 break;
1980 case 3:
1981 gen_helper_iwmmxt_srlq(cpu_M0, cpu_env, cpu_M0, tmp);
1982 break;
1984 dead_tmp(tmp);
1985 gen_op_iwmmxt_movq_wRn_M0(wrd);
1986 gen_op_iwmmxt_set_mup();
1987 gen_op_iwmmxt_set_cup();
1988 break;
1989 case 0x004: case 0x404: case 0x804: case 0xc04: /* WSRA */
1990 case 0x014: case 0x414: case 0x814: case 0xc14:
1991 if (((insn >> 22) & 3) == 0)
1992 return 1;
1993 wrd = (insn >> 12) & 0xf;
1994 rd0 = (insn >> 16) & 0xf;
1995 gen_op_iwmmxt_movq_M0_wRn(rd0);
1996 tmp = new_tmp();
1997 if (gen_iwmmxt_shift(insn, 0xff, tmp)) {
1998 dead_tmp(tmp);
1999 return 1;
2001 switch ((insn >> 22) & 3) {
2002 case 1:
2003 gen_helper_iwmmxt_sraw(cpu_M0, cpu_env, cpu_M0, tmp);
2004 break;
2005 case 2:
2006 gen_helper_iwmmxt_sral(cpu_M0, cpu_env, cpu_M0, tmp);
2007 break;
2008 case 3:
2009 gen_helper_iwmmxt_sraq(cpu_M0, cpu_env, cpu_M0, tmp);
2010 break;
2012 dead_tmp(tmp);
2013 gen_op_iwmmxt_movq_wRn_M0(wrd);
2014 gen_op_iwmmxt_set_mup();
2015 gen_op_iwmmxt_set_cup();
2016 break;
2017 case 0x104: case 0x504: case 0x904: case 0xd04: /* WSLL */
2018 case 0x114: case 0x514: case 0x914: case 0xd14:
2019 if (((insn >> 22) & 3) == 0)
2020 return 1;
2021 wrd = (insn >> 12) & 0xf;
2022 rd0 = (insn >> 16) & 0xf;
2023 gen_op_iwmmxt_movq_M0_wRn(rd0);
2024 tmp = new_tmp();
2025 if (gen_iwmmxt_shift(insn, 0xff, tmp)) {
2026 dead_tmp(tmp);
2027 return 1;
2029 switch ((insn >> 22) & 3) {
2030 case 1:
2031 gen_helper_iwmmxt_sllw(cpu_M0, cpu_env, cpu_M0, tmp);
2032 break;
2033 case 2:
2034 gen_helper_iwmmxt_slll(cpu_M0, cpu_env, cpu_M0, tmp);
2035 break;
2036 case 3:
2037 gen_helper_iwmmxt_sllq(cpu_M0, cpu_env, cpu_M0, tmp);
2038 break;
2040 dead_tmp(tmp);
2041 gen_op_iwmmxt_movq_wRn_M0(wrd);
2042 gen_op_iwmmxt_set_mup();
2043 gen_op_iwmmxt_set_cup();
2044 break;
2045 case 0x304: case 0x704: case 0xb04: case 0xf04: /* WROR */
2046 case 0x314: case 0x714: case 0xb14: case 0xf14:
2047 if (((insn >> 22) & 3) == 0)
2048 return 1;
2049 wrd = (insn >> 12) & 0xf;
2050 rd0 = (insn >> 16) & 0xf;
2051 gen_op_iwmmxt_movq_M0_wRn(rd0);
2052 tmp = new_tmp();
2053 switch ((insn >> 22) & 3) {
2054 case 1:
2055 if (gen_iwmmxt_shift(insn, 0xf, tmp)) {
2056 dead_tmp(tmp);
2057 return 1;
2059 gen_helper_iwmmxt_rorw(cpu_M0, cpu_env, cpu_M0, tmp);
2060 break;
2061 case 2:
2062 if (gen_iwmmxt_shift(insn, 0x1f, tmp)) {
2063 dead_tmp(tmp);
2064 return 1;
2066 gen_helper_iwmmxt_rorl(cpu_M0, cpu_env, cpu_M0, tmp);
2067 break;
2068 case 3:
2069 if (gen_iwmmxt_shift(insn, 0x3f, tmp)) {
2070 dead_tmp(tmp);
2071 return 1;
2073 gen_helper_iwmmxt_rorq(cpu_M0, cpu_env, cpu_M0, tmp);
2074 break;
2076 dead_tmp(tmp);
2077 gen_op_iwmmxt_movq_wRn_M0(wrd);
2078 gen_op_iwmmxt_set_mup();
2079 gen_op_iwmmxt_set_cup();
2080 break;
2081 case 0x116: case 0x316: case 0x516: case 0x716: /* WMIN */
2082 case 0x916: case 0xb16: case 0xd16: case 0xf16:
2083 wrd = (insn >> 12) & 0xf;
2084 rd0 = (insn >> 16) & 0xf;
2085 rd1 = (insn >> 0) & 0xf;
2086 gen_op_iwmmxt_movq_M0_wRn(rd0);
2087 switch ((insn >> 22) & 3) {
2088 case 0:
2089 if (insn & (1 << 21))
2090 gen_op_iwmmxt_minsb_M0_wRn(rd1);
2091 else
2092 gen_op_iwmmxt_minub_M0_wRn(rd1);
2093 break;
2094 case 1:
2095 if (insn & (1 << 21))
2096 gen_op_iwmmxt_minsw_M0_wRn(rd1);
2097 else
2098 gen_op_iwmmxt_minuw_M0_wRn(rd1);
2099 break;
2100 case 2:
2101 if (insn & (1 << 21))
2102 gen_op_iwmmxt_minsl_M0_wRn(rd1);
2103 else
2104 gen_op_iwmmxt_minul_M0_wRn(rd1);
2105 break;
2106 case 3:
2107 return 1;
2109 gen_op_iwmmxt_movq_wRn_M0(wrd);
2110 gen_op_iwmmxt_set_mup();
2111 break;
2112 case 0x016: case 0x216: case 0x416: case 0x616: /* WMAX */
2113 case 0x816: case 0xa16: case 0xc16: case 0xe16:
2114 wrd = (insn >> 12) & 0xf;
2115 rd0 = (insn >> 16) & 0xf;
2116 rd1 = (insn >> 0) & 0xf;
2117 gen_op_iwmmxt_movq_M0_wRn(rd0);
2118 switch ((insn >> 22) & 3) {
2119 case 0:
2120 if (insn & (1 << 21))
2121 gen_op_iwmmxt_maxsb_M0_wRn(rd1);
2122 else
2123 gen_op_iwmmxt_maxub_M0_wRn(rd1);
2124 break;
2125 case 1:
2126 if (insn & (1 << 21))
2127 gen_op_iwmmxt_maxsw_M0_wRn(rd1);
2128 else
2129 gen_op_iwmmxt_maxuw_M0_wRn(rd1);
2130 break;
2131 case 2:
2132 if (insn & (1 << 21))
2133 gen_op_iwmmxt_maxsl_M0_wRn(rd1);
2134 else
2135 gen_op_iwmmxt_maxul_M0_wRn(rd1);
2136 break;
2137 case 3:
2138 return 1;
2140 gen_op_iwmmxt_movq_wRn_M0(wrd);
2141 gen_op_iwmmxt_set_mup();
2142 break;
2143 case 0x002: case 0x102: case 0x202: case 0x302: /* WALIGNI */
2144 case 0x402: case 0x502: case 0x602: case 0x702:
2145 wrd = (insn >> 12) & 0xf;
2146 rd0 = (insn >> 16) & 0xf;
2147 rd1 = (insn >> 0) & 0xf;
2148 gen_op_iwmmxt_movq_M0_wRn(rd0);
2149 tmp = tcg_const_i32((insn >> 20) & 3);
2150 iwmmxt_load_reg(cpu_V1, rd1);
2151 gen_helper_iwmmxt_align(cpu_M0, cpu_M0, cpu_V1, tmp);
2152 tcg_temp_free(tmp);
2153 gen_op_iwmmxt_movq_wRn_M0(wrd);
2154 gen_op_iwmmxt_set_mup();
2155 break;
2156 case 0x01a: case 0x11a: case 0x21a: case 0x31a: /* WSUB */
2157 case 0x41a: case 0x51a: case 0x61a: case 0x71a:
2158 case 0x81a: case 0x91a: case 0xa1a: case 0xb1a:
2159 case 0xc1a: case 0xd1a: case 0xe1a: case 0xf1a:
2160 wrd = (insn >> 12) & 0xf;
2161 rd0 = (insn >> 16) & 0xf;
2162 rd1 = (insn >> 0) & 0xf;
2163 gen_op_iwmmxt_movq_M0_wRn(rd0);
2164 switch ((insn >> 20) & 0xf) {
2165 case 0x0:
2166 gen_op_iwmmxt_subnb_M0_wRn(rd1);
2167 break;
2168 case 0x1:
2169 gen_op_iwmmxt_subub_M0_wRn(rd1);
2170 break;
2171 case 0x3:
2172 gen_op_iwmmxt_subsb_M0_wRn(rd1);
2173 break;
2174 case 0x4:
2175 gen_op_iwmmxt_subnw_M0_wRn(rd1);
2176 break;
2177 case 0x5:
2178 gen_op_iwmmxt_subuw_M0_wRn(rd1);
2179 break;
2180 case 0x7:
2181 gen_op_iwmmxt_subsw_M0_wRn(rd1);
2182 break;
2183 case 0x8:
2184 gen_op_iwmmxt_subnl_M0_wRn(rd1);
2185 break;
2186 case 0x9:
2187 gen_op_iwmmxt_subul_M0_wRn(rd1);
2188 break;
2189 case 0xb:
2190 gen_op_iwmmxt_subsl_M0_wRn(rd1);
2191 break;
2192 default:
2193 return 1;
2195 gen_op_iwmmxt_movq_wRn_M0(wrd);
2196 gen_op_iwmmxt_set_mup();
2197 gen_op_iwmmxt_set_cup();
2198 break;
2199 case 0x01e: case 0x11e: case 0x21e: case 0x31e: /* WSHUFH */
2200 case 0x41e: case 0x51e: case 0x61e: case 0x71e:
2201 case 0x81e: case 0x91e: case 0xa1e: case 0xb1e:
2202 case 0xc1e: case 0xd1e: case 0xe1e: case 0xf1e:
2203 wrd = (insn >> 12) & 0xf;
2204 rd0 = (insn >> 16) & 0xf;
2205 gen_op_iwmmxt_movq_M0_wRn(rd0);
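/* The 8-bit shuffle control is assembled from insn[23:20] (high nibble) and insn[3:0] (low nibble). */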
2206 tmp = tcg_const_i32(((insn >> 16) & 0xf0) | (insn & 0x0f));
2207 gen_helper_iwmmxt_shufh(cpu_M0, cpu_env, cpu_M0, tmp);
2208 tcg_temp_free(tmp);
2209 gen_op_iwmmxt_movq_wRn_M0(wrd);
2210 gen_op_iwmmxt_set_mup();
2211 gen_op_iwmmxt_set_cup();
2212 break;
2213 case 0x018: case 0x118: case 0x218: case 0x318: /* WADD */
2214 case 0x418: case 0x518: case 0x618: case 0x718:
2215 case 0x818: case 0x918: case 0xa18: case 0xb18:
2216 case 0xc18: case 0xd18: case 0xe18: case 0xf18:
2217 wrd = (insn >> 12) & 0xf;
2218 rd0 = (insn >> 16) & 0xf;
2219 rd1 = (insn >> 0) & 0xf;
2220 gen_op_iwmmxt_movq_M0_wRn(rd0);
2221 switch ((insn >> 20) & 0xf) {
2222 case 0x0:
2223 gen_op_iwmmxt_addnb_M0_wRn(rd1);
2224 break;
2225 case 0x1:
2226 gen_op_iwmmxt_addub_M0_wRn(rd1);
2227 break;
2228 case 0x3:
2229 gen_op_iwmmxt_addsb_M0_wRn(rd1);
2230 break;
2231 case 0x4:
2232 gen_op_iwmmxt_addnw_M0_wRn(rd1);
2233 break;
2234 case 0x5:
2235 gen_op_iwmmxt_adduw_M0_wRn(rd1);
2236 break;
2237 case 0x7:
2238 gen_op_iwmmxt_addsw_M0_wRn(rd1);
2239 break;
2240 case 0x8:
2241 gen_op_iwmmxt_addnl_M0_wRn(rd1);
2242 break;
2243 case 0x9:
2244 gen_op_iwmmxt_addul_M0_wRn(rd1);
2245 break;
2246 case 0xb:
2247 gen_op_iwmmxt_addsl_M0_wRn(rd1);
2248 break;
2249 default:
2250 return 1;
2252 gen_op_iwmmxt_movq_wRn_M0(wrd);
2253 gen_op_iwmmxt_set_mup();
2254 gen_op_iwmmxt_set_cup();
2255 break;
2256 case 0x008: case 0x108: case 0x208: case 0x308: /* WPACK */
2257 case 0x408: case 0x508: case 0x608: case 0x708:
2258 case 0x808: case 0x908: case 0xa08: case 0xb08:
2259 case 0xc08: case 0xd08: case 0xe08: case 0xf08:
2260 if (!(insn & (1 << 20)) || ((insn >> 22) & 3) == 0)
2261 return 1;
2262 wrd = (insn >> 12) & 0xf;
2263 rd0 = (insn >> 16) & 0xf;
2264 rd1 = (insn >> 0) & 0xf;
2265 gen_op_iwmmxt_movq_M0_wRn(rd0);
2266 switch ((insn >> 22) & 3) {
2267 case 1:
2268 if (insn & (1 << 21))
2269 gen_op_iwmmxt_packsw_M0_wRn(rd1);
2270 else
2271 gen_op_iwmmxt_packuw_M0_wRn(rd1);
2272 break;
2273 case 2:
2274 if (insn & (1 << 21))
2275 gen_op_iwmmxt_packsl_M0_wRn(rd1);
2276 else
2277 gen_op_iwmmxt_packul_M0_wRn(rd1);
2278 break;
2279 case 3:
2280 if (insn & (1 << 21))
2281 gen_op_iwmmxt_packsq_M0_wRn(rd1);
2282 else
2283 gen_op_iwmmxt_packuq_M0_wRn(rd1);
2284 break;
2286 gen_op_iwmmxt_movq_wRn_M0(wrd);
2287 gen_op_iwmmxt_set_mup();
2288 gen_op_iwmmxt_set_cup();
2289 break;
2290 case 0x201: case 0x203: case 0x205: case 0x207:
2291 case 0x209: case 0x20b: case 0x20d: case 0x20f:
2292 case 0x211: case 0x213: case 0x215: case 0x217:
2293 case 0x219: case 0x21b: case 0x21d: case 0x21f:
2294 wrd = (insn >> 5) & 0xf;
2295 rd0 = (insn >> 12) & 0xf;
2296 rd1 = (insn >> 0) & 0xf;
2297 if (rd0 == 0xf || rd1 == 0xf)
2298 return 1;
2299 gen_op_iwmmxt_movq_M0_wRn(wrd);
2300 tmp = load_reg(s, rd0);
2301 tmp2 = load_reg(s, rd1);
2302 switch ((insn >> 16) & 0xf) {
2303 case 0x0: /* TMIA */
2304 gen_helper_iwmmxt_muladdsl(cpu_M0, cpu_M0, tmp, tmp2);
2305 break;
2306 case 0x8: /* TMIAPH */
2307 gen_helper_iwmmxt_muladdsw(cpu_M0, cpu_M0, tmp, tmp2);
2308 break;
2309 case 0xc: case 0xd: case 0xe: case 0xf: /* TMIAxy */
2310 if (insn & (1 << 16))
2311 tcg_gen_shri_i32(tmp, tmp, 16);
2312 if (insn & (1 << 17))
2313 tcg_gen_shri_i32(tmp2, tmp2, 16);
2314 gen_helper_iwmmxt_muladdswl(cpu_M0, cpu_M0, tmp, tmp2);
2315 break;
2316 default:
2317 dead_tmp(tmp2);
2318 dead_tmp(tmp);
2319 return 1;
2321 dead_tmp(tmp2);
2322 dead_tmp(tmp);
2323 gen_op_iwmmxt_movq_wRn_M0(wrd);
2324 gen_op_iwmmxt_set_mup();
2325 break;
2326 default:
2327 return 1;
2330 return 0;
2333 /* Disassemble an XScale DSP instruction. Returns nonzero if an error occurred
2334 (i.e. an undefined instruction). */
2335 static int disas_dsp_insn(CPUState *env, DisasContext *s, uint32_t insn)
2337 int acc, rd0, rd1, rdhi, rdlo;
2338 TCGv tmp, tmp2;
2340 if ((insn & 0x0ff00f10) == 0x0e200010) {
2341 /* Multiply with Internal Accumulate Format */
2342 rd0 = (insn >> 12) & 0xf;
2343 rd1 = insn & 0xf;
2344 acc = (insn >> 5) & 7;
2346 if (acc != 0)
2347 return 1;
2349 tmp = load_reg(s, rd0);
2350 tmp2 = load_reg(s, rd1);
2351 switch ((insn >> 16) & 0xf) {
2352 case 0x0: /* MIA */
2353 gen_helper_iwmmxt_muladdsl(cpu_M0, cpu_M0, tmp, tmp2);
2354 break;
2355 case 0x8: /* MIAPH */
2356 gen_helper_iwmmxt_muladdsw(cpu_M0, cpu_M0, tmp, tmp2);
2357 break;
2358 case 0xc: /* MIABB */
2359 case 0xd: /* MIABT */
2360 case 0xe: /* MIATB */
2361 case 0xf: /* MIATT */
2362 if (insn & (1 << 16))
2363 tcg_gen_shri_i32(tmp, tmp, 16);
2364 if (insn & (1 << 17))
2365 tcg_gen_shri_i32(tmp2, tmp2, 16);
2366 gen_helper_iwmmxt_muladdswl(cpu_M0, cpu_M0, tmp, tmp2);
2367 break;
2368 default:
2369 return 1;
2371 dead_tmp(tmp2);
2372 dead_tmp(tmp);
2374 gen_op_iwmmxt_movq_wRn_M0(acc);
2375 return 0;
2378 if ((insn & 0x0fe00ff8) == 0x0c400000) {
2379 /* Internal Accumulator Access Format */
2380 rdhi = (insn >> 16) & 0xf;
2381 rdlo = (insn >> 12) & 0xf;
2382 acc = insn & 7;
2384 if (acc != 0)
2385 return 1;
2387 if (insn & ARM_CP_RW_BIT) { /* MRA */
2388 iwmmxt_load_reg(cpu_V0, acc);
2389 tcg_gen_trunc_i64_i32(cpu_R[rdlo], cpu_V0);
2390 tcg_gen_shri_i64(cpu_V0, cpu_V0, 32);
2391 tcg_gen_trunc_i64_i32(cpu_R[rdhi], cpu_V0);
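/* The XScale accumulator is only 40 bits wide, so keep just bits [39:32] in rdhi. */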
2392 tcg_gen_andi_i32(cpu_R[rdhi], cpu_R[rdhi], (1 << (40 - 32)) - 1);
2393 } else { /* MAR */
2394 tcg_gen_concat_i32_i64(cpu_V0, cpu_R[rdlo], cpu_R[rdhi]);
2395 iwmmxt_store_reg(cpu_V0, acc);
2397 return 0;
2400 return 1;
2403 /* Disassemble system coprocessor instruction. Return nonzero if
2404 the instruction is not defined. */
2405 static int disas_cp_insn(CPUState *env, DisasContext *s, uint32_t insn)
2407 TCGv tmp, tmp2;
2408 uint32_t rd = (insn >> 12) & 0xf;
2409 uint32_t cp = (insn >> 8) & 0xf;
2410 if (IS_USER(s)) {
2411 return 1;
2414 if (insn & ARM_CP_RW_BIT) {
2415 if (!env->cp[cp].cp_read)
2416 return 1;
2417 gen_set_pc_im(s->pc);
2418 tmp = new_tmp();
2419 tmp2 = tcg_const_i32(insn);
2420 gen_helper_get_cp(tmp, cpu_env, tmp2);
2421 tcg_temp_free(tmp2);
2422 store_reg(s, rd, tmp);
2423 } else {
2424 if (!env->cp[cp].cp_write)
2425 return 1;
2426 gen_set_pc_im(s->pc);
2427 tmp = load_reg(s, rd);
2428 tmp2 = tcg_const_i32(insn);
2429 gen_helper_set_cp(cpu_env, tmp2, tmp);
2430 tcg_temp_free(tmp2);
2431 dead_tmp(tmp);
2433 return 0;
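/* Return nonzero if this cp15 access is permitted in user mode: only the user TLS registers and the ISB/DSB/DMB barrier operations are allowed. */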
2436 static int cp15_user_ok(uint32_t insn)
2438 int cpn = (insn >> 16) & 0xf;
2439 int cpm = insn & 0xf;
2440 int op = ((insn >> 5) & 7) | ((insn >> 18) & 0x38);
2442 if (cpn == 13 && cpm == 0) {
2443 /* TLS register. */
2444 if (op == 2 || (op == 3 && (insn & ARM_CP_RW_BIT)))
2445 return 1;
2447 if (cpn == 7) {
2448 /* ISB, DSB, DMB. */
2449 if ((cpm == 5 && op == 4)
2450 || (cpm == 10 && (op == 4 || op == 5)))
2451 return 1;
2453 return 0;
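/* Handle MRC/MCR accesses to the cp15 software thread ID (TLS) registers. Returns nonzero if the access was handled here, zero to fall through to the generic cp15 code. */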
2456 static int cp15_tls_load_store(CPUState *env, DisasContext *s, uint32_t insn, uint32_t rd)
2458 TCGv tmp;
2459 int cpn = (insn >> 16) & 0xf;
2460 int cpm = insn & 0xf;
2461 int op = ((insn >> 5) & 7) | ((insn >> 18) & 0x38);
2463 if (!arm_feature(env, ARM_FEATURE_V6K))
2464 return 0;
2466 if (!(cpn == 13 && cpm == 0))
2467 return 0;
2469 if (insn & ARM_CP_RW_BIT) {
2470 switch (op) {
2471 case 2:
2472 tmp = load_cpu_field(cp15.c13_tls1);
2473 break;
2474 case 3:
2475 tmp = load_cpu_field(cp15.c13_tls2);
2476 break;
2477 case 4:
2478 tmp = load_cpu_field(cp15.c13_tls3);
2479 break;
2480 default:
2481 return 0;
2483 store_reg(s, rd, tmp);
2485 } else {
2486 tmp = load_reg(s, rd);
2487 switch (op) {
2488 case 2:
2489 store_cpu_field(tmp, cp15.c13_tls1);
2490 break;
2491 case 3:
2492 store_cpu_field(tmp, cp15.c13_tls2);
2493 break;
2494 case 4:
2495 store_cpu_field(tmp, cp15.c13_tls3);
2496 break;
2497 default:
2498 dead_tmp(tmp);
2499 return 0;
2502 return 1;
2505 /* Disassemble system coprocessor (cp15) instruction. Return nonzero if
2506 the instruction is not defined. */
2507 static int disas_cp15_insn(CPUState *env, DisasContext *s, uint32_t insn)
2509 uint32_t rd;
2510 TCGv tmp, tmp2;
2512 /* M profile cores use memory mapped registers instead of cp15. */
2513 if (arm_feature(env, ARM_FEATURE_M))
2514 return 1;
2516 if ((insn & (1 << 25)) == 0) {
2517 if (insn & (1 << 20)) {
2518 /* mrrc */
2519 return 1;
2521 /* mcrr. Used for block cache operations, so implement as no-op. */
2522 return 0;
2524 if ((insn & (1 << 4)) == 0) {
2525 /* cdp */
2526 return 1;
2528 if (IS_USER(s) && !cp15_user_ok(insn)) {
2529 return 1;
2531 if ((insn & 0x0fff0fff) == 0x0e070f90
2532 || (insn & 0x0fff0fff) == 0x0e070f58) {
2533 /* Wait for interrupt. */
2534 gen_set_pc_im(s->pc);
2535 s->is_jmp = DISAS_WFI;
2536 return 0;
2538 rd = (insn >> 12) & 0xf;
2540 if (cp15_tls_load_store(env, s, insn, rd))
2541 return 0;
2543 tmp2 = tcg_const_i32(insn);
2544 if (insn & ARM_CP_RW_BIT) {
2545 tmp = new_tmp();
2546 gen_helper_get_cp15(tmp, cpu_env, tmp2);
2547 /* If the destination register is r15 then the condition codes are set. */
2548 if (rd != 15)
2549 store_reg(s, rd, tmp);
2550 else
2551 dead_tmp(tmp);
2552 } else {
2553 tmp = load_reg(s, rd);
2554 gen_helper_set_cp15(cpu_env, tmp2, tmp);
2555 dead_tmp(tmp);
2556 /* Normally we would always end the TB here, but Linux
2557 * arch/arm/mach-pxa/sleep.S expects two instructions following
2558 * an MMU enable to execute from cache. Imitate this behaviour. */
2559 if (!arm_feature(env, ARM_FEATURE_XSCALE) ||
2560 (insn & 0x0fff0fff) != 0x0e010f10)
2561 gen_lookup_tb(s);
2563 tcg_temp_free_i32(tmp2);
2564 return 0;
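/* Extract VFP register numbers from an instruction. A single-precision register is a 4-bit field plus one extra low bit; for double precision the extra bit is the top bit of the register number on VFP3 (32 D registers) and must be zero on earlier VFP versions. VFP_REG_SHR shifts left when given a negative count, which happens for the M field. */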
2567 #define VFP_REG_SHR(x, n) (((n) > 0) ? (x) >> (n) : (x) << -(n))
2568 #define VFP_SREG(insn, bigbit, smallbit) \
2569 ((VFP_REG_SHR(insn, bigbit - 1) & 0x1e) | (((insn) >> (smallbit)) & 1))
2570 #define VFP_DREG(reg, insn, bigbit, smallbit) do { \
2571 if (arm_feature(env, ARM_FEATURE_VFP3)) { \
2572 reg = (((insn) >> (bigbit)) & 0x0f) \
2573 | (((insn) >> ((smallbit) - 4)) & 0x10); \
2574 } else { \
2575 if (insn & (1 << (smallbit))) \
2576 return 1; \
2577 reg = ((insn) >> (bigbit)) & 0x0f; \
2578 }} while (0)
2580 #define VFP_SREG_D(insn) VFP_SREG(insn, 12, 22)
2581 #define VFP_DREG_D(reg, insn) VFP_DREG(reg, insn, 12, 22)
2582 #define VFP_SREG_N(insn) VFP_SREG(insn, 16, 7)
2583 #define VFP_DREG_N(reg, insn) VFP_DREG(reg, insn, 16, 7)
2584 #define VFP_SREG_M(insn) VFP_SREG(insn, 0, 5)
2585 #define VFP_DREG_M(reg, insn) VFP_DREG(reg, insn, 0, 5)
2587 /* Move between integer and VFP cores. */
2588 static TCGv gen_vfp_mrs(void)
2590 TCGv tmp = new_tmp();
2591 tcg_gen_mov_i32(tmp, cpu_F0s);
2592 return tmp;
2595 static void gen_vfp_msr(TCGv tmp)
2597 tcg_gen_mov_i32(cpu_F0s, tmp);
2598 dead_tmp(tmp);
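/* VFP/Neon instructions may only execute when the EN bit (bit 30) of FPEXC is set. */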
2601 static inline int
2602 vfp_enabled(CPUState * env)
2604 return ((env->vfp.xregs[ARM_VFP_FPEXC] & (1 << 30)) != 0);
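/* Duplicate the byte at the given shift position of var across all four byte lanes. */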
2607 static void gen_neon_dup_u8(TCGv var, int shift)
2609 TCGv tmp = new_tmp();
2610 if (shift)
2611 tcg_gen_shri_i32(var, var, shift);
2612 tcg_gen_ext8u_i32(var, var);
2613 tcg_gen_shli_i32(tmp, var, 8);
2614 tcg_gen_or_i32(var, var, tmp);
2615 tcg_gen_shli_i32(tmp, var, 16);
2616 tcg_gen_or_i32(var, var, tmp);
2617 dead_tmp(tmp);
2620 static void gen_neon_dup_low16(TCGv var)
2622 TCGv tmp = new_tmp();
2623 tcg_gen_ext16u_i32(var, var);
2624 tcg_gen_shli_i32(tmp, var, 16);
2625 tcg_gen_or_i32(var, var, tmp);
2626 dead_tmp(tmp);
2629 static void gen_neon_dup_high16(TCGv var)
2631 TCGv tmp = new_tmp();
2632 tcg_gen_andi_i32(var, var, 0xffff0000);
2633 tcg_gen_shri_i32(tmp, var, 16);
2634 tcg_gen_or_i32(var, var, tmp);
2635 dead_tmp(tmp);
2638 /* Disassemble a VFP instruction. Returns nonzero if an error occurred
2639 (i.e. an undefined instruction). */
2640 static int disas_vfp_insn(CPUState * env, DisasContext *s, uint32_t insn)
2642 uint32_t rd, rn, rm, op, i, n, offset, delta_d, delta_m, bank_mask;
2643 int dp, veclen;
2644 TCGv addr;
2645 TCGv tmp;
2646 TCGv tmp2;
2648 if (!arm_feature(env, ARM_FEATURE_VFP))
2649 return 1;
2651 if (!vfp_enabled(env)) {
2652 /* VFP disabled. Only allow fmxr/fmrx to/from some control regs. */
2653 if ((insn & 0x0fe00fff) != 0x0ee00a10)
2654 return 1;
2655 rn = (insn >> 16) & 0xf;
2656 if (rn != ARM_VFP_FPSID && rn != ARM_VFP_FPEXC
2657 && rn != ARM_VFP_MVFR1 && rn != ARM_VFP_MVFR0)
2658 return 1;
2660 dp = ((insn & 0xf00) == 0xb00);
2661 switch ((insn >> 24) & 0xf) {
2662 case 0xe:
2663 if (insn & (1 << 4)) {
2664 /* single register transfer */
2665 rd = (insn >> 12) & 0xf;
2666 if (dp) {
2667 int size;
2668 int pass;
2670 VFP_DREG_N(rn, insn);
2671 if (insn & 0xf)
2672 return 1;
2673 if (insn & 0x00c00060
2674 && !arm_feature(env, ARM_FEATURE_NEON))
2675 return 1;
2677 pass = (insn >> 21) & 1;
2678 if (insn & (1 << 22)) {
2679 size = 0;
2680 offset = ((insn >> 5) & 3) * 8;
2681 } else if (insn & (1 << 5)) {
2682 size = 1;
2683 offset = (insn & (1 << 6)) ? 16 : 0;
2684 } else {
2685 size = 2;
2686 offset = 0;
2688 if (insn & ARM_CP_RW_BIT) {
2689 /* vfp->arm */
2690 tmp = neon_load_reg(rn, pass);
2691 switch (size) {
2692 case 0:
2693 if (offset)
2694 tcg_gen_shri_i32(tmp, tmp, offset);
2695 if (insn & (1 << 23))
2696 gen_uxtb(tmp);
2697 else
2698 gen_sxtb(tmp);
2699 break;
2700 case 1:
2701 if (insn & (1 << 23)) {
2702 if (offset) {
2703 tcg_gen_shri_i32(tmp, tmp, 16);
2704 } else {
2705 gen_uxth(tmp);
2707 } else {
2708 if (offset) {
2709 tcg_gen_sari_i32(tmp, tmp, 16);
2710 } else {
2711 gen_sxth(tmp);
2714 break;
2715 case 2:
2716 break;
2718 store_reg(s, rd, tmp);
2719 } else {
2720 /* arm->vfp */
2721 tmp = load_reg(s, rd);
2722 if (insn & (1 << 23)) {
2723 /* VDUP */
2724 if (size == 0) {
2725 gen_neon_dup_u8(tmp, 0);
2726 } else if (size == 1) {
2727 gen_neon_dup_low16(tmp);
2729 for (n = 0; n <= pass * 2; n++) {
2730 tmp2 = new_tmp();
2731 tcg_gen_mov_i32(tmp2, tmp);
2732 neon_store_reg(rn, n, tmp2);
2734 neon_store_reg(rn, n, tmp);
2735 } else {
2736 /* VMOV */
2737 switch (size) {
2738 case 0:
2739 tmp2 = neon_load_reg(rn, pass);
2740 gen_bfi(tmp, tmp2, tmp, offset, 0xff);
2741 dead_tmp(tmp2);
2742 break;
2743 case 1:
2744 tmp2 = neon_load_reg(rn, pass);
2745 gen_bfi(tmp, tmp2, tmp, offset, 0xffff);
2746 dead_tmp(tmp2);
2747 break;
2748 case 2:
2749 break;
2751 neon_store_reg(rn, pass, tmp);
2754 } else { /* !dp */
2755 if ((insn & 0x6f) != 0x00)
2756 return 1;
2757 rn = VFP_SREG_N(insn);
2758 if (insn & ARM_CP_RW_BIT) {
2759 /* vfp->arm */
2760 if (insn & (1 << 21)) {
2761 /* system register */
2762 rn >>= 1;
2764 switch (rn) {
2765 case ARM_VFP_FPSID:
2766 /* VFP2 allows access to FPSID from userspace.
2767 VFP3 restricts all id registers to privileged
2768 accesses. */
2769 if (IS_USER(s)
2770 && arm_feature(env, ARM_FEATURE_VFP3))
2771 return 1;
2772 tmp = load_cpu_field(vfp.xregs[rn]);
2773 break;
2774 case ARM_VFP_FPEXC:
2775 if (IS_USER(s))
2776 return 1;
2777 tmp = load_cpu_field(vfp.xregs[rn]);
2778 break;
2779 case ARM_VFP_FPINST:
2780 case ARM_VFP_FPINST2:
2781 /* Not present in VFP3. */
2782 if (IS_USER(s)
2783 || arm_feature(env, ARM_FEATURE_VFP3))
2784 return 1;
2785 tmp = load_cpu_field(vfp.xregs[rn]);
2786 break;
2787 case ARM_VFP_FPSCR:
2788 if (rd == 15) {
2789 tmp = load_cpu_field(vfp.xregs[ARM_VFP_FPSCR]);
2790 tcg_gen_andi_i32(tmp, tmp, 0xf0000000);
2791 } else {
2792 tmp = new_tmp();
2793 gen_helper_vfp_get_fpscr(tmp, cpu_env);
2795 break;
2796 case ARM_VFP_MVFR0:
2797 case ARM_VFP_MVFR1:
2798 if (IS_USER(s)
2799 || !arm_feature(env, ARM_FEATURE_VFP3))
2800 return 1;
2801 tmp = load_cpu_field(vfp.xregs[rn]);
2802 break;
2803 default:
2804 return 1;
2806 } else {
2807 gen_mov_F0_vreg(0, rn);
2808 tmp = gen_vfp_mrs();
2810 if (rd == 15) {
2811 /* Set the 4 flag bits in the CPSR. */
2812 gen_set_nzcv(tmp);
2813 dead_tmp(tmp);
2814 } else {
2815 store_reg(s, rd, tmp);
2817 } else {
2818 /* arm->vfp */
2819 tmp = load_reg(s, rd);
2820 if (insn & (1 << 21)) {
2821 rn >>= 1;
2822 /* system register */
2823 switch (rn) {
2824 case ARM_VFP_FPSID:
2825 case ARM_VFP_MVFR0:
2826 case ARM_VFP_MVFR1:
2827 /* Writes are ignored. */
2828 break;
2829 case ARM_VFP_FPSCR:
2830 gen_helper_vfp_set_fpscr(cpu_env, tmp);
2831 dead_tmp(tmp);
2832 gen_lookup_tb(s);
2833 break;
2834 case ARM_VFP_FPEXC:
2835 if (IS_USER(s))
2836 return 1;
2837 /* TODO: VFP subarchitecture support.
2838 * For now, keep the EN bit only */
2839 tcg_gen_andi_i32(tmp, tmp, 1 << 30);
2840 store_cpu_field(tmp, vfp.xregs[rn]);
2841 gen_lookup_tb(s);
2842 break;
2843 case ARM_VFP_FPINST:
2844 case ARM_VFP_FPINST2:
2845 store_cpu_field(tmp, vfp.xregs[rn]);
2846 break;
2847 default:
2848 return 1;
2850 } else {
2851 gen_vfp_msr(tmp);
2852 gen_mov_vreg_F0(0, rn);
2856 } else {
2857 /* data processing */
2858 /* The opcode is in bits 23, 21, 20 and 6. */
2859 op = ((insn >> 20) & 8) | ((insn >> 19) & 6) | ((insn >> 6) & 1);
2860 if (dp) {
2861 if (op == 15) {
2862 /* rn is opcode */
2863 rn = ((insn >> 15) & 0x1e) | ((insn >> 7) & 1);
2864 } else {
2865 /* rn is register number */
2866 VFP_DREG_N(rn, insn);
2869 if (op == 15 && (rn == 15 || ((rn & 0x1c) == 0x18))) {
2870 /* Integer or single precision destination. */
2871 rd = VFP_SREG_D(insn);
2872 } else {
2873 VFP_DREG_D(rd, insn);
2875 if (op == 15 &&
2876 (((rn & 0x1c) == 0x10) || ((rn & 0x14) == 0x14))) {
2877 /* VCVT from int is always from S reg regardless of dp bit.
2878 * VCVT with immediate frac_bits has same format as SREG_M
2880 rm = VFP_SREG_M(insn);
2881 } else {
2882 VFP_DREG_M(rm, insn);
2884 } else {
2885 rn = VFP_SREG_N(insn);
2886 if (op == 15 && rn == 15) {
2887 /* Double precision destination. */
2888 VFP_DREG_D(rd, insn);
2889 } else {
2890 rd = VFP_SREG_D(insn);
2892 /* NB that we implicitly rely on the encoding for the frac_bits
2893 * in VCVT of fixed to float being the same as that of an SREG_M
2895 rm = VFP_SREG_M(insn);
2898 veclen = env->vfp.vec_len;
2899 if (op == 15 && rn > 3)
2900 veclen = 0;
2902 /* Shut up compiler warnings. */
2903 delta_m = 0;
2904 delta_d = 0;
2905 bank_mask = 0;
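/* VFP short-vector operations: a non-zero FPSCR LEN field makes data-processing ops iterate over a bank of registers, stepping by the configured stride. Operands in the first bank are treated as scalars. */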
2907 if (veclen > 0) {
2908 if (dp)
2909 bank_mask = 0xc;
2910 else
2911 bank_mask = 0x18;
2913 /* Figure out what type of vector operation this is. */
2914 if ((rd & bank_mask) == 0) {
2915 /* scalar */
2916 veclen = 0;
2917 } else {
2918 if (dp)
2919 delta_d = (env->vfp.vec_stride >> 1) + 1;
2920 else
2921 delta_d = env->vfp.vec_stride + 1;
2923 if ((rm & bank_mask) == 0) {
2924 /* mixed scalar/vector */
2925 delta_m = 0;
2926 } else {
2927 /* vector */
2928 delta_m = delta_d;
2933 /* Load the initial operands. */
2934 if (op == 15) {
2935 switch (rn) {
2936 case 16:
2937 case 17:
2938 /* Integer source */
2939 gen_mov_F0_vreg(0, rm);
2940 break;
2941 case 8:
2942 case 9:
2943 /* Compare */
2944 gen_mov_F0_vreg(dp, rd);
2945 gen_mov_F1_vreg(dp, rm);
2946 break;
2947 case 10:
2948 case 11:
2949 /* Compare with zero */
2950 gen_mov_F0_vreg(dp, rd);
2951 gen_vfp_F1_ld0(dp);
2952 break;
2953 case 20:
2954 case 21:
2955 case 22:
2956 case 23:
2957 case 28:
2958 case 29:
2959 case 30:
2960 case 31:
2961 /* Source and destination the same. */
2962 gen_mov_F0_vreg(dp, rd);
2963 break;
2964 default:
2965 /* One source operand. */
2966 gen_mov_F0_vreg(dp, rm);
2967 break;
2969 } else {
2970 /* Two source operands. */
2971 gen_mov_F0_vreg(dp, rn);
2972 gen_mov_F1_vreg(dp, rm);
2975 for (;;) {
2976 /* Perform the calculation. */
2977 switch (op) {
2978 case 0: /* mac: fd + (fn * fm) */
2979 gen_vfp_mul(dp);
2980 gen_mov_F1_vreg(dp, rd);
2981 gen_vfp_add(dp);
2982 break;
2983 case 1: /* nmac: fd - (fn * fm) */
2984 gen_vfp_mul(dp);
2985 gen_vfp_neg(dp);
2986 gen_mov_F1_vreg(dp, rd);
2987 gen_vfp_add(dp);
2988 break;
2989 case 2: /* msc: -fd + (fn * fm) */
2990 gen_vfp_mul(dp);
2991 gen_mov_F1_vreg(dp, rd);
2992 gen_vfp_sub(dp);
2993 break;
2994 case 3: /* nmsc: -fd - (fn * fm) */
2995 gen_vfp_mul(dp);
2996 gen_vfp_neg(dp);
2997 gen_mov_F1_vreg(dp, rd);
2998 gen_vfp_sub(dp);
2999 break;
3000 case 4: /* mul: fn * fm */
3001 gen_vfp_mul(dp);
3002 break;
3003 case 5: /* nmul: -(fn * fm) */
3004 gen_vfp_mul(dp);
3005 gen_vfp_neg(dp);
3006 break;
3007 case 6: /* add: fn + fm */
3008 gen_vfp_add(dp);
3009 break;
3010 case 7: /* sub: fn - fm */
3011 gen_vfp_sub(dp);
3012 break;
3013 case 8: /* div: fn / fm */
3014 gen_vfp_div(dp);
3015 break;
3016 case 14: /* fconst */
3017 if (!arm_feature(env, ARM_FEATURE_VFP3))
3018 return 1;
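/* VFPv3 immediate constant: the sign comes from insn[19]; the exponent/fraction bits are assembled from insn[18:16] and insn[3:0] and expanded to a full single- or double-precision value. */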
3020 n = (insn << 12) & 0x80000000;
3021 i = ((insn >> 12) & 0x70) | (insn & 0xf);
3022 if (dp) {
3023 if (i & 0x40)
3024 i |= 0x3f80;
3025 else
3026 i |= 0x4000;
3027 n |= i << 16;
3028 tcg_gen_movi_i64(cpu_F0d, ((uint64_t)n) << 32);
3029 } else {
3030 if (i & 0x40)
3031 i |= 0x780;
3032 else
3033 i |= 0x800;
3034 n |= i << 19;
3035 tcg_gen_movi_i32(cpu_F0s, n);
3037 break;
3038 case 15: /* extension space */
3039 switch (rn) {
3040 case 0: /* cpy */
3041 /* no-op */
3042 break;
3043 case 1: /* abs */
3044 gen_vfp_abs(dp);
3045 break;
3046 case 2: /* neg */
3047 gen_vfp_neg(dp);
3048 break;
3049 case 3: /* sqrt */
3050 gen_vfp_sqrt(dp);
3051 break;
3052 case 4: /* vcvtb.f32.f16 */
3053 if (!arm_feature(env, ARM_FEATURE_VFP_FP16))
3054 return 1;
3055 tmp = gen_vfp_mrs();
3056 tcg_gen_ext16u_i32(tmp, tmp);
3057 gen_helper_vfp_fcvt_f16_to_f32(cpu_F0s, tmp, cpu_env);
3058 dead_tmp(tmp);
3059 break;
3060 case 5: /* vcvtt.f32.f16 */
3061 if (!arm_feature(env, ARM_FEATURE_VFP_FP16))
3062 return 1;
3063 tmp = gen_vfp_mrs();
3064 tcg_gen_shri_i32(tmp, tmp, 16);
3065 gen_helper_vfp_fcvt_f16_to_f32(cpu_F0s, tmp, cpu_env);
3066 dead_tmp(tmp);
3067 break;
3068 case 6: /* vcvtb.f16.f32 */
3069 if (!arm_feature(env, ARM_FEATURE_VFP_FP16))
3070 return 1;
3071 tmp = new_tmp();
3072 gen_helper_vfp_fcvt_f32_to_f16(tmp, cpu_F0s, cpu_env);
3073 gen_mov_F0_vreg(0, rd);
3074 tmp2 = gen_vfp_mrs();
3075 tcg_gen_andi_i32(tmp2, tmp2, 0xffff0000);
3076 tcg_gen_or_i32(tmp, tmp, tmp2);
3077 dead_tmp(tmp2);
3078 gen_vfp_msr(tmp);
3079 break;
3080 case 7: /* vcvtt.f16.f32 */
3081 if (!arm_feature(env, ARM_FEATURE_VFP_FP16))
3082 return 1;
3083 tmp = new_tmp();
3084 gen_helper_vfp_fcvt_f32_to_f16(tmp, cpu_F0s, cpu_env);
3085 tcg_gen_shli_i32(tmp, tmp, 16);
3086 gen_mov_F0_vreg(0, rd);
3087 tmp2 = gen_vfp_mrs();
3088 tcg_gen_ext16u_i32(tmp2, tmp2);
3089 tcg_gen_or_i32(tmp, tmp, tmp2);
3090 dead_tmp(tmp2);
3091 gen_vfp_msr(tmp);
3092 break;
3093 case 8: /* cmp */
3094 gen_vfp_cmp(dp);
3095 break;
3096 case 9: /* cmpe */
3097 gen_vfp_cmpe(dp);
3098 break;
3099 case 10: /* cmpz */
3100 gen_vfp_cmp(dp);
3101 break;
3102 case 11: /* cmpez */
3103 gen_vfp_F1_ld0(dp);
3104 gen_vfp_cmpe(dp);
3105 break;
3106 case 15: /* single<->double conversion */
3107 if (dp)
3108 gen_helper_vfp_fcvtsd(cpu_F0s, cpu_F0d, cpu_env);
3109 else
3110 gen_helper_vfp_fcvtds(cpu_F0d, cpu_F0s, cpu_env);
3111 break;
3112 case 16: /* fuito */
3113 gen_vfp_uito(dp);
3114 break;
3115 case 17: /* fsito */
3116 gen_vfp_sito(dp);
3117 break;
3118 case 20: /* fshto */
3119 if (!arm_feature(env, ARM_FEATURE_VFP3))
3120 return 1;
3121 gen_vfp_shto(dp, 16 - rm);
3122 break;
3123 case 21: /* fslto */
3124 if (!arm_feature(env, ARM_FEATURE_VFP3))
3125 return 1;
3126 gen_vfp_slto(dp, 32 - rm);
3127 break;
3128 case 22: /* fuhto */
3129 if (!arm_feature(env, ARM_FEATURE_VFP3))
3130 return 1;
3131 gen_vfp_uhto(dp, 16 - rm);
3132 break;
3133 case 23: /* fulto */
3134 if (!arm_feature(env, ARM_FEATURE_VFP3))
3135 return 1;
3136 gen_vfp_ulto(dp, 32 - rm);
3137 break;
3138 case 24: /* ftoui */
3139 gen_vfp_toui(dp);
3140 break;
3141 case 25: /* ftouiz */
3142 gen_vfp_touiz(dp);
3143 break;
3144 case 26: /* ftosi */
3145 gen_vfp_tosi(dp);
3146 break;
3147 case 27: /* ftosiz */
3148 gen_vfp_tosiz(dp);
3149 break;
3150 case 28: /* ftosh */
3151 if (!arm_feature(env, ARM_FEATURE_VFP3))
3152 return 1;
3153 gen_vfp_tosh(dp, 16 - rm);
3154 break;
3155 case 29: /* ftosl */
3156 if (!arm_feature(env, ARM_FEATURE_VFP3))
3157 return 1;
3158 gen_vfp_tosl(dp, 32 - rm);
3159 break;
3160 case 30: /* ftouh */
3161 if (!arm_feature(env, ARM_FEATURE_VFP3))
3162 return 1;
3163 gen_vfp_touh(dp, 16 - rm);
3164 break;
3165 case 31: /* ftoul */
3166 if (!arm_feature(env, ARM_FEATURE_VFP3))
3167 return 1;
3168 gen_vfp_toul(dp, 32 - rm);
3169 break;
3170 default: /* undefined */
3171 printf ("rn:%d\n", rn);
3172 return 1;
3174 break;
3175 default: /* undefined */
3176 printf ("op:%d\n", op);
3177 return 1;
3180 /* Write back the result. */
3181 if (op == 15 && (rn >= 8 && rn <= 11))
3182 ; /* Comparison, do nothing. */
3183 else if (op == 15 && dp && ((rn & 0x1c) == 0x18))
3184 /* VCVT double to int: always integer result. */
3185 gen_mov_vreg_F0(0, rd);
3186 else if (op == 15 && rn == 15)
3187 /* conversion */
3188 gen_mov_vreg_F0(!dp, rd);
3189 else
3190 gen_mov_vreg_F0(dp, rd);
3192 /* break out of the loop if we have finished */
3193 if (veclen == 0)
3194 break;
3196 if (op == 15 && delta_m == 0) {
3197 /* single source one-many */
3198 while (veclen--) {
3199 rd = ((rd + delta_d) & (bank_mask - 1))
3200 | (rd & bank_mask);
3201 gen_mov_vreg_F0(dp, rd);
3203 break;
3205 /* Setup the next operands. */
3206 veclen--;
3207 rd = ((rd + delta_d) & (bank_mask - 1))
3208 | (rd & bank_mask);
3210 if (op == 15) {
3211 /* One source operand. */
3212 rm = ((rm + delta_m) & (bank_mask - 1))
3213 | (rm & bank_mask);
3214 gen_mov_F0_vreg(dp, rm);
3215 } else {
3216 /* Two source operands. */
3217 rn = ((rn + delta_d) & (bank_mask - 1))
3218 | (rn & bank_mask);
3219 gen_mov_F0_vreg(dp, rn);
3220 if (delta_m) {
3221 rm = ((rm + delta_m) & (bank_mask - 1))
3222 | (rm & bank_mask);
3223 gen_mov_F1_vreg(dp, rm);
3228 break;
3229 case 0xc:
3230 case 0xd:
3231 if (dp && (insn & 0x03e00000) == 0x00400000) {
3232 /* two-register transfer */
3233 rn = (insn >> 16) & 0xf;
3234 rd = (insn >> 12) & 0xf;
3235 if (dp) {
3236 VFP_DREG_M(rm, insn);
3237 } else {
3238 rm = VFP_SREG_M(insn);
3241 if (insn & ARM_CP_RW_BIT) {
3242 /* vfp->arm */
3243 if (dp) {
3244 gen_mov_F0_vreg(0, rm * 2);
3245 tmp = gen_vfp_mrs();
3246 store_reg(s, rd, tmp);
3247 gen_mov_F0_vreg(0, rm * 2 + 1);
3248 tmp = gen_vfp_mrs();
3249 store_reg(s, rn, tmp);
3250 } else {
3251 gen_mov_F0_vreg(0, rm);
3252 tmp = gen_vfp_mrs();
3253 store_reg(s, rn, tmp);
3254 gen_mov_F0_vreg(0, rm + 1);
3255 tmp = gen_vfp_mrs();
3256 store_reg(s, rd, tmp);
3258 } else {
3259 /* arm->vfp */
3260 if (dp) {
3261 tmp = load_reg(s, rd);
3262 gen_vfp_msr(tmp);
3263 gen_mov_vreg_F0(0, rm * 2);
3264 tmp = load_reg(s, rn);
3265 gen_vfp_msr(tmp);
3266 gen_mov_vreg_F0(0, rm * 2 + 1);
3267 } else {
3268 tmp = load_reg(s, rn);
3269 gen_vfp_msr(tmp);
3270 gen_mov_vreg_F0(0, rm);
3271 tmp = load_reg(s, rd);
3272 gen_vfp_msr(tmp);
3273 gen_mov_vreg_F0(0, rm + 1);
3276 } else {
3277 /* Load/store */
3278 rn = (insn >> 16) & 0xf;
3279 if (dp)
3280 VFP_DREG_D(rd, insn);
3281 else
3282 rd = VFP_SREG_D(insn);
3283 if (s->thumb && rn == 15) {
3284 addr = new_tmp();
3285 tcg_gen_movi_i32(addr, s->pc & ~2);
3286 } else {
3287 addr = load_reg(s, rn);
3289 if ((insn & 0x01200000) == 0x01000000) {
3290 /* Single load/store */
3291 offset = (insn & 0xff) << 2;
3292 if ((insn & (1 << 23)) == 0)
3293 offset = -offset;
3294 tcg_gen_addi_i32(addr, addr, offset);
3295 if (insn & (1 << 20)) {
3296 gen_vfp_ld(s, dp, addr);
3297 gen_mov_vreg_F0(dp, rd);
3298 } else {
3299 gen_mov_F0_vreg(dp, rd);
3300 gen_vfp_st(s, dp, addr);
3302 dead_tmp(addr);
3303 } else {
3304 /* load/store multiple */
3305 if (dp)
3306 n = (insn >> 1) & 0x7f;
3307 else
3308 n = insn & 0xff;
3310 if (insn & (1 << 24)) /* pre-decrement */
3311 tcg_gen_addi_i32(addr, addr, -((insn & 0xff) << 2));
3313 if (dp)
3314 offset = 8;
3315 else
3316 offset = 4;
3317 for (i = 0; i < n; i++) {
3318 if (insn & ARM_CP_RW_BIT) {
3319 /* load */
3320 gen_vfp_ld(s, dp, addr);
3321 gen_mov_vreg_F0(dp, rd + i);
3322 } else {
3323 /* store */
3324 gen_mov_F0_vreg(dp, rd + i);
3325 gen_vfp_st(s, dp, addr);
3327 tcg_gen_addi_i32(addr, addr, offset);
3329 if (insn & (1 << 21)) {
3330 /* writeback */
3331 if (insn & (1 << 24))
3332 offset = -offset * n;
3333 else if (dp && (insn & 1))
3334 offset = 4;
3335 else
3336 offset = 0;
3338 if (offset != 0)
3339 tcg_gen_addi_i32(addr, addr, offset);
3340 store_reg(s, rn, addr);
3341 } else {
3342 dead_tmp(addr);
3346 break;
3347 default:
3348 /* Should never happen. */
3349 return 1;
3351 return 0;
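/* Emit a jump to dest. Direct TB chaining is only used when dest lies on the same guest page as the current TB; otherwise set the PC and exit to the main loop for a lookup. */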
3354 static inline void gen_goto_tb(DisasContext *s, int n, uint32_t dest)
3356 TranslationBlock *tb;
3358 tb = s->tb;
3359 if ((tb->pc & TARGET_PAGE_MASK) == (dest & TARGET_PAGE_MASK)) {
3360 tcg_gen_goto_tb(n);
3361 gen_set_pc_im(dest);
3362 tcg_gen_exit_tb((long)tb + n);
3363 } else {
3364 gen_set_pc_im(dest);
3365 tcg_gen_exit_tb(0);
3369 static inline void gen_jmp (DisasContext *s, uint32_t dest)
3371 if (unlikely(s->singlestep_enabled)) {
3372 /* An indirect jump so that we still trigger the debug exception. */
3373 if (s->thumb)
3374 dest |= 1;
3375 gen_bx_im(s, dest);
3376 } else {
3377 gen_goto_tb(s, 0, dest);
3378 s->is_jmp = DISAS_TB_JUMP;
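/* Signed 16x16->32 multiply of the selected (top or bottom) halfwords of t0 and t1, as used by the SMULxy/SMLAxy family. */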
3382 static inline void gen_mulxy(TCGv t0, TCGv t1, int x, int y)
3384 if (x)
3385 tcg_gen_sari_i32(t0, t0, 16);
3386 else
3387 gen_sxth(t0);
3388 if (y)
3389 tcg_gen_sari_i32(t1, t1, 16);
3390 else
3391 gen_sxth(t1);
3392 tcg_gen_mul_i32(t0, t0, t1);
3395 /* Return the mask of PSR bits set by a MSR instruction. */
3396 static uint32_t msr_mask(CPUState *env, DisasContext *s, int flags, int spsr) {
3397 uint32_t mask;
3399 mask = 0;
3400 if (flags & (1 << 0))
3401 mask |= 0xff;
3402 if (flags & (1 << 1))
3403 mask |= 0xff00;
3404 if (flags & (1 << 2))
3405 mask |= 0xff0000;
3406 if (flags & (1 << 3))
3407 mask |= 0xff000000;
3409 /* Mask out undefined bits. */
3410 mask &= ~CPSR_RESERVED;
3411 if (!arm_feature(env, ARM_FEATURE_V6))
3412 mask &= ~(CPSR_E | CPSR_GE);
3413 if (!arm_feature(env, ARM_FEATURE_THUMB2))
3414 mask &= ~CPSR_IT;
3415 /* Mask out execution state bits. */
3416 if (!spsr)
3417 mask &= ~CPSR_EXEC;
3418 /* Mask out privileged bits. */
3419 if (IS_USER(s))
3420 mask &= CPSR_USER;
3421 return mask;
3424 /* Returns nonzero if access to the PSR is not permitted. Marks t0 as dead. */
3425 static int gen_set_psr(DisasContext *s, uint32_t mask, int spsr, TCGv t0)
3427 TCGv tmp;
3428 if (spsr) {
3429 /* ??? This is also undefined in system mode. */
3430 if (IS_USER(s))
3431 return 1;
3433 tmp = load_cpu_field(spsr);
3434 tcg_gen_andi_i32(tmp, tmp, ~mask);
3435 tcg_gen_andi_i32(t0, t0, mask);
3436 tcg_gen_or_i32(tmp, tmp, t0);
3437 store_cpu_field(tmp, spsr);
3438 } else {
3439 gen_set_cpsr(t0, mask);
3441 dead_tmp(t0);
3442 gen_lookup_tb(s);
3443 return 0;
3446 /* Returns nonzero if access to the PSR is not permitted. */
3447 static int gen_set_psr_im(DisasContext *s, uint32_t mask, int spsr, uint32_t val)
3449 TCGv tmp;
3450 tmp = new_tmp();
3451 tcg_gen_movi_i32(tmp, val);
3452 return gen_set_psr(s, mask, spsr, tmp);
3455 /* Generate an old-style exception return. Marks pc as dead. */
3456 static void gen_exception_return(DisasContext *s, TCGv pc)
3458 TCGv tmp;
3459 store_reg(s, 15, pc);
3460 tmp = load_cpu_field(spsr);
3461 gen_set_cpsr(tmp, 0xffffffff);
3462 dead_tmp(tmp);
3463 s->is_jmp = DISAS_UPDATE;
3466 /* Generate a v6 exception return. Marks both values as dead. */
3467 static void gen_rfe(DisasContext *s, TCGv pc, TCGv cpsr)
3469 gen_set_cpsr(cpsr, 0xffffffff);
3470 dead_tmp(cpsr);
3471 store_reg(s, 15, pc);
3472 s->is_jmp = DISAS_UPDATE;
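/* Sync the Thumb-2 conditional execution (IT block) state back into the CPU state. */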
3475 static inline void
3476 gen_set_condexec (DisasContext *s)
3478 if (s->condexec_mask) {
3479 uint32_t val = (s->condexec_cond << 4) | (s->condexec_mask >> 1);
3480 TCGv tmp = new_tmp();
3481 tcg_gen_movi_i32(tmp, val);
3482 store_cpu_field(tmp, condexec_bits);
3486 static void gen_nop_hint(DisasContext *s, int val)
3488 switch (val) {
3489 case 3: /* wfi */
3490 gen_set_pc_im(s->pc);
3491 s->is_jmp = DISAS_WFI;
3492 break;
3493 case 2: /* wfe */
3494 case 4: /* sev */
3495 /* TODO: Implement SEV and WFE. May help SMP performance. */
3496 default: /* nop */
3497 break;
3501 #define CPU_V001 cpu_V0, cpu_V0, cpu_V1
3503 static inline int gen_neon_add(int size, TCGv t0, TCGv t1)
3505 switch (size) {
3506 case 0: gen_helper_neon_add_u8(t0, t0, t1); break;
3507 case 1: gen_helper_neon_add_u16(t0, t0, t1); break;
3508 case 2: tcg_gen_add_i32(t0, t0, t1); break;
3509 default: return 1;
3511 return 0;
3514 static inline void gen_neon_rsb(int size, TCGv t0, TCGv t1)
3516 switch (size) {
3517 case 0: gen_helper_neon_sub_u8(t0, t1, t0); break;
3518 case 1: gen_helper_neon_sub_u16(t0, t1, t0); break;
3519 case 2: tcg_gen_sub_i32(t0, t1, t0); break;
3520 default: return;
3524 /* 32-bit pairwise ops end up the same as the elementwise versions. */
3525 #define gen_helper_neon_pmax_s32 gen_helper_neon_max_s32
3526 #define gen_helper_neon_pmax_u32 gen_helper_neon_max_u32
3527 #define gen_helper_neon_pmin_s32 gen_helper_neon_min_s32
3528 #define gen_helper_neon_pmin_u32 gen_helper_neon_min_u32
3530 /* FIXME: This is wrong. They set the wrong overflow bit. */
3531 #define gen_helper_neon_qadd_s32(a, e, b, c) gen_helper_add_saturate(a, b, c)
3532 #define gen_helper_neon_qadd_u32(a, e, b, c) gen_helper_add_usaturate(a, b, c)
3533 #define gen_helper_neon_qsub_s32(a, e, b, c) gen_helper_sub_saturate(a, b, c)
3534 #define gen_helper_neon_qsub_u32(a, e, b, c) gen_helper_sub_usaturate(a, b, c)
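/* Invoke the signed/unsigned 8/16/32-bit variant of a Neon helper, selected by the element size and the u (unsigned) flag; the _ENV form also passes cpu_env for helpers that need CPU state (e.g. saturation). */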
3536 #define GEN_NEON_INTEGER_OP_ENV(name) do { \
3537 switch ((size << 1) | u) { \
3538 case 0: \
3539 gen_helper_neon_##name##_s8(tmp, cpu_env, tmp, tmp2); \
3540 break; \
3541 case 1: \
3542 gen_helper_neon_##name##_u8(tmp, cpu_env, tmp, tmp2); \
3543 break; \
3544 case 2: \
3545 gen_helper_neon_##name##_s16(tmp, cpu_env, tmp, tmp2); \
3546 break; \
3547 case 3: \
3548 gen_helper_neon_##name##_u16(tmp, cpu_env, tmp, tmp2); \
3549 break; \
3550 case 4: \
3551 gen_helper_neon_##name##_s32(tmp, cpu_env, tmp, tmp2); \
3552 break; \
3553 case 5: \
3554 gen_helper_neon_##name##_u32(tmp, cpu_env, tmp, tmp2); \
3555 break; \
3556 default: return 1; \
3557 }} while (0)
3559 #define GEN_NEON_INTEGER_OP(name) do { \
3560 switch ((size << 1) | u) { \
3561 case 0: \
3562 gen_helper_neon_##name##_s8(tmp, tmp, tmp2); \
3563 break; \
3564 case 1: \
3565 gen_helper_neon_##name##_u8(tmp, tmp, tmp2); \
3566 break; \
3567 case 2: \
3568 gen_helper_neon_##name##_s16(tmp, tmp, tmp2); \
3569 break; \
3570 case 3: \
3571 gen_helper_neon_##name##_u16(tmp, tmp, tmp2); \
3572 break; \
3573 case 4: \
3574 gen_helper_neon_##name##_s32(tmp, tmp, tmp2); \
3575 break; \
3576 case 5: \
3577 gen_helper_neon_##name##_u32(tmp, tmp, tmp2); \
3578 break; \
3579 default: return 1; \
3580 }} while (0)
3582 static TCGv neon_load_scratch(int scratch)
3584 TCGv tmp = new_tmp();
3585 tcg_gen_ld_i32(tmp, cpu_env, offsetof(CPUARMState, vfp.scratch[scratch]));
3586 return tmp;
3589 static void neon_store_scratch(int scratch, TCGv var)
3591 tcg_gen_st_i32(var, cpu_env, offsetof(CPUARMState, vfp.scratch[scratch]));
3592 dead_tmp(var);
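/* Fetch the scalar operand for a Neon "by scalar" operation as a 32-bit value. */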
3595 static inline TCGv neon_get_scalar(int size, int reg)
3597 TCGv tmp;
3598 if (size == 1) {
3599 tmp = neon_load_reg(reg >> 1, reg & 1);
3600 } else {
3601 tmp = neon_load_reg(reg >> 2, (reg >> 1) & 1);
3602 if (reg & 1) {
3603 gen_neon_dup_low16(tmp);
3604 } else {
3605 gen_neon_dup_high16(tmp);
3608 return tmp;
3611 static void gen_neon_unzip_u8(TCGv t0, TCGv t1)
3613 TCGv rd, rm, tmp;
3615 rd = new_tmp();
3616 rm = new_tmp();
3617 tmp = new_tmp();
3619 tcg_gen_andi_i32(rd, t0, 0xff);
3620 tcg_gen_shri_i32(tmp, t0, 8);
3621 tcg_gen_andi_i32(tmp, tmp, 0xff00);
3622 tcg_gen_or_i32(rd, rd, tmp);
3623 tcg_gen_shli_i32(tmp, t1, 16);
3624 tcg_gen_andi_i32(tmp, tmp, 0xff0000);
3625 tcg_gen_or_i32(rd, rd, tmp);
3626 tcg_gen_shli_i32(tmp, t1, 8);
3627 tcg_gen_andi_i32(tmp, tmp, 0xff000000);
3628 tcg_gen_or_i32(rd, rd, tmp);
3630 tcg_gen_shri_i32(rm, t0, 8);
3631 tcg_gen_andi_i32(rm, rm, 0xff);
3632 tcg_gen_shri_i32(tmp, t0, 16);
3633 tcg_gen_andi_i32(tmp, tmp, 0xff00);
3634 tcg_gen_or_i32(rm, rm, tmp);
3635 tcg_gen_shli_i32(tmp, t1, 8);
3636 tcg_gen_andi_i32(tmp, tmp, 0xff0000);
3637 tcg_gen_or_i32(rm, rm, tmp);
3638 tcg_gen_andi_i32(tmp, t1, 0xff000000);
3639 tcg_gen_or_i32(t1, rm, tmp);
3640 tcg_gen_mov_i32(t0, rd);
3642 dead_tmp(tmp);
3643 dead_tmp(rm);
3644 dead_tmp(rd);
3647 static void gen_neon_zip_u8(TCGv t0, TCGv t1)
3649 TCGv rd, rm, tmp;
3651 rd = new_tmp();
3652 rm = new_tmp();
3653 tmp = new_tmp();
3655 tcg_gen_andi_i32(rd, t0, 0xff);
3656 tcg_gen_shli_i32(tmp, t1, 8);
3657 tcg_gen_andi_i32(tmp, tmp, 0xff00);
3658 tcg_gen_or_i32(rd, rd, tmp);
3659 tcg_gen_shli_i32(tmp, t0, 16);
3660 tcg_gen_andi_i32(tmp, tmp, 0xff0000);
3661 tcg_gen_or_i32(rd, rd, tmp);
3662 tcg_gen_shli_i32(tmp, t1, 24);
3663 tcg_gen_andi_i32(tmp, tmp, 0xff000000);
3664 tcg_gen_or_i32(rd, rd, tmp);
3666 tcg_gen_andi_i32(rm, t1, 0xff000000);
3667 tcg_gen_shri_i32(tmp, t0, 8);
3668 tcg_gen_andi_i32(tmp, tmp, 0xff0000);
3669 tcg_gen_or_i32(rm, rm, tmp);
3670 tcg_gen_shri_i32(tmp, t1, 8);
3671 tcg_gen_andi_i32(tmp, tmp, 0xff00);
3672 tcg_gen_or_i32(rm, rm, tmp);
3673 tcg_gen_shri_i32(tmp, t0, 16);
3674 tcg_gen_andi_i32(tmp, tmp, 0xff);
3675 tcg_gen_or_i32(t1, rm, tmp);
3676 tcg_gen_mov_i32(t0, rd);
3678 dead_tmp(tmp);
3679 dead_tmp(rm);
3680 dead_tmp(rd);
3683 static void gen_neon_zip_u16(TCGv t0, TCGv t1)
3685 TCGv tmp, tmp2;
3687 tmp = new_tmp();
3688 tmp2 = new_tmp();
3690 tcg_gen_andi_i32(tmp, t0, 0xffff);
3691 tcg_gen_shli_i32(tmp2, t1, 16);
3692 tcg_gen_or_i32(tmp, tmp, tmp2);
3693 tcg_gen_andi_i32(t1, t1, 0xffff0000);
3694 tcg_gen_shri_i32(tmp2, t0, 16);
3695 tcg_gen_or_i32(t1, t1, tmp2);
3696 tcg_gen_mov_i32(t0, tmp);
3698 dead_tmp(tmp2);
3699 dead_tmp(tmp);
3702 static void gen_neon_unzip(int reg, int q, int tmp, int size)
3704 int n;
3705 TCGv t0, t1;
3707 for (n = 0; n < q + 1; n += 2) {
3708 t0 = neon_load_reg(reg, n);
3709 t1 = neon_load_reg(reg, n + 1);
3710 switch (size) {
3711 case 0: gen_neon_unzip_u8(t0, t1); break;
3712 case 1: gen_neon_zip_u16(t0, t1); break; /* zip and unzip are the same. */
3713 case 2: /* no-op */; break;
3714 default: abort();
3716 neon_store_scratch(tmp + n, t0);
3717 neon_store_scratch(tmp + n + 1, t1);
3721 static void gen_neon_trn_u8(TCGv t0, TCGv t1)
3723 TCGv rd, tmp;
3725 rd = new_tmp();
3726 tmp = new_tmp();
3728 tcg_gen_shli_i32(rd, t0, 8);
3729 tcg_gen_andi_i32(rd, rd, 0xff00ff00);
3730 tcg_gen_andi_i32(tmp, t1, 0x00ff00ff);
3731 tcg_gen_or_i32(rd, rd, tmp);
3733 tcg_gen_shri_i32(t1, t1, 8);
3734 tcg_gen_andi_i32(t1, t1, 0x00ff00ff);
3735 tcg_gen_andi_i32(tmp, t0, 0xff00ff00);
3736 tcg_gen_or_i32(t1, t1, tmp);
3737 tcg_gen_mov_i32(t0, rd);
3739 dead_tmp(tmp);
3740 dead_tmp(rd);
3743 static void gen_neon_trn_u16(TCGv t0, TCGv t1)
3745 TCGv rd, tmp;
3747 rd = new_tmp();
3748 tmp = new_tmp();
3750 tcg_gen_shli_i32(rd, t0, 16);
3751 tcg_gen_andi_i32(tmp, t1, 0xffff);
3752 tcg_gen_or_i32(rd, rd, tmp);
3753 tcg_gen_shri_i32(t1, t1, 16);
3754 tcg_gen_andi_i32(tmp, t0, 0xffff0000);
3755 tcg_gen_or_i32(t1, t1, tmp);
3756 tcg_gen_mov_i32(t0, rd);
3758 dead_tmp(tmp);
3759 dead_tmp(rd);
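/* Parameters of the VLDn/VSTn "multiple structures" forms, indexed by the instruction's op field: number of registers transferred, element interleave factor, and register spacing. */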
3763 static struct {
3764 int nregs;
3765 int interleave;
3766 int spacing;
3767 } neon_ls_element_type[11] = {
3768 {4, 4, 1},
3769 {4, 4, 2},
3770 {4, 1, 1},
3771 {4, 2, 1},
3772 {3, 3, 1},
3773 {3, 3, 2},
3774 {3, 1, 1},
3775 {1, 1, 1},
3776 {2, 2, 1},
3777 {2, 2, 2},
3778 {2, 1, 1}
3781 /* Translate a NEON load/store element instruction. Return nonzero if the
3782 instruction is invalid. */
3783 static int disas_neon_ls_insn(CPUState * env, DisasContext *s, uint32_t insn)
3785 int rd, rn, rm;
3786 int op;
3787 int nregs;
3788 int interleave;
3789 int spacing;
3790 int stride;
3791 int size;
3792 int reg;
3793 int pass;
3794 int load;
3795 int shift;
3796 int n;
3797 TCGv addr;
3798 TCGv tmp;
3799 TCGv tmp2;
3800 TCGv_i64 tmp64;
3802 if (!vfp_enabled(env))
3803 return 1;
3804 VFP_DREG_D(rd, insn);
3805 rn = (insn >> 16) & 0xf;
3806 rm = insn & 0xf;
3807 load = (insn & (1 << 21)) != 0;
3808 addr = new_tmp();
3809 if ((insn & (1 << 23)) == 0) {
3810 /* Load store all elements. */
3811 op = (insn >> 8) & 0xf;
3812 size = (insn >> 6) & 3;
3813 if (op > 10)
3814 return 1;
3815 nregs = neon_ls_element_type[op].nregs;
3816 interleave = neon_ls_element_type[op].interleave;
3817 spacing = neon_ls_element_type[op].spacing;
3818 if (size == 3 && (interleave | spacing) != 1)
3819 return 1;
3820 load_reg_var(s, addr, rn);
3821 stride = (1 << size) * interleave;
3822 for (reg = 0; reg < nregs; reg++) {
3823 if (interleave > 2 || (interleave == 2 && nregs == 2)) {
3824 load_reg_var(s, addr, rn);
3825 tcg_gen_addi_i32(addr, addr, (1 << size) * reg);
3826 } else if (interleave == 2 && nregs == 4 && reg == 2) {
3827 load_reg_var(s, addr, rn);
3828 tcg_gen_addi_i32(addr, addr, 1 << size);
3830 if (size == 3) {
3831 if (load) {
3832 tmp64 = gen_ld64(addr, IS_USER(s));
3833 neon_store_reg64(tmp64, rd);
3834 tcg_temp_free_i64(tmp64);
3835 } else {
3836 tmp64 = tcg_temp_new_i64();
3837 neon_load_reg64(tmp64, rd);
3838 gen_st64(tmp64, addr, IS_USER(s));
3840 tcg_gen_addi_i32(addr, addr, stride);
3841 } else {
3842 for (pass = 0; pass < 2; pass++) {
3843 if (size == 2) {
3844 if (load) {
3845 tmp = gen_ld32(addr, IS_USER(s));
3846 neon_store_reg(rd, pass, tmp);
3847 } else {
3848 tmp = neon_load_reg(rd, pass);
3849 gen_st32(tmp, addr, IS_USER(s));
3851 tcg_gen_addi_i32(addr, addr, stride);
3852 } else if (size == 1) {
3853 if (load) {
3854 tmp = gen_ld16u(addr, IS_USER(s));
3855 tcg_gen_addi_i32(addr, addr, stride);
3856 tmp2 = gen_ld16u(addr, IS_USER(s));
3857 tcg_gen_addi_i32(addr, addr, stride);
3858 tcg_gen_shli_i32(tmp2, tmp2, 16);
3859 tcg_gen_or_i32(tmp, tmp, tmp2);
3860 dead_tmp(tmp2);
3861 neon_store_reg(rd, pass, tmp);
3862 } else {
3863 tmp = neon_load_reg(rd, pass);
3864 tmp2 = new_tmp();
3865 tcg_gen_shri_i32(tmp2, tmp, 16);
3866 gen_st16(tmp, addr, IS_USER(s));
3867 tcg_gen_addi_i32(addr, addr, stride);
3868 gen_st16(tmp2, addr, IS_USER(s));
3869 tcg_gen_addi_i32(addr, addr, stride);
3871 } else /* size == 0 */ {
3872 if (load) {
3873 TCGV_UNUSED(tmp2);
3874 for (n = 0; n < 4; n++) {
3875 tmp = gen_ld8u(addr, IS_USER(s));
3876 tcg_gen_addi_i32(addr, addr, stride);
3877 if (n == 0) {
3878 tmp2 = tmp;
3879 } else {
3880 tcg_gen_shli_i32(tmp, tmp, n * 8);
3881 tcg_gen_or_i32(tmp2, tmp2, tmp);
3882 dead_tmp(tmp);
3885 neon_store_reg(rd, pass, tmp2);
3886 } else {
3887 tmp2 = neon_load_reg(rd, pass);
3888 for (n = 0; n < 4; n++) {
3889 tmp = new_tmp();
3890 if (n == 0) {
3891 tcg_gen_mov_i32(tmp, tmp2);
3892 } else {
3893 tcg_gen_shri_i32(tmp, tmp2, n * 8);
3895 gen_st8(tmp, addr, IS_USER(s));
3896 tcg_gen_addi_i32(addr, addr, stride);
3898 dead_tmp(tmp2);
3903 rd += spacing;
3905 stride = nregs * 8;
3906 } else {
3907 size = (insn >> 10) & 3;
3908 if (size == 3) {
3909 /* Load single element to all lanes. */
3910 if (!load)
3911 return 1;
3912 size = (insn >> 6) & 3;
3913 nregs = ((insn >> 8) & 3) + 1;
3914 stride = (insn & (1 << 5)) ? 2 : 1;
3915 load_reg_var(s, addr, rn);
3916 for (reg = 0; reg < nregs; reg++) {
3917 switch (size) {
3918 case 0:
3919 tmp = gen_ld8u(addr, IS_USER(s));
3920 gen_neon_dup_u8(tmp, 0);
3921 break;
3922 case 1:
3923 tmp = gen_ld16u(addr, IS_USER(s));
3924 gen_neon_dup_low16(tmp);
3925 break;
3926 case 2:
3927 tmp = gen_ld32(addr, IS_USER(s));
3928 break;
3929 case 3:
3930 return 1;
3931 default: /* Avoid compiler warnings. */
3932 abort();
3934 tcg_gen_addi_i32(addr, addr, 1 << size);
3935 tmp2 = new_tmp();
3936 tcg_gen_mov_i32(tmp2, tmp);
3937 neon_store_reg(rd, 0, tmp2);
3938 neon_store_reg(rd, 1, tmp);
3939 rd += stride;
3941 stride = (1 << size) * nregs;
3942 } else {
3943 /* Single element. */
3944 pass = (insn >> 7) & 1;
3945 switch (size) {
3946 case 0:
3947 shift = ((insn >> 5) & 3) * 8;
3948 stride = 1;
3949 break;
3950 case 1:
3951 shift = ((insn >> 6) & 1) * 16;
3952 stride = (insn & (1 << 5)) ? 2 : 1;
3953 break;
3954 case 2:
3955 shift = 0;
3956 stride = (insn & (1 << 6)) ? 2 : 1;
3957 break;
3958 default:
3959 abort();
3961 nregs = ((insn >> 8) & 3) + 1;
3962 load_reg_var(s, addr, rn);
3963 for (reg = 0; reg < nregs; reg++) {
3964 if (load) {
3965 switch (size) {
3966 case 0:
3967 tmp = gen_ld8u(addr, IS_USER(s));
3968 break;
3969 case 1:
3970 tmp = gen_ld16u(addr, IS_USER(s));
3971 break;
3972 case 2:
3973 tmp = gen_ld32(addr, IS_USER(s));
3974 break;
3975 default: /* Avoid compiler warnings. */
3976 abort();
3978 if (size != 2) {
3979 tmp2 = neon_load_reg(rd, pass);
3980 gen_bfi(tmp, tmp2, tmp, shift, size ? 0xffff : 0xff);
3981 dead_tmp(tmp2);
3983 neon_store_reg(rd, pass, tmp);
3984 } else { /* Store */
3985 tmp = neon_load_reg(rd, pass);
3986 if (shift)
3987 tcg_gen_shri_i32(tmp, tmp, shift);
3988 switch (size) {
3989 case 0:
3990 gen_st8(tmp, addr, IS_USER(s));
3991 break;
3992 case 1:
3993 gen_st16(tmp, addr, IS_USER(s));
3994 break;
3995 case 2:
3996 gen_st32(tmp, addr, IS_USER(s));
3997 break;
4000 rd += stride;
4001 tcg_gen_addi_i32(addr, addr, 1 << size);
4003 stride = nregs * (1 << size);
4006 dead_tmp(addr);
4007 if (rm != 15) {
4008 TCGv base;
4010 base = load_reg(s, rn);
4011 if (rm == 13) {
4012 tcg_gen_addi_i32(base, base, stride);
4013 } else {
4014 TCGv index;
4015 index = load_reg(s, rm);
4016 tcg_gen_add_i32(base, base, index);
4017 dead_tmp(index);
4019 store_reg(s, rn, base);
4021 return 0;
4024 /* Bitwise select. dest = c ? t : f. Clobbers T and F. */
4025 static void gen_neon_bsl(TCGv dest, TCGv t, TCGv f, TCGv c)
4027 tcg_gen_and_i32(t, t, c);
4028 tcg_gen_andc_i32(f, f, c);
4029 tcg_gen_or_i32(dest, t, f);
4032 static inline void gen_neon_narrow(int size, TCGv dest, TCGv_i64 src)
4034 switch (size) {
4035 case 0: gen_helper_neon_narrow_u8(dest, src); break;
4036 case 1: gen_helper_neon_narrow_u16(dest, src); break;
4037 case 2: tcg_gen_trunc_i64_i32(dest, src); break;
4038 default: abort();
4042 static inline void gen_neon_narrow_sats(int size, TCGv dest, TCGv_i64 src)
4044 switch (size) {
4045 case 0: gen_helper_neon_narrow_sat_s8(dest, cpu_env, src); break;
4046 case 1: gen_helper_neon_narrow_sat_s16(dest, cpu_env, src); break;
4047 case 2: gen_helper_neon_narrow_sat_s32(dest, cpu_env, src); break;
4048 default: abort();
4052 static inline void gen_neon_narrow_satu(int size, TCGv dest, TCGv_i64 src)
4054 switch (size) {
4055 case 0: gen_helper_neon_narrow_sat_u8(dest, cpu_env, src); break;
4056 case 1: gen_helper_neon_narrow_sat_u16(dest, cpu_env, src); break;
4057 case 2: gen_helper_neon_narrow_sat_u32(dest, cpu_env, src); break;
4058 default: abort();
4062 static inline void gen_neon_shift_narrow(int size, TCGv var, TCGv shift,
4063 int q, int u)
4065 if (q) {
4066 if (u) {
4067 switch (size) {
4068 case 1: gen_helper_neon_rshl_u16(var, var, shift); break;
4069 case 2: gen_helper_neon_rshl_u32(var, var, shift); break;
4070 default: abort();
4072 } else {
4073 switch (size) {
4074 case 1: gen_helper_neon_rshl_s16(var, var, shift); break;
4075 case 2: gen_helper_neon_rshl_s32(var, var, shift); break;
4076 default: abort();
4079 } else {
4080 if (u) {
4081 switch (size) {
4082 case 1: gen_helper_neon_rshl_u16(var, var, shift); break;
4083 case 2: gen_helper_neon_rshl_u32(var, var, shift); break;
4084 default: abort();
4086 } else {
4087 switch (size) {
4088 case 1: gen_helper_neon_shl_s16(var, var, shift); break;
4089 case 2: gen_helper_neon_shl_s32(var, var, shift); break;
4090 default: abort();
4096 static inline void gen_neon_widen(TCGv_i64 dest, TCGv src, int size, int u)
4098 if (u) {
4099 switch (size) {
4100 case 0: gen_helper_neon_widen_u8(dest, src); break;
4101 case 1: gen_helper_neon_widen_u16(dest, src); break;
4102 case 2: tcg_gen_extu_i32_i64(dest, src); break;
4103 default: abort();
4105 } else {
4106 switch (size) {
4107 case 0: gen_helper_neon_widen_s8(dest, src); break;
4108 case 1: gen_helper_neon_widen_s16(dest, src); break;
4109 case 2: tcg_gen_ext_i32_i64(dest, src); break;
4110 default: abort();
4113 dead_tmp(src);
4116 static inline void gen_neon_addl(int size)
4118 switch (size) {
4119 case 0: gen_helper_neon_addl_u16(CPU_V001); break;
4120 case 1: gen_helper_neon_addl_u32(CPU_V001); break;
4121 case 2: tcg_gen_add_i64(CPU_V001); break;
4122 default: abort();
4126 static inline void gen_neon_subl(int size)
4128 switch (size) {
4129 case 0: gen_helper_neon_subl_u16(CPU_V001); break;
4130 case 1: gen_helper_neon_subl_u32(CPU_V001); break;
4131 case 2: tcg_gen_sub_i64(CPU_V001); break;
4132 default: abort();
4136 static inline void gen_neon_negl(TCGv_i64 var, int size)
4138 switch (size) {
4139 case 0: gen_helper_neon_negl_u16(var, var); break;
4140 case 1: gen_helper_neon_negl_u32(var, var); break;
4141 case 2: gen_helper_neon_negl_u64(var, var); break;
4142 default: abort();
4146 static inline void gen_neon_addl_saturate(TCGv_i64 op0, TCGv_i64 op1, int size)
4148 switch (size) {
4149 case 1: gen_helper_neon_addl_saturate_s32(op0, cpu_env, op0, op1); break;
4150 case 2: gen_helper_neon_addl_saturate_s64(op0, cpu_env, op0, op1); break;
4151 default: abort();
4155 static inline void gen_neon_mull(TCGv_i64 dest, TCGv a, TCGv b, int size, int u)
4157 TCGv_i64 tmp;
4159 switch ((size << 1) | u) {
4160 case 0: gen_helper_neon_mull_s8(dest, a, b); break;
4161 case 1: gen_helper_neon_mull_u8(dest, a, b); break;
4162 case 2: gen_helper_neon_mull_s16(dest, a, b); break;
4163 case 3: gen_helper_neon_mull_u16(dest, a, b); break;
4164 case 4:
4165 tmp = gen_muls_i64_i32(a, b);
4166 tcg_gen_mov_i64(dest, tmp);
4167 break;
4168 case 5:
4169 tmp = gen_mulu_i64_i32(a, b);
4170 tcg_gen_mov_i64(dest, tmp);
4171 break;
4172 default: abort();
4176 /* Translate a NEON data processing instruction. Return nonzero if the
4177 instruction is invalid.
4178 We process data in a mixture of 32-bit and 64-bit chunks.
4179 Mostly we use 32-bit chunks so we can use normal scalar instructions. */
4181 static int disas_neon_data_insn(CPUState * env, DisasContext *s, uint32_t insn)
4183 int op;
4184 int q;
4185 int rd, rn, rm;
4186 int size;
4187 int shift;
4188 int pass;
4189 int count;
4190 int pairwise;
4191 int u;
4192 int n;
4193 uint32_t imm, mask;
4194 TCGv tmp, tmp2, tmp3, tmp4, tmp5;
4195 TCGv_i64 tmp64;
4197 if (!vfp_enabled(env))
4198 return 1;
4199 q = (insn & (1 << 6)) != 0;
4200 u = (insn >> 24) & 1;
4201 VFP_DREG_D(rd, insn);
4202 VFP_DREG_N(rn, insn);
4203 VFP_DREG_M(rm, insn);
4204 size = (insn >> 20) & 3;
4205 if ((insn & (1 << 23)) == 0) {
4206 /* Three register same length. */
4207 op = ((insn >> 7) & 0x1e) | ((insn >> 4) & 1);
4208 if (size == 3 && (op == 1 || op == 5 || op == 8 || op == 9
4209 || op == 10 || op == 11 || op == 16)) {
4210 /* 64-bit element instructions. */
4211 for (pass = 0; pass < (q ? 2 : 1); pass++) {
4212 neon_load_reg64(cpu_V0, rn + pass);
4213 neon_load_reg64(cpu_V1, rm + pass);
4214 switch (op) {
4215 case 1: /* VQADD */
4216 if (u) {
4217 gen_helper_neon_add_saturate_u64(CPU_V001);
4218 } else {
4219 gen_helper_neon_add_saturate_s64(CPU_V001);
4221 break;
4222 case 5: /* VQSUB */
4223 if (u) {
4224 gen_helper_neon_sub_saturate_u64(CPU_V001);
4225 } else {
4226 gen_helper_neon_sub_saturate_s64(CPU_V001);
4228 break;
4229 case 8: /* VSHL */
4230 if (u) {
4231 gen_helper_neon_shl_u64(cpu_V0, cpu_V1, cpu_V0);
4232 } else {
4233 gen_helper_neon_shl_s64(cpu_V0, cpu_V1, cpu_V0);
4235 break;
4236 case 9: /* VQSHL */
4237 if (u) {
4238 gen_helper_neon_qshl_u64(cpu_V0, cpu_env,
4239 cpu_V1, cpu_V0);
4240 } else {
4241 gen_helper_neon_qshl_s64(cpu_V0, cpu_env,
4242 cpu_V1, cpu_V0);
4244 break;
4245 case 10: /* VRSHL */
4246 if (u) {
4247 gen_helper_neon_rshl_u64(cpu_V0, cpu_V1, cpu_V0);
4248 } else {
4249 gen_helper_neon_rshl_s64(cpu_V0, cpu_V1, cpu_V0);
4251 break;
4252 case 11: /* VQRSHL */
4253 if (u) {
4254 gen_helper_neon_qrshl_u64(cpu_V0, cpu_env,
4255 cpu_V1, cpu_V0);
4256 } else {
4257 gen_helper_neon_qrshl_s64(cpu_V0, cpu_env,
4258 cpu_V1, cpu_V0);
4260 break;
4261 case 16:
4262 if (u) {
4263 tcg_gen_sub_i64(CPU_V001);
4264 } else {
4265 tcg_gen_add_i64(CPU_V001);
4267 break;
4268 default:
4269 abort();
4271 neon_store_reg64(cpu_V0, rd + pass);
4273 return 0;
4275 switch (op) {
4276 case 8: /* VSHL */
4277 case 9: /* VQSHL */
4278 case 10: /* VRSHL */
4279 case 11: /* VQRSHL */
4281 int rtmp;
4282 /* Shift instruction operands are reversed. */
4283 rtmp = rn;
4284 rn = rm;
4285 rm = rtmp;
4286 pairwise = 0;
4288 break;
4289 case 20: /* VPMAX */
4290 case 21: /* VPMIN */
4291 case 23: /* VPADD */
4292 pairwise = 1;
4293 break;
4294 case 26: /* VPADD (float) */
4295 pairwise = (u && size < 2);
4296 break;
4297 case 30: /* VPMIN/VPMAX (float) */
4298 pairwise = u;
4299 break;
4300 default:
4301 pairwise = 0;
4302 break;
4305 for (pass = 0; pass < (q ? 4 : 2); pass++) {
4307 if (pairwise) {
4308 /* Pairwise. */
4309 if (q)
4310 n = (pass & 1) * 2;
4311 else
4312 n = 0;
4313 if (pass < q + 1) {
4314 tmp = neon_load_reg(rn, n);
4315 tmp2 = neon_load_reg(rn, n + 1);
4316 } else {
4317 tmp = neon_load_reg(rm, n);
4318 tmp2 = neon_load_reg(rm, n + 1);
4320 } else {
4321 /* Elementwise. */
4322 tmp = neon_load_reg(rn, pass);
4323 tmp2 = neon_load_reg(rm, pass);
4325 switch (op) {
4326 case 0: /* VHADD */
4327 GEN_NEON_INTEGER_OP(hadd);
4328 break;
4329 case 1: /* VQADD */
4330 GEN_NEON_INTEGER_OP_ENV(qadd);
4331 break;
4332 case 2: /* VRHADD */
4333 GEN_NEON_INTEGER_OP(rhadd);
4334 break;
4335 case 3: /* Logic ops. */
4336 switch ((u << 2) | size) {
4337 case 0: /* VAND */
4338 tcg_gen_and_i32(tmp, tmp, tmp2);
4339 break;
4340 case 1: /* BIC */
4341 tcg_gen_andc_i32(tmp, tmp, tmp2);
4342 break;
4343 case 2: /* VORR */
4344 tcg_gen_or_i32(tmp, tmp, tmp2);
4345 break;
4346 case 3: /* VORN */
4347 tcg_gen_orc_i32(tmp, tmp, tmp2);
4348 break;
4349 case 4: /* VEOR */
4350 tcg_gen_xor_i32(tmp, tmp, tmp2);
4351 break;
4352 case 5: /* VBSL */
4353 tmp3 = neon_load_reg(rd, pass);
4354 gen_neon_bsl(tmp, tmp, tmp2, tmp3);
4355 dead_tmp(tmp3);
4356 break;
4357 case 6: /* VBIT */
4358 tmp3 = neon_load_reg(rd, pass);
4359 gen_neon_bsl(tmp, tmp, tmp3, tmp2);
4360 dead_tmp(tmp3);
4361 break;
4362 case 7: /* VBIF */
4363 tmp3 = neon_load_reg(rd, pass);
4364 gen_neon_bsl(tmp, tmp3, tmp, tmp2);
4365 dead_tmp(tmp3);
4366 break;
4368 break;
4369 case 4: /* VHSUB */
4370 GEN_NEON_INTEGER_OP(hsub);
4371 break;
4372 case 5: /* VQSUB */
4373 GEN_NEON_INTEGER_OP_ENV(qsub);
4374 break;
4375 case 6: /* VCGT */
4376 GEN_NEON_INTEGER_OP(cgt);
4377 break;
4378 case 7: /* VCGE */
4379 GEN_NEON_INTEGER_OP(cge);
4380 break;
4381 case 8: /* VSHL */
4382 GEN_NEON_INTEGER_OP(shl);
4383 break;
4384 case 9: /* VQSHL */
4385 GEN_NEON_INTEGER_OP_ENV(qshl);
4386 break;
4387 case 10: /* VRSHL */
4388 GEN_NEON_INTEGER_OP(rshl);
4389 break;
4390 case 11: /* VQRSHL */
4391 GEN_NEON_INTEGER_OP_ENV(qrshl);
4392 break;
4393 case 12: /* VMAX */
4394 GEN_NEON_INTEGER_OP(max);
4395 break;
4396 case 13: /* VMIN */
4397 GEN_NEON_INTEGER_OP(min);
4398 break;
4399 case 14: /* VABD */
4400 GEN_NEON_INTEGER_OP(abd);
4401 break;
4402 case 15: /* VABA */
4403 GEN_NEON_INTEGER_OP(abd);
4404 dead_tmp(tmp2);
4405 tmp2 = neon_load_reg(rd, pass);
4406 gen_neon_add(size, tmp, tmp2);
4407 break;
4408 case 16:
4409 if (!u) { /* VADD */
4410 if (gen_neon_add(size, tmp, tmp2))
4411 return 1;
4412 } else { /* VSUB */
4413 switch (size) {
4414 case 0: gen_helper_neon_sub_u8(tmp, tmp, tmp2); break;
4415 case 1: gen_helper_neon_sub_u16(tmp, tmp, tmp2); break;
4416 case 2: tcg_gen_sub_i32(tmp, tmp, tmp2); break;
4417 default: return 1;
4420 break;
4421 case 17:
4422 if (!u) { /* VTST */
4423 switch (size) {
4424 case 0: gen_helper_neon_tst_u8(tmp, tmp, tmp2); break;
4425 case 1: gen_helper_neon_tst_u16(tmp, tmp, tmp2); break;
4426 case 2: gen_helper_neon_tst_u32(tmp, tmp, tmp2); break;
4427 default: return 1;
4429 } else { /* VCEQ */
4430 switch (size) {
4431 case 0: gen_helper_neon_ceq_u8(tmp, tmp, tmp2); break;
4432 case 1: gen_helper_neon_ceq_u16(tmp, tmp, tmp2); break;
4433 case 2: gen_helper_neon_ceq_u32(tmp, tmp, tmp2); break;
4434 default: return 1;
4437 break;
4438 case 18: /* Multiply. */
4439 switch (size) {
4440 case 0: gen_helper_neon_mul_u8(tmp, tmp, tmp2); break;
4441 case 1: gen_helper_neon_mul_u16(tmp, tmp, tmp2); break;
4442 case 2: tcg_gen_mul_i32(tmp, tmp, tmp2); break;
4443 default: return 1;
4445 dead_tmp(tmp2);
4446 tmp2 = neon_load_reg(rd, pass);
4447 if (u) { /* VMLS */
4448 gen_neon_rsb(size, tmp, tmp2);
4449 } else { /* VMLA */
4450 gen_neon_add(size, tmp, tmp2);
4452 break;
4453 case 19: /* VMUL */
4454 if (u) { /* polynomial */
4455 gen_helper_neon_mul_p8(tmp, tmp, tmp2);
4456 } else { /* Integer */
4457 switch (size) {
4458 case 0: gen_helper_neon_mul_u8(tmp, tmp, tmp2); break;
4459 case 1: gen_helper_neon_mul_u16(tmp, tmp, tmp2); break;
4460 case 2: tcg_gen_mul_i32(tmp, tmp, tmp2); break;
4461 default: return 1;
4464 break;
4465 case 20: /* VPMAX */
4466 GEN_NEON_INTEGER_OP(pmax);
4467 break;
4468 case 21: /* VPMIN */
4469 GEN_NEON_INTEGER_OP(pmin);
4470 break;
4471                 case 22: /* Multiply high. */
4472 if (!u) { /* VQDMULH */
4473 switch (size) {
4474 case 1: gen_helper_neon_qdmulh_s16(tmp, cpu_env, tmp, tmp2); break;
4475 case 2: gen_helper_neon_qdmulh_s32(tmp, cpu_env, tmp, tmp2); break;
4476 default: return 1;
4478                 } else { /* VQRDMULH */
4479 switch (size) {
4480 case 1: gen_helper_neon_qrdmulh_s16(tmp, cpu_env, tmp, tmp2); break;
4481 case 2: gen_helper_neon_qrdmulh_s32(tmp, cpu_env, tmp, tmp2); break;
4482 default: return 1;
4485 break;
4486 case 23: /* VPADD */
4487 if (u)
4488 return 1;
4489 switch (size) {
4490 case 0: gen_helper_neon_padd_u8(tmp, tmp, tmp2); break;
4491 case 1: gen_helper_neon_padd_u16(tmp, tmp, tmp2); break;
4492 case 2: tcg_gen_add_i32(tmp, tmp, tmp2); break;
4493 default: return 1;
4495 break;
4496                 case 26: /* Floating point arithmetic. */
4497 switch ((u << 2) | size) {
4498 case 0: /* VADD */
4499 gen_helper_neon_add_f32(tmp, tmp, tmp2);
4500 break;
4501 case 2: /* VSUB */
4502 gen_helper_neon_sub_f32(tmp, tmp, tmp2);
4503 break;
4504 case 4: /* VPADD */
4505 gen_helper_neon_add_f32(tmp, tmp, tmp2);
4506 break;
4507 case 6: /* VABD */
4508 gen_helper_neon_abd_f32(tmp, tmp, tmp2);
4509 break;
4510 default:
4511 return 1;
4513 break;
4514 case 27: /* Float multiply. */
4515 gen_helper_neon_mul_f32(tmp, tmp, tmp2);
4516 if (!u) {
4517 dead_tmp(tmp2);
4518 tmp2 = neon_load_reg(rd, pass);
4519 if (size == 0) {
4520 gen_helper_neon_add_f32(tmp, tmp, tmp2);
4521 } else {
4522 gen_helper_neon_sub_f32(tmp, tmp2, tmp);
4525 break;
4526 case 28: /* Float compare. */
4527 if (!u) {
4528 gen_helper_neon_ceq_f32(tmp, tmp, tmp2);
4529 } else {
4530 if (size == 0)
4531 gen_helper_neon_cge_f32(tmp, tmp, tmp2);
4532 else
4533 gen_helper_neon_cgt_f32(tmp, tmp, tmp2);
4535 break;
4536 case 29: /* Float compare absolute. */
4537 if (!u)
4538 return 1;
4539 if (size == 0)
4540 gen_helper_neon_acge_f32(tmp, tmp, tmp2);
4541 else
4542 gen_helper_neon_acgt_f32(tmp, tmp, tmp2);
4543 break;
4544 case 30: /* Float min/max. */
4545 if (size == 0)
4546 gen_helper_neon_max_f32(tmp, tmp, tmp2);
4547 else
4548 gen_helper_neon_min_f32(tmp, tmp, tmp2);
4549 break;
4550 case 31:
4551 if (size == 0)
4552 gen_helper_recps_f32(tmp, tmp, tmp2, cpu_env);
4553 else
4554 gen_helper_rsqrts_f32(tmp, tmp, tmp2, cpu_env);
4555 break;
4556 default:
4557 abort();
4559 dead_tmp(tmp2);
4561 /* Save the result. For elementwise operations we can put it
4562 straight into the destination register. For pairwise operations
4563 we have to be careful to avoid clobbering the source operands. */
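                 /* Example of the hazard (an assumed case, for illustration):
                    VPADD d0, d1, d0 has rd == rm, so writing d0 on pass 0 would
                    clobber an operand still needed on pass 1; results are
                    therefore staged in scratch space and copied back after the
                    loop. */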
4564 if (pairwise && rd == rm) {
4565 neon_store_scratch(pass, tmp);
4566 } else {
4567 neon_store_reg(rd, pass, tmp);
4570 } /* for pass */
4571 if (pairwise && rd == rm) {
4572 for (pass = 0; pass < (q ? 4 : 2); pass++) {
4573 tmp = neon_load_scratch(pass);
4574 neon_store_reg(rd, pass, tmp);
4577 /* End of 3 register same size operations. */
4578 } else if (insn & (1 << 4)) {
4579 if ((insn & 0x00380080) != 0) {
4580 /* Two registers and shift. */
4581 op = (insn >> 8) & 0xf;
4582 if (insn & (1 << 7)) {
4583 /* 64-bit shift. */
4584 size = 3;
4585 } else {
4586 size = 2;
4587 while ((insn & (1 << (size + 19))) == 0)
4588 size--;
4590 shift = (insn >> 16) & ((1 << (3 + size)) - 1);
4591             /* To avoid excessive duplication of ops we implement shift
4592 by immediate using the variable shift operations. */
4593 if (op < 8) {
4594 /* Shift by immediate:
4595 VSHR, VSRA, VRSHR, VRSRA, VSRI, VSHL, VQSHL, VQSHLU. */
4596 /* Right shifts are encoded as N - shift, where N is the
4597 element size in bits. */
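                 /* Worked example (assuming an 8-bit VSHR #3): the 3-bit shift
                    field holds 8 - 3 = 5, so the adjustment below yields
                    5 - 8 = -3, and the variable shift helpers interpret the
                    negative count as a right shift by 3. */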
4598 if (op <= 4)
4599 shift = shift - (1 << (size + 3));
4600 if (size == 3) {
4601 count = q + 1;
4602 } else {
4603 count = q ? 4: 2;
4605 switch (size) {
4606 case 0:
4607 imm = (uint8_t) shift;
4608 imm |= imm << 8;
4609 imm |= imm << 16;
4610 break;
4611 case 1:
4612 imm = (uint16_t) shift;
4613 imm |= imm << 16;
4614 break;
4615 case 2:
4616 case 3:
4617 imm = shift;
4618 break;
4619 default:
4620 abort();
4623 for (pass = 0; pass < count; pass++) {
4624 if (size == 3) {
4625 neon_load_reg64(cpu_V0, rm + pass);
4626 tcg_gen_movi_i64(cpu_V1, imm);
4627 switch (op) {
4628 case 0: /* VSHR */
4629 case 1: /* VSRA */
4630 if (u)
4631 gen_helper_neon_shl_u64(cpu_V0, cpu_V0, cpu_V1);
4632 else
4633 gen_helper_neon_shl_s64(cpu_V0, cpu_V0, cpu_V1);
4634 break;
4635 case 2: /* VRSHR */
4636 case 3: /* VRSRA */
4637 if (u)
4638 gen_helper_neon_rshl_u64(cpu_V0, cpu_V0, cpu_V1);
4639 else
4640 gen_helper_neon_rshl_s64(cpu_V0, cpu_V0, cpu_V1);
4641 break;
4642 case 4: /* VSRI */
4643 if (!u)
4644 return 1;
4645 gen_helper_neon_shl_u64(cpu_V0, cpu_V0, cpu_V1);
4646 break;
4647 case 5: /* VSHL, VSLI */
4648 gen_helper_neon_shl_u64(cpu_V0, cpu_V0, cpu_V1);
4649 break;
4650 case 6: /* VQSHL */
4651 if (u)
4652 gen_helper_neon_qshl_u64(cpu_V0, cpu_env, cpu_V0, cpu_V1);
4653 else
4654 gen_helper_neon_qshl_s64(cpu_V0, cpu_env, cpu_V0, cpu_V1);
4655 break;
4656 case 7: /* VQSHLU */
4657 gen_helper_neon_qshl_u64(cpu_V0, cpu_env, cpu_V0, cpu_V1);
4658 break;
4660 if (op == 1 || op == 3) {
4661 /* Accumulate. */
4662 neon_load_reg64(cpu_V0, rd + pass);
4663 tcg_gen_add_i64(cpu_V0, cpu_V0, cpu_V1);
4664 } else if (op == 4 || (op == 5 && u)) {
4665 /* Insert */
4666 cpu_abort(env, "VS[LR]I.64 not implemented");
4668 neon_store_reg64(cpu_V0, rd + pass);
4669 } else { /* size < 3 */
4670                     /* Operands in tmp and tmp2. */
4671 tmp = neon_load_reg(rm, pass);
4672 tmp2 = new_tmp();
4673 tcg_gen_movi_i32(tmp2, imm);
4674 switch (op) {
4675 case 0: /* VSHR */
4676 case 1: /* VSRA */
4677 GEN_NEON_INTEGER_OP(shl);
4678 break;
4679 case 2: /* VRSHR */
4680 case 3: /* VRSRA */
4681 GEN_NEON_INTEGER_OP(rshl);
4682 break;
4683 case 4: /* VSRI */
4684 if (!u)
4685 return 1;
4686 GEN_NEON_INTEGER_OP(shl);
4687 break;
4688 case 5: /* VSHL, VSLI */
4689 switch (size) {
4690 case 0: gen_helper_neon_shl_u8(tmp, tmp, tmp2); break;
4691 case 1: gen_helper_neon_shl_u16(tmp, tmp, tmp2); break;
4692 case 2: gen_helper_neon_shl_u32(tmp, tmp, tmp2); break;
4693 default: return 1;
4695 break;
4696 case 6: /* VQSHL */
4697 GEN_NEON_INTEGER_OP_ENV(qshl);
4698 break;
4699 case 7: /* VQSHLU */
4700 switch (size) {
4701 case 0: gen_helper_neon_qshl_u8(tmp, cpu_env, tmp, tmp2); break;
4702 case 1: gen_helper_neon_qshl_u16(tmp, cpu_env, tmp, tmp2); break;
4703 case 2: gen_helper_neon_qshl_u32(tmp, cpu_env, tmp, tmp2); break;
4704 default: return 1;
4706 break;
4708 dead_tmp(tmp2);
4710 if (op == 1 || op == 3) {
4711 /* Accumulate. */
4712 tmp2 = neon_load_reg(rd, pass);
4713 gen_neon_add(size, tmp2, tmp);
4714 dead_tmp(tmp2);
4715 } else if (op == 4 || (op == 5 && u)) {
4716 /* Insert */
4717 switch (size) {
4718 case 0:
4719 if (op == 4)
4720 mask = 0xff >> -shift;
4721 else
4722 mask = (uint8_t)(0xff << shift);
4723 mask |= mask << 8;
4724 mask |= mask << 16;
4725 break;
4726 case 1:
4727 if (op == 4)
4728 mask = 0xffff >> -shift;
4729 else
4730 mask = (uint16_t)(0xffff << shift);
4731 mask |= mask << 16;
4732 break;
4733 case 2:
4734 if (shift < -31 || shift > 31) {
4735 mask = 0;
4736 } else {
4737 if (op == 4)
4738 mask = 0xffffffffu >> -shift;
4739 else
4740 mask = 0xffffffffu << shift;
4742 break;
4743 default:
4744 abort();
4746 tmp2 = neon_load_reg(rd, pass);
4747 tcg_gen_andi_i32(tmp, tmp, mask);
4748 tcg_gen_andi_i32(tmp2, tmp2, ~mask);
4749 tcg_gen_or_i32(tmp, tmp, tmp2);
4750 dead_tmp(tmp2);
4752 neon_store_reg(rd, pass, tmp);
4754 } /* for pass */
4755 } else if (op < 10) {
4756 /* Shift by immediate and narrow:
4757 VSHRN, VRSHRN, VQSHRN, VQRSHRN. */
4758 shift = shift - (1 << (size + 3));
4759 size++;
4760 switch (size) {
4761 case 1:
4762 imm = (uint16_t)shift;
4763 imm |= imm << 16;
4764 tmp2 = tcg_const_i32(imm);
4765 TCGV_UNUSED_I64(tmp64);
4766 break;
4767 case 2:
4768 imm = (uint32_t)shift;
4769 tmp2 = tcg_const_i32(imm);
4770 TCGV_UNUSED_I64(tmp64);
4771 break;
4772 case 3:
4773 tmp64 = tcg_const_i64(shift);
4774 TCGV_UNUSED(tmp2);
4775 break;
4776 default:
4777 abort();
4780 for (pass = 0; pass < 2; pass++) {
4781 if (size == 3) {
4782 neon_load_reg64(cpu_V0, rm + pass);
4783 if (q) {
4784 if (u)
4785 gen_helper_neon_rshl_u64(cpu_V0, cpu_V0, tmp64);
4786 else
4787 gen_helper_neon_rshl_s64(cpu_V0, cpu_V0, tmp64);
4788 } else {
4789 if (u)
4790 gen_helper_neon_shl_u64(cpu_V0, cpu_V0, tmp64);
4791 else
4792 gen_helper_neon_shl_s64(cpu_V0, cpu_V0, tmp64);
4794 } else {
4795 tmp = neon_load_reg(rm + pass, 0);
4796 gen_neon_shift_narrow(size, tmp, tmp2, q, u);
4797 tmp3 = neon_load_reg(rm + pass, 1);
4798 gen_neon_shift_narrow(size, tmp3, tmp2, q, u);
4799 tcg_gen_concat_i32_i64(cpu_V0, tmp, tmp3);
4800 dead_tmp(tmp);
4801 dead_tmp(tmp3);
4803 tmp = new_tmp();
4804 if (op == 8 && !u) {
4805 gen_neon_narrow(size - 1, tmp, cpu_V0);
4806 } else {
4807 if (op == 8)
4808 gen_neon_narrow_sats(size - 1, tmp, cpu_V0);
4809 else
4810 gen_neon_narrow_satu(size - 1, tmp, cpu_V0);
4812 neon_store_reg(rd, pass, tmp);
4813 } /* for pass */
4814 if (size == 3) {
4815 tcg_temp_free_i64(tmp64);
4816 } else {
4817 dead_tmp(tmp2);
4819 } else if (op == 10) {
4820 /* VSHLL */
4821 if (q || size == 3)
4822 return 1;
4823 tmp = neon_load_reg(rm, 0);
4824 tmp2 = neon_load_reg(rm, 1);
4825 for (pass = 0; pass < 2; pass++) {
4826 if (pass == 1)
4827 tmp = tmp2;
4829 gen_neon_widen(cpu_V0, tmp, size, u);
4831 if (shift != 0) {
4832 /* The shift is less than the width of the source
4833 type, so we can just shift the whole register. */
4834 tcg_gen_shli_i64(cpu_V0, cpu_V0, shift);
4835 if (size < 2 || !u) {
4836 uint64_t imm64;
4837 if (size == 0) {
4838 imm = (0xffu >> (8 - shift));
4839 imm |= imm << 16;
4840 } else {
4841 imm = 0xffff >> (16 - shift);
4843 imm64 = imm | (((uint64_t)imm) << 32);
4844 tcg_gen_andi_i64(cpu_V0, cpu_V0, imm64);
4847 neon_store_reg64(cpu_V0, rd + pass);
4849 } else if (op >= 14) {
4850 /* VCVT fixed-point. */
4851 /* We have already masked out the must-be-1 top bit of imm6,
4852 * hence this 32-shift where the ARM ARM has 64-imm6.
4854 shift = 32 - shift;
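             /* Illustrative example: an imm6 of 48 was masked to 16 by the
                earlier field extraction, so the line above gives 32 - 16 = 16
                fraction bits, matching the architectural 64 - imm6. */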
4855 for (pass = 0; pass < (q ? 4 : 2); pass++) {
4856 tcg_gen_ld_f32(cpu_F0s, cpu_env, neon_reg_offset(rm, pass));
4857 if (!(op & 1)) {
4858 if (u)
4859 gen_vfp_ulto(0, shift);
4860 else
4861 gen_vfp_slto(0, shift);
4862 } else {
4863 if (u)
4864 gen_vfp_toul(0, shift);
4865 else
4866 gen_vfp_tosl(0, shift);
4868 tcg_gen_st_f32(cpu_F0s, cpu_env, neon_reg_offset(rd, pass));
4870 } else {
4871 return 1;
4873 } else { /* (insn & 0x00380080) == 0 */
4874 int invert;
4876 op = (insn >> 8) & 0xf;
4877 /* One register and immediate. */
4878 imm = (u << 7) | ((insn >> 12) & 0x70) | (insn & 0xf);
4879 invert = (insn & (1 << 5)) != 0;
4880 switch (op) {
4881 case 0: case 1:
4882 /* no-op */
4883 break;
4884 case 2: case 3:
4885 imm <<= 8;
4886 break;
4887 case 4: case 5:
4888 imm <<= 16;
4889 break;
4890 case 6: case 7:
4891 imm <<= 24;
4892 break;
4893 case 8: case 9:
4894 imm |= imm << 16;
4895 break;
4896 case 10: case 11:
4897 imm = (imm << 8) | (imm << 24);
4898 break;
4899 case 12:
4900 imm = (imm << 8) | 0xff;
4901 break;
4902 case 13:
4903 imm = (imm << 16) | 0xffff;
4904 break;
4905 case 14:
4906 imm |= (imm << 8) | (imm << 16) | (imm << 24);
4907 if (invert)
4908 imm = ~imm;
4909 break;
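             /* Case 15 below looks like the 32-bit float immediate expansion:
                bit 7 becomes the sign, bit 6 is inverted and replicated into
                the exponent, and bits 5:0 form the top of the fraction
                (a descriptive reading of the expression, not a new claim). */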
4910 case 15:
4911 imm = ((imm & 0x80) << 24) | ((imm & 0x3f) << 19)
4912 | ((imm & 0x40) ? (0x1f << 25) : (1 << 30));
4913 break;
4915 if (invert)
4916 imm = ~imm;
4918 for (pass = 0; pass < (q ? 4 : 2); pass++) {
4919 if (op & 1 && op < 12) {
4920 tmp = neon_load_reg(rd, pass);
4921 if (invert) {
4922 /* The immediate value has already been inverted, so
4923 BIC becomes AND. */
4924 tcg_gen_andi_i32(tmp, tmp, imm);
4925 } else {
4926 tcg_gen_ori_i32(tmp, tmp, imm);
4928 } else {
4929 /* VMOV, VMVN. */
4930 tmp = new_tmp();
4931 if (op == 14 && invert) {
4932 uint32_t val;
4933 val = 0;
4934 for (n = 0; n < 4; n++) {
4935 if (imm & (1 << (n + (pass & 1) * 4)))
4936 val |= 0xff << (n * 8);
4938 tcg_gen_movi_i32(tmp, val);
4939 } else {
4940 tcg_gen_movi_i32(tmp, imm);
4943 neon_store_reg(rd, pass, tmp);
4946 } else { /* (insn & 0x00800010 == 0x00800000) */
4947 if (size != 3) {
4948 op = (insn >> 8) & 0xf;
4949 if ((insn & (1 << 6)) == 0) {
4950 /* Three registers of different lengths. */
4951 int src1_wide;
4952 int src2_wide;
4953 int prewiden;
4954 /* prewiden, src1_wide, src2_wide */
4955 static const int neon_3reg_wide[16][3] = {
4956 {1, 0, 0}, /* VADDL */
4957 {1, 1, 0}, /* VADDW */
4958 {1, 0, 0}, /* VSUBL */
4959 {1, 1, 0}, /* VSUBW */
4960 {0, 1, 1}, /* VADDHN */
4961 {0, 0, 0}, /* VABAL */
4962 {0, 1, 1}, /* VSUBHN */
4963 {0, 0, 0}, /* VABDL */
4964 {0, 0, 0}, /* VMLAL */
4965 {0, 0, 0}, /* VQDMLAL */
4966 {0, 0, 0}, /* VMLSL */
4967 {0, 0, 0}, /* VQDMLSL */
4968 {0, 0, 0}, /* Integer VMULL */
4969 {0, 0, 0}, /* VQDMULL */
4970 {0, 0, 0} /* Polynomial VMULL */
4973 prewiden = neon_3reg_wide[op][0];
4974 src1_wide = neon_3reg_wide[op][1];
4975 src2_wide = neon_3reg_wide[op][2];
4977 if (size == 0 && (op == 9 || op == 11 || op == 13))
4978 return 1;
4980 /* Avoid overlapping operands. Wide source operands are
4981 always aligned so will never overlap with wide
4982 destinations in problematic ways. */
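             /* Assumed example: VMULL q0, d0, d1 has rd == rn, so pass 0 would
                overwrite d0 before pass 1 reads its high half; that half is
                saved to scratch here and reloaded below. */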
4983 if (rd == rm && !src2_wide) {
4984 tmp = neon_load_reg(rm, 1);
4985 neon_store_scratch(2, tmp);
4986 } else if (rd == rn && !src1_wide) {
4987 tmp = neon_load_reg(rn, 1);
4988 neon_store_scratch(2, tmp);
4990 TCGV_UNUSED(tmp3);
4991 for (pass = 0; pass < 2; pass++) {
4992 if (src1_wide) {
4993 neon_load_reg64(cpu_V0, rn + pass);
4994 TCGV_UNUSED(tmp);
4995 } else {
4996 if (pass == 1 && rd == rn) {
4997 tmp = neon_load_scratch(2);
4998 } else {
4999 tmp = neon_load_reg(rn, pass);
5001 if (prewiden) {
5002 gen_neon_widen(cpu_V0, tmp, size, u);
5005 if (src2_wide) {
5006 neon_load_reg64(cpu_V1, rm + pass);
5007 TCGV_UNUSED(tmp2);
5008 } else {
5009 if (pass == 1 && rd == rm) {
5010 tmp2 = neon_load_scratch(2);
5011 } else {
5012 tmp2 = neon_load_reg(rm, pass);
5014 if (prewiden) {
5015 gen_neon_widen(cpu_V1, tmp2, size, u);
5018 switch (op) {
5019 case 0: case 1: case 4: /* VADDL, VADDW, VADDHN, VRADDHN */
5020 gen_neon_addl(size);
5021 break;
5022 case 2: case 3: case 6: /* VSUBL, VSUBW, VSUBHN, VRSUBHN */
5023 gen_neon_subl(size);
5024 break;
5025 case 5: case 7: /* VABAL, VABDL */
5026 switch ((size << 1) | u) {
5027 case 0:
5028 gen_helper_neon_abdl_s16(cpu_V0, tmp, tmp2);
5029 break;
5030 case 1:
5031 gen_helper_neon_abdl_u16(cpu_V0, tmp, tmp2);
5032 break;
5033 case 2:
5034 gen_helper_neon_abdl_s32(cpu_V0, tmp, tmp2);
5035 break;
5036 case 3:
5037 gen_helper_neon_abdl_u32(cpu_V0, tmp, tmp2);
5038 break;
5039 case 4:
5040 gen_helper_neon_abdl_s64(cpu_V0, tmp, tmp2);
5041 break;
5042 case 5:
5043 gen_helper_neon_abdl_u64(cpu_V0, tmp, tmp2);
5044 break;
5045 default: abort();
5047 dead_tmp(tmp2);
5048 dead_tmp(tmp);
5049 break;
5050 case 8: case 9: case 10: case 11: case 12: case 13:
5051 /* VMLAL, VQDMLAL, VMLSL, VQDMLSL, VMULL, VQDMULL */
5052 gen_neon_mull(cpu_V0, tmp, tmp2, size, u);
5053 dead_tmp(tmp2);
5054 dead_tmp(tmp);
5055 break;
5056 case 14: /* Polynomial VMULL */
5057 cpu_abort(env, "Polynomial VMULL not implemented");
5059 default: /* 15 is RESERVED. */
5060 return 1;
5062 if (op == 5 || op == 13 || (op >= 8 && op <= 11)) {
5063 /* Accumulate. */
5064 if (op == 10 || op == 11) {
5065 gen_neon_negl(cpu_V0, size);
5068 if (op != 13) {
5069 neon_load_reg64(cpu_V1, rd + pass);
5072 switch (op) {
5073 case 5: case 8: case 10: /* VABAL, VMLAL, VMLSL */
5074 gen_neon_addl(size);
5075 break;
5076 case 9: case 11: /* VQDMLAL, VQDMLSL */
5077 gen_neon_addl_saturate(cpu_V0, cpu_V0, size);
5078 gen_neon_addl_saturate(cpu_V0, cpu_V1, size);
5079 break;
5080 /* Fall through. */
5081 case 13: /* VQDMULL */
5082 gen_neon_addl_saturate(cpu_V0, cpu_V0, size);
5083 break;
5084 default:
5085 abort();
5087 neon_store_reg64(cpu_V0, rd + pass);
5088 } else if (op == 4 || op == 6) {
5089 /* Narrowing operation. */
5090 tmp = new_tmp();
5091 if (!u) {
5092 switch (size) {
5093 case 0:
5094 gen_helper_neon_narrow_high_u8(tmp, cpu_V0);
5095 break;
5096 case 1:
5097 gen_helper_neon_narrow_high_u16(tmp, cpu_V0);
5098 break;
5099 case 2:
5100 tcg_gen_shri_i64(cpu_V0, cpu_V0, 32);
5101 tcg_gen_trunc_i64_i32(tmp, cpu_V0);
5102 break;
5103 default: abort();
5105 } else {
5106 switch (size) {
5107 case 0:
5108 gen_helper_neon_narrow_round_high_u8(tmp, cpu_V0);
5109 break;
5110 case 1:
5111 gen_helper_neon_narrow_round_high_u16(tmp, cpu_V0);
5112 break;
5113 case 2:
5114 tcg_gen_addi_i64(cpu_V0, cpu_V0, 1u << 31);
5115 tcg_gen_shri_i64(cpu_V0, cpu_V0, 32);
5116 tcg_gen_trunc_i64_i32(tmp, cpu_V0);
5117 break;
5118 default: abort();
5121 if (pass == 0) {
5122 tmp3 = tmp;
5123 } else {
5124 neon_store_reg(rd, 0, tmp3);
5125 neon_store_reg(rd, 1, tmp);
5127 } else {
5128 /* Write back the result. */
5129 neon_store_reg64(cpu_V0, rd + pass);
5132 } else {
5133 /* Two registers and a scalar. */
5134 switch (op) {
5135 case 0: /* Integer VMLA scalar */
5136 case 1: /* Float VMLA scalar */
5137 case 4: /* Integer VMLS scalar */
5138 case 5: /* Floating point VMLS scalar */
5139 case 8: /* Integer VMUL scalar */
5140 case 9: /* Floating point VMUL scalar */
5141 case 12: /* VQDMULH scalar */
5142 case 13: /* VQRDMULH scalar */
5143 tmp = neon_get_scalar(size, rm);
5144 neon_store_scratch(0, tmp);
5145 for (pass = 0; pass < (u ? 4 : 2); pass++) {
5146 tmp = neon_load_scratch(0);
5147 tmp2 = neon_load_reg(rn, pass);
5148 if (op == 12) {
5149 if (size == 1) {
5150 gen_helper_neon_qdmulh_s16(tmp, cpu_env, tmp, tmp2);
5151 } else {
5152 gen_helper_neon_qdmulh_s32(tmp, cpu_env, tmp, tmp2);
5154 } else if (op == 13) {
5155 if (size == 1) {
5156 gen_helper_neon_qrdmulh_s16(tmp, cpu_env, tmp, tmp2);
5157 } else {
5158 gen_helper_neon_qrdmulh_s32(tmp, cpu_env, tmp, tmp2);
5160 } else if (op & 1) {
5161 gen_helper_neon_mul_f32(tmp, tmp, tmp2);
5162 } else {
5163 switch (size) {
5164 case 0: gen_helper_neon_mul_u8(tmp, tmp, tmp2); break;
5165 case 1: gen_helper_neon_mul_u16(tmp, tmp, tmp2); break;
5166 case 2: tcg_gen_mul_i32(tmp, tmp, tmp2); break;
5167 default: return 1;
5170 dead_tmp(tmp2);
5171 if (op < 8) {
5172 /* Accumulate. */
5173 tmp2 = neon_load_reg(rd, pass);
5174 switch (op) {
5175 case 0:
5176 gen_neon_add(size, tmp, tmp2);
5177 break;
5178 case 1:
5179 gen_helper_neon_add_f32(tmp, tmp, tmp2);
5180 break;
5181 case 4:
5182 gen_neon_rsb(size, tmp, tmp2);
5183 break;
5184 case 5:
5185 gen_helper_neon_sub_f32(tmp, tmp2, tmp);
5186 break;
5187 default:
5188 abort();
5190 dead_tmp(tmp2);
5192 neon_store_reg(rd, pass, tmp);
5194 break;
5195         case 2: /* VMLAL scalar */
5196 case 3: /* VQDMLAL scalar */
5197 case 6: /* VMLSL scalar */
5198 case 7: /* VQDMLSL scalar */
5199 case 10: /* VMULL scalar */
5200 case 11: /* VQDMULL scalar */
5201 if (size == 0 && (op == 3 || op == 7 || op == 11))
5202 return 1;
5204 tmp2 = neon_get_scalar(size, rm);
5205 tmp3 = neon_load_reg(rn, 1);
5207 for (pass = 0; pass < 2; pass++) {
5208 if (pass == 0) {
5209 tmp = neon_load_reg(rn, 0);
5210 } else {
5211 tmp = tmp3;
5213 gen_neon_mull(cpu_V0, tmp, tmp2, size, u);
5214 dead_tmp(tmp);
5215 if (op == 6 || op == 7) {
5216 gen_neon_negl(cpu_V0, size);
5218 if (op != 11) {
5219 neon_load_reg64(cpu_V1, rd + pass);
5221 switch (op) {
5222 case 2: case 6:
5223 gen_neon_addl(size);
5224 break;
5225 case 3: case 7:
5226 gen_neon_addl_saturate(cpu_V0, cpu_V0, size);
5227 gen_neon_addl_saturate(cpu_V0, cpu_V1, size);
5228 break;
5229 case 10:
5230 /* no-op */
5231 break;
5232 case 11:
5233 gen_neon_addl_saturate(cpu_V0, cpu_V0, size);
5234 break;
5235 default:
5236 abort();
5238 neon_store_reg64(cpu_V0, rd + pass);
5241 dead_tmp(tmp2);
5243 break;
5244 default: /* 14 and 15 are RESERVED */
5245 return 1;
5248 } else { /* size == 3 */
5249 if (!u) {
5250 /* Extract. */
5251 imm = (insn >> 8) & 0xf;
5253 if (imm > 7 && !q)
5254 return 1;
5256 if (imm == 0) {
5257 neon_load_reg64(cpu_V0, rn);
5258 if (q) {
5259 neon_load_reg64(cpu_V1, rn + 1);
5261 } else if (imm == 8) {
5262 neon_load_reg64(cpu_V0, rn + 1);
5263 if (q) {
5264 neon_load_reg64(cpu_V1, rm);
5266 } else if (q) {
5267 tmp64 = tcg_temp_new_i64();
5268 if (imm < 8) {
5269 neon_load_reg64(cpu_V0, rn);
5270 neon_load_reg64(tmp64, rn + 1);
5271 } else {
5272 neon_load_reg64(cpu_V0, rn + 1);
5273 neon_load_reg64(tmp64, rm);
5275 tcg_gen_shri_i64(cpu_V0, cpu_V0, (imm & 7) * 8);
5276 tcg_gen_shli_i64(cpu_V1, tmp64, 64 - ((imm & 7) * 8));
5277 tcg_gen_or_i64(cpu_V0, cpu_V0, cpu_V1);
5278 if (imm < 8) {
5279 neon_load_reg64(cpu_V1, rm);
5280 } else {
5281 neon_load_reg64(cpu_V1, rm + 1);
5282 imm -= 8;
5284 tcg_gen_shli_i64(cpu_V1, cpu_V1, 64 - (imm * 8));
5285 tcg_gen_shri_i64(tmp64, tmp64, imm * 8);
5286 tcg_gen_or_i64(cpu_V1, cpu_V1, tmp64);
5287 tcg_temp_free_i64(tmp64);
5288 } else {
5289 /* BUGFIX */
5290 neon_load_reg64(cpu_V0, rn);
5291 tcg_gen_shri_i64(cpu_V0, cpu_V0, imm * 8);
5292 neon_load_reg64(cpu_V1, rm);
5293 tcg_gen_shli_i64(cpu_V1, cpu_V1, 64 - (imm * 8));
5294 tcg_gen_or_i64(cpu_V0, cpu_V0, cpu_V1);
5296 neon_store_reg64(cpu_V0, rd);
5297 if (q) {
5298 neon_store_reg64(cpu_V1, rd + 1);
5300 } else if ((insn & (1 << 11)) == 0) {
5301 /* Two register misc. */
5302 op = ((insn >> 12) & 0x30) | ((insn >> 7) & 0xf);
5303 size = (insn >> 18) & 3;
5304 switch (op) {
5305 case 0: /* VREV64 */
5306 if (size == 3)
5307 return 1;
5308 for (pass = 0; pass < (q ? 2 : 1); pass++) {
5309 tmp = neon_load_reg(rm, pass * 2);
5310 tmp2 = neon_load_reg(rm, pass * 2 + 1);
5311 switch (size) {
5312 case 0: tcg_gen_bswap32_i32(tmp, tmp); break;
5313 case 1: gen_swap_half(tmp); break;
5314 case 2: /* no-op */ break;
5315 default: abort();
5317 neon_store_reg(rd, pass * 2 + 1, tmp);
5318 if (size == 2) {
5319 neon_store_reg(rd, pass * 2, tmp2);
5320 } else {
5321 switch (size) {
5322 case 0: tcg_gen_bswap32_i32(tmp2, tmp2); break;
5323 case 1: gen_swap_half(tmp2); break;
5324 default: abort();
5326 neon_store_reg(rd, pass * 2, tmp2);
5329 break;
5330 case 4: case 5: /* VPADDL */
5331 case 12: case 13: /* VPADAL */
5332 if (size == 3)
5333 return 1;
5334 for (pass = 0; pass < q + 1; pass++) {
5335 tmp = neon_load_reg(rm, pass * 2);
5336 gen_neon_widen(cpu_V0, tmp, size, op & 1);
5337 tmp = neon_load_reg(rm, pass * 2 + 1);
5338 gen_neon_widen(cpu_V1, tmp, size, op & 1);
5339 switch (size) {
5340 case 0: gen_helper_neon_paddl_u16(CPU_V001); break;
5341 case 1: gen_helper_neon_paddl_u32(CPU_V001); break;
5342 case 2: tcg_gen_add_i64(CPU_V001); break;
5343 default: abort();
5345 if (op >= 12) {
5346 /* Accumulate. */
5347 neon_load_reg64(cpu_V1, rd + pass);
5348 gen_neon_addl(size);
5350 neon_store_reg64(cpu_V0, rd + pass);
5352 break;
5353 case 33: /* VTRN */
5354 if (size == 2) {
5355 for (n = 0; n < (q ? 4 : 2); n += 2) {
5356 tmp = neon_load_reg(rm, n);
5357 tmp2 = neon_load_reg(rd, n + 1);
5358 neon_store_reg(rm, n, tmp2);
5359 neon_store_reg(rd, n + 1, tmp);
5361 } else {
5362 goto elementwise;
5364 break;
5365 case 34: /* VUZP */
5366 /* Reg Before After
5367 Rd A3 A2 A1 A0 B2 B0 A2 A0
5368 Rm B3 B2 B1 B0 B3 B1 A3 A1
5370 if (size == 3)
5371 return 1;
5372 gen_neon_unzip(rd, q, 0, size);
5373 gen_neon_unzip(rm, q, 4, size);
5374 if (q) {
5375 static int unzip_order_q[8] =
5376 {0, 2, 4, 6, 1, 3, 5, 7};
5377 for (n = 0; n < 8; n++) {
5378 int reg = (n < 4) ? rd : rm;
5379 tmp = neon_load_scratch(unzip_order_q[n]);
5380 neon_store_reg(reg, n % 4, tmp);
5382 } else {
5383 static int unzip_order[4] =
5384 {0, 4, 1, 5};
5385 for (n = 0; n < 4; n++) {
5386 int reg = (n < 2) ? rd : rm;
5387 tmp = neon_load_scratch(unzip_order[n]);
5388 neon_store_reg(reg, n % 2, tmp);
5391 break;
5392 case 35: /* VZIP */
5393 /* Reg Before After
5394 Rd A3 A2 A1 A0 B1 A1 B0 A0
5395 Rm B3 B2 B1 B0 B3 A3 B2 A2
5397 if (size == 3)
5398 return 1;
5399 count = (q ? 4 : 2);
5400 for (n = 0; n < count; n++) {
5401 tmp = neon_load_reg(rd, n);
5402                 tmp2 = neon_load_reg(rm, n);
5403 switch (size) {
5404 case 0: gen_neon_zip_u8(tmp, tmp2); break;
5405 case 1: gen_neon_zip_u16(tmp, tmp2); break;
5406 case 2: /* no-op */; break;
5407 default: abort();
5409 neon_store_scratch(n * 2, tmp);
5410 neon_store_scratch(n * 2 + 1, tmp2);
5412 for (n = 0; n < count * 2; n++) {
5413 int reg = (n < count) ? rd : rm;
5414 tmp = neon_load_scratch(n);
5415 neon_store_reg(reg, n % count, tmp);
5417 break;
5418 case 36: case 37: /* VMOVN, VQMOVUN, VQMOVN */
5419 if (size == 3)
5420 return 1;
5421 TCGV_UNUSED(tmp2);
5422 for (pass = 0; pass < 2; pass++) {
5423 neon_load_reg64(cpu_V0, rm + pass);
5424 tmp = new_tmp();
5425 if (op == 36 && q == 0) {
5426 gen_neon_narrow(size, tmp, cpu_V0);
5427 } else if (q) {
5428 gen_neon_narrow_satu(size, tmp, cpu_V0);
5429 } else {
5430 gen_neon_narrow_sats(size, tmp, cpu_V0);
5432 if (pass == 0) {
5433 tmp2 = tmp;
5434 } else {
5435 neon_store_reg(rd, 0, tmp2);
5436 neon_store_reg(rd, 1, tmp);
5439 break;
5440 case 38: /* VSHLL */
5441 if (q || size == 3)
5442 return 1;
5443 tmp = neon_load_reg(rm, 0);
5444 tmp2 = neon_load_reg(rm, 1);
5445 for (pass = 0; pass < 2; pass++) {
5446 if (pass == 1)
5447 tmp = tmp2;
5448 gen_neon_widen(cpu_V0, tmp, size, 1);
5449 tcg_gen_shli_i64(cpu_V0, cpu_V0, 8 << size);
5450 neon_store_reg64(cpu_V0, rd + pass);
5452 break;
5453 case 44: /* VCVT.F16.F32 */
5454 if (!arm_feature(env, ARM_FEATURE_VFP_FP16))
5455 return 1;
5456 tmp = new_tmp();
5457 tmp2 = new_tmp();
5458 tcg_gen_ld_f32(cpu_F0s, cpu_env, neon_reg_offset(rm, 0));
5459 gen_helper_vfp_fcvt_f32_to_f16(tmp, cpu_F0s, cpu_env);
5460 tcg_gen_ld_f32(cpu_F0s, cpu_env, neon_reg_offset(rm, 1));
5461 gen_helper_vfp_fcvt_f32_to_f16(tmp2, cpu_F0s, cpu_env);
5462 tcg_gen_shli_i32(tmp2, tmp2, 16);
5463 tcg_gen_or_i32(tmp2, tmp2, tmp);
5464 tcg_gen_ld_f32(cpu_F0s, cpu_env, neon_reg_offset(rm, 2));
5465 gen_helper_vfp_fcvt_f32_to_f16(tmp, cpu_F0s, cpu_env);
5466 tcg_gen_ld_f32(cpu_F0s, cpu_env, neon_reg_offset(rm, 3));
5467 neon_store_reg(rd, 0, tmp2);
5468 tmp2 = new_tmp();
5469 gen_helper_vfp_fcvt_f32_to_f16(tmp2, cpu_F0s, cpu_env);
5470 tcg_gen_shli_i32(tmp2, tmp2, 16);
5471 tcg_gen_or_i32(tmp2, tmp2, tmp);
5472 neon_store_reg(rd, 1, tmp2);
5473 dead_tmp(tmp);
5474 break;
5475 case 46: /* VCVT.F32.F16 */
5476 if (!arm_feature(env, ARM_FEATURE_VFP_FP16))
5477 return 1;
5478 tmp3 = new_tmp();
5479 tmp = neon_load_reg(rm, 0);
5480 tmp2 = neon_load_reg(rm, 1);
5481 tcg_gen_ext16u_i32(tmp3, tmp);
5482 gen_helper_vfp_fcvt_f16_to_f32(cpu_F0s, tmp3, cpu_env);
5483 tcg_gen_st_f32(cpu_F0s, cpu_env, neon_reg_offset(rd, 0));
5484 tcg_gen_shri_i32(tmp3, tmp, 16);
5485 gen_helper_vfp_fcvt_f16_to_f32(cpu_F0s, tmp3, cpu_env);
5486 tcg_gen_st_f32(cpu_F0s, cpu_env, neon_reg_offset(rd, 1));
5487 dead_tmp(tmp);
5488 tcg_gen_ext16u_i32(tmp3, tmp2);
5489 gen_helper_vfp_fcvt_f16_to_f32(cpu_F0s, tmp3, cpu_env);
5490 tcg_gen_st_f32(cpu_F0s, cpu_env, neon_reg_offset(rd, 2));
5491 tcg_gen_shri_i32(tmp3, tmp2, 16);
5492 gen_helper_vfp_fcvt_f16_to_f32(cpu_F0s, tmp3, cpu_env);
5493 tcg_gen_st_f32(cpu_F0s, cpu_env, neon_reg_offset(rd, 3));
5494 dead_tmp(tmp2);
5495 dead_tmp(tmp3);
5496 break;
5497 default:
5498 elementwise:
5499 for (pass = 0; pass < (q ? 4 : 2); pass++) {
5500 if (op == 30 || op == 31 || op >= 58) {
5501 tcg_gen_ld_f32(cpu_F0s, cpu_env,
5502 neon_reg_offset(rm, pass));
5503 TCGV_UNUSED(tmp);
5504 } else {
5505 tmp = neon_load_reg(rm, pass);
5507 switch (op) {
5508 case 1: /* VREV32 */
5509 switch (size) {
5510 case 0: tcg_gen_bswap32_i32(tmp, tmp); break;
5511 case 1: gen_swap_half(tmp); break;
5512 default: return 1;
5514 break;
5515 case 2: /* VREV16 */
5516 if (size != 0)
5517 return 1;
5518 gen_rev16(tmp);
5519 break;
5520 case 8: /* CLS */
5521 switch (size) {
5522 case 0: gen_helper_neon_cls_s8(tmp, tmp); break;
5523 case 1: gen_helper_neon_cls_s16(tmp, tmp); break;
5524 case 2: gen_helper_neon_cls_s32(tmp, tmp); break;
5525 default: return 1;
5527 break;
5528 case 9: /* CLZ */
5529 switch (size) {
5530 case 0: gen_helper_neon_clz_u8(tmp, tmp); break;
5531 case 1: gen_helper_neon_clz_u16(tmp, tmp); break;
5532 case 2: gen_helper_clz(tmp, tmp); break;
5533 default: return 1;
5535 break;
5536 case 10: /* CNT */
5537 if (size != 0)
5538 return 1;
5539 gen_helper_neon_cnt_u8(tmp, tmp);
5540 break;
5541 case 11: /* VNOT */
5542 if (size != 0)
5543 return 1;
5544 tcg_gen_not_i32(tmp, tmp);
5545 break;
5546 case 14: /* VQABS */
5547 switch (size) {
5548 case 0: gen_helper_neon_qabs_s8(tmp, cpu_env, tmp); break;
5549 case 1: gen_helper_neon_qabs_s16(tmp, cpu_env, tmp); break;
5550 case 2: gen_helper_neon_qabs_s32(tmp, cpu_env, tmp); break;
5551 default: return 1;
5553 break;
5554 case 15: /* VQNEG */
5555 switch (size) {
5556 case 0: gen_helper_neon_qneg_s8(tmp, cpu_env, tmp); break;
5557 case 1: gen_helper_neon_qneg_s16(tmp, cpu_env, tmp); break;
5558 case 2: gen_helper_neon_qneg_s32(tmp, cpu_env, tmp); break;
5559 default: return 1;
5561 break;
5562 case 16: case 19: /* VCGT #0, VCLE #0 */
5563 tmp2 = tcg_const_i32(0);
5564 switch(size) {
5565 case 0: gen_helper_neon_cgt_s8(tmp, tmp, tmp2); break;
5566 case 1: gen_helper_neon_cgt_s16(tmp, tmp, tmp2); break;
5567 case 2: gen_helper_neon_cgt_s32(tmp, tmp, tmp2); break;
5568 default: return 1;
5570 tcg_temp_free(tmp2);
5571 if (op == 19)
5572 tcg_gen_not_i32(tmp, tmp);
5573 break;
5574 case 17: case 20: /* VCGE #0, VCLT #0 */
5575 tmp2 = tcg_const_i32(0);
5576 switch(size) {
5577 case 0: gen_helper_neon_cge_s8(tmp, tmp, tmp2); break;
5578 case 1: gen_helper_neon_cge_s16(tmp, tmp, tmp2); break;
5579 case 2: gen_helper_neon_cge_s32(tmp, tmp, tmp2); break;
5580 default: return 1;
5582 tcg_temp_free(tmp2);
5583 if (op == 20)
5584 tcg_gen_not_i32(tmp, tmp);
5585 break;
5586 case 18: /* VCEQ #0 */
5587 tmp2 = tcg_const_i32(0);
5588 switch(size) {
5589 case 0: gen_helper_neon_ceq_u8(tmp, tmp, tmp2); break;
5590 case 1: gen_helper_neon_ceq_u16(tmp, tmp, tmp2); break;
5591 case 2: gen_helper_neon_ceq_u32(tmp, tmp, tmp2); break;
5592 default: return 1;
5594 tcg_temp_free(tmp2);
5595 break;
5596 case 22: /* VABS */
5597 switch(size) {
5598 case 0: gen_helper_neon_abs_s8(tmp, tmp); break;
5599 case 1: gen_helper_neon_abs_s16(tmp, tmp); break;
5600 case 2: tcg_gen_abs_i32(tmp, tmp); break;
5601 default: return 1;
5603 break;
5604 case 23: /* VNEG */
5605 if (size == 3)
5606 return 1;
5607 tmp2 = tcg_const_i32(0);
5608 gen_neon_rsb(size, tmp, tmp2);
5609 tcg_temp_free(tmp2);
5610 break;
5611 case 24: case 27: /* Float VCGT #0, Float VCLE #0 */
5612 tmp2 = tcg_const_i32(0);
5613 gen_helper_neon_cgt_f32(tmp, tmp, tmp2);
5614 tcg_temp_free(tmp2);
5615 if (op == 27)
5616 tcg_gen_not_i32(tmp, tmp);
5617 break;
5618 case 25: case 28: /* Float VCGE #0, Float VCLT #0 */
5619 tmp2 = tcg_const_i32(0);
5620 gen_helper_neon_cge_f32(tmp, tmp, tmp2);
5621 tcg_temp_free(tmp2);
5622 if (op == 28)
5623 tcg_gen_not_i32(tmp, tmp);
5624 break;
5625 case 26: /* Float VCEQ #0 */
5626 tmp2 = tcg_const_i32(0);
5627 gen_helper_neon_ceq_f32(tmp, tmp, tmp2);
5628 tcg_temp_free(tmp2);
5629 break;
5630 case 30: /* Float VABS */
5631 gen_vfp_abs(0);
5632 break;
5633 case 31: /* Float VNEG */
5634 gen_vfp_neg(0);
5635 break;
5636 case 32: /* VSWP */
5637 tmp2 = neon_load_reg(rd, pass);
5638 neon_store_reg(rm, pass, tmp2);
5639 break;
5640 case 33: /* VTRN */
5641 tmp2 = neon_load_reg(rd, pass);
5642 switch (size) {
5643 case 0: gen_neon_trn_u8(tmp, tmp2); break;
5644 case 1: gen_neon_trn_u16(tmp, tmp2); break;
5645 case 2: abort();
5646 default: return 1;
5648 neon_store_reg(rm, pass, tmp2);
5649 break;
5650 case 56: /* Integer VRECPE */
5651 gen_helper_recpe_u32(tmp, tmp, cpu_env);
5652 break;
5653 case 57: /* Integer VRSQRTE */
5654 gen_helper_rsqrte_u32(tmp, tmp, cpu_env);
5655 break;
5656 case 58: /* Float VRECPE */
5657 gen_helper_recpe_f32(cpu_F0s, cpu_F0s, cpu_env);
5658 break;
5659 case 59: /* Float VRSQRTE */
5660 gen_helper_rsqrte_f32(cpu_F0s, cpu_F0s, cpu_env);
5661 break;
5662 case 60: /* VCVT.F32.S32 */
5663 gen_vfp_sito(0);
5664 break;
5665 case 61: /* VCVT.F32.U32 */
5666 gen_vfp_uito(0);
5667 break;
5668 case 62: /* VCVT.S32.F32 */
5669 gen_vfp_tosiz(0);
5670 break;
5671 case 63: /* VCVT.U32.F32 */
5672 gen_vfp_touiz(0);
5673 break;
5674 default:
5675 /* Reserved: 21, 29, 39-56 */
5676 return 1;
5678 if (op == 30 || op == 31 || op >= 58) {
5679 tcg_gen_st_f32(cpu_F0s, cpu_env,
5680 neon_reg_offset(rd, pass));
5681 } else {
5682 neon_store_reg(rd, pass, tmp);
5685 break;
5687 } else if ((insn & (1 << 10)) == 0) {
5688 /* VTBL, VTBX. */
5689 n = ((insn >> 5) & 0x18) + 8;
5690 if (insn & (1 << 6)) {
5691 tmp = neon_load_reg(rd, 0);
5692 } else {
5693 tmp = new_tmp();
5694 tcg_gen_movi_i32(tmp, 0);
5696 tmp2 = neon_load_reg(rm, 0);
5697 tmp4 = tcg_const_i32(rn);
5698 tmp5 = tcg_const_i32(n);
5699 gen_helper_neon_tbl(tmp2, tmp2, tmp, tmp4, tmp5);
5700 dead_tmp(tmp);
5701 if (insn & (1 << 6)) {
5702 tmp = neon_load_reg(rd, 1);
5703 } else {
5704 tmp = new_tmp();
5705 tcg_gen_movi_i32(tmp, 0);
5707 tmp3 = neon_load_reg(rm, 1);
5708 gen_helper_neon_tbl(tmp3, tmp3, tmp, tmp4, tmp5);
5709 tcg_temp_free_i32(tmp5);
5710 tcg_temp_free_i32(tmp4);
5711 neon_store_reg(rd, 0, tmp2);
5712 neon_store_reg(rd, 1, tmp3);
5713 dead_tmp(tmp);
5714 } else if ((insn & 0x380) == 0) {
5715 /* VDUP */
5716 if (insn & (1 << 19)) {
5717 tmp = neon_load_reg(rm, 1);
5718 } else {
5719 tmp = neon_load_reg(rm, 0);
5721 if (insn & (1 << 16)) {
5722 gen_neon_dup_u8(tmp, ((insn >> 17) & 3) * 8);
5723 } else if (insn & (1 << 17)) {
5724 if ((insn >> 18) & 1)
5725 gen_neon_dup_high16(tmp);
5726 else
5727 gen_neon_dup_low16(tmp);
5729 for (pass = 0; pass < (q ? 4 : 2); pass++) {
5730 tmp2 = new_tmp();
5731 tcg_gen_mov_i32(tmp2, tmp);
5732 neon_store_reg(rd, pass, tmp2);
5734 dead_tmp(tmp);
5735 } else {
5736 return 1;
5740 return 0;
5743 static int disas_cp14_read(CPUState * env, DisasContext *s, uint32_t insn)
5745 int crn = (insn >> 16) & 0xf;
5746 int crm = insn & 0xf;
5747 int op1 = (insn >> 21) & 7;
5748 int op2 = (insn >> 5) & 7;
5749 int rt = (insn >> 12) & 0xf;
5750 TCGv tmp;
5752 if (arm_feature(env, ARM_FEATURE_THUMB2EE)) {
5753 if (op1 == 6 && crn == 0 && crm == 0 && op2 == 0) {
5754 /* TEECR */
5755 if (IS_USER(s))
5756 return 1;
5757 tmp = load_cpu_field(teecr);
5758 store_reg(s, rt, tmp);
5759 return 0;
5761 if (op1 == 6 && crn == 1 && crm == 0 && op2 == 0) {
5762 /* TEEHBR */
5763 if (IS_USER(s) && (env->teecr & 1))
5764 return 1;
5765 tmp = load_cpu_field(teehbr);
5766 store_reg(s, rt, tmp);
5767 return 0;
5770 fprintf(stderr, "Unknown cp14 read op1:%d crn:%d crm:%d op2:%d\n",
5771 op1, crn, crm, op2);
5772 return 1;
5775 static int disas_cp14_write(CPUState * env, DisasContext *s, uint32_t insn)
5777 int crn = (insn >> 16) & 0xf;
5778 int crm = insn & 0xf;
5779 int op1 = (insn >> 21) & 7;
5780 int op2 = (insn >> 5) & 7;
5781 int rt = (insn >> 12) & 0xf;
5782 TCGv tmp;
5784 if (arm_feature(env, ARM_FEATURE_THUMB2EE)) {
5785 if (op1 == 6 && crn == 0 && crm == 0 && op2 == 0) {
5786 /* TEECR */
5787 if (IS_USER(s))
5788 return 1;
5789 tmp = load_reg(s, rt);
5790 gen_helper_set_teecr(cpu_env, tmp);
5791 dead_tmp(tmp);
5792 return 0;
5794 if (op1 == 6 && crn == 1 && crm == 0 && op2 == 0) {
5795 /* TEEHBR */
5796 if (IS_USER(s) && (env->teecr & 1))
5797 return 1;
5798 tmp = load_reg(s, rt);
5799 store_cpu_field(tmp, teehbr);
5800 return 0;
5803 fprintf(stderr, "Unknown cp14 write op1:%d crn:%d crm:%d op2:%d\n",
5804 op1, crn, crm, op2);
5805 return 1;
5808 static int disas_coproc_insn(CPUState * env, DisasContext *s, uint32_t insn)
5810 int cpnum;
5812 cpnum = (insn >> 8) & 0xf;
5813 if (arm_feature(env, ARM_FEATURE_XSCALE)
5814 && ((env->cp15.c15_cpar ^ 0x3fff) & (1 << cpnum)))
5815 return 1;
5817 switch (cpnum) {
5818 case 0:
5819 case 1:
5820 if (arm_feature(env, ARM_FEATURE_IWMMXT)) {
5821 return disas_iwmmxt_insn(env, s, insn);
5822 } else if (arm_feature(env, ARM_FEATURE_XSCALE)) {
5823 return disas_dsp_insn(env, s, insn);
5825 return 1;
5826 case 10:
5827 case 11:
5828 return disas_vfp_insn (env, s, insn);
5829 case 14:
5830 /* Coprocessors 7-15 are architecturally reserved by ARM.
5831 Unfortunately Intel decided to ignore this. */
5832 if (arm_feature(env, ARM_FEATURE_XSCALE))
5833 goto board;
5834 if (insn & (1 << 20))
5835 return disas_cp14_read(env, s, insn);
5836 else
5837 return disas_cp14_write(env, s, insn);
5838 case 15:
5839 return disas_cp15_insn (env, s, insn);
5840 default:
5841 board:
5842 /* Unknown coprocessor. See if the board has hooked it. */
5843 return disas_cp_insn (env, s, insn);
5848 /* Store a 64-bit value to a register pair. Clobbers val. */
5849 static void gen_storeq_reg(DisasContext *s, int rlow, int rhigh, TCGv_i64 val)
5851 TCGv tmp;
5852 tmp = new_tmp();
5853 tcg_gen_trunc_i64_i32(tmp, val);
5854 store_reg(s, rlow, tmp);
5855 tmp = new_tmp();
5856 tcg_gen_shri_i64(val, val, 32);
5857 tcg_gen_trunc_i64_i32(tmp, val);
5858 store_reg(s, rhigh, tmp);
5861 /* load a 32-bit value from a register and perform a 64-bit accumulate. */
5862 static void gen_addq_lo(DisasContext *s, TCGv_i64 val, int rlow)
5864 TCGv_i64 tmp;
5865 TCGv tmp2;
5867 /* Load value and extend to 64 bits. */
5868 tmp = tcg_temp_new_i64();
5869 tmp2 = load_reg(s, rlow);
5870 tcg_gen_extu_i32_i64(tmp, tmp2);
5871 dead_tmp(tmp2);
5872 tcg_gen_add_i64(val, val, tmp);
5873 tcg_temp_free_i64(tmp);
5876 /* load and add a 64-bit value from a register pair. */
5877 static void gen_addq(DisasContext *s, TCGv_i64 val, int rlow, int rhigh)
5879 TCGv_i64 tmp;
5880 TCGv tmpl;
5881 TCGv tmph;
5883 /* Load 64-bit value rd:rn. */
5884 tmpl = load_reg(s, rlow);
5885 tmph = load_reg(s, rhigh);
5886 tmp = tcg_temp_new_i64();
5887 tcg_gen_concat_i32_i64(tmp, tmpl, tmph);
5888 dead_tmp(tmpl);
5889 dead_tmp(tmph);
5890 tcg_gen_add_i64(val, val, tmp);
5891 tcg_temp_free_i64(tmp);
5894 /* Set N and Z flags from a 64-bit value. */
5895 static void gen_logicq_cc(TCGv_i64 val)
5897 TCGv tmp = new_tmp();
5898 gen_helper_logicq_cc(tmp, val);
5899 gen_logic_CC(tmp);
5900 dead_tmp(tmp);
5903 /* Load/Store exclusive instructions are implemented by remembering
5904 the value/address loaded, and seeing if these are the same
5905    when the store is performed. This should be sufficient to implement
5906 the architecturally mandated semantics, and avoids having to monitor
5907 regular stores.
5909 In system emulation mode only one CPU will be running at once, so
5910 this sequence is effectively atomic. In user emulation mode we
5911 throw an exception and handle the atomic operation elsewhere. */
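 /* A typical guest sequence this models (illustrative only):
  *   retry: ldrex   r1, [r0]       @ records address and loaded value
  *          add     r1, r1, #1
  *          strex   r2, r1, [r0]   @ r2 = 0 only if both still match
  *          cmp     r2, #0
  *          bne     retry
  */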
5912 static void gen_load_exclusive(DisasContext *s, int rt, int rt2,
5913 TCGv addr, int size)
5915 TCGv tmp;
5917 switch (size) {
5918 case 0:
5919 tmp = gen_ld8u(addr, IS_USER(s));
5920 break;
5921 case 1:
5922 tmp = gen_ld16u(addr, IS_USER(s));
5923 break;
5924 case 2:
5925 case 3:
5926 tmp = gen_ld32(addr, IS_USER(s));
5927 break;
5928 default:
5929 abort();
5931 tcg_gen_mov_i32(cpu_exclusive_val, tmp);
5932 store_reg(s, rt, tmp);
5933 if (size == 3) {
5934 TCGv tmp2 = new_tmp();
5935 tcg_gen_addi_i32(tmp2, addr, 4);
5936 tmp = gen_ld32(tmp2, IS_USER(s));
5937 dead_tmp(tmp2);
5938 tcg_gen_mov_i32(cpu_exclusive_high, tmp);
5939 store_reg(s, rt2, tmp);
5941 tcg_gen_mov_i32(cpu_exclusive_addr, addr);
5944 static void gen_clrex(DisasContext *s)
5946 tcg_gen_movi_i32(cpu_exclusive_addr, -1);
5949 #ifdef CONFIG_USER_ONLY
5950 static void gen_store_exclusive(DisasContext *s, int rd, int rt, int rt2,
5951 TCGv addr, int size)
5953 tcg_gen_mov_i32(cpu_exclusive_test, addr);
5954 tcg_gen_movi_i32(cpu_exclusive_info,
5955 size | (rd << 4) | (rt << 8) | (rt2 << 12));
5956 gen_set_condexec(s);
5957 gen_set_pc_im(s->pc - 4);
5958 gen_exception(EXCP_STREX);
5959 s->is_jmp = DISAS_JUMP;
5961 #else
5962 static void gen_store_exclusive(DisasContext *s, int rd, int rt, int rt2,
5963 TCGv addr, int size)
5965 TCGv tmp;
5966 int done_label;
5967 int fail_label;
5969 /* if (env->exclusive_addr == addr && env->exclusive_val == [addr]) {
5970 [addr] = {Rt};
5971 {Rd} = 0;
5972 } else {
5973 {Rd} = 1;
5974 } */
5975 fail_label = gen_new_label();
5976 done_label = gen_new_label();
5977 tcg_gen_brcond_i32(TCG_COND_NE, addr, cpu_exclusive_addr, fail_label);
5978 switch (size) {
5979 case 0:
5980 tmp = gen_ld8u(addr, IS_USER(s));
5981 break;
5982 case 1:
5983 tmp = gen_ld16u(addr, IS_USER(s));
5984 break;
5985 case 2:
5986 case 3:
5987 tmp = gen_ld32(addr, IS_USER(s));
5988 break;
5989 default:
5990 abort();
5992 tcg_gen_brcond_i32(TCG_COND_NE, tmp, cpu_exclusive_val, fail_label);
5993 dead_tmp(tmp);
5994 if (size == 3) {
5995 TCGv tmp2 = new_tmp();
5996 tcg_gen_addi_i32(tmp2, addr, 4);
5997 tmp = gen_ld32(tmp2, IS_USER(s));
5998 dead_tmp(tmp2);
5999 tcg_gen_brcond_i32(TCG_COND_NE, tmp, cpu_exclusive_high, fail_label);
6000 dead_tmp(tmp);
6002 tmp = load_reg(s, rt);
6003 switch (size) {
6004 case 0:
6005 gen_st8(tmp, addr, IS_USER(s));
6006 break;
6007 case 1:
6008 gen_st16(tmp, addr, IS_USER(s));
6009 break;
6010 case 2:
6011 case 3:
6012 gen_st32(tmp, addr, IS_USER(s));
6013 break;
6014 default:
6015 abort();
6017 if (size == 3) {
6018 tcg_gen_addi_i32(addr, addr, 4);
6019 tmp = load_reg(s, rt2);
6020 gen_st32(tmp, addr, IS_USER(s));
6022 tcg_gen_movi_i32(cpu_R[rd], 0);
6023 tcg_gen_br(done_label);
6024 gen_set_label(fail_label);
6025 tcg_gen_movi_i32(cpu_R[rd], 1);
6026 gen_set_label(done_label);
6027 tcg_gen_movi_i32(cpu_exclusive_addr, -1);
6029 #endif
6031 static void disas_arm_insn(CPUState * env, DisasContext *s)
6033 unsigned int cond, insn, val, op1, i, shift, rm, rs, rn, rd, sh;
6034 TCGv tmp;
6035 TCGv tmp2;
6036 TCGv tmp3;
6037 TCGv addr;
6038 TCGv_i64 tmp64;
6040 insn = ldl_code(s->pc);
6041 s->pc += 4;
6043 /* M variants do not implement ARM mode. */
6044 if (IS_M(env))
6045 goto illegal_op;
6046 cond = insn >> 28;
6047 if (cond == 0xf){
6048 /* Unconditional instructions. */
6049 if (((insn >> 25) & 7) == 1) {
6050 /* NEON Data processing. */
6051 if (!arm_feature(env, ARM_FEATURE_NEON))
6052 goto illegal_op;
6054 if (disas_neon_data_insn(env, s, insn))
6055 goto illegal_op;
6056 return;
6058 if ((insn & 0x0f100000) == 0x04000000) {
6059 /* NEON load/store. */
6060 if (!arm_feature(env, ARM_FEATURE_NEON))
6061 goto illegal_op;
6063 if (disas_neon_ls_insn(env, s, insn))
6064 goto illegal_op;
6065 return;
6067 if ((insn & 0x0d70f000) == 0x0550f000)
6068 return; /* PLD */
6069 else if ((insn & 0x0ffffdff) == 0x01010000) {
6070 ARCH(6);
6071 /* setend */
6072 if (insn & (1 << 9)) {
6073 /* BE8 mode not implemented. */
6074 goto illegal_op;
6076 return;
6077 } else if ((insn & 0x0fffff00) == 0x057ff000) {
6078 switch ((insn >> 4) & 0xf) {
6079 case 1: /* clrex */
6080 ARCH(6K);
6081 gen_clrex(s);
6082 return;
6083 case 4: /* dsb */
6084 case 5: /* dmb */
6085 case 6: /* isb */
6086 ARCH(7);
6087 /* We don't emulate caches so these are a no-op. */
6088 return;
6089 default:
6090 goto illegal_op;
6092 } else if ((insn & 0x0e5fffe0) == 0x084d0500) {
6093 /* srs */
6094 int32_t offset;
6095 if (IS_USER(s))
6096 goto illegal_op;
6097 ARCH(6);
6098 op1 = (insn & 0x1f);
6099 if (op1 == (env->uncached_cpsr & CPSR_M)) {
6100 addr = load_reg(s, 13);
6101 } else {
6102 addr = new_tmp();
6103 tmp = tcg_const_i32(op1);
6104 gen_helper_get_r13_banked(addr, cpu_env, tmp);
6105 tcg_temp_free_i32(tmp);
6107 i = (insn >> 23) & 3;
6108 switch (i) {
6109 case 0: offset = -4; break; /* DA */
6110 case 1: offset = 0; break; /* IA */
6111 case 2: offset = -8; break; /* DB */
6112 case 3: offset = 4; break; /* IB */
6113 default: abort();
6115 if (offset)
6116 tcg_gen_addi_i32(addr, addr, offset);
6117 tmp = load_reg(s, 14);
6118 gen_st32(tmp, addr, 0);
6119 tmp = load_cpu_field(spsr);
6120 tcg_gen_addi_i32(addr, addr, 4);
6121 gen_st32(tmp, addr, 0);
6122 if (insn & (1 << 21)) {
6123 /* Base writeback. */
6124 switch (i) {
6125 case 0: offset = -8; break;
6126 case 1: offset = 4; break;
6127 case 2: offset = -4; break;
6128 case 3: offset = 0; break;
6129 default: abort();
6131 if (offset)
6132 tcg_gen_addi_i32(addr, addr, offset);
6133 if (op1 == (env->uncached_cpsr & CPSR_M)) {
6134 store_reg(s, 13, addr);
6135 } else {
6136 tmp = tcg_const_i32(op1);
6137 gen_helper_set_r13_banked(cpu_env, tmp, addr);
6138 tcg_temp_free_i32(tmp);
6139 dead_tmp(addr);
6141 } else {
6142 dead_tmp(addr);
6144 return;
6145 } else if ((insn & 0x0e50ffe0) == 0x08100a00) {
6146 /* rfe */
6147 int32_t offset;
6148 if (IS_USER(s))
6149 goto illegal_op;
6150 ARCH(6);
6151 rn = (insn >> 16) & 0xf;
6152 addr = load_reg(s, rn);
6153 i = (insn >> 23) & 3;
6154 switch (i) {
6155 case 0: offset = -4; break; /* DA */
6156 case 1: offset = 0; break; /* IA */
6157 case 2: offset = -8; break; /* DB */
6158 case 3: offset = 4; break; /* IB */
6159 default: abort();
6161 if (offset)
6162 tcg_gen_addi_i32(addr, addr, offset);
6163 /* Load PC into tmp and CPSR into tmp2. */
6164 tmp = gen_ld32(addr, 0);
6165 tcg_gen_addi_i32(addr, addr, 4);
6166 tmp2 = gen_ld32(addr, 0);
6167 if (insn & (1 << 21)) {
6168 /* Base writeback. */
6169 switch (i) {
6170 case 0: offset = -8; break;
6171 case 1: offset = 4; break;
6172 case 2: offset = -4; break;
6173 case 3: offset = 0; break;
6174 default: abort();
6176 if (offset)
6177 tcg_gen_addi_i32(addr, addr, offset);
6178 store_reg(s, rn, addr);
6179 } else {
6180 dead_tmp(addr);
6182 gen_rfe(s, tmp, tmp2);
6183 return;
6184 } else if ((insn & 0x0e000000) == 0x0a000000) {
6185 /* branch link and change to thumb (blx <offset>) */
6186 int32_t offset;
6188 val = (uint32_t)s->pc;
6189 tmp = new_tmp();
6190 tcg_gen_movi_i32(tmp, val);
6191 store_reg(s, 14, tmp);
6192 /* Sign-extend the 24-bit offset */
6193 offset = (((int32_t)insn) << 8) >> 8;
6194 /* offset * 4 + bit24 * 2 + (thumb bit) */
6195 val += (offset << 2) | ((insn >> 23) & 2) | 1;
6196 /* pipeline offset */
6197 val += 4;
6198 gen_bx_im(s, val);
6199 return;
6200 } else if ((insn & 0x0e000f00) == 0x0c000100) {
6201 if (arm_feature(env, ARM_FEATURE_IWMMXT)) {
6202 /* iWMMXt register transfer. */
6203 if (env->cp15.c15_cpar & (1 << 1))
6204 if (!disas_iwmmxt_insn(env, s, insn))
6205 return;
6207 } else if ((insn & 0x0fe00000) == 0x0c400000) {
6208 /* Coprocessor double register transfer. */
6209 } else if ((insn & 0x0f000010) == 0x0e000010) {
6210 /* Additional coprocessor register transfer. */
6211 } else if ((insn & 0x0ff10020) == 0x01000000) {
6212 uint32_t mask;
6213 uint32_t val;
6214 /* cps (privileged) */
6215 if (IS_USER(s))
6216 return;
6217 mask = val = 0;
6218 if (insn & (1 << 19)) {
6219 if (insn & (1 << 8))
6220 mask |= CPSR_A;
6221 if (insn & (1 << 7))
6222 mask |= CPSR_I;
6223 if (insn & (1 << 6))
6224 mask |= CPSR_F;
6225 if (insn & (1 << 18))
6226 val |= mask;
6228 if (insn & (1 << 17)) {
6229 mask |= CPSR_M;
6230 val |= (insn & 0x1f);
6232 if (mask) {
6233 gen_set_psr_im(s, mask, 0, val);
6235 return;
6237 goto illegal_op;
6239 if (cond != 0xe) {
6240         /* If the condition is not "always", generate a conditional jump to
6241            the next instruction. */
6242 s->condlabel = gen_new_label();
6243 gen_test_cc(cond ^ 1, s->condlabel);
6244 s->condjmp = 1;
6246 if ((insn & 0x0f900000) == 0x03000000) {
6247 if ((insn & (1 << 21)) == 0) {
6248 ARCH(6T2);
6249 rd = (insn >> 12) & 0xf;
6250 val = ((insn >> 4) & 0xf000) | (insn & 0xfff);
6251 if ((insn & (1 << 22)) == 0) {
6252 /* MOVW */
6253 tmp = new_tmp();
6254 tcg_gen_movi_i32(tmp, val);
6255 } else {
6256 /* MOVT */
6257 tmp = load_reg(s, rd);
6258 tcg_gen_ext16u_i32(tmp, tmp);
6259 tcg_gen_ori_i32(tmp, tmp, val << 16);
6261 store_reg(s, rd, tmp);
6262 } else {
6263 if (((insn >> 12) & 0xf) != 0xf)
6264 goto illegal_op;
6265 if (((insn >> 16) & 0xf) == 0) {
6266 gen_nop_hint(s, insn & 0xff);
6267 } else {
6268 /* CPSR = immediate */
6269 val = insn & 0xff;
6270 shift = ((insn >> 8) & 0xf) * 2;
6271 if (shift)
6272 val = (val >> shift) | (val << (32 - shift));
6273 i = ((insn & (1 << 22)) != 0);
6274 if (gen_set_psr_im(s, msr_mask(env, s, (insn >> 16) & 0xf, i), i, val))
6275 goto illegal_op;
6278 } else if ((insn & 0x0f900000) == 0x01000000
6279 && (insn & 0x00000090) != 0x00000090) {
6280 /* miscellaneous instructions */
6281 op1 = (insn >> 21) & 3;
6282 sh = (insn >> 4) & 0xf;
6283 rm = insn & 0xf;
6284 switch (sh) {
6285 case 0x0: /* move program status register */
6286 if (op1 & 1) {
6287 /* PSR = reg */
6288 tmp = load_reg(s, rm);
6289 i = ((op1 & 2) != 0);
6290 if (gen_set_psr(s, msr_mask(env, s, (insn >> 16) & 0xf, i), i, tmp))
6291 goto illegal_op;
6292 } else {
6293 /* reg = PSR */
6294 rd = (insn >> 12) & 0xf;
6295 if (op1 & 2) {
6296 if (IS_USER(s))
6297 goto illegal_op;
6298 tmp = load_cpu_field(spsr);
6299 } else {
6300 tmp = new_tmp();
6301 gen_helper_cpsr_read(tmp);
6303 store_reg(s, rd, tmp);
6305 break;
6306 case 0x1:
6307 if (op1 == 1) {
6308 /* branch/exchange thumb (bx). */
6309 tmp = load_reg(s, rm);
6310 gen_bx(s, tmp);
6311 } else if (op1 == 3) {
6312 /* clz */
6313 rd = (insn >> 12) & 0xf;
6314 tmp = load_reg(s, rm);
6315 gen_helper_clz(tmp, tmp);
6316 store_reg(s, rd, tmp);
6317 } else {
6318 goto illegal_op;
6320 break;
6321 case 0x2:
6322 if (op1 == 1) {
6323 ARCH(5J); /* bxj */
6324 /* Trivial implementation equivalent to bx. */
6325 tmp = load_reg(s, rm);
6326 gen_bx(s, tmp);
6327 } else {
6328 goto illegal_op;
6330 break;
6331 case 0x3:
6332 if (op1 != 1)
6333 goto illegal_op;
6335 /* branch link/exchange thumb (blx) */
6336 tmp = load_reg(s, rm);
6337 tmp2 = new_tmp();
6338 tcg_gen_movi_i32(tmp2, s->pc);
6339 store_reg(s, 14, tmp2);
6340 gen_bx(s, tmp);
6341 break;
6342 case 0x5: /* saturating add/subtract */
6343 rd = (insn >> 12) & 0xf;
6344 rn = (insn >> 16) & 0xf;
6345 tmp = load_reg(s, rm);
6346 tmp2 = load_reg(s, rn);
6347 if (op1 & 2)
6348 gen_helper_double_saturate(tmp2, tmp2);
6349 if (op1 & 1)
6350 gen_helper_sub_saturate(tmp, tmp, tmp2);
6351 else
6352 gen_helper_add_saturate(tmp, tmp, tmp2);
6353 dead_tmp(tmp2);
6354 store_reg(s, rd, tmp);
6355 break;
6356 case 7:
6357 /* SMC instruction (op1 == 3)
6358 and undefined instructions (op1 == 0 || op1 == 2)
6359 will trap */
6360 if (op1 != 1) {
6361 goto illegal_op;
6363 /* bkpt */
6364 gen_set_condexec(s);
6365 gen_set_pc_im(s->pc - 4);
6366 gen_exception(EXCP_BKPT);
6367 s->is_jmp = DISAS_JUMP;
6368 break;
6369 case 0x8: /* signed multiply */
6370 case 0xa:
6371 case 0xc:
6372 case 0xe:
6373 rs = (insn >> 8) & 0xf;
6374 rn = (insn >> 12) & 0xf;
6375 rd = (insn >> 16) & 0xf;
6376 if (op1 == 1) {
6377 /* (32 * 16) >> 16 */
6378 tmp = load_reg(s, rm);
6379 tmp2 = load_reg(s, rs);
6380 if (sh & 4)
6381 tcg_gen_sari_i32(tmp2, tmp2, 16);
6382 else
6383 gen_sxth(tmp2);
6384 tmp64 = gen_muls_i64_i32(tmp, tmp2);
6385 tcg_gen_shri_i64(tmp64, tmp64, 16);
6386 tmp = new_tmp();
6387 tcg_gen_trunc_i64_i32(tmp, tmp64);
6388 tcg_temp_free_i64(tmp64);
6389 if ((sh & 2) == 0) {
6390 tmp2 = load_reg(s, rn);
6391 gen_helper_add_setq(tmp, tmp, tmp2);
6392 dead_tmp(tmp2);
6394 store_reg(s, rd, tmp);
6395 } else {
6396 /* 16 * 16 */
6397 tmp = load_reg(s, rm);
6398 tmp2 = load_reg(s, rs);
6399 gen_mulxy(tmp, tmp2, sh & 2, sh & 4);
6400 dead_tmp(tmp2);
6401 if (op1 == 2) {
6402 tmp64 = tcg_temp_new_i64();
6403 tcg_gen_ext_i32_i64(tmp64, tmp);
6404 dead_tmp(tmp);
6405 gen_addq(s, tmp64, rn, rd);
6406 gen_storeq_reg(s, rn, rd, tmp64);
6407 tcg_temp_free_i64(tmp64);
6408 } else {
6409 if (op1 == 0) {
6410 tmp2 = load_reg(s, rn);
6411 gen_helper_add_setq(tmp, tmp, tmp2);
6412 dead_tmp(tmp2);
6414 store_reg(s, rd, tmp);
6417 break;
6418 default:
6419 goto illegal_op;
6421 } else if (((insn & 0x0e000000) == 0 &&
6422 (insn & 0x00000090) != 0x90) ||
6423 ((insn & 0x0e000000) == (1 << 25))) {
6424 int set_cc, logic_cc, shiftop;
6426 op1 = (insn >> 21) & 0xf;
6427 set_cc = (insn >> 20) & 1;
6428 logic_cc = table_logic_cc[op1] & set_cc;
6430 /* data processing instruction */
6431 if (insn & (1 << 25)) {
6432 /* immediate operand */
6433 val = insn & 0xff;
6434 shift = ((insn >> 8) & 0xf) * 2;
6435 if (shift) {
6436 val = (val >> shift) | (val << (32 - shift));
6438 tmp2 = new_tmp();
6439 tcg_gen_movi_i32(tmp2, val);
6440 if (logic_cc && shift) {
6441 gen_set_CF_bit31(tmp2);
6443 } else {
6444 /* register */
6445 rm = (insn) & 0xf;
6446 tmp2 = load_reg(s, rm);
6447 shiftop = (insn >> 5) & 3;
6448 if (!(insn & (1 << 4))) {
6449 shift = (insn >> 7) & 0x1f;
6450 gen_arm_shift_im(tmp2, shiftop, shift, logic_cc);
6451 } else {
6452 rs = (insn >> 8) & 0xf;
6453 tmp = load_reg(s, rs);
6454 gen_arm_shift_reg(tmp2, shiftop, tmp, logic_cc);
6457 if (op1 != 0x0f && op1 != 0x0d) {
6458 rn = (insn >> 16) & 0xf;
6459 tmp = load_reg(s, rn);
6460 } else {
6461 TCGV_UNUSED(tmp);
6463 rd = (insn >> 12) & 0xf;
6464 switch(op1) {
6465 case 0x00:
6466 tcg_gen_and_i32(tmp, tmp, tmp2);
6467 if (logic_cc) {
6468 gen_logic_CC(tmp);
6470 store_reg_bx(env, s, rd, tmp);
6471 break;
6472 case 0x01:
6473 tcg_gen_xor_i32(tmp, tmp, tmp2);
6474 if (logic_cc) {
6475 gen_logic_CC(tmp);
6477 store_reg_bx(env, s, rd, tmp);
6478 break;
6479 case 0x02:
6480 if (set_cc && rd == 15) {
6481 /* SUBS r15, ... is used for exception return. */
6482 if (IS_USER(s)) {
6483 goto illegal_op;
6485 gen_helper_sub_cc(tmp, tmp, tmp2);
6486 gen_exception_return(s, tmp);
6487 } else {
6488 if (set_cc) {
6489 gen_helper_sub_cc(tmp, tmp, tmp2);
6490 } else {
6491 tcg_gen_sub_i32(tmp, tmp, tmp2);
6493 store_reg_bx(env, s, rd, tmp);
6495 break;
6496 case 0x03:
6497 if (set_cc) {
6498 gen_helper_sub_cc(tmp, tmp2, tmp);
6499 } else {
6500 tcg_gen_sub_i32(tmp, tmp2, tmp);
6502 store_reg_bx(env, s, rd, tmp);
6503 break;
6504 case 0x04:
6505 if (set_cc) {
6506 gen_helper_add_cc(tmp, tmp, tmp2);
6507 } else {
6508 tcg_gen_add_i32(tmp, tmp, tmp2);
6510 store_reg_bx(env, s, rd, tmp);
6511 break;
6512 case 0x05:
6513 if (set_cc) {
6514 gen_helper_adc_cc(tmp, tmp, tmp2);
6515 } else {
6516 gen_add_carry(tmp, tmp, tmp2);
6518 store_reg_bx(env, s, rd, tmp);
6519 break;
6520 case 0x06:
6521 if (set_cc) {
6522 gen_helper_sbc_cc(tmp, tmp, tmp2);
6523 } else {
6524 gen_sub_carry(tmp, tmp, tmp2);
6526 store_reg_bx(env, s, rd, tmp);
6527 break;
6528 case 0x07:
6529 if (set_cc) {
6530 gen_helper_sbc_cc(tmp, tmp2, tmp);
6531 } else {
6532 gen_sub_carry(tmp, tmp2, tmp);
6534 store_reg_bx(env, s, rd, tmp);
6535 break;
6536 case 0x08:
6537 if (set_cc) {
6538 tcg_gen_and_i32(tmp, tmp, tmp2);
6539 gen_logic_CC(tmp);
6541 dead_tmp(tmp);
6542 break;
6543 case 0x09:
6544 if (set_cc) {
6545 tcg_gen_xor_i32(tmp, tmp, tmp2);
6546 gen_logic_CC(tmp);
6548 dead_tmp(tmp);
6549 break;
6550 case 0x0a:
6551 if (set_cc) {
6552 gen_helper_sub_cc(tmp, tmp, tmp2);
6554 dead_tmp(tmp);
6555 break;
6556 case 0x0b:
6557 if (set_cc) {
6558 gen_helper_add_cc(tmp, tmp, tmp2);
6560 dead_tmp(tmp);
6561 break;
6562 case 0x0c:
6563 tcg_gen_or_i32(tmp, tmp, tmp2);
6564 if (logic_cc) {
6565 gen_logic_CC(tmp);
6567 store_reg_bx(env, s, rd, tmp);
6568 break;
6569 case 0x0d:
6570 if (logic_cc && rd == 15) {
6571 /* MOVS r15, ... is used for exception return. */
6572 if (IS_USER(s)) {
6573 goto illegal_op;
6575 gen_exception_return(s, tmp2);
6576 } else {
6577 if (logic_cc) {
6578 gen_logic_CC(tmp2);
6580 store_reg_bx(env, s, rd, tmp2);
6582 break;
6583 case 0x0e:
6584 tcg_gen_andc_i32(tmp, tmp, tmp2);
6585 if (logic_cc) {
6586 gen_logic_CC(tmp);
6588 store_reg_bx(env, s, rd, tmp);
6589 break;
6590 default:
6591 case 0x0f:
6592 tcg_gen_not_i32(tmp2, tmp2);
6593 if (logic_cc) {
6594 gen_logic_CC(tmp2);
6596 store_reg_bx(env, s, rd, tmp2);
6597 break;
6599 if (op1 != 0x0f && op1 != 0x0d) {
6600 dead_tmp(tmp2);
6602 } else {
6603 /* other instructions */
6604 op1 = (insn >> 24) & 0xf;
6605 switch(op1) {
6606 case 0x0:
6607 case 0x1:
6608 /* multiplies, extra load/stores */
6609 sh = (insn >> 5) & 3;
6610 if (sh == 0) {
6611 if (op1 == 0x0) {
6612 rd = (insn >> 16) & 0xf;
6613 rn = (insn >> 12) & 0xf;
6614 rs = (insn >> 8) & 0xf;
6615 rm = (insn) & 0xf;
6616 op1 = (insn >> 20) & 0xf;
6617 switch (op1) {
6618 case 0: case 1: case 2: case 3: case 6:
6619 /* 32 bit mul */
6620 tmp = load_reg(s, rs);
6621 tmp2 = load_reg(s, rm);
6622 tcg_gen_mul_i32(tmp, tmp, tmp2);
6623 dead_tmp(tmp2);
6624 if (insn & (1 << 22)) {
6625 /* Subtract (mls) */
6626 ARCH(6T2);
6627 tmp2 = load_reg(s, rn);
6628 tcg_gen_sub_i32(tmp, tmp2, tmp);
6629 dead_tmp(tmp2);
6630 } else if (insn & (1 << 21)) {
6631 /* Add */
6632 tmp2 = load_reg(s, rn);
6633 tcg_gen_add_i32(tmp, tmp, tmp2);
6634 dead_tmp(tmp2);
6636 if (insn & (1 << 20))
6637 gen_logic_CC(tmp);
6638 store_reg(s, rd, tmp);
6639 break;
6640 default:
6641 /* 64 bit mul */
6642 tmp = load_reg(s, rs);
6643 tmp2 = load_reg(s, rm);
6644 if (insn & (1 << 22))
6645 tmp64 = gen_muls_i64_i32(tmp, tmp2);
6646 else
6647 tmp64 = gen_mulu_i64_i32(tmp, tmp2);
6648 if (insn & (1 << 21)) /* mult accumulate */
6649 gen_addq(s, tmp64, rn, rd);
6650 if (!(insn & (1 << 23))) { /* double accumulate */
6651 ARCH(6);
6652 gen_addq_lo(s, tmp64, rn);
6653 gen_addq_lo(s, tmp64, rd);
6655 if (insn & (1 << 20))
6656 gen_logicq_cc(tmp64);
6657 gen_storeq_reg(s, rn, rd, tmp64);
6658 tcg_temp_free_i64(tmp64);
6659 break;
6661 } else {
6662 rn = (insn >> 16) & 0xf;
6663 rd = (insn >> 12) & 0xf;
6664 if (insn & (1 << 23)) {
6665 /* load/store exclusive */
6666 op1 = (insn >> 21) & 0x3;
6667 if (op1)
6668 ARCH(6K);
6669 else
6670 ARCH(6);
6671 addr = tcg_temp_local_new_i32();
6672 load_reg_var(s, addr, rn);
6673 if (insn & (1 << 20)) {
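/* Arguments to gen_load_exclusive as used here: rt2 == 15 means no
   second destination register, and the last argument is the log2
   access size (0 = byte, 1 = halfword, 2 = word, 3 = doubleword pair). */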
6674 switch (op1) {
6675 case 0: /* ldrex */
6676 gen_load_exclusive(s, rd, 15, addr, 2);
6677 break;
6678 case 1: /* ldrexd */
6679 gen_load_exclusive(s, rd, rd + 1, addr, 3);
6680 break;
6681 case 2: /* ldrexb */
6682 gen_load_exclusive(s, rd, 15, addr, 0);
6683 break;
6684 case 3: /* ldrexh */
6685 gen_load_exclusive(s, rd, 15, addr, 1);
6686 break;
6687 default:
6688 abort();
6690 } else {
6691 rm = insn & 0xf;
6692 switch (op1) {
6693 case 0: /* strex */
6694 gen_store_exclusive(s, rd, rm, 15, addr, 2);
6695 break;
6696 case 1: /* strexd */
6697 gen_store_exclusive(s, rd, rm, rm + 1, addr, 3);
6698 break;
6699 case 2: /* strexb */
6700 gen_store_exclusive(s, rd, rm, 15, addr, 0);
6701 break;
6702 case 3: /* strexh */
6703 gen_store_exclusive(s, rd, rm, 15, addr, 1);
6704 break;
6705 default:
6706 abort();
6709 tcg_temp_free(addr);
6710 } else {
6711 /* SWP instruction */
6712 rm = (insn) & 0xf;
6714 /* ??? This is not really atomic. However, we know
6715 we never have multiple CPUs running in parallel,
6716 so it is good enough. */
6717 addr = load_reg(s, rn);
6718 tmp = load_reg(s, rm);
6719 if (insn & (1 << 22)) {
6720 tmp2 = gen_ld8u(addr, IS_USER(s));
6721 gen_st8(tmp, addr, IS_USER(s));
6722 } else {
6723 tmp2 = gen_ld32(addr, IS_USER(s));
6724 gen_st32(tmp, addr, IS_USER(s));
6726 dead_tmp(addr);
6727 store_reg(s, rd, tmp2);
6730 } else {
6731 int address_offset;
6732 int load;
6733 /* Misc load/store */
6734 rn = (insn >> 16) & 0xf;
6735 rd = (insn >> 12) & 0xf;
6736 addr = load_reg(s, rn);
6737 if (insn & (1 << 24))
6738 gen_add_datah_offset(s, insn, 0, addr);
6739 address_offset = 0;
6740 if (insn & (1 << 20)) {
6741 /* load */
6742 switch(sh) {
6743 case 1:
6744 tmp = gen_ld16u(addr, IS_USER(s));
6745 break;
6746 case 2:
6747 tmp = gen_ld8s(addr, IS_USER(s));
6748 break;
6749 default:
6750 case 3:
6751 tmp = gen_ld16s(addr, IS_USER(s));
6752 break;
6754 load = 1;
6755 } else if (sh & 2) {
6756 /* doubleword */
6757 if (sh & 1) {
6758 /* store */
6759 tmp = load_reg(s, rd);
6760 gen_st32(tmp, addr, IS_USER(s));
6761 tcg_gen_addi_i32(addr, addr, 4);
6762 tmp = load_reg(s, rd + 1);
6763 gen_st32(tmp, addr, IS_USER(s));
6764 load = 0;
6765 } else {
6766 /* load */
6767 tmp = gen_ld32(addr, IS_USER(s));
6768 store_reg(s, rd, tmp);
6769 tcg_gen_addi_i32(addr, addr, 4);
6770 tmp = gen_ld32(addr, IS_USER(s));
6771 rd++;
6772 load = 1;
6774 address_offset = -4;
6775 } else {
6776 /* store */
6777 tmp = load_reg(s, rd);
6778 gen_st16(tmp, addr, IS_USER(s));
6779 load = 0;
6781 /* Perform base writeback before storing the loaded value, to
6782 ensure correct behavior with overlapping index registers.
6783 ldrd with base writeback is undefined if the
6784 destination and index registers overlap. */
6785 if (!(insn & (1 << 24))) {
6786 gen_add_datah_offset(s, insn, address_offset, addr);
6787 store_reg(s, rn, addr);
6788 } else if (insn & (1 << 21)) {
6789 if (address_offset)
6790 tcg_gen_addi_i32(addr, addr, address_offset);
6791 store_reg(s, rn, addr);
6792 } else {
6793 dead_tmp(addr);
6795 if (load) {
6796 /* Complete the load. */
6797 store_reg(s, rd, tmp);
6800 break;
6801 case 0x4:
6802 case 0x5:
6803 goto do_ldst;
6804 case 0x6:
6805 case 0x7:
6806 if (insn & (1 << 4)) {
6807 ARCH(6);
6808 /* ARMv6 Media instructions. */
6809 rm = insn & 0xf;
6810 rn = (insn >> 16) & 0xf;
6811 rd = (insn >> 12) & 0xf;
6812 rs = (insn >> 8) & 0xf;
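/* Bits [24:23] pick the media instruction group: 0 parallel
   add/subtract, 1 pack/saturate/extend/reverse, 2 signed multiplies
   (type 3), 3 USAD8 and the bitfield operations. */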
6813 switch ((insn >> 23) & 3) {
6814 case 0: /* Parallel add/subtract. */
6815 op1 = (insn >> 20) & 7;
6816 tmp = load_reg(s, rn);
6817 tmp2 = load_reg(s, rm);
6818 sh = (insn >> 5) & 7;
6819 if ((op1 & 3) == 0 || sh == 5 || sh == 6)
6820 goto illegal_op;
6821 gen_arm_parallel_addsub(op1, sh, tmp, tmp2);
6822 dead_tmp(tmp2);
6823 store_reg(s, rd, tmp);
6824 break;
6825 case 1:
6826 if ((insn & 0x00700020) == 0) {
6827 /* Halfword pack. */
6828 tmp = load_reg(s, rn);
6829 tmp2 = load_reg(s, rm);
6830 shift = (insn >> 7) & 0x1f;
6831 if (insn & (1 << 6)) {
6832 /* pkhtb */
6833 if (shift == 0)
6834 shift = 31;
6835 tcg_gen_sari_i32(tmp2, tmp2, shift);
6836 tcg_gen_andi_i32(tmp, tmp, 0xffff0000);
6837 tcg_gen_ext16u_i32(tmp2, tmp2);
6838 } else {
6839 /* pkhbt */
6840 if (shift)
6841 tcg_gen_shli_i32(tmp2, tmp2, shift);
6842 tcg_gen_ext16u_i32(tmp, tmp);
6843 tcg_gen_andi_i32(tmp2, tmp2, 0xffff0000);
6845 tcg_gen_or_i32(tmp, tmp, tmp2);
6846 dead_tmp(tmp2);
6847 store_reg(s, rd, tmp);
6848 } else if ((insn & 0x00200020) == 0x00200000) {
6849 /* [us]sat */
6850 tmp = load_reg(s, rm);
6851 shift = (insn >> 7) & 0x1f;
6852 if (insn & (1 << 6)) {
6853 if (shift == 0)
6854 shift = 31;
6855 tcg_gen_sari_i32(tmp, tmp, shift);
6856 } else {
6857 tcg_gen_shli_i32(tmp, tmp, shift);
6859 sh = (insn >> 16) & 0x1f;
6860 if (sh != 0) {
6861 tmp2 = tcg_const_i32(sh);
6862 if (insn & (1 << 22))
6863 gen_helper_usat(tmp, tmp, tmp2);
6864 else
6865 gen_helper_ssat(tmp, tmp, tmp2);
6866 tcg_temp_free_i32(tmp2);
6868 store_reg(s, rd, tmp);
6869 } else if ((insn & 0x00300fe0) == 0x00200f20) {
6870 /* [us]sat16 */
6871 tmp = load_reg(s, rm);
6872 sh = (insn >> 16) & 0x1f;
6873 if (sh != 0) {
6874 tmp2 = tcg_const_i32(sh);
6875 if (insn & (1 << 22))
6876 gen_helper_usat16(tmp, tmp, tmp2);
6877 else
6878 gen_helper_ssat16(tmp, tmp, tmp2);
6879 tcg_temp_free_i32(tmp2);
6881 store_reg(s, rd, tmp);
6882 } else if ((insn & 0x00700fe0) == 0x00000fa0) {
6883 /* Select bytes. */
6884 tmp = load_reg(s, rn);
6885 tmp2 = load_reg(s, rm);
6886 tmp3 = new_tmp();
6887 tcg_gen_ld_i32(tmp3, cpu_env, offsetof(CPUState, GE));
6888 gen_helper_sel_flags(tmp, tmp3, tmp, tmp2);
6889 dead_tmp(tmp3);
6890 dead_tmp(tmp2);
6891 store_reg(s, rd, tmp);
6892 } else if ((insn & 0x000003e0) == 0x00000060) {
6893 tmp = load_reg(s, rm);
6894 shift = (insn >> 10) & 3;
6895 /* ??? In many cases it's not necessary to do a
6896 rotate, a shift is sufficient. */
6897 if (shift != 0)
6898 tcg_gen_rotri_i32(tmp, tmp, shift * 8);
6899 op1 = (insn >> 20) & 7;
6900 switch (op1) {
6901 case 0: gen_sxtb16(tmp); break;
6902 case 2: gen_sxtb(tmp); break;
6903 case 3: gen_sxth(tmp); break;
6904 case 4: gen_uxtb16(tmp); break;
6905 case 6: gen_uxtb(tmp); break;
6906 case 7: gen_uxth(tmp); break;
6907 default: goto illegal_op;
6909 if (rn != 15) {
6910 tmp2 = load_reg(s, rn);
6911 if ((op1 & 3) == 0) {
6912 gen_add16(tmp, tmp2);
6913 } else {
6914 tcg_gen_add_i32(tmp, tmp, tmp2);
6915 dead_tmp(tmp2);
6918 store_reg(s, rd, tmp);
6919 } else if ((insn & 0x003f0f60) == 0x003f0f20) {
6920 /* rev */
6921 tmp = load_reg(s, rm);
6922 if (insn & (1 << 22)) {
6923 if (insn & (1 << 7)) {
6924 gen_revsh(tmp);
6925 } else {
6926 ARCH(6T2);
6927 gen_helper_rbit(tmp, tmp);
6929 } else {
6930 if (insn & (1 << 7))
6931 gen_rev16(tmp);
6932 else
6933 tcg_gen_bswap32_i32(tmp, tmp);
6935 store_reg(s, rd, tmp);
6936 } else {
6937 goto illegal_op;
6939 break;
6940 case 2: /* Multiplies (Type 3). */
6941 tmp = load_reg(s, rm);
6942 tmp2 = load_reg(s, rs);
6943 if (insn & (1 << 20)) {
6944 /* Signed multiply most significant [accumulate]. */
6945 tmp64 = gen_muls_i64_i32(tmp, tmp2);
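/* Bit 5 selects the rounding variant (SMMULR/SMMLAR/SMMLSR): adding
   0x80000000 before taking the high 32 bits rounds the result. */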
6946 if (insn & (1 << 5))
6947 tcg_gen_addi_i64(tmp64, tmp64, 0x80000000u);
6948 tcg_gen_shri_i64(tmp64, tmp64, 32);
6949 tmp = new_tmp();
6950 tcg_gen_trunc_i64_i32(tmp, tmp64);
6951 tcg_temp_free_i64(tmp64);
6952 if (rd != 15) {
6953 tmp2 = load_reg(s, rd);
6954 if (insn & (1 << 6)) {
6955 tcg_gen_sub_i32(tmp, tmp, tmp2);
6956 } else {
6957 tcg_gen_add_i32(tmp, tmp, tmp2);
6959 dead_tmp(tmp2);
6961 store_reg(s, rn, tmp);
6962 } else {
6963 if (insn & (1 << 5))
6964 gen_swap_half(tmp2);
6965 gen_smul_dual(tmp, tmp2);
6966 /* This addition cannot overflow. */
6967 if (insn & (1 << 6)) {
6968 tcg_gen_sub_i32(tmp, tmp, tmp2);
6969 } else {
6970 tcg_gen_add_i32(tmp, tmp, tmp2);
6972 dead_tmp(tmp2);
6973 if (insn & (1 << 22)) {
6974 /* smlald, smlsld */
6975 tmp64 = tcg_temp_new_i64();
6976 tcg_gen_ext_i32_i64(tmp64, tmp);
6977 dead_tmp(tmp);
6978 gen_addq(s, tmp64, rd, rn);
6979 gen_storeq_reg(s, rd, rn, tmp64);
6980 tcg_temp_free_i64(tmp64);
6981 } else {
6982 /* smuad, smusd, smlad, smlsd */
6983 if (rd != 15)
6985 tmp2 = load_reg(s, rd);
6986 gen_helper_add_setq(tmp, tmp, tmp2);
6987 dead_tmp(tmp2);
6989 store_reg(s, rn, tmp);
6992 break;
6993 case 3:
6994 op1 = ((insn >> 17) & 0x38) | ((insn >> 5) & 7);
6995 switch (op1) {
6996 case 0: /* Unsigned sum of absolute differences. */
6997 ARCH(6);
6998 tmp = load_reg(s, rm);
6999 tmp2 = load_reg(s, rs);
7000 gen_helper_usad8(tmp, tmp, tmp2);
7001 dead_tmp(tmp2);
7002 if (rd != 15) {
7003 tmp2 = load_reg(s, rd);
7004 tcg_gen_add_i32(tmp, tmp, tmp2);
7005 dead_tmp(tmp2);
7007 store_reg(s, rn, tmp);
7008 break;
7009 case 0x20: case 0x24: case 0x28: case 0x2c:
7010 /* Bitfield insert/clear. */
7011 ARCH(6T2);
7012 shift = (insn >> 7) & 0x1f;
7013 i = (insn >> 16) & 0x1f;
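/* shift holds lsb (insn[11:7]) and i holds msb (insn[20:16]);
   the bitfield width is msb - lsb + 1. */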
7014 i = i + 1 - shift;
7015 if (rm == 15) {
7016 tmp = new_tmp();
7017 tcg_gen_movi_i32(tmp, 0);
7018 } else {
7019 tmp = load_reg(s, rm);
7021 if (i != 32) {
7022 tmp2 = load_reg(s, rd);
7023 gen_bfi(tmp, tmp2, tmp, shift, (1u << i) - 1);
7024 dead_tmp(tmp2);
7026 store_reg(s, rd, tmp);
7027 break;
7028 case 0x12: case 0x16: case 0x1a: case 0x1e: /* sbfx */
7029 case 0x32: case 0x36: case 0x3a: case 0x3e: /* ubfx */
7030 ARCH(6T2);
7031 tmp = load_reg(s, rm);
7032 shift = (insn >> 7) & 0x1f;
7033 i = ((insn >> 16) & 0x1f) + 1;
7034 if (shift + i > 32)
7035 goto illegal_op;
7036 if (i < 32) {
7037 if (op1 & 0x20) {
7038 gen_ubfx(tmp, shift, (1u << i) - 1);
7039 } else {
7040 gen_sbfx(tmp, shift, i);
7043 store_reg(s, rd, tmp);
7044 break;
7045 default:
7046 goto illegal_op;
7048 break;
7050 break;
7052 do_ldst:
7053 /* Check for undefined extension instructions
7054 * per the ARM Bible, i.e.:
7055 * xxxx 0111 1111 xxxx xxxx xxxx 1111 xxxx
7057 sh = (0xf << 20) | (0xf << 4);
7058 if (op1 == 0x7 && ((insn & sh) == sh))
7060 goto illegal_op;
7062 /* load/store byte/word */
7063 rn = (insn >> 16) & 0xf;
7064 rd = (insn >> 12) & 0xf;
7065 tmp2 = load_reg(s, rn);
7066 i = (IS_USER(s) || (insn & 0x01200000) == 0x00200000);
7067 if (insn & (1 << 24))
7068 gen_add_data_offset(s, insn, tmp2);
7069 if (insn & (1 << 20)) {
7070 /* load */
7071 if (insn & (1 << 22)) {
7072 tmp = gen_ld8u(tmp2, i);
7073 } else {
7074 tmp = gen_ld32(tmp2, i);
7076 } else {
7077 /* store */
7078 tmp = load_reg(s, rd);
7079 if (insn & (1 << 22))
7080 gen_st8(tmp, tmp2, i);
7081 else
7082 gen_st32(tmp, tmp2, i);
7084 if (!(insn & (1 << 24))) {
7085 gen_add_data_offset(s, insn, tmp2);
7086 store_reg(s, rn, tmp2);
7087 } else if (insn & (1 << 21)) {
7088 store_reg(s, rn, tmp2);
7089 } else {
7090 dead_tmp(tmp2);
7092 if (insn & (1 << 20)) {
7093 /* Complete the load. */
7094 if (rd == 15)
7095 gen_bx(s, tmp);
7096 else
7097 store_reg(s, rd, tmp);
7099 break;
7100 case 0x08:
7101 case 0x09:
7103 int j, n, user, loaded_base;
7104 TCGv loaded_var;
7105 /* load/store multiple words */
7106 /* XXX: store correct base if write back */
7107 user = 0;
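/* Bit 22 (the S bit) with the PC absent from the register list selects
   the user-bank registers; with the PC present it is the
   exception-return form, which also restores CPSR from SPSR after the
   transfer (see below). */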
7108 if (insn & (1 << 22)) {
7109 if (IS_USER(s))
7110 goto illegal_op; /* only usable in supervisor mode */
7112 if ((insn & (1 << 15)) == 0)
7113 user = 1;
7115 rn = (insn >> 16) & 0xf;
7116 addr = load_reg(s, rn);
7118 /* compute total size */
7119 loaded_base = 0;
7120 TCGV_UNUSED(loaded_var);
7121 n = 0;
7122 for(i=0;i<16;i++) {
7123 if (insn & (1 << i))
7124 n++;
7126 /* XXX: test invalid n == 0 case ? */
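/* Adjust the base so the loop below always walks upwards, storing the
   lowest-numbered register at the lowest address as LDM/STM require. */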
7127 if (insn & (1 << 23)) {
7128 if (insn & (1 << 24)) {
7129 /* pre increment */
7130 tcg_gen_addi_i32(addr, addr, 4);
7131 } else {
7132 /* post increment */
7134 } else {
7135 if (insn & (1 << 24)) {
7136 /* pre decrement */
7137 tcg_gen_addi_i32(addr, addr, -(n * 4));
7138 } else {
7139 /* post decrement */
7140 if (n != 1)
7141 tcg_gen_addi_i32(addr, addr, -((n - 1) * 4));
7144 j = 0;
7145 for(i=0;i<16;i++) {
7146 if (insn & (1 << i)) {
7147 if (insn & (1 << 20)) {
7148 /* load */
7149 tmp = gen_ld32(addr, IS_USER(s));
7150 if (i == 15) {
7151 gen_bx(s, tmp);
7152 } else if (user) {
7153 tmp2 = tcg_const_i32(i);
7154 gen_helper_set_user_reg(tmp2, tmp);
7155 tcg_temp_free_i32(tmp2);
7156 dead_tmp(tmp);
7157 } else if (i == rn) {
7158 loaded_var = tmp;
7159 loaded_base = 1;
7160 } else {
7161 store_reg(s, i, tmp);
7163 } else {
7164 /* store */
7165 if (i == 15) {
7166 /* special case: r15 = PC + 8 */
7167 val = (long)s->pc + 4;
7168 tmp = new_tmp();
7169 tcg_gen_movi_i32(tmp, val);
7170 } else if (user) {
7171 tmp = new_tmp();
7172 tmp2 = tcg_const_i32(i);
7173 gen_helper_get_user_reg(tmp, tmp2);
7174 tcg_temp_free_i32(tmp2);
7175 } else {
7176 tmp = load_reg(s, i);
7178 gen_st32(tmp, addr, IS_USER(s));
7180 j++;
7181 /* no need to add after the last transfer */
7182 if (j != n)
7183 tcg_gen_addi_i32(addr, addr, 4);
7186 if (insn & (1 << 21)) {
7187 /* write back */
7188 if (insn & (1 << 23)) {
7189 if (insn & (1 << 24)) {
7190 /* pre increment */
7191 } else {
7192 /* post increment */
7193 tcg_gen_addi_i32(addr, addr, 4);
7195 } else {
7196 if (insn & (1 << 24)) {
7197 /* pre decrement */
7198 if (n != 1)
7199 tcg_gen_addi_i32(addr, addr, -((n - 1) * 4));
7200 } else {
7201 /* post decrement */
7202 tcg_gen_addi_i32(addr, addr, -(n * 4));
7205 store_reg(s, rn, addr);
7206 } else {
7207 dead_tmp(addr);
7209 if (loaded_base) {
7210 store_reg(s, rn, loaded_var);
7212 if ((insn & (1 << 22)) && !user) {
7213 /* Restore CPSR from SPSR. */
7214 tmp = load_cpu_field(spsr);
7215 gen_set_cpsr(tmp, 0xffffffff);
7216 dead_tmp(tmp);
7217 s->is_jmp = DISAS_UPDATE;
7220 break;
7221 case 0xa:
7222 case 0xb:
7224 int32_t offset;
7226 /* branch (and link) */
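/* s->pc already points past this instruction, so storing it gives the
   correct link value; the 24-bit immediate is sign-extended, scaled by
   4, and the extra +4 below accounts for the PC reading as the
   instruction address plus 8. */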
7227 val = (int32_t)s->pc;
7228 if (insn & (1 << 24)) {
7229 tmp = new_tmp();
7230 tcg_gen_movi_i32(tmp, val);
7231 store_reg(s, 14, tmp);
7233 offset = (((int32_t)insn << 8) >> 8);
7234 val += (offset << 2) + 4;
7235 gen_jmp(s, val);
7237 break;
7238 case 0xc:
7239 case 0xd:
7240 case 0xe:
7241 /* Coprocessor. */
7242 if (disas_coproc_insn(env, s, insn))
7243 goto illegal_op;
7244 break;
7245 case 0xf:
7246 /* swi */
7247 gen_set_pc_im(s->pc);
7248 s->is_jmp = DISAS_SWI;
7249 break;
7250 default:
7251 illegal_op:
7252 gen_set_condexec(s);
7253 gen_set_pc_im(s->pc - 4);
7254 gen_exception(EXCP_UDEF);
7255 s->is_jmp = DISAS_JUMP;
7256 break;
7261 /* Return true if this is a Thumb-2 logical op. */
7262 static int
7263 thumb2_logic_op(int op)
7265 return (op < 8);
7268 /* Generate code for a Thumb-2 data processing operation. If CONDS is nonzero
7269 then set condition code flags based on the result of the operation.
7270 If SHIFTER_OUT is nonzero then set the carry flag for logical operations
7271 to the high bit of T1.
7272 Returns zero if the opcode is valid. */
7274 static int
7275 gen_thumb2_data_op(DisasContext *s, int op, int conds, uint32_t shifter_out, TCGv t0, TCGv t1)
7277 int logic_cc;
7279 logic_cc = 0;
7280 switch (op) {
7281 case 0: /* and */
7282 tcg_gen_and_i32(t0, t0, t1);
7283 logic_cc = conds;
7284 break;
7285 case 1: /* bic */
7286 tcg_gen_andc_i32(t0, t0, t1);
7287 logic_cc = conds;
7288 break;
7289 case 2: /* orr */
7290 tcg_gen_or_i32(t0, t0, t1);
7291 logic_cc = conds;
7292 break;
7293 case 3: /* orn */
7294 tcg_gen_not_i32(t1, t1);
7295 tcg_gen_or_i32(t0, t0, t1);
7296 logic_cc = conds;
7297 break;
7298 case 4: /* eor */
7299 tcg_gen_xor_i32(t0, t0, t1);
7300 logic_cc = conds;
7301 break;
7302 case 8: /* add */
7303 if (conds)
7304 gen_helper_add_cc(t0, t0, t1);
7305 else
7306 tcg_gen_add_i32(t0, t0, t1);
7307 break;
7308 case 10: /* adc */
7309 if (conds)
7310 gen_helper_adc_cc(t0, t0, t1);
7311 else
7312 gen_adc(t0, t1);
7313 break;
7314 case 11: /* sbc */
7315 if (conds)
7316 gen_helper_sbc_cc(t0, t0, t1);
7317 else
7318 gen_sub_carry(t0, t0, t1);
7319 break;
7320 case 13: /* sub */
7321 if (conds)
7322 gen_helper_sub_cc(t0, t0, t1);
7323 else
7324 tcg_gen_sub_i32(t0, t0, t1);
7325 break;
7326 case 14: /* rsb */
7327 if (conds)
7328 gen_helper_sub_cc(t0, t1, t0);
7329 else
7330 tcg_gen_sub_i32(t0, t1, t0);
7331 break;
7332 default: /* 5, 6, 7, 9, 12, 15. */
7333 return 1;
7335 if (logic_cc) {
7336 gen_logic_CC(t0);
7337 if (shifter_out)
7338 gen_set_CF_bit31(t1);
7340 return 0;
7343 /* Translate a 32-bit thumb instruction. Returns nonzero if the instruction
7344 is not legal. */
7345 static int disas_thumb2_insn(CPUState *env, DisasContext *s, uint16_t insn_hw1)
7347 uint32_t insn, imm, shift, offset;
7348 uint32_t rd, rn, rm, rs;
7349 TCGv tmp;
7350 TCGv tmp2;
7351 TCGv tmp3;
7352 TCGv addr;
7353 TCGv_i64 tmp64;
7354 int op;
7355 int shiftop;
7356 int conds;
7357 int logic_cc;
7359 if (!(arm_feature(env, ARM_FEATURE_THUMB2)
7360 || arm_feature (env, ARM_FEATURE_M))) {
7361 /* Thumb-1 cores may need to treat bl and blx as a pair of
7362 16-bit instructions to get correct prefetch abort behavior. */
7363 insn = insn_hw1;
7364 if ((insn & (1 << 12)) == 0) {
7365 /* Second half of blx. */
7366 offset = ((insn & 0x7ff) << 1);
7367 tmp = load_reg(s, 14);
7368 tcg_gen_addi_i32(tmp, tmp, offset);
7369 tcg_gen_andi_i32(tmp, tmp, 0xfffffffc);
7371 tmp2 = new_tmp();
7372 tcg_gen_movi_i32(tmp2, s->pc | 1);
7373 store_reg(s, 14, tmp2);
7374 gen_bx(s, tmp);
7375 return 0;
7377 if (insn & (1 << 11)) {
7378 /* Second half of bl. */
7379 offset = ((insn & 0x7ff) << 1) | 1;
7380 tmp = load_reg(s, 14);
7381 tcg_gen_addi_i32(tmp, tmp, offset);
7383 tmp2 = new_tmp();
7384 tcg_gen_movi_i32(tmp2, s->pc | 1);
7385 store_reg(s, 14, tmp2);
7386 gen_bx(s, tmp);
7387 return 0;
7389 if ((s->pc & ~TARGET_PAGE_MASK) == 0) {
7390 /* Instruction spans a page boundary. Implement it as two
7391 16-bit instructions in case the second half causes a
7392 prefetch abort. */
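/* First half of bl/blx: sign-extend hw1[10:0] into offset bits [22:12]
   and park PC + offset in LR; the 16-bit second half (handled above)
   adds its own 11-bit offset and performs the branch. */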
7393 offset = ((int32_t)insn << 21) >> 9;
7394 tcg_gen_movi_i32(cpu_R[14], s->pc + 2 + offset);
7395 return 0;
7397 /* Fall through to 32-bit decode. */
7400 insn = lduw_code(s->pc);
7401 s->pc += 2;
7402 insn |= (uint32_t)insn_hw1 << 16;
7404 if ((insn & 0xf800e800) != 0xf000e800) {
7405 ARCH(6T2);
7408 rn = (insn >> 16) & 0xf;
7409 rs = (insn >> 12) & 0xf;
7410 rd = (insn >> 8) & 0xf;
7411 rm = insn & 0xf;
7412 switch ((insn >> 25) & 0xf) {
7413 case 0: case 1: case 2: case 3:
7414 /* 16-bit instructions. Should never happen. */
7415 abort();
7416 case 4:
7417 if (insn & (1 << 22)) {
7418 /* Other load/store, table branch. */
7419 if (insn & 0x01200000) {
7420 /* Load/store doubleword. */
7421 if (rn == 15) {
7422 addr = new_tmp();
7423 tcg_gen_movi_i32(addr, s->pc & ~3);
7424 } else {
7425 addr = load_reg(s, rn);
7427 offset = (insn & 0xff) * 4;
7428 if ((insn & (1 << 23)) == 0)
7429 offset = -offset;
7430 if (insn & (1 << 24)) {
7431 tcg_gen_addi_i32(addr, addr, offset);
7432 offset = 0;
7434 if (insn & (1 << 20)) {
7435 /* ldrd */
7436 tmp = gen_ld32(addr, IS_USER(s));
7437 store_reg(s, rs, tmp);
7438 tcg_gen_addi_i32(addr, addr, 4);
7439 tmp = gen_ld32(addr, IS_USER(s));
7440 store_reg(s, rd, tmp);
7441 } else {
7442 /* strd */
7443 tmp = load_reg(s, rs);
7444 gen_st32(tmp, addr, IS_USER(s));
7445 tcg_gen_addi_i32(addr, addr, 4);
7446 tmp = load_reg(s, rd);
7447 gen_st32(tmp, addr, IS_USER(s));
7449 if (insn & (1 << 21)) {
7450 /* Base writeback. */
7451 if (rn == 15)
7452 goto illegal_op;
7453 tcg_gen_addi_i32(addr, addr, offset - 4);
7454 store_reg(s, rn, addr);
7455 } else {
7456 dead_tmp(addr);
7458 } else if ((insn & (1 << 23)) == 0) {
7459 /* Load/store exclusive word. */
7460 addr = tcg_temp_local_new();
7461 load_reg_var(s, addr, rn);
7462 tcg_gen_addi_i32(addr, addr, (insn & 0xff) << 2);
7463 if (insn & (1 << 20)) {
7464 gen_load_exclusive(s, rs, 15, addr, 2);
7465 } else {
7466 gen_store_exclusive(s, rd, rs, 15, addr, 2);
7468 tcg_temp_free(addr);
7469 } else if ((insn & (1 << 6)) == 0) {
7470 /* Table Branch. */
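/* TBB/TBH: load an unsigned byte (tbb) or halfword (tbh, index scaled
   by 2) from [Rn + Rm]; the value is a forward branch offset in
   halfwords, hence the shift left by one before adding it to the PC. */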
7471 if (rn == 15) {
7472 addr = new_tmp();
7473 tcg_gen_movi_i32(addr, s->pc);
7474 } else {
7475 addr = load_reg(s, rn);
7477 tmp = load_reg(s, rm);
7478 tcg_gen_add_i32(addr, addr, tmp);
7479 if (insn & (1 << 4)) {
7480 /* tbh */
7481 tcg_gen_add_i32(addr, addr, tmp);
7482 dead_tmp(tmp);
7483 tmp = gen_ld16u(addr, IS_USER(s));
7484 } else { /* tbb */
7485 dead_tmp(tmp);
7486 tmp = gen_ld8u(addr, IS_USER(s));
7488 dead_tmp(addr);
7489 tcg_gen_shli_i32(tmp, tmp, 1);
7490 tcg_gen_addi_i32(tmp, tmp, s->pc);
7491 store_reg(s, 15, tmp);
7492 } else {
7493 /* Load/store exclusive byte/halfword/doubleword. */
7494 ARCH(7);
7495 op = (insn >> 4) & 0x3;
7496 if (op == 2) {
7497 goto illegal_op;
7499 addr = tcg_temp_local_new();
7500 load_reg_var(s, addr, rn);
7501 if (insn & (1 << 20)) {
7502 gen_load_exclusive(s, rs, rd, addr, op);
7503 } else {
7504 gen_store_exclusive(s, rm, rs, rd, addr, op);
7506 tcg_temp_free(addr);
7508 } else {
7509 /* Load/store multiple, RFE, SRS. */
7510 if (((insn >> 23) & 1) == ((insn >> 24) & 1)) {
7511 /* Not available in user mode. */
7512 if (IS_USER(s))
7513 goto illegal_op;
7514 if (insn & (1 << 20)) {
7515 /* rfe */
7516 addr = load_reg(s, rn);
7517 if ((insn & (1 << 24)) == 0)
7518 tcg_gen_addi_i32(addr, addr, -8);
7519 /* Load PC into tmp and CPSR into tmp2. */
7520 tmp = gen_ld32(addr, 0);
7521 tcg_gen_addi_i32(addr, addr, 4);
7522 tmp2 = gen_ld32(addr, 0);
7523 if (insn & (1 << 21)) {
7524 /* Base writeback. */
7525 if (insn & (1 << 24)) {
7526 tcg_gen_addi_i32(addr, addr, 4);
7527 } else {
7528 tcg_gen_addi_i32(addr, addr, -4);
7530 store_reg(s, rn, addr);
7531 } else {
7532 dead_tmp(addr);
7534 gen_rfe(s, tmp, tmp2);
7535 } else {
7536 /* srs */
7537 op = (insn & 0x1f);
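/* op is the target processor mode: if it matches the current mode the
   ordinary SP is used, otherwise the banked r13 for that mode is
   accessed through the helpers. */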
7538 if (op == (env->uncached_cpsr & CPSR_M)) {
7539 addr = load_reg(s, 13);
7540 } else {
7541 addr = new_tmp();
7542 tmp = tcg_const_i32(op);
7543 gen_helper_get_r13_banked(addr, cpu_env, tmp);
7544 tcg_temp_free_i32(tmp);
7546 if ((insn & (1 << 24)) == 0) {
7547 tcg_gen_addi_i32(addr, addr, -8);
7549 tmp = load_reg(s, 14);
7550 gen_st32(tmp, addr, 0);
7551 tcg_gen_addi_i32(addr, addr, 4);
7552 tmp = new_tmp();
7553 gen_helper_cpsr_read(tmp);
7554 gen_st32(tmp, addr, 0);
7555 if (insn & (1 << 21)) {
7556 if ((insn & (1 << 24)) == 0) {
7557 tcg_gen_addi_i32(addr, addr, -4);
7558 } else {
7559 tcg_gen_addi_i32(addr, addr, 4);
7561 if (op == (env->uncached_cpsr & CPSR_M)) {
7562 store_reg(s, 13, addr);
7563 } else {
7564 tmp = tcg_const_i32(op);
7565 gen_helper_set_r13_banked(cpu_env, tmp, addr);
7566 tcg_temp_free_i32(tmp);
7568 } else {
7569 dead_tmp(addr);
7572 } else {
7573 int i;
7574 /* Load/store multiple. */
7575 addr = load_reg(s, rn);
7576 offset = 0;
7577 for (i = 0; i < 16; i++) {
7578 if (insn & (1 << i))
7579 offset += 4;
7581 if (insn & (1 << 24)) {
7582 tcg_gen_addi_i32(addr, addr, -offset);
7585 for (i = 0; i < 16; i++) {
7586 if ((insn & (1 << i)) == 0)
7587 continue;
7588 if (insn & (1 << 20)) {
7589 /* Load. */
7590 tmp = gen_ld32(addr, IS_USER(s));
7591 if (i == 15) {
7592 gen_bx(s, tmp);
7593 } else {
7594 store_reg(s, i, tmp);
7596 } else {
7597 /* Store. */
7598 tmp = load_reg(s, i);
7599 gen_st32(tmp, addr, IS_USER(s));
7601 tcg_gen_addi_i32(addr, addr, 4);
7603 if (insn & (1 << 21)) {
7604 /* Base register writeback. */
7605 if (insn & (1 << 24)) {
7606 tcg_gen_addi_i32(addr, addr, -offset);
7608 /* Fault if writeback register is in register list. */
7609 if (insn & (1 << rn))
7610 goto illegal_op;
7611 store_reg(s, rn, addr);
7612 } else {
7613 dead_tmp(addr);
7617 break;
7618 case 5:
7620 op = (insn >> 21) & 0xf;
7621 if (op == 6) {
7622 /* Halfword pack. */
7623 tmp = load_reg(s, rn);
7624 tmp2 = load_reg(s, rm);
7625 shift = ((insn >> 10) & 0x1c) | ((insn >> 6) & 0x3);
7626 if (insn & (1 << 5)) {
7627 /* pkhtb */
7628 if (shift == 0)
7629 shift = 31;
7630 tcg_gen_sari_i32(tmp2, tmp2, shift);
7631 tcg_gen_andi_i32(tmp, tmp, 0xffff0000);
7632 tcg_gen_ext16u_i32(tmp2, tmp2);
7633 } else {
7634 /* pkhbt */
7635 if (shift)
7636 tcg_gen_shli_i32(tmp2, tmp2, shift);
7637 tcg_gen_ext16u_i32(tmp, tmp);
7638 tcg_gen_andi_i32(tmp2, tmp2, 0xffff0000);
7640 tcg_gen_or_i32(tmp, tmp, tmp2);
7641 dead_tmp(tmp2);
7642 store_reg(s, rd, tmp);
7643 } else {
7644 /* Data processing register constant shift. */
7645 if (rn == 15) {
7646 tmp = new_tmp();
7647 tcg_gen_movi_i32(tmp, 0);
7648 } else {
7649 tmp = load_reg(s, rn);
7651 tmp2 = load_reg(s, rm);
7653 shiftop = (insn >> 4) & 3;
7654 shift = ((insn >> 6) & 3) | ((insn >> 10) & 0x1c);
7655 conds = (insn & (1 << 20)) != 0;
7656 logic_cc = (conds && thumb2_logic_op(op));
7657 gen_arm_shift_im(tmp2, shiftop, shift, logic_cc);
7658 if (gen_thumb2_data_op(s, op, conds, 0, tmp, tmp2))
7659 goto illegal_op;
7660 dead_tmp(tmp2);
7661 if (rd != 15) {
7662 store_reg(s, rd, tmp);
7663 } else {
7664 dead_tmp(tmp);
7667 break;
7668 case 13: /* Misc data processing. */
7669 op = ((insn >> 22) & 6) | ((insn >> 7) & 1);
7670 if (op < 4 && (insn & 0xf000) != 0xf000)
7671 goto illegal_op;
7672 switch (op) {
7673 case 0: /* Register controlled shift. */
7674 tmp = load_reg(s, rn);
7675 tmp2 = load_reg(s, rm);
7676 if ((insn & 0x70) != 0)
7677 goto illegal_op;
7678 op = (insn >> 21) & 3;
7679 logic_cc = (insn & (1 << 20)) != 0;
7680 gen_arm_shift_reg(tmp, op, tmp2, logic_cc);
7681 if (logic_cc)
7682 gen_logic_CC(tmp);
7683 store_reg_bx(env, s, rd, tmp);
7684 break;
7685 case 1: /* Sign/zero extend. */
7686 tmp = load_reg(s, rm);
7687 shift = (insn >> 4) & 3;
7688 /* ??? In many cases it's not necessary to do a
7689 rotate, a shift is sufficient. */
7690 if (shift != 0)
7691 tcg_gen_rotri_i32(tmp, tmp, shift * 8);
7692 op = (insn >> 20) & 7;
7693 switch (op) {
7694 case 0: gen_sxth(tmp); break;
7695 case 1: gen_uxth(tmp); break;
7696 case 2: gen_sxtb16(tmp); break;
7697 case 3: gen_uxtb16(tmp); break;
7698 case 4: gen_sxtb(tmp); break;
7699 case 5: gen_uxtb(tmp); break;
7700 default: goto illegal_op;
7702 if (rn != 15) {
7703 tmp2 = load_reg(s, rn);
7704 if ((op >> 1) == 1) {
7705 gen_add16(tmp, tmp2);
7706 } else {
7707 tcg_gen_add_i32(tmp, tmp, tmp2);
7708 dead_tmp(tmp2);
7711 store_reg(s, rd, tmp);
7712 break;
7713 case 2: /* SIMD add/subtract. */
7714 op = (insn >> 20) & 7;
7715 shift = (insn >> 4) & 7;
7716 if ((op & 3) == 3 || (shift & 3) == 3)
7717 goto illegal_op;
7718 tmp = load_reg(s, rn);
7719 tmp2 = load_reg(s, rm);
7720 gen_thumb2_parallel_addsub(op, shift, tmp, tmp2);
7721 dead_tmp(tmp2);
7722 store_reg(s, rd, tmp);
7723 break;
7724 case 3: /* Other data processing. */
7725 op = ((insn >> 17) & 0x38) | ((insn >> 4) & 7);
7726 if (op < 4) {
7727 /* Saturating add/subtract. */
7728 tmp = load_reg(s, rn);
7729 tmp2 = load_reg(s, rm);
7730 if (op & 1)
7731 gen_helper_double_saturate(tmp, tmp);
7732 if (op & 2)
7733 gen_helper_sub_saturate(tmp, tmp2, tmp);
7734 else
7735 gen_helper_add_saturate(tmp, tmp, tmp2);
7736 dead_tmp(tmp2);
7737 } else {
7738 tmp = load_reg(s, rn);
7739 switch (op) {
7740 case 0x0a: /* rbit */
7741 gen_helper_rbit(tmp, tmp);
7742 break;
7743 case 0x08: /* rev */
7744 tcg_gen_bswap32_i32(tmp, tmp);
7745 break;
7746 case 0x09: /* rev16 */
7747 gen_rev16(tmp);
7748 break;
7749 case 0x0b: /* revsh */
7750 gen_revsh(tmp);
7751 break;
7752 case 0x10: /* sel */
7753 tmp2 = load_reg(s, rm);
7754 tmp3 = new_tmp();
7755 tcg_gen_ld_i32(tmp3, cpu_env, offsetof(CPUState, GE));
7756 gen_helper_sel_flags(tmp, tmp3, tmp, tmp2);
7757 dead_tmp(tmp3);
7758 dead_tmp(tmp2);
7759 break;
7760 case 0x18: /* clz */
7761 gen_helper_clz(tmp, tmp);
7762 break;
7763 default:
7764 goto illegal_op;
7767 store_reg(s, rd, tmp);
7768 break;
7769 case 4: case 5: /* 32-bit multiply. Sum of absolute differences. */
7770 op = (insn >> 4) & 0xf;
7771 tmp = load_reg(s, rn);
7772 tmp2 = load_reg(s, rm);
7773 switch ((insn >> 20) & 7) {
7774 case 0: /* 32 x 32 -> 32 */
7775 tcg_gen_mul_i32(tmp, tmp, tmp2);
7776 dead_tmp(tmp2);
7777 if (rs != 15) {
7778 tmp2 = load_reg(s, rs);
7779 if (op)
7780 tcg_gen_sub_i32(tmp, tmp2, tmp);
7781 else
7782 tcg_gen_add_i32(tmp, tmp, tmp2);
7783 dead_tmp(tmp2);
7785 break;
7786 case 1: /* 16 x 16 -> 32 */
7787 gen_mulxy(tmp, tmp2, op & 2, op & 1);
7788 dead_tmp(tmp2);
7789 if (rs != 15) {
7790 tmp2 = load_reg(s, rs);
7791 gen_helper_add_setq(tmp, tmp, tmp2);
7792 dead_tmp(tmp2);
7794 break;
7795 case 2: /* Dual multiply add. */
7796 case 4: /* Dual multiply subtract. */
7797 if (op)
7798 gen_swap_half(tmp2);
7799 gen_smul_dual(tmp, tmp2);
7800 /* This addition cannot overflow. */
7801 if (insn & (1 << 22)) {
7802 tcg_gen_sub_i32(tmp, tmp, tmp2);
7803 } else {
7804 tcg_gen_add_i32(tmp, tmp, tmp2);
7806 dead_tmp(tmp2);
7807 if (rs != 15)
7809 tmp2 = load_reg(s, rs);
7810 gen_helper_add_setq(tmp, tmp, tmp2);
7811 dead_tmp(tmp2);
7813 break;
7814 case 3: /* 32 * 16 -> 32msb */
7815 if (op)
7816 tcg_gen_sari_i32(tmp2, tmp2, 16);
7817 else
7818 gen_sxth(tmp2);
7819 tmp64 = gen_muls_i64_i32(tmp, tmp2);
7820 tcg_gen_shri_i64(tmp64, tmp64, 16);
7821 tmp = new_tmp();
7822 tcg_gen_trunc_i64_i32(tmp, tmp64);
7823 tcg_temp_free_i64(tmp64);
7824 if (rs != 15)
7826 tmp2 = load_reg(s, rs);
7827 gen_helper_add_setq(tmp, tmp, tmp2);
7828 dead_tmp(tmp2);
7830 break;
7831 case 5: case 6: /* 32 * 32 -> 32msb */
7832 gen_imull(tmp, tmp2);
7833 if (insn & (1 << 5)) {
7834 gen_roundqd(tmp, tmp2);
7835 dead_tmp(tmp2);
7836 } else {
7837 dead_tmp(tmp);
7838 tmp = tmp2;
7840 if (rs != 15) {
7841 tmp2 = load_reg(s, rs);
7842 if (insn & (1 << 21)) {
7843 tcg_gen_add_i32(tmp, tmp, tmp2);
7844 } else {
7845 tcg_gen_sub_i32(tmp, tmp2, tmp);
7847 dead_tmp(tmp2);
7849 break;
7850 case 7: /* Unsigned sum of absolute differences. */
7851 gen_helper_usad8(tmp, tmp, tmp2);
7852 dead_tmp(tmp2);
7853 if (rs != 15) {
7854 tmp2 = load_reg(s, rs);
7855 tcg_gen_add_i32(tmp, tmp, tmp2);
7856 dead_tmp(tmp2);
7858 break;
7860 store_reg(s, rd, tmp);
7861 break;
7862 case 6: case 7: /* 64-bit multiply, Divide. */
7863 op = ((insn >> 4) & 0xf) | ((insn >> 16) & 0x70);
7864 tmp = load_reg(s, rn);
7865 tmp2 = load_reg(s, rm);
7866 if ((op & 0x50) == 0x10) {
7867 /* sdiv, udiv */
7868 if (!arm_feature(env, ARM_FEATURE_DIV))
7869 goto illegal_op;
7870 if (op & 0x20)
7871 gen_helper_udiv(tmp, tmp, tmp2);
7872 else
7873 gen_helper_sdiv(tmp, tmp, tmp2);
7874 dead_tmp(tmp2);
7875 store_reg(s, rd, tmp);
7876 } else if ((op & 0xe) == 0xc) {
7877 /* Dual multiply accumulate long. */
7878 if (op & 1)
7879 gen_swap_half(tmp2);
7880 gen_smul_dual(tmp, tmp2);
7881 if (op & 0x10) {
7882 tcg_gen_sub_i32(tmp, tmp, tmp2);
7883 } else {
7884 tcg_gen_add_i32(tmp, tmp, tmp2);
7886 dead_tmp(tmp2);
7887 /* BUGFIX */
7888 tmp64 = tcg_temp_new_i64();
7889 tcg_gen_ext_i32_i64(tmp64, tmp);
7890 dead_tmp(tmp);
7891 gen_addq(s, tmp64, rs, rd);
7892 gen_storeq_reg(s, rs, rd, tmp64);
7893 tcg_temp_free_i64(tmp64);
7894 } else {
7895 if (op & 0x20) {
7896 /* Unsigned 64-bit multiply */
7897 tmp64 = gen_mulu_i64_i32(tmp, tmp2);
7898 } else {
7899 if (op & 8) {
7900 /* smlalxy */
7901 gen_mulxy(tmp, tmp2, op & 2, op & 1);
7902 dead_tmp(tmp2);
7903 tmp64 = tcg_temp_new_i64();
7904 tcg_gen_ext_i32_i64(tmp64, tmp);
7905 dead_tmp(tmp);
7906 } else {
7907 /* Signed 64-bit multiply */
7908 tmp64 = gen_muls_i64_i32(tmp, tmp2);
7911 if (op & 4) {
7912 /* umaal */
7913 gen_addq_lo(s, tmp64, rs);
7914 gen_addq_lo(s, tmp64, rd);
7915 } else if (op & 0x40) {
7916 /* 64-bit accumulate. */
7917 gen_addq(s, tmp64, rs, rd);
7919 gen_storeq_reg(s, rs, rd, tmp64);
7920 tcg_temp_free_i64(tmp64);
7922 break;
7924 break;
7925 case 6: case 7: case 14: case 15:
7926 /* Coprocessor. */
7927 if (((insn >> 24) & 3) == 3) {
7928 /* Translate into the equivalent ARM encoding. */
7929 insn = (insn & 0xe2ffffff) | ((insn & (1 << 28)) >> 4);
7930 if (disas_neon_data_insn(env, s, insn))
7931 goto illegal_op;
7932 } else {
7933 if (insn & (1 << 28))
7934 goto illegal_op;
7935 if (disas_coproc_insn (env, s, insn))
7936 goto illegal_op;
7938 break;
7939 case 8: case 9: case 10: case 11:
7940 if (insn & (1 << 15)) {
7941 /* Branches, misc control. */
7942 if (insn & 0x5000) {
7943 /* Unconditional branch. */
7944 /* signextend(hw1[10:0]) -> offset[:12]. */
7945 offset = ((int32_t)insn << 5) >> 9 & ~(int32_t)0xfff;
7946 /* hw1[10:0] -> offset[11:1]. */
7947 offset |= (insn & 0x7ff) << 1;
7948 /* (~hw2[13, 11] ^ offset[24]) -> offset[23,22]
7949 offset[24:22] already have the same value because of the
7950 sign extension above. */
7951 offset ^= ((~insn) & (1 << 13)) << 10;
7952 offset ^= ((~insn) & (1 << 11)) << 11;
7954 if (insn & (1 << 14)) {
7955 /* Branch and link. */
7956 tcg_gen_movi_i32(cpu_R[14], s->pc | 1);
7959 offset += s->pc;
7960 if (insn & (1 << 12)) {
7961 /* b/bl */
7962 gen_jmp(s, offset);
7963 } else {
7964 /* blx */
7965 offset &= ~(uint32_t)2;
7966 gen_bx_im(s, offset);
7968 } else if (((insn >> 23) & 7) == 7) {
7969 /* Misc control */
7970 if (insn & (1 << 13))
7971 goto illegal_op;
7973 if (insn & (1 << 26)) {
7974 /* Secure monitor call (v6Z) */
7975 goto illegal_op; /* not implemented. */
7976 } else {
7977 op = (insn >> 20) & 7;
7978 switch (op) {
7979 case 0: /* msr cpsr. */
7980 if (IS_M(env)) {
7981 tmp = load_reg(s, rn);
7982 addr = tcg_const_i32(insn & 0xff);
7983 gen_helper_v7m_msr(cpu_env, addr, tmp);
7984 tcg_temp_free_i32(addr);
7985 dead_tmp(tmp);
7986 gen_lookup_tb(s);
7987 break;
7989 /* fall through */
7990 case 1: /* msr spsr. */
7991 if (IS_M(env))
7992 goto illegal_op;
7993 tmp = load_reg(s, rn);
7994 if (gen_set_psr(s,
7995 msr_mask(env, s, (insn >> 8) & 0xf, op == 1),
7996 op == 1, tmp))
7997 goto illegal_op;
7998 break;
7999 case 2: /* cps, nop-hint. */
8000 if (((insn >> 8) & 7) == 0) {
8001 gen_nop_hint(s, insn & 0xff);
8003 /* Implemented as NOP in user mode. */
8004 if (IS_USER(s))
8005 break;
8006 offset = 0;
8007 imm = 0;
8008 if (insn & (1 << 10)) {
8009 if (insn & (1 << 7))
8010 offset |= CPSR_A;
8011 if (insn & (1 << 6))
8012 offset |= CPSR_I;
8013 if (insn & (1 << 5))
8014 offset |= CPSR_F;
8015 if (insn & (1 << 9))
8016 imm = CPSR_A | CPSR_I | CPSR_F;
8018 if (insn & (1 << 8)) {
8019 offset |= 0x1f;
8020 imm |= (insn & 0x1f);
8022 if (offset) {
8023 gen_set_psr_im(s, offset, 0, imm);
8025 break;
8026 case 3: /* Special control operations. */
8027 ARCH(7);
8028 op = (insn >> 4) & 0xf;
8029 switch (op) {
8030 case 2: /* clrex */
8031 gen_clrex(s);
8032 break;
8033 case 4: /* dsb */
8034 case 5: /* dmb */
8035 case 6: /* isb */
8036 /* These execute as NOPs. */
8037 break;
8038 default:
8039 goto illegal_op;
8041 break;
8042 case 4: /* bxj */
8043 /* Trivial implementation equivalent to bx. */
8044 tmp = load_reg(s, rn);
8045 gen_bx(s, tmp);
8046 break;
8047 case 5: /* Exception return. */
8048 if (IS_USER(s)) {
8049 goto illegal_op;
8051 if (rn != 14 || rd != 15) {
8052 goto illegal_op;
8054 tmp = load_reg(s, rn);
8055 tcg_gen_subi_i32(tmp, tmp, insn & 0xff);
8056 gen_exception_return(s, tmp);
8057 break;
8058 case 6: /* mrs cpsr. */
8059 tmp = new_tmp();
8060 if (IS_M(env)) {
8061 addr = tcg_const_i32(insn & 0xff);
8062 gen_helper_v7m_mrs(tmp, cpu_env, addr);
8063 tcg_temp_free_i32(addr);
8064 } else {
8065 gen_helper_cpsr_read(tmp);
8067 store_reg(s, rd, tmp);
8068 break;
8069 case 7: /* mrs spsr. */
8070 /* Not accessible in user mode. */
8071 if (IS_USER(s) || IS_M(env))
8072 goto illegal_op;
8073 tmp = load_cpu_field(spsr);
8074 store_reg(s, rd, tmp);
8075 break;
8078 } else {
8079 /* Conditional branch. */
8080 op = (insn >> 22) & 0xf;
8081 /* Generate a conditional jump to next instruction. */
8082 s->condlabel = gen_new_label();
8083 gen_test_cc(op ^ 1, s->condlabel);
8084 s->condjmp = 1;
8086 /* offset[11:1] = insn[10:0] */
8087 offset = (insn & 0x7ff) << 1;
8088 /* offset[17:12] = insn[21:16]. */
8089 offset |= (insn & 0x003f0000) >> 4;
8090 /* offset[31:20] = insn[26]. */
8091 offset |= ((int32_t)((insn << 5) & 0x80000000)) >> 11;
8092 /* offset[18] = insn[13]. */
8093 offset |= (insn & (1 << 13)) << 5;
8094 /* offset[19] = insn[11]. */
8095 offset |= (insn & (1 << 11)) << 8;
8097 /* jump to the offset */
8098 gen_jmp(s, s->pc + offset);
8100 } else {
8101 /* Data processing immediate. */
8102 if (insn & (1 << 25)) {
8103 if (insn & (1 << 24)) {
8104 if (insn & (1 << 20))
8105 goto illegal_op;
8106 /* Bitfield/Saturate. */
8107 op = (insn >> 21) & 7;
8108 imm = insn & 0x1f;
8109 shift = ((insn >> 6) & 3) | ((insn >> 10) & 0x1c);
8110 if (rn == 15) {
8111 tmp = new_tmp();
8112 tcg_gen_movi_i32(tmp, 0);
8113 } else {
8114 tmp = load_reg(s, rn);
8116 switch (op) {
8117 case 2: /* Signed bitfield extract. */
8118 imm++;
8119 if (shift + imm > 32)
8120 goto illegal_op;
8121 if (imm < 32)
8122 gen_sbfx(tmp, shift, imm);
8123 break;
8124 case 6: /* Unsigned bitfield extract. */
8125 imm++;
8126 if (shift + imm > 32)
8127 goto illegal_op;
8128 if (imm < 32)
8129 gen_ubfx(tmp, shift, (1u << imm) - 1);
8130 break;
8131 case 3: /* Bitfield insert/clear. */
8132 if (imm < shift)
8133 goto illegal_op;
8134 imm = imm + 1 - shift;
8135 if (imm != 32) {
8136 tmp2 = load_reg(s, rd);
8137 gen_bfi(tmp, tmp2, tmp, shift, (1u << imm) - 1);
8138 dead_tmp(tmp2);
8140 break;
8141 case 7:
8142 goto illegal_op;
8143 default: /* Saturate. */
8144 if (shift) {
8145 if (op & 1)
8146 tcg_gen_sari_i32(tmp, tmp, shift);
8147 else
8148 tcg_gen_shli_i32(tmp, tmp, shift);
8150 tmp2 = tcg_const_i32(imm);
8151 if (op & 4) {
8152 /* Unsigned. */
8153 if ((op & 1) && shift == 0)
8154 gen_helper_usat16(tmp, tmp, tmp2);
8155 else
8156 gen_helper_usat(tmp, tmp, tmp2);
8157 } else {
8158 /* Signed. */
8159 if ((op & 1) && shift == 0)
8160 gen_helper_ssat16(tmp, tmp, tmp2);
8161 else
8162 gen_helper_ssat(tmp, tmp, tmp2);
8164 tcg_temp_free_i32(tmp2);
8165 break;
8167 store_reg(s, rd, tmp);
8168 } else {
8169 imm = ((insn & 0x04000000) >> 15)
8170 | ((insn & 0x7000) >> 4) | (insn & 0xff);
8171 if (insn & (1 << 22)) {
8172 /* 16-bit immediate. */
8173 imm |= (insn >> 4) & 0xf000;
8174 if (insn & (1 << 23)) {
8175 /* movt */
8176 tmp = load_reg(s, rd);
8177 tcg_gen_ext16u_i32(tmp, tmp);
8178 tcg_gen_ori_i32(tmp, tmp, imm << 16);
8179 } else {
8180 /* movw */
8181 tmp = new_tmp();
8182 tcg_gen_movi_i32(tmp, imm);
8184 } else {
8185 /* Add/sub 12-bit immediate. */
8186 if (rn == 15) {
8187 offset = s->pc & ~(uint32_t)3;
8188 if (insn & (1 << 23))
8189 offset -= imm;
8190 else
8191 offset += imm;
8192 tmp = new_tmp();
8193 tcg_gen_movi_i32(tmp, offset);
8194 } else {
8195 tmp = load_reg(s, rn);
8196 if (insn & (1 << 23))
8197 tcg_gen_subi_i32(tmp, tmp, imm);
8198 else
8199 tcg_gen_addi_i32(tmp, tmp, imm);
8202 store_reg(s, rd, tmp);
8204 } else {
8205 int shifter_out = 0;
8206 /* modified 12-bit immediate. */
8207 shift = ((insn & 0x04000000) >> 23) | ((insn & 0x7000) >> 12);
8208 imm = (insn & 0xff);
8209 switch (shift) {
8210 case 0: /* XY */
8211 /* Nothing to do. */
8212 break;
8213 case 1: /* 00XY00XY */
8214 imm |= imm << 16;
8215 break;
8216 case 2: /* XY00XY00 */
8217 imm |= imm << 16;
8218 imm <<= 8;
8219 break;
8220 case 3: /* XYXYXYXY */
8221 imm |= imm << 16;
8222 imm |= imm << 8;
8223 break;
8224 default: /* Rotated constant. */
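/* The 5-bit rotation amount is i:imm3:a (a being bit 7 of imm8), with
   bit 7 of the immediate forced to 1; when the operation sets flags,
   bit 31 of the resulting constant supplies the shifter carry-out. */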
8225 shift = (shift << 1) | (imm >> 7);
8226 imm |= 0x80;
8227 imm = imm << (32 - shift);
8228 shifter_out = 1;
8229 break;
8231 tmp2 = new_tmp();
8232 tcg_gen_movi_i32(tmp2, imm);
8233 rn = (insn >> 16) & 0xf;
8234 if (rn == 15) {
8235 tmp = new_tmp();
8236 tcg_gen_movi_i32(tmp, 0);
8237 } else {
8238 tmp = load_reg(s, rn);
8240 op = (insn >> 21) & 0xf;
8241 if (gen_thumb2_data_op(s, op, (insn & (1 << 20)) != 0,
8242 shifter_out, tmp, tmp2))
8243 goto illegal_op;
8244 dead_tmp(tmp2);
8245 rd = (insn >> 8) & 0xf;
8246 if (rd != 15) {
8247 store_reg(s, rd, tmp);
8248 } else {
8249 dead_tmp(tmp);
8253 break;
8254 case 12: /* Load/store single data item. */
8256 int postinc = 0;
8257 int writeback = 0;
8258 int user;
8259 if ((insn & 0x01100000) == 0x01000000) {
8260 if (disas_neon_ls_insn(env, s, insn))
8261 goto illegal_op;
8262 break;
8264 user = IS_USER(s);
8265 if (rn == 15) {
8266 addr = new_tmp();
8267 /* PC relative. */
8268 /* s->pc has already been incremented by 4. */
8269 imm = s->pc & 0xfffffffc;
8270 if (insn & (1 << 23))
8271 imm += insn & 0xfff;
8272 else
8273 imm -= insn & 0xfff;
8274 tcg_gen_movi_i32(addr, imm);
8275 } else {
8276 addr = load_reg(s, rn);
8277 if (insn & (1 << 23)) {
8278 /* Positive offset. */
8279 imm = insn & 0xfff;
8280 tcg_gen_addi_i32(addr, addr, imm);
8281 } else {
8282 op = (insn >> 8) & 7;
8283 imm = insn & 0xff;
8284 switch (op) {
8285 case 0: case 8: /* Shifted Register. */
8286 shift = (insn >> 4) & 0xf;
8287 if (shift > 3)
8288 goto illegal_op;
8289 tmp = load_reg(s, rm);
8290 if (shift)
8291 tcg_gen_shli_i32(tmp, tmp, shift);
8292 tcg_gen_add_i32(addr, addr, tmp);
8293 dead_tmp(tmp);
8294 break;
8295 case 4: /* Negative offset. */
8296 tcg_gen_addi_i32(addr, addr, -imm);
8297 break;
8298 case 6: /* User privilege. */
8299 tcg_gen_addi_i32(addr, addr, imm);
8300 user = 1;
8301 break;
8302 case 1: /* Post-decrement. */
8303 imm = -imm;
8304 /* Fall through. */
8305 case 3: /* Post-increment. */
8306 postinc = 1;
8307 writeback = 1;
8308 break;
8309 case 5: /* Pre-decrement. */
8310 imm = -imm;
8311 /* Fall through. */
8312 case 7: /* Pre-increment. */
8313 tcg_gen_addi_i32(addr, addr, imm);
8314 writeback = 1;
8315 break;
8316 default:
8317 goto illegal_op;
8321 op = ((insn >> 21) & 3) | ((insn >> 22) & 4);
8322 if (insn & (1 << 20)) {
8323 /* Load. */
8324 if (rs == 15 && op != 2) {
8325 if (op & 2)
8326 goto illegal_op;
8327 /* Memory hint. Implemented as NOP. */
8328 } else {
8329 switch (op) {
8330 case 0: tmp = gen_ld8u(addr, user); break;
8331 case 4: tmp = gen_ld8s(addr, user); break;
8332 case 1: tmp = gen_ld16u(addr, user); break;
8333 case 5: tmp = gen_ld16s(addr, user); break;
8334 case 2: tmp = gen_ld32(addr, user); break;
8335 default: goto illegal_op;
8337 if (rs == 15) {
8338 gen_bx(s, tmp);
8339 } else {
8340 store_reg(s, rs, tmp);
8343 } else {
8344 /* Store. */
8345 if (rs == 15)
8346 goto illegal_op;
8347 tmp = load_reg(s, rs);
8348 switch (op) {
8349 case 0: gen_st8(tmp, addr, user); break;
8350 case 1: gen_st16(tmp, addr, user); break;
8351 case 2: gen_st32(tmp, addr, user); break;
8352 default: goto illegal_op;
8355 if (postinc)
8356 tcg_gen_addi_i32(addr, addr, imm);
8357 if (writeback) {
8358 store_reg(s, rn, addr);
8359 } else {
8360 dead_tmp(addr);
8363 break;
8364 default:
8365 goto illegal_op;
8367 return 0;
8368 illegal_op:
8369 return 1;
8372 static void disas_thumb_insn(CPUState *env, DisasContext *s)
8374 uint32_t val, insn, op, rm, rn, rd, shift, cond;
8375 int32_t offset;
8376 int i;
8377 TCGv tmp;
8378 TCGv tmp2;
8379 TCGv addr;
8381 if (s->condexec_mask) {
8382 cond = s->condexec_cond;
8383 if (cond != 0x0e) { /* Skip conditional when condition is AL. */
8384 s->condlabel = gen_new_label();
8385 gen_test_cc(cond ^ 1, s->condlabel);
8386 s->condjmp = 1;
8390 insn = lduw_code(s->pc);
8391 s->pc += 2;
8393 switch (insn >> 12) {
8394 case 0: case 1:
8396 rd = insn & 7;
8397 op = (insn >> 11) & 3;
8398 if (op == 3) {
8399 /* add/subtract */
8400 rn = (insn >> 3) & 7;
8401 tmp = load_reg(s, rn);
8402 if (insn & (1 << 10)) {
8403 /* immediate */
8404 tmp2 = new_tmp();
8405 tcg_gen_movi_i32(tmp2, (insn >> 6) & 7);
8406 } else {
8407 /* reg */
8408 rm = (insn >> 6) & 7;
8409 tmp2 = load_reg(s, rm);
8411 if (insn & (1 << 9)) {
8412 if (s->condexec_mask)
8413 tcg_gen_sub_i32(tmp, tmp, tmp2);
8414 else
8415 gen_helper_sub_cc(tmp, tmp, tmp2);
8416 } else {
8417 if (s->condexec_mask)
8418 tcg_gen_add_i32(tmp, tmp, tmp2);
8419 else
8420 gen_helper_add_cc(tmp, tmp, tmp2);
8422 dead_tmp(tmp2);
8423 store_reg(s, rd, tmp);
8424 } else {
8425 /* shift immediate */
8426 rm = (insn >> 3) & 7;
8427 shift = (insn >> 6) & 0x1f;
8428 tmp = load_reg(s, rm);
8429 gen_arm_shift_im(tmp, op, shift, s->condexec_mask == 0);
8430 if (!s->condexec_mask)
8431 gen_logic_CC(tmp);
8432 store_reg(s, rd, tmp);
8434 break;
8435 case 2: case 3:
8436 /* arithmetic large immediate */
8437 op = (insn >> 11) & 3;
8438 rd = (insn >> 8) & 0x7;
8439 if (op == 0) { /* mov */
8440 tmp = new_tmp();
8441 tcg_gen_movi_i32(tmp, insn & 0xff);
8442 if (!s->condexec_mask)
8443 gen_logic_CC(tmp);
8444 store_reg(s, rd, tmp);
8445 } else {
8446 tmp = load_reg(s, rd);
8447 tmp2 = new_tmp();
8448 tcg_gen_movi_i32(tmp2, insn & 0xff);
8449 switch (op) {
8450 case 1: /* cmp */
8451 gen_helper_sub_cc(tmp, tmp, tmp2);
8452 dead_tmp(tmp);
8453 dead_tmp(tmp2);
8454 break;
8455 case 2: /* add */
8456 if (s->condexec_mask)
8457 tcg_gen_add_i32(tmp, tmp, tmp2);
8458 else
8459 gen_helper_add_cc(tmp, tmp, tmp2);
8460 dead_tmp(tmp2);
8461 store_reg(s, rd, tmp);
8462 break;
8463 case 3: /* sub */
8464 if (s->condexec_mask)
8465 tcg_gen_sub_i32(tmp, tmp, tmp2);
8466 else
8467 gen_helper_sub_cc(tmp, tmp, tmp2);
8468 dead_tmp(tmp2);
8469 store_reg(s, rd, tmp);
8470 break;
8473 break;
8474 case 4:
8475 if (insn & (1 << 11)) {
8476 rd = (insn >> 8) & 7;
8477 /* load pc-relative. Bit 1 of PC is ignored. */
8478 val = s->pc + 2 + ((insn & 0xff) * 4);
8479 val &= ~(uint32_t)2;
8480 addr = new_tmp();
8481 tcg_gen_movi_i32(addr, val);
8482 tmp = gen_ld32(addr, IS_USER(s));
8483 dead_tmp(addr);
8484 store_reg(s, rd, tmp);
8485 break;
8487 if (insn & (1 << 10)) {
8488 /* data processing extended or blx */
8489 rd = (insn & 7) | ((insn >> 4) & 8);
8490 rm = (insn >> 3) & 0xf;
8491 op = (insn >> 8) & 3;
8492 switch (op) {
8493 case 0: /* add */
8494 tmp = load_reg(s, rd);
8495 tmp2 = load_reg(s, rm);
8496 tcg_gen_add_i32(tmp, tmp, tmp2);
8497 dead_tmp(tmp2);
8498 store_reg(s, rd, tmp);
8499 break;
8500 case 1: /* cmp */
8501 tmp = load_reg(s, rd);
8502 tmp2 = load_reg(s, rm);
8503 gen_helper_sub_cc(tmp, tmp, tmp2);
8504 dead_tmp(tmp2);
8505 dead_tmp(tmp);
8506 break;
8507 case 2: /* mov/cpy */
8508 tmp = load_reg(s, rm);
8509 store_reg(s, rd, tmp);
8510 break;
8511 case 3:/* branch [and link] exchange thumb register */
8512 tmp = load_reg(s, rm);
8513 if (insn & (1 << 7)) {
8514 val = (uint32_t)s->pc | 1;
8515 tmp2 = new_tmp();
8516 tcg_gen_movi_i32(tmp2, val);
8517 store_reg(s, 14, tmp2);
8519 gen_bx(s, tmp);
8520 break;
8522 break;
8525 /* data processing register */
8526 rd = insn & 7;
8527 rm = (insn >> 3) & 7;
8528 op = (insn >> 6) & 0xf;
8529 if (op == 2 || op == 3 || op == 4 || op == 7) {
8530 /* the shift/rotate ops want the operands backwards */
8531 val = rm;
8532 rm = rd;
8533 rd = val;
8534 val = 1;
8535 } else {
8536 val = 0;
8539 if (op == 9) { /* neg */
8540 tmp = new_tmp();
8541 tcg_gen_movi_i32(tmp, 0);
8542 } else if (op != 0xf) { /* mvn doesn't read its first operand */
8543 tmp = load_reg(s, rd);
8544 } else {
8545 TCGV_UNUSED(tmp);
8548 tmp2 = load_reg(s, rm);
8549 switch (op) {
8550 case 0x0: /* and */
8551 tcg_gen_and_i32(tmp, tmp, tmp2);
8552 if (!s->condexec_mask)
8553 gen_logic_CC(tmp);
8554 break;
8555 case 0x1: /* eor */
8556 tcg_gen_xor_i32(tmp, tmp, tmp2);
8557 if (!s->condexec_mask)
8558 gen_logic_CC(tmp);
8559 break;
8560 case 0x2: /* lsl */
8561 if (s->condexec_mask) {
8562 gen_helper_shl(tmp2, tmp2, tmp);
8563 } else {
8564 gen_helper_shl_cc(tmp2, tmp2, tmp);
8565 gen_logic_CC(tmp2);
8567 break;
8568 case 0x3: /* lsr */
8569 if (s->condexec_mask) {
8570 gen_helper_shr(tmp2, tmp2, tmp);
8571 } else {
8572 gen_helper_shr_cc(tmp2, tmp2, tmp);
8573 gen_logic_CC(tmp2);
8575 break;
8576 case 0x4: /* asr */
8577 if (s->condexec_mask) {
8578 gen_helper_sar(tmp2, tmp2, tmp);
8579 } else {
8580 gen_helper_sar_cc(tmp2, tmp2, tmp);
8581 gen_logic_CC(tmp2);
8583 break;
8584 case 0x5: /* adc */
8585 if (s->condexec_mask)
8586 gen_adc(tmp, tmp2);
8587 else
8588 gen_helper_adc_cc(tmp, tmp, tmp2);
8589 break;
8590 case 0x6: /* sbc */
8591 if (s->condexec_mask)
8592 gen_sub_carry(tmp, tmp, tmp2);
8593 else
8594 gen_helper_sbc_cc(tmp, tmp, tmp2);
8595 break;
8596 case 0x7: /* ror */
8597 if (s->condexec_mask) {
8598 tcg_gen_andi_i32(tmp, tmp, 0x1f);
8599 tcg_gen_rotr_i32(tmp2, tmp2, tmp);
8600 } else {
8601 gen_helper_ror_cc(tmp2, tmp2, tmp);
8602 gen_logic_CC(tmp2);
8604 break;
8605 case 0x8: /* tst */
8606 tcg_gen_and_i32(tmp, tmp, tmp2);
8607 gen_logic_CC(tmp);
8608 rd = 16;
8609 break;
8610 case 0x9: /* neg */
8611 if (s->condexec_mask)
8612 tcg_gen_neg_i32(tmp, tmp2);
8613 else
8614 gen_helper_sub_cc(tmp, tmp, tmp2);
8615 break;
8616 case 0xa: /* cmp */
8617 gen_helper_sub_cc(tmp, tmp, tmp2);
8618 rd = 16;
8619 break;
8620 case 0xb: /* cmn */
8621 gen_helper_add_cc(tmp, tmp, tmp2);
8622 rd = 16;
8623 break;
8624 case 0xc: /* orr */
8625 tcg_gen_or_i32(tmp, tmp, tmp2);
8626 if (!s->condexec_mask)
8627 gen_logic_CC(tmp);
8628 break;
8629 case 0xd: /* mul */
8630 tcg_gen_mul_i32(tmp, tmp, tmp2);
8631 if (!s->condexec_mask)
8632 gen_logic_CC(tmp);
8633 break;
8634 case 0xe: /* bic */
8635 tcg_gen_andc_i32(tmp, tmp, tmp2);
8636 if (!s->condexec_mask)
8637 gen_logic_CC(tmp);
8638 break;
8639 case 0xf: /* mvn */
8640 tcg_gen_not_i32(tmp2, tmp2);
8641 if (!s->condexec_mask)
8642 gen_logic_CC(tmp2);
8643 val = 1;
8644 rm = rd;
8645 break;
8647 if (rd != 16) {
8648 if (val) {
8649 store_reg(s, rm, tmp2);
8650 if (op != 0xf)
8651 dead_tmp(tmp);
8652 } else {
8653 store_reg(s, rd, tmp);
8654 dead_tmp(tmp2);
8656 } else {
8657 dead_tmp(tmp);
8658 dead_tmp(tmp2);
8660 break;
8662 case 5:
8663 /* load/store register offset. */
8664 rd = insn & 7;
8665 rn = (insn >> 3) & 7;
8666 rm = (insn >> 6) & 7;
8667 op = (insn >> 9) & 7;
8668 addr = load_reg(s, rn);
8669 tmp = load_reg(s, rm);
8670 tcg_gen_add_i32(addr, addr, tmp);
8671 dead_tmp(tmp);
8673 if (op < 3) /* store */
8674 tmp = load_reg(s, rd);
8676 switch (op) {
8677 case 0: /* str */
8678 gen_st32(tmp, addr, IS_USER(s));
8679 break;
8680 case 1: /* strh */
8681 gen_st16(tmp, addr, IS_USER(s));
8682 break;
8683 case 2: /* strb */
8684 gen_st8(tmp, addr, IS_USER(s));
8685 break;
8686 case 3: /* ldrsb */
8687 tmp = gen_ld8s(addr, IS_USER(s));
8688 break;
8689 case 4: /* ldr */
8690 tmp = gen_ld32(addr, IS_USER(s));
8691 break;
8692 case 5: /* ldrh */
8693 tmp = gen_ld16u(addr, IS_USER(s));
8694 break;
8695 case 6: /* ldrb */
8696 tmp = gen_ld8u(addr, IS_USER(s));
8697 break;
8698 case 7: /* ldrsh */
8699 tmp = gen_ld16s(addr, IS_USER(s));
8700 break;
8702 if (op >= 3) /* load */
8703 store_reg(s, rd, tmp);
8704 dead_tmp(addr);
8705 break;
8707 case 6:
8708 /* load/store word immediate offset */
8709 rd = insn & 7;
8710 rn = (insn >> 3) & 7;
8711 addr = load_reg(s, rn);
8712 val = (insn >> 4) & 0x7c;
8713 tcg_gen_addi_i32(addr, addr, val);
8715 if (insn & (1 << 11)) {
8716 /* load */
8717 tmp = gen_ld32(addr, IS_USER(s));
8718 store_reg(s, rd, tmp);
8719 } else {
8720 /* store */
8721 tmp = load_reg(s, rd);
8722 gen_st32(tmp, addr, IS_USER(s));
8724 dead_tmp(addr);
8725 break;
8727 case 7:
8728 /* load/store byte immediate offset */
8729 rd = insn & 7;
8730 rn = (insn >> 3) & 7;
8731 addr = load_reg(s, rn);
8732 val = (insn >> 6) & 0x1f;
8733 tcg_gen_addi_i32(addr, addr, val);
8735 if (insn & (1 << 11)) {
8736 /* load */
8737 tmp = gen_ld8u(addr, IS_USER(s));
8738 store_reg(s, rd, tmp);
8739 } else {
8740 /* store */
8741 tmp = load_reg(s, rd);
8742 gen_st8(tmp, addr, IS_USER(s));
8744 dead_tmp(addr);
8745 break;
8747 case 8:
8748 /* load/store halfword immediate offset */
8749 rd = insn & 7;
8750 rn = (insn >> 3) & 7;
8751 addr = load_reg(s, rn);
8752 val = (insn >> 5) & 0x3e;
8753 tcg_gen_addi_i32(addr, addr, val);
8755 if (insn & (1 << 11)) {
8756 /* load */
8757 tmp = gen_ld16u(addr, IS_USER(s));
8758 store_reg(s, rd, tmp);
8759 } else {
8760 /* store */
8761 tmp = load_reg(s, rd);
8762 gen_st16(tmp, addr, IS_USER(s));
8764 dead_tmp(addr);
8765 break;
8767 case 9:
8768 /* load/store from stack */
8769 rd = (insn >> 8) & 7;
8770 addr = load_reg(s, 13);
8771 val = (insn & 0xff) * 4;
8772 tcg_gen_addi_i32(addr, addr, val);
8774 if (insn & (1 << 11)) {
8775 /* load */
8776 tmp = gen_ld32(addr, IS_USER(s));
8777 store_reg(s, rd, tmp);
8778 } else {
8779 /* store */
8780 tmp = load_reg(s, rd);
8781 gen_st32(tmp, addr, IS_USER(s));
8783 dead_tmp(addr);
8784 break;
8786 case 10:
8787 /* add to high reg */
8788 rd = (insn >> 8) & 7;
8789 if (insn & (1 << 11)) {
8790 /* SP */
8791 tmp = load_reg(s, 13);
8792 } else {
8793 /* PC. bit 1 is ignored. */
8794 tmp = new_tmp();
8795 tcg_gen_movi_i32(tmp, (s->pc + 2) & ~(uint32_t)2);
8797 val = (insn & 0xff) * 4;
8798 tcg_gen_addi_i32(tmp, tmp, val);
8799 store_reg(s, rd, tmp);
8800 break;
8802 case 11:
8803 /* misc */
8804 op = (insn >> 8) & 0xf;
8805 switch (op) {
8806 case 0:
8807 /* adjust stack pointer */
8808 tmp = load_reg(s, 13);
8809 val = (insn & 0x7f) * 4;
8810 if (insn & (1 << 7))
8811 val = -(int32_t)val;
8812 tcg_gen_addi_i32(tmp, tmp, val);
8813 store_reg(s, 13, tmp);
8814 break;
8816 case 2: /* sign/zero extend. */
8817 ARCH(6);
8818 rd = insn & 7;
8819 rm = (insn >> 3) & 7;
8820 tmp = load_reg(s, rm);
8821 switch ((insn >> 6) & 3) {
8822 case 0: gen_sxth(tmp); break;
8823 case 1: gen_sxtb(tmp); break;
8824 case 2: gen_uxth(tmp); break;
8825 case 3: gen_uxtb(tmp); break;
8827 store_reg(s, rd, tmp);
8828 break;
8829 case 4: case 5: case 0xc: case 0xd:
8830 /* push/pop */
8831 addr = load_reg(s, 13);
8832 if (insn & (1 << 8))
8833 offset = 4;
8834 else
8835 offset = 0;
8836 for (i = 0; i < 8; i++) {
8837 if (insn & (1 << i))
8838 offset += 4;
8840 if ((insn & (1 << 11)) == 0) {
8841 tcg_gen_addi_i32(addr, addr, -offset);
8843 for (i = 0; i < 8; i++) {
8844 if (insn & (1 << i)) {
8845 if (insn & (1 << 11)) {
8846 /* pop */
8847 tmp = gen_ld32(addr, IS_USER(s));
8848 store_reg(s, i, tmp);
8849 } else {
8850 /* push */
8851 tmp = load_reg(s, i);
8852 gen_st32(tmp, addr, IS_USER(s));
8854 /* advance to the next address. */
8855 tcg_gen_addi_i32(addr, addr, 4);
8858 TCGV_UNUSED(tmp);
8859 if (insn & (1 << 8)) {
8860 if (insn & (1 << 11)) {
8861 /* pop pc */
8862 tmp = gen_ld32(addr, IS_USER(s));
8863 /* don't set the pc until the rest of the instruction
8864 has completed */
8865 } else {
8866 /* push lr */
8867 tmp = load_reg(s, 14);
8868 gen_st32(tmp, addr, IS_USER(s));
8870 tcg_gen_addi_i32(addr, addr, 4);
8872 if ((insn & (1 << 11)) == 0) {
8873 tcg_gen_addi_i32(addr, addr, -offset);
8875 /* write back the new stack pointer */
8876 store_reg(s, 13, addr);
8877 /* set the new PC value */
8878 if ((insn & 0x0900) == 0x0900)
8879 gen_bx(s, tmp);
8880 break;
8882 case 1: case 3: case 9: case 11: /* cbz/cbnz */
8883 rm = insn & 7;
8884 tmp = load_reg(s, rm);
8885 s->condlabel = gen_new_label();
8886 s->condjmp = 1;
8887 if (insn & (1 << 11))
8888 tcg_gen_brcondi_i32(TCG_COND_EQ, tmp, 0, s->condlabel);
8889 else
8890 tcg_gen_brcondi_i32(TCG_COND_NE, tmp, 0, s->condlabel);
8891 dead_tmp(tmp);
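/* CB{N}Z offset is i:imm5:'0': bits [7:3] give imm5 (scaled by 2) and
   bit 9 supplies the high bit. */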
8892 offset = ((insn & 0xf8) >> 2) | (insn & 0x200) >> 3;
8893 val = (uint32_t)s->pc + 2;
8894 val += offset;
8895 gen_jmp(s, val);
8896 break;
8898 case 15: /* IT, nop-hint. */
8899 if ((insn & 0xf) == 0) {
8900 gen_nop_hint(s, (insn >> 4) & 0xf);
8901 break;
8903 /* If Then. */
8904 s->condexec_cond = (insn >> 4) & 0xe;
8905 s->condexec_mask = insn & 0x1f;
8906 /* No actual code generated for this insn, just set up state. */
8907 break;
8909 case 0xe: /* bkpt */
8910 gen_set_condexec(s);
8911 gen_set_pc_im(s->pc - 2);
8912 gen_exception(EXCP_BKPT);
8913 s->is_jmp = DISAS_JUMP;
8914 break;
8916 case 0xa: /* rev */
8917 ARCH(6);
8918 rn = (insn >> 3) & 0x7;
8919 rd = insn & 0x7;
8920 tmp = load_reg(s, rn);
8921 switch ((insn >> 6) & 3) {
8922 case 0: tcg_gen_bswap32_i32(tmp, tmp); break;
8923 case 1: gen_rev16(tmp); break;
8924 case 3: gen_revsh(tmp); break;
8925 default: goto illegal_op;
8927 store_reg(s, rd, tmp);
8928 break;
8930 case 6: /* cps */
8931 ARCH(6);
8932 if (IS_USER(s))
8933 break;
8934 if (IS_M(env)) {
8935 tmp = tcg_const_i32((insn & (1 << 4)) != 0);
8936 /* PRIMASK */
8937 if (insn & 1) {
8938 addr = tcg_const_i32(16);
8939 gen_helper_v7m_msr(cpu_env, addr, tmp);
8940 tcg_temp_free_i32(addr);
8942 /* FAULTMASK */
8943 if (insn & 2) {
8944 addr = tcg_const_i32(17);
8945 gen_helper_v7m_msr(cpu_env, addr, tmp);
8946 tcg_temp_free_i32(addr);
8948 tcg_temp_free_i32(tmp);
8949 gen_lookup_tb(s);
8950 } else {
8951 if (insn & (1 << 4))
8952 shift = CPSR_A | CPSR_I | CPSR_F;
8953 else
8954 shift = 0;
8955 gen_set_psr_im(s, ((insn & 7) << 6), 0, shift);
8957 break;
8959 default:
8960 goto undef;
8962 break;
8964 case 12:
8965 /* load/store multiple */
8966 rn = (insn >> 8) & 0x7;
8967 addr = load_reg(s, rn);
8968 for (i = 0; i < 8; i++) {
8969 if (insn & (1 << i)) {
8970 if (insn & (1 << 11)) {
8971 /* load */
8972 tmp = gen_ld32(addr, IS_USER(s));
8973 store_reg(s, i, tmp);
8974 } else {
8975 /* store */
8976 tmp = load_reg(s, i);
8977 gen_st32(tmp, addr, IS_USER(s));
8978 }
8979 /* advance to the next address */
8980 tcg_gen_addi_i32(addr, addr, 4);
8981 }
8982 }
8983 /* Base register writeback. */
8984 if ((insn & (1 << rn)) == 0) {
8985 store_reg(s, rn, addr);
8986 } else {
8987 dead_tmp(addr);
8988 }
8989 break;
8991 case 13:
8992 /* conditional branch or swi */
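/* The condition is bits [11:8]: 0xe is an undefined encoding and 0xf
   is SWI.  For an ordinary conditional branch the low byte is
   sign-extended, doubled and added to PC + 4, with the inverse
   condition used to branch around the jump when it is not taken.  */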
8993 cond = (insn >> 8) & 0xf;
8994 if (cond == 0xe)
8995 goto undef;
8997 if (cond == 0xf) {
8998 /* swi */
8999 gen_set_condexec(s);
9000 gen_set_pc_im(s->pc);
9001 s->is_jmp = DISAS_SWI;
9002 break;
9003 }
9004 /* generate a conditional jump to next instruction */
9005 s->condlabel = gen_new_label();
9006 gen_test_cc(cond ^ 1, s->condlabel);
9007 s->condjmp = 1;
9009 /* jump to the offset */
9010 val = (uint32_t)s->pc + 2;
9011 offset = ((int32_t)insn << 24) >> 24;
9012 val += offset << 1;
9013 gen_jmp(s, val);
9014 break;
9016 case 14:
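/* With bit 11 set this halfword is part of a 32-bit Thumb-2 encoding
   and is handed to disas_thumb2_insn; otherwise it is an
   unconditional B with an 11-bit signed halfword offset relative to
   PC + 4.  */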
9017 if (insn & (1 << 11)) {
9018 if (disas_thumb2_insn(env, s, insn))
9019 goto undef32;
9020 break;
9021 }
9022 /* unconditional branch */
9023 val = (uint32_t)s->pc;
9024 offset = ((int32_t)insn << 21) >> 21;
9025 val += (offset << 1) + 2;
9026 gen_jmp(s, val);
9027 break;
9029 case 15:
9030 if (disas_thumb2_insn(env, s, insn))
9031 goto undef32;
9032 break;
9033 }
9034 return;
9035 undef32:
9036 gen_set_condexec(s);
9037 gen_set_pc_im(s->pc - 4);
9038 gen_exception(EXCP_UDEF);
9039 s->is_jmp = DISAS_JUMP;
9040 return;
9041 illegal_op:
9042 undef:
9043 gen_set_condexec(s);
9044 gen_set_pc_im(s->pc - 2);
9045 gen_exception(EXCP_UDEF);
9046 s->is_jmp = DISAS_JUMP;
9047 }
9049 /* generate intermediate code in gen_opc_buf and gen_opparam_buf for
9050 basic block 'tb'. If search_pc is TRUE, also generate PC
9051 information for each intermediate instruction. */
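/* In outline: a DisasContext is filled in from the CPU state, then
   instructions are translated one at a time -- checking breakpoints,
   IT-block state and the optional PC-search bookkeeping on each
   iteration -- until a branch, a page boundary, the icount or opcode
   buffer limit, or single-stepping stops the block, after which the
   epilogue appropriate to dc->is_jmp is emitted.  */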
9052 static inline void gen_intermediate_code_internal(CPUState *env,
9053 TranslationBlock *tb,
9054 int search_pc)
9055 {
9056 DisasContext dc1, *dc = &dc1;
9057 CPUBreakpoint *bp;
9058 uint16_t *gen_opc_end;
9059 int j, lj;
9060 target_ulong pc_start;
9061 uint32_t next_page_start;
9062 int num_insns;
9063 int max_insns;
9065 /* generate intermediate code */
9066 num_temps = 0;
9068 pc_start = tb->pc;
9070 dc->tb = tb;
9072 gen_opc_end = gen_opc_buf + OPC_MAX_SIZE;
9074 dc->is_jmp = DISAS_NEXT;
9075 dc->pc = pc_start;
9076 dc->singlestep_enabled = env->singlestep_enabled;
9077 dc->condjmp = 0;
9078 dc->thumb = env->thumb;
9079 dc->condexec_mask = (env->condexec_bits & 0xf) << 1;
9080 dc->condexec_cond = env->condexec_bits >> 4;
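/* env->condexec_bits packs the IT state with the condition in the
   upper bits and the mask in the low four.  It is unpacked into the
   DisasContext here and cleared in the CPU state just below, which
   is why exception paths call gen_set_condexec() to put it back.  */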
9081 #if !defined(CONFIG_USER_ONLY)
9082 if (IS_M(env)) {
9083 dc->user = ((env->v7m.exception == 0) && (env->v7m.control & 1));
9084 } else {
9085 dc->user = (env->uncached_cpsr & 0x1f) == ARM_CPU_MODE_USR;
9086 }
9087 #endif
9088 cpu_F0s = tcg_temp_new_i32();
9089 cpu_F1s = tcg_temp_new_i32();
9090 cpu_F0d = tcg_temp_new_i64();
9091 cpu_F1d = tcg_temp_new_i64();
9092 cpu_V0 = cpu_F0d;
9093 cpu_V1 = cpu_F1d;
9094 /* FIXME: cpu_M0 can probably be the same as cpu_V0. */
9095 cpu_M0 = tcg_temp_new_i64();
9096 next_page_start = (pc_start & TARGET_PAGE_MASK) + TARGET_PAGE_SIZE;
9097 lj = -1;
9098 num_insns = 0;
9099 max_insns = tb->cflags & CF_COUNT_MASK;
9100 if (max_insns == 0)
9101 max_insns = CF_COUNT_MASK;
9103 gen_icount_start();
9104 /* Reset the conditional execution bits immediately. This avoids
9105 complications trying to do it at the end of the block. */
9106 if (env->condexec_bits)
9107 {
9108 TCGv tmp = new_tmp();
9109 tcg_gen_movi_i32(tmp, 0);
9110 store_cpu_field(tmp, condexec_bits);
9111 }
9112 do {
9113 #ifdef CONFIG_USER_ONLY
9114 /* Intercept jump to the magic kernel page. */
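/* 0xffff0000 upwards is the Linux vector/helper page ("commpage");
   raising EXCP_KERNEL_TRAP lets the usermode emulation layer handle
   the kuser helpers directly instead of translating code from that
   page (this relies on the linux-user handling of EXCP_KERNEL_TRAP,
   which lives outside this file).  */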
9115 if (dc->pc >= 0xffff0000) {
9116 /* We always get here via a jump, so know we are not in a
9117 conditional execution block. */
9118 gen_exception(EXCP_KERNEL_TRAP);
9119 dc->is_jmp = DISAS_UPDATE;
9120 break;
9121 }
9122 #else
9123 if (dc->pc >= 0xfffffff0 && IS_M(env)) {
9124 /* We always get here via a jump, so know we are not in a
9125 conditional execution block. */
9126 gen_exception(EXCP_EXCEPTION_EXIT);
9127 dc->is_jmp = DISAS_UPDATE;
9128 break;
9129 }
9130 #endif
9132 if (unlikely(!QTAILQ_EMPTY(&env->breakpoints))) {
9133 QTAILQ_FOREACH(bp, &env->breakpoints, entry) {
9134 if (bp->pc == dc->pc) {
9135 gen_set_condexec(dc);
9136 gen_set_pc_im(dc->pc);
9137 gen_exception(EXCP_DEBUG);
9138 dc->is_jmp = DISAS_JUMP;
9139 /* Advance PC so that clearing the breakpoint will
9140 invalidate this TB. */
9141 dc->pc += 2;
9142 goto done_generating;
9143 break;
9144 }
9145 }
9146 }
9147 if (search_pc) {
9148 j = gen_opc_ptr - gen_opc_buf;
9149 if (lj < j) {
9150 lj++;
9151 while (lj < j)
9152 gen_opc_instr_start[lj++] = 0;
9153 }
9154 gen_opc_pc[lj] = dc->pc;
9155 gen_opc_instr_start[lj] = 1;
9156 gen_opc_icount[lj] = num_insns;
9157 }
9159 if (num_insns + 1 == max_insns && (tb->cflags & CF_LAST_IO))
9160 gen_io_start();
9162 if (env->thumb) {
9163 disas_thumb_insn(env, dc);
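/* Advance the IT-block state after each Thumb insn: the next
   then/else bit from the mask becomes the low bit of the condition,
   the mask shifts up by one, and once it is empty the condition is
   cleared so subsequent insns execute unconditionally.  */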
9164 if (dc->condexec_mask) {
9165 dc->condexec_cond = (dc->condexec_cond & 0xe)
9166 | ((dc->condexec_mask >> 4) & 1);
9167 dc->condexec_mask = (dc->condexec_mask << 1) & 0x1f;
9168 if (dc->condexec_mask == 0) {
9169 dc->condexec_cond = 0;
9170 }
9171 }
9172 } else {
9173 disas_arm_insn(env, dc);
9174 }
9175 if (num_temps) {
9176 fprintf(stderr, "Internal resource leak before %08x\n", dc->pc);
9177 num_temps = 0;
9178 }
9180 if (dc->condjmp && !dc->is_jmp) {
9181 gen_set_label(dc->condlabel);
9182 dc->condjmp = 0;
9183 }
9184 /* Translation stops when a conditional branch is encountered.
9185 * Otherwise the subsequent code could get translated several times.
9186 * Also stop translation when a page boundary is reached. This
9187 * ensures prefetch aborts occur at the right place. */
9188 num_insns ++;
9189 } while (!dc->is_jmp && gen_opc_ptr < gen_opc_end &&
9190 !env->singlestep_enabled &&
9191 !singlestep &&
9192 dc->pc < next_page_start &&
9193 num_insns < max_insns);
9195 if (tb->cflags & CF_LAST_IO) {
9196 if (dc->condjmp) {
9197 /* FIXME: This can theoretically happen with self-modifying
9198 code. */
9199 cpu_abort(env, "IO on conditional branch instruction");
9200 }
9201 gen_io_end();
9202 }
9204 /* At this stage dc->condjmp will only be set when the skipped
9205 instruction was a conditional branch or trap, and the PC has
9206 already been written. */
9207 if (unlikely(env->singlestep_enabled)) {
9208 /* Make sure the pc is updated, and raise a debug exception. */
9209 if (dc->condjmp) {
9210 gen_set_condexec(dc);
9211 if (dc->is_jmp == DISAS_SWI) {
9212 gen_exception(EXCP_SWI);
9213 } else {
9214 gen_exception(EXCP_DEBUG);
9215 }
9216 gen_set_label(dc->condlabel);
9217 }
9218 if (dc->condjmp || !dc->is_jmp) {
9219 gen_set_pc_im(dc->pc);
9220 dc->condjmp = 0;
9221 }
9222 gen_set_condexec(dc);
9223 if (dc->is_jmp == DISAS_SWI && !dc->condjmp) {
9224 gen_exception(EXCP_SWI);
9225 } else {
9226 /* FIXME: Single stepping a WFI insn will not halt
9227 the CPU. */
9228 gen_exception(EXCP_DEBUG);
9229 }
9230 } else {
9231 /* While branches must always occur at the end of an IT block,
9232 there are a few other things that can cause us to terminate
9233 the TB in the middle of an IT block:
9234 - Exception generating instructions (bkpt, swi, undefined).
9235 - Page boundaries.
9236 - Hardware watchpoints.
9237 Hardware breakpoints have already been handled and skip this code.
9238 */
9239 gen_set_condexec(dc);
9240 switch(dc->is_jmp) {
9241 case DISAS_NEXT:
9242 gen_goto_tb(dc, 1, dc->pc);
9243 break;
9244 default:
9245 case DISAS_JUMP:
9246 case DISAS_UPDATE:
9247 /* indicate that the hash table must be used to find the next TB */
9248 tcg_gen_exit_tb(0);
9249 break;
9250 case DISAS_TB_JUMP:
9251 /* nothing more to generate */
9252 break;
9253 case DISAS_WFI:
9254 gen_helper_wfi();
9255 break;
9256 case DISAS_SWI:
9257 gen_exception(EXCP_SWI);
9258 break;
9259 }
9260 if (dc->condjmp) {
9261 gen_set_label(dc->condlabel);
9262 gen_set_condexec(dc);
9263 gen_goto_tb(dc, 1, dc->pc);
9264 dc->condjmp = 0;
9265 }
9266 }
9268 done_generating:
9269 gen_icount_end(tb, num_insns);
9270 *gen_opc_ptr = INDEX_op_end;
9272 #ifdef DEBUG_DISAS
9273 if (qemu_loglevel_mask(CPU_LOG_TB_IN_ASM)) {
9274 qemu_log("----------------\n");
9275 qemu_log("IN: %s\n", lookup_symbol(pc_start));
9276 log_target_disas(pc_start, dc->pc - pc_start, env->thumb);
9277 qemu_log("\n");
9278 }
9279 #endif
9280 if (search_pc) {
9281 j = gen_opc_ptr - gen_opc_buf;
9282 lj++;
9283 while (lj <= j)
9284 gen_opc_instr_start[lj++] = 0;
9285 } else {
9286 tb->size = dc->pc - pc_start;
9287 tb->icount = num_insns;
9288 }
9289 }
9291 void gen_intermediate_code(CPUState *env, TranslationBlock *tb)
9292 {
9293 gen_intermediate_code_internal(env, tb, 0);
9294 }
9296 void gen_intermediate_code_pc(CPUState *env, TranslationBlock *tb)
9297 {
9298 gen_intermediate_code_internal(env, tb, 1);
9299 }
9301 static const char *cpu_mode_names[16] = {
9302 "usr", "fiq", "irq", "svc", "???", "???", "???", "abt",
9303 "???", "???", "???", "und", "???", "???", "???", "sys"
9306 void cpu_dump_state(CPUState *env, FILE *f, fprintf_function cpu_fprintf,
9307 int flags)
9308 {
9309 int i;
9310 #if 0
9311 union {
9312 uint32_t i;
9313 float s;
9314 } s0, s1;
9315 CPU_DoubleU d;
9316 /* ??? This assumes float64 and double have the same layout.
9317 Oh well, it's only debug dumps. */
9318 union {
9319 float64 f64;
9320 double d;
9321 } d0;
9322 #endif
9323 uint32_t psr;
9325 for(i=0;i<16;i++) {
9326 cpu_fprintf(f, "R%02d=%08x", i, env->regs[i]);
9327 if ((i % 4) == 3)
9328 cpu_fprintf(f, "\n");
9329 else
9330 cpu_fprintf(f, " ");
9332 psr = cpsr_read(env);
9333 cpu_fprintf(f, "PSR=%08x %c%c%c%c %c %s%d\n",
9334 psr,
9335 psr & (1 << 31) ? 'N' : '-',
9336 psr & (1 << 30) ? 'Z' : '-',
9337 psr & (1 << 29) ? 'C' : '-',
9338 psr & (1 << 28) ? 'V' : '-',
9339 psr & CPSR_T ? 'T' : 'A',
9340 cpu_mode_names[psr & 0xf], (psr & 0x10) ? 32 : 26);
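/* The T/A flag above distinguishes Thumb from ARM state, and the
   trailing 32/26 reports whether the mode field has bit 4 set (a
   32-bit mode) or clear (a legacy 26-bit mode).  */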
9342 #if 0
9343 for (i = 0; i < 16; i++) {
9344 d.d = env->vfp.regs[i];
9345 s0.i = d.l.lower;
9346 s1.i = d.l.upper;
9347 d0.f64 = d.d;
9348 cpu_fprintf(f, "s%02d=%08x(%8g) s%02d=%08x(%8g) d%02d=%08x%08x(%8g)\n",
9349 i * 2, (int)s0.i, s0.s,
9350 i * 2 + 1, (int)s1.i, s1.s,
9351 i, (int)(uint32_t)d.l.upper, (int)(uint32_t)d.l.lower,
9352 d0.d);
9353 }
9354 cpu_fprintf(f, "FPSCR: %08x\n", (int)env->vfp.xregs[ARM_VFP_FPSCR]);
9355 #endif
9356 }
9358 void gen_pc_load(CPUState *env, TranslationBlock *tb,
9359 unsigned long searched_pc, int pc_pos, void *puc)
9360 {
9361 env->regs[15] = gen_opc_pc[pc_pos];