4 * Copyright (c) 2003 Fabrice Bellard
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
26 #include "qemu/host-utils.h"
28 #include "disas/disas.h"
35 #define PREFIX_REPZ 0x01
36 #define PREFIX_REPNZ 0x02
37 #define PREFIX_LOCK 0x04
38 #define PREFIX_DATA 0x08
39 #define PREFIX_ADR 0x10
40 #define PREFIX_VEX 0x20
43 #define CODE64(s) ((s)->code64)
44 #define REX_X(s) ((s)->rex_x)
45 #define REX_B(s) ((s)->rex_b)
60 //#define MACRO_TEST 1
62 /* global register indexes */
63 static TCGv_ptr cpu_env
;
65 static TCGv cpu_cc_dst
, cpu_cc_src
, cpu_cc_src2
, cpu_cc_srcT
;
66 static TCGv_i32 cpu_cc_op
;
67 static TCGv cpu_regs
[CPU_NB_REGS
];
70 /* local register indexes (only used inside old micro ops) */
71 static TCGv cpu_tmp0
, cpu_tmp4
;
72 static TCGv_ptr cpu_ptr0
, cpu_ptr1
;
73 static TCGv_i32 cpu_tmp2_i32
, cpu_tmp3_i32
;
74 static TCGv_i64 cpu_tmp1_i64
;
76 static uint8_t gen_opc_cc_op
[OPC_BUF_SIZE
];
78 #include "exec/gen-icount.h"
81 static int x86_64_hregs
;
84 typedef struct DisasContext
{
85 /* current insn context */
86 int override
; /* -1 if no override */
89 target_ulong pc
; /* pc = eip + cs_base */
90 int is_jmp
; /* 1 = means jump (stop translation), 2 means CPU
91 static state change (stop translation) */
92 /* current block context */
93 target_ulong cs_base
; /* base of CS segment */
94 int pe
; /* protected mode */
95 int code32
; /* 32 bit code segment */
97 int lma
; /* long mode active */
98 int code64
; /* 64 bit code segment */
101 int vex_l
; /* vex vector length */
102 int vex_v
; /* vex vvvv register, without 1's compliment. */
103 int ss32
; /* 32 bit stack segment */
104 CCOp cc_op
; /* current CC operation */
106 int addseg
; /* non zero if either DS/ES/SS have a non zero base */
107 int f_st
; /* currently unused */
108 int vm86
; /* vm86 mode */
111 int tf
; /* TF cpu flag */
112 int singlestep_enabled
; /* "hardware" single step enabled */
113 int jmp_opt
; /* use direct block chaining for direct jumps */
114 int mem_index
; /* select memory access functions */
115 uint64_t flags
; /* all execution flags */
116 struct TranslationBlock
*tb
;
117 int popl_esp_hack
; /* for correct popl with esp base handling */
118 int rip_offset
; /* only used in x86_64, but left for simplicity */
120 int cpuid_ext_features
;
121 int cpuid_ext2_features
;
122 int cpuid_ext3_features
;
123 int cpuid_7_0_ebx_features
;
126 static void gen_eob(DisasContext
*s
);
127 static void gen_jmp(DisasContext
*s
, target_ulong eip
);
128 static void gen_jmp_tb(DisasContext
*s
, target_ulong eip
, int tb_num
);
129 static void gen_op(DisasContext
*s1
, int op
, int ot
, int d
);
131 /* i386 arith/logic operations */
151 OP_SHL1
, /* undocumented */
175 /* I386 int registers */
176 OR_EAX
, /* MUST be even numbered */
185 OR_TMP0
= 16, /* temporary operand register */
187 OR_A0
, /* temporary register used when doing address evaluation */
197 /* Bit set if the global variable is live after setting CC_OP to X. */
198 static const uint8_t cc_op_live
[CC_OP_NB
] = {
199 [CC_OP_DYNAMIC
] = USES_CC_DST
| USES_CC_SRC
| USES_CC_SRC2
,
200 [CC_OP_EFLAGS
] = USES_CC_SRC
,
201 [CC_OP_MULB
... CC_OP_MULQ
] = USES_CC_DST
| USES_CC_SRC
,
202 [CC_OP_ADDB
... CC_OP_ADDQ
] = USES_CC_DST
| USES_CC_SRC
,
203 [CC_OP_ADCB
... CC_OP_ADCQ
] = USES_CC_DST
| USES_CC_SRC
| USES_CC_SRC2
,
204 [CC_OP_SUBB
... CC_OP_SUBQ
] = USES_CC_DST
| USES_CC_SRC
| USES_CC_SRCT
,
205 [CC_OP_SBBB
... CC_OP_SBBQ
] = USES_CC_DST
| USES_CC_SRC
| USES_CC_SRC2
,
206 [CC_OP_LOGICB
... CC_OP_LOGICQ
] = USES_CC_DST
,
207 [CC_OP_INCB
... CC_OP_INCQ
] = USES_CC_DST
| USES_CC_SRC
,
208 [CC_OP_DECB
... CC_OP_DECQ
] = USES_CC_DST
| USES_CC_SRC
,
209 [CC_OP_SHLB
... CC_OP_SHLQ
] = USES_CC_DST
| USES_CC_SRC
,
210 [CC_OP_SARB
... CC_OP_SARQ
] = USES_CC_DST
| USES_CC_SRC
,
211 [CC_OP_BMILGB
... CC_OP_BMILGQ
] = USES_CC_DST
| USES_CC_SRC
,
212 [CC_OP_ADCX
] = USES_CC_DST
| USES_CC_SRC
,
213 [CC_OP_ADOX
] = USES_CC_SRC
| USES_CC_SRC2
,
214 [CC_OP_ADCOX
] = USES_CC_DST
| USES_CC_SRC
| USES_CC_SRC2
,
218 static void set_cc_op(DisasContext
*s
, CCOp op
)
222 if (s
->cc_op
== op
) {
226 /* Discard CC computation that will no longer be used. */
227 dead
= cc_op_live
[s
->cc_op
] & ~cc_op_live
[op
];
228 if (dead
& USES_CC_DST
) {
229 tcg_gen_discard_tl(cpu_cc_dst
);
231 if (dead
& USES_CC_SRC
) {
232 tcg_gen_discard_tl(cpu_cc_src
);
234 if (dead
& USES_CC_SRC2
) {
235 tcg_gen_discard_tl(cpu_cc_src2
);
237 if (dead
& USES_CC_SRCT
) {
238 tcg_gen_discard_tl(cpu_cc_srcT
);
241 if (op
== CC_OP_DYNAMIC
) {
242 /* The DYNAMIC setting is translator only, and should never be
243 stored. Thus we always consider it clean. */
244 s
->cc_op_dirty
= false;
246 /* Discard any computed CC_OP value (see shifts). */
247 if (s
->cc_op
== CC_OP_DYNAMIC
) {
248 tcg_gen_discard_i32(cpu_cc_op
);
250 s
->cc_op_dirty
= true;
255 static void gen_update_cc_op(DisasContext
*s
)
257 if (s
->cc_op_dirty
) {
258 tcg_gen_movi_i32(cpu_cc_op
, s
->cc_op
);
259 s
->cc_op_dirty
= false;
263 static inline void gen_op_movl_T0_0(void)
265 tcg_gen_movi_tl(cpu_T
[0], 0);
268 static inline void gen_op_movl_T0_im(int32_t val
)
270 tcg_gen_movi_tl(cpu_T
[0], val
);
273 static inline void gen_op_movl_T0_imu(uint32_t val
)
275 tcg_gen_movi_tl(cpu_T
[0], val
);
278 static inline void gen_op_movl_T1_im(int32_t val
)
280 tcg_gen_movi_tl(cpu_T
[1], val
);
283 static inline void gen_op_movl_T1_imu(uint32_t val
)
285 tcg_gen_movi_tl(cpu_T
[1], val
);
288 static inline void gen_op_movl_A0_im(uint32_t val
)
290 tcg_gen_movi_tl(cpu_A0
, val
);
294 static inline void gen_op_movq_A0_im(int64_t val
)
296 tcg_gen_movi_tl(cpu_A0
, val
);
300 static inline void gen_movtl_T0_im(target_ulong val
)
302 tcg_gen_movi_tl(cpu_T
[0], val
);
305 static inline void gen_movtl_T1_im(target_ulong val
)
307 tcg_gen_movi_tl(cpu_T
[1], val
);
310 static inline void gen_op_andl_T0_ffff(void)
312 tcg_gen_andi_tl(cpu_T
[0], cpu_T
[0], 0xffff);
315 static inline void gen_op_andl_T0_im(uint32_t val
)
317 tcg_gen_andi_tl(cpu_T
[0], cpu_T
[0], val
);
320 static inline void gen_op_movl_T0_T1(void)
322 tcg_gen_mov_tl(cpu_T
[0], cpu_T
[1]);
325 static inline void gen_op_andl_A0_ffff(void)
327 tcg_gen_andi_tl(cpu_A0
, cpu_A0
, 0xffff);
332 #define NB_OP_SIZES 4
334 #else /* !TARGET_X86_64 */
336 #define NB_OP_SIZES 3
338 #endif /* !TARGET_X86_64 */
340 #if defined(HOST_WORDS_BIGENDIAN)
341 #define REG_B_OFFSET (sizeof(target_ulong) - 1)
342 #define REG_H_OFFSET (sizeof(target_ulong) - 2)
343 #define REG_W_OFFSET (sizeof(target_ulong) - 2)
344 #define REG_L_OFFSET (sizeof(target_ulong) - 4)
345 #define REG_LH_OFFSET (sizeof(target_ulong) - 8)
347 #define REG_B_OFFSET 0
348 #define REG_H_OFFSET 1
349 #define REG_W_OFFSET 0
350 #define REG_L_OFFSET 0
351 #define REG_LH_OFFSET 4
354 /* In instruction encodings for byte register accesses the
355 * register number usually indicates "low 8 bits of register N";
356 * however there are some special cases where N 4..7 indicates
357 * [AH, CH, DH, BH], ie "bits 15..8 of register N-4". Return
358 * true for this special case, false otherwise.
360 static inline bool byte_reg_is_xH(int reg
)
366 if (reg
>= 8 || x86_64_hregs
) {
373 static inline void gen_op_mov_reg_v(int ot
, int reg
, TCGv t0
)
377 if (!byte_reg_is_xH(reg
)) {
378 tcg_gen_deposit_tl(cpu_regs
[reg
], cpu_regs
[reg
], t0
, 0, 8);
380 tcg_gen_deposit_tl(cpu_regs
[reg
- 4], cpu_regs
[reg
- 4], t0
, 8, 8);
384 tcg_gen_deposit_tl(cpu_regs
[reg
], cpu_regs
[reg
], t0
, 0, 16);
386 default: /* XXX this shouldn't be reached; abort? */
388 /* For x86_64, this sets the higher half of register to zero.
389 For i386, this is equivalent to a mov. */
390 tcg_gen_ext32u_tl(cpu_regs
[reg
], t0
);
394 tcg_gen_mov_tl(cpu_regs
[reg
], t0
);
400 static inline void gen_op_mov_reg_T0(int ot
, int reg
)
402 gen_op_mov_reg_v(ot
, reg
, cpu_T
[0]);
405 static inline void gen_op_mov_reg_T1(int ot
, int reg
)
407 gen_op_mov_reg_v(ot
, reg
, cpu_T
[1]);
410 static inline void gen_op_mov_reg_A0(int size
, int reg
)
414 tcg_gen_deposit_tl(cpu_regs
[reg
], cpu_regs
[reg
], cpu_A0
, 0, 16);
416 default: /* XXX this shouldn't be reached; abort? */
418 /* For x86_64, this sets the higher half of register to zero.
419 For i386, this is equivalent to a mov. */
420 tcg_gen_ext32u_tl(cpu_regs
[reg
], cpu_A0
);
424 tcg_gen_mov_tl(cpu_regs
[reg
], cpu_A0
);
430 static inline void gen_op_mov_v_reg(int ot
, TCGv t0
, int reg
)
432 if (ot
== OT_BYTE
&& byte_reg_is_xH(reg
)) {
433 tcg_gen_shri_tl(t0
, cpu_regs
[reg
- 4], 8);
434 tcg_gen_ext8u_tl(t0
, t0
);
436 tcg_gen_mov_tl(t0
, cpu_regs
[reg
]);
440 static inline void gen_op_mov_TN_reg(int ot
, int t_index
, int reg
)
442 gen_op_mov_v_reg(ot
, cpu_T
[t_index
], reg
);
445 static inline void gen_op_movl_A0_reg(int reg
)
447 tcg_gen_mov_tl(cpu_A0
, cpu_regs
[reg
]);
450 static inline void gen_op_addl_A0_im(int32_t val
)
452 tcg_gen_addi_tl(cpu_A0
, cpu_A0
, val
);
454 tcg_gen_andi_tl(cpu_A0
, cpu_A0
, 0xffffffff);
459 static inline void gen_op_addq_A0_im(int64_t val
)
461 tcg_gen_addi_tl(cpu_A0
, cpu_A0
, val
);
465 static void gen_add_A0_im(DisasContext
*s
, int val
)
469 gen_op_addq_A0_im(val
);
472 gen_op_addl_A0_im(val
);
475 static inline void gen_op_addl_T0_T1(void)
477 tcg_gen_add_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
480 static inline void gen_op_jmp_T0(void)
482 tcg_gen_st_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
, eip
));
485 static inline void gen_op_add_reg_im(int size
, int reg
, int32_t val
)
489 tcg_gen_addi_tl(cpu_tmp0
, cpu_regs
[reg
], val
);
490 tcg_gen_deposit_tl(cpu_regs
[reg
], cpu_regs
[reg
], cpu_tmp0
, 0, 16);
493 tcg_gen_addi_tl(cpu_tmp0
, cpu_regs
[reg
], val
);
494 /* For x86_64, this sets the higher half of register to zero.
495 For i386, this is equivalent to a nop. */
496 tcg_gen_ext32u_tl(cpu_tmp0
, cpu_tmp0
);
497 tcg_gen_mov_tl(cpu_regs
[reg
], cpu_tmp0
);
501 tcg_gen_addi_tl(cpu_regs
[reg
], cpu_regs
[reg
], val
);
507 static inline void gen_op_add_reg_T0(int size
, int reg
)
511 tcg_gen_add_tl(cpu_tmp0
, cpu_regs
[reg
], cpu_T
[0]);
512 tcg_gen_deposit_tl(cpu_regs
[reg
], cpu_regs
[reg
], cpu_tmp0
, 0, 16);
515 tcg_gen_add_tl(cpu_tmp0
, cpu_regs
[reg
], cpu_T
[0]);
516 /* For x86_64, this sets the higher half of register to zero.
517 For i386, this is equivalent to a nop. */
518 tcg_gen_ext32u_tl(cpu_tmp0
, cpu_tmp0
);
519 tcg_gen_mov_tl(cpu_regs
[reg
], cpu_tmp0
);
523 tcg_gen_add_tl(cpu_regs
[reg
], cpu_regs
[reg
], cpu_T
[0]);
529 static inline void gen_op_addl_A0_reg_sN(int shift
, int reg
)
531 tcg_gen_mov_tl(cpu_tmp0
, cpu_regs
[reg
]);
533 tcg_gen_shli_tl(cpu_tmp0
, cpu_tmp0
, shift
);
534 tcg_gen_add_tl(cpu_A0
, cpu_A0
, cpu_tmp0
);
535 /* For x86_64, this sets the higher half of register to zero.
536 For i386, this is equivalent to a nop. */
537 tcg_gen_ext32u_tl(cpu_A0
, cpu_A0
);
540 static inline void gen_op_movl_A0_seg(int reg
)
542 tcg_gen_ld32u_tl(cpu_A0
, cpu_env
, offsetof(CPUX86State
, segs
[reg
].base
) + REG_L_OFFSET
);
545 static inline void gen_op_addl_A0_seg(DisasContext
*s
, int reg
)
547 tcg_gen_ld_tl(cpu_tmp0
, cpu_env
, offsetof(CPUX86State
, segs
[reg
].base
));
550 tcg_gen_andi_tl(cpu_A0
, cpu_A0
, 0xffffffff);
551 tcg_gen_add_tl(cpu_A0
, cpu_A0
, cpu_tmp0
);
553 tcg_gen_add_tl(cpu_A0
, cpu_A0
, cpu_tmp0
);
554 tcg_gen_andi_tl(cpu_A0
, cpu_A0
, 0xffffffff);
557 tcg_gen_add_tl(cpu_A0
, cpu_A0
, cpu_tmp0
);
562 static inline void gen_op_movq_A0_seg(int reg
)
564 tcg_gen_ld_tl(cpu_A0
, cpu_env
, offsetof(CPUX86State
, segs
[reg
].base
));
567 static inline void gen_op_addq_A0_seg(int reg
)
569 tcg_gen_ld_tl(cpu_tmp0
, cpu_env
, offsetof(CPUX86State
, segs
[reg
].base
));
570 tcg_gen_add_tl(cpu_A0
, cpu_A0
, cpu_tmp0
);
573 static inline void gen_op_movq_A0_reg(int reg
)
575 tcg_gen_mov_tl(cpu_A0
, cpu_regs
[reg
]);
578 static inline void gen_op_addq_A0_reg_sN(int shift
, int reg
)
580 tcg_gen_mov_tl(cpu_tmp0
, cpu_regs
[reg
]);
582 tcg_gen_shli_tl(cpu_tmp0
, cpu_tmp0
, shift
);
583 tcg_gen_add_tl(cpu_A0
, cpu_A0
, cpu_tmp0
);
587 static inline void gen_op_lds_T0_A0(int idx
)
589 int mem_index
= (idx
>> 2) - 1;
592 tcg_gen_qemu_ld8s(cpu_T
[0], cpu_A0
, mem_index
);
595 tcg_gen_qemu_ld16s(cpu_T
[0], cpu_A0
, mem_index
);
599 tcg_gen_qemu_ld32s(cpu_T
[0], cpu_A0
, mem_index
);
604 static inline void gen_op_ld_v(int idx
, TCGv t0
, TCGv a0
)
606 int mem_index
= (idx
>> 2) - 1;
609 tcg_gen_qemu_ld8u(t0
, a0
, mem_index
);
612 tcg_gen_qemu_ld16u(t0
, a0
, mem_index
);
615 tcg_gen_qemu_ld32u(t0
, a0
, mem_index
);
619 /* Should never happen on 32-bit targets. */
621 tcg_gen_qemu_ld64(t0
, a0
, mem_index
);
627 /* XXX: always use ldu or lds */
628 static inline void gen_op_ld_T0_A0(int idx
)
630 gen_op_ld_v(idx
, cpu_T
[0], cpu_A0
);
633 static inline void gen_op_ldu_T0_A0(int idx
)
635 gen_op_ld_v(idx
, cpu_T
[0], cpu_A0
);
638 static inline void gen_op_ld_T1_A0(int idx
)
640 gen_op_ld_v(idx
, cpu_T
[1], cpu_A0
);
643 static inline void gen_op_st_v(int idx
, TCGv t0
, TCGv a0
)
645 int mem_index
= (idx
>> 2) - 1;
648 tcg_gen_qemu_st8(t0
, a0
, mem_index
);
651 tcg_gen_qemu_st16(t0
, a0
, mem_index
);
654 tcg_gen_qemu_st32(t0
, a0
, mem_index
);
658 /* Should never happen on 32-bit targets. */
660 tcg_gen_qemu_st64(t0
, a0
, mem_index
);
666 static inline void gen_op_st_T0_A0(int idx
)
668 gen_op_st_v(idx
, cpu_T
[0], cpu_A0
);
671 static inline void gen_op_st_T1_A0(int idx
)
673 gen_op_st_v(idx
, cpu_T
[1], cpu_A0
);
676 static inline void gen_jmp_im(target_ulong pc
)
678 tcg_gen_movi_tl(cpu_tmp0
, pc
);
679 tcg_gen_st_tl(cpu_tmp0
, cpu_env
, offsetof(CPUX86State
, eip
));
682 static inline void gen_string_movl_A0_ESI(DisasContext
*s
)
686 override
= s
->override
;
690 gen_op_movq_A0_seg(override
);
691 gen_op_addq_A0_reg_sN(0, R_ESI
);
693 gen_op_movq_A0_reg(R_ESI
);
699 if (s
->addseg
&& override
< 0)
702 gen_op_movl_A0_seg(override
);
703 gen_op_addl_A0_reg_sN(0, R_ESI
);
705 gen_op_movl_A0_reg(R_ESI
);
708 /* 16 address, always override */
711 gen_op_movl_A0_reg(R_ESI
);
712 gen_op_andl_A0_ffff();
713 gen_op_addl_A0_seg(s
, override
);
717 static inline void gen_string_movl_A0_EDI(DisasContext
*s
)
721 gen_op_movq_A0_reg(R_EDI
);
726 gen_op_movl_A0_seg(R_ES
);
727 gen_op_addl_A0_reg_sN(0, R_EDI
);
729 gen_op_movl_A0_reg(R_EDI
);
732 gen_op_movl_A0_reg(R_EDI
);
733 gen_op_andl_A0_ffff();
734 gen_op_addl_A0_seg(s
, R_ES
);
738 static inline void gen_op_movl_T0_Dshift(int ot
)
740 tcg_gen_ld32s_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
, df
));
741 tcg_gen_shli_tl(cpu_T
[0], cpu_T
[0], ot
);
744 static TCGv
gen_ext_tl(TCGv dst
, TCGv src
, int size
, bool sign
)
749 tcg_gen_ext8s_tl(dst
, src
);
751 tcg_gen_ext8u_tl(dst
, src
);
756 tcg_gen_ext16s_tl(dst
, src
);
758 tcg_gen_ext16u_tl(dst
, src
);
764 tcg_gen_ext32s_tl(dst
, src
);
766 tcg_gen_ext32u_tl(dst
, src
);
775 static void gen_extu(int ot
, TCGv reg
)
777 gen_ext_tl(reg
, reg
, ot
, false);
780 static void gen_exts(int ot
, TCGv reg
)
782 gen_ext_tl(reg
, reg
, ot
, true);
785 static inline void gen_op_jnz_ecx(int size
, int label1
)
787 tcg_gen_mov_tl(cpu_tmp0
, cpu_regs
[R_ECX
]);
788 gen_extu(size
+ 1, cpu_tmp0
);
789 tcg_gen_brcondi_tl(TCG_COND_NE
, cpu_tmp0
, 0, label1
);
792 static inline void gen_op_jz_ecx(int size
, int label1
)
794 tcg_gen_mov_tl(cpu_tmp0
, cpu_regs
[R_ECX
]);
795 gen_extu(size
+ 1, cpu_tmp0
);
796 tcg_gen_brcondi_tl(TCG_COND_EQ
, cpu_tmp0
, 0, label1
);
799 static void gen_helper_in_func(int ot
, TCGv v
, TCGv_i32 n
)
803 gen_helper_inb(v
, n
);
806 gen_helper_inw(v
, n
);
809 gen_helper_inl(v
, n
);
814 static void gen_helper_out_func(int ot
, TCGv_i32 v
, TCGv_i32 n
)
818 gen_helper_outb(v
, n
);
821 gen_helper_outw(v
, n
);
824 gen_helper_outl(v
, n
);
829 static void gen_check_io(DisasContext
*s
, int ot
, target_ulong cur_eip
,
833 target_ulong next_eip
;
836 if (s
->pe
&& (s
->cpl
> s
->iopl
|| s
->vm86
)) {
840 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
843 gen_helper_check_iob(cpu_env
, cpu_tmp2_i32
);
846 gen_helper_check_iow(cpu_env
, cpu_tmp2_i32
);
849 gen_helper_check_iol(cpu_env
, cpu_tmp2_i32
);
853 if(s
->flags
& HF_SVMI_MASK
) {
858 svm_flags
|= (1 << (4 + ot
));
859 next_eip
= s
->pc
- s
->cs_base
;
860 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
861 gen_helper_svm_check_io(cpu_env
, cpu_tmp2_i32
,
862 tcg_const_i32(svm_flags
),
863 tcg_const_i32(next_eip
- cur_eip
));
867 static inline void gen_movs(DisasContext
*s
, int ot
)
869 gen_string_movl_A0_ESI(s
);
870 gen_op_ld_T0_A0(ot
+ s
->mem_index
);
871 gen_string_movl_A0_EDI(s
);
872 gen_op_st_T0_A0(ot
+ s
->mem_index
);
873 gen_op_movl_T0_Dshift(ot
);
874 gen_op_add_reg_T0(s
->aflag
, R_ESI
);
875 gen_op_add_reg_T0(s
->aflag
, R_EDI
);
878 static void gen_op_update1_cc(void)
880 tcg_gen_mov_tl(cpu_cc_dst
, cpu_T
[0]);
883 static void gen_op_update2_cc(void)
885 tcg_gen_mov_tl(cpu_cc_src
, cpu_T
[1]);
886 tcg_gen_mov_tl(cpu_cc_dst
, cpu_T
[0]);
889 static void gen_op_update3_cc(TCGv reg
)
891 tcg_gen_mov_tl(cpu_cc_src2
, reg
);
892 tcg_gen_mov_tl(cpu_cc_src
, cpu_T
[1]);
893 tcg_gen_mov_tl(cpu_cc_dst
, cpu_T
[0]);
896 static inline void gen_op_testl_T0_T1_cc(void)
898 tcg_gen_and_tl(cpu_cc_dst
, cpu_T
[0], cpu_T
[1]);
901 static void gen_op_update_neg_cc(void)
903 tcg_gen_mov_tl(cpu_cc_dst
, cpu_T
[0]);
904 tcg_gen_neg_tl(cpu_cc_src
, cpu_T
[0]);
905 tcg_gen_movi_tl(cpu_cc_srcT
, 0);
908 /* compute all eflags to cc_src */
909 static void gen_compute_eflags(DisasContext
*s
)
911 TCGv zero
, dst
, src1
, src2
;
914 if (s
->cc_op
== CC_OP_EFLAGS
) {
917 if (s
->cc_op
== CC_OP_CLR
) {
918 tcg_gen_movi_tl(cpu_cc_src
, CC_Z
);
919 set_cc_op(s
, CC_OP_EFLAGS
);
928 /* Take care to not read values that are not live. */
929 live
= cc_op_live
[s
->cc_op
] & ~USES_CC_SRCT
;
930 dead
= live
^ (USES_CC_DST
| USES_CC_SRC
| USES_CC_SRC2
);
932 zero
= tcg_const_tl(0);
933 if (dead
& USES_CC_DST
) {
936 if (dead
& USES_CC_SRC
) {
939 if (dead
& USES_CC_SRC2
) {
945 gen_helper_cc_compute_all(cpu_cc_src
, dst
, src1
, src2
, cpu_cc_op
);
946 set_cc_op(s
, CC_OP_EFLAGS
);
953 typedef struct CCPrepare
{
963 /* compute eflags.C to reg */
964 static CCPrepare
gen_prepare_eflags_c(DisasContext
*s
, TCGv reg
)
970 case CC_OP_SUBB
... CC_OP_SUBQ
:
971 /* (DATA_TYPE)CC_SRCT < (DATA_TYPE)CC_SRC */
972 size
= s
->cc_op
- CC_OP_SUBB
;
973 t1
= gen_ext_tl(cpu_tmp0
, cpu_cc_src
, size
, false);
974 /* If no temporary was used, be careful not to alias t1 and t0. */
975 t0
= TCGV_EQUAL(t1
, cpu_cc_src
) ? cpu_tmp0
: reg
;
976 tcg_gen_mov_tl(t0
, cpu_cc_srcT
);
980 case CC_OP_ADDB
... CC_OP_ADDQ
:
981 /* (DATA_TYPE)CC_DST < (DATA_TYPE)CC_SRC */
982 size
= s
->cc_op
- CC_OP_ADDB
;
983 t1
= gen_ext_tl(cpu_tmp0
, cpu_cc_src
, size
, false);
984 t0
= gen_ext_tl(reg
, cpu_cc_dst
, size
, false);
986 return (CCPrepare
) { .cond
= TCG_COND_LTU
, .reg
= t0
,
987 .reg2
= t1
, .mask
= -1, .use_reg2
= true };
989 case CC_OP_LOGICB
... CC_OP_LOGICQ
:
991 return (CCPrepare
) { .cond
= TCG_COND_NEVER
, .mask
= -1 };
993 case CC_OP_INCB
... CC_OP_INCQ
:
994 case CC_OP_DECB
... CC_OP_DECQ
:
995 return (CCPrepare
) { .cond
= TCG_COND_NE
, .reg
= cpu_cc_src
,
996 .mask
= -1, .no_setcond
= true };
998 case CC_OP_SHLB
... CC_OP_SHLQ
:
999 /* (CC_SRC >> (DATA_BITS - 1)) & 1 */
1000 size
= s
->cc_op
- CC_OP_SHLB
;
1001 shift
= (8 << size
) - 1;
1002 return (CCPrepare
) { .cond
= TCG_COND_NE
, .reg
= cpu_cc_src
,
1003 .mask
= (target_ulong
)1 << shift
};
1005 case CC_OP_MULB
... CC_OP_MULQ
:
1006 return (CCPrepare
) { .cond
= TCG_COND_NE
,
1007 .reg
= cpu_cc_src
, .mask
= -1 };
1009 case CC_OP_BMILGB
... CC_OP_BMILGQ
:
1010 size
= s
->cc_op
- CC_OP_BMILGB
;
1011 t0
= gen_ext_tl(reg
, cpu_cc_src
, size
, false);
1012 return (CCPrepare
) { .cond
= TCG_COND_EQ
, .reg
= t0
, .mask
= -1 };
1016 return (CCPrepare
) { .cond
= TCG_COND_NE
, .reg
= cpu_cc_dst
,
1017 .mask
= -1, .no_setcond
= true };
1020 case CC_OP_SARB
... CC_OP_SARQ
:
1022 return (CCPrepare
) { .cond
= TCG_COND_NE
,
1023 .reg
= cpu_cc_src
, .mask
= CC_C
};
1026 /* The need to compute only C from CC_OP_DYNAMIC is important
1027 in efficiently implementing e.g. INC at the start of a TB. */
1028 gen_update_cc_op(s
);
1029 gen_helper_cc_compute_c(reg
, cpu_cc_dst
, cpu_cc_src
,
1030 cpu_cc_src2
, cpu_cc_op
);
1031 return (CCPrepare
) { .cond
= TCG_COND_NE
, .reg
= reg
,
1032 .mask
= -1, .no_setcond
= true };
1036 /* compute eflags.P to reg */
1037 static CCPrepare
gen_prepare_eflags_p(DisasContext
*s
, TCGv reg
)
1039 gen_compute_eflags(s
);
1040 return (CCPrepare
) { .cond
= TCG_COND_NE
, .reg
= cpu_cc_src
,
1044 /* compute eflags.S to reg */
1045 static CCPrepare
gen_prepare_eflags_s(DisasContext
*s
, TCGv reg
)
1049 gen_compute_eflags(s
);
1055 return (CCPrepare
) { .cond
= TCG_COND_NE
, .reg
= cpu_cc_src
,
1058 return (CCPrepare
) { .cond
= TCG_COND_NEVER
, .mask
= -1 };
1061 int size
= (s
->cc_op
- CC_OP_ADDB
) & 3;
1062 TCGv t0
= gen_ext_tl(reg
, cpu_cc_dst
, size
, true);
1063 return (CCPrepare
) { .cond
= TCG_COND_LT
, .reg
= t0
, .mask
= -1 };
1068 /* compute eflags.O to reg */
1069 static CCPrepare
gen_prepare_eflags_o(DisasContext
*s
, TCGv reg
)
1074 return (CCPrepare
) { .cond
= TCG_COND_NE
, .reg
= cpu_cc_src2
,
1075 .mask
= -1, .no_setcond
= true };
1077 return (CCPrepare
) { .cond
= TCG_COND_NEVER
, .mask
= -1 };
1079 gen_compute_eflags(s
);
1080 return (CCPrepare
) { .cond
= TCG_COND_NE
, .reg
= cpu_cc_src
,
1085 /* compute eflags.Z to reg */
1086 static CCPrepare
gen_prepare_eflags_z(DisasContext
*s
, TCGv reg
)
1090 gen_compute_eflags(s
);
1096 return (CCPrepare
) { .cond
= TCG_COND_NE
, .reg
= cpu_cc_src
,
1099 return (CCPrepare
) { .cond
= TCG_COND_ALWAYS
, .mask
= -1 };
1102 int size
= (s
->cc_op
- CC_OP_ADDB
) & 3;
1103 TCGv t0
= gen_ext_tl(reg
, cpu_cc_dst
, size
, false);
1104 return (CCPrepare
) { .cond
= TCG_COND_EQ
, .reg
= t0
, .mask
= -1 };
1109 /* perform a conditional store into register 'reg' according to jump opcode
1110 value 'b'. In the fast case, T0 is guaranted not to be used. */
1111 static CCPrepare
gen_prepare_cc(DisasContext
*s
, int b
, TCGv reg
)
1113 int inv
, jcc_op
, size
, cond
;
1118 jcc_op
= (b
>> 1) & 7;
1121 case CC_OP_SUBB
... CC_OP_SUBQ
:
1122 /* We optimize relational operators for the cmp/jcc case. */
1123 size
= s
->cc_op
- CC_OP_SUBB
;
1126 tcg_gen_mov_tl(cpu_tmp4
, cpu_cc_srcT
);
1127 gen_extu(size
, cpu_tmp4
);
1128 t0
= gen_ext_tl(cpu_tmp0
, cpu_cc_src
, size
, false);
1129 cc
= (CCPrepare
) { .cond
= TCG_COND_LEU
, .reg
= cpu_tmp4
,
1130 .reg2
= t0
, .mask
= -1, .use_reg2
= true };
1139 tcg_gen_mov_tl(cpu_tmp4
, cpu_cc_srcT
);
1140 gen_exts(size
, cpu_tmp4
);
1141 t0
= gen_ext_tl(cpu_tmp0
, cpu_cc_src
, size
, true);
1142 cc
= (CCPrepare
) { .cond
= cond
, .reg
= cpu_tmp4
,
1143 .reg2
= t0
, .mask
= -1, .use_reg2
= true };
1153 /* This actually generates good code for JC, JZ and JS. */
1156 cc
= gen_prepare_eflags_o(s
, reg
);
1159 cc
= gen_prepare_eflags_c(s
, reg
);
1162 cc
= gen_prepare_eflags_z(s
, reg
);
1165 gen_compute_eflags(s
);
1166 cc
= (CCPrepare
) { .cond
= TCG_COND_NE
, .reg
= cpu_cc_src
,
1167 .mask
= CC_Z
| CC_C
};
1170 cc
= gen_prepare_eflags_s(s
, reg
);
1173 cc
= gen_prepare_eflags_p(s
, reg
);
1176 gen_compute_eflags(s
);
1177 if (TCGV_EQUAL(reg
, cpu_cc_src
)) {
1180 tcg_gen_shri_tl(reg
, cpu_cc_src
, 4); /* CC_O -> CC_S */
1181 tcg_gen_xor_tl(reg
, reg
, cpu_cc_src
);
1182 cc
= (CCPrepare
) { .cond
= TCG_COND_NE
, .reg
= reg
,
1187 gen_compute_eflags(s
);
1188 if (TCGV_EQUAL(reg
, cpu_cc_src
)) {
1191 tcg_gen_shri_tl(reg
, cpu_cc_src
, 4); /* CC_O -> CC_S */
1192 tcg_gen_xor_tl(reg
, reg
, cpu_cc_src
);
1193 cc
= (CCPrepare
) { .cond
= TCG_COND_NE
, .reg
= reg
,
1194 .mask
= CC_S
| CC_Z
};
1201 cc
.cond
= tcg_invert_cond(cc
.cond
);
1206 static void gen_setcc1(DisasContext
*s
, int b
, TCGv reg
)
1208 CCPrepare cc
= gen_prepare_cc(s
, b
, reg
);
1210 if (cc
.no_setcond
) {
1211 if (cc
.cond
== TCG_COND_EQ
) {
1212 tcg_gen_xori_tl(reg
, cc
.reg
, 1);
1214 tcg_gen_mov_tl(reg
, cc
.reg
);
1219 if (cc
.cond
== TCG_COND_NE
&& !cc
.use_reg2
&& cc
.imm
== 0 &&
1220 cc
.mask
!= 0 && (cc
.mask
& (cc
.mask
- 1)) == 0) {
1221 tcg_gen_shri_tl(reg
, cc
.reg
, ctztl(cc
.mask
));
1222 tcg_gen_andi_tl(reg
, reg
, 1);
1225 if (cc
.mask
!= -1) {
1226 tcg_gen_andi_tl(reg
, cc
.reg
, cc
.mask
);
1230 tcg_gen_setcond_tl(cc
.cond
, reg
, cc
.reg
, cc
.reg2
);
1232 tcg_gen_setcondi_tl(cc
.cond
, reg
, cc
.reg
, cc
.imm
);
1236 static inline void gen_compute_eflags_c(DisasContext
*s
, TCGv reg
)
1238 gen_setcc1(s
, JCC_B
<< 1, reg
);
1241 /* generate a conditional jump to label 'l1' according to jump opcode
1242 value 'b'. In the fast case, T0 is guaranted not to be used. */
1243 static inline void gen_jcc1_noeob(DisasContext
*s
, int b
, int l1
)
1245 CCPrepare cc
= gen_prepare_cc(s
, b
, cpu_T
[0]);
1247 if (cc
.mask
!= -1) {
1248 tcg_gen_andi_tl(cpu_T
[0], cc
.reg
, cc
.mask
);
1252 tcg_gen_brcond_tl(cc
.cond
, cc
.reg
, cc
.reg2
, l1
);
1254 tcg_gen_brcondi_tl(cc
.cond
, cc
.reg
, cc
.imm
, l1
);
1258 /* Generate a conditional jump to label 'l1' according to jump opcode
1259 value 'b'. In the fast case, T0 is guaranted not to be used.
1260 A translation block must end soon. */
1261 static inline void gen_jcc1(DisasContext
*s
, int b
, int l1
)
1263 CCPrepare cc
= gen_prepare_cc(s
, b
, cpu_T
[0]);
1265 gen_update_cc_op(s
);
1266 if (cc
.mask
!= -1) {
1267 tcg_gen_andi_tl(cpu_T
[0], cc
.reg
, cc
.mask
);
1270 set_cc_op(s
, CC_OP_DYNAMIC
);
1272 tcg_gen_brcond_tl(cc
.cond
, cc
.reg
, cc
.reg2
, l1
);
1274 tcg_gen_brcondi_tl(cc
.cond
, cc
.reg
, cc
.imm
, l1
);
1278 /* XXX: does not work with gdbstub "ice" single step - not a
1280 static int gen_jz_ecx_string(DisasContext
*s
, target_ulong next_eip
)
1284 l1
= gen_new_label();
1285 l2
= gen_new_label();
1286 gen_op_jnz_ecx(s
->aflag
, l1
);
1288 gen_jmp_tb(s
, next_eip
, 1);
1293 static inline void gen_stos(DisasContext
*s
, int ot
)
1295 gen_op_mov_TN_reg(OT_LONG
, 0, R_EAX
);
1296 gen_string_movl_A0_EDI(s
);
1297 gen_op_st_T0_A0(ot
+ s
->mem_index
);
1298 gen_op_movl_T0_Dshift(ot
);
1299 gen_op_add_reg_T0(s
->aflag
, R_EDI
);
1302 static inline void gen_lods(DisasContext
*s
, int ot
)
1304 gen_string_movl_A0_ESI(s
);
1305 gen_op_ld_T0_A0(ot
+ s
->mem_index
);
1306 gen_op_mov_reg_T0(ot
, R_EAX
);
1307 gen_op_movl_T0_Dshift(ot
);
1308 gen_op_add_reg_T0(s
->aflag
, R_ESI
);
1311 static inline void gen_scas(DisasContext
*s
, int ot
)
1313 gen_string_movl_A0_EDI(s
);
1314 gen_op_ld_T1_A0(ot
+ s
->mem_index
);
1315 gen_op(s
, OP_CMPL
, ot
, R_EAX
);
1316 gen_op_movl_T0_Dshift(ot
);
1317 gen_op_add_reg_T0(s
->aflag
, R_EDI
);
1320 static inline void gen_cmps(DisasContext
*s
, int ot
)
1322 gen_string_movl_A0_EDI(s
);
1323 gen_op_ld_T1_A0(ot
+ s
->mem_index
);
1324 gen_string_movl_A0_ESI(s
);
1325 gen_op(s
, OP_CMPL
, ot
, OR_TMP0
);
1326 gen_op_movl_T0_Dshift(ot
);
1327 gen_op_add_reg_T0(s
->aflag
, R_ESI
);
1328 gen_op_add_reg_T0(s
->aflag
, R_EDI
);
1331 static inline void gen_ins(DisasContext
*s
, int ot
)
1335 gen_string_movl_A0_EDI(s
);
1336 /* Note: we must do this dummy write first to be restartable in
1337 case of page fault. */
1339 gen_op_st_T0_A0(ot
+ s
->mem_index
);
1340 gen_op_mov_TN_reg(OT_WORD
, 1, R_EDX
);
1341 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[1]);
1342 tcg_gen_andi_i32(cpu_tmp2_i32
, cpu_tmp2_i32
, 0xffff);
1343 gen_helper_in_func(ot
, cpu_T
[0], cpu_tmp2_i32
);
1344 gen_op_st_T0_A0(ot
+ s
->mem_index
);
1345 gen_op_movl_T0_Dshift(ot
);
1346 gen_op_add_reg_T0(s
->aflag
, R_EDI
);
1351 static inline void gen_outs(DisasContext
*s
, int ot
)
1355 gen_string_movl_A0_ESI(s
);
1356 gen_op_ld_T0_A0(ot
+ s
->mem_index
);
1358 gen_op_mov_TN_reg(OT_WORD
, 1, R_EDX
);
1359 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[1]);
1360 tcg_gen_andi_i32(cpu_tmp2_i32
, cpu_tmp2_i32
, 0xffff);
1361 tcg_gen_trunc_tl_i32(cpu_tmp3_i32
, cpu_T
[0]);
1362 gen_helper_out_func(ot
, cpu_tmp2_i32
, cpu_tmp3_i32
);
1364 gen_op_movl_T0_Dshift(ot
);
1365 gen_op_add_reg_T0(s
->aflag
, R_ESI
);
1370 /* same method as Valgrind : we generate jumps to current or next
1372 #define GEN_REPZ(op) \
1373 static inline void gen_repz_ ## op(DisasContext *s, int ot, \
1374 target_ulong cur_eip, target_ulong next_eip) \
1377 gen_update_cc_op(s); \
1378 l2 = gen_jz_ecx_string(s, next_eip); \
1379 gen_ ## op(s, ot); \
1380 gen_op_add_reg_im(s->aflag, R_ECX, -1); \
1381 /* a loop would cause two single step exceptions if ECX = 1 \
1382 before rep string_insn */ \
1384 gen_op_jz_ecx(s->aflag, l2); \
1385 gen_jmp(s, cur_eip); \
1388 #define GEN_REPZ2(op) \
1389 static inline void gen_repz_ ## op(DisasContext *s, int ot, \
1390 target_ulong cur_eip, \
1391 target_ulong next_eip, \
1395 gen_update_cc_op(s); \
1396 l2 = gen_jz_ecx_string(s, next_eip); \
1397 gen_ ## op(s, ot); \
1398 gen_op_add_reg_im(s->aflag, R_ECX, -1); \
1399 gen_update_cc_op(s); \
1400 gen_jcc1(s, (JCC_Z << 1) | (nz ^ 1), l2); \
1402 gen_op_jz_ecx(s->aflag, l2); \
1403 gen_jmp(s, cur_eip); \
1414 static void gen_helper_fp_arith_ST0_FT0(int op
)
1418 gen_helper_fadd_ST0_FT0(cpu_env
);
1421 gen_helper_fmul_ST0_FT0(cpu_env
);
1424 gen_helper_fcom_ST0_FT0(cpu_env
);
1427 gen_helper_fcom_ST0_FT0(cpu_env
);
1430 gen_helper_fsub_ST0_FT0(cpu_env
);
1433 gen_helper_fsubr_ST0_FT0(cpu_env
);
1436 gen_helper_fdiv_ST0_FT0(cpu_env
);
1439 gen_helper_fdivr_ST0_FT0(cpu_env
);
1444 /* NOTE the exception in "r" op ordering */
1445 static void gen_helper_fp_arith_STN_ST0(int op
, int opreg
)
1447 TCGv_i32 tmp
= tcg_const_i32(opreg
);
1450 gen_helper_fadd_STN_ST0(cpu_env
, tmp
);
1453 gen_helper_fmul_STN_ST0(cpu_env
, tmp
);
1456 gen_helper_fsubr_STN_ST0(cpu_env
, tmp
);
1459 gen_helper_fsub_STN_ST0(cpu_env
, tmp
);
1462 gen_helper_fdivr_STN_ST0(cpu_env
, tmp
);
1465 gen_helper_fdiv_STN_ST0(cpu_env
, tmp
);
1470 /* if d == OR_TMP0, it means memory operand (address in A0) */
1471 static void gen_op(DisasContext
*s1
, int op
, int ot
, int d
)
1474 gen_op_mov_TN_reg(ot
, 0, d
);
1476 gen_op_ld_T0_A0(ot
+ s1
->mem_index
);
1480 gen_compute_eflags_c(s1
, cpu_tmp4
);
1481 tcg_gen_add_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
1482 tcg_gen_add_tl(cpu_T
[0], cpu_T
[0], cpu_tmp4
);
1484 gen_op_mov_reg_T0(ot
, d
);
1486 gen_op_st_T0_A0(ot
+ s1
->mem_index
);
1487 gen_op_update3_cc(cpu_tmp4
);
1488 set_cc_op(s1
, CC_OP_ADCB
+ ot
);
1491 gen_compute_eflags_c(s1
, cpu_tmp4
);
1492 tcg_gen_sub_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
1493 tcg_gen_sub_tl(cpu_T
[0], cpu_T
[0], cpu_tmp4
);
1495 gen_op_mov_reg_T0(ot
, d
);
1497 gen_op_st_T0_A0(ot
+ s1
->mem_index
);
1498 gen_op_update3_cc(cpu_tmp4
);
1499 set_cc_op(s1
, CC_OP_SBBB
+ ot
);
1502 gen_op_addl_T0_T1();
1504 gen_op_mov_reg_T0(ot
, d
);
1506 gen_op_st_T0_A0(ot
+ s1
->mem_index
);
1507 gen_op_update2_cc();
1508 set_cc_op(s1
, CC_OP_ADDB
+ ot
);
1511 tcg_gen_mov_tl(cpu_cc_srcT
, cpu_T
[0]);
1512 tcg_gen_sub_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
1514 gen_op_mov_reg_T0(ot
, d
);
1516 gen_op_st_T0_A0(ot
+ s1
->mem_index
);
1517 gen_op_update2_cc();
1518 set_cc_op(s1
, CC_OP_SUBB
+ ot
);
1522 tcg_gen_and_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
1524 gen_op_mov_reg_T0(ot
, d
);
1526 gen_op_st_T0_A0(ot
+ s1
->mem_index
);
1527 gen_op_update1_cc();
1528 set_cc_op(s1
, CC_OP_LOGICB
+ ot
);
1531 tcg_gen_or_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
1533 gen_op_mov_reg_T0(ot
, d
);
1535 gen_op_st_T0_A0(ot
+ s1
->mem_index
);
1536 gen_op_update1_cc();
1537 set_cc_op(s1
, CC_OP_LOGICB
+ ot
);
1540 tcg_gen_xor_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
1542 gen_op_mov_reg_T0(ot
, d
);
1544 gen_op_st_T0_A0(ot
+ s1
->mem_index
);
1545 gen_op_update1_cc();
1546 set_cc_op(s1
, CC_OP_LOGICB
+ ot
);
1549 tcg_gen_mov_tl(cpu_cc_src
, cpu_T
[1]);
1550 tcg_gen_mov_tl(cpu_cc_srcT
, cpu_T
[0]);
1551 tcg_gen_sub_tl(cpu_cc_dst
, cpu_T
[0], cpu_T
[1]);
1552 set_cc_op(s1
, CC_OP_SUBB
+ ot
);
1557 /* if d == OR_TMP0, it means memory operand (address in A0) */
1558 static void gen_inc(DisasContext
*s1
, int ot
, int d
, int c
)
1561 gen_op_mov_TN_reg(ot
, 0, d
);
1563 gen_op_ld_T0_A0(ot
+ s1
->mem_index
);
1564 gen_compute_eflags_c(s1
, cpu_cc_src
);
1566 tcg_gen_addi_tl(cpu_T
[0], cpu_T
[0], 1);
1567 set_cc_op(s1
, CC_OP_INCB
+ ot
);
1569 tcg_gen_addi_tl(cpu_T
[0], cpu_T
[0], -1);
1570 set_cc_op(s1
, CC_OP_DECB
+ ot
);
1573 gen_op_mov_reg_T0(ot
, d
);
1575 gen_op_st_T0_A0(ot
+ s1
->mem_index
);
1576 tcg_gen_mov_tl(cpu_cc_dst
, cpu_T
[0]);
1579 static void gen_shift_flags(DisasContext
*s
, int ot
, TCGv result
, TCGv shm1
,
1580 TCGv count
, bool is_right
)
1582 TCGv_i32 z32
, s32
, oldop
;
1585 /* Store the results into the CC variables. If we know that the
1586 variable must be dead, store unconditionally. Otherwise we'll
1587 need to not disrupt the current contents. */
1588 z_tl
= tcg_const_tl(0);
1589 if (cc_op_live
[s
->cc_op
] & USES_CC_DST
) {
1590 tcg_gen_movcond_tl(TCG_COND_NE
, cpu_cc_dst
, count
, z_tl
,
1591 result
, cpu_cc_dst
);
1593 tcg_gen_mov_tl(cpu_cc_dst
, result
);
1595 if (cc_op_live
[s
->cc_op
] & USES_CC_SRC
) {
1596 tcg_gen_movcond_tl(TCG_COND_NE
, cpu_cc_src
, count
, z_tl
,
1599 tcg_gen_mov_tl(cpu_cc_src
, shm1
);
1601 tcg_temp_free(z_tl
);
1603 /* Get the two potential CC_OP values into temporaries. */
1604 tcg_gen_movi_i32(cpu_tmp2_i32
, (is_right
? CC_OP_SARB
: CC_OP_SHLB
) + ot
);
1605 if (s
->cc_op
== CC_OP_DYNAMIC
) {
1608 tcg_gen_movi_i32(cpu_tmp3_i32
, s
->cc_op
);
1609 oldop
= cpu_tmp3_i32
;
1612 /* Conditionally store the CC_OP value. */
1613 z32
= tcg_const_i32(0);
1614 s32
= tcg_temp_new_i32();
1615 tcg_gen_trunc_tl_i32(s32
, count
);
1616 tcg_gen_movcond_i32(TCG_COND_NE
, cpu_cc_op
, s32
, z32
, cpu_tmp2_i32
, oldop
);
1617 tcg_temp_free_i32(z32
);
1618 tcg_temp_free_i32(s32
);
1620 /* The CC_OP value is no longer predictable. */
1621 set_cc_op(s
, CC_OP_DYNAMIC
);
1624 static void gen_shift_rm_T1(DisasContext
*s
, int ot
, int op1
,
1625 int is_right
, int is_arith
)
1627 target_ulong mask
= (ot
== OT_QUAD
? 0x3f : 0x1f);
1630 if (op1
== OR_TMP0
) {
1631 gen_op_ld_T0_A0(ot
+ s
->mem_index
);
1633 gen_op_mov_TN_reg(ot
, 0, op1
);
1636 tcg_gen_andi_tl(cpu_T
[1], cpu_T
[1], mask
);
1637 tcg_gen_subi_tl(cpu_tmp0
, cpu_T
[1], 1);
1641 gen_exts(ot
, cpu_T
[0]);
1642 tcg_gen_sar_tl(cpu_tmp0
, cpu_T
[0], cpu_tmp0
);
1643 tcg_gen_sar_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
1645 gen_extu(ot
, cpu_T
[0]);
1646 tcg_gen_shr_tl(cpu_tmp0
, cpu_T
[0], cpu_tmp0
);
1647 tcg_gen_shr_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
1650 tcg_gen_shl_tl(cpu_tmp0
, cpu_T
[0], cpu_tmp0
);
1651 tcg_gen_shl_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
1655 if (op1
== OR_TMP0
) {
1656 gen_op_st_T0_A0(ot
+ s
->mem_index
);
1658 gen_op_mov_reg_T0(ot
, op1
);
1661 gen_shift_flags(s
, ot
, cpu_T
[0], cpu_tmp0
, cpu_T
[1], is_right
);
1664 static void gen_shift_rm_im(DisasContext
*s
, int ot
, int op1
, int op2
,
1665 int is_right
, int is_arith
)
1667 int mask
= (ot
== OT_QUAD
? 0x3f : 0x1f);
1671 gen_op_ld_T0_A0(ot
+ s
->mem_index
);
1673 gen_op_mov_TN_reg(ot
, 0, op1
);
1679 gen_exts(ot
, cpu_T
[0]);
1680 tcg_gen_sari_tl(cpu_tmp4
, cpu_T
[0], op2
- 1);
1681 tcg_gen_sari_tl(cpu_T
[0], cpu_T
[0], op2
);
1683 gen_extu(ot
, cpu_T
[0]);
1684 tcg_gen_shri_tl(cpu_tmp4
, cpu_T
[0], op2
- 1);
1685 tcg_gen_shri_tl(cpu_T
[0], cpu_T
[0], op2
);
1688 tcg_gen_shli_tl(cpu_tmp4
, cpu_T
[0], op2
- 1);
1689 tcg_gen_shli_tl(cpu_T
[0], cpu_T
[0], op2
);
1695 gen_op_st_T0_A0(ot
+ s
->mem_index
);
1697 gen_op_mov_reg_T0(ot
, op1
);
1699 /* update eflags if non zero shift */
1701 tcg_gen_mov_tl(cpu_cc_src
, cpu_tmp4
);
1702 tcg_gen_mov_tl(cpu_cc_dst
, cpu_T
[0]);
1703 set_cc_op(s
, (is_right
? CC_OP_SARB
: CC_OP_SHLB
) + ot
);
1707 static inline void tcg_gen_lshift(TCGv ret
, TCGv arg1
, target_long arg2
)
1710 tcg_gen_shli_tl(ret
, arg1
, arg2
);
1712 tcg_gen_shri_tl(ret
, arg1
, -arg2
);
1715 static void gen_rot_rm_T1(DisasContext
*s
, int ot
, int op1
, int is_right
)
1717 target_ulong mask
= (ot
== OT_QUAD
? 0x3f : 0x1f);
1721 if (op1
== OR_TMP0
) {
1722 gen_op_ld_T0_A0(ot
+ s
->mem_index
);
1724 gen_op_mov_TN_reg(ot
, 0, op1
);
1727 tcg_gen_andi_tl(cpu_T
[1], cpu_T
[1], mask
);
1731 /* Replicate the 8-bit input so that a 32-bit rotate works. */
1732 tcg_gen_ext8u_tl(cpu_T
[0], cpu_T
[0]);
1733 tcg_gen_muli_tl(cpu_T
[0], cpu_T
[0], 0x01010101);
1736 /* Replicate the 16-bit input so that a 32-bit rotate works. */
1737 tcg_gen_deposit_tl(cpu_T
[0], cpu_T
[0], cpu_T
[0], 16, 16);
1740 #ifdef TARGET_X86_64
1742 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
1743 tcg_gen_trunc_tl_i32(cpu_tmp3_i32
, cpu_T
[1]);
1745 tcg_gen_rotr_i32(cpu_tmp2_i32
, cpu_tmp2_i32
, cpu_tmp3_i32
);
1747 tcg_gen_rotl_i32(cpu_tmp2_i32
, cpu_tmp2_i32
, cpu_tmp3_i32
);
1749 tcg_gen_extu_i32_tl(cpu_T
[0], cpu_tmp2_i32
);
1754 tcg_gen_rotr_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
1756 tcg_gen_rotl_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
1762 if (op1
== OR_TMP0
) {
1763 gen_op_st_T0_A0(ot
+ s
->mem_index
);
1765 gen_op_mov_reg_T0(ot
, op1
);
1768 /* We'll need the flags computed into CC_SRC. */
1769 gen_compute_eflags(s
);
1771 /* The value that was "rotated out" is now present at the other end
1772 of the word. Compute C into CC_DST and O into CC_SRC2. Note that
1773 since we've computed the flags into CC_SRC, these variables are
1776 tcg_gen_shri_tl(cpu_cc_src2
, cpu_T
[0], mask
- 1);
1777 tcg_gen_shri_tl(cpu_cc_dst
, cpu_T
[0], mask
);
1778 tcg_gen_andi_tl(cpu_cc_dst
, cpu_cc_dst
, 1);
1780 tcg_gen_shri_tl(cpu_cc_src2
, cpu_T
[0], mask
);
1781 tcg_gen_andi_tl(cpu_cc_dst
, cpu_T
[0], 1);
1783 tcg_gen_andi_tl(cpu_cc_src2
, cpu_cc_src2
, 1);
1784 tcg_gen_xor_tl(cpu_cc_src2
, cpu_cc_src2
, cpu_cc_dst
);
1786 /* Now conditionally store the new CC_OP value. If the shift count
1787 is 0 we keep the CC_OP_EFLAGS setting so that only CC_SRC is live.
1788 Otherwise reuse CC_OP_ADCOX which have the C and O flags split out
1789 exactly as we computed above. */
1790 t0
= tcg_const_i32(0);
1791 t1
= tcg_temp_new_i32();
1792 tcg_gen_trunc_tl_i32(t1
, cpu_T
[1]);
1793 tcg_gen_movi_i32(cpu_tmp2_i32
, CC_OP_ADCOX
);
1794 tcg_gen_movi_i32(cpu_tmp3_i32
, CC_OP_EFLAGS
);
1795 tcg_gen_movcond_i32(TCG_COND_NE
, cpu_cc_op
, t1
, t0
,
1796 cpu_tmp2_i32
, cpu_tmp3_i32
);
1797 tcg_temp_free_i32(t0
);
1798 tcg_temp_free_i32(t1
);
1800 /* The CC_OP value is no longer predictable. */
1801 set_cc_op(s
, CC_OP_DYNAMIC
);
1804 static void gen_rot_rm_im(DisasContext
*s
, int ot
, int op1
, int op2
,
1807 int mask
= (ot
== OT_QUAD
? 0x3f : 0x1f);
1811 if (op1
== OR_TMP0
) {
1812 gen_op_ld_T0_A0(ot
+ s
->mem_index
);
1814 gen_op_mov_TN_reg(ot
, 0, op1
);
1820 #ifdef TARGET_X86_64
1822 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
1824 tcg_gen_rotri_i32(cpu_tmp2_i32
, cpu_tmp2_i32
, op2
);
1826 tcg_gen_rotli_i32(cpu_tmp2_i32
, cpu_tmp2_i32
, op2
);
1828 tcg_gen_extu_i32_tl(cpu_T
[0], cpu_tmp2_i32
);
1833 tcg_gen_rotri_tl(cpu_T
[0], cpu_T
[0], op2
);
1835 tcg_gen_rotli_tl(cpu_T
[0], cpu_T
[0], op2
);
1846 shift
= mask
+ 1 - shift
;
1848 gen_extu(ot
, cpu_T
[0]);
1849 tcg_gen_shli_tl(cpu_tmp0
, cpu_T
[0], shift
);
1850 tcg_gen_shri_tl(cpu_T
[0], cpu_T
[0], mask
+ 1 - shift
);
1851 tcg_gen_or_tl(cpu_T
[0], cpu_T
[0], cpu_tmp0
);
1857 if (op1
== OR_TMP0
) {
1858 gen_op_st_T0_A0(ot
+ s
->mem_index
);
1860 gen_op_mov_reg_T0(ot
, op1
);
1864 /* Compute the flags into CC_SRC. */
1865 gen_compute_eflags(s
);
1867 /* The value that was "rotated out" is now present at the other end
1868 of the word. Compute C into CC_DST and O into CC_SRC2. Note that
1869 since we've computed the flags into CC_SRC, these variables are
1872 tcg_gen_shri_tl(cpu_cc_src2
, cpu_T
[0], mask
- 1);
1873 tcg_gen_shri_tl(cpu_cc_dst
, cpu_T
[0], mask
);
1874 tcg_gen_andi_tl(cpu_cc_dst
, cpu_cc_dst
, 1);
1876 tcg_gen_shri_tl(cpu_cc_src2
, cpu_T
[0], mask
);
1877 tcg_gen_andi_tl(cpu_cc_dst
, cpu_T
[0], 1);
1879 tcg_gen_andi_tl(cpu_cc_src2
, cpu_cc_src2
, 1);
1880 tcg_gen_xor_tl(cpu_cc_src2
, cpu_cc_src2
, cpu_cc_dst
);
1881 set_cc_op(s
, CC_OP_ADCOX
);
1885 /* XXX: add faster immediate = 1 case */
1886 static void gen_rotc_rm_T1(DisasContext
*s
, int ot
, int op1
,
1889 gen_compute_eflags(s
);
1890 assert(s
->cc_op
== CC_OP_EFLAGS
);
1894 gen_op_ld_T0_A0(ot
+ s
->mem_index
);
1896 gen_op_mov_TN_reg(ot
, 0, op1
);
1901 gen_helper_rcrb(cpu_T
[0], cpu_env
, cpu_T
[0], cpu_T
[1]);
1904 gen_helper_rcrw(cpu_T
[0], cpu_env
, cpu_T
[0], cpu_T
[1]);
1907 gen_helper_rcrl(cpu_T
[0], cpu_env
, cpu_T
[0], cpu_T
[1]);
1909 #ifdef TARGET_X86_64
1911 gen_helper_rcrq(cpu_T
[0], cpu_env
, cpu_T
[0], cpu_T
[1]);
1918 gen_helper_rclb(cpu_T
[0], cpu_env
, cpu_T
[0], cpu_T
[1]);
1921 gen_helper_rclw(cpu_T
[0], cpu_env
, cpu_T
[0], cpu_T
[1]);
1924 gen_helper_rcll(cpu_T
[0], cpu_env
, cpu_T
[0], cpu_T
[1]);
1926 #ifdef TARGET_X86_64
1928 gen_helper_rclq(cpu_T
[0], cpu_env
, cpu_T
[0], cpu_T
[1]);
1935 gen_op_st_T0_A0(ot
+ s
->mem_index
);
1937 gen_op_mov_reg_T0(ot
, op1
);
1940 /* XXX: add faster immediate case */
1941 static void gen_shiftd_rm_T1(DisasContext
*s
, int ot
, int op1
,
1942 bool is_right
, TCGv count_in
)
1944 target_ulong mask
= (ot
== OT_QUAD
? 63 : 31);
1948 if (op1
== OR_TMP0
) {
1949 gen_op_ld_T0_A0(ot
+ s
->mem_index
);
1951 gen_op_mov_TN_reg(ot
, 0, op1
);
1954 count
= tcg_temp_new();
1955 tcg_gen_andi_tl(count
, count_in
, mask
);
1959 /* Note: we implement the Intel behaviour for shift count > 16.
1960 This means "shrdw C, B, A" shifts A:B:A >> C. Build the B:A
1961 portion by constructing it as a 32-bit value. */
1963 tcg_gen_deposit_tl(cpu_tmp0
, cpu_T
[0], cpu_T
[1], 16, 16);
1964 tcg_gen_mov_tl(cpu_T
[1], cpu_T
[0]);
1965 tcg_gen_mov_tl(cpu_T
[0], cpu_tmp0
);
1967 tcg_gen_deposit_tl(cpu_T
[1], cpu_T
[0], cpu_T
[1], 16, 16);
1970 #ifdef TARGET_X86_64
1972 /* Concatenate the two 32-bit values and use a 64-bit shift. */
1973 tcg_gen_subi_tl(cpu_tmp0
, count
, 1);
1975 tcg_gen_concat_tl_i64(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
1976 tcg_gen_shr_i64(cpu_tmp0
, cpu_T
[0], cpu_tmp0
);
1977 tcg_gen_shr_i64(cpu_T
[0], cpu_T
[0], count
);
1979 tcg_gen_concat_tl_i64(cpu_T
[0], cpu_T
[1], cpu_T
[0]);
1980 tcg_gen_shl_i64(cpu_tmp0
, cpu_T
[0], cpu_tmp0
);
1981 tcg_gen_shl_i64(cpu_T
[0], cpu_T
[0], count
);
1982 tcg_gen_shri_i64(cpu_tmp0
, cpu_tmp0
, 32);
1983 tcg_gen_shri_i64(cpu_T
[0], cpu_T
[0], 32);
1988 tcg_gen_subi_tl(cpu_tmp0
, count
, 1);
1990 tcg_gen_shr_tl(cpu_tmp0
, cpu_T
[0], cpu_tmp0
);
1992 tcg_gen_subfi_tl(cpu_tmp4
, mask
+ 1, count
);
1993 tcg_gen_shr_tl(cpu_T
[0], cpu_T
[0], count
);
1994 tcg_gen_shl_tl(cpu_T
[1], cpu_T
[1], cpu_tmp4
);
1996 tcg_gen_shl_tl(cpu_tmp0
, cpu_T
[0], cpu_tmp0
);
1997 if (ot
== OT_WORD
) {
1998 /* Only needed if count > 16, for Intel behaviour. */
1999 tcg_gen_subfi_tl(cpu_tmp4
, 33, count
);
2000 tcg_gen_shr_tl(cpu_tmp4
, cpu_T
[1], cpu_tmp4
);
2001 tcg_gen_or_tl(cpu_tmp0
, cpu_tmp0
, cpu_tmp4
);
2004 tcg_gen_subfi_tl(cpu_tmp4
, mask
+ 1, count
);
2005 tcg_gen_shl_tl(cpu_T
[0], cpu_T
[0], count
);
2006 tcg_gen_shr_tl(cpu_T
[1], cpu_T
[1], cpu_tmp4
);
2008 tcg_gen_movi_tl(cpu_tmp4
, 0);
2009 tcg_gen_movcond_tl(TCG_COND_EQ
, cpu_T
[1], count
, cpu_tmp4
,
2010 cpu_tmp4
, cpu_T
[1]);
2011 tcg_gen_or_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
2016 if (op1
== OR_TMP0
) {
2017 gen_op_st_T0_A0(ot
+ s
->mem_index
);
2019 gen_op_mov_reg_T0(ot
, op1
);
2022 gen_shift_flags(s
, ot
, cpu_T
[0], cpu_tmp0
, count
, is_right
);
2023 tcg_temp_free(count
);
2026 static void gen_shift(DisasContext
*s1
, int op
, int ot
, int d
, int s
)
2029 gen_op_mov_TN_reg(ot
, 1, s
);
2032 gen_rot_rm_T1(s1
, ot
, d
, 0);
2035 gen_rot_rm_T1(s1
, ot
, d
, 1);
2039 gen_shift_rm_T1(s1
, ot
, d
, 0, 0);
2042 gen_shift_rm_T1(s1
, ot
, d
, 1, 0);
2045 gen_shift_rm_T1(s1
, ot
, d
, 1, 1);
2048 gen_rotc_rm_T1(s1
, ot
, d
, 0);
2051 gen_rotc_rm_T1(s1
, ot
, d
, 1);
2056 static void gen_shifti(DisasContext
*s1
, int op
, int ot
, int d
, int c
)
2060 gen_rot_rm_im(s1
, ot
, d
, c
, 0);
2063 gen_rot_rm_im(s1
, ot
, d
, c
, 1);
2067 gen_shift_rm_im(s1
, ot
, d
, c
, 0, 0);
2070 gen_shift_rm_im(s1
, ot
, d
, c
, 1, 0);
2073 gen_shift_rm_im(s1
, ot
, d
, c
, 1, 1);
2076 /* currently not optimized */
2077 gen_op_movl_T1_im(c
);
2078 gen_shift(s1
, op
, ot
, d
, OR_TMP1
);
2083 static void gen_lea_modrm(CPUX86State
*env
, DisasContext
*s
, int modrm
,
2084 int *reg_ptr
, int *offset_ptr
)
2092 int mod
, rm
, code
, override
, must_add_seg
;
2094 override
= s
->override
;
2095 must_add_seg
= s
->addseg
;
2098 mod
= (modrm
>> 6) & 3;
2110 code
= cpu_ldub_code(env
, s
->pc
++);
2111 scale
= (code
>> 6) & 3;
2112 index
= ((code
>> 3) & 7) | REX_X(s
);
2119 if ((base
& 7) == 5) {
2121 disp
= (int32_t)cpu_ldl_code(env
, s
->pc
);
2123 if (CODE64(s
) && !havesib
) {
2124 disp
+= s
->pc
+ s
->rip_offset
;
2131 disp
= (int8_t)cpu_ldub_code(env
, s
->pc
++);
2135 disp
= (int32_t)cpu_ldl_code(env
, s
->pc
);
2141 /* for correct popl handling with esp */
2142 if (base
== 4 && s
->popl_esp_hack
)
2143 disp
+= s
->popl_esp_hack
;
2144 #ifdef TARGET_X86_64
2145 if (s
->aflag
== 2) {
2146 gen_op_movq_A0_reg(base
);
2148 gen_op_addq_A0_im(disp
);
2153 gen_op_movl_A0_reg(base
);
2155 gen_op_addl_A0_im(disp
);
2158 #ifdef TARGET_X86_64
2159 if (s
->aflag
== 2) {
2160 gen_op_movq_A0_im(disp
);
2164 gen_op_movl_A0_im(disp
);
2167 /* index == 4 means no index */
2168 if (havesib
&& (index
!= 4)) {
2169 #ifdef TARGET_X86_64
2170 if (s
->aflag
== 2) {
2171 gen_op_addq_A0_reg_sN(scale
, index
);
2175 gen_op_addl_A0_reg_sN(scale
, index
);
2180 if (base
== R_EBP
|| base
== R_ESP
)
2185 #ifdef TARGET_X86_64
2186 if (s
->aflag
== 2) {
2187 gen_op_addq_A0_seg(override
);
2191 gen_op_addl_A0_seg(s
, override
);
2198 disp
= cpu_lduw_code(env
, s
->pc
);
2200 gen_op_movl_A0_im(disp
);
2201 rm
= 0; /* avoid SS override */
2208 disp
= (int8_t)cpu_ldub_code(env
, s
->pc
++);
2212 disp
= cpu_lduw_code(env
, s
->pc
);
2218 gen_op_movl_A0_reg(R_EBX
);
2219 gen_op_addl_A0_reg_sN(0, R_ESI
);
2222 gen_op_movl_A0_reg(R_EBX
);
2223 gen_op_addl_A0_reg_sN(0, R_EDI
);
2226 gen_op_movl_A0_reg(R_EBP
);
2227 gen_op_addl_A0_reg_sN(0, R_ESI
);
2230 gen_op_movl_A0_reg(R_EBP
);
2231 gen_op_addl_A0_reg_sN(0, R_EDI
);
2234 gen_op_movl_A0_reg(R_ESI
);
2237 gen_op_movl_A0_reg(R_EDI
);
2240 gen_op_movl_A0_reg(R_EBP
);
2244 gen_op_movl_A0_reg(R_EBX
);
2248 gen_op_addl_A0_im(disp
);
2249 gen_op_andl_A0_ffff();
2253 if (rm
== 2 || rm
== 3 || rm
== 6)
2258 gen_op_addl_A0_seg(s
, override
);
2268 static void gen_nop_modrm(CPUX86State
*env
, DisasContext
*s
, int modrm
)
2270 int mod
, rm
, base
, code
;
2272 mod
= (modrm
>> 6) & 3;
2282 code
= cpu_ldub_code(env
, s
->pc
++);
2318 /* used for LEA and MOV AX, mem */
2319 static void gen_add_A0_ds_seg(DisasContext
*s
)
2321 int override
, must_add_seg
;
2322 must_add_seg
= s
->addseg
;
2324 if (s
->override
>= 0) {
2325 override
= s
->override
;
2329 #ifdef TARGET_X86_64
2331 gen_op_addq_A0_seg(override
);
2335 gen_op_addl_A0_seg(s
, override
);
2340 /* generate modrm memory load or store of 'reg'. TMP0 is used if reg ==
2342 static void gen_ldst_modrm(CPUX86State
*env
, DisasContext
*s
, int modrm
,
2343 int ot
, int reg
, int is_store
)
2345 int mod
, rm
, opreg
, disp
;
2347 mod
= (modrm
>> 6) & 3;
2348 rm
= (modrm
& 7) | REX_B(s
);
2352 gen_op_mov_TN_reg(ot
, 0, reg
);
2353 gen_op_mov_reg_T0(ot
, rm
);
2355 gen_op_mov_TN_reg(ot
, 0, rm
);
2357 gen_op_mov_reg_T0(ot
, reg
);
2360 gen_lea_modrm(env
, s
, modrm
, &opreg
, &disp
);
2363 gen_op_mov_TN_reg(ot
, 0, reg
);
2364 gen_op_st_T0_A0(ot
+ s
->mem_index
);
2366 gen_op_ld_T0_A0(ot
+ s
->mem_index
);
2368 gen_op_mov_reg_T0(ot
, reg
);
2373 static inline uint32_t insn_get(CPUX86State
*env
, DisasContext
*s
, int ot
)
2379 ret
= cpu_ldub_code(env
, s
->pc
);
2383 ret
= cpu_lduw_code(env
, s
->pc
);
2388 ret
= cpu_ldl_code(env
, s
->pc
);
2395 static inline int insn_const_size(unsigned int ot
)
2403 static inline void gen_goto_tb(DisasContext
*s
, int tb_num
, target_ulong eip
)
2405 TranslationBlock
*tb
;
2408 pc
= s
->cs_base
+ eip
;
2410 /* NOTE: we handle the case where the TB spans two pages here */
2411 if ((pc
& TARGET_PAGE_MASK
) == (tb
->pc
& TARGET_PAGE_MASK
) ||
2412 (pc
& TARGET_PAGE_MASK
) == ((s
->pc
- 1) & TARGET_PAGE_MASK
)) {
2413 /* jump to same page: we can use a direct jump */
2414 tcg_gen_goto_tb(tb_num
);
2416 tcg_gen_exit_tb((tcg_target_long
)tb
+ tb_num
);
2418 /* jump to another page: currently not optimized */
2424 static inline void gen_jcc(DisasContext
*s
, int b
,
2425 target_ulong val
, target_ulong next_eip
)
2430 l1
= gen_new_label();
2433 gen_goto_tb(s
, 0, next_eip
);
2436 gen_goto_tb(s
, 1, val
);
2437 s
->is_jmp
= DISAS_TB_JUMP
;
2439 l1
= gen_new_label();
2440 l2
= gen_new_label();
2443 gen_jmp_im(next_eip
);
2453 static void gen_cmovcc1(CPUX86State
*env
, DisasContext
*s
, int ot
, int b
,
2458 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 0);
2460 cc
= gen_prepare_cc(s
, b
, cpu_T
[1]);
2461 if (cc
.mask
!= -1) {
2462 TCGv t0
= tcg_temp_new();
2463 tcg_gen_andi_tl(t0
, cc
.reg
, cc
.mask
);
2467 cc
.reg2
= tcg_const_tl(cc
.imm
);
2470 tcg_gen_movcond_tl(cc
.cond
, cpu_T
[0], cc
.reg
, cc
.reg2
,
2471 cpu_T
[0], cpu_regs
[reg
]);
2472 gen_op_mov_reg_T0(ot
, reg
);
2474 if (cc
.mask
!= -1) {
2475 tcg_temp_free(cc
.reg
);
2478 tcg_temp_free(cc
.reg2
);
2482 static inline void gen_op_movl_T0_seg(int seg_reg
)
2484 tcg_gen_ld32u_tl(cpu_T
[0], cpu_env
,
2485 offsetof(CPUX86State
,segs
[seg_reg
].selector
));
2488 static inline void gen_op_movl_seg_T0_vm(int seg_reg
)
2490 tcg_gen_andi_tl(cpu_T
[0], cpu_T
[0], 0xffff);
2491 tcg_gen_st32_tl(cpu_T
[0], cpu_env
,
2492 offsetof(CPUX86State
,segs
[seg_reg
].selector
));
2493 tcg_gen_shli_tl(cpu_T
[0], cpu_T
[0], 4);
2494 tcg_gen_st_tl(cpu_T
[0], cpu_env
,
2495 offsetof(CPUX86State
,segs
[seg_reg
].base
));
2498 /* move T0 to seg_reg and compute if the CPU state may change. Never
2499 call this function with seg_reg == R_CS */
2500 static void gen_movl_seg_T0(DisasContext
*s
, int seg_reg
, target_ulong cur_eip
)
2502 if (s
->pe
&& !s
->vm86
) {
2503 /* XXX: optimize by finding processor state dynamically */
2504 gen_update_cc_op(s
);
2505 gen_jmp_im(cur_eip
);
2506 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
2507 gen_helper_load_seg(cpu_env
, tcg_const_i32(seg_reg
), cpu_tmp2_i32
);
2508 /* abort translation because the addseg value may change or
2509 because ss32 may change. For R_SS, translation must always
2510 stop as a special handling must be done to disable hardware
2511 interrupts for the next instruction */
2512 if (seg_reg
== R_SS
|| (s
->code32
&& seg_reg
< R_FS
))
2513 s
->is_jmp
= DISAS_TB_JUMP
;
2515 gen_op_movl_seg_T0_vm(seg_reg
);
2516 if (seg_reg
== R_SS
)
2517 s
->is_jmp
= DISAS_TB_JUMP
;
2521 static inline int svm_is_rep(int prefixes
)
2523 return ((prefixes
& (PREFIX_REPZ
| PREFIX_REPNZ
)) ? 8 : 0);
2527 gen_svm_check_intercept_param(DisasContext
*s
, target_ulong pc_start
,
2528 uint32_t type
, uint64_t param
)
2530 /* no SVM activated; fast case */
2531 if (likely(!(s
->flags
& HF_SVMI_MASK
)))
2533 gen_update_cc_op(s
);
2534 gen_jmp_im(pc_start
- s
->cs_base
);
2535 gen_helper_svm_check_intercept_param(cpu_env
, tcg_const_i32(type
),
2536 tcg_const_i64(param
));
2540 gen_svm_check_intercept(DisasContext
*s
, target_ulong pc_start
, uint64_t type
)
2542 gen_svm_check_intercept_param(s
, pc_start
, type
, 0);
2545 static inline void gen_stack_update(DisasContext
*s
, int addend
)
2547 #ifdef TARGET_X86_64
2549 gen_op_add_reg_im(2, R_ESP
, addend
);
2553 gen_op_add_reg_im(1, R_ESP
, addend
);
2555 gen_op_add_reg_im(0, R_ESP
, addend
);
2559 /* generate a push. It depends on ss32, addseg and dflag */
2560 static void gen_push_T0(DisasContext
*s
)
2562 #ifdef TARGET_X86_64
2564 gen_op_movq_A0_reg(R_ESP
);
2566 gen_op_addq_A0_im(-8);
2567 gen_op_st_T0_A0(OT_QUAD
+ s
->mem_index
);
2569 gen_op_addq_A0_im(-2);
2570 gen_op_st_T0_A0(OT_WORD
+ s
->mem_index
);
2572 gen_op_mov_reg_A0(2, R_ESP
);
2576 gen_op_movl_A0_reg(R_ESP
);
2578 gen_op_addl_A0_im(-2);
2580 gen_op_addl_A0_im(-4);
2583 tcg_gen_mov_tl(cpu_T
[1], cpu_A0
);
2584 gen_op_addl_A0_seg(s
, R_SS
);
2587 gen_op_andl_A0_ffff();
2588 tcg_gen_mov_tl(cpu_T
[1], cpu_A0
);
2589 gen_op_addl_A0_seg(s
, R_SS
);
2591 gen_op_st_T0_A0(s
->dflag
+ 1 + s
->mem_index
);
2592 if (s
->ss32
&& !s
->addseg
)
2593 gen_op_mov_reg_A0(1, R_ESP
);
2595 gen_op_mov_reg_T1(s
->ss32
+ 1, R_ESP
);
2599 /* generate a push. It depends on ss32, addseg and dflag */
2600 /* slower version for T1, only used for call Ev */
2601 static void gen_push_T1(DisasContext
*s
)
2603 #ifdef TARGET_X86_64
2605 gen_op_movq_A0_reg(R_ESP
);
2607 gen_op_addq_A0_im(-8);
2608 gen_op_st_T1_A0(OT_QUAD
+ s
->mem_index
);
2610 gen_op_addq_A0_im(-2);
2611 gen_op_st_T0_A0(OT_WORD
+ s
->mem_index
);
2613 gen_op_mov_reg_A0(2, R_ESP
);
2617 gen_op_movl_A0_reg(R_ESP
);
2619 gen_op_addl_A0_im(-2);
2621 gen_op_addl_A0_im(-4);
2624 gen_op_addl_A0_seg(s
, R_SS
);
2627 gen_op_andl_A0_ffff();
2628 gen_op_addl_A0_seg(s
, R_SS
);
2630 gen_op_st_T1_A0(s
->dflag
+ 1 + s
->mem_index
);
2632 if (s
->ss32
&& !s
->addseg
)
2633 gen_op_mov_reg_A0(1, R_ESP
);
2635 gen_stack_update(s
, (-2) << s
->dflag
);
2639 /* two step pop is necessary for precise exceptions */
2640 static void gen_pop_T0(DisasContext
*s
)
2642 #ifdef TARGET_X86_64
2644 gen_op_movq_A0_reg(R_ESP
);
2645 gen_op_ld_T0_A0((s
->dflag
? OT_QUAD
: OT_WORD
) + s
->mem_index
);
2649 gen_op_movl_A0_reg(R_ESP
);
2652 gen_op_addl_A0_seg(s
, R_SS
);
2654 gen_op_andl_A0_ffff();
2655 gen_op_addl_A0_seg(s
, R_SS
);
2657 gen_op_ld_T0_A0(s
->dflag
+ 1 + s
->mem_index
);
2661 static void gen_pop_update(DisasContext
*s
)
2663 #ifdef TARGET_X86_64
2664 if (CODE64(s
) && s
->dflag
) {
2665 gen_stack_update(s
, 8);
2669 gen_stack_update(s
, 2 << s
->dflag
);
2673 static void gen_stack_A0(DisasContext
*s
)
2675 gen_op_movl_A0_reg(R_ESP
);
2677 gen_op_andl_A0_ffff();
2678 tcg_gen_mov_tl(cpu_T
[1], cpu_A0
);
2680 gen_op_addl_A0_seg(s
, R_SS
);
2683 /* NOTE: wrap around in 16 bit not fully handled */
2684 static void gen_pusha(DisasContext
*s
)
2687 gen_op_movl_A0_reg(R_ESP
);
2688 gen_op_addl_A0_im(-16 << s
->dflag
);
2690 gen_op_andl_A0_ffff();
2691 tcg_gen_mov_tl(cpu_T
[1], cpu_A0
);
2693 gen_op_addl_A0_seg(s
, R_SS
);
2694 for(i
= 0;i
< 8; i
++) {
2695 gen_op_mov_TN_reg(OT_LONG
, 0, 7 - i
);
2696 gen_op_st_T0_A0(OT_WORD
+ s
->dflag
+ s
->mem_index
);
2697 gen_op_addl_A0_im(2 << s
->dflag
);
2699 gen_op_mov_reg_T1(OT_WORD
+ s
->ss32
, R_ESP
);
2702 /* NOTE: wrap around in 16 bit not fully handled */
2703 static void gen_popa(DisasContext
*s
)
2706 gen_op_movl_A0_reg(R_ESP
);
2708 gen_op_andl_A0_ffff();
2709 tcg_gen_mov_tl(cpu_T
[1], cpu_A0
);
2710 tcg_gen_addi_tl(cpu_T
[1], cpu_T
[1], 16 << s
->dflag
);
2712 gen_op_addl_A0_seg(s
, R_SS
);
2713 for(i
= 0;i
< 8; i
++) {
2714 /* ESP is not reloaded */
2716 gen_op_ld_T0_A0(OT_WORD
+ s
->dflag
+ s
->mem_index
);
2717 gen_op_mov_reg_T0(OT_WORD
+ s
->dflag
, 7 - i
);
2719 gen_op_addl_A0_im(2 << s
->dflag
);
2721 gen_op_mov_reg_T1(OT_WORD
+ s
->ss32
, R_ESP
);
2724 static void gen_enter(DisasContext
*s
, int esp_addend
, int level
)
2729 #ifdef TARGET_X86_64
2731 ot
= s
->dflag
? OT_QUAD
: OT_WORD
;
2734 gen_op_movl_A0_reg(R_ESP
);
2735 gen_op_addq_A0_im(-opsize
);
2736 tcg_gen_mov_tl(cpu_T
[1], cpu_A0
);
2739 gen_op_mov_TN_reg(OT_LONG
, 0, R_EBP
);
2740 gen_op_st_T0_A0(ot
+ s
->mem_index
);
2742 /* XXX: must save state */
2743 gen_helper_enter64_level(cpu_env
, tcg_const_i32(level
),
2744 tcg_const_i32((ot
== OT_QUAD
)),
2747 gen_op_mov_reg_T1(ot
, R_EBP
);
2748 tcg_gen_addi_tl(cpu_T
[1], cpu_T
[1], -esp_addend
+ (-opsize
* level
));
2749 gen_op_mov_reg_T1(OT_QUAD
, R_ESP
);
2753 ot
= s
->dflag
+ OT_WORD
;
2754 opsize
= 2 << s
->dflag
;
2756 gen_op_movl_A0_reg(R_ESP
);
2757 gen_op_addl_A0_im(-opsize
);
2759 gen_op_andl_A0_ffff();
2760 tcg_gen_mov_tl(cpu_T
[1], cpu_A0
);
2762 gen_op_addl_A0_seg(s
, R_SS
);
2764 gen_op_mov_TN_reg(OT_LONG
, 0, R_EBP
);
2765 gen_op_st_T0_A0(ot
+ s
->mem_index
);
2767 /* XXX: must save state */
2768 gen_helper_enter_level(cpu_env
, tcg_const_i32(level
),
2769 tcg_const_i32(s
->dflag
),
2772 gen_op_mov_reg_T1(ot
, R_EBP
);
2773 tcg_gen_addi_tl(cpu_T
[1], cpu_T
[1], -esp_addend
+ (-opsize
* level
));
2774 gen_op_mov_reg_T1(OT_WORD
+ s
->ss32
, R_ESP
);
2778 static void gen_exception(DisasContext
*s
, int trapno
, target_ulong cur_eip
)
2780 gen_update_cc_op(s
);
2781 gen_jmp_im(cur_eip
);
2782 gen_helper_raise_exception(cpu_env
, tcg_const_i32(trapno
));
2783 s
->is_jmp
= DISAS_TB_JUMP
;
2786 /* an interrupt is different from an exception because of the
2788 static void gen_interrupt(DisasContext
*s
, int intno
,
2789 target_ulong cur_eip
, target_ulong next_eip
)
2791 gen_update_cc_op(s
);
2792 gen_jmp_im(cur_eip
);
2793 gen_helper_raise_interrupt(cpu_env
, tcg_const_i32(intno
),
2794 tcg_const_i32(next_eip
- cur_eip
));
2795 s
->is_jmp
= DISAS_TB_JUMP
;
2798 static void gen_debug(DisasContext
*s
, target_ulong cur_eip
)
2800 gen_update_cc_op(s
);
2801 gen_jmp_im(cur_eip
);
2802 gen_helper_debug(cpu_env
);
2803 s
->is_jmp
= DISAS_TB_JUMP
;
2806 /* generate a generic end of block. Trace exception is also generated
2808 static void gen_eob(DisasContext
*s
)
2810 gen_update_cc_op(s
);
2811 if (s
->tb
->flags
& HF_INHIBIT_IRQ_MASK
) {
2812 gen_helper_reset_inhibit_irq(cpu_env
);
2814 if (s
->tb
->flags
& HF_RF_MASK
) {
2815 gen_helper_reset_rf(cpu_env
);
2817 if (s
->singlestep_enabled
) {
2818 gen_helper_debug(cpu_env
);
2820 gen_helper_single_step(cpu_env
);
2824 s
->is_jmp
= DISAS_TB_JUMP
;
2827 /* generate a jump to eip. No segment change must happen before as a
2828 direct call to the next block may occur */
2829 static void gen_jmp_tb(DisasContext
*s
, target_ulong eip
, int tb_num
)
2831 gen_update_cc_op(s
);
2832 set_cc_op(s
, CC_OP_DYNAMIC
);
2834 gen_goto_tb(s
, tb_num
, eip
);
2835 s
->is_jmp
= DISAS_TB_JUMP
;
2842 static void gen_jmp(DisasContext
*s
, target_ulong eip
)
2844 gen_jmp_tb(s
, eip
, 0);
2847 static inline void gen_ldq_env_A0(int idx
, int offset
)
2849 int mem_index
= (idx
>> 2) - 1;
2850 tcg_gen_qemu_ld64(cpu_tmp1_i64
, cpu_A0
, mem_index
);
2851 tcg_gen_st_i64(cpu_tmp1_i64
, cpu_env
, offset
);
2854 static inline void gen_stq_env_A0(int idx
, int offset
)
2856 int mem_index
= (idx
>> 2) - 1;
2857 tcg_gen_ld_i64(cpu_tmp1_i64
, cpu_env
, offset
);
2858 tcg_gen_qemu_st64(cpu_tmp1_i64
, cpu_A0
, mem_index
);
2861 static inline void gen_ldo_env_A0(int idx
, int offset
)
2863 int mem_index
= (idx
>> 2) - 1;
2864 tcg_gen_qemu_ld64(cpu_tmp1_i64
, cpu_A0
, mem_index
);
2865 tcg_gen_st_i64(cpu_tmp1_i64
, cpu_env
, offset
+ offsetof(XMMReg
, XMM_Q(0)));
2866 tcg_gen_addi_tl(cpu_tmp0
, cpu_A0
, 8);
2867 tcg_gen_qemu_ld64(cpu_tmp1_i64
, cpu_tmp0
, mem_index
);
2868 tcg_gen_st_i64(cpu_tmp1_i64
, cpu_env
, offset
+ offsetof(XMMReg
, XMM_Q(1)));
2871 static inline void gen_sto_env_A0(int idx
, int offset
)
2873 int mem_index
= (idx
>> 2) - 1;
2874 tcg_gen_ld_i64(cpu_tmp1_i64
, cpu_env
, offset
+ offsetof(XMMReg
, XMM_Q(0)));
2875 tcg_gen_qemu_st64(cpu_tmp1_i64
, cpu_A0
, mem_index
);
2876 tcg_gen_addi_tl(cpu_tmp0
, cpu_A0
, 8);
2877 tcg_gen_ld_i64(cpu_tmp1_i64
, cpu_env
, offset
+ offsetof(XMMReg
, XMM_Q(1)));
2878 tcg_gen_qemu_st64(cpu_tmp1_i64
, cpu_tmp0
, mem_index
);
2881 static inline void gen_op_movo(int d_offset
, int s_offset
)
2883 tcg_gen_ld_i64(cpu_tmp1_i64
, cpu_env
, s_offset
);
2884 tcg_gen_st_i64(cpu_tmp1_i64
, cpu_env
, d_offset
);
2885 tcg_gen_ld_i64(cpu_tmp1_i64
, cpu_env
, s_offset
+ 8);
2886 tcg_gen_st_i64(cpu_tmp1_i64
, cpu_env
, d_offset
+ 8);
2889 static inline void gen_op_movq(int d_offset
, int s_offset
)
2891 tcg_gen_ld_i64(cpu_tmp1_i64
, cpu_env
, s_offset
);
2892 tcg_gen_st_i64(cpu_tmp1_i64
, cpu_env
, d_offset
);
2895 static inline void gen_op_movl(int d_offset
, int s_offset
)
2897 tcg_gen_ld_i32(cpu_tmp2_i32
, cpu_env
, s_offset
);
2898 tcg_gen_st_i32(cpu_tmp2_i32
, cpu_env
, d_offset
);
2901 static inline void gen_op_movq_env_0(int d_offset
)
2903 tcg_gen_movi_i64(cpu_tmp1_i64
, 0);
2904 tcg_gen_st_i64(cpu_tmp1_i64
, cpu_env
, d_offset
);
2907 typedef void (*SSEFunc_i_ep
)(TCGv_i32 val
, TCGv_ptr env
, TCGv_ptr reg
);
2908 typedef void (*SSEFunc_l_ep
)(TCGv_i64 val
, TCGv_ptr env
, TCGv_ptr reg
);
2909 typedef void (*SSEFunc_0_epi
)(TCGv_ptr env
, TCGv_ptr reg
, TCGv_i32 val
);
2910 typedef void (*SSEFunc_0_epl
)(TCGv_ptr env
, TCGv_ptr reg
, TCGv_i64 val
);
2911 typedef void (*SSEFunc_0_epp
)(TCGv_ptr env
, TCGv_ptr reg_a
, TCGv_ptr reg_b
);
2912 typedef void (*SSEFunc_0_eppi
)(TCGv_ptr env
, TCGv_ptr reg_a
, TCGv_ptr reg_b
,
2914 typedef void (*SSEFunc_0_ppi
)(TCGv_ptr reg_a
, TCGv_ptr reg_b
, TCGv_i32 val
);
2915 typedef void (*SSEFunc_0_eppt
)(TCGv_ptr env
, TCGv_ptr reg_a
, TCGv_ptr reg_b
,
2918 #define SSE_SPECIAL ((void *)1)
2919 #define SSE_DUMMY ((void *)2)
2921 #define MMX_OP2(x) { gen_helper_ ## x ## _mmx, gen_helper_ ## x ## _xmm }
2922 #define SSE_FOP(x) { gen_helper_ ## x ## ps, gen_helper_ ## x ## pd, \
2923 gen_helper_ ## x ## ss, gen_helper_ ## x ## sd, }
2925 static const SSEFunc_0_epp sse_op_table1
[256][4] = {
2926 /* 3DNow! extensions */
2927 [0x0e] = { SSE_DUMMY
}, /* femms */
2928 [0x0f] = { SSE_DUMMY
}, /* pf... */
2929 /* pure SSE operations */
2930 [0x10] = { SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
}, /* movups, movupd, movss, movsd */
2931 [0x11] = { SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
}, /* movups, movupd, movss, movsd */
2932 [0x12] = { SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
}, /* movlps, movlpd, movsldup, movddup */
2933 [0x13] = { SSE_SPECIAL
, SSE_SPECIAL
}, /* movlps, movlpd */
2934 [0x14] = { gen_helper_punpckldq_xmm
, gen_helper_punpcklqdq_xmm
},
2935 [0x15] = { gen_helper_punpckhdq_xmm
, gen_helper_punpckhqdq_xmm
},
2936 [0x16] = { SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
}, /* movhps, movhpd, movshdup */
2937 [0x17] = { SSE_SPECIAL
, SSE_SPECIAL
}, /* movhps, movhpd */
2939 [0x28] = { SSE_SPECIAL
, SSE_SPECIAL
}, /* movaps, movapd */
2940 [0x29] = { SSE_SPECIAL
, SSE_SPECIAL
}, /* movaps, movapd */
2941 [0x2a] = { SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
}, /* cvtpi2ps, cvtpi2pd, cvtsi2ss, cvtsi2sd */
2942 [0x2b] = { SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
}, /* movntps, movntpd, movntss, movntsd */
2943 [0x2c] = { SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
}, /* cvttps2pi, cvttpd2pi, cvttsd2si, cvttss2si */
2944 [0x2d] = { SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
}, /* cvtps2pi, cvtpd2pi, cvtsd2si, cvtss2si */
2945 [0x2e] = { gen_helper_ucomiss
, gen_helper_ucomisd
},
2946 [0x2f] = { gen_helper_comiss
, gen_helper_comisd
},
2947 [0x50] = { SSE_SPECIAL
, SSE_SPECIAL
}, /* movmskps, movmskpd */
2948 [0x51] = SSE_FOP(sqrt
),
2949 [0x52] = { gen_helper_rsqrtps
, NULL
, gen_helper_rsqrtss
, NULL
},
2950 [0x53] = { gen_helper_rcpps
, NULL
, gen_helper_rcpss
, NULL
},
2951 [0x54] = { gen_helper_pand_xmm
, gen_helper_pand_xmm
}, /* andps, andpd */
2952 [0x55] = { gen_helper_pandn_xmm
, gen_helper_pandn_xmm
}, /* andnps, andnpd */
2953 [0x56] = { gen_helper_por_xmm
, gen_helper_por_xmm
}, /* orps, orpd */
2954 [0x57] = { gen_helper_pxor_xmm
, gen_helper_pxor_xmm
}, /* xorps, xorpd */
2955 [0x58] = SSE_FOP(add
),
2956 [0x59] = SSE_FOP(mul
),
2957 [0x5a] = { gen_helper_cvtps2pd
, gen_helper_cvtpd2ps
,
2958 gen_helper_cvtss2sd
, gen_helper_cvtsd2ss
},
2959 [0x5b] = { gen_helper_cvtdq2ps
, gen_helper_cvtps2dq
, gen_helper_cvttps2dq
},
2960 [0x5c] = SSE_FOP(sub
),
2961 [0x5d] = SSE_FOP(min
),
2962 [0x5e] = SSE_FOP(div
),
2963 [0x5f] = SSE_FOP(max
),
2965 [0xc2] = SSE_FOP(cmpeq
),
2966 [0xc6] = { (SSEFunc_0_epp
)gen_helper_shufps
,
2967 (SSEFunc_0_epp
)gen_helper_shufpd
}, /* XXX: casts */
2969 /* SSSE3, SSE4, MOVBE, CRC32, BMI1, BMI2, ADX. */
2970 [0x38] = { SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
},
2971 [0x3a] = { SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
},
2973 /* MMX ops and their SSE extensions */
2974 [0x60] = MMX_OP2(punpcklbw
),
2975 [0x61] = MMX_OP2(punpcklwd
),
2976 [0x62] = MMX_OP2(punpckldq
),
2977 [0x63] = MMX_OP2(packsswb
),
2978 [0x64] = MMX_OP2(pcmpgtb
),
2979 [0x65] = MMX_OP2(pcmpgtw
),
2980 [0x66] = MMX_OP2(pcmpgtl
),
2981 [0x67] = MMX_OP2(packuswb
),
2982 [0x68] = MMX_OP2(punpckhbw
),
2983 [0x69] = MMX_OP2(punpckhwd
),
2984 [0x6a] = MMX_OP2(punpckhdq
),
2985 [0x6b] = MMX_OP2(packssdw
),
2986 [0x6c] = { NULL
, gen_helper_punpcklqdq_xmm
},
2987 [0x6d] = { NULL
, gen_helper_punpckhqdq_xmm
},
2988 [0x6e] = { SSE_SPECIAL
, SSE_SPECIAL
}, /* movd mm, ea */
2989 [0x6f] = { SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
}, /* movq, movdqa, , movqdu */
2990 [0x70] = { (SSEFunc_0_epp
)gen_helper_pshufw_mmx
,
2991 (SSEFunc_0_epp
)gen_helper_pshufd_xmm
,
2992 (SSEFunc_0_epp
)gen_helper_pshufhw_xmm
,
2993 (SSEFunc_0_epp
)gen_helper_pshuflw_xmm
}, /* XXX: casts */
2994 [0x71] = { SSE_SPECIAL
, SSE_SPECIAL
}, /* shiftw */
2995 [0x72] = { SSE_SPECIAL
, SSE_SPECIAL
}, /* shiftd */
2996 [0x73] = { SSE_SPECIAL
, SSE_SPECIAL
}, /* shiftq */
2997 [0x74] = MMX_OP2(pcmpeqb
),
2998 [0x75] = MMX_OP2(pcmpeqw
),
2999 [0x76] = MMX_OP2(pcmpeql
),
3000 [0x77] = { SSE_DUMMY
}, /* emms */
3001 [0x78] = { NULL
, SSE_SPECIAL
, NULL
, SSE_SPECIAL
}, /* extrq_i, insertq_i */
3002 [0x79] = { NULL
, gen_helper_extrq_r
, NULL
, gen_helper_insertq_r
},
3003 [0x7c] = { NULL
, gen_helper_haddpd
, NULL
, gen_helper_haddps
},
3004 [0x7d] = { NULL
, gen_helper_hsubpd
, NULL
, gen_helper_hsubps
},
3005 [0x7e] = { SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
}, /* movd, movd, , movq */
3006 [0x7f] = { SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
}, /* movq, movdqa, movdqu */
3007 [0xc4] = { SSE_SPECIAL
, SSE_SPECIAL
}, /* pinsrw */
3008 [0xc5] = { SSE_SPECIAL
, SSE_SPECIAL
}, /* pextrw */
3009 [0xd0] = { NULL
, gen_helper_addsubpd
, NULL
, gen_helper_addsubps
},
3010 [0xd1] = MMX_OP2(psrlw
),
3011 [0xd2] = MMX_OP2(psrld
),
3012 [0xd3] = MMX_OP2(psrlq
),
3013 [0xd4] = MMX_OP2(paddq
),
3014 [0xd5] = MMX_OP2(pmullw
),
3015 [0xd6] = { NULL
, SSE_SPECIAL
, SSE_SPECIAL
, SSE_SPECIAL
},
3016 [0xd7] = { SSE_SPECIAL
, SSE_SPECIAL
}, /* pmovmskb */
3017 [0xd8] = MMX_OP2(psubusb
),
3018 [0xd9] = MMX_OP2(psubusw
),
3019 [0xda] = MMX_OP2(pminub
),
3020 [0xdb] = MMX_OP2(pand
),
3021 [0xdc] = MMX_OP2(paddusb
),
3022 [0xdd] = MMX_OP2(paddusw
),
3023 [0xde] = MMX_OP2(pmaxub
),
3024 [0xdf] = MMX_OP2(pandn
),
3025 [0xe0] = MMX_OP2(pavgb
),
3026 [0xe1] = MMX_OP2(psraw
),
3027 [0xe2] = MMX_OP2(psrad
),
3028 [0xe3] = MMX_OP2(pavgw
),
3029 [0xe4] = MMX_OP2(pmulhuw
),
3030 [0xe5] = MMX_OP2(pmulhw
),
3031 [0xe6] = { NULL
, gen_helper_cvttpd2dq
, gen_helper_cvtdq2pd
, gen_helper_cvtpd2dq
},
3032 [0xe7] = { SSE_SPECIAL
, SSE_SPECIAL
}, /* movntq, movntq */
3033 [0xe8] = MMX_OP2(psubsb
),
3034 [0xe9] = MMX_OP2(psubsw
),
3035 [0xea] = MMX_OP2(pminsw
),
3036 [0xeb] = MMX_OP2(por
),
3037 [0xec] = MMX_OP2(paddsb
),
3038 [0xed] = MMX_OP2(paddsw
),
3039 [0xee] = MMX_OP2(pmaxsw
),
3040 [0xef] = MMX_OP2(pxor
),
3041 [0xf0] = { NULL
, NULL
, NULL
, SSE_SPECIAL
}, /* lddqu */
3042 [0xf1] = MMX_OP2(psllw
),
3043 [0xf2] = MMX_OP2(pslld
),
3044 [0xf3] = MMX_OP2(psllq
),
3045 [0xf4] = MMX_OP2(pmuludq
),
3046 [0xf5] = MMX_OP2(pmaddwd
),
3047 [0xf6] = MMX_OP2(psadbw
),
3048 [0xf7] = { (SSEFunc_0_epp
)gen_helper_maskmov_mmx
,
3049 (SSEFunc_0_epp
)gen_helper_maskmov_xmm
}, /* XXX: casts */
3050 [0xf8] = MMX_OP2(psubb
),
3051 [0xf9] = MMX_OP2(psubw
),
3052 [0xfa] = MMX_OP2(psubl
),
3053 [0xfb] = MMX_OP2(psubq
),
3054 [0xfc] = MMX_OP2(paddb
),
3055 [0xfd] = MMX_OP2(paddw
),
3056 [0xfe] = MMX_OP2(paddl
),
3059 static const SSEFunc_0_epp sse_op_table2
[3 * 8][2] = {
3060 [0 + 2] = MMX_OP2(psrlw
),
3061 [0 + 4] = MMX_OP2(psraw
),
3062 [0 + 6] = MMX_OP2(psllw
),
3063 [8 + 2] = MMX_OP2(psrld
),
3064 [8 + 4] = MMX_OP2(psrad
),
3065 [8 + 6] = MMX_OP2(pslld
),
3066 [16 + 2] = MMX_OP2(psrlq
),
3067 [16 + 3] = { NULL
, gen_helper_psrldq_xmm
},
3068 [16 + 6] = MMX_OP2(psllq
),
3069 [16 + 7] = { NULL
, gen_helper_pslldq_xmm
},
3072 static const SSEFunc_0_epi sse_op_table3ai
[] = {
3073 gen_helper_cvtsi2ss
,
3077 #ifdef TARGET_X86_64
3078 static const SSEFunc_0_epl sse_op_table3aq
[] = {
3079 gen_helper_cvtsq2ss
,
3084 static const SSEFunc_i_ep sse_op_table3bi
[] = {
3085 gen_helper_cvttss2si
,
3086 gen_helper_cvtss2si
,
3087 gen_helper_cvttsd2si
,
3091 #ifdef TARGET_X86_64
3092 static const SSEFunc_l_ep sse_op_table3bq
[] = {
3093 gen_helper_cvttss2sq
,
3094 gen_helper_cvtss2sq
,
3095 gen_helper_cvttsd2sq
,
3100 static const SSEFunc_0_epp sse_op_table4
[8][4] = {
3111 static const SSEFunc_0_epp sse_op_table5
[256] = {
3112 [0x0c] = gen_helper_pi2fw
,
3113 [0x0d] = gen_helper_pi2fd
,
3114 [0x1c] = gen_helper_pf2iw
,
3115 [0x1d] = gen_helper_pf2id
,
3116 [0x8a] = gen_helper_pfnacc
,
3117 [0x8e] = gen_helper_pfpnacc
,
3118 [0x90] = gen_helper_pfcmpge
,
3119 [0x94] = gen_helper_pfmin
,
3120 [0x96] = gen_helper_pfrcp
,
3121 [0x97] = gen_helper_pfrsqrt
,
3122 [0x9a] = gen_helper_pfsub
,
3123 [0x9e] = gen_helper_pfadd
,
3124 [0xa0] = gen_helper_pfcmpgt
,
3125 [0xa4] = gen_helper_pfmax
,
3126 [0xa6] = gen_helper_movq
, /* pfrcpit1; no need to actually increase precision */
3127 [0xa7] = gen_helper_movq
, /* pfrsqit1 */
3128 [0xaa] = gen_helper_pfsubr
,
3129 [0xae] = gen_helper_pfacc
,
3130 [0xb0] = gen_helper_pfcmpeq
,
3131 [0xb4] = gen_helper_pfmul
,
3132 [0xb6] = gen_helper_movq
, /* pfrcpit2 */
3133 [0xb7] = gen_helper_pmulhrw_mmx
,
3134 [0xbb] = gen_helper_pswapd
,
3135 [0xbf] = gen_helper_pavgb_mmx
/* pavgusb */
3138 struct SSEOpHelper_epp
{
3139 SSEFunc_0_epp op
[2];
3143 struct SSEOpHelper_eppi
{
3144 SSEFunc_0_eppi op
[2];
3148 #define SSSE3_OP(x) { MMX_OP2(x), CPUID_EXT_SSSE3 }
3149 #define SSE41_OP(x) { { NULL, gen_helper_ ## x ## _xmm }, CPUID_EXT_SSE41 }
3150 #define SSE42_OP(x) { { NULL, gen_helper_ ## x ## _xmm }, CPUID_EXT_SSE42 }
3151 #define SSE41_SPECIAL { { NULL, SSE_SPECIAL }, CPUID_EXT_SSE41 }
3152 #define PCLMULQDQ_OP(x) { { NULL, gen_helper_ ## x ## _xmm }, \
3153 CPUID_EXT_PCLMULQDQ }
3154 #define AESNI_OP(x) { { NULL, gen_helper_ ## x ## _xmm }, CPUID_EXT_AES }
3156 static const struct SSEOpHelper_epp sse_op_table6
[256] = {
3157 [0x00] = SSSE3_OP(pshufb
),
3158 [0x01] = SSSE3_OP(phaddw
),
3159 [0x02] = SSSE3_OP(phaddd
),
3160 [0x03] = SSSE3_OP(phaddsw
),
3161 [0x04] = SSSE3_OP(pmaddubsw
),
3162 [0x05] = SSSE3_OP(phsubw
),
3163 [0x06] = SSSE3_OP(phsubd
),
3164 [0x07] = SSSE3_OP(phsubsw
),
3165 [0x08] = SSSE3_OP(psignb
),
3166 [0x09] = SSSE3_OP(psignw
),
3167 [0x0a] = SSSE3_OP(psignd
),
3168 [0x0b] = SSSE3_OP(pmulhrsw
),
3169 [0x10] = SSE41_OP(pblendvb
),
3170 [0x14] = SSE41_OP(blendvps
),
3171 [0x15] = SSE41_OP(blendvpd
),
3172 [0x17] = SSE41_OP(ptest
),
3173 [0x1c] = SSSE3_OP(pabsb
),
3174 [0x1d] = SSSE3_OP(pabsw
),
3175 [0x1e] = SSSE3_OP(pabsd
),
3176 [0x20] = SSE41_OP(pmovsxbw
),
3177 [0x21] = SSE41_OP(pmovsxbd
),
3178 [0x22] = SSE41_OP(pmovsxbq
),
3179 [0x23] = SSE41_OP(pmovsxwd
),
3180 [0x24] = SSE41_OP(pmovsxwq
),
3181 [0x25] = SSE41_OP(pmovsxdq
),
3182 [0x28] = SSE41_OP(pmuldq
),
3183 [0x29] = SSE41_OP(pcmpeqq
),
3184 [0x2a] = SSE41_SPECIAL
, /* movntqda */
3185 [0x2b] = SSE41_OP(packusdw
),
3186 [0x30] = SSE41_OP(pmovzxbw
),
3187 [0x31] = SSE41_OP(pmovzxbd
),
3188 [0x32] = SSE41_OP(pmovzxbq
),
3189 [0x33] = SSE41_OP(pmovzxwd
),
3190 [0x34] = SSE41_OP(pmovzxwq
),
3191 [0x35] = SSE41_OP(pmovzxdq
),
3192 [0x37] = SSE42_OP(pcmpgtq
),
3193 [0x38] = SSE41_OP(pminsb
),
3194 [0x39] = SSE41_OP(pminsd
),
3195 [0x3a] = SSE41_OP(pminuw
),
3196 [0x3b] = SSE41_OP(pminud
),
3197 [0x3c] = SSE41_OP(pmaxsb
),
3198 [0x3d] = SSE41_OP(pmaxsd
),
3199 [0x3e] = SSE41_OP(pmaxuw
),
3200 [0x3f] = SSE41_OP(pmaxud
),
3201 [0x40] = SSE41_OP(pmulld
),
3202 [0x41] = SSE41_OP(phminposuw
),
3203 [0xdb] = AESNI_OP(aesimc
),
3204 [0xdc] = AESNI_OP(aesenc
),
3205 [0xdd] = AESNI_OP(aesenclast
),
3206 [0xde] = AESNI_OP(aesdec
),
3207 [0xdf] = AESNI_OP(aesdeclast
),
3210 static const struct SSEOpHelper_eppi sse_op_table7
[256] = {
3211 [0x08] = SSE41_OP(roundps
),
3212 [0x09] = SSE41_OP(roundpd
),
3213 [0x0a] = SSE41_OP(roundss
),
3214 [0x0b] = SSE41_OP(roundsd
),
3215 [0x0c] = SSE41_OP(blendps
),
3216 [0x0d] = SSE41_OP(blendpd
),
3217 [0x0e] = SSE41_OP(pblendw
),
3218 [0x0f] = SSSE3_OP(palignr
),
3219 [0x14] = SSE41_SPECIAL
, /* pextrb */
3220 [0x15] = SSE41_SPECIAL
, /* pextrw */
3221 [0x16] = SSE41_SPECIAL
, /* pextrd/pextrq */
3222 [0x17] = SSE41_SPECIAL
, /* extractps */
3223 [0x20] = SSE41_SPECIAL
, /* pinsrb */
3224 [0x21] = SSE41_SPECIAL
, /* insertps */
3225 [0x22] = SSE41_SPECIAL
, /* pinsrd/pinsrq */
3226 [0x40] = SSE41_OP(dpps
),
3227 [0x41] = SSE41_OP(dppd
),
3228 [0x42] = SSE41_OP(mpsadbw
),
3229 [0x44] = PCLMULQDQ_OP(pclmulqdq
),
3230 [0x60] = SSE42_OP(pcmpestrm
),
3231 [0x61] = SSE42_OP(pcmpestri
),
3232 [0x62] = SSE42_OP(pcmpistrm
),
3233 [0x63] = SSE42_OP(pcmpistri
),
3234 [0xdf] = AESNI_OP(aeskeygenassist
),
3237 static void gen_sse(CPUX86State
*env
, DisasContext
*s
, int b
,
3238 target_ulong pc_start
, int rex_r
)
3240 int b1
, op1_offset
, op2_offset
, is_xmm
, val
, ot
;
3241 int modrm
, mod
, rm
, reg
, reg_addr
, offset_addr
;
3242 SSEFunc_0_epp sse_fn_epp
;
3243 SSEFunc_0_eppi sse_fn_eppi
;
3244 SSEFunc_0_ppi sse_fn_ppi
;
3245 SSEFunc_0_eppt sse_fn_eppt
;
3248 if (s
->prefix
& PREFIX_DATA
)
3250 else if (s
->prefix
& PREFIX_REPZ
)
3252 else if (s
->prefix
& PREFIX_REPNZ
)
3256 sse_fn_epp
= sse_op_table1
[b
][b1
];
3260 if ((b
<= 0x5f && b
>= 0x10) || b
== 0xc6 || b
== 0xc2) {
3270 /* simple MMX/SSE operation */
3271 if (s
->flags
& HF_TS_MASK
) {
3272 gen_exception(s
, EXCP07_PREX
, pc_start
- s
->cs_base
);
3275 if (s
->flags
& HF_EM_MASK
) {
3277 gen_exception(s
, EXCP06_ILLOP
, pc_start
- s
->cs_base
);
3280 if (is_xmm
&& !(s
->flags
& HF_OSFXSR_MASK
))
3281 if ((b
!= 0x38 && b
!= 0x3a) || (s
->prefix
& PREFIX_DATA
))
3284 if (!(s
->cpuid_ext2_features
& CPUID_EXT2_3DNOW
))
3287 gen_helper_emms(cpu_env
);
3292 gen_helper_emms(cpu_env
);
3295 /* prepare MMX state (XXX: optimize by storing fptt and fptags in
3296 the static cpu state) */
3298 gen_helper_enter_mmx(cpu_env
);
3301 modrm
= cpu_ldub_code(env
, s
->pc
++);
3302 reg
= ((modrm
>> 3) & 7);
3305 mod
= (modrm
>> 6) & 3;
3306 if (sse_fn_epp
== SSE_SPECIAL
) {
3309 case 0x0e7: /* movntq */
3312 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3313 gen_stq_env_A0(s
->mem_index
, offsetof(CPUX86State
,fpregs
[reg
].mmx
));
3315 case 0x1e7: /* movntdq */
3316 case 0x02b: /* movntps */
3317 case 0x12b: /* movntps */
3320 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3321 gen_sto_env_A0(s
->mem_index
, offsetof(CPUX86State
,xmm_regs
[reg
]));
3323 case 0x3f0: /* lddqu */
3326 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3327 gen_ldo_env_A0(s
->mem_index
, offsetof(CPUX86State
,xmm_regs
[reg
]));
3329 case 0x22b: /* movntss */
3330 case 0x32b: /* movntsd */
3333 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3335 gen_stq_env_A0(s
->mem_index
, offsetof(CPUX86State
,
3338 tcg_gen_ld32u_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,
3339 xmm_regs
[reg
].XMM_L(0)));
3340 gen_op_st_T0_A0(OT_LONG
+ s
->mem_index
);
3343 case 0x6e: /* movd mm, ea */
3344 #ifdef TARGET_X86_64
3345 if (s
->dflag
== 2) {
3346 gen_ldst_modrm(env
, s
, modrm
, OT_QUAD
, OR_TMP0
, 0);
3347 tcg_gen_st_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,fpregs
[reg
].mmx
));
3351 gen_ldst_modrm(env
, s
, modrm
, OT_LONG
, OR_TMP0
, 0);
3352 tcg_gen_addi_ptr(cpu_ptr0
, cpu_env
,
3353 offsetof(CPUX86State
,fpregs
[reg
].mmx
));
3354 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
3355 gen_helper_movl_mm_T0_mmx(cpu_ptr0
, cpu_tmp2_i32
);
3358 case 0x16e: /* movd xmm, ea */
3359 #ifdef TARGET_X86_64
3360 if (s
->dflag
== 2) {
3361 gen_ldst_modrm(env
, s
, modrm
, OT_QUAD
, OR_TMP0
, 0);
3362 tcg_gen_addi_ptr(cpu_ptr0
, cpu_env
,
3363 offsetof(CPUX86State
,xmm_regs
[reg
]));
3364 gen_helper_movq_mm_T0_xmm(cpu_ptr0
, cpu_T
[0]);
3368 gen_ldst_modrm(env
, s
, modrm
, OT_LONG
, OR_TMP0
, 0);
3369 tcg_gen_addi_ptr(cpu_ptr0
, cpu_env
,
3370 offsetof(CPUX86State
,xmm_regs
[reg
]));
3371 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
3372 gen_helper_movl_mm_T0_xmm(cpu_ptr0
, cpu_tmp2_i32
);
3375 case 0x6f: /* movq mm, ea */
3377 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3378 gen_ldq_env_A0(s
->mem_index
, offsetof(CPUX86State
,fpregs
[reg
].mmx
));
3381 tcg_gen_ld_i64(cpu_tmp1_i64
, cpu_env
,
3382 offsetof(CPUX86State
,fpregs
[rm
].mmx
));
3383 tcg_gen_st_i64(cpu_tmp1_i64
, cpu_env
,
3384 offsetof(CPUX86State
,fpregs
[reg
].mmx
));
3387 case 0x010: /* movups */
3388 case 0x110: /* movupd */
3389 case 0x028: /* movaps */
3390 case 0x128: /* movapd */
3391 case 0x16f: /* movdqa xmm, ea */
3392 case 0x26f: /* movdqu xmm, ea */
3394 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3395 gen_ldo_env_A0(s
->mem_index
, offsetof(CPUX86State
,xmm_regs
[reg
]));
3397 rm
= (modrm
& 7) | REX_B(s
);
3398 gen_op_movo(offsetof(CPUX86State
,xmm_regs
[reg
]),
3399 offsetof(CPUX86State
,xmm_regs
[rm
]));
3402 case 0x210: /* movss xmm, ea */
3404 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3405 gen_op_ld_T0_A0(OT_LONG
+ s
->mem_index
);
3406 tcg_gen_st32_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(0)));
3408 tcg_gen_st32_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(1)));
3409 tcg_gen_st32_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(2)));
3410 tcg_gen_st32_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(3)));
3412 rm
= (modrm
& 7) | REX_B(s
);
3413 gen_op_movl(offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(0)),
3414 offsetof(CPUX86State
,xmm_regs
[rm
].XMM_L(0)));
3417 case 0x310: /* movsd xmm, ea */
3419 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3420 gen_ldq_env_A0(s
->mem_index
, offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(0)));
3422 tcg_gen_st32_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(2)));
3423 tcg_gen_st32_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(3)));
3425 rm
= (modrm
& 7) | REX_B(s
);
3426 gen_op_movq(offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(0)),
3427 offsetof(CPUX86State
,xmm_regs
[rm
].XMM_Q(0)));
3430 case 0x012: /* movlps */
3431 case 0x112: /* movlpd */
3433 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3434 gen_ldq_env_A0(s
->mem_index
, offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(0)));
3437 rm
= (modrm
& 7) | REX_B(s
);
3438 gen_op_movq(offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(0)),
3439 offsetof(CPUX86State
,xmm_regs
[rm
].XMM_Q(1)));
3442 case 0x212: /* movsldup */
3444 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3445 gen_ldo_env_A0(s
->mem_index
, offsetof(CPUX86State
,xmm_regs
[reg
]));
3447 rm
= (modrm
& 7) | REX_B(s
);
3448 gen_op_movl(offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(0)),
3449 offsetof(CPUX86State
,xmm_regs
[rm
].XMM_L(0)));
3450 gen_op_movl(offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(2)),
3451 offsetof(CPUX86State
,xmm_regs
[rm
].XMM_L(2)));
3453 gen_op_movl(offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(1)),
3454 offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(0)));
3455 gen_op_movl(offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(3)),
3456 offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(2)));
3458 case 0x312: /* movddup */
3460 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3461 gen_ldq_env_A0(s
->mem_index
, offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(0)));
3463 rm
= (modrm
& 7) | REX_B(s
);
3464 gen_op_movq(offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(0)),
3465 offsetof(CPUX86State
,xmm_regs
[rm
].XMM_Q(0)));
3467 gen_op_movq(offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(1)),
3468 offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(0)));
3470 case 0x016: /* movhps */
3471 case 0x116: /* movhpd */
3473 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3474 gen_ldq_env_A0(s
->mem_index
, offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(1)));
3477 rm
= (modrm
& 7) | REX_B(s
);
3478 gen_op_movq(offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(1)),
3479 offsetof(CPUX86State
,xmm_regs
[rm
].XMM_Q(0)));
3482 case 0x216: /* movshdup */
3484 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3485 gen_ldo_env_A0(s
->mem_index
, offsetof(CPUX86State
,xmm_regs
[reg
]));
3487 rm
= (modrm
& 7) | REX_B(s
);
3488 gen_op_movl(offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(1)),
3489 offsetof(CPUX86State
,xmm_regs
[rm
].XMM_L(1)));
3490 gen_op_movl(offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(3)),
3491 offsetof(CPUX86State
,xmm_regs
[rm
].XMM_L(3)));
3493 gen_op_movl(offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(0)),
3494 offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(1)));
3495 gen_op_movl(offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(2)),
3496 offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(3)));
3501 int bit_index
, field_length
;
3503 if (b1
== 1 && reg
!= 0)
3505 field_length
= cpu_ldub_code(env
, s
->pc
++) & 0x3F;
3506 bit_index
= cpu_ldub_code(env
, s
->pc
++) & 0x3F;
3507 tcg_gen_addi_ptr(cpu_ptr0
, cpu_env
,
3508 offsetof(CPUX86State
,xmm_regs
[reg
]));
3510 gen_helper_extrq_i(cpu_env
, cpu_ptr0
,
3511 tcg_const_i32(bit_index
),
3512 tcg_const_i32(field_length
));
3514 gen_helper_insertq_i(cpu_env
, cpu_ptr0
,
3515 tcg_const_i32(bit_index
),
3516 tcg_const_i32(field_length
));
3519 case 0x7e: /* movd ea, mm */
3520 #ifdef TARGET_X86_64
3521 if (s
->dflag
== 2) {
3522 tcg_gen_ld_i64(cpu_T
[0], cpu_env
,
3523 offsetof(CPUX86State
,fpregs
[reg
].mmx
));
3524 gen_ldst_modrm(env
, s
, modrm
, OT_QUAD
, OR_TMP0
, 1);
3528 tcg_gen_ld32u_tl(cpu_T
[0], cpu_env
,
3529 offsetof(CPUX86State
,fpregs
[reg
].mmx
.MMX_L(0)));
3530 gen_ldst_modrm(env
, s
, modrm
, OT_LONG
, OR_TMP0
, 1);
3533 case 0x17e: /* movd ea, xmm */
3534 #ifdef TARGET_X86_64
3535 if (s
->dflag
== 2) {
3536 tcg_gen_ld_i64(cpu_T
[0], cpu_env
,
3537 offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(0)));
3538 gen_ldst_modrm(env
, s
, modrm
, OT_QUAD
, OR_TMP0
, 1);
3542 tcg_gen_ld32u_tl(cpu_T
[0], cpu_env
,
3543 offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(0)));
3544 gen_ldst_modrm(env
, s
, modrm
, OT_LONG
, OR_TMP0
, 1);
3547 case 0x27e: /* movq xmm, ea */
3549 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3550 gen_ldq_env_A0(s
->mem_index
, offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(0)));
3552 rm
= (modrm
& 7) | REX_B(s
);
3553 gen_op_movq(offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(0)),
3554 offsetof(CPUX86State
,xmm_regs
[rm
].XMM_Q(0)));
3556 gen_op_movq_env_0(offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(1)));
3558 case 0x7f: /* movq ea, mm */
3560 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3561 gen_stq_env_A0(s
->mem_index
, offsetof(CPUX86State
,fpregs
[reg
].mmx
));
3564 gen_op_movq(offsetof(CPUX86State
,fpregs
[rm
].mmx
),
3565 offsetof(CPUX86State
,fpregs
[reg
].mmx
));
3568 case 0x011: /* movups */
3569 case 0x111: /* movupd */
3570 case 0x029: /* movaps */
3571 case 0x129: /* movapd */
3572 case 0x17f: /* movdqa ea, xmm */
3573 case 0x27f: /* movdqu ea, xmm */
3575 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3576 gen_sto_env_A0(s
->mem_index
, offsetof(CPUX86State
,xmm_regs
[reg
]));
3578 rm
= (modrm
& 7) | REX_B(s
);
3579 gen_op_movo(offsetof(CPUX86State
,xmm_regs
[rm
]),
3580 offsetof(CPUX86State
,xmm_regs
[reg
]));
3583 case 0x211: /* movss ea, xmm */
3585 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3586 tcg_gen_ld32u_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(0)));
3587 gen_op_st_T0_A0(OT_LONG
+ s
->mem_index
);
3589 rm
= (modrm
& 7) | REX_B(s
);
3590 gen_op_movl(offsetof(CPUX86State
,xmm_regs
[rm
].XMM_L(0)),
3591 offsetof(CPUX86State
,xmm_regs
[reg
].XMM_L(0)));
3594 case 0x311: /* movsd ea, xmm */
3596 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3597 gen_stq_env_A0(s
->mem_index
, offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(0)));
3599 rm
= (modrm
& 7) | REX_B(s
);
3600 gen_op_movq(offsetof(CPUX86State
,xmm_regs
[rm
].XMM_Q(0)),
3601 offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(0)));
3604 case 0x013: /* movlps */
3605 case 0x113: /* movlpd */
3607 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3608 gen_stq_env_A0(s
->mem_index
, offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(0)));
3613 case 0x017: /* movhps */
3614 case 0x117: /* movhpd */
3616 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3617 gen_stq_env_A0(s
->mem_index
, offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(1)));
3622 case 0x71: /* shift mm, im */
3625 case 0x171: /* shift xmm, im */
3631 val
= cpu_ldub_code(env
, s
->pc
++);
3633 gen_op_movl_T0_im(val
);
3634 tcg_gen_st32_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,xmm_t0
.XMM_L(0)));
3636 tcg_gen_st32_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,xmm_t0
.XMM_L(1)));
3637 op1_offset
= offsetof(CPUX86State
,xmm_t0
);
3639 gen_op_movl_T0_im(val
);
3640 tcg_gen_st32_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,mmx_t0
.MMX_L(0)));
3642 tcg_gen_st32_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,mmx_t0
.MMX_L(1)));
3643 op1_offset
= offsetof(CPUX86State
,mmx_t0
);
3645 sse_fn_epp
= sse_op_table2
[((b
- 1) & 3) * 8 +
3646 (((modrm
>> 3)) & 7)][b1
];
3651 rm
= (modrm
& 7) | REX_B(s
);
3652 op2_offset
= offsetof(CPUX86State
,xmm_regs
[rm
]);
3655 op2_offset
= offsetof(CPUX86State
,fpregs
[rm
].mmx
);
3657 tcg_gen_addi_ptr(cpu_ptr0
, cpu_env
, op2_offset
);
3658 tcg_gen_addi_ptr(cpu_ptr1
, cpu_env
, op1_offset
);
3659 sse_fn_epp(cpu_env
, cpu_ptr0
, cpu_ptr1
);
3661 case 0x050: /* movmskps */
3662 rm
= (modrm
& 7) | REX_B(s
);
3663 tcg_gen_addi_ptr(cpu_ptr0
, cpu_env
,
3664 offsetof(CPUX86State
,xmm_regs
[rm
]));
3665 gen_helper_movmskps(cpu_tmp2_i32
, cpu_env
, cpu_ptr0
);
3666 tcg_gen_extu_i32_tl(cpu_T
[0], cpu_tmp2_i32
);
3667 gen_op_mov_reg_T0(OT_LONG
, reg
);
3669 case 0x150: /* movmskpd */
3670 rm
= (modrm
& 7) | REX_B(s
);
3671 tcg_gen_addi_ptr(cpu_ptr0
, cpu_env
,
3672 offsetof(CPUX86State
,xmm_regs
[rm
]));
3673 gen_helper_movmskpd(cpu_tmp2_i32
, cpu_env
, cpu_ptr0
);
3674 tcg_gen_extu_i32_tl(cpu_T
[0], cpu_tmp2_i32
);
3675 gen_op_mov_reg_T0(OT_LONG
, reg
);
3677 case 0x02a: /* cvtpi2ps */
3678 case 0x12a: /* cvtpi2pd */
3679 gen_helper_enter_mmx(cpu_env
);
3681 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3682 op2_offset
= offsetof(CPUX86State
,mmx_t0
);
3683 gen_ldq_env_A0(s
->mem_index
, op2_offset
);
3686 op2_offset
= offsetof(CPUX86State
,fpregs
[rm
].mmx
);
3688 op1_offset
= offsetof(CPUX86State
,xmm_regs
[reg
]);
3689 tcg_gen_addi_ptr(cpu_ptr0
, cpu_env
, op1_offset
);
3690 tcg_gen_addi_ptr(cpu_ptr1
, cpu_env
, op2_offset
);
3693 gen_helper_cvtpi2ps(cpu_env
, cpu_ptr0
, cpu_ptr1
);
3697 gen_helper_cvtpi2pd(cpu_env
, cpu_ptr0
, cpu_ptr1
);
3701 case 0x22a: /* cvtsi2ss */
3702 case 0x32a: /* cvtsi2sd */
3703 ot
= (s
->dflag
== 2) ? OT_QUAD
: OT_LONG
;
3704 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 0);
3705 op1_offset
= offsetof(CPUX86State
,xmm_regs
[reg
]);
3706 tcg_gen_addi_ptr(cpu_ptr0
, cpu_env
, op1_offset
);
3707 if (ot
== OT_LONG
) {
3708 SSEFunc_0_epi sse_fn_epi
= sse_op_table3ai
[(b
>> 8) & 1];
3709 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
3710 sse_fn_epi(cpu_env
, cpu_ptr0
, cpu_tmp2_i32
);
3712 #ifdef TARGET_X86_64
3713 SSEFunc_0_epl sse_fn_epl
= sse_op_table3aq
[(b
>> 8) & 1];
3714 sse_fn_epl(cpu_env
, cpu_ptr0
, cpu_T
[0]);
3720 case 0x02c: /* cvttps2pi */
3721 case 0x12c: /* cvttpd2pi */
3722 case 0x02d: /* cvtps2pi */
3723 case 0x12d: /* cvtpd2pi */
3724 gen_helper_enter_mmx(cpu_env
);
3726 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3727 op2_offset
= offsetof(CPUX86State
,xmm_t0
);
3728 gen_ldo_env_A0(s
->mem_index
, op2_offset
);
3730 rm
= (modrm
& 7) | REX_B(s
);
3731 op2_offset
= offsetof(CPUX86State
,xmm_regs
[rm
]);
3733 op1_offset
= offsetof(CPUX86State
,fpregs
[reg
& 7].mmx
);
3734 tcg_gen_addi_ptr(cpu_ptr0
, cpu_env
, op1_offset
);
3735 tcg_gen_addi_ptr(cpu_ptr1
, cpu_env
, op2_offset
);
3738 gen_helper_cvttps2pi(cpu_env
, cpu_ptr0
, cpu_ptr1
);
3741 gen_helper_cvttpd2pi(cpu_env
, cpu_ptr0
, cpu_ptr1
);
3744 gen_helper_cvtps2pi(cpu_env
, cpu_ptr0
, cpu_ptr1
);
3747 gen_helper_cvtpd2pi(cpu_env
, cpu_ptr0
, cpu_ptr1
);
3751 case 0x22c: /* cvttss2si */
3752 case 0x32c: /* cvttsd2si */
3753 case 0x22d: /* cvtss2si */
3754 case 0x32d: /* cvtsd2si */
3755 ot
= (s
->dflag
== 2) ? OT_QUAD
: OT_LONG
;
3757 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3759 gen_ldq_env_A0(s
->mem_index
, offsetof(CPUX86State
,xmm_t0
.XMM_Q(0)));
3761 gen_op_ld_T0_A0(OT_LONG
+ s
->mem_index
);
3762 tcg_gen_st32_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,xmm_t0
.XMM_L(0)));
3764 op2_offset
= offsetof(CPUX86State
,xmm_t0
);
3766 rm
= (modrm
& 7) | REX_B(s
);
3767 op2_offset
= offsetof(CPUX86State
,xmm_regs
[rm
]);
3769 tcg_gen_addi_ptr(cpu_ptr0
, cpu_env
, op2_offset
);
3770 if (ot
== OT_LONG
) {
3771 SSEFunc_i_ep sse_fn_i_ep
=
3772 sse_op_table3bi
[((b
>> 7) & 2) | (b
& 1)];
3773 sse_fn_i_ep(cpu_tmp2_i32
, cpu_env
, cpu_ptr0
);
3774 tcg_gen_extu_i32_tl(cpu_T
[0], cpu_tmp2_i32
);
3776 #ifdef TARGET_X86_64
3777 SSEFunc_l_ep sse_fn_l_ep
=
3778 sse_op_table3bq
[((b
>> 7) & 2) | (b
& 1)];
3779 sse_fn_l_ep(cpu_T
[0], cpu_env
, cpu_ptr0
);
3784 gen_op_mov_reg_T0(ot
, reg
);
3786 case 0xc4: /* pinsrw */
3789 gen_ldst_modrm(env
, s
, modrm
, OT_WORD
, OR_TMP0
, 0);
3790 val
= cpu_ldub_code(env
, s
->pc
++);
3793 tcg_gen_st16_tl(cpu_T
[0], cpu_env
,
3794 offsetof(CPUX86State
,xmm_regs
[reg
].XMM_W(val
)));
3797 tcg_gen_st16_tl(cpu_T
[0], cpu_env
,
3798 offsetof(CPUX86State
,fpregs
[reg
].mmx
.MMX_W(val
)));
3801 case 0xc5: /* pextrw */
3805 ot
= (s
->dflag
== 2) ? OT_QUAD
: OT_LONG
;
3806 val
= cpu_ldub_code(env
, s
->pc
++);
3809 rm
= (modrm
& 7) | REX_B(s
);
3810 tcg_gen_ld16u_tl(cpu_T
[0], cpu_env
,
3811 offsetof(CPUX86State
,xmm_regs
[rm
].XMM_W(val
)));
3815 tcg_gen_ld16u_tl(cpu_T
[0], cpu_env
,
3816 offsetof(CPUX86State
,fpregs
[rm
].mmx
.MMX_W(val
)));
3818 reg
= ((modrm
>> 3) & 7) | rex_r
;
3819 gen_op_mov_reg_T0(ot
, reg
);
3821 case 0x1d6: /* movq ea, xmm */
3823 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3824 gen_stq_env_A0(s
->mem_index
, offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(0)));
3826 rm
= (modrm
& 7) | REX_B(s
);
3827 gen_op_movq(offsetof(CPUX86State
,xmm_regs
[rm
].XMM_Q(0)),
3828 offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(0)));
3829 gen_op_movq_env_0(offsetof(CPUX86State
,xmm_regs
[rm
].XMM_Q(1)));
3832 case 0x2d6: /* movq2dq */
3833 gen_helper_enter_mmx(cpu_env
);
3835 gen_op_movq(offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(0)),
3836 offsetof(CPUX86State
,fpregs
[rm
].mmx
));
3837 gen_op_movq_env_0(offsetof(CPUX86State
,xmm_regs
[reg
].XMM_Q(1)));
3839 case 0x3d6: /* movdq2q */
3840 gen_helper_enter_mmx(cpu_env
);
3841 rm
= (modrm
& 7) | REX_B(s
);
3842 gen_op_movq(offsetof(CPUX86State
,fpregs
[reg
& 7].mmx
),
3843 offsetof(CPUX86State
,xmm_regs
[rm
].XMM_Q(0)));
3845 case 0xd7: /* pmovmskb */
3850 rm
= (modrm
& 7) | REX_B(s
);
3851 tcg_gen_addi_ptr(cpu_ptr0
, cpu_env
, offsetof(CPUX86State
,xmm_regs
[rm
]));
3852 gen_helper_pmovmskb_xmm(cpu_tmp2_i32
, cpu_env
, cpu_ptr0
);
3855 tcg_gen_addi_ptr(cpu_ptr0
, cpu_env
, offsetof(CPUX86State
,fpregs
[rm
].mmx
));
3856 gen_helper_pmovmskb_mmx(cpu_tmp2_i32
, cpu_env
, cpu_ptr0
);
3858 tcg_gen_extu_i32_tl(cpu_T
[0], cpu_tmp2_i32
);
3859 reg
= ((modrm
>> 3) & 7) | rex_r
;
3860 gen_op_mov_reg_T0(OT_LONG
, reg
);
3866 if ((b
& 0xf0) == 0xf0) {
3869 modrm
= cpu_ldub_code(env
, s
->pc
++);
3871 reg
= ((modrm
>> 3) & 7) | rex_r
;
3872 mod
= (modrm
>> 6) & 3;
3877 sse_fn_epp
= sse_op_table6
[b
].op
[b1
];
3881 if (!(s
->cpuid_ext_features
& sse_op_table6
[b
].ext_mask
))
3885 op1_offset
= offsetof(CPUX86State
,xmm_regs
[reg
]);
3887 op2_offset
= offsetof(CPUX86State
,xmm_regs
[rm
| REX_B(s
)]);
3889 op2_offset
= offsetof(CPUX86State
,xmm_t0
);
3890 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3892 case 0x20: case 0x30: /* pmovsxbw, pmovzxbw */
3893 case 0x23: case 0x33: /* pmovsxwd, pmovzxwd */
3894 case 0x25: case 0x35: /* pmovsxdq, pmovzxdq */
3895 gen_ldq_env_A0(s
->mem_index
, op2_offset
+
3896 offsetof(XMMReg
, XMM_Q(0)));
3898 case 0x21: case 0x31: /* pmovsxbd, pmovzxbd */
3899 case 0x24: case 0x34: /* pmovsxwq, pmovzxwq */
3900 tcg_gen_qemu_ld32u(cpu_tmp0
, cpu_A0
,
3901 (s
->mem_index
>> 2) - 1);
3902 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_tmp0
);
3903 tcg_gen_st_i32(cpu_tmp2_i32
, cpu_env
, op2_offset
+
3904 offsetof(XMMReg
, XMM_L(0)));
3906 case 0x22: case 0x32: /* pmovsxbq, pmovzxbq */
3907 tcg_gen_qemu_ld16u(cpu_tmp0
, cpu_A0
,
3908 (s
->mem_index
>> 2) - 1);
3909 tcg_gen_st16_tl(cpu_tmp0
, cpu_env
, op2_offset
+
3910 offsetof(XMMReg
, XMM_W(0)));
3912 case 0x2a: /* movntqda */
3913 gen_ldo_env_A0(s
->mem_index
, op1_offset
);
3916 gen_ldo_env_A0(s
->mem_index
, op2_offset
);
3920 op1_offset
= offsetof(CPUX86State
,fpregs
[reg
].mmx
);
3922 op2_offset
= offsetof(CPUX86State
,fpregs
[rm
].mmx
);
3924 op2_offset
= offsetof(CPUX86State
,mmx_t0
);
3925 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
3926 gen_ldq_env_A0(s
->mem_index
, op2_offset
);
3929 if (sse_fn_epp
== SSE_SPECIAL
) {
3933 tcg_gen_addi_ptr(cpu_ptr0
, cpu_env
, op1_offset
);
3934 tcg_gen_addi_ptr(cpu_ptr1
, cpu_env
, op2_offset
);
3935 sse_fn_epp(cpu_env
, cpu_ptr0
, cpu_ptr1
);
3938 set_cc_op(s
, CC_OP_EFLAGS
);
3945 /* Various integer extensions at 0f 38 f[0-f]. */
3946 b
= modrm
| (b1
<< 8);
3947 modrm
= cpu_ldub_code(env
, s
->pc
++);
3948 reg
= ((modrm
>> 3) & 7) | rex_r
;
3951 case 0x3f0: /* crc32 Gd,Eb */
3952 case 0x3f1: /* crc32 Gd,Ey */
3954 if (!(s
->cpuid_ext_features
& CPUID_EXT_SSE42
)) {
3957 if ((b
& 0xff) == 0xf0) {
3959 } else if (s
->dflag
!= 2) {
3960 ot
= (s
->prefix
& PREFIX_DATA
? OT_WORD
: OT_LONG
);
3965 gen_op_mov_TN_reg(OT_LONG
, 0, reg
);
3966 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
3967 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 0);
3968 gen_helper_crc32(cpu_T
[0], cpu_tmp2_i32
,
3969 cpu_T
[0], tcg_const_i32(8 << ot
));
3971 ot
= (s
->dflag
== 2) ? OT_QUAD
: OT_LONG
;
3972 gen_op_mov_reg_T0(ot
, reg
);
3975 case 0x1f0: /* crc32 or movbe */
3977 /* For these insns, the f3 prefix is supposed to have priority
3978 over the 66 prefix, but that's not what we implement above
3980 if (s
->prefix
& PREFIX_REPNZ
) {
3984 case 0x0f0: /* movbe Gy,My */
3985 case 0x0f1: /* movbe My,Gy */
3986 if (!(s
->cpuid_ext_features
& CPUID_EXT_MOVBE
)) {
3989 if (s
->dflag
!= 2) {
3990 ot
= (s
->prefix
& PREFIX_DATA
? OT_WORD
: OT_LONG
);
3995 /* Load the data incoming to the bswap. Note that the TCG
3996 implementation of bswap requires the input be zero
3997 extended. In the case of the loads, we simply know that
3998 gen_op_ld_v via gen_ldst_modrm does that already. */
4000 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 0);
4004 tcg_gen_ext16u_tl(cpu_T
[0], cpu_regs
[reg
]);
4007 tcg_gen_ext32u_tl(cpu_T
[0], cpu_regs
[reg
]);
4010 tcg_gen_mov_tl(cpu_T
[0], cpu_regs
[reg
]);
4017 tcg_gen_bswap16_tl(cpu_T
[0], cpu_T
[0]);
4020 tcg_gen_bswap32_tl(cpu_T
[0], cpu_T
[0]);
4022 #ifdef TARGET_X86_64
4024 tcg_gen_bswap64_tl(cpu_T
[0], cpu_T
[0]);
4030 gen_op_mov_reg_T0(ot
, reg
);
4032 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 1);
4036 case 0x0f2: /* andn Gy, By, Ey */
4037 if (!(s
->cpuid_7_0_ebx_features
& CPUID_7_0_EBX_BMI1
)
4038 || !(s
->prefix
& PREFIX_VEX
)
4042 ot
= s
->dflag
== 2 ? OT_QUAD
: OT_LONG
;
4043 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 0);
4044 tcg_gen_andc_tl(cpu_T
[0], cpu_regs
[s
->vex_v
], cpu_T
[0]);
4045 gen_op_mov_reg_T0(ot
, reg
);
4046 gen_op_update1_cc();
4047 set_cc_op(s
, CC_OP_LOGICB
+ ot
);
4050 case 0x0f7: /* bextr Gy, Ey, By */
4051 if (!(s
->cpuid_7_0_ebx_features
& CPUID_7_0_EBX_BMI1
)
4052 || !(s
->prefix
& PREFIX_VEX
)
4056 ot
= s
->dflag
== 2 ? OT_QUAD
: OT_LONG
;
4060 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 0);
4061 /* Extract START, and shift the operand.
4062 Shifts larger than operand size get zeros. */
4063 tcg_gen_ext8u_tl(cpu_A0
, cpu_regs
[s
->vex_v
]);
4064 tcg_gen_shr_tl(cpu_T
[0], cpu_T
[0], cpu_A0
);
4066 bound
= tcg_const_tl(ot
== OT_QUAD
? 63 : 31);
4067 zero
= tcg_const_tl(0);
4068 tcg_gen_movcond_tl(TCG_COND_LEU
, cpu_T
[0], cpu_A0
, bound
,
4070 tcg_temp_free(zero
);
4072 /* Extract the LEN into a mask. Lengths larger than
4073 operand size get all ones. */
4074 tcg_gen_shri_tl(cpu_A0
, cpu_regs
[s
->vex_v
], 8);
4075 tcg_gen_ext8u_tl(cpu_A0
, cpu_A0
);
4076 tcg_gen_movcond_tl(TCG_COND_LEU
, cpu_A0
, cpu_A0
, bound
,
4078 tcg_temp_free(bound
);
4079 tcg_gen_movi_tl(cpu_T
[1], 1);
4080 tcg_gen_shl_tl(cpu_T
[1], cpu_T
[1], cpu_A0
);
4081 tcg_gen_subi_tl(cpu_T
[1], cpu_T
[1], 1);
4082 tcg_gen_and_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
4084 gen_op_mov_reg_T0(ot
, reg
);
4085 gen_op_update1_cc();
4086 set_cc_op(s
, CC_OP_LOGICB
+ ot
);
4090 case 0x0f5: /* bzhi Gy, Ey, By */
4091 if (!(s
->cpuid_7_0_ebx_features
& CPUID_7_0_EBX_BMI2
)
4092 || !(s
->prefix
& PREFIX_VEX
)
4096 ot
= s
->dflag
== 2 ? OT_QUAD
: OT_LONG
;
4097 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 0);
4098 tcg_gen_ext8u_tl(cpu_T
[1], cpu_regs
[s
->vex_v
]);
4100 TCGv bound
= tcg_const_tl(ot
== OT_QUAD
? 63 : 31);
4101 /* Note that since we're using BMILG (in order to get O
4102 cleared) we need to store the inverse into C. */
4103 tcg_gen_setcond_tl(TCG_COND_LT
, cpu_cc_src
,
4105 tcg_gen_movcond_tl(TCG_COND_GT
, cpu_T
[1], cpu_T
[1],
4106 bound
, bound
, cpu_T
[1]);
4107 tcg_temp_free(bound
);
4109 tcg_gen_movi_tl(cpu_A0
, -1);
4110 tcg_gen_shl_tl(cpu_A0
, cpu_A0
, cpu_T
[1]);
4111 tcg_gen_andc_tl(cpu_T
[0], cpu_T
[0], cpu_A0
);
4112 gen_op_mov_reg_T0(ot
, reg
);
4113 gen_op_update1_cc();
4114 set_cc_op(s
, CC_OP_BMILGB
+ ot
);
4117 case 0x3f6: /* mulx By, Gy, rdx, Ey */
4118 if (!(s
->cpuid_7_0_ebx_features
& CPUID_7_0_EBX_BMI2
)
4119 || !(s
->prefix
& PREFIX_VEX
)
4123 ot
= s
->dflag
== 2 ? OT_QUAD
: OT_LONG
;
4124 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 0);
4127 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
4128 tcg_gen_trunc_tl_i32(cpu_tmp3_i32
, cpu_regs
[R_EDX
]);
4129 tcg_gen_mulu2_i32(cpu_tmp2_i32
, cpu_tmp3_i32
,
4130 cpu_tmp2_i32
, cpu_tmp3_i32
);
4131 tcg_gen_extu_i32_tl(cpu_regs
[s
->vex_v
], cpu_tmp2_i32
);
4132 tcg_gen_extu_i32_tl(cpu_regs
[reg
], cpu_tmp3_i32
);
4134 #ifdef TARGET_X86_64
4136 tcg_gen_mulu2_i64(cpu_regs
[s
->vex_v
], cpu_regs
[reg
],
4137 cpu_T
[0], cpu_regs
[R_EDX
]);
4143 case 0x3f5: /* pdep Gy, By, Ey */
4144 if (!(s
->cpuid_7_0_ebx_features
& CPUID_7_0_EBX_BMI2
)
4145 || !(s
->prefix
& PREFIX_VEX
)
4149 ot
= s
->dflag
== 2 ? OT_QUAD
: OT_LONG
;
4150 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 0);
4151 /* Note that by zero-extending the mask operand, we
4152 automatically handle zero-extending the result. */
4153 if (s
->dflag
== 2) {
4154 tcg_gen_mov_tl(cpu_T
[1], cpu_regs
[s
->vex_v
]);
4156 tcg_gen_ext32u_tl(cpu_T
[1], cpu_regs
[s
->vex_v
]);
4158 gen_helper_pdep(cpu_regs
[reg
], cpu_T
[0], cpu_T
[1]);
4161 case 0x2f5: /* pext Gy, By, Ey */
4162 if (!(s
->cpuid_7_0_ebx_features
& CPUID_7_0_EBX_BMI2
)
4163 || !(s
->prefix
& PREFIX_VEX
)
4167 ot
= s
->dflag
== 2 ? OT_QUAD
: OT_LONG
;
4168 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 0);
4169 /* Note that by zero-extending the mask operand, we
4170 automatically handle zero-extending the result. */
4171 if (s
->dflag
== 2) {
4172 tcg_gen_mov_tl(cpu_T
[1], cpu_regs
[s
->vex_v
]);
4174 tcg_gen_ext32u_tl(cpu_T
[1], cpu_regs
[s
->vex_v
]);
4176 gen_helper_pext(cpu_regs
[reg
], cpu_T
[0], cpu_T
[1]);
4179 case 0x1f6: /* adcx Gy, Ey */
4180 case 0x2f6: /* adox Gy, Ey */
4181 if (!(s
->cpuid_7_0_ebx_features
& CPUID_7_0_EBX_ADX
)) {
4184 TCGv carry_in
, carry_out
, zero
;
4187 ot
= (s
->dflag
== 2 ? OT_QUAD
: OT_LONG
);
4188 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 0);
4190 /* Re-use the carry-out from a previous round. */
4191 TCGV_UNUSED(carry_in
);
4192 carry_out
= (b
== 0x1f6 ? cpu_cc_dst
: cpu_cc_src2
);
4196 carry_in
= cpu_cc_dst
;
4197 end_op
= CC_OP_ADCX
;
4199 end_op
= CC_OP_ADCOX
;
4204 end_op
= CC_OP_ADCOX
;
4206 carry_in
= cpu_cc_src2
;
4207 end_op
= CC_OP_ADOX
;
4211 end_op
= CC_OP_ADCOX
;
4212 carry_in
= carry_out
;
4215 end_op
= (b
== 0x1f6 ? CC_OP_ADCX
: CC_OP_ADOX
);
4218 /* If we can't reuse carry-out, get it out of EFLAGS. */
4219 if (TCGV_IS_UNUSED(carry_in
)) {
4220 if (s
->cc_op
!= CC_OP_ADCX
&& s
->cc_op
!= CC_OP_ADOX
) {
4221 gen_compute_eflags(s
);
4223 carry_in
= cpu_tmp0
;
4224 tcg_gen_shri_tl(carry_in
, cpu_cc_src
,
4225 ctz32(b
== 0x1f6 ? CC_C
: CC_O
));
4226 tcg_gen_andi_tl(carry_in
, carry_in
, 1);
4230 #ifdef TARGET_X86_64
4232 /* If we know TL is 64-bit, and we want a 32-bit
4233 result, just do everything in 64-bit arithmetic. */
4234 tcg_gen_ext32u_i64(cpu_regs
[reg
], cpu_regs
[reg
]);
4235 tcg_gen_ext32u_i64(cpu_T
[0], cpu_T
[0]);
4236 tcg_gen_add_i64(cpu_T
[0], cpu_T
[0], cpu_regs
[reg
]);
4237 tcg_gen_add_i64(cpu_T
[0], cpu_T
[0], carry_in
);
4238 tcg_gen_ext32u_i64(cpu_regs
[reg
], cpu_T
[0]);
4239 tcg_gen_shri_i64(carry_out
, cpu_T
[0], 32);
4243 /* Otherwise compute the carry-out in two steps. */
4244 zero
= tcg_const_tl(0);
4245 tcg_gen_add2_tl(cpu_T
[0], carry_out
,
4248 tcg_gen_add2_tl(cpu_regs
[reg
], carry_out
,
4249 cpu_regs
[reg
], carry_out
,
4251 tcg_temp_free(zero
);
4254 set_cc_op(s
, end_op
);
4258 case 0x1f7: /* shlx Gy, Ey, By */
4259 case 0x2f7: /* sarx Gy, Ey, By */
4260 case 0x3f7: /* shrx Gy, Ey, By */
4261 if (!(s
->cpuid_7_0_ebx_features
& CPUID_7_0_EBX_BMI2
)
4262 || !(s
->prefix
& PREFIX_VEX
)
4266 ot
= (s
->dflag
== 2 ? OT_QUAD
: OT_LONG
);
4267 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 0);
4268 if (ot
== OT_QUAD
) {
4269 tcg_gen_andi_tl(cpu_T
[1], cpu_regs
[s
->vex_v
], 63);
4271 tcg_gen_andi_tl(cpu_T
[1], cpu_regs
[s
->vex_v
], 31);
4274 tcg_gen_shl_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
4275 } else if (b
== 0x2f7) {
4276 if (ot
!= OT_QUAD
) {
4277 tcg_gen_ext32s_tl(cpu_T
[0], cpu_T
[0]);
4279 tcg_gen_sar_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
4281 if (ot
!= OT_QUAD
) {
4282 tcg_gen_ext32u_tl(cpu_T
[0], cpu_T
[0]);
4284 tcg_gen_shr_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
4286 gen_op_mov_reg_T0(ot
, reg
);
4292 case 0x3f3: /* Group 17 */
4293 if (!(s
->cpuid_7_0_ebx_features
& CPUID_7_0_EBX_BMI1
)
4294 || !(s
->prefix
& PREFIX_VEX
)
4298 ot
= s
->dflag
== 2 ? OT_QUAD
: OT_LONG
;
4299 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 0);
4302 case 1: /* blsr By,Ey */
4303 tcg_gen_neg_tl(cpu_T
[1], cpu_T
[0]);
4304 tcg_gen_and_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
4305 gen_op_mov_reg_T0(ot
, s
->vex_v
);
4306 gen_op_update2_cc();
4307 set_cc_op(s
, CC_OP_BMILGB
+ ot
);
4310 case 2: /* blsmsk By,Ey */
4311 tcg_gen_mov_tl(cpu_cc_src
, cpu_T
[0]);
4312 tcg_gen_subi_tl(cpu_T
[0], cpu_T
[0], 1);
4313 tcg_gen_xor_tl(cpu_T
[0], cpu_T
[0], cpu_cc_src
);
4314 tcg_gen_mov_tl(cpu_cc_dst
, cpu_T
[0]);
4315 set_cc_op(s
, CC_OP_BMILGB
+ ot
);
4318 case 3: /* blsi By, Ey */
4319 tcg_gen_mov_tl(cpu_cc_src
, cpu_T
[0]);
4320 tcg_gen_subi_tl(cpu_T
[0], cpu_T
[0], 1);
4321 tcg_gen_and_tl(cpu_T
[0], cpu_T
[0], cpu_cc_src
);
4322 tcg_gen_mov_tl(cpu_cc_dst
, cpu_T
[0]);
4323 set_cc_op(s
, CC_OP_BMILGB
+ ot
);
4339 modrm
= cpu_ldub_code(env
, s
->pc
++);
4341 reg
= ((modrm
>> 3) & 7) | rex_r
;
4342 mod
= (modrm
>> 6) & 3;
4347 sse_fn_eppi
= sse_op_table7
[b
].op
[b1
];
4351 if (!(s
->cpuid_ext_features
& sse_op_table7
[b
].ext_mask
))
4354 if (sse_fn_eppi
== SSE_SPECIAL
) {
4355 ot
= (s
->dflag
== 2) ? OT_QUAD
: OT_LONG
;
4356 rm
= (modrm
& 7) | REX_B(s
);
4358 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
4359 reg
= ((modrm
>> 3) & 7) | rex_r
;
4360 val
= cpu_ldub_code(env
, s
->pc
++);
4362 case 0x14: /* pextrb */
4363 tcg_gen_ld8u_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,
4364 xmm_regs
[reg
].XMM_B(val
& 15)));
4366 gen_op_mov_reg_T0(ot
, rm
);
4368 tcg_gen_qemu_st8(cpu_T
[0], cpu_A0
,
4369 (s
->mem_index
>> 2) - 1);
4371 case 0x15: /* pextrw */
4372 tcg_gen_ld16u_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,
4373 xmm_regs
[reg
].XMM_W(val
& 7)));
4375 gen_op_mov_reg_T0(ot
, rm
);
4377 tcg_gen_qemu_st16(cpu_T
[0], cpu_A0
,
4378 (s
->mem_index
>> 2) - 1);
4381 if (ot
== OT_LONG
) { /* pextrd */
4382 tcg_gen_ld_i32(cpu_tmp2_i32
, cpu_env
,
4383 offsetof(CPUX86State
,
4384 xmm_regs
[reg
].XMM_L(val
& 3)));
4385 tcg_gen_extu_i32_tl(cpu_T
[0], cpu_tmp2_i32
);
4387 gen_op_mov_reg_v(ot
, rm
, cpu_T
[0]);
4389 tcg_gen_qemu_st32(cpu_T
[0], cpu_A0
,
4390 (s
->mem_index
>> 2) - 1);
4391 } else { /* pextrq */
4392 #ifdef TARGET_X86_64
4393 tcg_gen_ld_i64(cpu_tmp1_i64
, cpu_env
,
4394 offsetof(CPUX86State
,
4395 xmm_regs
[reg
].XMM_Q(val
& 1)));
4397 gen_op_mov_reg_v(ot
, rm
, cpu_tmp1_i64
);
4399 tcg_gen_qemu_st64(cpu_tmp1_i64
, cpu_A0
,
4400 (s
->mem_index
>> 2) - 1);
4406 case 0x17: /* extractps */
4407 tcg_gen_ld32u_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,
4408 xmm_regs
[reg
].XMM_L(val
& 3)));
4410 gen_op_mov_reg_T0(ot
, rm
);
4412 tcg_gen_qemu_st32(cpu_T
[0], cpu_A0
,
4413 (s
->mem_index
>> 2) - 1);
4415 case 0x20: /* pinsrb */
4417 gen_op_mov_TN_reg(OT_LONG
, 0, rm
);
4419 tcg_gen_qemu_ld8u(cpu_T
[0], cpu_A0
,
4420 (s
->mem_index
>> 2) - 1);
4421 tcg_gen_st8_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,
4422 xmm_regs
[reg
].XMM_B(val
& 15)));
4424 case 0x21: /* insertps */
4426 tcg_gen_ld_i32(cpu_tmp2_i32
, cpu_env
,
4427 offsetof(CPUX86State
,xmm_regs
[rm
]
4428 .XMM_L((val
>> 6) & 3)));
4430 tcg_gen_qemu_ld32u(cpu_tmp0
, cpu_A0
,
4431 (s
->mem_index
>> 2) - 1);
4432 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_tmp0
);
4434 tcg_gen_st_i32(cpu_tmp2_i32
, cpu_env
,
4435 offsetof(CPUX86State
,xmm_regs
[reg
]
4436 .XMM_L((val
>> 4) & 3)));
4438 tcg_gen_st_i32(tcg_const_i32(0 /*float32_zero*/),
4439 cpu_env
, offsetof(CPUX86State
,
4440 xmm_regs
[reg
].XMM_L(0)));
4442 tcg_gen_st_i32(tcg_const_i32(0 /*float32_zero*/),
4443 cpu_env
, offsetof(CPUX86State
,
4444 xmm_regs
[reg
].XMM_L(1)));
4446 tcg_gen_st_i32(tcg_const_i32(0 /*float32_zero*/),
4447 cpu_env
, offsetof(CPUX86State
,
4448 xmm_regs
[reg
].XMM_L(2)));
4450 tcg_gen_st_i32(tcg_const_i32(0 /*float32_zero*/),
4451 cpu_env
, offsetof(CPUX86State
,
4452 xmm_regs
[reg
].XMM_L(3)));
4455 if (ot
== OT_LONG
) { /* pinsrd */
4457 gen_op_mov_v_reg(ot
, cpu_tmp0
, rm
);
4459 tcg_gen_qemu_ld32u(cpu_tmp0
, cpu_A0
,
4460 (s
->mem_index
>> 2) - 1);
4461 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_tmp0
);
4462 tcg_gen_st_i32(cpu_tmp2_i32
, cpu_env
,
4463 offsetof(CPUX86State
,
4464 xmm_regs
[reg
].XMM_L(val
& 3)));
4465 } else { /* pinsrq */
4466 #ifdef TARGET_X86_64
4468 gen_op_mov_v_reg(ot
, cpu_tmp1_i64
, rm
);
4470 tcg_gen_qemu_ld64(cpu_tmp1_i64
, cpu_A0
,
4471 (s
->mem_index
>> 2) - 1);
4472 tcg_gen_st_i64(cpu_tmp1_i64
, cpu_env
,
4473 offsetof(CPUX86State
,
4474 xmm_regs
[reg
].XMM_Q(val
& 1)));
4485 op1_offset
= offsetof(CPUX86State
,xmm_regs
[reg
]);
4487 op2_offset
= offsetof(CPUX86State
,xmm_regs
[rm
| REX_B(s
)]);
4489 op2_offset
= offsetof(CPUX86State
,xmm_t0
);
4490 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
4491 gen_ldo_env_A0(s
->mem_index
, op2_offset
);
4494 op1_offset
= offsetof(CPUX86State
,fpregs
[reg
].mmx
);
4496 op2_offset
= offsetof(CPUX86State
,fpregs
[rm
].mmx
);
4498 op2_offset
= offsetof(CPUX86State
,mmx_t0
);
4499 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
4500 gen_ldq_env_A0(s
->mem_index
, op2_offset
);
4503 val
= cpu_ldub_code(env
, s
->pc
++);
4505 if ((b
& 0xfc) == 0x60) { /* pcmpXstrX */
4506 set_cc_op(s
, CC_OP_EFLAGS
);
4509 /* The helper must use entire 64-bit gp registers */
4513 tcg_gen_addi_ptr(cpu_ptr0
, cpu_env
, op1_offset
);
4514 tcg_gen_addi_ptr(cpu_ptr1
, cpu_env
, op2_offset
);
4515 sse_fn_eppi(cpu_env
, cpu_ptr0
, cpu_ptr1
, tcg_const_i32(val
));
4519 /* Various integer extensions at 0f 3a f[0-f]. */
4520 b
= modrm
| (b1
<< 8);
4521 modrm
= cpu_ldub_code(env
, s
->pc
++);
4522 reg
= ((modrm
>> 3) & 7) | rex_r
;
4525 case 0x3f0: /* rorx Gy,Ey, Ib */
4526 if (!(s
->cpuid_7_0_ebx_features
& CPUID_7_0_EBX_BMI2
)
4527 || !(s
->prefix
& PREFIX_VEX
)
4531 ot
= s
->dflag
== 2 ? OT_QUAD
: OT_LONG
;
4532 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 0);
4533 b
= cpu_ldub_code(env
, s
->pc
++);
4534 if (ot
== OT_QUAD
) {
4535 tcg_gen_rotri_tl(cpu_T
[0], cpu_T
[0], b
& 63);
4537 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
4538 tcg_gen_rotri_i32(cpu_tmp2_i32
, cpu_tmp2_i32
, b
& 31);
4539 tcg_gen_extu_i32_tl(cpu_T
[0], cpu_tmp2_i32
);
4541 gen_op_mov_reg_T0(ot
, reg
);
4553 /* generic MMX or SSE operation */
4555 case 0x70: /* pshufx insn */
4556 case 0xc6: /* pshufx insn */
4557 case 0xc2: /* compare insns */
4564 op1_offset
= offsetof(CPUX86State
,xmm_regs
[reg
]);
4566 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
4567 op2_offset
= offsetof(CPUX86State
,xmm_t0
);
4568 if (b1
>= 2 && ((b
>= 0x50 && b
<= 0x5f && b
!= 0x5b) ||
4570 /* specific case for SSE single instructions */
4573 gen_op_ld_T0_A0(OT_LONG
+ s
->mem_index
);
4574 tcg_gen_st32_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,xmm_t0
.XMM_L(0)));
4577 gen_ldq_env_A0(s
->mem_index
, offsetof(CPUX86State
,xmm_t0
.XMM_D(0)));
4580 gen_ldo_env_A0(s
->mem_index
, op2_offset
);
4583 rm
= (modrm
& 7) | REX_B(s
);
4584 op2_offset
= offsetof(CPUX86State
,xmm_regs
[rm
]);
4587 op1_offset
= offsetof(CPUX86State
,fpregs
[reg
].mmx
);
4589 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
4590 op2_offset
= offsetof(CPUX86State
,mmx_t0
);
4591 gen_ldq_env_A0(s
->mem_index
, op2_offset
);
4594 op2_offset
= offsetof(CPUX86State
,fpregs
[rm
].mmx
);
4598 case 0x0f: /* 3DNow! data insns */
4599 if (!(s
->cpuid_ext2_features
& CPUID_EXT2_3DNOW
))
4601 val
= cpu_ldub_code(env
, s
->pc
++);
4602 sse_fn_epp
= sse_op_table5
[val
];
4606 tcg_gen_addi_ptr(cpu_ptr0
, cpu_env
, op1_offset
);
4607 tcg_gen_addi_ptr(cpu_ptr1
, cpu_env
, op2_offset
);
4608 sse_fn_epp(cpu_env
, cpu_ptr0
, cpu_ptr1
);
4610 case 0x70: /* pshufx insn */
4611 case 0xc6: /* pshufx insn */
4612 val
= cpu_ldub_code(env
, s
->pc
++);
4613 tcg_gen_addi_ptr(cpu_ptr0
, cpu_env
, op1_offset
);
4614 tcg_gen_addi_ptr(cpu_ptr1
, cpu_env
, op2_offset
);
4615 /* XXX: introduce a new table? */
4616 sse_fn_ppi
= (SSEFunc_0_ppi
)sse_fn_epp
;
4617 sse_fn_ppi(cpu_ptr0
, cpu_ptr1
, tcg_const_i32(val
));
4621 val
= cpu_ldub_code(env
, s
->pc
++);
4624 sse_fn_epp
= sse_op_table4
[val
][b1
];
4626 tcg_gen_addi_ptr(cpu_ptr0
, cpu_env
, op1_offset
);
4627 tcg_gen_addi_ptr(cpu_ptr1
, cpu_env
, op2_offset
);
4628 sse_fn_epp(cpu_env
, cpu_ptr0
, cpu_ptr1
);
4631 /* maskmov : we must prepare A0 */
4634 #ifdef TARGET_X86_64
4635 if (s
->aflag
== 2) {
4636 gen_op_movq_A0_reg(R_EDI
);
4640 gen_op_movl_A0_reg(R_EDI
);
4642 gen_op_andl_A0_ffff();
4644 gen_add_A0_ds_seg(s
);
4646 tcg_gen_addi_ptr(cpu_ptr0
, cpu_env
, op1_offset
);
4647 tcg_gen_addi_ptr(cpu_ptr1
, cpu_env
, op2_offset
);
4648 /* XXX: introduce a new table? */
4649 sse_fn_eppt
= (SSEFunc_0_eppt
)sse_fn_epp
;
4650 sse_fn_eppt(cpu_env
, cpu_ptr0
, cpu_ptr1
, cpu_A0
);
4653 tcg_gen_addi_ptr(cpu_ptr0
, cpu_env
, op1_offset
);
4654 tcg_gen_addi_ptr(cpu_ptr1
, cpu_env
, op2_offset
);
4655 sse_fn_epp(cpu_env
, cpu_ptr0
, cpu_ptr1
);
4658 if (b
== 0x2e || b
== 0x2f) {
4659 set_cc_op(s
, CC_OP_EFLAGS
);
4664 /* convert one instruction. s->is_jmp is set if the translation must
4665 be stopped. Return the next pc value */
4666 static target_ulong
disas_insn(CPUX86State
*env
, DisasContext
*s
,
4667 target_ulong pc_start
)
4669 int b
, prefixes
, aflag
, dflag
;
4671 int modrm
, reg
, rm
, mod
, reg_addr
, op
, opreg
, offset_addr
, val
;
4672 target_ulong next_eip
, tval
;
4675 if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP
| CPU_LOG_TB_OP_OPT
))) {
4676 tcg_gen_debug_insn_start(pc_start
);
4683 #ifdef TARGET_X86_64
4688 s
->rip_offset
= 0; /* for relative ip address */
4692 b
= cpu_ldub_code(env
, s
->pc
);
4694 /* Collect prefixes. */
4697 prefixes
|= PREFIX_REPZ
;
4700 prefixes
|= PREFIX_REPNZ
;
4703 prefixes
|= PREFIX_LOCK
;
4724 prefixes
|= PREFIX_DATA
;
4727 prefixes
|= PREFIX_ADR
;
4729 #ifdef TARGET_X86_64
4733 rex_w
= (b
>> 3) & 1;
4734 rex_r
= (b
& 0x4) << 1;
4735 s
->rex_x
= (b
& 0x2) << 2;
4736 REX_B(s
) = (b
& 0x1) << 3;
4737 x86_64_hregs
= 1; /* select uniform byte register addressing */
4742 case 0xc5: /* 2-byte VEX */
4743 case 0xc4: /* 3-byte VEX */
4744 /* VEX prefixes cannot be used except in 32-bit mode.
4745 Otherwise the instruction is LES or LDS. */
4746 if (s
->code32
&& !s
->vm86
) {
4747 static const int pp_prefix
[4] = {
4748 0, PREFIX_DATA
, PREFIX_REPZ
, PREFIX_REPNZ
4750 int vex3
, vex2
= cpu_ldub_code(env
, s
->pc
);
4752 if (!CODE64(s
) && (vex2
& 0xc0) != 0xc0) {
4753 /* 4.1.4.6: In 32-bit mode, bits [7:6] must be 11b,
4754 otherwise the instruction is LES or LDS. */
4759 /* 4.1.1-4.1.3: No preceding lock, 66, f2, f3, or rex prefixes. */
4760 if (prefixes
& (PREFIX_REPZ
| PREFIX_REPNZ
4761 | PREFIX_LOCK
| PREFIX_DATA
)) {
4764 #ifdef TARGET_X86_64
4769 rex_r
= (~vex2
>> 4) & 8;
4772 b
= cpu_ldub_code(env
, s
->pc
++);
4774 #ifdef TARGET_X86_64
4775 s
->rex_x
= (~vex2
>> 3) & 8;
4776 s
->rex_b
= (~vex2
>> 2) & 8;
4778 vex3
= cpu_ldub_code(env
, s
->pc
++);
4779 rex_w
= (vex3
>> 7) & 1;
4780 switch (vex2
& 0x1f) {
4781 case 0x01: /* Implied 0f leading opcode bytes. */
4782 b
= cpu_ldub_code(env
, s
->pc
++) | 0x100;
4784 case 0x02: /* Implied 0f 38 leading opcode bytes. */
4787 case 0x03: /* Implied 0f 3a leading opcode bytes. */
4790 default: /* Reserved for future use. */
4794 s
->vex_v
= (~vex3
>> 3) & 0xf;
4795 s
->vex_l
= (vex3
>> 2) & 1;
4796 prefixes
|= pp_prefix
[vex3
& 3] | PREFIX_VEX
;
4801 /* Post-process prefixes. */
4803 /* In 64-bit mode, the default data size is 32-bit. Select 64-bit
4804 data with rex_w, and 16-bit data with 0x66; rex_w takes precedence
4805 over 0x66 if both are present. */
4806 dflag
= (rex_w
> 0 ? 2 : prefixes
& PREFIX_DATA
? 0 : 1);
4807 /* In 64-bit mode, 0x67 selects 32-bit addressing. */
4808 aflag
= (prefixes
& PREFIX_ADR
? 1 : 2);
4810 /* In 16/32-bit mode, 0x66 selects the opposite data size. */
4812 if (prefixes
& PREFIX_DATA
) {
4815 /* In 16/32-bit mode, 0x67 selects the opposite addressing. */
4817 if (prefixes
& PREFIX_ADR
) {
4822 s
->prefix
= prefixes
;
4826 /* lock generation */
4827 if (prefixes
& PREFIX_LOCK
)
4830 /* now check op code */
4834 /**************************/
4835 /* extended op code */
4836 b
= cpu_ldub_code(env
, s
->pc
++) | 0x100;
4839 /**************************/
4857 ot
= dflag
+ OT_WORD
;
4860 case 0: /* OP Ev, Gv */
4861 modrm
= cpu_ldub_code(env
, s
->pc
++);
4862 reg
= ((modrm
>> 3) & 7) | rex_r
;
4863 mod
= (modrm
>> 6) & 3;
4864 rm
= (modrm
& 7) | REX_B(s
);
4866 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
4868 } else if (op
== OP_XORL
&& rm
== reg
) {
4870 /* xor reg, reg optimisation */
4871 set_cc_op(s
, CC_OP_CLR
);
4873 gen_op_mov_reg_T0(ot
, reg
);
4878 gen_op_mov_TN_reg(ot
, 1, reg
);
4879 gen_op(s
, op
, ot
, opreg
);
4881 case 1: /* OP Gv, Ev */
4882 modrm
= cpu_ldub_code(env
, s
->pc
++);
4883 mod
= (modrm
>> 6) & 3;
4884 reg
= ((modrm
>> 3) & 7) | rex_r
;
4885 rm
= (modrm
& 7) | REX_B(s
);
4887 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
4888 gen_op_ld_T1_A0(ot
+ s
->mem_index
);
4889 } else if (op
== OP_XORL
&& rm
== reg
) {
4892 gen_op_mov_TN_reg(ot
, 1, rm
);
4894 gen_op(s
, op
, ot
, reg
);
4896 case 2: /* OP A, Iv */
4897 val
= insn_get(env
, s
, ot
);
4898 gen_op_movl_T1_im(val
);
4899 gen_op(s
, op
, ot
, OR_EAX
);
4908 case 0x80: /* GRP1 */
4917 ot
= dflag
+ OT_WORD
;
4919 modrm
= cpu_ldub_code(env
, s
->pc
++);
4920 mod
= (modrm
>> 6) & 3;
4921 rm
= (modrm
& 7) | REX_B(s
);
4922 op
= (modrm
>> 3) & 7;
4928 s
->rip_offset
= insn_const_size(ot
);
4929 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
4940 val
= insn_get(env
, s
, ot
);
4943 val
= (int8_t)insn_get(env
, s
, OT_BYTE
);
4946 gen_op_movl_T1_im(val
);
4947 gen_op(s
, op
, ot
, opreg
);
4951 /**************************/
4952 /* inc, dec, and other misc arith */
4953 case 0x40 ... 0x47: /* inc Gv */
4954 ot
= dflag
? OT_LONG
: OT_WORD
;
4955 gen_inc(s
, ot
, OR_EAX
+ (b
& 7), 1);
4957 case 0x48 ... 0x4f: /* dec Gv */
4958 ot
= dflag
? OT_LONG
: OT_WORD
;
4959 gen_inc(s
, ot
, OR_EAX
+ (b
& 7), -1);
4961 case 0xf6: /* GRP3 */
4966 ot
= dflag
+ OT_WORD
;
4968 modrm
= cpu_ldub_code(env
, s
->pc
++);
4969 mod
= (modrm
>> 6) & 3;
4970 rm
= (modrm
& 7) | REX_B(s
);
4971 op
= (modrm
>> 3) & 7;
4974 s
->rip_offset
= insn_const_size(ot
);
4975 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
4976 gen_op_ld_T0_A0(ot
+ s
->mem_index
);
4978 gen_op_mov_TN_reg(ot
, 0, rm
);
4983 val
= insn_get(env
, s
, ot
);
4984 gen_op_movl_T1_im(val
);
4985 gen_op_testl_T0_T1_cc();
4986 set_cc_op(s
, CC_OP_LOGICB
+ ot
);
4989 tcg_gen_not_tl(cpu_T
[0], cpu_T
[0]);
4991 gen_op_st_T0_A0(ot
+ s
->mem_index
);
4993 gen_op_mov_reg_T0(ot
, rm
);
4997 tcg_gen_neg_tl(cpu_T
[0], cpu_T
[0]);
4999 gen_op_st_T0_A0(ot
+ s
->mem_index
);
5001 gen_op_mov_reg_T0(ot
, rm
);
5003 gen_op_update_neg_cc();
5004 set_cc_op(s
, CC_OP_SUBB
+ ot
);
5009 gen_op_mov_TN_reg(OT_BYTE
, 1, R_EAX
);
5010 tcg_gen_ext8u_tl(cpu_T
[0], cpu_T
[0]);
5011 tcg_gen_ext8u_tl(cpu_T
[1], cpu_T
[1]);
5012 /* XXX: use 32 bit mul which could be faster */
5013 tcg_gen_mul_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
5014 gen_op_mov_reg_T0(OT_WORD
, R_EAX
);
5015 tcg_gen_mov_tl(cpu_cc_dst
, cpu_T
[0]);
5016 tcg_gen_andi_tl(cpu_cc_src
, cpu_T
[0], 0xff00);
5017 set_cc_op(s
, CC_OP_MULB
);
5020 gen_op_mov_TN_reg(OT_WORD
, 1, R_EAX
);
5021 tcg_gen_ext16u_tl(cpu_T
[0], cpu_T
[0]);
5022 tcg_gen_ext16u_tl(cpu_T
[1], cpu_T
[1]);
5023 /* XXX: use 32 bit mul which could be faster */
5024 tcg_gen_mul_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
5025 gen_op_mov_reg_T0(OT_WORD
, R_EAX
);
5026 tcg_gen_mov_tl(cpu_cc_dst
, cpu_T
[0]);
5027 tcg_gen_shri_tl(cpu_T
[0], cpu_T
[0], 16);
5028 gen_op_mov_reg_T0(OT_WORD
, R_EDX
);
5029 tcg_gen_mov_tl(cpu_cc_src
, cpu_T
[0]);
5030 set_cc_op(s
, CC_OP_MULW
);
5034 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
5035 tcg_gen_trunc_tl_i32(cpu_tmp3_i32
, cpu_regs
[R_EAX
]);
5036 tcg_gen_mulu2_i32(cpu_tmp2_i32
, cpu_tmp3_i32
,
5037 cpu_tmp2_i32
, cpu_tmp3_i32
);
5038 tcg_gen_extu_i32_tl(cpu_regs
[R_EAX
], cpu_tmp2_i32
);
5039 tcg_gen_extu_i32_tl(cpu_regs
[R_EDX
], cpu_tmp3_i32
);
5040 tcg_gen_mov_tl(cpu_cc_dst
, cpu_regs
[R_EAX
]);
5041 tcg_gen_mov_tl(cpu_cc_src
, cpu_regs
[R_EDX
]);
5042 set_cc_op(s
, CC_OP_MULL
);
5044 #ifdef TARGET_X86_64
5046 tcg_gen_mulu2_i64(cpu_regs
[R_EAX
], cpu_regs
[R_EDX
],
5047 cpu_T
[0], cpu_regs
[R_EAX
]);
5048 tcg_gen_mov_tl(cpu_cc_dst
, cpu_regs
[R_EAX
]);
5049 tcg_gen_mov_tl(cpu_cc_src
, cpu_regs
[R_EDX
]);
5050 set_cc_op(s
, CC_OP_MULQ
);
5058 gen_op_mov_TN_reg(OT_BYTE
, 1, R_EAX
);
5059 tcg_gen_ext8s_tl(cpu_T
[0], cpu_T
[0]);
5060 tcg_gen_ext8s_tl(cpu_T
[1], cpu_T
[1]);
5061 /* XXX: use 32 bit mul which could be faster */
5062 tcg_gen_mul_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
5063 gen_op_mov_reg_T0(OT_WORD
, R_EAX
);
5064 tcg_gen_mov_tl(cpu_cc_dst
, cpu_T
[0]);
5065 tcg_gen_ext8s_tl(cpu_tmp0
, cpu_T
[0]);
5066 tcg_gen_sub_tl(cpu_cc_src
, cpu_T
[0], cpu_tmp0
);
5067 set_cc_op(s
, CC_OP_MULB
);
5070 gen_op_mov_TN_reg(OT_WORD
, 1, R_EAX
);
5071 tcg_gen_ext16s_tl(cpu_T
[0], cpu_T
[0]);
5072 tcg_gen_ext16s_tl(cpu_T
[1], cpu_T
[1]);
5073 /* XXX: use 32 bit mul which could be faster */
5074 tcg_gen_mul_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
5075 gen_op_mov_reg_T0(OT_WORD
, R_EAX
);
5076 tcg_gen_mov_tl(cpu_cc_dst
, cpu_T
[0]);
5077 tcg_gen_ext16s_tl(cpu_tmp0
, cpu_T
[0]);
5078 tcg_gen_sub_tl(cpu_cc_src
, cpu_T
[0], cpu_tmp0
);
5079 tcg_gen_shri_tl(cpu_T
[0], cpu_T
[0], 16);
5080 gen_op_mov_reg_T0(OT_WORD
, R_EDX
);
5081 set_cc_op(s
, CC_OP_MULW
);
5085 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
5086 tcg_gen_trunc_tl_i32(cpu_tmp3_i32
, cpu_regs
[R_EAX
]);
5087 tcg_gen_muls2_i32(cpu_tmp2_i32
, cpu_tmp3_i32
,
5088 cpu_tmp2_i32
, cpu_tmp3_i32
);
5089 tcg_gen_extu_i32_tl(cpu_regs
[R_EAX
], cpu_tmp2_i32
);
5090 tcg_gen_extu_i32_tl(cpu_regs
[R_EDX
], cpu_tmp3_i32
);
5091 tcg_gen_sari_i32(cpu_tmp2_i32
, cpu_tmp2_i32
, 31);
5092 tcg_gen_mov_tl(cpu_cc_dst
, cpu_regs
[R_EAX
]);
5093 tcg_gen_sub_i32(cpu_tmp2_i32
, cpu_tmp2_i32
, cpu_tmp3_i32
);
5094 tcg_gen_extu_i32_tl(cpu_cc_src
, cpu_tmp2_i32
);
5095 set_cc_op(s
, CC_OP_MULL
);
5097 #ifdef TARGET_X86_64
5099 tcg_gen_muls2_i64(cpu_regs
[R_EAX
], cpu_regs
[R_EDX
],
5100 cpu_T
[0], cpu_regs
[R_EAX
]);
5101 tcg_gen_mov_tl(cpu_cc_dst
, cpu_regs
[R_EAX
]);
5102 tcg_gen_sari_tl(cpu_cc_src
, cpu_regs
[R_EAX
], 63);
5103 tcg_gen_sub_tl(cpu_cc_src
, cpu_cc_src
, cpu_regs
[R_EDX
]);
5104 set_cc_op(s
, CC_OP_MULQ
);
5112 gen_jmp_im(pc_start
- s
->cs_base
);
5113 gen_helper_divb_AL(cpu_env
, cpu_T
[0]);
5116 gen_jmp_im(pc_start
- s
->cs_base
);
5117 gen_helper_divw_AX(cpu_env
, cpu_T
[0]);
5121 gen_jmp_im(pc_start
- s
->cs_base
);
5122 gen_helper_divl_EAX(cpu_env
, cpu_T
[0]);
5124 #ifdef TARGET_X86_64
5126 gen_jmp_im(pc_start
- s
->cs_base
);
5127 gen_helper_divq_EAX(cpu_env
, cpu_T
[0]);
5135 gen_jmp_im(pc_start
- s
->cs_base
);
5136 gen_helper_idivb_AL(cpu_env
, cpu_T
[0]);
5139 gen_jmp_im(pc_start
- s
->cs_base
);
5140 gen_helper_idivw_AX(cpu_env
, cpu_T
[0]);
5144 gen_jmp_im(pc_start
- s
->cs_base
);
5145 gen_helper_idivl_EAX(cpu_env
, cpu_T
[0]);
5147 #ifdef TARGET_X86_64
5149 gen_jmp_im(pc_start
- s
->cs_base
);
5150 gen_helper_idivq_EAX(cpu_env
, cpu_T
[0]);
5160 case 0xfe: /* GRP4 */
5161 case 0xff: /* GRP5 */
5165 ot
= dflag
+ OT_WORD
;
5167 modrm
= cpu_ldub_code(env
, s
->pc
++);
5168 mod
= (modrm
>> 6) & 3;
5169 rm
= (modrm
& 7) | REX_B(s
);
5170 op
= (modrm
>> 3) & 7;
5171 if (op
>= 2 && b
== 0xfe) {
5175 if (op
== 2 || op
== 4) {
5176 /* operand size for jumps is 64 bit */
5178 } else if (op
== 3 || op
== 5) {
5179 ot
= dflag
? OT_LONG
+ (rex_w
== 1) : OT_WORD
;
5180 } else if (op
== 6) {
5181 /* default push size is 64 bit */
5182 ot
= dflag
? OT_QUAD
: OT_WORD
;
5186 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
5187 if (op
>= 2 && op
!= 3 && op
!= 5)
5188 gen_op_ld_T0_A0(ot
+ s
->mem_index
);
5190 gen_op_mov_TN_reg(ot
, 0, rm
);
5194 case 0: /* inc Ev */
5199 gen_inc(s
, ot
, opreg
, 1);
5201 case 1: /* dec Ev */
5206 gen_inc(s
, ot
, opreg
, -1);
5208 case 2: /* call Ev */
5209 /* XXX: optimize if memory (no 'and' is necessary) */
5211 gen_op_andl_T0_ffff();
5212 next_eip
= s
->pc
- s
->cs_base
;
5213 gen_movtl_T1_im(next_eip
);
5218 case 3: /* lcall Ev */
5219 gen_op_ld_T1_A0(ot
+ s
->mem_index
);
5220 gen_add_A0_im(s
, 1 << (ot
- OT_WORD
+ 1));
5221 gen_op_ldu_T0_A0(OT_WORD
+ s
->mem_index
);
5223 if (s
->pe
&& !s
->vm86
) {
5224 gen_update_cc_op(s
);
5225 gen_jmp_im(pc_start
- s
->cs_base
);
5226 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
5227 gen_helper_lcall_protected(cpu_env
, cpu_tmp2_i32
, cpu_T
[1],
5228 tcg_const_i32(dflag
),
5229 tcg_const_i32(s
->pc
- pc_start
));
5231 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
5232 gen_helper_lcall_real(cpu_env
, cpu_tmp2_i32
, cpu_T
[1],
5233 tcg_const_i32(dflag
),
5234 tcg_const_i32(s
->pc
- s
->cs_base
));
5238 case 4: /* jmp Ev */
5240 gen_op_andl_T0_ffff();
5244 case 5: /* ljmp Ev */
5245 gen_op_ld_T1_A0(ot
+ s
->mem_index
);
5246 gen_add_A0_im(s
, 1 << (ot
- OT_WORD
+ 1));
5247 gen_op_ldu_T0_A0(OT_WORD
+ s
->mem_index
);
5249 if (s
->pe
&& !s
->vm86
) {
5250 gen_update_cc_op(s
);
5251 gen_jmp_im(pc_start
- s
->cs_base
);
5252 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
5253 gen_helper_ljmp_protected(cpu_env
, cpu_tmp2_i32
, cpu_T
[1],
5254 tcg_const_i32(s
->pc
- pc_start
));
5256 gen_op_movl_seg_T0_vm(R_CS
);
5257 gen_op_movl_T0_T1();
5262 case 6: /* push Ev */
5270 case 0x84: /* test Ev, Gv */
5275 ot
= dflag
+ OT_WORD
;
5277 modrm
= cpu_ldub_code(env
, s
->pc
++);
5278 reg
= ((modrm
>> 3) & 7) | rex_r
;
5280 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 0);
5281 gen_op_mov_TN_reg(ot
, 1, reg
);
5282 gen_op_testl_T0_T1_cc();
5283 set_cc_op(s
, CC_OP_LOGICB
+ ot
);
5286 case 0xa8: /* test eAX, Iv */
5291 ot
= dflag
+ OT_WORD
;
5292 val
= insn_get(env
, s
, ot
);
5294 gen_op_mov_TN_reg(ot
, 0, OR_EAX
);
5295 gen_op_movl_T1_im(val
);
5296 gen_op_testl_T0_T1_cc();
5297 set_cc_op(s
, CC_OP_LOGICB
+ ot
);
5300 case 0x98: /* CWDE/CBW */
5301 #ifdef TARGET_X86_64
5303 gen_op_mov_TN_reg(OT_LONG
, 0, R_EAX
);
5304 tcg_gen_ext32s_tl(cpu_T
[0], cpu_T
[0]);
5305 gen_op_mov_reg_T0(OT_QUAD
, R_EAX
);
5309 gen_op_mov_TN_reg(OT_WORD
, 0, R_EAX
);
5310 tcg_gen_ext16s_tl(cpu_T
[0], cpu_T
[0]);
5311 gen_op_mov_reg_T0(OT_LONG
, R_EAX
);
5313 gen_op_mov_TN_reg(OT_BYTE
, 0, R_EAX
);
5314 tcg_gen_ext8s_tl(cpu_T
[0], cpu_T
[0]);
5315 gen_op_mov_reg_T0(OT_WORD
, R_EAX
);
5318 case 0x99: /* CDQ/CWD */
5319 #ifdef TARGET_X86_64
5321 gen_op_mov_TN_reg(OT_QUAD
, 0, R_EAX
);
5322 tcg_gen_sari_tl(cpu_T
[0], cpu_T
[0], 63);
5323 gen_op_mov_reg_T0(OT_QUAD
, R_EDX
);
5327 gen_op_mov_TN_reg(OT_LONG
, 0, R_EAX
);
5328 tcg_gen_ext32s_tl(cpu_T
[0], cpu_T
[0]);
5329 tcg_gen_sari_tl(cpu_T
[0], cpu_T
[0], 31);
5330 gen_op_mov_reg_T0(OT_LONG
, R_EDX
);
5332 gen_op_mov_TN_reg(OT_WORD
, 0, R_EAX
);
5333 tcg_gen_ext16s_tl(cpu_T
[0], cpu_T
[0]);
5334 tcg_gen_sari_tl(cpu_T
[0], cpu_T
[0], 15);
5335 gen_op_mov_reg_T0(OT_WORD
, R_EDX
);
5338 case 0x1af: /* imul Gv, Ev */
5339 case 0x69: /* imul Gv, Ev, I */
5341 ot
= dflag
+ OT_WORD
;
5342 modrm
= cpu_ldub_code(env
, s
->pc
++);
5343 reg
= ((modrm
>> 3) & 7) | rex_r
;
5345 s
->rip_offset
= insn_const_size(ot
);
5348 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 0);
5350 val
= insn_get(env
, s
, ot
);
5351 gen_op_movl_T1_im(val
);
5352 } else if (b
== 0x6b) {
5353 val
= (int8_t)insn_get(env
, s
, OT_BYTE
);
5354 gen_op_movl_T1_im(val
);
5356 gen_op_mov_TN_reg(ot
, 1, reg
);
5359 #ifdef TARGET_X86_64
5361 tcg_gen_muls2_i64(cpu_regs
[reg
], cpu_T
[1], cpu_T
[0], cpu_T
[1]);
5362 tcg_gen_mov_tl(cpu_cc_dst
, cpu_regs
[reg
]);
5363 tcg_gen_sari_tl(cpu_cc_src
, cpu_cc_dst
, 63);
5364 tcg_gen_sub_tl(cpu_cc_src
, cpu_cc_src
, cpu_T
[1]);
5368 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
5369 tcg_gen_trunc_tl_i32(cpu_tmp3_i32
, cpu_T
[1]);
5370 tcg_gen_muls2_i32(cpu_tmp2_i32
, cpu_tmp3_i32
,
5371 cpu_tmp2_i32
, cpu_tmp3_i32
);
5372 tcg_gen_extu_i32_tl(cpu_regs
[reg
], cpu_tmp2_i32
);
5373 tcg_gen_sari_i32(cpu_tmp2_i32
, cpu_tmp2_i32
, 31);
5374 tcg_gen_mov_tl(cpu_cc_dst
, cpu_regs
[reg
]);
5375 tcg_gen_sub_i32(cpu_tmp2_i32
, cpu_tmp2_i32
, cpu_tmp3_i32
);
5376 tcg_gen_extu_i32_tl(cpu_cc_src
, cpu_tmp2_i32
);
5379 tcg_gen_ext16s_tl(cpu_T
[0], cpu_T
[0]);
5380 tcg_gen_ext16s_tl(cpu_T
[1], cpu_T
[1]);
5381 /* XXX: use 32 bit mul which could be faster */
5382 tcg_gen_mul_tl(cpu_T
[0], cpu_T
[0], cpu_T
[1]);
5383 tcg_gen_mov_tl(cpu_cc_dst
, cpu_T
[0]);
5384 tcg_gen_ext16s_tl(cpu_tmp0
, cpu_T
[0]);
5385 tcg_gen_sub_tl(cpu_cc_src
, cpu_T
[0], cpu_tmp0
);
5386 gen_op_mov_reg_T0(ot
, reg
);
5389 set_cc_op(s
, CC_OP_MULB
+ ot
);
5392 case 0x1c1: /* xadd Ev, Gv */
5396 ot
= dflag
+ OT_WORD
;
5397 modrm
= cpu_ldub_code(env
, s
->pc
++);
5398 reg
= ((modrm
>> 3) & 7) | rex_r
;
5399 mod
= (modrm
>> 6) & 3;
5401 rm
= (modrm
& 7) | REX_B(s
);
5402 gen_op_mov_TN_reg(ot
, 0, reg
);
5403 gen_op_mov_TN_reg(ot
, 1, rm
);
5404 gen_op_addl_T0_T1();
5405 gen_op_mov_reg_T1(ot
, reg
);
5406 gen_op_mov_reg_T0(ot
, rm
);
5408 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
5409 gen_op_mov_TN_reg(ot
, 0, reg
);
5410 gen_op_ld_T1_A0(ot
+ s
->mem_index
);
5411 gen_op_addl_T0_T1();
5412 gen_op_st_T0_A0(ot
+ s
->mem_index
);
5413 gen_op_mov_reg_T1(ot
, reg
);
5415 gen_op_update2_cc();
5416 set_cc_op(s
, CC_OP_ADDB
+ ot
);
5419 case 0x1b1: /* cmpxchg Ev, Gv */
5422 TCGv t0
, t1
, t2
, a0
;
5427 ot
= dflag
+ OT_WORD
;
5428 modrm
= cpu_ldub_code(env
, s
->pc
++);
5429 reg
= ((modrm
>> 3) & 7) | rex_r
;
5430 mod
= (modrm
>> 6) & 3;
5431 t0
= tcg_temp_local_new();
5432 t1
= tcg_temp_local_new();
5433 t2
= tcg_temp_local_new();
5434 a0
= tcg_temp_local_new();
5435 gen_op_mov_v_reg(ot
, t1
, reg
);
5437 rm
= (modrm
& 7) | REX_B(s
);
5438 gen_op_mov_v_reg(ot
, t0
, rm
);
5440 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
5441 tcg_gen_mov_tl(a0
, cpu_A0
);
5442 gen_op_ld_v(ot
+ s
->mem_index
, t0
, a0
);
5443 rm
= 0; /* avoid warning */
5445 label1
= gen_new_label();
5446 tcg_gen_mov_tl(t2
, cpu_regs
[R_EAX
]);
5449 tcg_gen_brcond_tl(TCG_COND_EQ
, t2
, t0
, label1
);
5450 label2
= gen_new_label();
5452 gen_op_mov_reg_v(ot
, R_EAX
, t0
);
5454 gen_set_label(label1
);
5455 gen_op_mov_reg_v(ot
, rm
, t1
);
5457 /* perform no-op store cycle like physical cpu; must be
5458 before changing accumulator to ensure idempotency if
5459 the store faults and the instruction is restarted */
5460 gen_op_st_v(ot
+ s
->mem_index
, t0
, a0
);
5461 gen_op_mov_reg_v(ot
, R_EAX
, t0
);
5463 gen_set_label(label1
);
5464 gen_op_st_v(ot
+ s
->mem_index
, t1
, a0
);
5466 gen_set_label(label2
);
5467 tcg_gen_mov_tl(cpu_cc_src
, t0
);
5468 tcg_gen_mov_tl(cpu_cc_srcT
, t2
);
5469 tcg_gen_sub_tl(cpu_cc_dst
, t2
, t0
);
5470 set_cc_op(s
, CC_OP_SUBB
+ ot
);
5477 case 0x1c7: /* cmpxchg8b */
5478 modrm
= cpu_ldub_code(env
, s
->pc
++);
5479 mod
= (modrm
>> 6) & 3;
5480 if ((mod
== 3) || ((modrm
& 0x38) != 0x8))
5482 #ifdef TARGET_X86_64
5484 if (!(s
->cpuid_ext_features
& CPUID_EXT_CX16
))
5486 gen_jmp_im(pc_start
- s
->cs_base
);
5487 gen_update_cc_op(s
);
5488 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
5489 gen_helper_cmpxchg16b(cpu_env
, cpu_A0
);
5493 if (!(s
->cpuid_features
& CPUID_CX8
))
5495 gen_jmp_im(pc_start
- s
->cs_base
);
5496 gen_update_cc_op(s
);
5497 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
5498 gen_helper_cmpxchg8b(cpu_env
, cpu_A0
);
5500 set_cc_op(s
, CC_OP_EFLAGS
);
5503 /**************************/
5505 case 0x50 ... 0x57: /* push */
5506 gen_op_mov_TN_reg(OT_LONG
, 0, (b
& 7) | REX_B(s
));
5509 case 0x58 ... 0x5f: /* pop */
5511 ot
= dflag
? OT_QUAD
: OT_WORD
;
5513 ot
= dflag
+ OT_WORD
;
5516 /* NOTE: order is important for pop %sp */
5518 gen_op_mov_reg_T0(ot
, (b
& 7) | REX_B(s
));
5520 case 0x60: /* pusha */
5525 case 0x61: /* popa */
5530 case 0x68: /* push Iv */
5533 ot
= dflag
? OT_QUAD
: OT_WORD
;
5535 ot
= dflag
+ OT_WORD
;
5538 val
= insn_get(env
, s
, ot
);
5540 val
= (int8_t)insn_get(env
, s
, OT_BYTE
);
5541 gen_op_movl_T0_im(val
);
5544 case 0x8f: /* pop Ev */
5546 ot
= dflag
? OT_QUAD
: OT_WORD
;
5548 ot
= dflag
+ OT_WORD
;
5550 modrm
= cpu_ldub_code(env
, s
->pc
++);
5551 mod
= (modrm
>> 6) & 3;
5554 /* NOTE: order is important for pop %sp */
5556 rm
= (modrm
& 7) | REX_B(s
);
5557 gen_op_mov_reg_T0(ot
, rm
);
5559 /* NOTE: order is important too for MMU exceptions */
5560 s
->popl_esp_hack
= 1 << ot
;
5561 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 1);
5562 s
->popl_esp_hack
= 0;
5566 case 0xc8: /* enter */
5569 val
= cpu_lduw_code(env
, s
->pc
);
5571 level
= cpu_ldub_code(env
, s
->pc
++);
5572 gen_enter(s
, val
, level
);
5575 case 0xc9: /* leave */
5576 /* XXX: exception not precise (ESP is updated before potential exception) */
5578 gen_op_mov_TN_reg(OT_QUAD
, 0, R_EBP
);
5579 gen_op_mov_reg_T0(OT_QUAD
, R_ESP
);
5580 } else if (s
->ss32
) {
5581 gen_op_mov_TN_reg(OT_LONG
, 0, R_EBP
);
5582 gen_op_mov_reg_T0(OT_LONG
, R_ESP
);
5584 gen_op_mov_TN_reg(OT_WORD
, 0, R_EBP
);
5585 gen_op_mov_reg_T0(OT_WORD
, R_ESP
);
5589 ot
= dflag
? OT_QUAD
: OT_WORD
;
5591 ot
= dflag
+ OT_WORD
;
5593 gen_op_mov_reg_T0(ot
, R_EBP
);
5596 case 0x06: /* push es */
5597 case 0x0e: /* push cs */
5598 case 0x16: /* push ss */
5599 case 0x1e: /* push ds */
5602 gen_op_movl_T0_seg(b
>> 3);
5605 case 0x1a0: /* push fs */
5606 case 0x1a8: /* push gs */
5607 gen_op_movl_T0_seg((b
>> 3) & 7);
5610 case 0x07: /* pop es */
5611 case 0x17: /* pop ss */
5612 case 0x1f: /* pop ds */
5617 gen_movl_seg_T0(s
, reg
, pc_start
- s
->cs_base
);
5620 /* if reg == SS, inhibit interrupts/trace. */
5621 /* If several instructions disable interrupts, only the
5623 if (!(s
->tb
->flags
& HF_INHIBIT_IRQ_MASK
))
5624 gen_helper_set_inhibit_irq(cpu_env
);
5628 gen_jmp_im(s
->pc
- s
->cs_base
);
5632 case 0x1a1: /* pop fs */
5633 case 0x1a9: /* pop gs */
5635 gen_movl_seg_T0(s
, (b
>> 3) & 7, pc_start
- s
->cs_base
);
5638 gen_jmp_im(s
->pc
- s
->cs_base
);
5643 /**************************/
5646 case 0x89: /* mov Gv, Ev */
5650 ot
= dflag
+ OT_WORD
;
5651 modrm
= cpu_ldub_code(env
, s
->pc
++);
5652 reg
= ((modrm
>> 3) & 7) | rex_r
;
5654 /* generate a generic store */
5655 gen_ldst_modrm(env
, s
, modrm
, ot
, reg
, 1);
5658 case 0xc7: /* mov Ev, Iv */
5662 ot
= dflag
+ OT_WORD
;
5663 modrm
= cpu_ldub_code(env
, s
->pc
++);
5664 mod
= (modrm
>> 6) & 3;
5666 s
->rip_offset
= insn_const_size(ot
);
5667 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
5669 val
= insn_get(env
, s
, ot
);
5670 gen_op_movl_T0_im(val
);
5672 gen_op_st_T0_A0(ot
+ s
->mem_index
);
5674 gen_op_mov_reg_T0(ot
, (modrm
& 7) | REX_B(s
));
5677 case 0x8b: /* mov Ev, Gv */
5681 ot
= OT_WORD
+ dflag
;
5682 modrm
= cpu_ldub_code(env
, s
->pc
++);
5683 reg
= ((modrm
>> 3) & 7) | rex_r
;
5685 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 0);
5686 gen_op_mov_reg_T0(ot
, reg
);
5688 case 0x8e: /* mov seg, Gv */
5689 modrm
= cpu_ldub_code(env
, s
->pc
++);
5690 reg
= (modrm
>> 3) & 7;
5691 if (reg
>= 6 || reg
== R_CS
)
5693 gen_ldst_modrm(env
, s
, modrm
, OT_WORD
, OR_TMP0
, 0);
5694 gen_movl_seg_T0(s
, reg
, pc_start
- s
->cs_base
);
5696 /* if reg == SS, inhibit interrupts/trace */
5697 /* If several instructions disable interrupts, only the
5699 if (!(s
->tb
->flags
& HF_INHIBIT_IRQ_MASK
))
5700 gen_helper_set_inhibit_irq(cpu_env
);
5704 gen_jmp_im(s
->pc
- s
->cs_base
);
5708 case 0x8c: /* mov Gv, seg */
5709 modrm
= cpu_ldub_code(env
, s
->pc
++);
5710 reg
= (modrm
>> 3) & 7;
5711 mod
= (modrm
>> 6) & 3;
5714 gen_op_movl_T0_seg(reg
);
5716 ot
= OT_WORD
+ dflag
;
5719 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 1);
5722 case 0x1b6: /* movzbS Gv, Eb */
5723 case 0x1b7: /* movzwS Gv, Eb */
5724 case 0x1be: /* movsbS Gv, Eb */
5725 case 0x1bf: /* movswS Gv, Eb */
5728 /* d_ot is the size of destination */
5729 d_ot
= dflag
+ OT_WORD
;
5730 /* ot is the size of source */
5731 ot
= (b
& 1) + OT_BYTE
;
5732 modrm
= cpu_ldub_code(env
, s
->pc
++);
5733 reg
= ((modrm
>> 3) & 7) | rex_r
;
5734 mod
= (modrm
>> 6) & 3;
5735 rm
= (modrm
& 7) | REX_B(s
);
5738 gen_op_mov_TN_reg(ot
, 0, rm
);
5739 switch(ot
| (b
& 8)) {
5741 tcg_gen_ext8u_tl(cpu_T
[0], cpu_T
[0]);
5744 tcg_gen_ext8s_tl(cpu_T
[0], cpu_T
[0]);
5747 tcg_gen_ext16u_tl(cpu_T
[0], cpu_T
[0]);
5751 tcg_gen_ext16s_tl(cpu_T
[0], cpu_T
[0]);
5754 gen_op_mov_reg_T0(d_ot
, reg
);
5756 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
5758 gen_op_lds_T0_A0(ot
+ s
->mem_index
);
5760 gen_op_ldu_T0_A0(ot
+ s
->mem_index
);
5762 gen_op_mov_reg_T0(d_ot
, reg
);
5767 case 0x8d: /* lea */
5768 ot
= dflag
+ OT_WORD
;
5769 modrm
= cpu_ldub_code(env
, s
->pc
++);
5770 mod
= (modrm
>> 6) & 3;
5773 reg
= ((modrm
>> 3) & 7) | rex_r
;
5774 /* we must ensure that no segment is added */
5778 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
5780 gen_op_mov_reg_A0(ot
- OT_WORD
, reg
);
5783 case 0xa0: /* mov EAX, Ov */
5785 case 0xa2: /* mov Ov, EAX */
5788 target_ulong offset_addr
;
5793 ot
= dflag
+ OT_WORD
;
5794 #ifdef TARGET_X86_64
5795 if (s
->aflag
== 2) {
5796 offset_addr
= cpu_ldq_code(env
, s
->pc
);
5798 gen_op_movq_A0_im(offset_addr
);
5803 offset_addr
= insn_get(env
, s
, OT_LONG
);
5805 offset_addr
= insn_get(env
, s
, OT_WORD
);
5807 gen_op_movl_A0_im(offset_addr
);
5809 gen_add_A0_ds_seg(s
);
5811 gen_op_ld_T0_A0(ot
+ s
->mem_index
);
5812 gen_op_mov_reg_T0(ot
, R_EAX
);
5814 gen_op_mov_TN_reg(ot
, 0, R_EAX
);
5815 gen_op_st_T0_A0(ot
+ s
->mem_index
);
5819 case 0xd7: /* xlat */
5820 #ifdef TARGET_X86_64
5821 if (s
->aflag
== 2) {
5822 gen_op_movq_A0_reg(R_EBX
);
5823 gen_op_mov_TN_reg(OT_QUAD
, 0, R_EAX
);
5824 tcg_gen_andi_tl(cpu_T
[0], cpu_T
[0], 0xff);
5825 tcg_gen_add_tl(cpu_A0
, cpu_A0
, cpu_T
[0]);
5829 gen_op_movl_A0_reg(R_EBX
);
5830 gen_op_mov_TN_reg(OT_LONG
, 0, R_EAX
);
5831 tcg_gen_andi_tl(cpu_T
[0], cpu_T
[0], 0xff);
5832 tcg_gen_add_tl(cpu_A0
, cpu_A0
, cpu_T
[0]);
5834 gen_op_andl_A0_ffff();
5836 tcg_gen_andi_tl(cpu_A0
, cpu_A0
, 0xffffffff);
5838 gen_add_A0_ds_seg(s
);
5839 gen_op_ldu_T0_A0(OT_BYTE
+ s
->mem_index
);
5840 gen_op_mov_reg_T0(OT_BYTE
, R_EAX
);
5842 case 0xb0 ... 0xb7: /* mov R, Ib */
5843 val
= insn_get(env
, s
, OT_BYTE
);
5844 gen_op_movl_T0_im(val
);
5845 gen_op_mov_reg_T0(OT_BYTE
, (b
& 7) | REX_B(s
));
5847 case 0xb8 ... 0xbf: /* mov R, Iv */
5848 #ifdef TARGET_X86_64
5852 tmp
= cpu_ldq_code(env
, s
->pc
);
5854 reg
= (b
& 7) | REX_B(s
);
5855 gen_movtl_T0_im(tmp
);
5856 gen_op_mov_reg_T0(OT_QUAD
, reg
);
5860 ot
= dflag
? OT_LONG
: OT_WORD
;
5861 val
= insn_get(env
, s
, ot
);
5862 reg
= (b
& 7) | REX_B(s
);
5863 gen_op_movl_T0_im(val
);
5864 gen_op_mov_reg_T0(ot
, reg
);
5868 case 0x91 ... 0x97: /* xchg R, EAX */
5870 ot
= dflag
+ OT_WORD
;
5871 reg
= (b
& 7) | REX_B(s
);
5875 case 0x87: /* xchg Ev, Gv */
5879 ot
= dflag
+ OT_WORD
;
5880 modrm
= cpu_ldub_code(env
, s
->pc
++);
5881 reg
= ((modrm
>> 3) & 7) | rex_r
;
5882 mod
= (modrm
>> 6) & 3;
5884 rm
= (modrm
& 7) | REX_B(s
);
5886 gen_op_mov_TN_reg(ot
, 0, reg
);
5887 gen_op_mov_TN_reg(ot
, 1, rm
);
5888 gen_op_mov_reg_T0(ot
, rm
);
5889 gen_op_mov_reg_T1(ot
, reg
);
5891 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
5892 gen_op_mov_TN_reg(ot
, 0, reg
);
5893 /* for xchg, lock is implicit */
5894 if (!(prefixes
& PREFIX_LOCK
))
5896 gen_op_ld_T1_A0(ot
+ s
->mem_index
);
5897 gen_op_st_T0_A0(ot
+ s
->mem_index
);
5898 if (!(prefixes
& PREFIX_LOCK
))
5899 gen_helper_unlock();
5900 gen_op_mov_reg_T1(ot
, reg
);
5903 case 0xc4: /* les Gv */
5904 /* In CODE64 this is VEX3; see above. */
5907 case 0xc5: /* lds Gv */
5908 /* In CODE64 this is VEX2; see above. */
5911 case 0x1b2: /* lss Gv */
5914 case 0x1b4: /* lfs Gv */
5917 case 0x1b5: /* lgs Gv */
5920 ot
= dflag
? OT_LONG
: OT_WORD
;
5921 modrm
= cpu_ldub_code(env
, s
->pc
++);
5922 reg
= ((modrm
>> 3) & 7) | rex_r
;
5923 mod
= (modrm
>> 6) & 3;
5926 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
5927 gen_op_ld_T1_A0(ot
+ s
->mem_index
);
5928 gen_add_A0_im(s
, 1 << (ot
- OT_WORD
+ 1));
5929 /* load the segment first to handle exceptions properly */
5930 gen_op_ldu_T0_A0(OT_WORD
+ s
->mem_index
);
5931 gen_movl_seg_T0(s
, op
, pc_start
- s
->cs_base
);
5932 /* then put the data */
5933 gen_op_mov_reg_T1(ot
, reg
);
5935 gen_jmp_im(s
->pc
- s
->cs_base
);
5940 /************************/
5951 ot
= dflag
+ OT_WORD
;
5953 modrm
= cpu_ldub_code(env
, s
->pc
++);
5954 mod
= (modrm
>> 6) & 3;
5955 op
= (modrm
>> 3) & 7;
5961 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
5964 opreg
= (modrm
& 7) | REX_B(s
);
5969 gen_shift(s
, op
, ot
, opreg
, OR_ECX
);
5972 shift
= cpu_ldub_code(env
, s
->pc
++);
5974 gen_shifti(s
, op
, ot
, opreg
, shift
);
5989 case 0x1a4: /* shld imm */
5993 case 0x1a5: /* shld cl */
5997 case 0x1ac: /* shrd imm */
6001 case 0x1ad: /* shrd cl */
6005 ot
= dflag
+ OT_WORD
;
6006 modrm
= cpu_ldub_code(env
, s
->pc
++);
6007 mod
= (modrm
>> 6) & 3;
6008 rm
= (modrm
& 7) | REX_B(s
);
6009 reg
= ((modrm
>> 3) & 7) | rex_r
;
6011 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
6016 gen_op_mov_TN_reg(ot
, 1, reg
);
6019 TCGv imm
= tcg_const_tl(cpu_ldub_code(env
, s
->pc
++));
6020 gen_shiftd_rm_T1(s
, ot
, opreg
, op
, imm
);
6023 gen_shiftd_rm_T1(s
, ot
, opreg
, op
, cpu_regs
[R_ECX
]);
6027 /************************/
6030 if (s
->flags
& (HF_EM_MASK
| HF_TS_MASK
)) {
6031 /* if CR0.EM or CR0.TS are set, generate an FPU exception */
6032 /* XXX: what to do if illegal op ? */
6033 gen_exception(s
, EXCP07_PREX
, pc_start
- s
->cs_base
);
6036 modrm
= cpu_ldub_code(env
, s
->pc
++);
6037 mod
= (modrm
>> 6) & 3;
6039 op
= ((b
& 7) << 3) | ((modrm
>> 3) & 7);
6042 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
6044 case 0x00 ... 0x07: /* fxxxs */
6045 case 0x10 ... 0x17: /* fixxxl */
6046 case 0x20 ... 0x27: /* fxxxl */
6047 case 0x30 ... 0x37: /* fixxx */
6054 gen_op_ld_T0_A0(OT_LONG
+ s
->mem_index
);
6055 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
6056 gen_helper_flds_FT0(cpu_env
, cpu_tmp2_i32
);
6059 gen_op_ld_T0_A0(OT_LONG
+ s
->mem_index
);
6060 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
6061 gen_helper_fildl_FT0(cpu_env
, cpu_tmp2_i32
);
6064 tcg_gen_qemu_ld64(cpu_tmp1_i64
, cpu_A0
,
6065 (s
->mem_index
>> 2) - 1);
6066 gen_helper_fldl_FT0(cpu_env
, cpu_tmp1_i64
);
6070 gen_op_lds_T0_A0(OT_WORD
+ s
->mem_index
);
6071 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
6072 gen_helper_fildl_FT0(cpu_env
, cpu_tmp2_i32
);
6076 gen_helper_fp_arith_ST0_FT0(op1
);
6078 /* fcomp needs pop */
6079 gen_helper_fpop(cpu_env
);
6083 case 0x08: /* flds */
6084 case 0x0a: /* fsts */
6085 case 0x0b: /* fstps */
6086 case 0x18 ... 0x1b: /* fildl, fisttpl, fistl, fistpl */
6087 case 0x28 ... 0x2b: /* fldl, fisttpll, fstl, fstpl */
6088 case 0x38 ... 0x3b: /* filds, fisttps, fists, fistps */
6093 gen_op_ld_T0_A0(OT_LONG
+ s
->mem_index
);
6094 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
6095 gen_helper_flds_ST0(cpu_env
, cpu_tmp2_i32
);
6098 gen_op_ld_T0_A0(OT_LONG
+ s
->mem_index
);
6099 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
6100 gen_helper_fildl_ST0(cpu_env
, cpu_tmp2_i32
);
6103 tcg_gen_qemu_ld64(cpu_tmp1_i64
, cpu_A0
,
6104 (s
->mem_index
>> 2) - 1);
6105 gen_helper_fldl_ST0(cpu_env
, cpu_tmp1_i64
);
6109 gen_op_lds_T0_A0(OT_WORD
+ s
->mem_index
);
6110 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
6111 gen_helper_fildl_ST0(cpu_env
, cpu_tmp2_i32
);
6116 /* XXX: the corresponding CPUID bit must be tested ! */
6119 gen_helper_fisttl_ST0(cpu_tmp2_i32
, cpu_env
);
6120 tcg_gen_extu_i32_tl(cpu_T
[0], cpu_tmp2_i32
);
6121 gen_op_st_T0_A0(OT_LONG
+ s
->mem_index
);
6124 gen_helper_fisttll_ST0(cpu_tmp1_i64
, cpu_env
);
6125 tcg_gen_qemu_st64(cpu_tmp1_i64
, cpu_A0
,
6126 (s
->mem_index
>> 2) - 1);
6130 gen_helper_fistt_ST0(cpu_tmp2_i32
, cpu_env
);
6131 tcg_gen_extu_i32_tl(cpu_T
[0], cpu_tmp2_i32
);
6132 gen_op_st_T0_A0(OT_WORD
+ s
->mem_index
);
6135 gen_helper_fpop(cpu_env
);
6140 gen_helper_fsts_ST0(cpu_tmp2_i32
, cpu_env
);
6141 tcg_gen_extu_i32_tl(cpu_T
[0], cpu_tmp2_i32
);
6142 gen_op_st_T0_A0(OT_LONG
+ s
->mem_index
);
6145 gen_helper_fistl_ST0(cpu_tmp2_i32
, cpu_env
);
6146 tcg_gen_extu_i32_tl(cpu_T
[0], cpu_tmp2_i32
);
6147 gen_op_st_T0_A0(OT_LONG
+ s
->mem_index
);
6150 gen_helper_fstl_ST0(cpu_tmp1_i64
, cpu_env
);
6151 tcg_gen_qemu_st64(cpu_tmp1_i64
, cpu_A0
,
6152 (s
->mem_index
>> 2) - 1);
6156 gen_helper_fist_ST0(cpu_tmp2_i32
, cpu_env
);
6157 tcg_gen_extu_i32_tl(cpu_T
[0], cpu_tmp2_i32
);
6158 gen_op_st_T0_A0(OT_WORD
+ s
->mem_index
);
6162 gen_helper_fpop(cpu_env
);
6166 case 0x0c: /* fldenv mem */
6167 gen_update_cc_op(s
);
6168 gen_jmp_im(pc_start
- s
->cs_base
);
6169 gen_helper_fldenv(cpu_env
, cpu_A0
, tcg_const_i32(s
->dflag
));
6171 case 0x0d: /* fldcw mem */
6172 gen_op_ld_T0_A0(OT_WORD
+ s
->mem_index
);
6173 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
6174 gen_helper_fldcw(cpu_env
, cpu_tmp2_i32
);
6176 case 0x0e: /* fnstenv mem */
6177 gen_update_cc_op(s
);
6178 gen_jmp_im(pc_start
- s
->cs_base
);
6179 gen_helper_fstenv(cpu_env
, cpu_A0
, tcg_const_i32(s
->dflag
));
6181 case 0x0f: /* fnstcw mem */
6182 gen_helper_fnstcw(cpu_tmp2_i32
, cpu_env
);
6183 tcg_gen_extu_i32_tl(cpu_T
[0], cpu_tmp2_i32
);
6184 gen_op_st_T0_A0(OT_WORD
+ s
->mem_index
);
6186 case 0x1d: /* fldt mem */
6187 gen_update_cc_op(s
);
6188 gen_jmp_im(pc_start
- s
->cs_base
);
6189 gen_helper_fldt_ST0(cpu_env
, cpu_A0
);
6191 case 0x1f: /* fstpt mem */
6192 gen_update_cc_op(s
);
6193 gen_jmp_im(pc_start
- s
->cs_base
);
6194 gen_helper_fstt_ST0(cpu_env
, cpu_A0
);
6195 gen_helper_fpop(cpu_env
);
6197 case 0x2c: /* frstor mem */
6198 gen_update_cc_op(s
);
6199 gen_jmp_im(pc_start
- s
->cs_base
);
6200 gen_helper_frstor(cpu_env
, cpu_A0
, tcg_const_i32(s
->dflag
));
6202 case 0x2e: /* fnsave mem */
6203 gen_update_cc_op(s
);
6204 gen_jmp_im(pc_start
- s
->cs_base
);
6205 gen_helper_fsave(cpu_env
, cpu_A0
, tcg_const_i32(s
->dflag
));
6207 case 0x2f: /* fnstsw mem */
6208 gen_helper_fnstsw(cpu_tmp2_i32
, cpu_env
);
6209 tcg_gen_extu_i32_tl(cpu_T
[0], cpu_tmp2_i32
);
6210 gen_op_st_T0_A0(OT_WORD
+ s
->mem_index
);
6212 case 0x3c: /* fbld */
6213 gen_update_cc_op(s
);
6214 gen_jmp_im(pc_start
- s
->cs_base
);
6215 gen_helper_fbld_ST0(cpu_env
, cpu_A0
);
6217 case 0x3e: /* fbstp */
6218 gen_update_cc_op(s
);
6219 gen_jmp_im(pc_start
- s
->cs_base
);
6220 gen_helper_fbst_ST0(cpu_env
, cpu_A0
);
6221 gen_helper_fpop(cpu_env
);
6223 case 0x3d: /* fildll */
6224 tcg_gen_qemu_ld64(cpu_tmp1_i64
, cpu_A0
,
6225 (s
->mem_index
>> 2) - 1);
6226 gen_helper_fildll_ST0(cpu_env
, cpu_tmp1_i64
);
6228 case 0x3f: /* fistpll */
6229 gen_helper_fistll_ST0(cpu_tmp1_i64
, cpu_env
);
6230 tcg_gen_qemu_st64(cpu_tmp1_i64
, cpu_A0
,
6231 (s
->mem_index
>> 2) - 1);
6232 gen_helper_fpop(cpu_env
);
6238 /* register float ops */
6242 case 0x08: /* fld sti */
6243 gen_helper_fpush(cpu_env
);
6244 gen_helper_fmov_ST0_STN(cpu_env
,
6245 tcg_const_i32((opreg
+ 1) & 7));
6247 case 0x09: /* fxchg sti */
6248 case 0x29: /* fxchg4 sti, undocumented op */
6249 case 0x39: /* fxchg7 sti, undocumented op */
6250 gen_helper_fxchg_ST0_STN(cpu_env
, tcg_const_i32(opreg
));
6252 case 0x0a: /* grp d9/2 */
6255 /* check exceptions (FreeBSD FPU probe) */
6256 gen_update_cc_op(s
);
6257 gen_jmp_im(pc_start
- s
->cs_base
);
6258 gen_helper_fwait(cpu_env
);
6264 case 0x0c: /* grp d9/4 */
6267 gen_helper_fchs_ST0(cpu_env
);
6270 gen_helper_fabs_ST0(cpu_env
);
6273 gen_helper_fldz_FT0(cpu_env
);
6274 gen_helper_fcom_ST0_FT0(cpu_env
);
6277 gen_helper_fxam_ST0(cpu_env
);
6283 case 0x0d: /* grp d9/5 */
6287 gen_helper_fpush(cpu_env
);
6288 gen_helper_fld1_ST0(cpu_env
);
6291 gen_helper_fpush(cpu_env
);
6292 gen_helper_fldl2t_ST0(cpu_env
);
6295 gen_helper_fpush(cpu_env
);
6296 gen_helper_fldl2e_ST0(cpu_env
);
6299 gen_helper_fpush(cpu_env
);
6300 gen_helper_fldpi_ST0(cpu_env
);
6303 gen_helper_fpush(cpu_env
);
6304 gen_helper_fldlg2_ST0(cpu_env
);
6307 gen_helper_fpush(cpu_env
);
6308 gen_helper_fldln2_ST0(cpu_env
);
6311 gen_helper_fpush(cpu_env
);
6312 gen_helper_fldz_ST0(cpu_env
);
6319 case 0x0e: /* grp d9/6 */
6322 gen_helper_f2xm1(cpu_env
);
6325 gen_helper_fyl2x(cpu_env
);
6328 gen_helper_fptan(cpu_env
);
6330 case 3: /* fpatan */
6331 gen_helper_fpatan(cpu_env
);
6333 case 4: /* fxtract */
6334 gen_helper_fxtract(cpu_env
);
6336 case 5: /* fprem1 */
6337 gen_helper_fprem1(cpu_env
);
6339 case 6: /* fdecstp */
6340 gen_helper_fdecstp(cpu_env
);
6343 case 7: /* fincstp */
6344 gen_helper_fincstp(cpu_env
);
6348 case 0x0f: /* grp d9/7 */
6351 gen_helper_fprem(cpu_env
);
6353 case 1: /* fyl2xp1 */
6354 gen_helper_fyl2xp1(cpu_env
);
6357 gen_helper_fsqrt(cpu_env
);
6359 case 3: /* fsincos */
6360 gen_helper_fsincos(cpu_env
);
6362 case 5: /* fscale */
6363 gen_helper_fscale(cpu_env
);
6365 case 4: /* frndint */
6366 gen_helper_frndint(cpu_env
);
6369 gen_helper_fsin(cpu_env
);
6373 gen_helper_fcos(cpu_env
);
6377 case 0x00: case 0x01: case 0x04 ... 0x07: /* fxxx st, sti */
6378 case 0x20: case 0x21: case 0x24 ... 0x27: /* fxxx sti, st */
6379 case 0x30: case 0x31: case 0x34 ... 0x37: /* fxxxp sti, st */
6385 gen_helper_fp_arith_STN_ST0(op1
, opreg
);
6387 gen_helper_fpop(cpu_env
);
6389 gen_helper_fmov_FT0_STN(cpu_env
, tcg_const_i32(opreg
));
6390 gen_helper_fp_arith_ST0_FT0(op1
);
6394 case 0x02: /* fcom */
6395 case 0x22: /* fcom2, undocumented op */
6396 gen_helper_fmov_FT0_STN(cpu_env
, tcg_const_i32(opreg
));
6397 gen_helper_fcom_ST0_FT0(cpu_env
);
6399 case 0x03: /* fcomp */
6400 case 0x23: /* fcomp3, undocumented op */
6401 case 0x32: /* fcomp5, undocumented op */
6402 gen_helper_fmov_FT0_STN(cpu_env
, tcg_const_i32(opreg
));
6403 gen_helper_fcom_ST0_FT0(cpu_env
);
6404 gen_helper_fpop(cpu_env
);
6406 case 0x15: /* da/5 */
6408 case 1: /* fucompp */
6409 gen_helper_fmov_FT0_STN(cpu_env
, tcg_const_i32(1));
6410 gen_helper_fucom_ST0_FT0(cpu_env
);
6411 gen_helper_fpop(cpu_env
);
6412 gen_helper_fpop(cpu_env
);
6420 case 0: /* feni (287 only, just do nop here) */
6422 case 1: /* fdisi (287 only, just do nop here) */
6425 gen_helper_fclex(cpu_env
);
6427 case 3: /* fninit */
6428 gen_helper_fninit(cpu_env
);
6430 case 4: /* fsetpm (287 only, just do nop here) */
6436 case 0x1d: /* fucomi */
6437 gen_update_cc_op(s
);
6438 gen_helper_fmov_FT0_STN(cpu_env
, tcg_const_i32(opreg
));
6439 gen_helper_fucomi_ST0_FT0(cpu_env
);
6440 set_cc_op(s
, CC_OP_EFLAGS
);
6442 case 0x1e: /* fcomi */
6443 gen_update_cc_op(s
);
6444 gen_helper_fmov_FT0_STN(cpu_env
, tcg_const_i32(opreg
));
6445 gen_helper_fcomi_ST0_FT0(cpu_env
);
6446 set_cc_op(s
, CC_OP_EFLAGS
);
6448 case 0x28: /* ffree sti */
6449 gen_helper_ffree_STN(cpu_env
, tcg_const_i32(opreg
));
6451 case 0x2a: /* fst sti */
6452 gen_helper_fmov_STN_ST0(cpu_env
, tcg_const_i32(opreg
));
6454 case 0x2b: /* fstp sti */
6455 case 0x0b: /* fstp1 sti, undocumented op */
6456 case 0x3a: /* fstp8 sti, undocumented op */
6457 case 0x3b: /* fstp9 sti, undocumented op */
6458 gen_helper_fmov_STN_ST0(cpu_env
, tcg_const_i32(opreg
));
6459 gen_helper_fpop(cpu_env
);
6461 case 0x2c: /* fucom st(i) */
6462 gen_helper_fmov_FT0_STN(cpu_env
, tcg_const_i32(opreg
));
6463 gen_helper_fucom_ST0_FT0(cpu_env
);
6465 case 0x2d: /* fucomp st(i) */
6466 gen_helper_fmov_FT0_STN(cpu_env
, tcg_const_i32(opreg
));
6467 gen_helper_fucom_ST0_FT0(cpu_env
);
6468 gen_helper_fpop(cpu_env
);
6470 case 0x33: /* de/3 */
6472 case 1: /* fcompp */
6473 gen_helper_fmov_FT0_STN(cpu_env
, tcg_const_i32(1));
6474 gen_helper_fcom_ST0_FT0(cpu_env
);
6475 gen_helper_fpop(cpu_env
);
6476 gen_helper_fpop(cpu_env
);
6482 case 0x38: /* ffreep sti, undocumented op */
6483 gen_helper_ffree_STN(cpu_env
, tcg_const_i32(opreg
));
6484 gen_helper_fpop(cpu_env
);
6486 case 0x3c: /* df/4 */
6489 gen_helper_fnstsw(cpu_tmp2_i32
, cpu_env
);
6490 tcg_gen_extu_i32_tl(cpu_T
[0], cpu_tmp2_i32
);
6491 gen_op_mov_reg_T0(OT_WORD
, R_EAX
);
6497 case 0x3d: /* fucomip */
6498 gen_update_cc_op(s
);
6499 gen_helper_fmov_FT0_STN(cpu_env
, tcg_const_i32(opreg
));
6500 gen_helper_fucomi_ST0_FT0(cpu_env
);
6501 gen_helper_fpop(cpu_env
);
6502 set_cc_op(s
, CC_OP_EFLAGS
);
6504 case 0x3e: /* fcomip */
6505 gen_update_cc_op(s
);
6506 gen_helper_fmov_FT0_STN(cpu_env
, tcg_const_i32(opreg
));
6507 gen_helper_fcomi_ST0_FT0(cpu_env
);
6508 gen_helper_fpop(cpu_env
);
6509 set_cc_op(s
, CC_OP_EFLAGS
);
6511 case 0x10 ... 0x13: /* fcmovxx */
6515 static const uint8_t fcmov_cc
[8] = {
6521 op1
= fcmov_cc
[op
& 3] | (((op
>> 3) & 1) ^ 1);
6522 l1
= gen_new_label();
6523 gen_jcc1_noeob(s
, op1
, l1
);
6524 gen_helper_fmov_ST0_STN(cpu_env
, tcg_const_i32(opreg
));
6533 /************************/
6536 case 0xa4: /* movsS */
6541 ot
= dflag
+ OT_WORD
;
6543 if (prefixes
& (PREFIX_REPZ
| PREFIX_REPNZ
)) {
6544 gen_repz_movs(s
, ot
, pc_start
- s
->cs_base
, s
->pc
- s
->cs_base
);
6550 case 0xaa: /* stosS */
6555 ot
= dflag
+ OT_WORD
;
6557 if (prefixes
& (PREFIX_REPZ
| PREFIX_REPNZ
)) {
6558 gen_repz_stos(s
, ot
, pc_start
- s
->cs_base
, s
->pc
- s
->cs_base
);
6563 case 0xac: /* lodsS */
6568 ot
= dflag
+ OT_WORD
;
6569 if (prefixes
& (PREFIX_REPZ
| PREFIX_REPNZ
)) {
6570 gen_repz_lods(s
, ot
, pc_start
- s
->cs_base
, s
->pc
- s
->cs_base
);
6575 case 0xae: /* scasS */
6580 ot
= dflag
+ OT_WORD
;
6581 if (prefixes
& PREFIX_REPNZ
) {
6582 gen_repz_scas(s
, ot
, pc_start
- s
->cs_base
, s
->pc
- s
->cs_base
, 1);
6583 } else if (prefixes
& PREFIX_REPZ
) {
6584 gen_repz_scas(s
, ot
, pc_start
- s
->cs_base
, s
->pc
- s
->cs_base
, 0);
6590 case 0xa6: /* cmpsS */
6595 ot
= dflag
+ OT_WORD
;
6596 if (prefixes
& PREFIX_REPNZ
) {
6597 gen_repz_cmps(s
, ot
, pc_start
- s
->cs_base
, s
->pc
- s
->cs_base
, 1);
6598 } else if (prefixes
& PREFIX_REPZ
) {
6599 gen_repz_cmps(s
, ot
, pc_start
- s
->cs_base
, s
->pc
- s
->cs_base
, 0);
6604 case 0x6c: /* insS */
6609 ot
= dflag
? OT_LONG
: OT_WORD
;
6610 gen_op_mov_TN_reg(OT_WORD
, 0, R_EDX
);
6611 gen_op_andl_T0_ffff();
6612 gen_check_io(s
, ot
, pc_start
- s
->cs_base
,
6613 SVM_IOIO_TYPE_MASK
| svm_is_rep(prefixes
) | 4);
6614 if (prefixes
& (PREFIX_REPZ
| PREFIX_REPNZ
)) {
6615 gen_repz_ins(s
, ot
, pc_start
- s
->cs_base
, s
->pc
- s
->cs_base
);
6619 gen_jmp(s
, s
->pc
- s
->cs_base
);
6623 case 0x6e: /* outsS */
6628 ot
= dflag
? OT_LONG
: OT_WORD
;
6629 gen_op_mov_TN_reg(OT_WORD
, 0, R_EDX
);
6630 gen_op_andl_T0_ffff();
6631 gen_check_io(s
, ot
, pc_start
- s
->cs_base
,
6632 svm_is_rep(prefixes
) | 4);
6633 if (prefixes
& (PREFIX_REPZ
| PREFIX_REPNZ
)) {
6634 gen_repz_outs(s
, ot
, pc_start
- s
->cs_base
, s
->pc
- s
->cs_base
);
6638 gen_jmp(s
, s
->pc
- s
->cs_base
);
6643 /************************/
6651 ot
= dflag
? OT_LONG
: OT_WORD
;
6652 val
= cpu_ldub_code(env
, s
->pc
++);
6653 gen_op_movl_T0_im(val
);
6654 gen_check_io(s
, ot
, pc_start
- s
->cs_base
,
6655 SVM_IOIO_TYPE_MASK
| svm_is_rep(prefixes
));
6658 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
6659 gen_helper_in_func(ot
, cpu_T
[1], cpu_tmp2_i32
);
6660 gen_op_mov_reg_T1(ot
, R_EAX
);
6663 gen_jmp(s
, s
->pc
- s
->cs_base
);
6671 ot
= dflag
? OT_LONG
: OT_WORD
;
6672 val
= cpu_ldub_code(env
, s
->pc
++);
6673 gen_op_movl_T0_im(val
);
6674 gen_check_io(s
, ot
, pc_start
- s
->cs_base
,
6675 svm_is_rep(prefixes
));
6676 gen_op_mov_TN_reg(ot
, 1, R_EAX
);
6680 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
6681 tcg_gen_trunc_tl_i32(cpu_tmp3_i32
, cpu_T
[1]);
6682 gen_helper_out_func(ot
, cpu_tmp2_i32
, cpu_tmp3_i32
);
6685 gen_jmp(s
, s
->pc
- s
->cs_base
);
6693 ot
= dflag
? OT_LONG
: OT_WORD
;
6694 gen_op_mov_TN_reg(OT_WORD
, 0, R_EDX
);
6695 gen_op_andl_T0_ffff();
6696 gen_check_io(s
, ot
, pc_start
- s
->cs_base
,
6697 SVM_IOIO_TYPE_MASK
| svm_is_rep(prefixes
));
6700 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
6701 gen_helper_in_func(ot
, cpu_T
[1], cpu_tmp2_i32
);
6702 gen_op_mov_reg_T1(ot
, R_EAX
);
6705 gen_jmp(s
, s
->pc
- s
->cs_base
);
6713 ot
= dflag
? OT_LONG
: OT_WORD
;
6714 gen_op_mov_TN_reg(OT_WORD
, 0, R_EDX
);
6715 gen_op_andl_T0_ffff();
6716 gen_check_io(s
, ot
, pc_start
- s
->cs_base
,
6717 svm_is_rep(prefixes
));
6718 gen_op_mov_TN_reg(ot
, 1, R_EAX
);
6722 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
6723 tcg_gen_trunc_tl_i32(cpu_tmp3_i32
, cpu_T
[1]);
6724 gen_helper_out_func(ot
, cpu_tmp2_i32
, cpu_tmp3_i32
);
6727 gen_jmp(s
, s
->pc
- s
->cs_base
);
6731 /************************/
6733 case 0xc2: /* ret im */
6734 val
= cpu_ldsw_code(env
, s
->pc
);
6737 if (CODE64(s
) && s
->dflag
)
6739 gen_stack_update(s
, val
+ (2 << s
->dflag
));
6741 gen_op_andl_T0_ffff();
6745 case 0xc3: /* ret */
6749 gen_op_andl_T0_ffff();
6753 case 0xca: /* lret im */
6754 val
= cpu_ldsw_code(env
, s
->pc
);
6757 if (s
->pe
&& !s
->vm86
) {
6758 gen_update_cc_op(s
);
6759 gen_jmp_im(pc_start
- s
->cs_base
);
6760 gen_helper_lret_protected(cpu_env
, tcg_const_i32(s
->dflag
),
6761 tcg_const_i32(val
));
6765 gen_op_ld_T0_A0(1 + s
->dflag
+ s
->mem_index
);
6767 gen_op_andl_T0_ffff();
6768 /* NOTE: keeping EIP updated is not a problem in case of
6772 gen_op_addl_A0_im(2 << s
->dflag
);
6773 gen_op_ld_T0_A0(1 + s
->dflag
+ s
->mem_index
);
6774 gen_op_movl_seg_T0_vm(R_CS
);
6775 /* add stack offset */
6776 gen_stack_update(s
, val
+ (4 << s
->dflag
));
6780 case 0xcb: /* lret */
6783 case 0xcf: /* iret */
6784 gen_svm_check_intercept(s
, pc_start
, SVM_EXIT_IRET
);
6787 gen_helper_iret_real(cpu_env
, tcg_const_i32(s
->dflag
));
6788 set_cc_op(s
, CC_OP_EFLAGS
);
6789 } else if (s
->vm86
) {
6791 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
6793 gen_helper_iret_real(cpu_env
, tcg_const_i32(s
->dflag
));
6794 set_cc_op(s
, CC_OP_EFLAGS
);
6797 gen_update_cc_op(s
);
6798 gen_jmp_im(pc_start
- s
->cs_base
);
6799 gen_helper_iret_protected(cpu_env
, tcg_const_i32(s
->dflag
),
6800 tcg_const_i32(s
->pc
- s
->cs_base
));
6801 set_cc_op(s
, CC_OP_EFLAGS
);
6805 case 0xe8: /* call im */
6808 tval
= (int32_t)insn_get(env
, s
, OT_LONG
);
6810 tval
= (int16_t)insn_get(env
, s
, OT_WORD
);
6811 next_eip
= s
->pc
- s
->cs_base
;
6817 gen_movtl_T0_im(next_eip
);
6822 case 0x9a: /* lcall im */
6824 unsigned int selector
, offset
;
6828 ot
= dflag
? OT_LONG
: OT_WORD
;
6829 offset
= insn_get(env
, s
, ot
);
6830 selector
= insn_get(env
, s
, OT_WORD
);
6832 gen_op_movl_T0_im(selector
);
6833 gen_op_movl_T1_imu(offset
);
6836 case 0xe9: /* jmp im */
6838 tval
= (int32_t)insn_get(env
, s
, OT_LONG
);
6840 tval
= (int16_t)insn_get(env
, s
, OT_WORD
);
6841 tval
+= s
->pc
- s
->cs_base
;
6848 case 0xea: /* ljmp im */
6850 unsigned int selector
, offset
;
6854 ot
= dflag
? OT_LONG
: OT_WORD
;
6855 offset
= insn_get(env
, s
, ot
);
6856 selector
= insn_get(env
, s
, OT_WORD
);
6858 gen_op_movl_T0_im(selector
);
6859 gen_op_movl_T1_imu(offset
);
6862 case 0xeb: /* jmp Jb */
6863 tval
= (int8_t)insn_get(env
, s
, OT_BYTE
);
6864 tval
+= s
->pc
- s
->cs_base
;
6869 case 0x70 ... 0x7f: /* jcc Jb */
6870 tval
= (int8_t)insn_get(env
, s
, OT_BYTE
);
6872 case 0x180 ... 0x18f: /* jcc Jv */
6874 tval
= (int32_t)insn_get(env
, s
, OT_LONG
);
6876 tval
= (int16_t)insn_get(env
, s
, OT_WORD
);
6879 next_eip
= s
->pc
- s
->cs_base
;
6883 gen_jcc(s
, b
, tval
, next_eip
);
6886 case 0x190 ... 0x19f: /* setcc Gv */
6887 modrm
= cpu_ldub_code(env
, s
->pc
++);
6888 gen_setcc1(s
, b
, cpu_T
[0]);
6889 gen_ldst_modrm(env
, s
, modrm
, OT_BYTE
, OR_TMP0
, 1);
6891 case 0x140 ... 0x14f: /* cmov Gv, Ev */
6892 ot
= dflag
+ OT_WORD
;
6893 modrm
= cpu_ldub_code(env
, s
->pc
++);
6894 reg
= ((modrm
>> 3) & 7) | rex_r
;
6895 gen_cmovcc1(env
, s
, ot
, b
, modrm
, reg
);
6898 /************************/
6900 case 0x9c: /* pushf */
6901 gen_svm_check_intercept(s
, pc_start
, SVM_EXIT_PUSHF
);
6902 if (s
->vm86
&& s
->iopl
!= 3) {
6903 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
6905 gen_update_cc_op(s
);
6906 gen_helper_read_eflags(cpu_T
[0], cpu_env
);
6910 case 0x9d: /* popf */
6911 gen_svm_check_intercept(s
, pc_start
, SVM_EXIT_POPF
);
6912 if (s
->vm86
&& s
->iopl
!= 3) {
6913 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
6918 gen_helper_write_eflags(cpu_env
, cpu_T
[0],
6919 tcg_const_i32((TF_MASK
| AC_MASK
|
6924 gen_helper_write_eflags(cpu_env
, cpu_T
[0],
6925 tcg_const_i32((TF_MASK
| AC_MASK
|
6927 IF_MASK
| IOPL_MASK
)
6931 if (s
->cpl
<= s
->iopl
) {
6933 gen_helper_write_eflags(cpu_env
, cpu_T
[0],
6934 tcg_const_i32((TF_MASK
|
6940 gen_helper_write_eflags(cpu_env
, cpu_T
[0],
6941 tcg_const_i32((TF_MASK
|
6950 gen_helper_write_eflags(cpu_env
, cpu_T
[0],
6951 tcg_const_i32((TF_MASK
| AC_MASK
|
6952 ID_MASK
| NT_MASK
)));
6954 gen_helper_write_eflags(cpu_env
, cpu_T
[0],
6955 tcg_const_i32((TF_MASK
| AC_MASK
|
6962 set_cc_op(s
, CC_OP_EFLAGS
);
6963 /* abort translation because TF/AC flag may change */
6964 gen_jmp_im(s
->pc
- s
->cs_base
);
6968 case 0x9e: /* sahf */
6969 if (CODE64(s
) && !(s
->cpuid_ext3_features
& CPUID_EXT3_LAHF_LM
))
6971 gen_op_mov_TN_reg(OT_BYTE
, 0, R_AH
);
6972 gen_compute_eflags(s
);
6973 tcg_gen_andi_tl(cpu_cc_src
, cpu_cc_src
, CC_O
);
6974 tcg_gen_andi_tl(cpu_T
[0], cpu_T
[0], CC_S
| CC_Z
| CC_A
| CC_P
| CC_C
);
6975 tcg_gen_or_tl(cpu_cc_src
, cpu_cc_src
, cpu_T
[0]);
6977 case 0x9f: /* lahf */
6978 if (CODE64(s
) && !(s
->cpuid_ext3_features
& CPUID_EXT3_LAHF_LM
))
6980 gen_compute_eflags(s
);
6981 /* Note: gen_compute_eflags() only gives the condition codes */
6982 tcg_gen_ori_tl(cpu_T
[0], cpu_cc_src
, 0x02);
6983 gen_op_mov_reg_T0(OT_BYTE
, R_AH
);
6985 case 0xf5: /* cmc */
6986 gen_compute_eflags(s
);
6987 tcg_gen_xori_tl(cpu_cc_src
, cpu_cc_src
, CC_C
);
6989 case 0xf8: /* clc */
6990 gen_compute_eflags(s
);
6991 tcg_gen_andi_tl(cpu_cc_src
, cpu_cc_src
, ~CC_C
);
6993 case 0xf9: /* stc */
6994 gen_compute_eflags(s
);
6995 tcg_gen_ori_tl(cpu_cc_src
, cpu_cc_src
, CC_C
);
6997 case 0xfc: /* cld */
6998 tcg_gen_movi_i32(cpu_tmp2_i32
, 1);
6999 tcg_gen_st_i32(cpu_tmp2_i32
, cpu_env
, offsetof(CPUX86State
, df
));
7001 case 0xfd: /* std */
7002 tcg_gen_movi_i32(cpu_tmp2_i32
, -1);
7003 tcg_gen_st_i32(cpu_tmp2_i32
, cpu_env
, offsetof(CPUX86State
, df
));
7006 /************************/
7007 /* bit operations */
7008 case 0x1ba: /* bt/bts/btr/btc Gv, im */
7009 ot
= dflag
+ OT_WORD
;
7010 modrm
= cpu_ldub_code(env
, s
->pc
++);
7011 op
= (modrm
>> 3) & 7;
7012 mod
= (modrm
>> 6) & 3;
7013 rm
= (modrm
& 7) | REX_B(s
);
7016 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
7017 gen_op_ld_T0_A0(ot
+ s
->mem_index
);
7019 gen_op_mov_TN_reg(ot
, 0, rm
);
7022 val
= cpu_ldub_code(env
, s
->pc
++);
7023 gen_op_movl_T1_im(val
);
7028 case 0x1a3: /* bt Gv, Ev */
7031 case 0x1ab: /* bts */
7034 case 0x1b3: /* btr */
7037 case 0x1bb: /* btc */
7040 ot
= dflag
+ OT_WORD
;
7041 modrm
= cpu_ldub_code(env
, s
->pc
++);
7042 reg
= ((modrm
>> 3) & 7) | rex_r
;
7043 mod
= (modrm
>> 6) & 3;
7044 rm
= (modrm
& 7) | REX_B(s
);
7045 gen_op_mov_TN_reg(OT_LONG
, 1, reg
);
7047 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
7048 /* specific case: we need to add a displacement */
7049 gen_exts(ot
, cpu_T
[1]);
7050 tcg_gen_sari_tl(cpu_tmp0
, cpu_T
[1], 3 + ot
);
7051 tcg_gen_shli_tl(cpu_tmp0
, cpu_tmp0
, ot
);
7052 tcg_gen_add_tl(cpu_A0
, cpu_A0
, cpu_tmp0
);
7053 gen_op_ld_T0_A0(ot
+ s
->mem_index
);
7055 gen_op_mov_TN_reg(ot
, 0, rm
);
7058 tcg_gen_andi_tl(cpu_T
[1], cpu_T
[1], (1 << (3 + ot
)) - 1);
7061 tcg_gen_shr_tl(cpu_cc_src
, cpu_T
[0], cpu_T
[1]);
7062 tcg_gen_movi_tl(cpu_cc_dst
, 0);
7065 tcg_gen_shr_tl(cpu_tmp4
, cpu_T
[0], cpu_T
[1]);
7066 tcg_gen_movi_tl(cpu_tmp0
, 1);
7067 tcg_gen_shl_tl(cpu_tmp0
, cpu_tmp0
, cpu_T
[1]);
7068 tcg_gen_or_tl(cpu_T
[0], cpu_T
[0], cpu_tmp0
);
7071 tcg_gen_shr_tl(cpu_tmp4
, cpu_T
[0], cpu_T
[1]);
7072 tcg_gen_movi_tl(cpu_tmp0
, 1);
7073 tcg_gen_shl_tl(cpu_tmp0
, cpu_tmp0
, cpu_T
[1]);
7074 tcg_gen_not_tl(cpu_tmp0
, cpu_tmp0
);
7075 tcg_gen_and_tl(cpu_T
[0], cpu_T
[0], cpu_tmp0
);
7079 tcg_gen_shr_tl(cpu_tmp4
, cpu_T
[0], cpu_T
[1]);
7080 tcg_gen_movi_tl(cpu_tmp0
, 1);
7081 tcg_gen_shl_tl(cpu_tmp0
, cpu_tmp0
, cpu_T
[1]);
7082 tcg_gen_xor_tl(cpu_T
[0], cpu_T
[0], cpu_tmp0
);
7085 set_cc_op(s
, CC_OP_SARB
+ ot
);
7088 gen_op_st_T0_A0(ot
+ s
->mem_index
);
7090 gen_op_mov_reg_T0(ot
, rm
);
7091 tcg_gen_mov_tl(cpu_cc_src
, cpu_tmp4
);
7092 tcg_gen_movi_tl(cpu_cc_dst
, 0);
7095 case 0x1bc: /* bsf / tzcnt */
7096 case 0x1bd: /* bsr / lzcnt */
7097 ot
= dflag
+ OT_WORD
;
7098 modrm
= cpu_ldub_code(env
, s
->pc
++);
7099 reg
= ((modrm
>> 3) & 7) | rex_r
;
7100 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 0);
7101 gen_extu(ot
, cpu_T
[0]);
7103 /* Note that lzcnt and tzcnt are in different extensions. */
7104 if ((prefixes
& PREFIX_REPZ
)
7106 ? s
->cpuid_ext3_features
& CPUID_EXT3_ABM
7107 : s
->cpuid_7_0_ebx_features
& CPUID_7_0_EBX_BMI1
)) {
7109 tcg_gen_mov_tl(cpu_cc_src
, cpu_T
[0]);
7111 /* For lzcnt, reduce the target_ulong result by the
7112 number of zeros that we expect to find at the top. */
7113 gen_helper_clz(cpu_T
[0], cpu_T
[0]);
7114 tcg_gen_subi_tl(cpu_T
[0], cpu_T
[0], TARGET_LONG_BITS
- size
);
7116 /* For tzcnt, a zero input must return the operand size:
7117 force all bits outside the operand size to 1. */
7118 target_ulong mask
= (target_ulong
)-2 << (size
- 1);
7119 tcg_gen_ori_tl(cpu_T
[0], cpu_T
[0], mask
);
7120 gen_helper_ctz(cpu_T
[0], cpu_T
[0]);
7122 /* For lzcnt/tzcnt, C and Z bits are defined and are
7123 related to the result. */
7124 gen_op_update1_cc();
7125 set_cc_op(s
, CC_OP_BMILGB
+ ot
);
7127 /* For bsr/bsf, only the Z bit is defined and it is related
7128 to the input and not the result. */
7129 tcg_gen_mov_tl(cpu_cc_dst
, cpu_T
[0]);
7130 set_cc_op(s
, CC_OP_LOGICB
+ ot
);
7132 /* For bsr, return the bit index of the first 1 bit,
7133 not the count of leading zeros. */
7134 gen_helper_clz(cpu_T
[0], cpu_T
[0]);
7135 tcg_gen_xori_tl(cpu_T
[0], cpu_T
[0], TARGET_LONG_BITS
- 1);
7137 gen_helper_ctz(cpu_T
[0], cpu_T
[0]);
7139 /* ??? The manual says that the output is undefined when the
7140 input is zero, but real hardware leaves it unchanged, and
7141 real programs appear to depend on that. */
7142 tcg_gen_movi_tl(cpu_tmp0
, 0);
7143 tcg_gen_movcond_tl(TCG_COND_EQ
, cpu_T
[0], cpu_cc_dst
, cpu_tmp0
,
7144 cpu_regs
[reg
], cpu_T
[0]);
7146 gen_op_mov_reg_T0(ot
, reg
);
7148 /************************/
7150 case 0x27: /* daa */
7153 gen_update_cc_op(s
);
7154 gen_helper_daa(cpu_env
);
7155 set_cc_op(s
, CC_OP_EFLAGS
);
7157 case 0x2f: /* das */
7160 gen_update_cc_op(s
);
7161 gen_helper_das(cpu_env
);
7162 set_cc_op(s
, CC_OP_EFLAGS
);
7164 case 0x37: /* aaa */
7167 gen_update_cc_op(s
);
7168 gen_helper_aaa(cpu_env
);
7169 set_cc_op(s
, CC_OP_EFLAGS
);
7171 case 0x3f: /* aas */
7174 gen_update_cc_op(s
);
7175 gen_helper_aas(cpu_env
);
7176 set_cc_op(s
, CC_OP_EFLAGS
);
7178 case 0xd4: /* aam */
7181 val
= cpu_ldub_code(env
, s
->pc
++);
7183 gen_exception(s
, EXCP00_DIVZ
, pc_start
- s
->cs_base
);
7185 gen_helper_aam(cpu_env
, tcg_const_i32(val
));
7186 set_cc_op(s
, CC_OP_LOGICB
);
7189 case 0xd5: /* aad */
7192 val
= cpu_ldub_code(env
, s
->pc
++);
7193 gen_helper_aad(cpu_env
, tcg_const_i32(val
));
7194 set_cc_op(s
, CC_OP_LOGICB
);
7196 /************************/
7198 case 0x90: /* nop */
7199 /* XXX: correct lock test for all insn */
7200 if (prefixes
& PREFIX_LOCK
) {
7203 /* If REX_B is set, then this is xchg eax, r8d, not a nop. */
7205 goto do_xchg_reg_eax
;
7207 if (prefixes
& PREFIX_REPZ
) {
7208 gen_svm_check_intercept(s
, pc_start
, SVM_EXIT_PAUSE
);
7211 case 0x9b: /* fwait */
7212 if ((s
->flags
& (HF_MP_MASK
| HF_TS_MASK
)) ==
7213 (HF_MP_MASK
| HF_TS_MASK
)) {
7214 gen_exception(s
, EXCP07_PREX
, pc_start
- s
->cs_base
);
7216 gen_update_cc_op(s
);
7217 gen_jmp_im(pc_start
- s
->cs_base
);
7218 gen_helper_fwait(cpu_env
);
7221 case 0xcc: /* int3 */
7222 gen_interrupt(s
, EXCP03_INT3
, pc_start
- s
->cs_base
, s
->pc
- s
->cs_base
);
7224 case 0xcd: /* int N */
7225 val
= cpu_ldub_code(env
, s
->pc
++);
7226 if (s
->vm86
&& s
->iopl
!= 3) {
7227 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7229 gen_interrupt(s
, val
, pc_start
- s
->cs_base
, s
->pc
- s
->cs_base
);
7232 case 0xce: /* into */
7235 gen_update_cc_op(s
);
7236 gen_jmp_im(pc_start
- s
->cs_base
);
7237 gen_helper_into(cpu_env
, tcg_const_i32(s
->pc
- pc_start
));
7240 case 0xf1: /* icebp (undocumented, exits to external debugger) */
7241 gen_svm_check_intercept(s
, pc_start
, SVM_EXIT_ICEBP
);
7243 gen_debug(s
, pc_start
- s
->cs_base
);
7247 qemu_set_log(CPU_LOG_INT
| CPU_LOG_TB_IN_ASM
);
7251 case 0xfa: /* cli */
7253 if (s
->cpl
<= s
->iopl
) {
7254 gen_helper_cli(cpu_env
);
7256 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7260 gen_helper_cli(cpu_env
);
7262 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7266 case 0xfb: /* sti */
7268 if (s
->cpl
<= s
->iopl
) {
7270 gen_helper_sti(cpu_env
);
7271 /* interruptions are enabled only the first insn after sti */
7272 /* If several instructions disable interrupts, only the
7274 if (!(s
->tb
->flags
& HF_INHIBIT_IRQ_MASK
))
7275 gen_helper_set_inhibit_irq(cpu_env
);
7276 /* give a chance to handle pending irqs */
7277 gen_jmp_im(s
->pc
- s
->cs_base
);
7280 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7286 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7290 case 0x62: /* bound */
7293 ot
= dflag
? OT_LONG
: OT_WORD
;
7294 modrm
= cpu_ldub_code(env
, s
->pc
++);
7295 reg
= (modrm
>> 3) & 7;
7296 mod
= (modrm
>> 6) & 3;
7299 gen_op_mov_TN_reg(ot
, 0, reg
);
7300 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
7301 gen_jmp_im(pc_start
- s
->cs_base
);
7302 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
7303 if (ot
== OT_WORD
) {
7304 gen_helper_boundw(cpu_env
, cpu_A0
, cpu_tmp2_i32
);
7306 gen_helper_boundl(cpu_env
, cpu_A0
, cpu_tmp2_i32
);
7309 case 0x1c8 ... 0x1cf: /* bswap reg */
7310 reg
= (b
& 7) | REX_B(s
);
7311 #ifdef TARGET_X86_64
7313 gen_op_mov_TN_reg(OT_QUAD
, 0, reg
);
7314 tcg_gen_bswap64_i64(cpu_T
[0], cpu_T
[0]);
7315 gen_op_mov_reg_T0(OT_QUAD
, reg
);
7319 gen_op_mov_TN_reg(OT_LONG
, 0, reg
);
7320 tcg_gen_ext32u_tl(cpu_T
[0], cpu_T
[0]);
7321 tcg_gen_bswap32_tl(cpu_T
[0], cpu_T
[0]);
7322 gen_op_mov_reg_T0(OT_LONG
, reg
);
7325 case 0xd6: /* salc */
7328 gen_compute_eflags_c(s
, cpu_T
[0]);
7329 tcg_gen_neg_tl(cpu_T
[0], cpu_T
[0]);
7330 gen_op_mov_reg_T0(OT_BYTE
, R_EAX
);
7332 case 0xe0: /* loopnz */
7333 case 0xe1: /* loopz */
7334 case 0xe2: /* loop */
7335 case 0xe3: /* jecxz */
7339 tval
= (int8_t)insn_get(env
, s
, OT_BYTE
);
7340 next_eip
= s
->pc
- s
->cs_base
;
7345 l1
= gen_new_label();
7346 l2
= gen_new_label();
7347 l3
= gen_new_label();
7350 case 0: /* loopnz */
7352 gen_op_add_reg_im(s
->aflag
, R_ECX
, -1);
7353 gen_op_jz_ecx(s
->aflag
, l3
);
7354 gen_jcc1(s
, (JCC_Z
<< 1) | (b
^ 1), l1
);
7357 gen_op_add_reg_im(s
->aflag
, R_ECX
, -1);
7358 gen_op_jnz_ecx(s
->aflag
, l1
);
7362 gen_op_jz_ecx(s
->aflag
, l1
);
7367 gen_jmp_im(next_eip
);
7376 case 0x130: /* wrmsr */
7377 case 0x132: /* rdmsr */
7379 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7381 gen_update_cc_op(s
);
7382 gen_jmp_im(pc_start
- s
->cs_base
);
7384 gen_helper_rdmsr(cpu_env
);
7386 gen_helper_wrmsr(cpu_env
);
7390 case 0x131: /* rdtsc */
7391 gen_update_cc_op(s
);
7392 gen_jmp_im(pc_start
- s
->cs_base
);
7395 gen_helper_rdtsc(cpu_env
);
7398 gen_jmp(s
, s
->pc
- s
->cs_base
);
7401 case 0x133: /* rdpmc */
7402 gen_update_cc_op(s
);
7403 gen_jmp_im(pc_start
- s
->cs_base
);
7404 gen_helper_rdpmc(cpu_env
);
7406 case 0x134: /* sysenter */
7407 /* For Intel SYSENTER is valid on 64-bit */
7408 if (CODE64(s
) && env
->cpuid_vendor1
!= CPUID_VENDOR_INTEL_1
)
7411 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7413 gen_update_cc_op(s
);
7414 gen_jmp_im(pc_start
- s
->cs_base
);
7415 gen_helper_sysenter(cpu_env
);
7419 case 0x135: /* sysexit */
7420 /* For Intel SYSEXIT is valid on 64-bit */
7421 if (CODE64(s
) && env
->cpuid_vendor1
!= CPUID_VENDOR_INTEL_1
)
7424 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7426 gen_update_cc_op(s
);
7427 gen_jmp_im(pc_start
- s
->cs_base
);
7428 gen_helper_sysexit(cpu_env
, tcg_const_i32(dflag
));
7432 #ifdef TARGET_X86_64
7433 case 0x105: /* syscall */
7434 /* XXX: is it usable in real mode ? */
7435 gen_update_cc_op(s
);
7436 gen_jmp_im(pc_start
- s
->cs_base
);
7437 gen_helper_syscall(cpu_env
, tcg_const_i32(s
->pc
- pc_start
));
7440 case 0x107: /* sysret */
7442 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7444 gen_update_cc_op(s
);
7445 gen_jmp_im(pc_start
- s
->cs_base
);
7446 gen_helper_sysret(cpu_env
, tcg_const_i32(s
->dflag
));
7447 /* condition codes are modified only in long mode */
7449 set_cc_op(s
, CC_OP_EFLAGS
);
7455 case 0x1a2: /* cpuid */
7456 gen_update_cc_op(s
);
7457 gen_jmp_im(pc_start
- s
->cs_base
);
7458 gen_helper_cpuid(cpu_env
);
7460 case 0xf4: /* hlt */
7462 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7464 gen_update_cc_op(s
);
7465 gen_jmp_im(pc_start
- s
->cs_base
);
7466 gen_helper_hlt(cpu_env
, tcg_const_i32(s
->pc
- pc_start
));
7467 s
->is_jmp
= DISAS_TB_JUMP
;
7471 modrm
= cpu_ldub_code(env
, s
->pc
++);
7472 mod
= (modrm
>> 6) & 3;
7473 op
= (modrm
>> 3) & 7;
7476 if (!s
->pe
|| s
->vm86
)
7478 gen_svm_check_intercept(s
, pc_start
, SVM_EXIT_LDTR_READ
);
7479 tcg_gen_ld32u_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,ldt
.selector
));
7483 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 1);
7486 if (!s
->pe
|| s
->vm86
)
7489 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7491 gen_svm_check_intercept(s
, pc_start
, SVM_EXIT_LDTR_WRITE
);
7492 gen_ldst_modrm(env
, s
, modrm
, OT_WORD
, OR_TMP0
, 0);
7493 gen_jmp_im(pc_start
- s
->cs_base
);
7494 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
7495 gen_helper_lldt(cpu_env
, cpu_tmp2_i32
);
7499 if (!s
->pe
|| s
->vm86
)
7501 gen_svm_check_intercept(s
, pc_start
, SVM_EXIT_TR_READ
);
7502 tcg_gen_ld32u_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,tr
.selector
));
7506 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 1);
7509 if (!s
->pe
|| s
->vm86
)
7512 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7514 gen_svm_check_intercept(s
, pc_start
, SVM_EXIT_TR_WRITE
);
7515 gen_ldst_modrm(env
, s
, modrm
, OT_WORD
, OR_TMP0
, 0);
7516 gen_jmp_im(pc_start
- s
->cs_base
);
7517 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
7518 gen_helper_ltr(cpu_env
, cpu_tmp2_i32
);
7523 if (!s
->pe
|| s
->vm86
)
7525 gen_ldst_modrm(env
, s
, modrm
, OT_WORD
, OR_TMP0
, 0);
7526 gen_update_cc_op(s
);
7528 gen_helper_verr(cpu_env
, cpu_T
[0]);
7530 gen_helper_verw(cpu_env
, cpu_T
[0]);
7532 set_cc_op(s
, CC_OP_EFLAGS
);
7539 modrm
= cpu_ldub_code(env
, s
->pc
++);
7540 mod
= (modrm
>> 6) & 3;
7541 op
= (modrm
>> 3) & 7;
7547 gen_svm_check_intercept(s
, pc_start
, SVM_EXIT_GDTR_READ
);
7548 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
7549 tcg_gen_ld32u_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
, gdt
.limit
));
7550 gen_op_st_T0_A0(OT_WORD
+ s
->mem_index
);
7551 gen_add_A0_im(s
, 2);
7552 tcg_gen_ld_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
, gdt
.base
));
7554 gen_op_andl_T0_im(0xffffff);
7555 gen_op_st_T0_A0(CODE64(s
) + OT_LONG
+ s
->mem_index
);
7560 case 0: /* monitor */
7561 if (!(s
->cpuid_ext_features
& CPUID_EXT_MONITOR
) ||
7564 gen_update_cc_op(s
);
7565 gen_jmp_im(pc_start
- s
->cs_base
);
7566 #ifdef TARGET_X86_64
7567 if (s
->aflag
== 2) {
7568 gen_op_movq_A0_reg(R_EAX
);
7572 gen_op_movl_A0_reg(R_EAX
);
7574 gen_op_andl_A0_ffff();
7576 gen_add_A0_ds_seg(s
);
7577 gen_helper_monitor(cpu_env
, cpu_A0
);
7580 if (!(s
->cpuid_ext_features
& CPUID_EXT_MONITOR
) ||
7583 gen_update_cc_op(s
);
7584 gen_jmp_im(pc_start
- s
->cs_base
);
7585 gen_helper_mwait(cpu_env
, tcg_const_i32(s
->pc
- pc_start
));
7589 if (!(s
->cpuid_7_0_ebx_features
& CPUID_7_0_EBX_SMAP
) ||
7593 gen_helper_clac(cpu_env
);
7594 gen_jmp_im(s
->pc
- s
->cs_base
);
7598 if (!(s
->cpuid_7_0_ebx_features
& CPUID_7_0_EBX_SMAP
) ||
7602 gen_helper_stac(cpu_env
);
7603 gen_jmp_im(s
->pc
- s
->cs_base
);
7610 gen_svm_check_intercept(s
, pc_start
, SVM_EXIT_IDTR_READ
);
7611 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
7612 tcg_gen_ld32u_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
, idt
.limit
));
7613 gen_op_st_T0_A0(OT_WORD
+ s
->mem_index
);
7614 gen_add_A0_im(s
, 2);
7615 tcg_gen_ld_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
, idt
.base
));
7617 gen_op_andl_T0_im(0xffffff);
7618 gen_op_st_T0_A0(CODE64(s
) + OT_LONG
+ s
->mem_index
);
7624 gen_update_cc_op(s
);
7625 gen_jmp_im(pc_start
- s
->cs_base
);
7628 if (!(s
->flags
& HF_SVME_MASK
) || !s
->pe
)
7631 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7634 gen_helper_vmrun(cpu_env
, tcg_const_i32(s
->aflag
),
7635 tcg_const_i32(s
->pc
- pc_start
));
7637 s
->is_jmp
= DISAS_TB_JUMP
;
7640 case 1: /* VMMCALL */
7641 if (!(s
->flags
& HF_SVME_MASK
))
7643 gen_helper_vmmcall(cpu_env
);
7645 case 2: /* VMLOAD */
7646 if (!(s
->flags
& HF_SVME_MASK
) || !s
->pe
)
7649 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7652 gen_helper_vmload(cpu_env
, tcg_const_i32(s
->aflag
));
7655 case 3: /* VMSAVE */
7656 if (!(s
->flags
& HF_SVME_MASK
) || !s
->pe
)
7659 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7662 gen_helper_vmsave(cpu_env
, tcg_const_i32(s
->aflag
));
7666 if ((!(s
->flags
& HF_SVME_MASK
) &&
7667 !(s
->cpuid_ext3_features
& CPUID_EXT3_SKINIT
)) ||
7671 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7674 gen_helper_stgi(cpu_env
);
7678 if (!(s
->flags
& HF_SVME_MASK
) || !s
->pe
)
7681 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7684 gen_helper_clgi(cpu_env
);
7687 case 6: /* SKINIT */
7688 if ((!(s
->flags
& HF_SVME_MASK
) &&
7689 !(s
->cpuid_ext3_features
& CPUID_EXT3_SKINIT
)) ||
7692 gen_helper_skinit(cpu_env
);
7694 case 7: /* INVLPGA */
7695 if (!(s
->flags
& HF_SVME_MASK
) || !s
->pe
)
7698 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7701 gen_helper_invlpga(cpu_env
, tcg_const_i32(s
->aflag
));
7707 } else if (s
->cpl
!= 0) {
7708 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7710 gen_svm_check_intercept(s
, pc_start
,
7711 op
==2 ? SVM_EXIT_GDTR_WRITE
: SVM_EXIT_IDTR_WRITE
);
7712 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
7713 gen_op_ld_T1_A0(OT_WORD
+ s
->mem_index
);
7714 gen_add_A0_im(s
, 2);
7715 gen_op_ld_T0_A0(CODE64(s
) + OT_LONG
+ s
->mem_index
);
7717 gen_op_andl_T0_im(0xffffff);
7719 tcg_gen_st_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,gdt
.base
));
7720 tcg_gen_st32_tl(cpu_T
[1], cpu_env
, offsetof(CPUX86State
,gdt
.limit
));
7722 tcg_gen_st_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,idt
.base
));
7723 tcg_gen_st32_tl(cpu_T
[1], cpu_env
, offsetof(CPUX86State
,idt
.limit
));
7728 gen_svm_check_intercept(s
, pc_start
, SVM_EXIT_READ_CR0
);
7729 #if defined TARGET_X86_64 && defined HOST_WORDS_BIGENDIAN
7730 tcg_gen_ld32u_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,cr
[0]) + 4);
7732 tcg_gen_ld32u_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,cr
[0]));
7734 gen_ldst_modrm(env
, s
, modrm
, OT_WORD
, OR_TMP0
, 1);
7738 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7740 gen_svm_check_intercept(s
, pc_start
, SVM_EXIT_WRITE_CR0
);
7741 gen_ldst_modrm(env
, s
, modrm
, OT_WORD
, OR_TMP0
, 0);
7742 gen_helper_lmsw(cpu_env
, cpu_T
[0]);
7743 gen_jmp_im(s
->pc
- s
->cs_base
);
7748 if (mod
!= 3) { /* invlpg */
7750 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7752 gen_update_cc_op(s
);
7753 gen_jmp_im(pc_start
- s
->cs_base
);
7754 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
7755 gen_helper_invlpg(cpu_env
, cpu_A0
);
7756 gen_jmp_im(s
->pc
- s
->cs_base
);
7761 case 0: /* swapgs */
7762 #ifdef TARGET_X86_64
7765 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7767 tcg_gen_ld_tl(cpu_T
[0], cpu_env
,
7768 offsetof(CPUX86State
,segs
[R_GS
].base
));
7769 tcg_gen_ld_tl(cpu_T
[1], cpu_env
,
7770 offsetof(CPUX86State
,kernelgsbase
));
7771 tcg_gen_st_tl(cpu_T
[1], cpu_env
,
7772 offsetof(CPUX86State
,segs
[R_GS
].base
));
7773 tcg_gen_st_tl(cpu_T
[0], cpu_env
,
7774 offsetof(CPUX86State
,kernelgsbase
));
7782 case 1: /* rdtscp */
7783 if (!(s
->cpuid_ext2_features
& CPUID_EXT2_RDTSCP
))
7785 gen_update_cc_op(s
);
7786 gen_jmp_im(pc_start
- s
->cs_base
);
7789 gen_helper_rdtscp(cpu_env
);
7792 gen_jmp(s
, s
->pc
- s
->cs_base
);
7804 case 0x108: /* invd */
7805 case 0x109: /* wbinvd */
7807 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7809 gen_svm_check_intercept(s
, pc_start
, (b
& 2) ? SVM_EXIT_INVD
: SVM_EXIT_WBINVD
);
7813 case 0x63: /* arpl or movslS (x86_64) */
7814 #ifdef TARGET_X86_64
7817 /* d_ot is the size of destination */
7818 d_ot
= dflag
+ OT_WORD
;
7820 modrm
= cpu_ldub_code(env
, s
->pc
++);
7821 reg
= ((modrm
>> 3) & 7) | rex_r
;
7822 mod
= (modrm
>> 6) & 3;
7823 rm
= (modrm
& 7) | REX_B(s
);
7826 gen_op_mov_TN_reg(OT_LONG
, 0, rm
);
7828 if (d_ot
== OT_QUAD
)
7829 tcg_gen_ext32s_tl(cpu_T
[0], cpu_T
[0]);
7830 gen_op_mov_reg_T0(d_ot
, reg
);
7832 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
7833 if (d_ot
== OT_QUAD
) {
7834 gen_op_lds_T0_A0(OT_LONG
+ s
->mem_index
);
7836 gen_op_ld_T0_A0(OT_LONG
+ s
->mem_index
);
7838 gen_op_mov_reg_T0(d_ot
, reg
);
7844 TCGv t0
, t1
, t2
, a0
;
7846 if (!s
->pe
|| s
->vm86
)
7848 t0
= tcg_temp_local_new();
7849 t1
= tcg_temp_local_new();
7850 t2
= tcg_temp_local_new();
7852 modrm
= cpu_ldub_code(env
, s
->pc
++);
7853 reg
= (modrm
>> 3) & 7;
7854 mod
= (modrm
>> 6) & 3;
7857 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
7858 gen_op_ld_v(ot
+ s
->mem_index
, t0
, cpu_A0
);
7859 a0
= tcg_temp_local_new();
7860 tcg_gen_mov_tl(a0
, cpu_A0
);
7862 gen_op_mov_v_reg(ot
, t0
, rm
);
7865 gen_op_mov_v_reg(ot
, t1
, reg
);
7866 tcg_gen_andi_tl(cpu_tmp0
, t0
, 3);
7867 tcg_gen_andi_tl(t1
, t1
, 3);
7868 tcg_gen_movi_tl(t2
, 0);
7869 label1
= gen_new_label();
7870 tcg_gen_brcond_tl(TCG_COND_GE
, cpu_tmp0
, t1
, label1
);
7871 tcg_gen_andi_tl(t0
, t0
, ~3);
7872 tcg_gen_or_tl(t0
, t0
, t1
);
7873 tcg_gen_movi_tl(t2
, CC_Z
);
7874 gen_set_label(label1
);
7876 gen_op_st_v(ot
+ s
->mem_index
, t0
, a0
);
7879 gen_op_mov_reg_v(ot
, rm
, t0
);
7881 gen_compute_eflags(s
);
7882 tcg_gen_andi_tl(cpu_cc_src
, cpu_cc_src
, ~CC_Z
);
7883 tcg_gen_or_tl(cpu_cc_src
, cpu_cc_src
, t2
);
7889 case 0x102: /* lar */
7890 case 0x103: /* lsl */
7894 if (!s
->pe
|| s
->vm86
)
7896 ot
= dflag
? OT_LONG
: OT_WORD
;
7897 modrm
= cpu_ldub_code(env
, s
->pc
++);
7898 reg
= ((modrm
>> 3) & 7) | rex_r
;
7899 gen_ldst_modrm(env
, s
, modrm
, OT_WORD
, OR_TMP0
, 0);
7900 t0
= tcg_temp_local_new();
7901 gen_update_cc_op(s
);
7903 gen_helper_lar(t0
, cpu_env
, cpu_T
[0]);
7905 gen_helper_lsl(t0
, cpu_env
, cpu_T
[0]);
7907 tcg_gen_andi_tl(cpu_tmp0
, cpu_cc_src
, CC_Z
);
7908 label1
= gen_new_label();
7909 tcg_gen_brcondi_tl(TCG_COND_EQ
, cpu_tmp0
, 0, label1
);
7910 gen_op_mov_reg_v(ot
, reg
, t0
);
7911 gen_set_label(label1
);
7912 set_cc_op(s
, CC_OP_EFLAGS
);
7917 modrm
= cpu_ldub_code(env
, s
->pc
++);
7918 mod
= (modrm
>> 6) & 3;
7919 op
= (modrm
>> 3) & 7;
7921 case 0: /* prefetchnta */
7922 case 1: /* prefetchnt0 */
7923 case 2: /* prefetchnt0 */
7924 case 3: /* prefetchnt0 */
7927 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
7928 /* nothing more to do */
7930 default: /* nop (multi byte) */
7931 gen_nop_modrm(env
, s
, modrm
);
7935 case 0x119 ... 0x11f: /* nop (multi byte) */
7936 modrm
= cpu_ldub_code(env
, s
->pc
++);
7937 gen_nop_modrm(env
, s
, modrm
);
7939 case 0x120: /* mov reg, crN */
7940 case 0x122: /* mov crN, reg */
7942 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7944 modrm
= cpu_ldub_code(env
, s
->pc
++);
7945 /* Ignore the mod bits (assume (modrm&0xc0)==0xc0).
7946 * AMD documentation (24594.pdf) and testing of
7947 * intel 386 and 486 processors all show that the mod bits
7948 * are assumed to be 1's, regardless of actual values.
7950 rm
= (modrm
& 7) | REX_B(s
);
7951 reg
= ((modrm
>> 3) & 7) | rex_r
;
7956 if ((prefixes
& PREFIX_LOCK
) && (reg
== 0) &&
7957 (s
->cpuid_ext3_features
& CPUID_EXT3_CR8LEG
)) {
7966 gen_update_cc_op(s
);
7967 gen_jmp_im(pc_start
- s
->cs_base
);
7969 gen_op_mov_TN_reg(ot
, 0, rm
);
7970 gen_helper_write_crN(cpu_env
, tcg_const_i32(reg
),
7972 gen_jmp_im(s
->pc
- s
->cs_base
);
7975 gen_helper_read_crN(cpu_T
[0], cpu_env
, tcg_const_i32(reg
));
7976 gen_op_mov_reg_T0(ot
, rm
);
7984 case 0x121: /* mov reg, drN */
7985 case 0x123: /* mov drN, reg */
7987 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
7989 modrm
= cpu_ldub_code(env
, s
->pc
++);
7990 /* Ignore the mod bits (assume (modrm&0xc0)==0xc0).
7991 * AMD documentation (24594.pdf) and testing of
7992 * intel 386 and 486 processors all show that the mod bits
7993 * are assumed to be 1's, regardless of actual values.
7995 rm
= (modrm
& 7) | REX_B(s
);
7996 reg
= ((modrm
>> 3) & 7) | rex_r
;
8001 /* XXX: do it dynamically with CR4.DE bit */
8002 if (reg
== 4 || reg
== 5 || reg
>= 8)
8005 gen_svm_check_intercept(s
, pc_start
, SVM_EXIT_WRITE_DR0
+ reg
);
8006 gen_op_mov_TN_reg(ot
, 0, rm
);
8007 gen_helper_movl_drN_T0(cpu_env
, tcg_const_i32(reg
), cpu_T
[0]);
8008 gen_jmp_im(s
->pc
- s
->cs_base
);
8011 gen_svm_check_intercept(s
, pc_start
, SVM_EXIT_READ_DR0
+ reg
);
8012 tcg_gen_ld_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
,dr
[reg
]));
8013 gen_op_mov_reg_T0(ot
, rm
);
8017 case 0x106: /* clts */
8019 gen_exception(s
, EXCP0D_GPF
, pc_start
- s
->cs_base
);
8021 gen_svm_check_intercept(s
, pc_start
, SVM_EXIT_WRITE_CR0
);
8022 gen_helper_clts(cpu_env
);
8023 /* abort block because static cpu state changed */
8024 gen_jmp_im(s
->pc
- s
->cs_base
);
8028 /* MMX/3DNow!/SSE/SSE2/SSE3/SSSE3/SSE4 support */
8029 case 0x1c3: /* MOVNTI reg, mem */
8030 if (!(s
->cpuid_features
& CPUID_SSE2
))
8032 ot
= s
->dflag
== 2 ? OT_QUAD
: OT_LONG
;
8033 modrm
= cpu_ldub_code(env
, s
->pc
++);
8034 mod
= (modrm
>> 6) & 3;
8037 reg
= ((modrm
>> 3) & 7) | rex_r
;
8038 /* generate a generic store */
8039 gen_ldst_modrm(env
, s
, modrm
, ot
, reg
, 1);
8042 modrm
= cpu_ldub_code(env
, s
->pc
++);
8043 mod
= (modrm
>> 6) & 3;
8044 op
= (modrm
>> 3) & 7;
8046 case 0: /* fxsave */
8047 if (mod
== 3 || !(s
->cpuid_features
& CPUID_FXSR
) ||
8048 (s
->prefix
& PREFIX_LOCK
))
8050 if ((s
->flags
& HF_EM_MASK
) || (s
->flags
& HF_TS_MASK
)) {
8051 gen_exception(s
, EXCP07_PREX
, pc_start
- s
->cs_base
);
8054 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
8055 gen_update_cc_op(s
);
8056 gen_jmp_im(pc_start
- s
->cs_base
);
8057 gen_helper_fxsave(cpu_env
, cpu_A0
, tcg_const_i32((s
->dflag
== 2)));
8059 case 1: /* fxrstor */
8060 if (mod
== 3 || !(s
->cpuid_features
& CPUID_FXSR
) ||
8061 (s
->prefix
& PREFIX_LOCK
))
8063 if ((s
->flags
& HF_EM_MASK
) || (s
->flags
& HF_TS_MASK
)) {
8064 gen_exception(s
, EXCP07_PREX
, pc_start
- s
->cs_base
);
8067 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
8068 gen_update_cc_op(s
);
8069 gen_jmp_im(pc_start
- s
->cs_base
);
8070 gen_helper_fxrstor(cpu_env
, cpu_A0
,
8071 tcg_const_i32((s
->dflag
== 2)));
8073 case 2: /* ldmxcsr */
8074 case 3: /* stmxcsr */
8075 if (s
->flags
& HF_TS_MASK
) {
8076 gen_exception(s
, EXCP07_PREX
, pc_start
- s
->cs_base
);
8079 if ((s
->flags
& HF_EM_MASK
) || !(s
->flags
& HF_OSFXSR_MASK
) ||
8082 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
8084 gen_op_ld_T0_A0(OT_LONG
+ s
->mem_index
);
8085 tcg_gen_trunc_tl_i32(cpu_tmp2_i32
, cpu_T
[0]);
8086 gen_helper_ldmxcsr(cpu_env
, cpu_tmp2_i32
);
8088 tcg_gen_ld32u_tl(cpu_T
[0], cpu_env
, offsetof(CPUX86State
, mxcsr
));
8089 gen_op_st_T0_A0(OT_LONG
+ s
->mem_index
);
8092 case 5: /* lfence */
8093 case 6: /* mfence */
8094 if ((modrm
& 0xc7) != 0xc0 || !(s
->cpuid_features
& CPUID_SSE2
))
8097 case 7: /* sfence / clflush */
8098 if ((modrm
& 0xc7) == 0xc0) {
8100 /* XXX: also check for cpuid_ext2_features & CPUID_EXT2_EMMX */
8101 if (!(s
->cpuid_features
& CPUID_SSE
))
8105 if (!(s
->cpuid_features
& CPUID_CLFLUSH
))
8107 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
8114 case 0x10d: /* 3DNow! prefetch(w) */
8115 modrm
= cpu_ldub_code(env
, s
->pc
++);
8116 mod
= (modrm
>> 6) & 3;
8119 gen_lea_modrm(env
, s
, modrm
, ®_addr
, &offset_addr
);
8120 /* ignore for now */
8122 case 0x1aa: /* rsm */
8123 gen_svm_check_intercept(s
, pc_start
, SVM_EXIT_RSM
);
8124 if (!(s
->flags
& HF_SMM_MASK
))
8126 gen_update_cc_op(s
);
8127 gen_jmp_im(s
->pc
- s
->cs_base
);
8128 gen_helper_rsm(cpu_env
);
8131 case 0x1b8: /* SSE4.2 popcnt */
8132 if ((prefixes
& (PREFIX_REPZ
| PREFIX_LOCK
| PREFIX_REPNZ
)) !=
8135 if (!(s
->cpuid_ext_features
& CPUID_EXT_POPCNT
))
8138 modrm
= cpu_ldub_code(env
, s
->pc
++);
8139 reg
= ((modrm
>> 3) & 7) | rex_r
;
8141 if (s
->prefix
& PREFIX_DATA
)
8143 else if (s
->dflag
!= 2)
8148 gen_ldst_modrm(env
, s
, modrm
, ot
, OR_TMP0
, 0);
8149 gen_helper_popcnt(cpu_T
[0], cpu_env
, cpu_T
[0], tcg_const_i32(ot
));
8150 gen_op_mov_reg_T0(ot
, reg
);
8152 set_cc_op(s
, CC_OP_EFLAGS
);
8154 case 0x10e ... 0x10f:
8155 /* 3DNow! instructions, ignore prefixes */
8156 s
->prefix
&= ~(PREFIX_REPZ
| PREFIX_REPNZ
| PREFIX_DATA
);
8157 case 0x110 ... 0x117:
8158 case 0x128 ... 0x12f:
8159 case 0x138 ... 0x13a:
8160 case 0x150 ... 0x179:
8161 case 0x17c ... 0x17f:
8163 case 0x1c4 ... 0x1c6:
8164 case 0x1d0 ... 0x1fe:
8165 gen_sse(env
, s
, b
, pc_start
, rex_r
);
8170 /* lock generation */
8171 if (s
->prefix
& PREFIX_LOCK
)
8172 gen_helper_unlock();
8175 if (s
->prefix
& PREFIX_LOCK
)
8176 gen_helper_unlock();
8177 /* XXX: ensure that no lock was generated */
8178 gen_exception(s
, EXCP06_ILLOP
, pc_start
- s
->cs_base
);
8182 void optimize_flags_init(void)
8184 cpu_env
= tcg_global_reg_new_ptr(TCG_AREG0
, "env");
8185 cpu_cc_op
= tcg_global_mem_new_i32(TCG_AREG0
,
8186 offsetof(CPUX86State
, cc_op
), "cc_op");
8187 cpu_cc_dst
= tcg_global_mem_new(TCG_AREG0
, offsetof(CPUX86State
, cc_dst
),
8189 cpu_cc_src
= tcg_global_mem_new(TCG_AREG0
, offsetof(CPUX86State
, cc_src
),
8191 cpu_cc_src2
= tcg_global_mem_new(TCG_AREG0
, offsetof(CPUX86State
, cc_src2
),
8194 #ifdef TARGET_X86_64
8195 cpu_regs
[R_EAX
] = tcg_global_mem_new_i64(TCG_AREG0
,
8196 offsetof(CPUX86State
, regs
[R_EAX
]), "rax");
8197 cpu_regs
[R_ECX
] = tcg_global_mem_new_i64(TCG_AREG0
,
8198 offsetof(CPUX86State
, regs
[R_ECX
]), "rcx");
8199 cpu_regs
[R_EDX
] = tcg_global_mem_new_i64(TCG_AREG0
,
8200 offsetof(CPUX86State
, regs
[R_EDX
]), "rdx");
8201 cpu_regs
[R_EBX
] = tcg_global_mem_new_i64(TCG_AREG0
,
8202 offsetof(CPUX86State
, regs
[R_EBX
]), "rbx");
8203 cpu_regs
[R_ESP
] = tcg_global_mem_new_i64(TCG_AREG0
,
8204 offsetof(CPUX86State
, regs
[R_ESP
]), "rsp");
8205 cpu_regs
[R_EBP
] = tcg_global_mem_new_i64(TCG_AREG0
,
8206 offsetof(CPUX86State
, regs
[R_EBP
]), "rbp");
8207 cpu_regs
[R_ESI
] = tcg_global_mem_new_i64(TCG_AREG0
,
8208 offsetof(CPUX86State
, regs
[R_ESI
]), "rsi");
8209 cpu_regs
[R_EDI
] = tcg_global_mem_new_i64(TCG_AREG0
,
8210 offsetof(CPUX86State
, regs
[R_EDI
]), "rdi");
8211 cpu_regs
[8] = tcg_global_mem_new_i64(TCG_AREG0
,
8212 offsetof(CPUX86State
, regs
[8]), "r8");
8213 cpu_regs
[9] = tcg_global_mem_new_i64(TCG_AREG0
,
8214 offsetof(CPUX86State
, regs
[9]), "r9");
8215 cpu_regs
[10] = tcg_global_mem_new_i64(TCG_AREG0
,
8216 offsetof(CPUX86State
, regs
[10]), "r10");
8217 cpu_regs
[11] = tcg_global_mem_new_i64(TCG_AREG0
,
8218 offsetof(CPUX86State
, regs
[11]), "r11");
8219 cpu_regs
[12] = tcg_global_mem_new_i64(TCG_AREG0
,
8220 offsetof(CPUX86State
, regs
[12]), "r12");
8221 cpu_regs
[13] = tcg_global_mem_new_i64(TCG_AREG0
,
8222 offsetof(CPUX86State
, regs
[13]), "r13");
8223 cpu_regs
[14] = tcg_global_mem_new_i64(TCG_AREG0
,
8224 offsetof(CPUX86State
, regs
[14]), "r14");
8225 cpu_regs
[15] = tcg_global_mem_new_i64(TCG_AREG0
,
8226 offsetof(CPUX86State
, regs
[15]), "r15");
8228 cpu_regs
[R_EAX
] = tcg_global_mem_new_i32(TCG_AREG0
,
8229 offsetof(CPUX86State
, regs
[R_EAX
]), "eax");
8230 cpu_regs
[R_ECX
] = tcg_global_mem_new_i32(TCG_AREG0
,
8231 offsetof(CPUX86State
, regs
[R_ECX
]), "ecx");
8232 cpu_regs
[R_EDX
] = tcg_global_mem_new_i32(TCG_AREG0
,
8233 offsetof(CPUX86State
, regs
[R_EDX
]), "edx");
8234 cpu_regs
[R_EBX
] = tcg_global_mem_new_i32(TCG_AREG0
,
8235 offsetof(CPUX86State
, regs
[R_EBX
]), "ebx");
8236 cpu_regs
[R_ESP
] = tcg_global_mem_new_i32(TCG_AREG0
,
8237 offsetof(CPUX86State
, regs
[R_ESP
]), "esp");
8238 cpu_regs
[R_EBP
] = tcg_global_mem_new_i32(TCG_AREG0
,
8239 offsetof(CPUX86State
, regs
[R_EBP
]), "ebp");
8240 cpu_regs
[R_ESI
] = tcg_global_mem_new_i32(TCG_AREG0
,
8241 offsetof(CPUX86State
, regs
[R_ESI
]), "esi");
8242 cpu_regs
[R_EDI
] = tcg_global_mem_new_i32(TCG_AREG0
,
8243 offsetof(CPUX86State
, regs
[R_EDI
]), "edi");
8246 /* register helpers */
8247 #define GEN_HELPER 2
8251 /* generate intermediate code in gen_opc_buf and gen_opparam_buf for
8252 basic block 'tb'. If search_pc is TRUE, also generate PC
8253 information for each intermediate instruction. */
8254 static inline void gen_intermediate_code_internal(X86CPU
*cpu
,
8255 TranslationBlock
*tb
,
8258 CPUState
*cs
= CPU(cpu
);
8259 CPUX86State
*env
= &cpu
->env
;
8260 DisasContext dc1
, *dc
= &dc1
;
8261 target_ulong pc_ptr
;
8262 uint16_t *gen_opc_end
;
8266 target_ulong pc_start
;
8267 target_ulong cs_base
;
8271 /* generate intermediate code */
8273 cs_base
= tb
->cs_base
;
8276 dc
->pe
= (flags
>> HF_PE_SHIFT
) & 1;
8277 dc
->code32
= (flags
>> HF_CS32_SHIFT
) & 1;
8278 dc
->ss32
= (flags
>> HF_SS32_SHIFT
) & 1;
8279 dc
->addseg
= (flags
>> HF_ADDSEG_SHIFT
) & 1;
8281 dc
->vm86
= (flags
>> VM_SHIFT
) & 1;
8282 dc
->cpl
= (flags
>> HF_CPL_SHIFT
) & 3;
8283 dc
->iopl
= (flags
>> IOPL_SHIFT
) & 3;
8284 dc
->tf
= (flags
>> TF_SHIFT
) & 1;
8285 dc
->singlestep_enabled
= cs
->singlestep_enabled
;
8286 dc
->cc_op
= CC_OP_DYNAMIC
;
8287 dc
->cc_op_dirty
= false;
8288 dc
->cs_base
= cs_base
;
8290 dc
->popl_esp_hack
= 0;
8291 /* select memory access functions */
8293 if (flags
& HF_SOFTMMU_MASK
) {
8294 dc
->mem_index
= (cpu_mmu_index(env
) + 1) << 2;
8296 dc
->cpuid_features
= env
->features
[FEAT_1_EDX
];
8297 dc
->cpuid_ext_features
= env
->features
[FEAT_1_ECX
];
8298 dc
->cpuid_ext2_features
= env
->features
[FEAT_8000_0001_EDX
];
8299 dc
->cpuid_ext3_features
= env
->features
[FEAT_8000_0001_ECX
];
8300 dc
->cpuid_7_0_ebx_features
= env
->features
[FEAT_7_0_EBX
];
8301 #ifdef TARGET_X86_64
8302 dc
->lma
= (flags
>> HF_LMA_SHIFT
) & 1;
8303 dc
->code64
= (flags
>> HF_CS64_SHIFT
) & 1;
8306 dc
->jmp_opt
= !(dc
->tf
|| cs
->singlestep_enabled
||
8307 (flags
& HF_INHIBIT_IRQ_MASK
)
8308 #ifndef CONFIG_SOFTMMU
8309 || (flags
& HF_SOFTMMU_MASK
)
8313 /* check addseg logic */
8314 if (!dc
->addseg
&& (dc
->vm86
|| !dc
->pe
|| !dc
->code32
))
8315 printf("ERROR addseg\n");
8318 cpu_T
[0] = tcg_temp_new();
8319 cpu_T
[1] = tcg_temp_new();
8320 cpu_A0
= tcg_temp_new();
8322 cpu_tmp0
= tcg_temp_new();
8323 cpu_tmp1_i64
= tcg_temp_new_i64();
8324 cpu_tmp2_i32
= tcg_temp_new_i32();
8325 cpu_tmp3_i32
= tcg_temp_new_i32();
8326 cpu_tmp4
= tcg_temp_new();
8327 cpu_ptr0
= tcg_temp_new_ptr();
8328 cpu_ptr1
= tcg_temp_new_ptr();
8329 cpu_cc_srcT
= tcg_temp_local_new();
8331 gen_opc_end
= tcg_ctx
.gen_opc_buf
+ OPC_MAX_SIZE
;
8333 dc
->is_jmp
= DISAS_NEXT
;
8337 max_insns
= tb
->cflags
& CF_COUNT_MASK
;
8339 max_insns
= CF_COUNT_MASK
;
8343 if (unlikely(!QTAILQ_EMPTY(&env
->breakpoints
))) {
8344 QTAILQ_FOREACH(bp
, &env
->breakpoints
, entry
) {
8345 if (bp
->pc
== pc_ptr
&&
8346 !((bp
->flags
& BP_CPU
) && (tb
->flags
& HF_RF_MASK
))) {
8347 gen_debug(dc
, pc_ptr
- dc
->cs_base
);
8353 j
= tcg_ctx
.gen_opc_ptr
- tcg_ctx
.gen_opc_buf
;
8357 tcg_ctx
.gen_opc_instr_start
[lj
++] = 0;
8359 tcg_ctx
.gen_opc_pc
[lj
] = pc_ptr
;
8360 gen_opc_cc_op
[lj
] = dc
->cc_op
;
8361 tcg_ctx
.gen_opc_instr_start
[lj
] = 1;
8362 tcg_ctx
.gen_opc_icount
[lj
] = num_insns
;
8364 if (num_insns
+ 1 == max_insns
&& (tb
->cflags
& CF_LAST_IO
))
8367 pc_ptr
= disas_insn(env
, dc
, pc_ptr
);
8369 /* stop translation if indicated */
8372 /* if single step mode, we generate only one instruction and
8373 generate an exception */
8374 /* if irq were inhibited with HF_INHIBIT_IRQ_MASK, we clear
8375 the flag and abort the translation to give the irqs a
8376 change to be happen */
8377 if (dc
->tf
|| dc
->singlestep_enabled
||
8378 (flags
& HF_INHIBIT_IRQ_MASK
)) {
8379 gen_jmp_im(pc_ptr
- dc
->cs_base
);
8383 /* if too long translation, stop generation too */
8384 if (tcg_ctx
.gen_opc_ptr
>= gen_opc_end
||
8385 (pc_ptr
- pc_start
) >= (TARGET_PAGE_SIZE
- 32) ||
8386 num_insns
>= max_insns
) {
8387 gen_jmp_im(pc_ptr
- dc
->cs_base
);
8392 gen_jmp_im(pc_ptr
- dc
->cs_base
);
8397 if (tb
->cflags
& CF_LAST_IO
)
8399 gen_tb_end(tb
, num_insns
);
8400 *tcg_ctx
.gen_opc_ptr
= INDEX_op_end
;
8401 /* we don't forget to fill the last values */
8403 j
= tcg_ctx
.gen_opc_ptr
- tcg_ctx
.gen_opc_buf
;
8406 tcg_ctx
.gen_opc_instr_start
[lj
++] = 0;
8410 if (qemu_loglevel_mask(CPU_LOG_TB_IN_ASM
)) {
8412 qemu_log("----------------\n");
8413 qemu_log("IN: %s\n", lookup_symbol(pc_start
));
8414 #ifdef TARGET_X86_64
8419 disas_flags
= !dc
->code32
;
8420 log_target_disas(env
, pc_start
, pc_ptr
- pc_start
, disas_flags
);
8426 tb
->size
= pc_ptr
- pc_start
;
8427 tb
->icount
= num_insns
;
8431 void gen_intermediate_code(CPUX86State
*env
, TranslationBlock
*tb
)
8433 gen_intermediate_code_internal(x86_env_get_cpu(env
), tb
, false);
8436 void gen_intermediate_code_pc(CPUX86State
*env
, TranslationBlock
*tb
)
8438 gen_intermediate_code_internal(x86_env_get_cpu(env
), tb
, true);
8441 void restore_state_to_opc(CPUX86State
*env
, TranslationBlock
*tb
, int pc_pos
)
8445 if (qemu_loglevel_mask(CPU_LOG_TB_OP
)) {
8447 qemu_log("RESTORE:\n");
8448 for(i
= 0;i
<= pc_pos
; i
++) {
8449 if (tcg_ctx
.gen_opc_instr_start
[i
]) {
8450 qemu_log("0x%04x: " TARGET_FMT_lx
"\n", i
,
8451 tcg_ctx
.gen_opc_pc
[i
]);
8454 qemu_log("pc_pos=0x%x eip=" TARGET_FMT_lx
" cs_base=%x\n",
8455 pc_pos
, tcg_ctx
.gen_opc_pc
[pc_pos
] - tb
->cs_base
,
8456 (uint32_t)tb
->cs_base
);
8459 env
->eip
= tcg_ctx
.gen_opc_pc
[pc_pos
] - tb
->cs_base
;
8460 cc_op
= gen_opc_cc_op
[pc_pos
];
8461 if (cc_op
!= CC_OP_DYNAMIC
)