target-i386: Use CC_SRC2 for ADC and SBB
[qemu/ar7.git] / target-i386 / translate.c
blob: f667f9333bfe95bb9a017c60d5fedab1cd43ff55
1 /*
2 * i386 translation
4 * Copyright (c) 2003 Fabrice Bellard
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
19 #include <stdarg.h>
20 #include <stdlib.h>
21 #include <stdio.h>
22 #include <string.h>
23 #include <inttypes.h>
24 #include <signal.h>
26 #include "qemu/host-utils.h"
27 #include "cpu.h"
28 #include "disas/disas.h"
29 #include "tcg-op.h"
31 #include "helper.h"
32 #define GEN_HELPER 1
33 #include "helper.h"
35 #define PREFIX_REPZ 0x01
36 #define PREFIX_REPNZ 0x02
37 #define PREFIX_LOCK 0x04
38 #define PREFIX_DATA 0x08
39 #define PREFIX_ADR 0x10
41 #ifdef TARGET_X86_64
42 #define CODE64(s) ((s)->code64)
43 #define REX_X(s) ((s)->rex_x)
44 #define REX_B(s) ((s)->rex_b)
45 #else
46 #define CODE64(s) 0
47 #define REX_X(s) 0
48 #define REX_B(s) 0
49 #endif
51 #ifdef TARGET_X86_64
52 # define ctztl ctz64
53 # define clztl clz64
54 #else
55 # define ctztl ctz32
56 # define clztl clz32
57 #endif
59 //#define MACRO_TEST 1
61 /* global register indexes */
62 static TCGv_ptr cpu_env;
63 static TCGv cpu_A0;
64 static TCGv cpu_cc_dst, cpu_cc_src, cpu_cc_src2, cpu_cc_srcT;
65 static TCGv_i32 cpu_cc_op;
66 static TCGv cpu_regs[CPU_NB_REGS];
67 /* local temps */
68 static TCGv cpu_T[2];
69 /* local register indexes (only used inside old micro ops) */
70 static TCGv cpu_tmp0, cpu_tmp4;
71 static TCGv_ptr cpu_ptr0, cpu_ptr1;
72 static TCGv_i32 cpu_tmp2_i32, cpu_tmp3_i32;
73 static TCGv_i64 cpu_tmp1_i64;
74 static TCGv cpu_tmp5;
76 static uint8_t gen_opc_cc_op[OPC_BUF_SIZE];
78 #include "exec/gen-icount.h"
80 #ifdef TARGET_X86_64
81 static int x86_64_hregs;
82 #endif
84 typedef struct DisasContext {
85 /* current insn context */
86 int override; /* -1 if no override */
87 int prefix;
88 int aflag, dflag;
89 target_ulong pc; /* pc = eip + cs_base */
90 int is_jmp; /* 1 means jump (stop translation), 2 means CPU
91 static state change (stop translation) */
92 /* current block context */
93 target_ulong cs_base; /* base of CS segment */
94 int pe; /* protected mode */
95 int code32; /* 32 bit code segment */
96 #ifdef TARGET_X86_64
97 int lma; /* long mode active */
98 int code64; /* 64 bit code segment */
99 int rex_x, rex_b;
100 #endif
101 int ss32; /* 32 bit stack segment */
102 CCOp cc_op; /* current CC operation */
103 bool cc_op_dirty;
104 int addseg; /* non zero if either DS/ES/SS have a non zero base */
105 int f_st; /* currently unused */
106 int vm86; /* vm86 mode */
107 int cpl;
108 int iopl;
109 int tf; /* TF cpu flag */
110 int singlestep_enabled; /* "hardware" single step enabled */
111 int jmp_opt; /* use direct block chaining for direct jumps */
112 int mem_index; /* select memory access functions */
113 uint64_t flags; /* all execution flags */
114 struct TranslationBlock *tb;
115 int popl_esp_hack; /* for correct popl with esp base handling */
116 int rip_offset; /* only used in x86_64, but left for simplicity */
117 int cpuid_features;
118 int cpuid_ext_features;
119 int cpuid_ext2_features;
120 int cpuid_ext3_features;
121 int cpuid_7_0_ebx_features;
122 } DisasContext;
124 static void gen_eob(DisasContext *s);
125 static void gen_jmp(DisasContext *s, target_ulong eip);
126 static void gen_jmp_tb(DisasContext *s, target_ulong eip, int tb_num);
127 static void gen_op(DisasContext *s1, int op, int ot, int d);
129 /* i386 arith/logic operations */
130 enum {
131 OP_ADDL,
132 OP_ORL,
133 OP_ADCL,
134 OP_SBBL,
135 OP_ANDL,
136 OP_SUBL,
137 OP_XORL,
138 OP_CMPL,
141 /* i386 shift ops */
142 enum {
143 OP_ROL,
144 OP_ROR,
145 OP_RCL,
146 OP_RCR,
147 OP_SHL,
148 OP_SHR,
149 OP_SHL1, /* undocumented */
150 OP_SAR = 7,
153 enum {
154 JCC_O,
155 JCC_B,
156 JCC_Z,
157 JCC_BE,
158 JCC_S,
159 JCC_P,
160 JCC_L,
161 JCC_LE,
164 /* operand size */
165 enum {
166 OT_BYTE = 0,
167 OT_WORD,
168 OT_LONG,
169 OT_QUAD,
172 enum {
173 /* I386 int registers */
174 OR_EAX, /* MUST be even numbered */
175 OR_ECX,
176 OR_EDX,
177 OR_EBX,
178 OR_ESP,
179 OR_EBP,
180 OR_ESI,
181 OR_EDI,
183 OR_TMP0 = 16, /* temporary operand register */
184 OR_TMP1,
185 OR_A0, /* temporary register used when doing address evaluation */
188 enum {
189 USES_CC_DST = 1,
190 USES_CC_SRC = 2,
191 USES_CC_SRC2 = 4,
192 USES_CC_SRCT = 8,
195 /* Bit set if the global variable is live after setting CC_OP to X. */
196 static const uint8_t cc_op_live[CC_OP_NB] = {
197 [CC_OP_DYNAMIC] = USES_CC_DST | USES_CC_SRC | USES_CC_SRC2,
198 [CC_OP_EFLAGS] = USES_CC_SRC,
199 [CC_OP_MULB ... CC_OP_MULQ] = USES_CC_DST | USES_CC_SRC,
200 [CC_OP_ADDB ... CC_OP_ADDQ] = USES_CC_DST | USES_CC_SRC,
201 [CC_OP_ADCB ... CC_OP_ADCQ] = USES_CC_DST | USES_CC_SRC | USES_CC_SRC2,
202 [CC_OP_SUBB ... CC_OP_SUBQ] = USES_CC_DST | USES_CC_SRC | USES_CC_SRCT,
203 [CC_OP_SBBB ... CC_OP_SBBQ] = USES_CC_DST | USES_CC_SRC | USES_CC_SRC2,
204 [CC_OP_LOGICB ... CC_OP_LOGICQ] = USES_CC_DST,
205 [CC_OP_INCB ... CC_OP_INCQ] = USES_CC_DST | USES_CC_SRC,
206 [CC_OP_DECB ... CC_OP_DECQ] = USES_CC_DST | USES_CC_SRC,
207 [CC_OP_SHLB ... CC_OP_SHLQ] = USES_CC_DST | USES_CC_SRC,
208 [CC_OP_SARB ... CC_OP_SARQ] = USES_CC_DST | USES_CC_SRC,
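/* Example: lowering CC_OP_ADCB (DST, SRC and SRC2 live) to
 CC_OP_ADDB (only DST and SRC live) leaves SRC2 dead, so set_cc_op()
 below may discard cpu_cc_src2. */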
211 static void set_cc_op(DisasContext *s, CCOp op)
213 int dead;
215 if (s->cc_op == op) {
216 return;
219 /* Discard CC computation that will no longer be used. */
220 dead = cc_op_live[s->cc_op] & ~cc_op_live[op];
221 if (dead & USES_CC_DST) {
222 tcg_gen_discard_tl(cpu_cc_dst);
224 if (dead & USES_CC_SRC) {
225 tcg_gen_discard_tl(cpu_cc_src);
227 if (dead & USES_CC_SRC2) {
228 tcg_gen_discard_tl(cpu_cc_src2);
230 if (dead & USES_CC_SRCT) {
231 tcg_gen_discard_tl(cpu_cc_srcT);
234 s->cc_op = op;
235 /* The DYNAMIC setting is translator only, and should never be
236 stored. Thus we always consider it clean. */
237 s->cc_op_dirty = (op != CC_OP_DYNAMIC);
240 static void gen_update_cc_op(DisasContext *s)
242 if (s->cc_op_dirty) {
243 tcg_gen_movi_i32(cpu_cc_op, s->cc_op);
244 s->cc_op_dirty = false;
248 static inline void gen_op_movl_T0_0(void)
250 tcg_gen_movi_tl(cpu_T[0], 0);
253 static inline void gen_op_movl_T0_im(int32_t val)
255 tcg_gen_movi_tl(cpu_T[0], val);
258 static inline void gen_op_movl_T0_imu(uint32_t val)
260 tcg_gen_movi_tl(cpu_T[0], val);
263 static inline void gen_op_movl_T1_im(int32_t val)
265 tcg_gen_movi_tl(cpu_T[1], val);
268 static inline void gen_op_movl_T1_imu(uint32_t val)
270 tcg_gen_movi_tl(cpu_T[1], val);
273 static inline void gen_op_movl_A0_im(uint32_t val)
275 tcg_gen_movi_tl(cpu_A0, val);
278 #ifdef TARGET_X86_64
279 static inline void gen_op_movq_A0_im(int64_t val)
281 tcg_gen_movi_tl(cpu_A0, val);
283 #endif
285 static inline void gen_movtl_T0_im(target_ulong val)
287 tcg_gen_movi_tl(cpu_T[0], val);
290 static inline void gen_movtl_T1_im(target_ulong val)
292 tcg_gen_movi_tl(cpu_T[1], val);
295 static inline void gen_op_andl_T0_ffff(void)
297 tcg_gen_andi_tl(cpu_T[0], cpu_T[0], 0xffff);
300 static inline void gen_op_andl_T0_im(uint32_t val)
302 tcg_gen_andi_tl(cpu_T[0], cpu_T[0], val);
305 static inline void gen_op_movl_T0_T1(void)
307 tcg_gen_mov_tl(cpu_T[0], cpu_T[1]);
310 static inline void gen_op_andl_A0_ffff(void)
312 tcg_gen_andi_tl(cpu_A0, cpu_A0, 0xffff);
315 #ifdef TARGET_X86_64
317 #define NB_OP_SIZES 4
319 #else /* !TARGET_X86_64 */
321 #define NB_OP_SIZES 3
323 #endif /* !TARGET_X86_64 */
325 #if defined(HOST_WORDS_BIGENDIAN)
326 #define REG_B_OFFSET (sizeof(target_ulong) - 1)
327 #define REG_H_OFFSET (sizeof(target_ulong) - 2)
328 #define REG_W_OFFSET (sizeof(target_ulong) - 2)
329 #define REG_L_OFFSET (sizeof(target_ulong) - 4)
330 #define REG_LH_OFFSET (sizeof(target_ulong) - 8)
331 #else
332 #define REG_B_OFFSET 0
333 #define REG_H_OFFSET 1
334 #define REG_W_OFFSET 0
335 #define REG_L_OFFSET 0
336 #define REG_LH_OFFSET 4
337 #endif
339 /* In instruction encodings for byte register accesses the
340 * register number usually indicates "low 8 bits of register N";
341 * however there are some special cases where N 4..7 indicates
342 * [AH, CH, DH, BH], ie "bits 15..8 of register N-4". Return
343 * true for this special case, false otherwise.
345 static inline bool byte_reg_is_xH(int reg)
347 if (reg < 4) {
348 return false;
350 #ifdef TARGET_X86_64
351 if (reg >= 8 || x86_64_hregs) {
352 return false;
354 #endif
355 return true;
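/* E.g. reg 4 selects AH in legacy encodings, but when a REX prefix
 is present (x86_64_hregs) reg 4 selects SPL instead, which is a
 low-byte register, not an xH one. */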
358 static inline void gen_op_mov_reg_v(int ot, int reg, TCGv t0)
360 switch(ot) {
361 case OT_BYTE:
362 if (!byte_reg_is_xH(reg)) {
363 tcg_gen_deposit_tl(cpu_regs[reg], cpu_regs[reg], t0, 0, 8);
364 } else {
365 tcg_gen_deposit_tl(cpu_regs[reg - 4], cpu_regs[reg - 4], t0, 8, 8);
367 break;
368 case OT_WORD:
369 tcg_gen_deposit_tl(cpu_regs[reg], cpu_regs[reg], t0, 0, 16);
370 break;
371 default: /* XXX this shouldn't be reached; abort? */
372 case OT_LONG:
373 /* For x86_64, this sets the higher half of register to zero.
374 For i386, this is equivalent to a mov. */
375 tcg_gen_ext32u_tl(cpu_regs[reg], t0);
376 break;
377 #ifdef TARGET_X86_64
378 case OT_QUAD:
379 tcg_gen_mov_tl(cpu_regs[reg], t0);
380 break;
381 #endif
385 static inline void gen_op_mov_reg_T0(int ot, int reg)
387 gen_op_mov_reg_v(ot, reg, cpu_T[0]);
390 static inline void gen_op_mov_reg_T1(int ot, int reg)
392 gen_op_mov_reg_v(ot, reg, cpu_T[1]);
395 static inline void gen_op_mov_reg_A0(int size, int reg)
397 switch(size) {
398 case OT_BYTE:
399 tcg_gen_deposit_tl(cpu_regs[reg], cpu_regs[reg], cpu_A0, 0, 16);
400 break;
401 default: /* XXX this shouldn't be reached; abort? */
402 case OT_WORD:
403 /* For x86_64, this sets the higher half of register to zero.
404 For i386, this is equivalent to a mov. */
405 tcg_gen_ext32u_tl(cpu_regs[reg], cpu_A0);
406 break;
407 #ifdef TARGET_X86_64
408 case OT_LONG:
409 tcg_gen_mov_tl(cpu_regs[reg], cpu_A0);
410 break;
411 #endif
415 static inline void gen_op_mov_v_reg(int ot, TCGv t0, int reg)
417 if (ot == OT_BYTE && byte_reg_is_xH(reg)) {
418 tcg_gen_shri_tl(t0, cpu_regs[reg - 4], 8);
419 tcg_gen_ext8u_tl(t0, t0);
420 } else {
421 tcg_gen_mov_tl(t0, cpu_regs[reg]);
425 static inline void gen_op_mov_TN_reg(int ot, int t_index, int reg)
427 gen_op_mov_v_reg(ot, cpu_T[t_index], reg);
430 static inline void gen_op_movl_A0_reg(int reg)
432 tcg_gen_mov_tl(cpu_A0, cpu_regs[reg]);
435 static inline void gen_op_addl_A0_im(int32_t val)
437 tcg_gen_addi_tl(cpu_A0, cpu_A0, val);
438 #ifdef TARGET_X86_64
439 tcg_gen_andi_tl(cpu_A0, cpu_A0, 0xffffffff);
440 #endif
443 #ifdef TARGET_X86_64
444 static inline void gen_op_addq_A0_im(int64_t val)
446 tcg_gen_addi_tl(cpu_A0, cpu_A0, val);
448 #endif
450 static void gen_add_A0_im(DisasContext *s, int val)
452 #ifdef TARGET_X86_64
453 if (CODE64(s))
454 gen_op_addq_A0_im(val);
455 else
456 #endif
457 gen_op_addl_A0_im(val);
460 static inline void gen_op_addl_T0_T1(void)
462 tcg_gen_add_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
465 static inline void gen_op_jmp_T0(void)
467 tcg_gen_st_tl(cpu_T[0], cpu_env, offsetof(CPUX86State, eip));
470 static inline void gen_op_add_reg_im(int size, int reg, int32_t val)
472 switch(size) {
473 case OT_BYTE:
474 tcg_gen_addi_tl(cpu_tmp0, cpu_regs[reg], val);
475 tcg_gen_deposit_tl(cpu_regs[reg], cpu_regs[reg], cpu_tmp0, 0, 16);
476 break;
477 case OT_WORD:
478 tcg_gen_addi_tl(cpu_tmp0, cpu_regs[reg], val);
479 /* For x86_64, this sets the higher half of register to zero.
480 For i386, this is equivalent to a nop. */
481 tcg_gen_ext32u_tl(cpu_tmp0, cpu_tmp0);
482 tcg_gen_mov_tl(cpu_regs[reg], cpu_tmp0);
483 break;
484 #ifdef TARGET_X86_64
485 case OT_LONG:
486 tcg_gen_addi_tl(cpu_regs[reg], cpu_regs[reg], val);
487 break;
488 #endif
492 static inline void gen_op_add_reg_T0(int size, int reg)
494 switch(size) {
495 case OT_BYTE:
496 tcg_gen_add_tl(cpu_tmp0, cpu_regs[reg], cpu_T[0]);
497 tcg_gen_deposit_tl(cpu_regs[reg], cpu_regs[reg], cpu_tmp0, 0, 16);
498 break;
499 case OT_WORD:
500 tcg_gen_add_tl(cpu_tmp0, cpu_regs[reg], cpu_T[0]);
501 /* For x86_64, this sets the higher half of register to zero.
502 For i386, this is equivalent to a nop. */
503 tcg_gen_ext32u_tl(cpu_tmp0, cpu_tmp0);
504 tcg_gen_mov_tl(cpu_regs[reg], cpu_tmp0);
505 break;
506 #ifdef TARGET_X86_64
507 case OT_LONG:
508 tcg_gen_add_tl(cpu_regs[reg], cpu_regs[reg], cpu_T[0]);
509 break;
510 #endif
514 static inline void gen_op_addl_A0_reg_sN(int shift, int reg)
516 tcg_gen_mov_tl(cpu_tmp0, cpu_regs[reg]);
517 if (shift != 0)
518 tcg_gen_shli_tl(cpu_tmp0, cpu_tmp0, shift);
519 tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
520 /* For x86_64, this sets the higher half of register to zero.
521 For i386, this is equivalent to a nop. */
522 tcg_gen_ext32u_tl(cpu_A0, cpu_A0);
525 static inline void gen_op_movl_A0_seg(int reg)
527 tcg_gen_ld32u_tl(cpu_A0, cpu_env, offsetof(CPUX86State, segs[reg].base) + REG_L_OFFSET);
530 static inline void gen_op_addl_A0_seg(DisasContext *s, int reg)
532 tcg_gen_ld_tl(cpu_tmp0, cpu_env, offsetof(CPUX86State, segs[reg].base));
533 #ifdef TARGET_X86_64
534 if (CODE64(s)) {
535 tcg_gen_andi_tl(cpu_A0, cpu_A0, 0xffffffff);
536 tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
537 } else {
538 tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
539 tcg_gen_andi_tl(cpu_A0, cpu_A0, 0xffffffff);
541 #else
542 tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
543 #endif
546 #ifdef TARGET_X86_64
547 static inline void gen_op_movq_A0_seg(int reg)
549 tcg_gen_ld_tl(cpu_A0, cpu_env, offsetof(CPUX86State, segs[reg].base));
552 static inline void gen_op_addq_A0_seg(int reg)
554 tcg_gen_ld_tl(cpu_tmp0, cpu_env, offsetof(CPUX86State, segs[reg].base));
555 tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
558 static inline void gen_op_movq_A0_reg(int reg)
560 tcg_gen_mov_tl(cpu_A0, cpu_regs[reg]);
563 static inline void gen_op_addq_A0_reg_sN(int shift, int reg)
565 tcg_gen_mov_tl(cpu_tmp0, cpu_regs[reg]);
566 if (shift != 0)
567 tcg_gen_shli_tl(cpu_tmp0, cpu_tmp0, shift);
568 tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
570 #endif
572 static inline void gen_op_lds_T0_A0(int idx)
574 int mem_index = (idx >> 2) - 1;
575 switch(idx & 3) {
576 case OT_BYTE:
577 tcg_gen_qemu_ld8s(cpu_T[0], cpu_A0, mem_index);
578 break;
579 case OT_WORD:
580 tcg_gen_qemu_ld16s(cpu_T[0], cpu_A0, mem_index);
581 break;
582 default:
583 case OT_LONG:
584 tcg_gen_qemu_ld32s(cpu_T[0], cpu_A0, mem_index);
585 break;
589 static inline void gen_op_ld_v(int idx, TCGv t0, TCGv a0)
591 int mem_index = (idx >> 2) - 1;
592 switch(idx & 3) {
593 case OT_BYTE:
594 tcg_gen_qemu_ld8u(t0, a0, mem_index);
595 break;
596 case OT_WORD:
597 tcg_gen_qemu_ld16u(t0, a0, mem_index);
598 break;
599 case OT_LONG:
600 tcg_gen_qemu_ld32u(t0, a0, mem_index);
601 break;
602 default:
603 case OT_QUAD:
604 /* Should never happen on 32-bit targets. */
605 #ifdef TARGET_X86_64
606 tcg_gen_qemu_ld64(t0, a0, mem_index);
607 #endif
608 break;
612 /* XXX: always use ldu or lds */
613 static inline void gen_op_ld_T0_A0(int idx)
615 gen_op_ld_v(idx, cpu_T[0], cpu_A0);
618 static inline void gen_op_ldu_T0_A0(int idx)
620 gen_op_ld_v(idx, cpu_T[0], cpu_A0);
623 static inline void gen_op_ld_T1_A0(int idx)
625 gen_op_ld_v(idx, cpu_T[1], cpu_A0);
628 static inline void gen_op_st_v(int idx, TCGv t0, TCGv a0)
630 int mem_index = (idx >> 2) - 1;
631 switch(idx & 3) {
632 case OT_BYTE:
633 tcg_gen_qemu_st8(t0, a0, mem_index);
634 break;
635 case OT_WORD:
636 tcg_gen_qemu_st16(t0, a0, mem_index);
637 break;
638 case OT_LONG:
639 tcg_gen_qemu_st32(t0, a0, mem_index);
640 break;
641 default:
642 case OT_QUAD:
643 /* Should never happen on 32-bit targets. */
644 #ifdef TARGET_X86_64
645 tcg_gen_qemu_st64(t0, a0, mem_index);
646 #endif
647 break;
651 static inline void gen_op_st_T0_A0(int idx)
653 gen_op_st_v(idx, cpu_T[0], cpu_A0);
656 static inline void gen_op_st_T1_A0(int idx)
658 gen_op_st_v(idx, cpu_T[1], cpu_A0);
661 static inline void gen_jmp_im(target_ulong pc)
663 tcg_gen_movi_tl(cpu_tmp0, pc);
664 tcg_gen_st_tl(cpu_tmp0, cpu_env, offsetof(CPUX86State, eip));
667 static inline void gen_string_movl_A0_ESI(DisasContext *s)
669 int override;
671 override = s->override;
672 #ifdef TARGET_X86_64
673 if (s->aflag == 2) {
674 if (override >= 0) {
675 gen_op_movq_A0_seg(override);
676 gen_op_addq_A0_reg_sN(0, R_ESI);
677 } else {
678 gen_op_movq_A0_reg(R_ESI);
680 } else
681 #endif
682 if (s->aflag) {
683 /* 32 bit address */
684 if (s->addseg && override < 0)
685 override = R_DS;
686 if (override >= 0) {
687 gen_op_movl_A0_seg(override);
688 gen_op_addl_A0_reg_sN(0, R_ESI);
689 } else {
690 gen_op_movl_A0_reg(R_ESI);
692 } else {
693 /* 16 bit address, always override */
694 if (override < 0)
695 override = R_DS;
696 gen_op_movl_A0_reg(R_ESI);
697 gen_op_andl_A0_ffff();
698 gen_op_addl_A0_seg(s, override);
702 static inline void gen_string_movl_A0_EDI(DisasContext *s)
704 #ifdef TARGET_X86_64
705 if (s->aflag == 2) {
706 gen_op_movq_A0_reg(R_EDI);
707 } else
708 #endif
709 if (s->aflag) {
710 if (s->addseg) {
711 gen_op_movl_A0_seg(R_ES);
712 gen_op_addl_A0_reg_sN(0, R_EDI);
713 } else {
714 gen_op_movl_A0_reg(R_EDI);
716 } else {
717 gen_op_movl_A0_reg(R_EDI);
718 gen_op_andl_A0_ffff();
719 gen_op_addl_A0_seg(s, R_ES);
723 static inline void gen_op_movl_T0_Dshift(int ot)
725 tcg_gen_ld32s_tl(cpu_T[0], cpu_env, offsetof(CPUX86State, df));
726 tcg_gen_shli_tl(cpu_T[0], cpu_T[0], ot);
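/* env->df holds the direction flag as +1 or -1, so shifting it left
 by 'ot' yields the signed per-element step for string ops, e.g.
 +/-2 for OT_WORD. */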
729 static TCGv gen_ext_tl(TCGv dst, TCGv src, int size, bool sign)
731 switch (size) {
732 case OT_BYTE:
733 if (sign) {
734 tcg_gen_ext8s_tl(dst, src);
735 } else {
736 tcg_gen_ext8u_tl(dst, src);
738 return dst;
739 case OT_WORD:
740 if (sign) {
741 tcg_gen_ext16s_tl(dst, src);
742 } else {
743 tcg_gen_ext16u_tl(dst, src);
745 return dst;
746 #ifdef TARGET_X86_64
747 case OT_LONG:
748 if (sign) {
749 tcg_gen_ext32s_tl(dst, src);
750 } else {
751 tcg_gen_ext32u_tl(dst, src);
753 return dst;
754 #endif
755 default:
756 return src;
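/* Note: for the full-width case gen_ext_tl() returns 'src' itself
 rather than copying into 'dst'; callers that need a private copy
 must check for aliasing, as gen_prepare_eflags_c() does with
 TCGV_EQUAL. */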
760 static void gen_extu(int ot, TCGv reg)
762 gen_ext_tl(reg, reg, ot, false);
765 static void gen_exts(int ot, TCGv reg)
767 gen_ext_tl(reg, reg, ot, true);
770 static inline void gen_op_jnz_ecx(int size, int label1)
772 tcg_gen_mov_tl(cpu_tmp0, cpu_regs[R_ECX]);
773 gen_extu(size + 1, cpu_tmp0);
774 tcg_gen_brcondi_tl(TCG_COND_NE, cpu_tmp0, 0, label1);
777 static inline void gen_op_jz_ecx(int size, int label1)
779 tcg_gen_mov_tl(cpu_tmp0, cpu_regs[R_ECX]);
780 gen_extu(size + 1, cpu_tmp0);
781 tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_tmp0, 0, label1);
784 static void gen_helper_in_func(int ot, TCGv v, TCGv_i32 n)
786 switch (ot) {
787 case OT_BYTE:
788 gen_helper_inb(v, n);
789 break;
790 case OT_WORD:
791 gen_helper_inw(v, n);
792 break;
793 case OT_LONG:
794 gen_helper_inl(v, n);
795 break;
799 static void gen_helper_out_func(int ot, TCGv_i32 v, TCGv_i32 n)
801 switch (ot) {
802 case OT_BYTE:
803 gen_helper_outb(v, n);
804 break;
805 case OT_WORD:
806 gen_helper_outw(v, n);
807 break;
808 case OT_LONG:
809 gen_helper_outl(v, n);
810 break;
814 static void gen_check_io(DisasContext *s, int ot, target_ulong cur_eip,
815 uint32_t svm_flags)
817 int state_saved;
818 target_ulong next_eip;
820 state_saved = 0;
821 if (s->pe && (s->cpl > s->iopl || s->vm86)) {
822 gen_update_cc_op(s);
823 gen_jmp_im(cur_eip);
824 state_saved = 1;
825 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
826 switch (ot) {
827 case OT_BYTE:
828 gen_helper_check_iob(cpu_env, cpu_tmp2_i32);
829 break;
830 case OT_WORD:
831 gen_helper_check_iow(cpu_env, cpu_tmp2_i32);
832 break;
833 case OT_LONG:
834 gen_helper_check_iol(cpu_env, cpu_tmp2_i32);
835 break;
838 if (s->flags & HF_SVMI_MASK) {
839 if (!state_saved) {
840 gen_update_cc_op(s);
841 gen_jmp_im(cur_eip);
843 svm_flags |= (1 << (4 + ot));
844 next_eip = s->pc - s->cs_base;
845 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
846 gen_helper_svm_check_io(cpu_env, cpu_tmp2_i32,
847 tcg_const_i32(svm_flags),
848 tcg_const_i32(next_eip - cur_eip));
852 static inline void gen_movs(DisasContext *s, int ot)
854 gen_string_movl_A0_ESI(s);
855 gen_op_ld_T0_A0(ot + s->mem_index);
856 gen_string_movl_A0_EDI(s);
857 gen_op_st_T0_A0(ot + s->mem_index);
858 gen_op_movl_T0_Dshift(ot);
859 gen_op_add_reg_T0(s->aflag, R_ESI);
860 gen_op_add_reg_T0(s->aflag, R_EDI);
863 static void gen_op_update1_cc(void)
865 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
868 static void gen_op_update2_cc(void)
870 tcg_gen_mov_tl(cpu_cc_src, cpu_T[1]);
871 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
874 static void gen_op_update3_cc(TCGv reg)
876 tcg_gen_mov_tl(cpu_cc_src2, reg);
877 tcg_gen_mov_tl(cpu_cc_src, cpu_T[1]);
878 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
881 static inline void gen_op_testl_T0_T1_cc(void)
883 tcg_gen_and_tl(cpu_cc_dst, cpu_T[0], cpu_T[1]);
886 static void gen_op_update_neg_cc(void)
888 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
889 tcg_gen_neg_tl(cpu_cc_src, cpu_T[0]);
890 tcg_gen_movi_tl(cpu_cc_srcT, 0);
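/* NEG computes 0 - operand, so its flags are those of a subtraction
 with minuend 0: cc_dst is the result, cc_src the negated result
 (i.e. the original operand), and cc_srcT the zero minuend. */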
893 /* compute all eflags to cc_src */
894 static void gen_compute_eflags(DisasContext *s)
896 TCGv zero, dst, src1, src2;
897 int live, dead;
899 if (s->cc_op == CC_OP_EFLAGS) {
900 return;
903 TCGV_UNUSED(zero);
904 dst = cpu_cc_dst;
905 src1 = cpu_cc_src;
906 src2 = cpu_cc_src2;
908 /* Take care to not read values that are not live. */
909 live = cc_op_live[s->cc_op] & ~USES_CC_SRCT;
910 dead = live ^ (USES_CC_DST | USES_CC_SRC | USES_CC_SRC2);
911 if (dead) {
912 zero = tcg_const_tl(0);
913 if (dead & USES_CC_DST) {
914 dst = zero;
916 if (dead & USES_CC_SRC) {
917 src1 = zero;
919 if (dead & USES_CC_SRC2) {
920 src2 = zero;
924 gen_update_cc_op(s);
925 gen_helper_cc_compute_all(cpu_cc_src, dst, src1, src2, cpu_cc_op);
926 set_cc_op(s, CC_OP_EFLAGS);
928 if (dead) {
929 tcg_temp_free(zero);
933 typedef struct CCPrepare {
934 TCGCond cond;
935 TCGv reg;
936 TCGv reg2;
937 target_ulong imm;
938 target_ulong mask;
939 bool use_reg2;
940 bool no_setcond;
941 } CCPrepare;
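/* Example: under CC_OP_EFLAGS, "carry set" is described as
 { .cond = TCG_COND_NE, .reg = cpu_cc_src, .mask = CC_C },
 i.e. test whether the CC_C bit of the stored flags is non-zero. */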
943 /* compute eflags.C to reg */
944 static CCPrepare gen_prepare_eflags_c(DisasContext *s, TCGv reg)
946 TCGv t0, t1;
947 int size, shift;
949 switch (s->cc_op) {
950 case CC_OP_SUBB ... CC_OP_SUBQ:
951 /* (DATA_TYPE)CC_SRCT < (DATA_TYPE)CC_SRC */
952 size = s->cc_op - CC_OP_SUBB;
953 t1 = gen_ext_tl(cpu_tmp0, cpu_cc_src, size, false);
954 /* If no temporary was used, be careful not to alias t1 and t0. */
955 t0 = TCGV_EQUAL(t1, cpu_cc_src) ? cpu_tmp0 : reg;
956 tcg_gen_mov_tl(t0, cpu_cc_srcT);
957 gen_extu(size, t0);
958 goto add_sub;
960 case CC_OP_ADDB ... CC_OP_ADDQ:
961 /* (DATA_TYPE)CC_DST < (DATA_TYPE)CC_SRC */
962 size = s->cc_op - CC_OP_ADDB;
963 t1 = gen_ext_tl(cpu_tmp0, cpu_cc_src, size, false);
964 t0 = gen_ext_tl(reg, cpu_cc_dst, size, false);
965 add_sub:
966 return (CCPrepare) { .cond = TCG_COND_LTU, .reg = t0,
967 .reg2 = t1, .mask = -1, .use_reg2 = true };
969 case CC_OP_LOGICB ... CC_OP_LOGICQ:
970 return (CCPrepare) { .cond = TCG_COND_NEVER, .mask = -1 };
972 case CC_OP_INCB ... CC_OP_INCQ:
973 case CC_OP_DECB ... CC_OP_DECQ:
974 return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
975 .mask = -1, .no_setcond = true };
977 case CC_OP_SHLB ... CC_OP_SHLQ:
978 /* (CC_SRC >> (DATA_BITS - 1)) & 1 */
979 size = s->cc_op - CC_OP_SHLB;
980 shift = (8 << size) - 1;
981 return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
982 .mask = (target_ulong)1 << shift };
984 case CC_OP_MULB ... CC_OP_MULQ:
985 return (CCPrepare) { .cond = TCG_COND_NE,
986 .reg = cpu_cc_src, .mask = -1 };
988 case CC_OP_EFLAGS:
989 case CC_OP_SARB ... CC_OP_SARQ:
990 /* CC_SRC & 1 */
991 return (CCPrepare) { .cond = TCG_COND_NE,
992 .reg = cpu_cc_src, .mask = CC_C };
994 default:
995 /* The need to compute only C from CC_OP_DYNAMIC is important
996 in efficiently implementing e.g. INC at the start of a TB. */
997 gen_update_cc_op(s);
998 gen_helper_cc_compute_c(reg, cpu_cc_dst, cpu_cc_src,
999 cpu_cc_src2, cpu_cc_op);
1000 return (CCPrepare) { .cond = TCG_COND_NE, .reg = reg,
1001 .mask = -1, .no_setcond = true };
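/* Worked example: after an 8-bit SUB with CC_OP_SUBB, CC_SRCT holds
 the minuend and CC_SRC the subtrahend; srcT = 0x10, src = 0x20
 gives 0x10 < 0x20 unsigned, so the prepared LTU test yields C = 1. */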
1005 /* compute eflags.P to reg */
1006 static CCPrepare gen_prepare_eflags_p(DisasContext *s, TCGv reg)
1008 gen_compute_eflags(s);
1009 return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
1010 .mask = CC_P };
1013 /* compute eflags.S to reg */
1014 static CCPrepare gen_prepare_eflags_s(DisasContext *s, TCGv reg)
1016 switch (s->cc_op) {
1017 case CC_OP_DYNAMIC:
1018 gen_compute_eflags(s);
1019 /* FALLTHRU */
1020 case CC_OP_EFLAGS:
1021 return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
1022 .mask = CC_S };
1023 default:
1025 int size = (s->cc_op - CC_OP_ADDB) & 3;
1026 TCGv t0 = gen_ext_tl(reg, cpu_cc_dst, size, true);
1027 return (CCPrepare) { .cond = TCG_COND_LT, .reg = t0, .mask = -1 };
1032 /* compute eflags.O to reg */
1033 static CCPrepare gen_prepare_eflags_o(DisasContext *s, TCGv reg)
1035 gen_compute_eflags(s);
1036 return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
1037 .mask = CC_O };
1040 /* compute eflags.Z to reg */
1041 static CCPrepare gen_prepare_eflags_z(DisasContext *s, TCGv reg)
1043 switch (s->cc_op) {
1044 case CC_OP_DYNAMIC:
1045 gen_compute_eflags(s);
1046 /* FALLTHRU */
1047 case CC_OP_EFLAGS:
1048 return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
1049 .mask = CC_Z };
1050 default:
1052 int size = (s->cc_op - CC_OP_ADDB) & 3;
1053 TCGv t0 = gen_ext_tl(reg, cpu_cc_dst, size, false);
1054 return (CCPrepare) { .cond = TCG_COND_EQ, .reg = t0, .mask = -1 };
1059 /* perform a conditional store into register 'reg' according to jump opcode
1060 value 'b'. In the fast case, T0 is guaranteed not to be used. */
1061 static CCPrepare gen_prepare_cc(DisasContext *s, int b, TCGv reg)
1063 int inv, jcc_op, size, cond;
1064 CCPrepare cc;
1065 TCGv t0;
1067 inv = b & 1;
1068 jcc_op = (b >> 1) & 7;
1070 switch (s->cc_op) {
1071 case CC_OP_SUBB ... CC_OP_SUBQ:
1072 /* We optimize relational operators for the cmp/jcc case. */
1073 size = s->cc_op - CC_OP_SUBB;
1074 switch (jcc_op) {
1075 case JCC_BE:
1076 tcg_gen_mov_tl(cpu_tmp4, cpu_cc_srcT);
1077 gen_extu(size, cpu_tmp4);
1078 t0 = gen_ext_tl(cpu_tmp0, cpu_cc_src, size, false);
1079 cc = (CCPrepare) { .cond = TCG_COND_LEU, .reg = cpu_tmp4,
1080 .reg2 = t0, .mask = -1, .use_reg2 = true };
1081 break;
1083 case JCC_L:
1084 cond = TCG_COND_LT;
1085 goto fast_jcc_l;
1086 case JCC_LE:
1087 cond = TCG_COND_LE;
1088 fast_jcc_l:
1089 tcg_gen_mov_tl(cpu_tmp4, cpu_cc_srcT);
1090 gen_exts(size, cpu_tmp4);
1091 t0 = gen_ext_tl(cpu_tmp0, cpu_cc_src, size, true);
1092 cc = (CCPrepare) { .cond = cond, .reg = cpu_tmp4,
1093 .reg2 = t0, .mask = -1, .use_reg2 = true };
1094 break;
1096 default:
1097 goto slow_jcc;
1099 break;
1101 default:
1102 slow_jcc:
1103 /* This actually generates good code for JC, JZ and JS. */
1104 switch (jcc_op) {
1105 case JCC_O:
1106 cc = gen_prepare_eflags_o(s, reg);
1107 break;
1108 case JCC_B:
1109 cc = gen_prepare_eflags_c(s, reg);
1110 break;
1111 case JCC_Z:
1112 cc = gen_prepare_eflags_z(s, reg);
1113 break;
1114 case JCC_BE:
1115 gen_compute_eflags(s);
1116 cc = (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
1117 .mask = CC_Z | CC_C };
1118 break;
1119 case JCC_S:
1120 cc = gen_prepare_eflags_s(s, reg);
1121 break;
1122 case JCC_P:
1123 cc = gen_prepare_eflags_p(s, reg);
1124 break;
1125 case JCC_L:
1126 gen_compute_eflags(s);
1127 if (TCGV_EQUAL(reg, cpu_cc_src)) {
1128 reg = cpu_tmp0;
1130 tcg_gen_shri_tl(reg, cpu_cc_src, 4); /* CC_O -> CC_S */
1131 tcg_gen_xor_tl(reg, reg, cpu_cc_src);
1132 cc = (CCPrepare) { .cond = TCG_COND_NE, .reg = reg,
1133 .mask = CC_S };
1134 break;
1135 default:
1136 case JCC_LE:
1137 gen_compute_eflags(s);
1138 if (TCGV_EQUAL(reg, cpu_cc_src)) {
1139 reg = cpu_tmp0;
1141 tcg_gen_shri_tl(reg, cpu_cc_src, 4); /* CC_O -> CC_S */
1142 tcg_gen_xor_tl(reg, reg, cpu_cc_src);
1143 cc = (CCPrepare) { .cond = TCG_COND_NE, .reg = reg,
1144 .mask = CC_S | CC_Z };
1145 break;
1147 break;
1150 if (inv) {
1151 cc.cond = tcg_invert_cond(cc.cond);
1153 return cc;
1156 static void gen_setcc1(DisasContext *s, int b, TCGv reg)
1158 CCPrepare cc = gen_prepare_cc(s, b, reg);
1160 if (cc.no_setcond) {
1161 if (cc.cond == TCG_COND_EQ) {
1162 tcg_gen_xori_tl(reg, cc.reg, 1);
1163 } else {
1164 tcg_gen_mov_tl(reg, cc.reg);
1166 return;
1169 if (cc.cond == TCG_COND_NE && !cc.use_reg2 && cc.imm == 0 &&
1170 cc.mask != 0 && (cc.mask & (cc.mask - 1)) == 0) {
1171 tcg_gen_shri_tl(reg, cc.reg, ctztl(cc.mask));
1172 tcg_gen_andi_tl(reg, reg, 1);
1173 return;
1175 if (cc.mask != -1) {
1176 tcg_gen_andi_tl(reg, cc.reg, cc.mask);
1177 cc.reg = reg;
1179 if (cc.use_reg2) {
1180 tcg_gen_setcond_tl(cc.cond, reg, cc.reg, cc.reg2);
1181 } else {
1182 tcg_gen_setcondi_tl(cc.cond, reg, cc.reg, cc.imm);
1186 static inline void gen_compute_eflags_c(DisasContext *s, TCGv reg)
1188 gen_setcc1(s, JCC_B << 1, reg);
1191 /* generate a conditional jump to label 'l1' according to jump opcode
1192 value 'b'. In the fast case, T0 is guaranteed not to be used. */
1193 static inline void gen_jcc1_noeob(DisasContext *s, int b, int l1)
1195 CCPrepare cc = gen_prepare_cc(s, b, cpu_T[0]);
1197 if (cc.mask != -1) {
1198 tcg_gen_andi_tl(cpu_T[0], cc.reg, cc.mask);
1199 cc.reg = cpu_T[0];
1201 if (cc.use_reg2) {
1202 tcg_gen_brcond_tl(cc.cond, cc.reg, cc.reg2, l1);
1203 } else {
1204 tcg_gen_brcondi_tl(cc.cond, cc.reg, cc.imm, l1);
1208 /* Generate a conditional jump to label 'l1' according to jump opcode
1209 value 'b'. In the fast case, T0 is guaranteed not to be used.
1210 A translation block must end soon. */
1211 static inline void gen_jcc1(DisasContext *s, int b, int l1)
1213 CCPrepare cc = gen_prepare_cc(s, b, cpu_T[0]);
1215 gen_update_cc_op(s);
1216 if (cc.mask != -1) {
1217 tcg_gen_andi_tl(cpu_T[0], cc.reg, cc.mask);
1218 cc.reg = cpu_T[0];
1220 set_cc_op(s, CC_OP_DYNAMIC);
1221 if (cc.use_reg2) {
1222 tcg_gen_brcond_tl(cc.cond, cc.reg, cc.reg2, l1);
1223 } else {
1224 tcg_gen_brcondi_tl(cc.cond, cc.reg, cc.imm, l1);
1228 /* XXX: does not work with gdbstub "ice" single step - not a
1229 serious problem */
1230 static int gen_jz_ecx_string(DisasContext *s, target_ulong next_eip)
1232 int l1, l2;
1234 l1 = gen_new_label();
1235 l2 = gen_new_label();
1236 gen_op_jnz_ecx(s->aflag, l1);
1237 gen_set_label(l2);
1238 gen_jmp_tb(s, next_eip, 1);
1239 gen_set_label(l1);
1240 return l2;
1243 static inline void gen_stos(DisasContext *s, int ot)
1245 gen_op_mov_TN_reg(OT_LONG, 0, R_EAX);
1246 gen_string_movl_A0_EDI(s);
1247 gen_op_st_T0_A0(ot + s->mem_index);
1248 gen_op_movl_T0_Dshift(ot);
1249 gen_op_add_reg_T0(s->aflag, R_EDI);
1252 static inline void gen_lods(DisasContext *s, int ot)
1254 gen_string_movl_A0_ESI(s);
1255 gen_op_ld_T0_A0(ot + s->mem_index);
1256 gen_op_mov_reg_T0(ot, R_EAX);
1257 gen_op_movl_T0_Dshift(ot);
1258 gen_op_add_reg_T0(s->aflag, R_ESI);
1261 static inline void gen_scas(DisasContext *s, int ot)
1263 gen_string_movl_A0_EDI(s);
1264 gen_op_ld_T1_A0(ot + s->mem_index);
1265 gen_op(s, OP_CMPL, ot, R_EAX);
1266 gen_op_movl_T0_Dshift(ot);
1267 gen_op_add_reg_T0(s->aflag, R_EDI);
1270 static inline void gen_cmps(DisasContext *s, int ot)
1272 gen_string_movl_A0_EDI(s);
1273 gen_op_ld_T1_A0(ot + s->mem_index);
1274 gen_string_movl_A0_ESI(s);
1275 gen_op(s, OP_CMPL, ot, OR_TMP0);
1276 gen_op_movl_T0_Dshift(ot);
1277 gen_op_add_reg_T0(s->aflag, R_ESI);
1278 gen_op_add_reg_T0(s->aflag, R_EDI);
1281 static inline void gen_ins(DisasContext *s, int ot)
1283 if (use_icount)
1284 gen_io_start();
1285 gen_string_movl_A0_EDI(s);
1286 /* Note: we must do this dummy write first to be restartable in
1287 case of page fault. */
1288 gen_op_movl_T0_0();
1289 gen_op_st_T0_A0(ot + s->mem_index);
1290 gen_op_mov_TN_reg(OT_WORD, 1, R_EDX);
1291 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[1]);
1292 tcg_gen_andi_i32(cpu_tmp2_i32, cpu_tmp2_i32, 0xffff);
1293 gen_helper_in_func(ot, cpu_T[0], cpu_tmp2_i32);
1294 gen_op_st_T0_A0(ot + s->mem_index);
1295 gen_op_movl_T0_Dshift(ot);
1296 gen_op_add_reg_T0(s->aflag, R_EDI);
1297 if (use_icount)
1298 gen_io_end();
1301 static inline void gen_outs(DisasContext *s, int ot)
1303 if (use_icount)
1304 gen_io_start();
1305 gen_string_movl_A0_ESI(s);
1306 gen_op_ld_T0_A0(ot + s->mem_index);
1308 gen_op_mov_TN_reg(OT_WORD, 1, R_EDX);
1309 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[1]);
1310 tcg_gen_andi_i32(cpu_tmp2_i32, cpu_tmp2_i32, 0xffff);
1311 tcg_gen_trunc_tl_i32(cpu_tmp3_i32, cpu_T[0]);
1312 gen_helper_out_func(ot, cpu_tmp2_i32, cpu_tmp3_i32);
1314 gen_op_movl_T0_Dshift(ot);
1315 gen_op_add_reg_T0(s->aflag, R_ESI);
1316 if (use_icount)
1317 gen_io_end();
1320 /* same method as Valgrind: we generate jumps to current or next
1321 instruction */
1322 #define GEN_REPZ(op) \
1323 static inline void gen_repz_ ## op(DisasContext *s, int ot, \
1324 target_ulong cur_eip, target_ulong next_eip) \
1326 int l2;\
1327 gen_update_cc_op(s); \
1328 l2 = gen_jz_ecx_string(s, next_eip); \
1329 gen_ ## op(s, ot); \
1330 gen_op_add_reg_im(s->aflag, R_ECX, -1); \
1331 /* a loop would cause two single step exceptions if ECX = 1 \
1332 before rep string_insn */ \
1333 if (!s->jmp_opt) \
1334 gen_op_jz_ecx(s->aflag, l2); \
1335 gen_jmp(s, cur_eip); \
1338 #define GEN_REPZ2(op) \
1339 static inline void gen_repz_ ## op(DisasContext *s, int ot, \
1340 target_ulong cur_eip, \
1341 target_ulong next_eip, \
1342 int nz) \
1344 int l2;\
1345 gen_update_cc_op(s); \
1346 l2 = gen_jz_ecx_string(s, next_eip); \
1347 gen_ ## op(s, ot); \
1348 gen_op_add_reg_im(s->aflag, R_ECX, -1); \
1349 gen_update_cc_op(s); \
1350 gen_jcc1(s, (JCC_Z << 1) | (nz ^ 1), l2); \
1351 if (!s->jmp_opt) \
1352 gen_op_jz_ecx(s->aflag, l2); \
1353 gen_jmp(s, cur_eip); \
1356 GEN_REPZ(movs)
1357 GEN_REPZ(stos)
1358 GEN_REPZ(lods)
1359 GEN_REPZ(ins)
1360 GEN_REPZ(outs)
1361 GEN_REPZ2(scas)
1362 GEN_REPZ2(cmps)
1364 static void gen_helper_fp_arith_ST0_FT0(int op)
1366 switch (op) {
1367 case 0:
1368 gen_helper_fadd_ST0_FT0(cpu_env);
1369 break;
1370 case 1:
1371 gen_helper_fmul_ST0_FT0(cpu_env);
1372 break;
1373 case 2:
1374 gen_helper_fcom_ST0_FT0(cpu_env);
1375 break;
1376 case 3:
1377 gen_helper_fcom_ST0_FT0(cpu_env);
1378 break;
1379 case 4:
1380 gen_helper_fsub_ST0_FT0(cpu_env);
1381 break;
1382 case 5:
1383 gen_helper_fsubr_ST0_FT0(cpu_env);
1384 break;
1385 case 6:
1386 gen_helper_fdiv_ST0_FT0(cpu_env);
1387 break;
1388 case 7:
1389 gen_helper_fdivr_ST0_FT0(cpu_env);
1390 break;
1394 /* NOTE the exception in "r" op ordering */
1395 static void gen_helper_fp_arith_STN_ST0(int op, int opreg)
1397 TCGv_i32 tmp = tcg_const_i32(opreg);
1398 switch (op) {
1399 case 0:
1400 gen_helper_fadd_STN_ST0(cpu_env, tmp);
1401 break;
1402 case 1:
1403 gen_helper_fmul_STN_ST0(cpu_env, tmp);
1404 break;
1405 case 4:
1406 gen_helper_fsubr_STN_ST0(cpu_env, tmp);
1407 break;
1408 case 5:
1409 gen_helper_fsub_STN_ST0(cpu_env, tmp);
1410 break;
1411 case 6:
1412 gen_helper_fdivr_STN_ST0(cpu_env, tmp);
1413 break;
1414 case 7:
1415 gen_helper_fdiv_STN_ST0(cpu_env, tmp);
1416 break;
1420 /* if d == OR_TMP0, it means memory operand (address in A0) */
1421 static void gen_op(DisasContext *s1, int op, int ot, int d)
1423 if (d != OR_TMP0) {
1424 gen_op_mov_TN_reg(ot, 0, d);
1425 } else {
1426 gen_op_ld_T0_A0(ot + s1->mem_index);
1428 switch(op) {
1429 case OP_ADCL:
1430 gen_compute_eflags_c(s1, cpu_tmp4);
1431 tcg_gen_add_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
1432 tcg_gen_add_tl(cpu_T[0], cpu_T[0], cpu_tmp4);
1433 if (d != OR_TMP0)
1434 gen_op_mov_reg_T0(ot, d);
1435 else
1436 gen_op_st_T0_A0(ot + s1->mem_index);
1437 gen_op_update3_cc(cpu_tmp4);
1438 set_cc_op(s1, CC_OP_ADCB + ot);
1439 break;
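/* Both ADC above and SBB below store the carry/borrow-in in CC_SRC2
 via gen_op_update3_cc(), so the flag helpers can recompute EFLAGS
 from dst, src and src2 alone (see the ADC and SBB rows of
 cc_op_live). */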
1440 case OP_SBBL:
1441 gen_compute_eflags_c(s1, cpu_tmp4);
1442 tcg_gen_sub_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
1443 tcg_gen_sub_tl(cpu_T[0], cpu_T[0], cpu_tmp4);
1444 if (d != OR_TMP0)
1445 gen_op_mov_reg_T0(ot, d);
1446 else
1447 gen_op_st_T0_A0(ot + s1->mem_index);
1448 gen_op_update3_cc(cpu_tmp4);
1449 set_cc_op(s1, CC_OP_SBBB + ot);
1450 break;
1451 case OP_ADDL:
1452 gen_op_addl_T0_T1();
1453 if (d != OR_TMP0)
1454 gen_op_mov_reg_T0(ot, d);
1455 else
1456 gen_op_st_T0_A0(ot + s1->mem_index);
1457 gen_op_update2_cc();
1458 set_cc_op(s1, CC_OP_ADDB + ot);
1459 break;
1460 case OP_SUBL:
1461 tcg_gen_mov_tl(cpu_cc_srcT, cpu_T[0]);
1462 tcg_gen_sub_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
1463 if (d != OR_TMP0)
1464 gen_op_mov_reg_T0(ot, d);
1465 else
1466 gen_op_st_T0_A0(ot + s1->mem_index);
1467 gen_op_update2_cc();
1468 set_cc_op(s1, CC_OP_SUBB + ot);
1469 break;
1470 default:
1471 case OP_ANDL:
1472 tcg_gen_and_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
1473 if (d != OR_TMP0)
1474 gen_op_mov_reg_T0(ot, d);
1475 else
1476 gen_op_st_T0_A0(ot + s1->mem_index);
1477 gen_op_update1_cc();
1478 set_cc_op(s1, CC_OP_LOGICB + ot);
1479 break;
1480 case OP_ORL:
1481 tcg_gen_or_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
1482 if (d != OR_TMP0)
1483 gen_op_mov_reg_T0(ot, d);
1484 else
1485 gen_op_st_T0_A0(ot + s1->mem_index);
1486 gen_op_update1_cc();
1487 set_cc_op(s1, CC_OP_LOGICB + ot);
1488 break;
1489 case OP_XORL:
1490 tcg_gen_xor_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
1491 if (d != OR_TMP0)
1492 gen_op_mov_reg_T0(ot, d);
1493 else
1494 gen_op_st_T0_A0(ot + s1->mem_index);
1495 gen_op_update1_cc();
1496 set_cc_op(s1, CC_OP_LOGICB + ot);
1497 break;
1498 case OP_CMPL:
1499 tcg_gen_mov_tl(cpu_cc_src, cpu_T[1]);
1500 tcg_gen_mov_tl(cpu_cc_srcT, cpu_T[0]);
1501 tcg_gen_sub_tl(cpu_cc_dst, cpu_T[0], cpu_T[1]);
1502 set_cc_op(s1, CC_OP_SUBB + ot);
1503 break;
1507 /* if d == OR_TMP0, it means memory operand (address in A0) */
1508 static void gen_inc(DisasContext *s1, int ot, int d, int c)
1510 if (d != OR_TMP0)
1511 gen_op_mov_TN_reg(ot, 0, d);
1512 else
1513 gen_op_ld_T0_A0(ot + s1->mem_index);
1514 gen_compute_eflags_c(s1, cpu_cc_src);
1515 if (c > 0) {
1516 tcg_gen_addi_tl(cpu_T[0], cpu_T[0], 1);
1517 set_cc_op(s1, CC_OP_INCB + ot);
1518 } else {
1519 tcg_gen_addi_tl(cpu_T[0], cpu_T[0], -1);
1520 set_cc_op(s1, CC_OP_DECB + ot);
1522 if (d != OR_TMP0)
1523 gen_op_mov_reg_T0(ot, d);
1524 else
1525 gen_op_st_T0_A0(ot + s1->mem_index);
1526 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
1529 static void gen_shift_rm_T1(DisasContext *s, int ot, int op1,
1530 int is_right, int is_arith)
1532 target_ulong mask;
1533 int shift_label;
1534 TCGv t0, t1, t2;
1536 if (ot == OT_QUAD) {
1537 mask = 0x3f;
1538 } else {
1539 mask = 0x1f;
1542 /* load */
1543 if (op1 == OR_TMP0) {
1544 gen_op_ld_T0_A0(ot + s->mem_index);
1545 } else {
1546 gen_op_mov_TN_reg(ot, 0, op1);
1549 t0 = tcg_temp_local_new();
1550 t1 = tcg_temp_local_new();
1551 t2 = tcg_temp_local_new();
1553 tcg_gen_andi_tl(t2, cpu_T[1], mask);
1555 if (is_right) {
1556 if (is_arith) {
1557 gen_exts(ot, cpu_T[0]);
1558 tcg_gen_mov_tl(t0, cpu_T[0]);
1559 tcg_gen_sar_tl(cpu_T[0], cpu_T[0], t2);
1560 } else {
1561 gen_extu(ot, cpu_T[0]);
1562 tcg_gen_mov_tl(t0, cpu_T[0]);
1563 tcg_gen_shr_tl(cpu_T[0], cpu_T[0], t2);
1565 } else {
1566 tcg_gen_mov_tl(t0, cpu_T[0]);
1567 tcg_gen_shl_tl(cpu_T[0], cpu_T[0], t2);
1570 /* store */
1571 if (op1 == OR_TMP0) {
1572 gen_op_st_T0_A0(ot + s->mem_index);
1573 } else {
1574 gen_op_mov_reg_T0(ot, op1);
1577 /* Update eflags data because we cannot predict flags afterward. */
1578 gen_update_cc_op(s);
1579 set_cc_op(s, CC_OP_DYNAMIC);
1581 tcg_gen_mov_tl(t1, cpu_T[0]);
1583 shift_label = gen_new_label();
1584 tcg_gen_brcondi_tl(TCG_COND_EQ, t2, 0, shift_label);
1586 tcg_gen_addi_tl(t2, t2, -1);
1587 tcg_gen_mov_tl(cpu_cc_dst, t1);
1589 if (is_right) {
1590 if (is_arith) {
1591 tcg_gen_sar_tl(cpu_cc_src, t0, t2);
1592 } else {
1593 tcg_gen_shr_tl(cpu_cc_src, t0, t2);
1595 } else {
1596 tcg_gen_shl_tl(cpu_cc_src, t0, t2);
1599 if (is_right) {
1600 tcg_gen_movi_i32(cpu_cc_op, CC_OP_SARB + ot);
1601 } else {
1602 tcg_gen_movi_i32(cpu_cc_op, CC_OP_SHLB + ot);
1605 gen_set_label(shift_label);
1607 tcg_temp_free(t0);
1608 tcg_temp_free(t1);
1609 tcg_temp_free(t2);
1612 static void gen_shift_rm_im(DisasContext *s, int ot, int op1, int op2,
1613 int is_right, int is_arith)
1615 int mask;
1617 if (ot == OT_QUAD)
1618 mask = 0x3f;
1619 else
1620 mask = 0x1f;
1622 /* load */
1623 if (op1 == OR_TMP0)
1624 gen_op_ld_T0_A0(ot + s->mem_index);
1625 else
1626 gen_op_mov_TN_reg(ot, 0, op1);
1628 op2 &= mask;
1629 if (op2 != 0) {
1630 if (is_right) {
1631 if (is_arith) {
1632 gen_exts(ot, cpu_T[0]);
1633 tcg_gen_sari_tl(cpu_tmp4, cpu_T[0], op2 - 1);
1634 tcg_gen_sari_tl(cpu_T[0], cpu_T[0], op2);
1635 } else {
1636 gen_extu(ot, cpu_T[0]);
1637 tcg_gen_shri_tl(cpu_tmp4, cpu_T[0], op2 - 1);
1638 tcg_gen_shri_tl(cpu_T[0], cpu_T[0], op2);
1640 } else {
1641 tcg_gen_shli_tl(cpu_tmp4, cpu_T[0], op2 - 1);
1642 tcg_gen_shli_tl(cpu_T[0], cpu_T[0], op2);
1646 /* store */
1647 if (op1 == OR_TMP0)
1648 gen_op_st_T0_A0(ot + s->mem_index);
1649 else
1650 gen_op_mov_reg_T0(ot, op1);
1652 /* update eflags if non-zero shift */
1653 if (op2 != 0) {
1654 tcg_gen_mov_tl(cpu_cc_src, cpu_tmp4);
1655 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
1656 set_cc_op(s, (is_right ? CC_OP_SARB : CC_OP_SHLB) + ot);
1660 static inline void tcg_gen_lshift(TCGv ret, TCGv arg1, target_long arg2)
1662 if (arg2 >= 0)
1663 tcg_gen_shli_tl(ret, arg1, arg2);
1664 else
1665 tcg_gen_shri_tl(ret, arg1, -arg2);
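/* Example: tcg_gen_lshift(ret, arg1, -3) shifts right by 3. The
 rotate code below uses the possibly negative count
 11 - (data_bits - 1) to move the top bit of (old ^ new) into the
 CC_O position (bit 11 of EFLAGS). */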
1668 static void gen_rot_rm_T1(DisasContext *s, int ot, int op1,
1669 int is_right)
1671 target_ulong mask;
1672 int label1, label2, data_bits;
1673 TCGv t0, t1, t2, a0;
1675 /* XXX: inefficient, but we must use local temps */
1676 t0 = tcg_temp_local_new();
1677 t1 = tcg_temp_local_new();
1678 t2 = tcg_temp_local_new();
1679 a0 = tcg_temp_local_new();
1681 if (ot == OT_QUAD)
1682 mask = 0x3f;
1683 else
1684 mask = 0x1f;
1686 /* load */
1687 if (op1 == OR_TMP0) {
1688 tcg_gen_mov_tl(a0, cpu_A0);
1689 gen_op_ld_v(ot + s->mem_index, t0, a0);
1690 } else {
1691 gen_op_mov_v_reg(ot, t0, op1);
1694 tcg_gen_mov_tl(t1, cpu_T[1]);
1696 tcg_gen_andi_tl(t1, t1, mask);
1698 /* Must test zero case to avoid using undefined behaviour in TCG
1699 shifts. */
1700 label1 = gen_new_label();
1701 tcg_gen_brcondi_tl(TCG_COND_EQ, t1, 0, label1);
1703 if (ot <= OT_WORD)
1704 tcg_gen_andi_tl(cpu_tmp0, t1, (1 << (3 + ot)) - 1);
1705 else
1706 tcg_gen_mov_tl(cpu_tmp0, t1);
1708 gen_extu(ot, t0);
1709 tcg_gen_mov_tl(t2, t0);
1711 data_bits = 8 << ot;
1712 /* XXX: rely on behaviour of shifts when operand 2 overflows (XXX:
1713 fix TCG definition) */
1714 if (is_right) {
1715 tcg_gen_shr_tl(cpu_tmp4, t0, cpu_tmp0);
1716 tcg_gen_subfi_tl(cpu_tmp0, data_bits, cpu_tmp0);
1717 tcg_gen_shl_tl(t0, t0, cpu_tmp0);
1718 } else {
1719 tcg_gen_shl_tl(cpu_tmp4, t0, cpu_tmp0);
1720 tcg_gen_subfi_tl(cpu_tmp0, data_bits, cpu_tmp0);
1721 tcg_gen_shr_tl(t0, t0, cpu_tmp0);
1723 tcg_gen_or_tl(t0, t0, cpu_tmp4);
1725 gen_set_label(label1);
1726 /* store */
1727 if (op1 == OR_TMP0) {
1728 gen_op_st_v(ot + s->mem_index, t0, a0);
1729 } else {
1730 gen_op_mov_reg_v(ot, op1, t0);
1733 /* update eflags. It is needed anyway most of the time, so do it always. */
1734 gen_compute_eflags(s);
1735 assert(s->cc_op == CC_OP_EFLAGS);
1737 label2 = gen_new_label();
1738 tcg_gen_brcondi_tl(TCG_COND_EQ, t1, 0, label2);
1740 tcg_gen_andi_tl(cpu_cc_src, cpu_cc_src, ~(CC_O | CC_C));
1741 tcg_gen_xor_tl(cpu_tmp0, t2, t0);
1742 tcg_gen_lshift(cpu_tmp0, cpu_tmp0, 11 - (data_bits - 1));
1743 tcg_gen_andi_tl(cpu_tmp0, cpu_tmp0, CC_O);
1744 tcg_gen_or_tl(cpu_cc_src, cpu_cc_src, cpu_tmp0);
1745 if (is_right) {
1746 tcg_gen_shri_tl(t0, t0, data_bits - 1);
1748 tcg_gen_andi_tl(t0, t0, CC_C);
1749 tcg_gen_or_tl(cpu_cc_src, cpu_cc_src, t0);
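/* At this point CC_C holds the new carry (bit 0 of the result for a
 left rotate, the top bit for a right rotate) and CC_O holds the top
 bit of (old ^ new), shifted into bit 11 of EFLAGS. */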
1751 gen_set_label(label2);
1753 tcg_temp_free(t0);
1754 tcg_temp_free(t1);
1755 tcg_temp_free(t2);
1756 tcg_temp_free(a0);
1759 static void gen_rot_rm_im(DisasContext *s, int ot, int op1, int op2,
1760 int is_right)
1762 int mask;
1763 int data_bits;
1764 TCGv t0, t1, a0;
1766 /* XXX: inefficient, but we must use local temps */
1767 t0 = tcg_temp_local_new();
1768 t1 = tcg_temp_local_new();
1769 a0 = tcg_temp_local_new();
1771 if (ot == OT_QUAD)
1772 mask = 0x3f;
1773 else
1774 mask = 0x1f;
1776 /* load */
1777 if (op1 == OR_TMP0) {
1778 tcg_gen_mov_tl(a0, cpu_A0);
1779 gen_op_ld_v(ot + s->mem_index, t0, a0);
1780 } else {
1781 gen_op_mov_v_reg(ot, t0, op1);
1784 gen_extu(ot, t0);
1785 tcg_gen_mov_tl(t1, t0);
1787 op2 &= mask;
1788 data_bits = 8 << ot;
1789 if (op2 != 0) {
1790 int shift = op2 & ((1 << (3 + ot)) - 1);
1791 if (is_right) {
1792 tcg_gen_shri_tl(cpu_tmp4, t0, shift);
1793 tcg_gen_shli_tl(t0, t0, data_bits - shift);
1795 else {
1796 tcg_gen_shli_tl(cpu_tmp4, t0, shift);
1797 tcg_gen_shri_tl(t0, t0, data_bits - shift);
1799 tcg_gen_or_tl(t0, t0, cpu_tmp4);
1802 /* store */
1803 if (op1 == OR_TMP0) {
1804 gen_op_st_v(ot + s->mem_index, t0, a0);
1805 } else {
1806 gen_op_mov_reg_v(ot, op1, t0);
1809 if (op2 != 0) {
1810 /* update eflags */
1811 gen_compute_eflags(s);
1812 assert(s->cc_op == CC_OP_EFLAGS);
1814 tcg_gen_andi_tl(cpu_cc_src, cpu_cc_src, ~(CC_O | CC_C));
1815 tcg_gen_xor_tl(cpu_tmp0, t1, t0);
1816 tcg_gen_lshift(cpu_tmp0, cpu_tmp0, 11 - (data_bits - 1));
1817 tcg_gen_andi_tl(cpu_tmp0, cpu_tmp0, CC_O);
1818 tcg_gen_or_tl(cpu_cc_src, cpu_cc_src, cpu_tmp0);
1819 if (is_right) {
1820 tcg_gen_shri_tl(t0, t0, data_bits - 1);
1822 tcg_gen_andi_tl(t0, t0, CC_C);
1823 tcg_gen_or_tl(cpu_cc_src, cpu_cc_src, t0);
1826 tcg_temp_free(t0);
1827 tcg_temp_free(t1);
1828 tcg_temp_free(a0);
1831 /* XXX: add faster immediate = 1 case */
1832 static void gen_rotc_rm_T1(DisasContext *s, int ot, int op1,
1833 int is_right)
1835 gen_compute_eflags(s);
1836 assert(s->cc_op == CC_OP_EFLAGS);
1838 /* load */
1839 if (op1 == OR_TMP0)
1840 gen_op_ld_T0_A0(ot + s->mem_index);
1841 else
1842 gen_op_mov_TN_reg(ot, 0, op1);
1844 if (is_right) {
1845 switch (ot) {
1846 case OT_BYTE:
1847 gen_helper_rcrb(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1848 break;
1849 case OT_WORD:
1850 gen_helper_rcrw(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1851 break;
1852 case OT_LONG:
1853 gen_helper_rcrl(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1854 break;
1855 #ifdef TARGET_X86_64
1856 case OT_QUAD:
1857 gen_helper_rcrq(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1858 break;
1859 #endif
1861 } else {
1862 switch (ot) {
1863 case OT_BYTE:
1864 gen_helper_rclb(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1865 break;
1866 case OT_WORD:
1867 gen_helper_rclw(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1868 break;
1869 case OT_LONG:
1870 gen_helper_rcll(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1871 break;
1872 #ifdef TARGET_X86_64
1873 case OT_QUAD:
1874 gen_helper_rclq(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1875 break;
1876 #endif
1879 /* store */
1880 if (op1 == OR_TMP0)
1881 gen_op_st_T0_A0(ot + s->mem_index);
1882 else
1883 gen_op_mov_reg_T0(ot, op1);
1886 /* XXX: add faster immediate case */
1887 static void gen_shiftd_rm_T1(DisasContext *s, int ot, int op1,
1888 int is_right, TCGv count)
1890 int label1, label2, data_bits;
1891 target_ulong mask;
1892 TCGv t0, t1, t2, a0;
1894 t0 = tcg_temp_local_new();
1895 t1 = tcg_temp_local_new();
1896 t2 = tcg_temp_local_new();
1897 a0 = tcg_temp_local_new();
1899 if (ot == OT_QUAD)
1900 mask = 0x3f;
1901 else
1902 mask = 0x1f;
1904 /* load */
1905 if (op1 == OR_TMP0) {
1906 tcg_gen_mov_tl(a0, cpu_A0);
1907 gen_op_ld_v(ot + s->mem_index, t0, a0);
1908 } else {
1909 gen_op_mov_v_reg(ot, t0, op1);
1912 tcg_gen_andi_tl(t2, count, mask);
1913 tcg_gen_mov_tl(t1, cpu_T[1]);
1915 /* Must test zero case to avoid using undefined behaviour in TCG
1916 shifts. */
1917 label1 = gen_new_label();
1918 tcg_gen_brcondi_tl(TCG_COND_EQ, t2, 0, label1);
1920 tcg_gen_addi_tl(cpu_tmp5, t2, -1);
1921 if (ot == OT_WORD) {
1922 /* Note: we implement the Intel behaviour for shift count > 16 */
1923 if (is_right) {
1924 tcg_gen_andi_tl(t0, t0, 0xffff);
1925 tcg_gen_shli_tl(cpu_tmp0, t1, 16);
1926 tcg_gen_or_tl(t0, t0, cpu_tmp0);
1927 tcg_gen_ext32u_tl(t0, t0);
1929 tcg_gen_shr_tl(cpu_tmp4, t0, cpu_tmp5);
1931 /* only needed if count > 16, but a test would complicate the code */
1932 tcg_gen_subfi_tl(cpu_tmp5, 32, t2);
1933 tcg_gen_shl_tl(cpu_tmp0, t0, cpu_tmp5);
1935 tcg_gen_shr_tl(t0, t0, t2);
1937 tcg_gen_or_tl(t0, t0, cpu_tmp0);
1938 } else {
1939 /* XXX: not optimal */
1940 tcg_gen_andi_tl(t0, t0, 0xffff);
1941 tcg_gen_shli_tl(t1, t1, 16);
1942 tcg_gen_or_tl(t1, t1, t0);
1943 tcg_gen_ext32u_tl(t1, t1);
1945 tcg_gen_shl_tl(cpu_tmp4, t0, cpu_tmp5);
1946 tcg_gen_subfi_tl(cpu_tmp0, 32, cpu_tmp5);
1947 tcg_gen_shr_tl(cpu_tmp5, t1, cpu_tmp0);
1948 tcg_gen_or_tl(cpu_tmp4, cpu_tmp4, cpu_tmp5);
1950 tcg_gen_shl_tl(t0, t0, t2);
1951 tcg_gen_subfi_tl(cpu_tmp5, 32, t2);
1952 tcg_gen_shr_tl(t1, t1, cpu_tmp5);
1953 tcg_gen_or_tl(t0, t0, t1);
1955 } else {
1956 data_bits = 8 << ot;
1957 if (is_right) {
1958 if (ot == OT_LONG)
1959 tcg_gen_ext32u_tl(t0, t0);
1961 tcg_gen_shr_tl(cpu_tmp4, t0, cpu_tmp5);
1963 tcg_gen_shr_tl(t0, t0, t2);
1964 tcg_gen_subfi_tl(cpu_tmp5, data_bits, t2);
1965 tcg_gen_shl_tl(t1, t1, cpu_tmp5);
1966 tcg_gen_or_tl(t0, t0, t1);
1968 } else {
1969 if (ot == OT_LONG)
1970 tcg_gen_ext32u_tl(t1, t1);
1972 tcg_gen_shl_tl(cpu_tmp4, t0, cpu_tmp5);
1974 tcg_gen_shl_tl(t0, t0, t2);
1975 tcg_gen_subfi_tl(cpu_tmp5, data_bits, t2);
1976 tcg_gen_shr_tl(t1, t1, cpu_tmp5);
1977 tcg_gen_or_tl(t0, t0, t1);
1980 tcg_gen_mov_tl(t1, cpu_tmp4);
1982 gen_set_label(label1);
1983 /* store */
1984 if (op1 == OR_TMP0) {
1985 gen_op_st_v(ot + s->mem_index, t0, a0);
1986 } else {
1987 gen_op_mov_reg_v(ot, op1, t0);
1990 /* Update eflags data because we cannot predict flags afterward. */
1991 gen_update_cc_op(s);
1992 set_cc_op(s, CC_OP_DYNAMIC);
1994 label2 = gen_new_label();
1995 tcg_gen_brcondi_tl(TCG_COND_EQ, t2, 0, label2);
1997 tcg_gen_mov_tl(cpu_cc_src, t1);
1998 tcg_gen_mov_tl(cpu_cc_dst, t0);
1999 if (is_right) {
2000 tcg_gen_movi_i32(cpu_cc_op, CC_OP_SARB + ot);
2001 } else {
2002 tcg_gen_movi_i32(cpu_cc_op, CC_OP_SHLB + ot);
2004 gen_set_label(label2);
2006 tcg_temp_free(t0);
2007 tcg_temp_free(t1);
2008 tcg_temp_free(t2);
2009 tcg_temp_free(a0);
2012 static void gen_shift(DisasContext *s1, int op, int ot, int d, int s)
2014 if (s != OR_TMP1)
2015 gen_op_mov_TN_reg(ot, 1, s);
2016 switch(op) {
2017 case OP_ROL:
2018 gen_rot_rm_T1(s1, ot, d, 0);
2019 break;
2020 case OP_ROR:
2021 gen_rot_rm_T1(s1, ot, d, 1);
2022 break;
2023 case OP_SHL:
2024 case OP_SHL1:
2025 gen_shift_rm_T1(s1, ot, d, 0, 0);
2026 break;
2027 case OP_SHR:
2028 gen_shift_rm_T1(s1, ot, d, 1, 0);
2029 break;
2030 case OP_SAR:
2031 gen_shift_rm_T1(s1, ot, d, 1, 1);
2032 break;
2033 case OP_RCL:
2034 gen_rotc_rm_T1(s1, ot, d, 0);
2035 break;
2036 case OP_RCR:
2037 gen_rotc_rm_T1(s1, ot, d, 1);
2038 break;
2042 static void gen_shifti(DisasContext *s1, int op, int ot, int d, int c)
2044 switch(op) {
2045 case OP_ROL:
2046 gen_rot_rm_im(s1, ot, d, c, 0);
2047 break;
2048 case OP_ROR:
2049 gen_rot_rm_im(s1, ot, d, c, 1);
2050 break;
2051 case OP_SHL:
2052 case OP_SHL1:
2053 gen_shift_rm_im(s1, ot, d, c, 0, 0);
2054 break;
2055 case OP_SHR:
2056 gen_shift_rm_im(s1, ot, d, c, 1, 0);
2057 break;
2058 case OP_SAR:
2059 gen_shift_rm_im(s1, ot, d, c, 1, 1);
2060 break;
2061 default:
2062 /* currently not optimized */
2063 gen_op_movl_T1_im(c);
2064 gen_shift(s1, op, ot, d, OR_TMP1);
2065 break;
2069 static void gen_lea_modrm(CPUX86State *env, DisasContext *s, int modrm,
2070 int *reg_ptr, int *offset_ptr)
2072 target_long disp;
2073 int havesib;
2074 int base;
2075 int index;
2076 int scale;
2077 int opreg;
2078 int mod, rm, code, override, must_add_seg;
2080 override = s->override;
2081 must_add_seg = s->addseg;
2082 if (override >= 0)
2083 must_add_seg = 1;
2084 mod = (modrm >> 6) & 3;
2085 rm = modrm & 7;
2087 if (s->aflag) {
2089 havesib = 0;
2090 base = rm;
2091 index = 0;
2092 scale = 0;
2094 if (base == 4) {
2095 havesib = 1;
2096 code = cpu_ldub_code(env, s->pc++);
2097 scale = (code >> 6) & 3;
2098 index = ((code >> 3) & 7) | REX_X(s);
2099 base = (code & 7);
2101 base |= REX_B(s);
2103 switch (mod) {
2104 case 0:
2105 if ((base & 7) == 5) {
2106 base = -1;
2107 disp = (int32_t)cpu_ldl_code(env, s->pc);
2108 s->pc += 4;
2109 if (CODE64(s) && !havesib) {
2110 disp += s->pc + s->rip_offset;
2112 } else {
2113 disp = 0;
2115 break;
2116 case 1:
2117 disp = (int8_t)cpu_ldub_code(env, s->pc++);
2118 break;
2119 default:
2120 case 2:
2121 disp = (int32_t)cpu_ldl_code(env, s->pc);
2122 s->pc += 4;
2123 break;
2126 if (base >= 0) {
2127 /* for correct popl handling with esp */
2128 if (base == 4 && s->popl_esp_hack)
2129 disp += s->popl_esp_hack;
2130 #ifdef TARGET_X86_64
2131 if (s->aflag == 2) {
2132 gen_op_movq_A0_reg(base);
2133 if (disp != 0) {
2134 gen_op_addq_A0_im(disp);
2136 } else
2137 #endif
2139 gen_op_movl_A0_reg(base);
2140 if (disp != 0)
2141 gen_op_addl_A0_im(disp);
2143 } else {
2144 #ifdef TARGET_X86_64
2145 if (s->aflag == 2) {
2146 gen_op_movq_A0_im(disp);
2147 } else
2148 #endif
2150 gen_op_movl_A0_im(disp);
2153 /* index == 4 means no index */
2154 if (havesib && (index != 4)) {
2155 #ifdef TARGET_X86_64
2156 if (s->aflag == 2) {
2157 gen_op_addq_A0_reg_sN(scale, index);
2158 } else
2159 #endif
2161 gen_op_addl_A0_reg_sN(scale, index);
2164 if (must_add_seg) {
2165 if (override < 0) {
2166 if (base == R_EBP || base == R_ESP)
2167 override = R_SS;
2168 else
2169 override = R_DS;
2171 #ifdef TARGET_X86_64
2172 if (s->aflag == 2) {
2173 gen_op_addq_A0_seg(override);
2174 } else
2175 #endif
2177 gen_op_addl_A0_seg(s, override);
2180 } else {
2181 switch (mod) {
2182 case 0:
2183 if (rm == 6) {
2184 disp = cpu_lduw_code(env, s->pc);
2185 s->pc += 2;
2186 gen_op_movl_A0_im(disp);
2187 rm = 0; /* avoid SS override */
2188 goto no_rm;
2189 } else {
2190 disp = 0;
2192 break;
2193 case 1:
2194 disp = (int8_t)cpu_ldub_code(env, s->pc++);
2195 break;
2196 default:
2197 case 2:
2198 disp = cpu_lduw_code(env, s->pc);
2199 s->pc += 2;
2200 break;
2202 switch(rm) {
2203 case 0:
2204 gen_op_movl_A0_reg(R_EBX);
2205 gen_op_addl_A0_reg_sN(0, R_ESI);
2206 break;
2207 case 1:
2208 gen_op_movl_A0_reg(R_EBX);
2209 gen_op_addl_A0_reg_sN(0, R_EDI);
2210 break;
2211 case 2:
2212 gen_op_movl_A0_reg(R_EBP);
2213 gen_op_addl_A0_reg_sN(0, R_ESI);
2214 break;
2215 case 3:
2216 gen_op_movl_A0_reg(R_EBP);
2217 gen_op_addl_A0_reg_sN(0, R_EDI);
2218 break;
2219 case 4:
2220 gen_op_movl_A0_reg(R_ESI);
2221 break;
2222 case 5:
2223 gen_op_movl_A0_reg(R_EDI);
2224 break;
2225 case 6:
2226 gen_op_movl_A0_reg(R_EBP);
2227 break;
2228 default:
2229 case 7:
2230 gen_op_movl_A0_reg(R_EBX);
2231 break;
2233 if (disp != 0)
2234 gen_op_addl_A0_im(disp);
2235 gen_op_andl_A0_ffff();
2236 no_rm:
2237 if (must_add_seg) {
2238 if (override < 0) {
2239 if (rm == 2 || rm == 3 || rm == 6)
2240 override = R_SS;
2241 else
2242 override = R_DS;
2244 gen_op_addl_A0_seg(s, override);
2248 opreg = OR_A0;
2249 disp = 0;
2250 *reg_ptr = opreg;
2251 *offset_ptr = disp;
2254 static void gen_nop_modrm(CPUX86State *env, DisasContext *s, int modrm)
2256 int mod, rm, base, code;
2258 mod = (modrm >> 6) & 3;
2259 if (mod == 3)
2260 return;
2261 rm = modrm & 7;
2263 if (s->aflag) {
2265 base = rm;
2267 if (base == 4) {
2268 code = cpu_ldub_code(env, s->pc++);
2269 base = (code & 7);
2272 switch (mod) {
2273 case 0:
2274 if (base == 5) {
2275 s->pc += 4;
2277 break;
2278 case 1:
2279 s->pc++;
2280 break;
2281 default:
2282 case 2:
2283 s->pc += 4;
2284 break;
2286 } else {
2287 switch (mod) {
2288 case 0:
2289 if (rm == 6) {
2290 s->pc += 2;
2292 break;
2293 case 1:
2294 s->pc++;
2295 break;
2296 default:
2297 case 2:
2298 s->pc += 2;
2299 break;
2304 /* used for LEA and MOV AX, mem */
2305 static void gen_add_A0_ds_seg(DisasContext *s)
2307 int override, must_add_seg;
2308 must_add_seg = s->addseg;
2309 override = R_DS;
2310 if (s->override >= 0) {
2311 override = s->override;
2312 must_add_seg = 1;
2314 if (must_add_seg) {
2315 #ifdef TARGET_X86_64
2316 if (CODE64(s)) {
2317 gen_op_addq_A0_seg(override);
2318 } else
2319 #endif
2321 gen_op_addl_A0_seg(s, override);
2326 /* generate modrm memory load or store of 'reg'. TMP0 is used if reg ==
2327 OR_TMP0 */
2328 static void gen_ldst_modrm(CPUX86State *env, DisasContext *s, int modrm,
2329 int ot, int reg, int is_store)
2330 {
2331 int mod, rm, opreg, disp;
2333 mod = (modrm >> 6) & 3;
2334 rm = (modrm & 7) | REX_B(s);
2335 if (mod == 3) {
2336 if (is_store) {
2337 if (reg != OR_TMP0)
2338 gen_op_mov_TN_reg(ot, 0, reg);
2339 gen_op_mov_reg_T0(ot, rm);
2340 } else {
2341 gen_op_mov_TN_reg(ot, 0, rm);
2342 if (reg != OR_TMP0)
2343 gen_op_mov_reg_T0(ot, reg);
2344 }
2345 } else {
2346 gen_lea_modrm(env, s, modrm, &opreg, &disp);
2347 if (is_store) {
2348 if (reg != OR_TMP0)
2349 gen_op_mov_TN_reg(ot, 0, reg);
2350 gen_op_st_T0_A0(ot + s->mem_index);
2351 } else {
2352 gen_op_ld_T0_A0(ot + s->mem_index);
2353 if (reg != OR_TMP0)
2354 gen_op_mov_reg_T0(ot, reg);
2355 }
2356 }
2357 }
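/* fetch an immediate of size 'ot' (1, 2 or 4 bytes) from the code
   stream and advance s->pc past it */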
2359 static inline uint32_t insn_get(CPUX86State *env, DisasContext *s, int ot)
2360 {
2361 uint32_t ret;
2363 switch(ot) {
2364 case OT_BYTE:
2365 ret = cpu_ldub_code(env, s->pc);
2366 s->pc++;
2367 break;
2368 case OT_WORD:
2369 ret = cpu_lduw_code(env, s->pc);
2370 s->pc += 2;
2371 break;
2372 default:
2373 case OT_LONG:
2374 ret = cpu_ldl_code(env, s->pc);
2375 s->pc += 4;
2376 break;
2377 }
2378 return ret;
2379 }
2381 static inline int insn_const_size(unsigned int ot)
2382 {
2383 if (ot <= OT_LONG)
2384 return 1 << ot;
2385 else
2386 return 4;
2387 }
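/* direct block chaining: tcg_gen_goto_tb() emits a patchable jump slot
   and tcg_gen_exit_tb() returns (tb | tb_num) to the execution loop so
   that the slot can later be linked to the target TB. Chaining is only
   done when the target stays on a page the current TB already spans,
   so that page invalidation also unlinks the chain. */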
2389 static inline void gen_goto_tb(DisasContext *s, int tb_num, target_ulong eip)
2390 {
2391 TranslationBlock *tb;
2392 target_ulong pc;
2394 pc = s->cs_base + eip;
2395 tb = s->tb;
2396 /* NOTE: we handle the case where the TB spans two pages here */
2397 if ((pc & TARGET_PAGE_MASK) == (tb->pc & TARGET_PAGE_MASK) ||
2398 (pc & TARGET_PAGE_MASK) == ((s->pc - 1) & TARGET_PAGE_MASK)) {
2399 /* jump to same page: we can use a direct jump */
2400 tcg_gen_goto_tb(tb_num);
2401 gen_jmp_im(eip);
2402 tcg_gen_exit_tb((tcg_target_long)tb + tb_num);
2403 } else {
2404 /* jump to another page: currently not optimized */
2405 gen_jmp_im(eip);
2406 gen_eob(s);
2407 }
2408 }
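/* conditional jump: when direct block chaining is possible, both the
   taken and the not-taken targets become chained TBs; otherwise eip is
   updated on each path and the block ends */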
2410 static inline void gen_jcc(DisasContext *s, int b,
2411 target_ulong val, target_ulong next_eip)
2412 {
2413 int l1, l2;
2415 if (s->jmp_opt) {
2416 l1 = gen_new_label();
2417 gen_jcc1(s, b, l1);
2419 gen_goto_tb(s, 0, next_eip);
2421 gen_set_label(l1);
2422 gen_goto_tb(s, 1, val);
2423 s->is_jmp = DISAS_TB_JUMP;
2424 } else {
2425 l1 = gen_new_label();
2426 l2 = gen_new_label();
2427 gen_jcc1(s, b, l1);
2429 gen_jmp_im(next_eip);
2430 tcg_gen_br(l2);
2432 gen_set_label(l1);
2433 gen_jmp_im(val);
2434 gen_set_label(l2);
2435 gen_eob(s);
2436 }
2437 }
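/* CMOVcc: load the operand into T0, then select between it and the old
   register value with a movcond on the prepared condition, so no
   branch is generated */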
2439 static void gen_cmovcc1(CPUX86State *env, DisasContext *s, int ot, int b,
2440 int modrm, int reg)
2441 {
2442 CCPrepare cc;
2444 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
2446 cc = gen_prepare_cc(s, b, cpu_T[1]);
2447 if (cc.mask != -1) {
2448 TCGv t0 = tcg_temp_new();
2449 tcg_gen_andi_tl(t0, cc.reg, cc.mask);
2450 cc.reg = t0;
2451 }
2452 if (!cc.use_reg2) {
2453 cc.reg2 = tcg_const_tl(cc.imm);
2454 }
2456 tcg_gen_movcond_tl(cc.cond, cpu_T[0], cc.reg, cc.reg2,
2457 cpu_T[0], cpu_regs[reg]);
2458 gen_op_mov_reg_T0(ot, reg);
2460 if (cc.mask != -1) {
2461 tcg_temp_free(cc.reg);
2462 }
2463 if (!cc.use_reg2) {
2464 tcg_temp_free(cc.reg2);
2465 }
2466 }
2468 static inline void gen_op_movl_T0_seg(int seg_reg)
2469 {
2470 tcg_gen_ld32u_tl(cpu_T[0], cpu_env,
2471 offsetof(CPUX86State,segs[seg_reg].selector));
2472 }
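/* real mode / vm86 segment load: no descriptor or privilege checks,
   the segment base is simply selector << 4 */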
2474 static inline void gen_op_movl_seg_T0_vm(int seg_reg)
2475 {
2476 tcg_gen_andi_tl(cpu_T[0], cpu_T[0], 0xffff);
2477 tcg_gen_st32_tl(cpu_T[0], cpu_env,
2478 offsetof(CPUX86State,segs[seg_reg].selector));
2479 tcg_gen_shli_tl(cpu_T[0], cpu_T[0], 4);
2480 tcg_gen_st_tl(cpu_T[0], cpu_env,
2481 offsetof(CPUX86State,segs[seg_reg].base));
2482 }
2484 /* move T0 to seg_reg and compute if the CPU state may change. Never
2485 call this function with seg_reg == R_CS */
2486 static void gen_movl_seg_T0(DisasContext *s, int seg_reg, target_ulong cur_eip)
2487 {
2488 if (s->pe && !s->vm86) {
2489 /* XXX: optimize by finding processor state dynamically */
2490 gen_update_cc_op(s);
2491 gen_jmp_im(cur_eip);
2492 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
2493 gen_helper_load_seg(cpu_env, tcg_const_i32(seg_reg), cpu_tmp2_i32);
2494 /* abort translation because the addseg value may change or
2495 because ss32 may change. For R_SS, translation must always
2496 stop, since special handling is required to disable hardware
2497 interrupts for the next instruction */
2498 if (seg_reg == R_SS || (s->code32 && seg_reg < R_FS))
2499 s->is_jmp = DISAS_TB_JUMP;
2500 } else {
2501 gen_op_movl_seg_T0_vm(seg_reg);
2502 if (seg_reg == R_SS)
2503 s->is_jmp = DISAS_TB_JUMP;
2504 }
2505 }
2507 static inline int svm_is_rep(int prefixes)
2508 {
2509 return ((prefixes & (PREFIX_REPZ | PREFIX_REPNZ)) ? 8 : 0);
2510 }
2512 static inline void
2513 gen_svm_check_intercept_param(DisasContext *s, target_ulong pc_start,
2514 uint32_t type, uint64_t param)
2515 {
2516 /* no SVM activated; fast case */
2517 if (likely(!(s->flags & HF_SVMI_MASK)))
2518 return;
2519 gen_update_cc_op(s);
2520 gen_jmp_im(pc_start - s->cs_base);
2521 gen_helper_svm_check_intercept_param(cpu_env, tcg_const_i32(type),
2522 tcg_const_i64(param));
2523 }
2525 static inline void
2526 gen_svm_check_intercept(DisasContext *s, target_ulong pc_start, uint64_t type)
2527 {
2528 gen_svm_check_intercept_param(s, pc_start, type, 0);
2529 }
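/* add a constant to rSP, using the stack width implied by CODE64/ss32 */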
2531 static inline void gen_stack_update(DisasContext *s, int addend)
2532 {
2533 #ifdef TARGET_X86_64
2534 if (CODE64(s)) {
2535 gen_op_add_reg_im(2, R_ESP, addend);
2536 } else
2537 #endif
2538 if (s->ss32) {
2539 gen_op_add_reg_im(1, R_ESP, addend);
2540 } else {
2541 gen_op_add_reg_im(0, R_ESP, addend);
2542 }
2543 }
2545 /* generate a push. It depends on ss32, addseg and dflag */
2546 static void gen_push_T0(DisasContext *s)
2547 {
2548 #ifdef TARGET_X86_64
2549 if (CODE64(s)) {
2550 gen_op_movq_A0_reg(R_ESP);
2551 if (s->dflag) {
2552 gen_op_addq_A0_im(-8);
2553 gen_op_st_T0_A0(OT_QUAD + s->mem_index);
2554 } else {
2555 gen_op_addq_A0_im(-2);
2556 gen_op_st_T0_A0(OT_WORD + s->mem_index);
2557 }
2558 gen_op_mov_reg_A0(2, R_ESP);
2559 } else
2560 #endif
2561 {
2562 gen_op_movl_A0_reg(R_ESP);
2563 if (!s->dflag)
2564 gen_op_addl_A0_im(-2);
2565 else
2566 gen_op_addl_A0_im(-4);
2567 if (s->ss32) {
2568 if (s->addseg) {
2569 tcg_gen_mov_tl(cpu_T[1], cpu_A0);
2570 gen_op_addl_A0_seg(s, R_SS);
2571 }
2572 } else {
2573 gen_op_andl_A0_ffff();
2574 tcg_gen_mov_tl(cpu_T[1], cpu_A0);
2575 gen_op_addl_A0_seg(s, R_SS);
2576 }
2577 gen_op_st_T0_A0(s->dflag + 1 + s->mem_index);
2578 if (s->ss32 && !s->addseg)
2579 gen_op_mov_reg_A0(1, R_ESP);
2580 else
2581 gen_op_mov_reg_T1(s->ss32 + 1, R_ESP);
2582 }
2583 }
2585 /* generate a push. It depends on ss32, addseg and dflag */
2586 /* slower version for T1, only used for call Ev */
2587 static void gen_push_T1(DisasContext *s)
2588 {
2589 #ifdef TARGET_X86_64
2590 if (CODE64(s)) {
2591 gen_op_movq_A0_reg(R_ESP);
2592 if (s->dflag) {
2593 gen_op_addq_A0_im(-8);
2594 gen_op_st_T1_A0(OT_QUAD + s->mem_index);
2595 } else {
2596 gen_op_addq_A0_im(-2);
2597 gen_op_st_T1_A0(OT_WORD + s->mem_index);
2598 }
2599 gen_op_mov_reg_A0(2, R_ESP);
2600 } else
2601 #endif
2602 {
2603 gen_op_movl_A0_reg(R_ESP);
2604 if (!s->dflag)
2605 gen_op_addl_A0_im(-2);
2606 else
2607 gen_op_addl_A0_im(-4);
2608 if (s->ss32) {
2609 if (s->addseg) {
2610 gen_op_addl_A0_seg(s, R_SS);
2611 }
2612 } else {
2613 gen_op_andl_A0_ffff();
2614 gen_op_addl_A0_seg(s, R_SS);
2615 }
2616 gen_op_st_T1_A0(s->dflag + 1 + s->mem_index);
2618 if (s->ss32 && !s->addseg)
2619 gen_op_mov_reg_A0(1, R_ESP);
2620 else
2621 gen_stack_update(s, (-2) << s->dflag);
2622 }
2623 }
2625 /* two step pop is necessary for precise exceptions */
2626 static void gen_pop_T0(DisasContext *s)
2627 {
2628 #ifdef TARGET_X86_64
2629 if (CODE64(s)) {
2630 gen_op_movq_A0_reg(R_ESP);
2631 gen_op_ld_T0_A0((s->dflag ? OT_QUAD : OT_WORD) + s->mem_index);
2632 } else
2633 #endif
2634 {
2635 gen_op_movl_A0_reg(R_ESP);
2636 if (s->ss32) {
2637 if (s->addseg)
2638 gen_op_addl_A0_seg(s, R_SS);
2639 } else {
2640 gen_op_andl_A0_ffff();
2641 gen_op_addl_A0_seg(s, R_SS);
2642 }
2643 gen_op_ld_T0_A0(s->dflag + 1 + s->mem_index);
2644 }
2645 }
2647 static void gen_pop_update(DisasContext *s)
2648 {
2649 #ifdef TARGET_X86_64
2650 if (CODE64(s) && s->dflag) {
2651 gen_stack_update(s, 8);
2652 } else
2653 #endif
2654 {
2655 gen_stack_update(s, 2 << s->dflag);
2656 }
2657 }
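/* compute the current stack address into A0; the raw, unsegmented
   offset is kept in T1 for a later rSP write-back */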
2659 static void gen_stack_A0(DisasContext *s)
2660 {
2661 gen_op_movl_A0_reg(R_ESP);
2662 if (!s->ss32)
2663 gen_op_andl_A0_ffff();
2664 tcg_gen_mov_tl(cpu_T[1], cpu_A0);
2665 if (s->addseg)
2666 gen_op_addl_A0_seg(s, R_SS);
2667 }
2669 /* NOTE: wrap-around of the 16-bit stack pointer is not fully handled */
2670 static void gen_pusha(DisasContext *s)
2671 {
2672 int i;
2673 gen_op_movl_A0_reg(R_ESP);
2674 gen_op_addl_A0_im(-16 << s->dflag);
2675 if (!s->ss32)
2676 gen_op_andl_A0_ffff();
2677 tcg_gen_mov_tl(cpu_T[1], cpu_A0);
2678 if (s->addseg)
2679 gen_op_addl_A0_seg(s, R_SS);
2680 for(i = 0;i < 8; i++) {
2681 gen_op_mov_TN_reg(OT_LONG, 0, 7 - i);
2682 gen_op_st_T0_A0(OT_WORD + s->dflag + s->mem_index);
2683 gen_op_addl_A0_im(2 << s->dflag);
2684 }
2685 gen_op_mov_reg_T1(OT_WORD + s->ss32, R_ESP);
2686 }
2688 /* NOTE: wrap-around of the 16-bit stack pointer is not fully handled */
2689 static void gen_popa(DisasContext *s)
2690 {
2691 int i;
2692 gen_op_movl_A0_reg(R_ESP);
2693 if (!s->ss32)
2694 gen_op_andl_A0_ffff();
2695 tcg_gen_mov_tl(cpu_T[1], cpu_A0);
2696 tcg_gen_addi_tl(cpu_T[1], cpu_T[1], 16 << s->dflag);
2697 if (s->addseg)
2698 gen_op_addl_A0_seg(s, R_SS);
2699 for(i = 0;i < 8; i++) {
2700 /* ESP is not reloaded */
2701 if (i != 3) {
2702 gen_op_ld_T0_A0(OT_WORD + s->dflag + s->mem_index);
2703 gen_op_mov_reg_T0(OT_WORD + s->dflag, 7 - i);
2704 }
2705 gen_op_addl_A0_im(2 << s->dflag);
2706 }
2707 gen_op_mov_reg_T1(OT_WORD + s->ss32, R_ESP);
2708 }
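/* ENTER: push rBP, copy up to 31 enclosing frame pointers via the
   enter helpers, point rBP at the new frame and allocate esp_addend
   bytes of locals */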
2710 static void gen_enter(DisasContext *s, int esp_addend, int level)
2711 {
2712 int ot, opsize;
2714 level &= 0x1f;
2715 #ifdef TARGET_X86_64
2716 if (CODE64(s)) {
2717 ot = s->dflag ? OT_QUAD : OT_WORD;
2718 opsize = 1 << ot;
2720 gen_op_movl_A0_reg(R_ESP);
2721 gen_op_addq_A0_im(-opsize);
2722 tcg_gen_mov_tl(cpu_T[1], cpu_A0);
2724 /* push bp */
2725 gen_op_mov_TN_reg(OT_LONG, 0, R_EBP);
2726 gen_op_st_T0_A0(ot + s->mem_index);
2727 if (level) {
2728 /* XXX: must save state */
2729 gen_helper_enter64_level(cpu_env, tcg_const_i32(level),
2730 tcg_const_i32((ot == OT_QUAD)),
2731 cpu_T[1]);
2732 }
2733 gen_op_mov_reg_T1(ot, R_EBP);
2734 tcg_gen_addi_tl(cpu_T[1], cpu_T[1], -esp_addend + (-opsize * level));
2735 gen_op_mov_reg_T1(OT_QUAD, R_ESP);
2736 } else
2737 #endif
2738 {
2739 ot = s->dflag + OT_WORD;
2740 opsize = 2 << s->dflag;
2742 gen_op_movl_A0_reg(R_ESP);
2743 gen_op_addl_A0_im(-opsize);
2744 if (!s->ss32)
2745 gen_op_andl_A0_ffff();
2746 tcg_gen_mov_tl(cpu_T[1], cpu_A0);
2747 if (s->addseg)
2748 gen_op_addl_A0_seg(s, R_SS);
2749 /* push bp */
2750 gen_op_mov_TN_reg(OT_LONG, 0, R_EBP);
2751 gen_op_st_T0_A0(ot + s->mem_index);
2752 if (level) {
2753 /* XXX: must save state */
2754 gen_helper_enter_level(cpu_env, tcg_const_i32(level),
2755 tcg_const_i32(s->dflag),
2756 cpu_T[1]);
2757 }
2758 gen_op_mov_reg_T1(ot, R_EBP);
2759 tcg_gen_addi_tl(cpu_T[1], cpu_T[1], -esp_addend + (-opsize * level));
2760 gen_op_mov_reg_T1(OT_WORD + s->ss32, R_ESP);
2761 }
2762 }
2764 static void gen_exception(DisasContext *s, int trapno, target_ulong cur_eip)
2765 {
2766 gen_update_cc_op(s);
2767 gen_jmp_im(cur_eip);
2768 gen_helper_raise_exception(cpu_env, tcg_const_i32(trapno));
2769 s->is_jmp = DISAS_TB_JUMP;
2770 }
2772 /* an interrupt is different from an exception because of the
2773 privilege checks */
2774 static void gen_interrupt(DisasContext *s, int intno,
2775 target_ulong cur_eip, target_ulong next_eip)
2776 {
2777 gen_update_cc_op(s);
2778 gen_jmp_im(cur_eip);
2779 gen_helper_raise_interrupt(cpu_env, tcg_const_i32(intno),
2780 tcg_const_i32(next_eip - cur_eip));
2781 s->is_jmp = DISAS_TB_JUMP;
2782 }
2784 static void gen_debug(DisasContext *s, target_ulong cur_eip)
2785 {
2786 gen_update_cc_op(s);
2787 gen_jmp_im(cur_eip);
2788 gen_helper_debug(cpu_env);
2789 s->is_jmp = DISAS_TB_JUMP;
2790 }
2792 /* generate a generic end of block. A trace exception is also generated
2793 if needed */
2794 static void gen_eob(DisasContext *s)
2795 {
2796 gen_update_cc_op(s);
2797 if (s->tb->flags & HF_INHIBIT_IRQ_MASK) {
2798 gen_helper_reset_inhibit_irq(cpu_env);
2799 }
2800 if (s->tb->flags & HF_RF_MASK) {
2801 gen_helper_reset_rf(cpu_env);
2802 }
2803 if (s->singlestep_enabled) {
2804 gen_helper_debug(cpu_env);
2805 } else if (s->tf) {
2806 gen_helper_single_step(cpu_env);
2807 } else {
2808 tcg_gen_exit_tb(0);
2809 }
2810 s->is_jmp = DISAS_TB_JUMP;
2811 }
2813 /* generate a jump to eip. No segment change must happen before this, as
2814 a direct jump to the next block may occur */
2815 static void gen_jmp_tb(DisasContext *s, target_ulong eip, int tb_num)
2816 {
2817 gen_update_cc_op(s);
2818 set_cc_op(s, CC_OP_DYNAMIC);
2819 if (s->jmp_opt) {
2820 gen_goto_tb(s, tb_num, eip);
2821 s->is_jmp = DISAS_TB_JUMP;
2822 } else {
2823 gen_jmp_im(eip);
2824 gen_eob(s);
2825 }
2826 }
2828 static void gen_jmp(DisasContext *s, target_ulong eip)
2829 {
2830 gen_jmp_tb(s, eip, 0);
2831 }
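/* helpers to move 64/128-bit values between guest memory and
   CPUX86State; (idx >> 2) - 1 recovers the softmmu memory index from
   the encoding kept in s->mem_index */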
2833 static inline void gen_ldq_env_A0(int idx, int offset)
2834 {
2835 int mem_index = (idx >> 2) - 1;
2836 tcg_gen_qemu_ld64(cpu_tmp1_i64, cpu_A0, mem_index);
2837 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, offset);
2838 }
2840 static inline void gen_stq_env_A0(int idx, int offset)
2841 {
2842 int mem_index = (idx >> 2) - 1;
2843 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, offset);
2844 tcg_gen_qemu_st64(cpu_tmp1_i64, cpu_A0, mem_index);
2845 }
2847 static inline void gen_ldo_env_A0(int idx, int offset)
2848 {
2849 int mem_index = (idx >> 2) - 1;
2850 tcg_gen_qemu_ld64(cpu_tmp1_i64, cpu_A0, mem_index);
2851 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, offset + offsetof(XMMReg, XMM_Q(0)));
2852 tcg_gen_addi_tl(cpu_tmp0, cpu_A0, 8);
2853 tcg_gen_qemu_ld64(cpu_tmp1_i64, cpu_tmp0, mem_index);
2854 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, offset + offsetof(XMMReg, XMM_Q(1)));
2855 }
2857 static inline void gen_sto_env_A0(int idx, int offset)
2858 {
2859 int mem_index = (idx >> 2) - 1;
2860 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, offset + offsetof(XMMReg, XMM_Q(0)));
2861 tcg_gen_qemu_st64(cpu_tmp1_i64, cpu_A0, mem_index);
2862 tcg_gen_addi_tl(cpu_tmp0, cpu_A0, 8);
2863 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, offset + offsetof(XMMReg, XMM_Q(1)));
2864 tcg_gen_qemu_st64(cpu_tmp1_i64, cpu_tmp0, mem_index);
2865 }
2867 static inline void gen_op_movo(int d_offset, int s_offset)
2868 {
2869 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, s_offset);
2870 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, d_offset);
2871 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, s_offset + 8);
2872 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, d_offset + 8);
2873 }
2875 static inline void gen_op_movq(int d_offset, int s_offset)
2876 {
2877 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, s_offset);
2878 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, d_offset);
2879 }
2881 static inline void gen_op_movl(int d_offset, int s_offset)
2882 {
2883 tcg_gen_ld_i32(cpu_tmp2_i32, cpu_env, s_offset);
2884 tcg_gen_st_i32(cpu_tmp2_i32, cpu_env, d_offset);
2885 }
2887 static inline void gen_op_movq_env_0(int d_offset)
2888 {
2889 tcg_gen_movi_i64(cpu_tmp1_i64, 0);
2890 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, d_offset);
2891 }
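/* the SSEFunc typedef names encode the signature: the first letter is
   the return kind (0 = void, i = i32, l = i64), the remaining letters
   the arguments (e = cpu_env, p = vector register pointer, i/l =
   32/64-bit value, t = target-width value) */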
2893 typedef void (*SSEFunc_i_ep)(TCGv_i32 val, TCGv_ptr env, TCGv_ptr reg);
2894 typedef void (*SSEFunc_l_ep)(TCGv_i64 val, TCGv_ptr env, TCGv_ptr reg);
2895 typedef void (*SSEFunc_0_epi)(TCGv_ptr env, TCGv_ptr reg, TCGv_i32 val);
2896 typedef void (*SSEFunc_0_epl)(TCGv_ptr env, TCGv_ptr reg, TCGv_i64 val);
2897 typedef void (*SSEFunc_0_epp)(TCGv_ptr env, TCGv_ptr reg_a, TCGv_ptr reg_b);
2898 typedef void (*SSEFunc_0_eppi)(TCGv_ptr env, TCGv_ptr reg_a, TCGv_ptr reg_b,
2899 TCGv_i32 val);
2900 typedef void (*SSEFunc_0_ppi)(TCGv_ptr reg_a, TCGv_ptr reg_b, TCGv_i32 val);
2901 typedef void (*SSEFunc_0_eppt)(TCGv_ptr env, TCGv_ptr reg_a, TCGv_ptr reg_b,
2902 TCGv val);
2904 #define SSE_SPECIAL ((void *)1)
2905 #define SSE_DUMMY ((void *)2)
2907 #define MMX_OP2(x) { gen_helper_ ## x ## _mmx, gen_helper_ ## x ## _xmm }
2908 #define SSE_FOP(x) { gen_helper_ ## x ## ps, gen_helper_ ## x ## pd, \
2909 gen_helper_ ## x ## ss, gen_helper_ ## x ## sd, }
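/* first opcode map (0f xx), indexed by the opcode byte and the
   mandatory prefix: b1 = 0 (none), 1 (66), 2 (F3), 3 (F2). For
   example, 66 0f 58 selects sse_op_table1[0x58][1], i.e.
   gen_helper_addpd. SSE_SPECIAL entries are decoded by hand below;
   SSE_DUMMY entries are placeholders whose real handling happens
   elsewhere (emms/femms/3DNow!). */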
2911 static const SSEFunc_0_epp sse_op_table1[256][4] = {
2912 /* 3DNow! extensions */
2913 [0x0e] = { SSE_DUMMY }, /* femms */
2914 [0x0f] = { SSE_DUMMY }, /* pf... */
2915 /* pure SSE operations */
2916 [0x10] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movups, movupd, movss, movsd */
2917 [0x11] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movups, movupd, movss, movsd */
2918 [0x12] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movlps, movlpd, movsldup, movddup */
2919 [0x13] = { SSE_SPECIAL, SSE_SPECIAL }, /* movlps, movlpd */
2920 [0x14] = { gen_helper_punpckldq_xmm, gen_helper_punpcklqdq_xmm },
2921 [0x15] = { gen_helper_punpckhdq_xmm, gen_helper_punpckhqdq_xmm },
2922 [0x16] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movhps, movhpd, movshdup */
2923 [0x17] = { SSE_SPECIAL, SSE_SPECIAL }, /* movhps, movhpd */
2925 [0x28] = { SSE_SPECIAL, SSE_SPECIAL }, /* movaps, movapd */
2926 [0x29] = { SSE_SPECIAL, SSE_SPECIAL }, /* movaps, movapd */
2927 [0x2a] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* cvtpi2ps, cvtpi2pd, cvtsi2ss, cvtsi2sd */
2928 [0x2b] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movntps, movntpd, movntss, movntsd */
2929 [0x2c] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* cvttps2pi, cvttpd2pi, cvttsd2si, cvttss2si */
2930 [0x2d] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* cvtps2pi, cvtpd2pi, cvtsd2si, cvtss2si */
2931 [0x2e] = { gen_helper_ucomiss, gen_helper_ucomisd },
2932 [0x2f] = { gen_helper_comiss, gen_helper_comisd },
2933 [0x50] = { SSE_SPECIAL, SSE_SPECIAL }, /* movmskps, movmskpd */
2934 [0x51] = SSE_FOP(sqrt),
2935 [0x52] = { gen_helper_rsqrtps, NULL, gen_helper_rsqrtss, NULL },
2936 [0x53] = { gen_helper_rcpps, NULL, gen_helper_rcpss, NULL },
2937 [0x54] = { gen_helper_pand_xmm, gen_helper_pand_xmm }, /* andps, andpd */
2938 [0x55] = { gen_helper_pandn_xmm, gen_helper_pandn_xmm }, /* andnps, andnpd */
2939 [0x56] = { gen_helper_por_xmm, gen_helper_por_xmm }, /* orps, orpd */
2940 [0x57] = { gen_helper_pxor_xmm, gen_helper_pxor_xmm }, /* xorps, xorpd */
2941 [0x58] = SSE_FOP(add),
2942 [0x59] = SSE_FOP(mul),
2943 [0x5a] = { gen_helper_cvtps2pd, gen_helper_cvtpd2ps,
2944 gen_helper_cvtss2sd, gen_helper_cvtsd2ss },
2945 [0x5b] = { gen_helper_cvtdq2ps, gen_helper_cvtps2dq, gen_helper_cvttps2dq },
2946 [0x5c] = SSE_FOP(sub),
2947 [0x5d] = SSE_FOP(min),
2948 [0x5e] = SSE_FOP(div),
2949 [0x5f] = SSE_FOP(max),
2951 [0xc2] = SSE_FOP(cmpeq),
2952 [0xc6] = { (SSEFunc_0_epp)gen_helper_shufps,
2953 (SSEFunc_0_epp)gen_helper_shufpd }, /* XXX: casts */
2955 [0x38] = { SSE_SPECIAL, SSE_SPECIAL, NULL, SSE_SPECIAL }, /* SSSE3/SSE4 */
2956 [0x3a] = { SSE_SPECIAL, SSE_SPECIAL }, /* SSSE3/SSE4 */
2958 /* MMX ops and their SSE extensions */
2959 [0x60] = MMX_OP2(punpcklbw),
2960 [0x61] = MMX_OP2(punpcklwd),
2961 [0x62] = MMX_OP2(punpckldq),
2962 [0x63] = MMX_OP2(packsswb),
2963 [0x64] = MMX_OP2(pcmpgtb),
2964 [0x65] = MMX_OP2(pcmpgtw),
2965 [0x66] = MMX_OP2(pcmpgtl),
2966 [0x67] = MMX_OP2(packuswb),
2967 [0x68] = MMX_OP2(punpckhbw),
2968 [0x69] = MMX_OP2(punpckhwd),
2969 [0x6a] = MMX_OP2(punpckhdq),
2970 [0x6b] = MMX_OP2(packssdw),
2971 [0x6c] = { NULL, gen_helper_punpcklqdq_xmm },
2972 [0x6d] = { NULL, gen_helper_punpckhqdq_xmm },
2973 [0x6e] = { SSE_SPECIAL, SSE_SPECIAL }, /* movd mm, ea */
2974 [0x6f] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movq, movdqa, movdqu */
2975 [0x70] = { (SSEFunc_0_epp)gen_helper_pshufw_mmx,
2976 (SSEFunc_0_epp)gen_helper_pshufd_xmm,
2977 (SSEFunc_0_epp)gen_helper_pshufhw_xmm,
2978 (SSEFunc_0_epp)gen_helper_pshuflw_xmm }, /* XXX: casts */
2979 [0x71] = { SSE_SPECIAL, SSE_SPECIAL }, /* shiftw */
2980 [0x72] = { SSE_SPECIAL, SSE_SPECIAL }, /* shiftd */
2981 [0x73] = { SSE_SPECIAL, SSE_SPECIAL }, /* shiftq */
2982 [0x74] = MMX_OP2(pcmpeqb),
2983 [0x75] = MMX_OP2(pcmpeqw),
2984 [0x76] = MMX_OP2(pcmpeql),
2985 [0x77] = { SSE_DUMMY }, /* emms */
2986 [0x78] = { NULL, SSE_SPECIAL, NULL, SSE_SPECIAL }, /* extrq_i, insertq_i */
2987 [0x79] = { NULL, gen_helper_extrq_r, NULL, gen_helper_insertq_r },
2988 [0x7c] = { NULL, gen_helper_haddpd, NULL, gen_helper_haddps },
2989 [0x7d] = { NULL, gen_helper_hsubpd, NULL, gen_helper_hsubps },
2990 [0x7e] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movd, movd, movq */
2991 [0x7f] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movq, movdqa, movdqu */
2992 [0xc4] = { SSE_SPECIAL, SSE_SPECIAL }, /* pinsrw */
2993 [0xc5] = { SSE_SPECIAL, SSE_SPECIAL }, /* pextrw */
2994 [0xd0] = { NULL, gen_helper_addsubpd, NULL, gen_helper_addsubps },
2995 [0xd1] = MMX_OP2(psrlw),
2996 [0xd2] = MMX_OP2(psrld),
2997 [0xd3] = MMX_OP2(psrlq),
2998 [0xd4] = MMX_OP2(paddq),
2999 [0xd5] = MMX_OP2(pmullw),
3000 [0xd6] = { NULL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL },
3001 [0xd7] = { SSE_SPECIAL, SSE_SPECIAL }, /* pmovmskb */
3002 [0xd8] = MMX_OP2(psubusb),
3003 [0xd9] = MMX_OP2(psubusw),
3004 [0xda] = MMX_OP2(pminub),
3005 [0xdb] = MMX_OP2(pand),
3006 [0xdc] = MMX_OP2(paddusb),
3007 [0xdd] = MMX_OP2(paddusw),
3008 [0xde] = MMX_OP2(pmaxub),
3009 [0xdf] = MMX_OP2(pandn),
3010 [0xe0] = MMX_OP2(pavgb),
3011 [0xe1] = MMX_OP2(psraw),
3012 [0xe2] = MMX_OP2(psrad),
3013 [0xe3] = MMX_OP2(pavgw),
3014 [0xe4] = MMX_OP2(pmulhuw),
3015 [0xe5] = MMX_OP2(pmulhw),
3016 [0xe6] = { NULL, gen_helper_cvttpd2dq, gen_helper_cvtdq2pd, gen_helper_cvtpd2dq },
3017 [0xe7] = { SSE_SPECIAL, SSE_SPECIAL }, /* movntq, movntdq */
3018 [0xe8] = MMX_OP2(psubsb),
3019 [0xe9] = MMX_OP2(psubsw),
3020 [0xea] = MMX_OP2(pminsw),
3021 [0xeb] = MMX_OP2(por),
3022 [0xec] = MMX_OP2(paddsb),
3023 [0xed] = MMX_OP2(paddsw),
3024 [0xee] = MMX_OP2(pmaxsw),
3025 [0xef] = MMX_OP2(pxor),
3026 [0xf0] = { NULL, NULL, NULL, SSE_SPECIAL }, /* lddqu */
3027 [0xf1] = MMX_OP2(psllw),
3028 [0xf2] = MMX_OP2(pslld),
3029 [0xf3] = MMX_OP2(psllq),
3030 [0xf4] = MMX_OP2(pmuludq),
3031 [0xf5] = MMX_OP2(pmaddwd),
3032 [0xf6] = MMX_OP2(psadbw),
3033 [0xf7] = { (SSEFunc_0_epp)gen_helper_maskmov_mmx,
3034 (SSEFunc_0_epp)gen_helper_maskmov_xmm }, /* XXX: casts */
3035 [0xf8] = MMX_OP2(psubb),
3036 [0xf9] = MMX_OP2(psubw),
3037 [0xfa] = MMX_OP2(psubl),
3038 [0xfb] = MMX_OP2(psubq),
3039 [0xfc] = MMX_OP2(paddb),
3040 [0xfd] = MMX_OP2(paddw),
3041 [0xfe] = MMX_OP2(paddl),
3042 };
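/* immediate-form vector shifts (0f 71/72/73): row = group * 8 + the
   modrm reg field, with groups 0/1/2 for word/dword/qword shifts;
   the column selects the MMX or XMM variant */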
3044 static const SSEFunc_0_epp sse_op_table2[3 * 8][2] = {
3045 [0 + 2] = MMX_OP2(psrlw),
3046 [0 + 4] = MMX_OP2(psraw),
3047 [0 + 6] = MMX_OP2(psllw),
3048 [8 + 2] = MMX_OP2(psrld),
3049 [8 + 4] = MMX_OP2(psrad),
3050 [8 + 6] = MMX_OP2(pslld),
3051 [16 + 2] = MMX_OP2(psrlq),
3052 [16 + 3] = { NULL, gen_helper_psrldq_xmm },
3053 [16 + 6] = MMX_OP2(psllq),
3054 [16 + 7] = { NULL, gen_helper_pslldq_xmm },
3055 };
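/* scalar integer <-> float conversions: table3a converts from
   integers (cvtsi2ss/sd), table3b to integers (cvt(t)ss/sd2si); the
   'q' tables are the 64-bit integer variants */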
3057 static const SSEFunc_0_epi sse_op_table3ai[] = {
3058 gen_helper_cvtsi2ss,
3059 gen_helper_cvtsi2sd
3060 };
3062 #ifdef TARGET_X86_64
3063 static const SSEFunc_0_epl sse_op_table3aq[] = {
3064 gen_helper_cvtsq2ss,
3065 gen_helper_cvtsq2sd
3066 };
3067 #endif
3069 static const SSEFunc_i_ep sse_op_table3bi[] = {
3070 gen_helper_cvttss2si,
3071 gen_helper_cvtss2si,
3072 gen_helper_cvttsd2si,
3073 gen_helper_cvtsd2si
3074 };
3076 #ifdef TARGET_X86_64
3077 static const SSEFunc_l_ep sse_op_table3bq[] = {
3078 gen_helper_cvttss2sq,
3079 gen_helper_cvtss2sq,
3080 gen_helper_cvttsd2sq,
3081 gen_helper_cvtsd2sq
3082 };
3083 #endif
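/* CMPccPS/PD/SS/SD predicates, indexed by the immediate byte:
   0 = eq, 1 = lt, 2 = le, 3 = unord, 4 = neq, 5 = nlt, 6 = nle,
   7 = ord */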
3085 static const SSEFunc_0_epp sse_op_table4[8][4] = {
3086 SSE_FOP(cmpeq),
3087 SSE_FOP(cmplt),
3088 SSE_FOP(cmple),
3089 SSE_FOP(cmpunord),
3090 SSE_FOP(cmpneq),
3091 SSE_FOP(cmpnlt),
3092 SSE_FOP(cmpnle),
3093 SSE_FOP(cmpord),
3094 };
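/* 3DNow! operations, dispatched on the one-byte opcode suffix that
   follows the operands */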
3096 static const SSEFunc_0_epp sse_op_table5[256] = {
3097 [0x0c] = gen_helper_pi2fw,
3098 [0x0d] = gen_helper_pi2fd,
3099 [0x1c] = gen_helper_pf2iw,
3100 [0x1d] = gen_helper_pf2id,
3101 [0x8a] = gen_helper_pfnacc,
3102 [0x8e] = gen_helper_pfpnacc,
3103 [0x90] = gen_helper_pfcmpge,
3104 [0x94] = gen_helper_pfmin,
3105 [0x96] = gen_helper_pfrcp,
3106 [0x97] = gen_helper_pfrsqrt,
3107 [0x9a] = gen_helper_pfsub,
3108 [0x9e] = gen_helper_pfadd,
3109 [0xa0] = gen_helper_pfcmpgt,
3110 [0xa4] = gen_helper_pfmax,
3111 [0xa6] = gen_helper_movq, /* pfrcpit1; no need to actually increase precision */
3112 [0xa7] = gen_helper_movq, /* pfrsqit1 */
3113 [0xaa] = gen_helper_pfsubr,
3114 [0xae] = gen_helper_pfacc,
3115 [0xb0] = gen_helper_pfcmpeq,
3116 [0xb4] = gen_helper_pfmul,
3117 [0xb6] = gen_helper_movq, /* pfrcpit2 */
3118 [0xb7] = gen_helper_pmulhrw_mmx,
3119 [0xbb] = gen_helper_pswapd,
3120 [0xbf] = gen_helper_pavgb_mmx /* pavgusb */
3121 };
3123 struct SSEOpHelper_epp {
3124 SSEFunc_0_epp op[2];
3125 uint32_t ext_mask;
3126 };
3128 struct SSEOpHelper_eppi {
3129 SSEFunc_0_eppi op[2];
3130 uint32_t ext_mask;
3131 };
3133 #define SSSE3_OP(x) { MMX_OP2(x), CPUID_EXT_SSSE3 }
3134 #define SSE41_OP(x) { { NULL, gen_helper_ ## x ## _xmm }, CPUID_EXT_SSE41 }
3135 #define SSE42_OP(x) { { NULL, gen_helper_ ## x ## _xmm }, CPUID_EXT_SSE42 }
3136 #define SSE41_SPECIAL { { NULL, SSE_SPECIAL }, CPUID_EXT_SSE41 }
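/* three-byte opcode maps: sse_op_table6 for 0f 38 and sse_op_table7
   for 0f 3a (which also takes an immediate byte); ext_mask gives the
   CPUID feature bit that must be present */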
3138 static const struct SSEOpHelper_epp sse_op_table6[256] = {
3139 [0x00] = SSSE3_OP(pshufb),
3140 [0x01] = SSSE3_OP(phaddw),
3141 [0x02] = SSSE3_OP(phaddd),
3142 [0x03] = SSSE3_OP(phaddsw),
3143 [0x04] = SSSE3_OP(pmaddubsw),
3144 [0x05] = SSSE3_OP(phsubw),
3145 [0x06] = SSSE3_OP(phsubd),
3146 [0x07] = SSSE3_OP(phsubsw),
3147 [0x08] = SSSE3_OP(psignb),
3148 [0x09] = SSSE3_OP(psignw),
3149 [0x0a] = SSSE3_OP(psignd),
3150 [0x0b] = SSSE3_OP(pmulhrsw),
3151 [0x10] = SSE41_OP(pblendvb),
3152 [0x14] = SSE41_OP(blendvps),
3153 [0x15] = SSE41_OP(blendvpd),
3154 [0x17] = SSE41_OP(ptest),
3155 [0x1c] = SSSE3_OP(pabsb),
3156 [0x1d] = SSSE3_OP(pabsw),
3157 [0x1e] = SSSE3_OP(pabsd),
3158 [0x20] = SSE41_OP(pmovsxbw),
3159 [0x21] = SSE41_OP(pmovsxbd),
3160 [0x22] = SSE41_OP(pmovsxbq),
3161 [0x23] = SSE41_OP(pmovsxwd),
3162 [0x24] = SSE41_OP(pmovsxwq),
3163 [0x25] = SSE41_OP(pmovsxdq),
3164 [0x28] = SSE41_OP(pmuldq),
3165 [0x29] = SSE41_OP(pcmpeqq),
3166 [0x2a] = SSE41_SPECIAL, /* movntdqa */
3167 [0x2b] = SSE41_OP(packusdw),
3168 [0x30] = SSE41_OP(pmovzxbw),
3169 [0x31] = SSE41_OP(pmovzxbd),
3170 [0x32] = SSE41_OP(pmovzxbq),
3171 [0x33] = SSE41_OP(pmovzxwd),
3172 [0x34] = SSE41_OP(pmovzxwq),
3173 [0x35] = SSE41_OP(pmovzxdq),
3174 [0x37] = SSE42_OP(pcmpgtq),
3175 [0x38] = SSE41_OP(pminsb),
3176 [0x39] = SSE41_OP(pminsd),
3177 [0x3a] = SSE41_OP(pminuw),
3178 [0x3b] = SSE41_OP(pminud),
3179 [0x3c] = SSE41_OP(pmaxsb),
3180 [0x3d] = SSE41_OP(pmaxsd),
3181 [0x3e] = SSE41_OP(pmaxuw),
3182 [0x3f] = SSE41_OP(pmaxud),
3183 [0x40] = SSE41_OP(pmulld),
3184 [0x41] = SSE41_OP(phminposuw),
3185 };
3187 static const struct SSEOpHelper_eppi sse_op_table7[256] = {
3188 [0x08] = SSE41_OP(roundps),
3189 [0x09] = SSE41_OP(roundpd),
3190 [0x0a] = SSE41_OP(roundss),
3191 [0x0b] = SSE41_OP(roundsd),
3192 [0x0c] = SSE41_OP(blendps),
3193 [0x0d] = SSE41_OP(blendpd),
3194 [0x0e] = SSE41_OP(pblendw),
3195 [0x0f] = SSSE3_OP(palignr),
3196 [0x14] = SSE41_SPECIAL, /* pextrb */
3197 [0x15] = SSE41_SPECIAL, /* pextrw */
3198 [0x16] = SSE41_SPECIAL, /* pextrd/pextrq */
3199 [0x17] = SSE41_SPECIAL, /* extractps */
3200 [0x20] = SSE41_SPECIAL, /* pinsrb */
3201 [0x21] = SSE41_SPECIAL, /* insertps */
3202 [0x22] = SSE41_SPECIAL, /* pinsrd/pinsrq */
3203 [0x40] = SSE41_OP(dpps),
3204 [0x41] = SSE41_OP(dppd),
3205 [0x42] = SSE41_OP(mpsadbw),
3206 [0x60] = SSE42_OP(pcmpestrm),
3207 [0x61] = SSE42_OP(pcmpestri),
3208 [0x62] = SSE42_OP(pcmpistrm),
3209 [0x63] = SSE42_OP(pcmpistri),
3210 };
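/* decode and generate code for one MMX/SSE/SSE2+ instruction; b is the
   second opcode byte (0f xx), rex_r the REX.R extension for the modrm
   reg field */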
3212 static void gen_sse(CPUX86State *env, DisasContext *s, int b,
3213 target_ulong pc_start, int rex_r)
3214 {
3215 int b1, op1_offset, op2_offset, is_xmm, val, ot;
3216 int modrm, mod, rm, reg, reg_addr, offset_addr;
3217 SSEFunc_0_epp sse_fn_epp;
3218 SSEFunc_0_eppi sse_fn_eppi;
3219 SSEFunc_0_ppi sse_fn_ppi;
3220 SSEFunc_0_eppt sse_fn_eppt;
3222 b &= 0xff;
3223 if (s->prefix & PREFIX_DATA)
3224 b1 = 1;
3225 else if (s->prefix & PREFIX_REPZ)
3226 b1 = 2;
3227 else if (s->prefix & PREFIX_REPNZ)
3228 b1 = 3;
3229 else
3230 b1 = 0;
3231 sse_fn_epp = sse_op_table1[b][b1];
3232 if (!sse_fn_epp) {
3233 goto illegal_op;
3235 if ((b <= 0x5f && b >= 0x10) || b == 0xc6 || b == 0xc2) {
3236 is_xmm = 1;
3237 } else {
3238 if (b1 == 0) {
3239 /* MMX case */
3240 is_xmm = 0;
3241 } else {
3242 is_xmm = 1;
3245 /* simple MMX/SSE operation */
3246 if (s->flags & HF_TS_MASK) {
3247 gen_exception(s, EXCP07_PREX, pc_start - s->cs_base);
3248 return;
3250 if (s->flags & HF_EM_MASK) {
3251 illegal_op:
3252 gen_exception(s, EXCP06_ILLOP, pc_start - s->cs_base);
3253 return;
3255 if (is_xmm && !(s->flags & HF_OSFXSR_MASK))
3256 if ((b != 0x38 && b != 0x3a) || (s->prefix & PREFIX_DATA))
3257 goto illegal_op;
3258 if (b == 0x0e) {
3259 if (!(s->cpuid_ext2_features & CPUID_EXT2_3DNOW))
3260 goto illegal_op;
3261 /* femms */
3262 gen_helper_emms(cpu_env);
3263 return;
3265 if (b == 0x77) {
3266 /* emms */
3267 gen_helper_emms(cpu_env);
3268 return;
3270 /* prepare MMX state (XXX: optimize by storing fptt and fptags in
3271 the static cpu state) */
3272 if (!is_xmm) {
3273 gen_helper_enter_mmx(cpu_env);
3276 modrm = cpu_ldub_code(env, s->pc++);
3277 reg = ((modrm >> 3) & 7);
3278 if (is_xmm)
3279 reg |= rex_r;
3280 mod = (modrm >> 6) & 3;
3281 if (sse_fn_epp == SSE_SPECIAL) {
3282 b |= (b1 << 8);
3283 switch(b) {
3284 case 0x0e7: /* movntq */
3285 if (mod == 3)
3286 goto illegal_op;
3287 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3288 gen_stq_env_A0(s->mem_index, offsetof(CPUX86State,fpregs[reg].mmx));
3289 break;
3290 case 0x1e7: /* movntdq */
3291 case 0x02b: /* movntps */
3292 case 0x12b: /* movntpd */
3293 if (mod == 3)
3294 goto illegal_op;
3295 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3296 gen_sto_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg]));
3297 break;
3298 case 0x3f0: /* lddqu */
3299 if (mod == 3)
3300 goto illegal_op;
3301 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3302 gen_ldo_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg]));
3303 break;
3304 case 0x22b: /* movntss */
3305 case 0x32b: /* movntsd */
3306 if (mod == 3)
3307 goto illegal_op;
3308 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3309 if (b1 & 1) {
3310 gen_stq_env_A0(s->mem_index, offsetof(CPUX86State,
3311 xmm_regs[reg]));
3312 } else {
3313 tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,
3314 xmm_regs[reg].XMM_L(0)));
3315 gen_op_st_T0_A0(OT_LONG + s->mem_index);
3317 break;
3318 case 0x6e: /* movd mm, ea */
3319 #ifdef TARGET_X86_64
3320 if (s->dflag == 2) {
3321 gen_ldst_modrm(env, s, modrm, OT_QUAD, OR_TMP0, 0);
3322 tcg_gen_st_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,fpregs[reg].mmx));
3323 } else
3324 #endif
3326 gen_ldst_modrm(env, s, modrm, OT_LONG, OR_TMP0, 0);
3327 tcg_gen_addi_ptr(cpu_ptr0, cpu_env,
3328 offsetof(CPUX86State,fpregs[reg].mmx));
3329 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
3330 gen_helper_movl_mm_T0_mmx(cpu_ptr0, cpu_tmp2_i32);
3332 break;
3333 case 0x16e: /* movd xmm, ea */
3334 #ifdef TARGET_X86_64
3335 if (s->dflag == 2) {
3336 gen_ldst_modrm(env, s, modrm, OT_QUAD, OR_TMP0, 0);
3337 tcg_gen_addi_ptr(cpu_ptr0, cpu_env,
3338 offsetof(CPUX86State,xmm_regs[reg]));
3339 gen_helper_movq_mm_T0_xmm(cpu_ptr0, cpu_T[0]);
3340 } else
3341 #endif
3343 gen_ldst_modrm(env, s, modrm, OT_LONG, OR_TMP0, 0);
3344 tcg_gen_addi_ptr(cpu_ptr0, cpu_env,
3345 offsetof(CPUX86State,xmm_regs[reg]));
3346 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
3347 gen_helper_movl_mm_T0_xmm(cpu_ptr0, cpu_tmp2_i32);
3349 break;
3350 case 0x6f: /* movq mm, ea */
3351 if (mod != 3) {
3352 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3353 gen_ldq_env_A0(s->mem_index, offsetof(CPUX86State,fpregs[reg].mmx));
3354 } else {
3355 rm = (modrm & 7);
3356 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env,
3357 offsetof(CPUX86State,fpregs[rm].mmx));
3358 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env,
3359 offsetof(CPUX86State,fpregs[reg].mmx));
3361 break;
3362 case 0x010: /* movups */
3363 case 0x110: /* movupd */
3364 case 0x028: /* movaps */
3365 case 0x128: /* movapd */
3366 case 0x16f: /* movdqa xmm, ea */
3367 case 0x26f: /* movdqu xmm, ea */
3368 if (mod != 3) {
3369 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3370 gen_ldo_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg]));
3371 } else {
3372 rm = (modrm & 7) | REX_B(s);
3373 gen_op_movo(offsetof(CPUX86State,xmm_regs[reg]),
3374 offsetof(CPUX86State,xmm_regs[rm]));
3376 break;
3377 case 0x210: /* movss xmm, ea */
3378 if (mod != 3) {
3379 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3380 gen_op_ld_T0_A0(OT_LONG + s->mem_index);
3381 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(0)));
3382 gen_op_movl_T0_0();
3383 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(1)));
3384 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(2)));
3385 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(3)));
3386 } else {
3387 rm = (modrm & 7) | REX_B(s);
3388 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(0)),
3389 offsetof(CPUX86State,xmm_regs[rm].XMM_L(0)));
3391 break;
3392 case 0x310: /* movsd xmm, ea */
3393 if (mod != 3) {
3394 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3395 gen_ldq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3396 gen_op_movl_T0_0();
3397 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(2)));
3398 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(3)));
3399 } else {
3400 rm = (modrm & 7) | REX_B(s);
3401 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)),
3402 offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0)));
3404 break;
3405 case 0x012: /* movlps */
3406 case 0x112: /* movlpd */
3407 if (mod != 3) {
3408 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3409 gen_ldq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3410 } else {
3411 /* movhlps */
3412 rm = (modrm & 7) | REX_B(s);
3413 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)),
3414 offsetof(CPUX86State,xmm_regs[rm].XMM_Q(1)));
3416 break;
3417 case 0x212: /* movsldup */
3418 if (mod != 3) {
3419 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3420 gen_ldo_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg]));
3421 } else {
3422 rm = (modrm & 7) | REX_B(s);
3423 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(0)),
3424 offsetof(CPUX86State,xmm_regs[rm].XMM_L(0)));
3425 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(2)),
3426 offsetof(CPUX86State,xmm_regs[rm].XMM_L(2)));
3428 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(1)),
3429 offsetof(CPUX86State,xmm_regs[reg].XMM_L(0)));
3430 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(3)),
3431 offsetof(CPUX86State,xmm_regs[reg].XMM_L(2)));
3432 break;
3433 case 0x312: /* movddup */
3434 if (mod != 3) {
3435 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3436 gen_ldq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3437 } else {
3438 rm = (modrm & 7) | REX_B(s);
3439 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)),
3440 offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0)));
3442 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(1)),
3443 offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3444 break;
3445 case 0x016: /* movhps */
3446 case 0x116: /* movhpd */
3447 if (mod != 3) {
3448 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3449 gen_ldq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg].XMM_Q(1)));
3450 } else {
3451 /* movlhps */
3452 rm = (modrm & 7) | REX_B(s);
3453 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(1)),
3454 offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0)));
3456 break;
3457 case 0x216: /* movshdup */
3458 if (mod != 3) {
3459 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3460 gen_ldo_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg]));
3461 } else {
3462 rm = (modrm & 7) | REX_B(s);
3463 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(1)),
3464 offsetof(CPUX86State,xmm_regs[rm].XMM_L(1)));
3465 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(3)),
3466 offsetof(CPUX86State,xmm_regs[rm].XMM_L(3)));
3468 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(0)),
3469 offsetof(CPUX86State,xmm_regs[reg].XMM_L(1)));
3470 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(2)),
3471 offsetof(CPUX86State,xmm_regs[reg].XMM_L(3)));
3472 break;
3473 case 0x178:
3474 case 0x378:
3476 int bit_index, field_length;
3478 if (b1 == 1 && reg != 0)
3479 goto illegal_op;
3480 field_length = cpu_ldub_code(env, s->pc++) & 0x3F;
3481 bit_index = cpu_ldub_code(env, s->pc++) & 0x3F;
3482 tcg_gen_addi_ptr(cpu_ptr0, cpu_env,
3483 offsetof(CPUX86State,xmm_regs[reg]));
3484 if (b1 == 1)
3485 gen_helper_extrq_i(cpu_env, cpu_ptr0,
3486 tcg_const_i32(bit_index),
3487 tcg_const_i32(field_length));
3488 else
3489 gen_helper_insertq_i(cpu_env, cpu_ptr0,
3490 tcg_const_i32(bit_index),
3491 tcg_const_i32(field_length));
3493 break;
3494 case 0x7e: /* movd ea, mm */
3495 #ifdef TARGET_X86_64
3496 if (s->dflag == 2) {
3497 tcg_gen_ld_i64(cpu_T[0], cpu_env,
3498 offsetof(CPUX86State,fpregs[reg].mmx));
3499 gen_ldst_modrm(env, s, modrm, OT_QUAD, OR_TMP0, 1);
3500 } else
3501 #endif
3503 tcg_gen_ld32u_tl(cpu_T[0], cpu_env,
3504 offsetof(CPUX86State,fpregs[reg].mmx.MMX_L(0)));
3505 gen_ldst_modrm(env, s, modrm, OT_LONG, OR_TMP0, 1);
3507 break;
3508 case 0x17e: /* movd ea, xmm */
3509 #ifdef TARGET_X86_64
3510 if (s->dflag == 2) {
3511 tcg_gen_ld_i64(cpu_T[0], cpu_env,
3512 offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3513 gen_ldst_modrm(env, s, modrm, OT_QUAD, OR_TMP0, 1);
3514 } else
3515 #endif
3517 tcg_gen_ld32u_tl(cpu_T[0], cpu_env,
3518 offsetof(CPUX86State,xmm_regs[reg].XMM_L(0)));
3519 gen_ldst_modrm(env, s, modrm, OT_LONG, OR_TMP0, 1);
3521 break;
3522 case 0x27e: /* movq xmm, ea */
3523 if (mod != 3) {
3524 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3525 gen_ldq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3526 } else {
3527 rm = (modrm & 7) | REX_B(s);
3528 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)),
3529 offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0)));
3531 gen_op_movq_env_0(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(1)));
3532 break;
3533 case 0x7f: /* movq ea, mm */
3534 if (mod != 3) {
3535 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3536 gen_stq_env_A0(s->mem_index, offsetof(CPUX86State,fpregs[reg].mmx));
3537 } else {
3538 rm = (modrm & 7);
3539 gen_op_movq(offsetof(CPUX86State,fpregs[rm].mmx),
3540 offsetof(CPUX86State,fpregs[reg].mmx));
3542 break;
3543 case 0x011: /* movups */
3544 case 0x111: /* movupd */
3545 case 0x029: /* movaps */
3546 case 0x129: /* movapd */
3547 case 0x17f: /* movdqa ea, xmm */
3548 case 0x27f: /* movdqu ea, xmm */
3549 if (mod != 3) {
3550 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3551 gen_sto_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg]));
3552 } else {
3553 rm = (modrm & 7) | REX_B(s);
3554 gen_op_movo(offsetof(CPUX86State,xmm_regs[rm]),
3555 offsetof(CPUX86State,xmm_regs[reg]));
3557 break;
3558 case 0x211: /* movss ea, xmm */
3559 if (mod != 3) {
3560 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3561 tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(0)));
3562 gen_op_st_T0_A0(OT_LONG + s->mem_index);
3563 } else {
3564 rm = (modrm & 7) | REX_B(s);
3565 gen_op_movl(offsetof(CPUX86State,xmm_regs[rm].XMM_L(0)),
3566 offsetof(CPUX86State,xmm_regs[reg].XMM_L(0)));
3568 break;
3569 case 0x311: /* movsd ea, xmm */
3570 if (mod != 3) {
3571 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3572 gen_stq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3573 } else {
3574 rm = (modrm & 7) | REX_B(s);
3575 gen_op_movq(offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0)),
3576 offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3578 break;
3579 case 0x013: /* movlps */
3580 case 0x113: /* movlpd */
3581 if (mod != 3) {
3582 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3583 gen_stq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3584 } else {
3585 goto illegal_op;
3587 break;
3588 case 0x017: /* movhps */
3589 case 0x117: /* movhpd */
3590 if (mod != 3) {
3591 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3592 gen_stq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg].XMM_Q(1)));
3593 } else {
3594 goto illegal_op;
3596 break;
3597 case 0x71: /* shift mm, im */
3598 case 0x72:
3599 case 0x73:
3600 case 0x171: /* shift xmm, im */
3601 case 0x172:
3602 case 0x173:
3603 if (b1 >= 2) {
3604 goto illegal_op;
3606 val = cpu_ldub_code(env, s->pc++);
3607 if (is_xmm) {
3608 gen_op_movl_T0_im(val);
3609 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_t0.XMM_L(0)));
3610 gen_op_movl_T0_0();
3611 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_t0.XMM_L(1)));
3612 op1_offset = offsetof(CPUX86State,xmm_t0);
3613 } else {
3614 gen_op_movl_T0_im(val);
3615 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,mmx_t0.MMX_L(0)));
3616 gen_op_movl_T0_0();
3617 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,mmx_t0.MMX_L(1)));
3618 op1_offset = offsetof(CPUX86State,mmx_t0);
3620 sse_fn_epp = sse_op_table2[((b - 1) & 3) * 8 +
3621 (((modrm >> 3)) & 7)][b1];
3622 if (!sse_fn_epp) {
3623 goto illegal_op;
3625 if (is_xmm) {
3626 rm = (modrm & 7) | REX_B(s);
3627 op2_offset = offsetof(CPUX86State,xmm_regs[rm]);
3628 } else {
3629 rm = (modrm & 7);
3630 op2_offset = offsetof(CPUX86State,fpregs[rm].mmx);
3632 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op2_offset);
3633 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op1_offset);
3634 sse_fn_epp(cpu_env, cpu_ptr0, cpu_ptr1);
3635 break;
3636 case 0x050: /* movmskps */
3637 rm = (modrm & 7) | REX_B(s);
3638 tcg_gen_addi_ptr(cpu_ptr0, cpu_env,
3639 offsetof(CPUX86State,xmm_regs[rm]));
3640 gen_helper_movmskps(cpu_tmp2_i32, cpu_env, cpu_ptr0);
3641 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
3642 gen_op_mov_reg_T0(OT_LONG, reg);
3643 break;
3644 case 0x150: /* movmskpd */
3645 rm = (modrm & 7) | REX_B(s);
3646 tcg_gen_addi_ptr(cpu_ptr0, cpu_env,
3647 offsetof(CPUX86State,xmm_regs[rm]));
3648 gen_helper_movmskpd(cpu_tmp2_i32, cpu_env, cpu_ptr0);
3649 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
3650 gen_op_mov_reg_T0(OT_LONG, reg);
3651 break;
3652 case 0x02a: /* cvtpi2ps */
3653 case 0x12a: /* cvtpi2pd */
3654 gen_helper_enter_mmx(cpu_env);
3655 if (mod != 3) {
3656 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3657 op2_offset = offsetof(CPUX86State,mmx_t0);
3658 gen_ldq_env_A0(s->mem_index, op2_offset);
3659 } else {
3660 rm = (modrm & 7);
3661 op2_offset = offsetof(CPUX86State,fpregs[rm].mmx);
3663 op1_offset = offsetof(CPUX86State,xmm_regs[reg]);
3664 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
3665 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset);
3666 switch(b >> 8) {
3667 case 0x0:
3668 gen_helper_cvtpi2ps(cpu_env, cpu_ptr0, cpu_ptr1);
3669 break;
3670 default:
3671 case 0x1:
3672 gen_helper_cvtpi2pd(cpu_env, cpu_ptr0, cpu_ptr1);
3673 break;
3675 break;
3676 case 0x22a: /* cvtsi2ss */
3677 case 0x32a: /* cvtsi2sd */
3678 ot = (s->dflag == 2) ? OT_QUAD : OT_LONG;
3679 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
3680 op1_offset = offsetof(CPUX86State,xmm_regs[reg]);
3681 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
3682 if (ot == OT_LONG) {
3683 SSEFunc_0_epi sse_fn_epi = sse_op_table3ai[(b >> 8) & 1];
3684 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
3685 sse_fn_epi(cpu_env, cpu_ptr0, cpu_tmp2_i32);
3686 } else {
3687 #ifdef TARGET_X86_64
3688 SSEFunc_0_epl sse_fn_epl = sse_op_table3aq[(b >> 8) & 1];
3689 sse_fn_epl(cpu_env, cpu_ptr0, cpu_T[0]);
3690 #else
3691 goto illegal_op;
3692 #endif
3694 break;
3695 case 0x02c: /* cvttps2pi */
3696 case 0x12c: /* cvttpd2pi */
3697 case 0x02d: /* cvtps2pi */
3698 case 0x12d: /* cvtpd2pi */
3699 gen_helper_enter_mmx(cpu_env);
3700 if (mod != 3) {
3701 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3702 op2_offset = offsetof(CPUX86State,xmm_t0);
3703 gen_ldo_env_A0(s->mem_index, op2_offset);
3704 } else {
3705 rm = (modrm & 7) | REX_B(s);
3706 op2_offset = offsetof(CPUX86State,xmm_regs[rm]);
3708 op1_offset = offsetof(CPUX86State,fpregs[reg & 7].mmx);
3709 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
3710 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset);
3711 switch(b) {
3712 case 0x02c:
3713 gen_helper_cvttps2pi(cpu_env, cpu_ptr0, cpu_ptr1);
3714 break;
3715 case 0x12c:
3716 gen_helper_cvttpd2pi(cpu_env, cpu_ptr0, cpu_ptr1);
3717 break;
3718 case 0x02d:
3719 gen_helper_cvtps2pi(cpu_env, cpu_ptr0, cpu_ptr1);
3720 break;
3721 case 0x12d:
3722 gen_helper_cvtpd2pi(cpu_env, cpu_ptr0, cpu_ptr1);
3723 break;
3725 break;
3726 case 0x22c: /* cvttss2si */
3727 case 0x32c: /* cvttsd2si */
3728 case 0x22d: /* cvtss2si */
3729 case 0x32d: /* cvtsd2si */
3730 ot = (s->dflag == 2) ? OT_QUAD : OT_LONG;
3731 if (mod != 3) {
3732 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3733 if ((b >> 8) & 1) {
3734 gen_ldq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_t0.XMM_Q(0)));
3735 } else {
3736 gen_op_ld_T0_A0(OT_LONG + s->mem_index);
3737 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_t0.XMM_L(0)));
3739 op2_offset = offsetof(CPUX86State,xmm_t0);
3740 } else {
3741 rm = (modrm & 7) | REX_B(s);
3742 op2_offset = offsetof(CPUX86State,xmm_regs[rm]);
3744 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op2_offset);
3745 if (ot == OT_LONG) {
3746 SSEFunc_i_ep sse_fn_i_ep =
3747 sse_op_table3bi[((b >> 7) & 2) | (b & 1)];
3748 sse_fn_i_ep(cpu_tmp2_i32, cpu_env, cpu_ptr0);
3749 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
3750 } else {
3751 #ifdef TARGET_X86_64
3752 SSEFunc_l_ep sse_fn_l_ep =
3753 sse_op_table3bq[((b >> 7) & 2) | (b & 1)];
3754 sse_fn_l_ep(cpu_T[0], cpu_env, cpu_ptr0);
3755 #else
3756 goto illegal_op;
3757 #endif
3759 gen_op_mov_reg_T0(ot, reg);
3760 break;
3761 case 0xc4: /* pinsrw */
3762 case 0x1c4:
3763 s->rip_offset = 1;
3764 gen_ldst_modrm(env, s, modrm, OT_WORD, OR_TMP0, 0);
3765 val = cpu_ldub_code(env, s->pc++);
3766 if (b1) {
3767 val &= 7;
3768 tcg_gen_st16_tl(cpu_T[0], cpu_env,
3769 offsetof(CPUX86State,xmm_regs[reg].XMM_W(val)));
3770 } else {
3771 val &= 3;
3772 tcg_gen_st16_tl(cpu_T[0], cpu_env,
3773 offsetof(CPUX86State,fpregs[reg].mmx.MMX_W(val)));
3775 break;
3776 case 0xc5: /* pextrw */
3777 case 0x1c5:
3778 if (mod != 3)
3779 goto illegal_op;
3780 ot = (s->dflag == 2) ? OT_QUAD : OT_LONG;
3781 val = cpu_ldub_code(env, s->pc++);
3782 if (b1) {
3783 val &= 7;
3784 rm = (modrm & 7) | REX_B(s);
3785 tcg_gen_ld16u_tl(cpu_T[0], cpu_env,
3786 offsetof(CPUX86State,xmm_regs[rm].XMM_W(val)));
3787 } else {
3788 val &= 3;
3789 rm = (modrm & 7);
3790 tcg_gen_ld16u_tl(cpu_T[0], cpu_env,
3791 offsetof(CPUX86State,fpregs[rm].mmx.MMX_W(val)));
3793 reg = ((modrm >> 3) & 7) | rex_r;
3794 gen_op_mov_reg_T0(ot, reg);
3795 break;
3796 case 0x1d6: /* movq ea, xmm */
3797 if (mod != 3) {
3798 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3799 gen_stq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3800 } else {
3801 rm = (modrm & 7) | REX_B(s);
3802 gen_op_movq(offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0)),
3803 offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3804 gen_op_movq_env_0(offsetof(CPUX86State,xmm_regs[rm].XMM_Q(1)));
3806 break;
3807 case 0x2d6: /* movq2dq */
3808 gen_helper_enter_mmx(cpu_env);
3809 rm = (modrm & 7);
3810 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)),
3811 offsetof(CPUX86State,fpregs[rm].mmx));
3812 gen_op_movq_env_0(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(1)));
3813 break;
3814 case 0x3d6: /* movdq2q */
3815 gen_helper_enter_mmx(cpu_env);
3816 rm = (modrm & 7) | REX_B(s);
3817 gen_op_movq(offsetof(CPUX86State,fpregs[reg & 7].mmx),
3818 offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0)));
3819 break;
3820 case 0xd7: /* pmovmskb */
3821 case 0x1d7:
3822 if (mod != 3)
3823 goto illegal_op;
3824 if (b1) {
3825 rm = (modrm & 7) | REX_B(s);
3826 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, offsetof(CPUX86State,xmm_regs[rm]));
3827 gen_helper_pmovmskb_xmm(cpu_tmp2_i32, cpu_env, cpu_ptr0);
3828 } else {
3829 rm = (modrm & 7);
3830 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, offsetof(CPUX86State,fpregs[rm].mmx));
3831 gen_helper_pmovmskb_mmx(cpu_tmp2_i32, cpu_env, cpu_ptr0);
3833 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
3834 reg = ((modrm >> 3) & 7) | rex_r;
3835 gen_op_mov_reg_T0(OT_LONG, reg);
3836 break;
3837 case 0x138:
3838 if (s->prefix & PREFIX_REPNZ)
3839 goto crc32; /* otherwise fall through */
3840 case 0x038:
3841 b = modrm;
3842 modrm = cpu_ldub_code(env, s->pc++);
3843 rm = modrm & 7;
3844 reg = ((modrm >> 3) & 7) | rex_r;
3845 mod = (modrm >> 6) & 3;
3846 if (b1 >= 2) {
3847 goto illegal_op;
3850 sse_fn_epp = sse_op_table6[b].op[b1];
3851 if (!sse_fn_epp) {
3852 goto illegal_op;
3854 if (!(s->cpuid_ext_features & sse_op_table6[b].ext_mask))
3855 goto illegal_op;
3857 if (b1) {
3858 op1_offset = offsetof(CPUX86State,xmm_regs[reg]);
3859 if (mod == 3) {
3860 op2_offset = offsetof(CPUX86State,xmm_regs[rm | REX_B(s)]);
3861 } else {
3862 op2_offset = offsetof(CPUX86State,xmm_t0);
3863 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3864 switch (b) {
3865 case 0x20: case 0x30: /* pmovsxbw, pmovzxbw */
3866 case 0x23: case 0x33: /* pmovsxwd, pmovzxwd */
3867 case 0x25: case 0x35: /* pmovsxdq, pmovzxdq */
3868 gen_ldq_env_A0(s->mem_index, op2_offset +
3869 offsetof(XMMReg, XMM_Q(0)));
3870 break;
3871 case 0x21: case 0x31: /* pmovsxbd, pmovzxbd */
3872 case 0x24: case 0x34: /* pmovsxwq, pmovzxwq */
3873 tcg_gen_qemu_ld32u(cpu_tmp0, cpu_A0,
3874 (s->mem_index >> 2) - 1);
3875 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_tmp0);
3876 tcg_gen_st_i32(cpu_tmp2_i32, cpu_env, op2_offset +
3877 offsetof(XMMReg, XMM_L(0)));
3878 break;
3879 case 0x22: case 0x32: /* pmovsxbq, pmovzxbq */
3880 tcg_gen_qemu_ld16u(cpu_tmp0, cpu_A0,
3881 (s->mem_index >> 2) - 1);
3882 tcg_gen_st16_tl(cpu_tmp0, cpu_env, op2_offset +
3883 offsetof(XMMReg, XMM_W(0)));
3884 break;
3885 case 0x2a: /* movntdqa */
3886 gen_ldo_env_A0(s->mem_index, op1_offset);
3887 return;
3888 default:
3889 gen_ldo_env_A0(s->mem_index, op2_offset);
3892 } else {
3893 op1_offset = offsetof(CPUX86State,fpregs[reg].mmx);
3894 if (mod == 3) {
3895 op2_offset = offsetof(CPUX86State,fpregs[rm].mmx);
3896 } else {
3897 op2_offset = offsetof(CPUX86State,mmx_t0);
3898 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3899 gen_ldq_env_A0(s->mem_index, op2_offset);
3902 if (sse_fn_epp == SSE_SPECIAL) {
3903 goto illegal_op;
3906 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
3907 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset);
3908 sse_fn_epp(cpu_env, cpu_ptr0, cpu_ptr1);
3910 if (b == 0x17) {
3911 set_cc_op(s, CC_OP_EFLAGS);
3913 break;
3914 case 0x338: /* crc32 */
3915 crc32:
3916 b = modrm;
3917 modrm = cpu_ldub_code(env, s->pc++);
3918 reg = ((modrm >> 3) & 7) | rex_r;
3920 if (b != 0xf0 && b != 0xf1)
3921 goto illegal_op;
3922 if (!(s->cpuid_ext_features & CPUID_EXT_SSE42))
3923 goto illegal_op;
3925 if (b == 0xf0)
3926 ot = OT_BYTE;
3927 else if (b == 0xf1 && s->dflag != 2)
3928 if (s->prefix & PREFIX_DATA)
3929 ot = OT_WORD;
3930 else
3931 ot = OT_LONG;
3932 else
3933 ot = OT_QUAD;
3935 gen_op_mov_TN_reg(OT_LONG, 0, reg);
3936 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
3937 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
3938 gen_helper_crc32(cpu_T[0], cpu_tmp2_i32,
3939 cpu_T[0], tcg_const_i32(8 << ot));
3941 ot = (s->dflag == 2) ? OT_QUAD : OT_LONG;
3942 gen_op_mov_reg_T0(ot, reg);
3943 break;
3944 case 0x03a:
3945 case 0x13a:
3946 b = modrm;
3947 modrm = cpu_ldub_code(env, s->pc++);
3948 rm = modrm & 7;
3949 reg = ((modrm >> 3) & 7) | rex_r;
3950 mod = (modrm >> 6) & 3;
3951 if (b1 >= 2) {
3952 goto illegal_op;
3955 sse_fn_eppi = sse_op_table7[b].op[b1];
3956 if (!sse_fn_eppi) {
3957 goto illegal_op;
3959 if (!(s->cpuid_ext_features & sse_op_table7[b].ext_mask))
3960 goto illegal_op;
3962 if (sse_fn_eppi == SSE_SPECIAL) {
3963 ot = (s->dflag == 2) ? OT_QUAD : OT_LONG;
3964 rm = (modrm & 7) | REX_B(s);
3965 if (mod != 3)
3966 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3967 reg = ((modrm >> 3) & 7) | rex_r;
3968 val = cpu_ldub_code(env, s->pc++);
3969 switch (b) {
3970 case 0x14: /* pextrb */
3971 tcg_gen_ld8u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,
3972 xmm_regs[reg].XMM_B(val & 15)));
3973 if (mod == 3)
3974 gen_op_mov_reg_T0(ot, rm);
3975 else
3976 tcg_gen_qemu_st8(cpu_T[0], cpu_A0,
3977 (s->mem_index >> 2) - 1);
3978 break;
3979 case 0x15: /* pextrw */
3980 tcg_gen_ld16u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,
3981 xmm_regs[reg].XMM_W(val & 7)));
3982 if (mod == 3)
3983 gen_op_mov_reg_T0(ot, rm);
3984 else
3985 tcg_gen_qemu_st16(cpu_T[0], cpu_A0,
3986 (s->mem_index >> 2) - 1);
3987 break;
3988 case 0x16:
3989 if (ot == OT_LONG) { /* pextrd */
3990 tcg_gen_ld_i32(cpu_tmp2_i32, cpu_env,
3991 offsetof(CPUX86State,
3992 xmm_regs[reg].XMM_L(val & 3)));
3993 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
3994 if (mod == 3)
3995 gen_op_mov_reg_v(ot, rm, cpu_T[0]);
3996 else
3997 tcg_gen_qemu_st32(cpu_T[0], cpu_A0,
3998 (s->mem_index >> 2) - 1);
3999 } else { /* pextrq */
4000 #ifdef TARGET_X86_64
4001 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env,
4002 offsetof(CPUX86State,
4003 xmm_regs[reg].XMM_Q(val & 1)));
4004 if (mod == 3)
4005 gen_op_mov_reg_v(ot, rm, cpu_tmp1_i64);
4006 else
4007 tcg_gen_qemu_st64(cpu_tmp1_i64, cpu_A0,
4008 (s->mem_index >> 2) - 1);
4009 #else
4010 goto illegal_op;
4011 #endif
4013 break;
4014 case 0x17: /* extractps */
4015 tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,
4016 xmm_regs[reg].XMM_L(val & 3)));
4017 if (mod == 3)
4018 gen_op_mov_reg_T0(ot, rm);
4019 else
4020 tcg_gen_qemu_st32(cpu_T[0], cpu_A0,
4021 (s->mem_index >> 2) - 1);
4022 break;
4023 case 0x20: /* pinsrb */
4024 if (mod == 3)
4025 gen_op_mov_TN_reg(OT_LONG, 0, rm);
4026 else
4027 tcg_gen_qemu_ld8u(cpu_tmp0, cpu_A0,
4028 (s->mem_index >> 2) - 1);
4029 tcg_gen_st8_tl(cpu_tmp0, cpu_env, offsetof(CPUX86State,
4030 xmm_regs[reg].XMM_B(val & 15)));
4031 break;
4032 case 0x21: /* insertps */
4033 if (mod == 3) {
4034 tcg_gen_ld_i32(cpu_tmp2_i32, cpu_env,
4035 offsetof(CPUX86State,xmm_regs[rm]
4036 .XMM_L((val >> 6) & 3)));
4037 } else {
4038 tcg_gen_qemu_ld32u(cpu_tmp0, cpu_A0,
4039 (s->mem_index >> 2) - 1);
4040 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_tmp0);
4042 tcg_gen_st_i32(cpu_tmp2_i32, cpu_env,
4043 offsetof(CPUX86State,xmm_regs[reg]
4044 .XMM_L((val >> 4) & 3)));
4045 if ((val >> 0) & 1)
4046 tcg_gen_st_i32(tcg_const_i32(0 /*float32_zero*/),
4047 cpu_env, offsetof(CPUX86State,
4048 xmm_regs[reg].XMM_L(0)));
4049 if ((val >> 1) & 1)
4050 tcg_gen_st_i32(tcg_const_i32(0 /*float32_zero*/),
4051 cpu_env, offsetof(CPUX86State,
4052 xmm_regs[reg].XMM_L(1)));
4053 if ((val >> 2) & 1)
4054 tcg_gen_st_i32(tcg_const_i32(0 /*float32_zero*/),
4055 cpu_env, offsetof(CPUX86State,
4056 xmm_regs[reg].XMM_L(2)));
4057 if ((val >> 3) & 1)
4058 tcg_gen_st_i32(tcg_const_i32(0 /*float32_zero*/),
4059 cpu_env, offsetof(CPUX86State,
4060 xmm_regs[reg].XMM_L(3)));
4061 break;
4062 case 0x22:
4063 if (ot == OT_LONG) { /* pinsrd */
4064 if (mod == 3)
4065 gen_op_mov_v_reg(ot, cpu_tmp0, rm);
4066 else
4067 tcg_gen_qemu_ld32u(cpu_tmp0, cpu_A0,
4068 (s->mem_index >> 2) - 1);
4069 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_tmp0);
4070 tcg_gen_st_i32(cpu_tmp2_i32, cpu_env,
4071 offsetof(CPUX86State,
4072 xmm_regs[reg].XMM_L(val & 3)));
4073 } else { /* pinsrq */
4074 #ifdef TARGET_X86_64
4075 if (mod == 3)
4076 gen_op_mov_v_reg(ot, cpu_tmp1_i64, rm);
4077 else
4078 tcg_gen_qemu_ld64(cpu_tmp1_i64, cpu_A0,
4079 (s->mem_index >> 2) - 1);
4080 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env,
4081 offsetof(CPUX86State,
4082 xmm_regs[reg].XMM_Q(val & 1)));
4083 #else
4084 goto illegal_op;
4085 #endif
4087 break;
4089 return;
4092 if (b1) {
4093 op1_offset = offsetof(CPUX86State,xmm_regs[reg]);
4094 if (mod == 3) {
4095 op2_offset = offsetof(CPUX86State,xmm_regs[rm | REX_B(s)]);
4096 } else {
4097 op2_offset = offsetof(CPUX86State,xmm_t0);
4098 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
4099 gen_ldo_env_A0(s->mem_index, op2_offset);
4101 } else {
4102 op1_offset = offsetof(CPUX86State,fpregs[reg].mmx);
4103 if (mod == 3) {
4104 op2_offset = offsetof(CPUX86State,fpregs[rm].mmx);
4105 } else {
4106 op2_offset = offsetof(CPUX86State,mmx_t0);
4107 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
4108 gen_ldq_env_A0(s->mem_index, op2_offset);
4111 val = cpu_ldub_code(env, s->pc++);
4113 if ((b & 0xfc) == 0x60) { /* pcmpXstrX */
4114 set_cc_op(s, CC_OP_EFLAGS);
4116 if (s->dflag == 2)
4117 /* The helper must use entire 64-bit gp registers */
4118 val |= 1 << 8;
4121 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
4122 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset);
4123 sse_fn_eppi(cpu_env, cpu_ptr0, cpu_ptr1, tcg_const_i32(val));
4124 break;
4125 default:
4126 goto illegal_op;
4128 } else {
4129 /* generic MMX or SSE operation */
4130 switch(b) {
4131 case 0x70: /* pshufx insn */
4132 case 0xc6: /* pshufx insn */
4133 case 0xc2: /* compare insns */
4134 s->rip_offset = 1;
4135 break;
4136 default:
4137 break;
4139 if (is_xmm) {
4140 op1_offset = offsetof(CPUX86State,xmm_regs[reg]);
4141 if (mod != 3) {
4142 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
4143 op2_offset = offsetof(CPUX86State,xmm_t0);
4144 if (b1 >= 2 && ((b >= 0x50 && b <= 0x5f && b != 0x5b) ||
4145 b == 0xc2)) {
4146 /* specific case for SSE single instructions */
4147 if (b1 == 2) {
4148 /* 32 bit access */
4149 gen_op_ld_T0_A0(OT_LONG + s->mem_index);
4150 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_t0.XMM_L(0)));
4151 } else {
4152 /* 64 bit access */
4153 gen_ldq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_t0.XMM_D(0)));
4155 } else {
4156 gen_ldo_env_A0(s->mem_index, op2_offset);
4158 } else {
4159 rm = (modrm & 7) | REX_B(s);
4160 op2_offset = offsetof(CPUX86State,xmm_regs[rm]);
4162 } else {
4163 op1_offset = offsetof(CPUX86State,fpregs[reg].mmx);
4164 if (mod != 3) {
4165 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
4166 op2_offset = offsetof(CPUX86State,mmx_t0);
4167 gen_ldq_env_A0(s->mem_index, op2_offset);
4168 } else {
4169 rm = (modrm & 7);
4170 op2_offset = offsetof(CPUX86State,fpregs[rm].mmx);
4171 }
4172 }
4173 switch(b) {
4174 case 0x0f: /* 3DNow! data insns */
4175 if (!(s->cpuid_ext2_features & CPUID_EXT2_3DNOW))
4176 goto illegal_op;
4177 val = cpu_ldub_code(env, s->pc++);
4178 sse_fn_epp = sse_op_table5[val];
4179 if (!sse_fn_epp) {
4180 goto illegal_op;
4181 }
4182 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
4183 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset);
4184 sse_fn_epp(cpu_env, cpu_ptr0, cpu_ptr1);
4185 break;
4186 case 0x70: /* pshufw/pshufd insns */
4187 case 0xc6: /* shufps/shufpd insns */
4188 val = cpu_ldub_code(env, s->pc++);
4189 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
4190 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset);
4191 /* XXX: introduce a new table? */
4192 sse_fn_ppi = (SSEFunc_0_ppi)sse_fn_epp;
4193 sse_fn_ppi(cpu_ptr0, cpu_ptr1, tcg_const_i32(val));
4194 break;
4195 case 0xc2:
4196 /* compare insns */
4197 val = cpu_ldub_code(env, s->pc++);
4198 if (val >= 8)
4199 goto illegal_op;
4200 sse_fn_epp = sse_op_table4[val][b1];
4202 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
4203 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset);
4204 sse_fn_epp(cpu_env, cpu_ptr0, cpu_ptr1);
4205 break;
4206 case 0xf7:
4207 /* maskmov: the helper stores to DS:rDI, so A0 must be prepared */
4208 if (mod != 3)
4209 goto illegal_op;
4210 #ifdef TARGET_X86_64
4211 if (s->aflag == 2) {
4212 gen_op_movq_A0_reg(R_EDI);
4213 } else
4214 #endif
4215 {
4216 gen_op_movl_A0_reg(R_EDI);
4217 if (s->aflag == 0)
4218 gen_op_andl_A0_ffff();
4219 }
4220 gen_add_A0_ds_seg(s);
4222 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
4223 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset);
4224 /* XXX: introduce a new table? */
4225 sse_fn_eppt = (SSEFunc_0_eppt)sse_fn_epp;
4226 sse_fn_eppt(cpu_env, cpu_ptr0, cpu_ptr1, cpu_A0);
4227 break;
4228 default:
4229 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
4230 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset);
4231 sse_fn_epp(cpu_env, cpu_ptr0, cpu_ptr1);
4232 break;
4233 }
4234 if (b == 0x2e || b == 0x2f) {
4235 set_cc_op(s, CC_OP_EFLAGS);
4236 }
4237 }
4238 }
4240 /* Convert one instruction. s->is_jmp is set if the translation must
4241 be stopped. Returns the next pc value. */
4242 static target_ulong disas_insn(CPUX86State *env, DisasContext *s,
4243 target_ulong pc_start)
4244 {
4245 int b, prefixes, aflag, dflag;
4246 int shift, ot;
4247 int modrm, reg, rm, mod, reg_addr, op, opreg, offset_addr, val;
4248 target_ulong next_eip, tval;
4249 int rex_w, rex_r;
4251 if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP | CPU_LOG_TB_OP_OPT))) {
4252 tcg_gen_debug_insn_start(pc_start);
4253 }
4254 s->pc = pc_start;
4255 prefixes = 0;
4256 aflag = s->code32;
4257 dflag = s->code32;
4258 s->override = -1;
4259 rex_w = -1;
4260 rex_r = 0;
4261 #ifdef TARGET_X86_64
4262 s->rex_x = 0;
4263 s->rex_b = 0;
4264 x86_64_hregs = 0;
4265 #endif
4266 s->rip_offset = 0; /* for relative ip address */
4267 next_byte:
4268 b = cpu_ldub_code(env, s->pc);
4269 s->pc++;
4270 /* check prefixes */
4271 #ifdef TARGET_X86_64
4272 if (CODE64(s)) {
4273 switch (b) {
4274 case 0xf3:
4275 prefixes |= PREFIX_REPZ;
4276 goto next_byte;
4277 case 0xf2:
4278 prefixes |= PREFIX_REPNZ;
4279 goto next_byte;
4280 case 0xf0:
4281 prefixes |= PREFIX_LOCK;
4282 goto next_byte;
4283 case 0x2e:
4284 s->override = R_CS;
4285 goto next_byte;
4286 case 0x36:
4287 s->override = R_SS;
4288 goto next_byte;
4289 case 0x3e:
4290 s->override = R_DS;
4291 goto next_byte;
4292 case 0x26:
4293 s->override = R_ES;
4294 goto next_byte;
4295 case 0x64:
4296 s->override = R_FS;
4297 goto next_byte;
4298 case 0x65:
4299 s->override = R_GS;
4300 goto next_byte;
4301 case 0x66:
4302 prefixes |= PREFIX_DATA;
4303 goto next_byte;
4304 case 0x67:
4305 prefixes |= PREFIX_ADR;
4306 goto next_byte;
4307 case 0x40 ... 0x4f:
4308 /* REX prefix */
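/* REX byte is 0100WRXB: W selects 64-bit operand size; R, X and B
   are pre-shifted here into bit position 3 so they can be OR'ed
   directly into ModRM reg/index/base register numbers. */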
4309 rex_w = (b >> 3) & 1;
4310 rex_r = (b & 0x4) << 1;
4311 s->rex_x = (b & 0x2) << 2;
4312 REX_B(s) = (b & 0x1) << 3;
4313 x86_64_hregs = 1; /* select uniform byte register addressing */
4314 goto next_byte;
4315 }
4316 if (rex_w == 1) {
4317 /* 0x66 is ignored if rex.w is set */
4318 dflag = 2;
4319 } else {
4320 if (prefixes & PREFIX_DATA)
4321 dflag ^= 1;
4322 }
4323 if (!(prefixes & PREFIX_ADR))
4324 aflag = 2;
4325 } else
4326 #endif
4327 {
4328 switch (b) {
4329 case 0xf3:
4330 prefixes |= PREFIX_REPZ;
4331 goto next_byte;
4332 case 0xf2:
4333 prefixes |= PREFIX_REPNZ;
4334 goto next_byte;
4335 case 0xf0:
4336 prefixes |= PREFIX_LOCK;
4337 goto next_byte;
4338 case 0x2e:
4339 s->override = R_CS;
4340 goto next_byte;
4341 case 0x36:
4342 s->override = R_SS;
4343 goto next_byte;
4344 case 0x3e:
4345 s->override = R_DS;
4346 goto next_byte;
4347 case 0x26:
4348 s->override = R_ES;
4349 goto next_byte;
4350 case 0x64:
4351 s->override = R_FS;
4352 goto next_byte;
4353 case 0x65:
4354 s->override = R_GS;
4355 goto next_byte;
4356 case 0x66:
4357 prefixes |= PREFIX_DATA;
4358 goto next_byte;
4359 case 0x67:
4360 prefixes |= PREFIX_ADR;
4361 goto next_byte;
4362 }
4363 if (prefixes & PREFIX_DATA)
4364 dflag ^= 1;
4365 if (prefixes & PREFIX_ADR)
4366 aflag ^= 1;
4367 }
4369 s->prefix = prefixes;
4370 s->aflag = aflag;
4371 s->dflag = dflag;
4373 /* lock generation */
4374 if (prefixes & PREFIX_LOCK)
4375 gen_helper_lock();
4377 /* now check op code */
4378 reswitch:
4379 switch(b) {
4380 case 0x0f:
4381 /**************************/
4382 /* extended op code */
4383 b = cpu_ldub_code(env, s->pc++) | 0x100;
4384 goto reswitch;
4386 /**************************/
4387 /* arith & logic */
4388 case 0x00 ... 0x05:
4389 case 0x08 ... 0x0d:
4390 case 0x10 ... 0x15:
4391 case 0x18 ... 0x1d:
4392 case 0x20 ... 0x25:
4393 case 0x28 ... 0x2d:
4394 case 0x30 ... 0x35:
4395 case 0x38 ... 0x3d:
4396 {
4397 int op, f, val;
4398 op = (b >> 3) & 7;
4399 f = (b >> 1) & 3;
4401 if ((b & 1) == 0)
4402 ot = OT_BYTE;
4403 else
4404 ot = dflag + OT_WORD;
4406 switch(f) {
4407 case 0: /* OP Ev, Gv */
4408 modrm = cpu_ldub_code(env, s->pc++);
4409 reg = ((modrm >> 3) & 7) | rex_r;
4410 mod = (modrm >> 6) & 3;
4411 rm = (modrm & 7) | REX_B(s);
4412 if (mod != 3) {
4413 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
4414 opreg = OR_TMP0;
4415 } else if (op == OP_XORL && rm == reg) {
4416 xor_zero:
4417 /* xor reg, reg optimisation */
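/* the result is known to be 0: CC_OP_LOGICB + ot with cc_dst = 0
   gives ZF = PF = 1 and CF = OF = SF = 0, as the real insn would */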
4418 gen_op_movl_T0_0();
4419 set_cc_op(s, CC_OP_LOGICB + ot);
4420 gen_op_mov_reg_T0(ot, reg);
4421 gen_op_update1_cc();
4422 break;
4423 } else {
4424 opreg = rm;
4426 gen_op_mov_TN_reg(ot, 1, reg);
4427 gen_op(s, op, ot, opreg);
4428 break;
4429 case 1: /* OP Gv, Ev */
4430 modrm = cpu_ldub_code(env, s->pc++);
4431 mod = (modrm >> 6) & 3;
4432 reg = ((modrm >> 3) & 7) | rex_r;
4433 rm = (modrm & 7) | REX_B(s);
4434 if (mod != 3) {
4435 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
4436 gen_op_ld_T1_A0(ot + s->mem_index);
4437 } else if (op == OP_XORL && rm == reg) {
4438 goto xor_zero;
4439 } else {
4440 gen_op_mov_TN_reg(ot, 1, rm);
4442 gen_op(s, op, ot, reg);
4443 break;
4444 case 2: /* OP A, Iv */
4445 val = insn_get(env, s, ot);
4446 gen_op_movl_T1_im(val);
4447 gen_op(s, op, ot, OR_EAX);
4448 break;
4449 }
4450 }
4451 break;
4453 case 0x82:
4454 if (CODE64(s))
4455 goto illegal_op;
4456 case 0x80: /* GRP1 */
4457 case 0x81:
4458 case 0x83:
4459 {
4460 int val;
4462 if ((b & 1) == 0)
4463 ot = OT_BYTE;
4464 else
4465 ot = dflag + OT_WORD;
4467 modrm = cpu_ldub_code(env, s->pc++);
4468 mod = (modrm >> 6) & 3;
4469 rm = (modrm & 7) | REX_B(s);
4470 op = (modrm >> 3) & 7;
4472 if (mod != 3) {
4473 if (b == 0x83)
4474 s->rip_offset = 1;
4475 else
4476 s->rip_offset = insn_const_size(ot);
4477 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
4478 opreg = OR_TMP0;
4479 } else {
4480 opreg = rm;
4481 }
4483 switch(b) {
4484 default:
4485 case 0x80:
4486 case 0x81:
4487 case 0x82:
4488 val = insn_get(env, s, ot);
4489 break;
4490 case 0x83:
4491 val = (int8_t)insn_get(env, s, OT_BYTE);
4492 break;
4493 }
4494 gen_op_movl_T1_im(val);
4495 gen_op(s, op, ot, opreg);
4496 }
4497 break;
4499 /**************************/
4500 /* inc, dec, and other misc arith */
4501 case 0x40 ... 0x47: /* inc Gv */
4502 ot = dflag ? OT_LONG : OT_WORD;
4503 gen_inc(s, ot, OR_EAX + (b & 7), 1);
4504 break;
4505 case 0x48 ... 0x4f: /* dec Gv */
4506 ot = dflag ? OT_LONG : OT_WORD;
4507 gen_inc(s, ot, OR_EAX + (b & 7), -1);
4508 break;
4509 case 0xf6: /* GRP3 */
4510 case 0xf7:
4511 if ((b & 1) == 0)
4512 ot = OT_BYTE;
4513 else
4514 ot = dflag + OT_WORD;
4516 modrm = cpu_ldub_code(env, s->pc++);
4517 mod = (modrm >> 6) & 3;
4518 rm = (modrm & 7) | REX_B(s);
4519 op = (modrm >> 3) & 7;
4520 if (mod != 3) {
4521 if (op == 0)
4522 s->rip_offset = insn_const_size(ot);
4523 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
4524 gen_op_ld_T0_A0(ot + s->mem_index);
4525 } else {
4526 gen_op_mov_TN_reg(ot, 0, rm);
4527 }
4529 switch(op) {
4530 case 0: /* test */
4531 val = insn_get(env, s, ot);
4532 gen_op_movl_T1_im(val);
4533 gen_op_testl_T0_T1_cc();
4534 set_cc_op(s, CC_OP_LOGICB + ot);
4535 break;
4536 case 2: /* not */
4537 tcg_gen_not_tl(cpu_T[0], cpu_T[0]);
4538 if (mod != 3) {
4539 gen_op_st_T0_A0(ot + s->mem_index);
4540 } else {
4541 gen_op_mov_reg_T0(ot, rm);
4542 }
4543 break;
4544 case 3: /* neg */
4545 tcg_gen_neg_tl(cpu_T[0], cpu_T[0]);
4546 if (mod != 3) {
4547 gen_op_st_T0_A0(ot + s->mem_index);
4548 } else {
4549 gen_op_mov_reg_T0(ot, rm);
4550 }
4551 gen_op_update_neg_cc();
4552 set_cc_op(s, CC_OP_SUBB + ot);
4553 break;
4554 case 4: /* mul */
4555 switch(ot) {
4556 case OT_BYTE:
4557 gen_op_mov_TN_reg(OT_BYTE, 1, R_EAX);
4558 tcg_gen_ext8u_tl(cpu_T[0], cpu_T[0]);
4559 tcg_gen_ext8u_tl(cpu_T[1], cpu_T[1]);
4560 /* XXX: use 32 bit mul which could be faster */
4561 tcg_gen_mul_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
4562 gen_op_mov_reg_T0(OT_WORD, R_EAX);
4563 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
4564 tcg_gen_andi_tl(cpu_cc_src, cpu_T[0], 0xff00);
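/* cc_src holds the high byte of the product; the CC_OP_MUL* flag
   helpers derive CF = OF from cc_src being non-zero */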
4565 set_cc_op(s, CC_OP_MULB);
4566 break;
4567 case OT_WORD:
4568 gen_op_mov_TN_reg(OT_WORD, 1, R_EAX);
4569 tcg_gen_ext16u_tl(cpu_T[0], cpu_T[0]);
4570 tcg_gen_ext16u_tl(cpu_T[1], cpu_T[1]);
4571 /* XXX: use 32 bit mul which could be faster */
4572 tcg_gen_mul_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
4573 gen_op_mov_reg_T0(OT_WORD, R_EAX);
4574 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
4575 tcg_gen_shri_tl(cpu_T[0], cpu_T[0], 16);
4576 gen_op_mov_reg_T0(OT_WORD, R_EDX);
4577 tcg_gen_mov_tl(cpu_cc_src, cpu_T[0]);
4578 set_cc_op(s, CC_OP_MULW);
4579 break;
4580 default:
4581 case OT_LONG:
4582 #ifdef TARGET_X86_64
4583 gen_op_mov_TN_reg(OT_LONG, 1, R_EAX);
4584 tcg_gen_ext32u_tl(cpu_T[0], cpu_T[0]);
4585 tcg_gen_ext32u_tl(cpu_T[1], cpu_T[1]);
4586 tcg_gen_mul_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
4587 gen_op_mov_reg_T0(OT_LONG, R_EAX);
4588 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
4589 tcg_gen_shri_tl(cpu_T[0], cpu_T[0], 32);
4590 gen_op_mov_reg_T0(OT_LONG, R_EDX);
4591 tcg_gen_mov_tl(cpu_cc_src, cpu_T[0]);
4592 #else
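/* 32-bit target: do the multiply in 64-bit temps so the high half
   of the product can be recovered for EDX */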
4593 {
4594 TCGv_i64 t0, t1;
4595 t0 = tcg_temp_new_i64();
4596 t1 = tcg_temp_new_i64();
4597 gen_op_mov_TN_reg(OT_LONG, 1, R_EAX);
4598 tcg_gen_extu_i32_i64(t0, cpu_T[0]);
4599 tcg_gen_extu_i32_i64(t1, cpu_T[1]);
4600 tcg_gen_mul_i64(t0, t0, t1);
4601 tcg_gen_trunc_i64_i32(cpu_T[0], t0);
4602 gen_op_mov_reg_T0(OT_LONG, R_EAX);
4603 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
4604 tcg_gen_shri_i64(t0, t0, 32);
4605 tcg_gen_trunc_i64_i32(cpu_T[0], t0);
4606 gen_op_mov_reg_T0(OT_LONG, R_EDX);
4607 tcg_gen_mov_tl(cpu_cc_src, cpu_T[0]);
4608 }
4609 #endif
4610 set_cc_op(s, CC_OP_MULL);
4611 break;
4612 #ifdef TARGET_X86_64
4613 case OT_QUAD:
4614 gen_helper_mulq_EAX_T0(cpu_env, cpu_T[0]);
4615 set_cc_op(s, CC_OP_MULQ);
4616 break;
4617 #endif
4618 }
4619 break;
4620 case 5: /* imul */
4621 switch(ot) {
4622 case OT_BYTE:
4623 gen_op_mov_TN_reg(OT_BYTE, 1, R_EAX);
4624 tcg_gen_ext8s_tl(cpu_T[0], cpu_T[0]);
4625 tcg_gen_ext8s_tl(cpu_T[1], cpu_T[1]);
4626 /* XXX: use 32 bit mul which could be faster */
4627 tcg_gen_mul_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
4628 gen_op_mov_reg_T0(OT_WORD, R_EAX);
4629 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
4630 tcg_gen_ext8s_tl(cpu_tmp0, cpu_T[0]);
4631 tcg_gen_sub_tl(cpu_cc_src, cpu_T[0], cpu_tmp0);
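/* cc_src is zero iff the product equals its own sign-extended low
   byte, i.e. iff it fits in 8 bits; CF = OF = (cc_src != 0) */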
4632 set_cc_op(s, CC_OP_MULB);
4633 break;
4634 case OT_WORD:
4635 gen_op_mov_TN_reg(OT_WORD, 1, R_EAX);
4636 tcg_gen_ext16s_tl(cpu_T[0], cpu_T[0]);
4637 tcg_gen_ext16s_tl(cpu_T[1], cpu_T[1]);
4638 /* XXX: use 32 bit mul which could be faster */
4639 tcg_gen_mul_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
4640 gen_op_mov_reg_T0(OT_WORD, R_EAX);
4641 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
4642 tcg_gen_ext16s_tl(cpu_tmp0, cpu_T[0]);
4643 tcg_gen_sub_tl(cpu_cc_src, cpu_T[0], cpu_tmp0);
4644 tcg_gen_shri_tl(cpu_T[0], cpu_T[0], 16);
4645 gen_op_mov_reg_T0(OT_WORD, R_EDX);
4646 set_cc_op(s, CC_OP_MULW);
4647 break;
4648 default:
4649 case OT_LONG:
4650 #ifdef TARGET_X86_64
4651 gen_op_mov_TN_reg(OT_LONG, 1, R_EAX);
4652 tcg_gen_ext32s_tl(cpu_T[0], cpu_T[0]);
4653 tcg_gen_ext32s_tl(cpu_T[1], cpu_T[1]);
4654 tcg_gen_mul_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
4655 gen_op_mov_reg_T0(OT_LONG, R_EAX);
4656 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
4657 tcg_gen_ext32s_tl(cpu_tmp0, cpu_T[0]);
4658 tcg_gen_sub_tl(cpu_cc_src, cpu_T[0], cpu_tmp0);
4659 tcg_gen_shri_tl(cpu_T[0], cpu_T[0], 32);
4660 gen_op_mov_reg_T0(OT_LONG, R_EDX);
4661 #else
4662 {
4663 TCGv_i64 t0, t1;
4664 t0 = tcg_temp_new_i64();
4665 t1 = tcg_temp_new_i64();
4666 gen_op_mov_TN_reg(OT_LONG, 1, R_EAX);
4667 tcg_gen_ext_i32_i64(t0, cpu_T[0]);
4668 tcg_gen_ext_i32_i64(t1, cpu_T[1]);
4669 tcg_gen_mul_i64(t0, t0, t1);
4670 tcg_gen_trunc_i64_i32(cpu_T[0], t0);
4671 gen_op_mov_reg_T0(OT_LONG, R_EAX);
4672 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
4673 tcg_gen_sari_tl(cpu_tmp0, cpu_T[0], 31);
4674 tcg_gen_shri_i64(t0, t0, 32);
4675 tcg_gen_trunc_i64_i32(cpu_T[0], t0);
4676 gen_op_mov_reg_T0(OT_LONG, R_EDX);
4677 tcg_gen_sub_tl(cpu_cc_src, cpu_T[0], cpu_tmp0);
4678 }
4679 #endif
4680 set_cc_op(s, CC_OP_MULL);
4681 break;
4682 #ifdef TARGET_X86_64
4683 case OT_QUAD:
4684 gen_helper_imulq_EAX_T0(cpu_env, cpu_T[0]);
4685 set_cc_op(s, CC_OP_MULQ);
4686 break;
4687 #endif
4688 }
4689 break;
4690 case 6: /* div */
4691 switch(ot) {
4692 case OT_BYTE:
4693 gen_jmp_im(pc_start - s->cs_base);
4694 gen_helper_divb_AL(cpu_env, cpu_T[0]);
4695 break;
4696 case OT_WORD:
4697 gen_jmp_im(pc_start - s->cs_base);
4698 gen_helper_divw_AX(cpu_env, cpu_T[0]);
4699 break;
4700 default:
4701 case OT_LONG:
4702 gen_jmp_im(pc_start - s->cs_base);
4703 gen_helper_divl_EAX(cpu_env, cpu_T[0]);
4704 break;
4705 #ifdef TARGET_X86_64
4706 case OT_QUAD:
4707 gen_jmp_im(pc_start - s->cs_base);
4708 gen_helper_divq_EAX(cpu_env, cpu_T[0]);
4709 break;
4710 #endif
4711 }
4712 break;
4713 case 7: /* idiv */
4714 switch(ot) {
4715 case OT_BYTE:
4716 gen_jmp_im(pc_start - s->cs_base);
4717 gen_helper_idivb_AL(cpu_env, cpu_T[0]);
4718 break;
4719 case OT_WORD:
4720 gen_jmp_im(pc_start - s->cs_base);
4721 gen_helper_idivw_AX(cpu_env, cpu_T[0]);
4722 break;
4723 default:
4724 case OT_LONG:
4725 gen_jmp_im(pc_start - s->cs_base);
4726 gen_helper_idivl_EAX(cpu_env, cpu_T[0]);
4727 break;
4728 #ifdef TARGET_X86_64
4729 case OT_QUAD:
4730 gen_jmp_im(pc_start - s->cs_base);
4731 gen_helper_idivq_EAX(cpu_env, cpu_T[0]);
4732 break;
4733 #endif
4734 }
4735 break;
4736 default:
4737 goto illegal_op;
4738 }
4739 break;
4741 case 0xfe: /* GRP4 */
4742 case 0xff: /* GRP5 */
4743 if ((b & 1) == 0)
4744 ot = OT_BYTE;
4745 else
4746 ot = dflag + OT_WORD;
4748 modrm = cpu_ldub_code(env, s->pc++);
4749 mod = (modrm >> 6) & 3;
4750 rm = (modrm & 7) | REX_B(s);
4751 op = (modrm >> 3) & 7;
4752 if (op >= 2 && b == 0xfe) {
4753 goto illegal_op;
4755 if (CODE64(s)) {
4756 if (op == 2 || op == 4) {
4757 /* operand size for jumps is 64 bit */
4758 ot = OT_QUAD;
4759 } else if (op == 3 || op == 5) {
4760 ot = dflag ? OT_LONG + (rex_w == 1) : OT_WORD;
4761 } else if (op == 6) {
4762 /* default push size is 64 bit */
4763 ot = dflag ? OT_QUAD : OT_WORD;
4766 if (mod != 3) {
4767 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
4768 if (op >= 2 && op != 3 && op != 5)
4769 gen_op_ld_T0_A0(ot + s->mem_index);
4770 } else {
4771 gen_op_mov_TN_reg(ot, 0, rm);
4774 switch(op) {
4775 case 0: /* inc Ev */
4776 if (mod != 3)
4777 opreg = OR_TMP0;
4778 else
4779 opreg = rm;
4780 gen_inc(s, ot, opreg, 1);
4781 break;
4782 case 1: /* dec Ev */
4783 if (mod != 3)
4784 opreg = OR_TMP0;
4785 else
4786 opreg = rm;
4787 gen_inc(s, ot, opreg, -1);
4788 break;
4789 case 2: /* call Ev */
4790 /* XXX: optimize the memory-operand case (the 'and' is unnecessary) */
4791 if (s->dflag == 0)
4792 gen_op_andl_T0_ffff();
4793 next_eip = s->pc - s->cs_base;
4794 gen_movtl_T1_im(next_eip);
4795 gen_push_T1(s);
4796 gen_op_jmp_T0();
4797 gen_eob(s);
4798 break;
4799 case 3: /* lcall Ev */
4800 gen_op_ld_T1_A0(ot + s->mem_index);
4801 gen_add_A0_im(s, 1 << (ot - OT_WORD + 1));
4802 gen_op_ldu_T0_A0(OT_WORD + s->mem_index);
4803 do_lcall:
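/* protected-mode far calls go through a helper that handles call
   gates and privilege checks; real/vm86 mode just pushes CS:IP */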
4804 if (s->pe && !s->vm86) {
4805 gen_update_cc_op(s);
4806 gen_jmp_im(pc_start - s->cs_base);
4807 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
4808 gen_helper_lcall_protected(cpu_env, cpu_tmp2_i32, cpu_T[1],
4809 tcg_const_i32(dflag),
4810 tcg_const_i32(s->pc - pc_start));
4811 } else {
4812 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
4813 gen_helper_lcall_real(cpu_env, cpu_tmp2_i32, cpu_T[1],
4814 tcg_const_i32(dflag),
4815 tcg_const_i32(s->pc - s->cs_base));
4817 gen_eob(s);
4818 break;
4819 case 4: /* jmp Ev */
4820 if (s->dflag == 0)
4821 gen_op_andl_T0_ffff();
4822 gen_op_jmp_T0();
4823 gen_eob(s);
4824 break;
4825 case 5: /* ljmp Ev */
4826 gen_op_ld_T1_A0(ot + s->mem_index);
4827 gen_add_A0_im(s, 1 << (ot - OT_WORD + 1));
4828 gen_op_ldu_T0_A0(OT_WORD + s->mem_index);
4829 do_ljmp:
4830 if (s->pe && !s->vm86) {
4831 gen_update_cc_op(s);
4832 gen_jmp_im(pc_start - s->cs_base);
4833 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
4834 gen_helper_ljmp_protected(cpu_env, cpu_tmp2_i32, cpu_T[1],
4835 tcg_const_i32(s->pc - pc_start));
4836 } else {
4837 gen_op_movl_seg_T0_vm(R_CS);
4838 gen_op_movl_T0_T1();
4839 gen_op_jmp_T0();
4841 gen_eob(s);
4842 break;
4843 case 6: /* push Ev */
4844 gen_push_T0(s);
4845 break;
4846 default:
4847 goto illegal_op;
4849 break;
4851 case 0x84: /* test Ev, Gv */
4852 case 0x85:
4853 if ((b & 1) == 0)
4854 ot = OT_BYTE;
4855 else
4856 ot = dflag + OT_WORD;
4858 modrm = cpu_ldub_code(env, s->pc++);
4859 reg = ((modrm >> 3) & 7) | rex_r;
4861 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
4862 gen_op_mov_TN_reg(ot, 1, reg);
4863 gen_op_testl_T0_T1_cc();
4864 set_cc_op(s, CC_OP_LOGICB + ot);
4865 break;
4867 case 0xa8: /* test eAX, Iv */
4868 case 0xa9:
4869 if ((b & 1) == 0)
4870 ot = OT_BYTE;
4871 else
4872 ot = dflag + OT_WORD;
4873 val = insn_get(env, s, ot);
4875 gen_op_mov_TN_reg(ot, 0, OR_EAX);
4876 gen_op_movl_T1_im(val);
4877 gen_op_testl_T0_T1_cc();
4878 set_cc_op(s, CC_OP_LOGICB + ot);
4879 break;
4881 case 0x98: /* CWDE/CBW */
4882 #ifdef TARGET_X86_64
4883 if (dflag == 2) {
4884 gen_op_mov_TN_reg(OT_LONG, 0, R_EAX);
4885 tcg_gen_ext32s_tl(cpu_T[0], cpu_T[0]);
4886 gen_op_mov_reg_T0(OT_QUAD, R_EAX);
4887 } else
4888 #endif
4889 if (dflag == 1) {
4890 gen_op_mov_TN_reg(OT_WORD, 0, R_EAX);
4891 tcg_gen_ext16s_tl(cpu_T[0], cpu_T[0]);
4892 gen_op_mov_reg_T0(OT_LONG, R_EAX);
4893 } else {
4894 gen_op_mov_TN_reg(OT_BYTE, 0, R_EAX);
4895 tcg_gen_ext8s_tl(cpu_T[0], cpu_T[0]);
4896 gen_op_mov_reg_T0(OT_WORD, R_EAX);
4898 break;
4899 case 0x99: /* CDQ/CWD */
4900 #ifdef TARGET_X86_64
4901 if (dflag == 2) {
4902 gen_op_mov_TN_reg(OT_QUAD, 0, R_EAX);
4903 tcg_gen_sari_tl(cpu_T[0], cpu_T[0], 63);
4904 gen_op_mov_reg_T0(OT_QUAD, R_EDX);
4905 } else
4906 #endif
4907 if (dflag == 1) {
4908 gen_op_mov_TN_reg(OT_LONG, 0, R_EAX);
4909 tcg_gen_ext32s_tl(cpu_T[0], cpu_T[0]);
4910 tcg_gen_sari_tl(cpu_T[0], cpu_T[0], 31);
4911 gen_op_mov_reg_T0(OT_LONG, R_EDX);
4912 } else {
4913 gen_op_mov_TN_reg(OT_WORD, 0, R_EAX);
4914 tcg_gen_ext16s_tl(cpu_T[0], cpu_T[0]);
4915 tcg_gen_sari_tl(cpu_T[0], cpu_T[0], 15);
4916 gen_op_mov_reg_T0(OT_WORD, R_EDX);
4918 break;
4919 case 0x1af: /* imul Gv, Ev */
4920 case 0x69: /* imul Gv, Ev, I */
4921 case 0x6b:
4922 ot = dflag + OT_WORD;
4923 modrm = cpu_ldub_code(env, s->pc++);
4924 reg = ((modrm >> 3) & 7) | rex_r;
4925 if (b == 0x69)
4926 s->rip_offset = insn_const_size(ot);
4927 else if (b == 0x6b)
4928 s->rip_offset = 1;
4929 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
4930 if (b == 0x69) {
4931 val = insn_get(env, s, ot);
4932 gen_op_movl_T1_im(val);
4933 } else if (b == 0x6b) {
4934 val = (int8_t)insn_get(env, s, OT_BYTE);
4935 gen_op_movl_T1_im(val);
4936 } else {
4937 gen_op_mov_TN_reg(ot, 1, reg);
4940 #ifdef TARGET_X86_64
4941 if (ot == OT_QUAD) {
4942 gen_helper_imulq_T0_T1(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
4943 } else
4944 #endif
4945 if (ot == OT_LONG) {
4946 #ifdef TARGET_X86_64
4947 tcg_gen_ext32s_tl(cpu_T[0], cpu_T[0]);
4948 tcg_gen_ext32s_tl(cpu_T[1], cpu_T[1]);
4949 tcg_gen_mul_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
4950 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
4951 tcg_gen_ext32s_tl(cpu_tmp0, cpu_T[0]);
4952 tcg_gen_sub_tl(cpu_cc_src, cpu_T[0], cpu_tmp0);
4953 #else
4954 {
4955 TCGv_i64 t0, t1;
4956 t0 = tcg_temp_new_i64();
4957 t1 = tcg_temp_new_i64();
4958 tcg_gen_ext_i32_i64(t0, cpu_T[0]);
4959 tcg_gen_ext_i32_i64(t1, cpu_T[1]);
4960 tcg_gen_mul_i64(t0, t0, t1);
4961 tcg_gen_trunc_i64_i32(cpu_T[0], t0);
4962 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
4963 tcg_gen_sari_tl(cpu_tmp0, cpu_T[0], 31);
4964 tcg_gen_shri_i64(t0, t0, 32);
4965 tcg_gen_trunc_i64_i32(cpu_T[1], t0);
4966 tcg_gen_sub_tl(cpu_cc_src, cpu_T[1], cpu_tmp0);
4967 }
4968 #endif
4969 } else {
4970 tcg_gen_ext16s_tl(cpu_T[0], cpu_T[0]);
4971 tcg_gen_ext16s_tl(cpu_T[1], cpu_T[1]);
4972 /* XXX: use 32 bit mul which could be faster */
4973 tcg_gen_mul_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
4974 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
4975 tcg_gen_ext16s_tl(cpu_tmp0, cpu_T[0]);
4976 tcg_gen_sub_tl(cpu_cc_src, cpu_T[0], cpu_tmp0);
4977 }
4978 gen_op_mov_reg_T0(ot, reg);
4979 set_cc_op(s, CC_OP_MULB + ot);
4980 break;
4981 case 0x1c0:
4982 case 0x1c1: /* xadd Ev, Gv */
4983 if ((b & 1) == 0)
4984 ot = OT_BYTE;
4985 else
4986 ot = dflag + OT_WORD;
4987 modrm = cpu_ldub_code(env, s->pc++);
4988 reg = ((modrm >> 3) & 7) | rex_r;
4989 mod = (modrm >> 6) & 3;
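/* XADD: the destination receives old dest + src, while the source
   register receives the original destination value */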
4990 if (mod == 3) {
4991 rm = (modrm & 7) | REX_B(s);
4992 gen_op_mov_TN_reg(ot, 0, reg);
4993 gen_op_mov_TN_reg(ot, 1, rm);
4994 gen_op_addl_T0_T1();
4995 gen_op_mov_reg_T1(ot, reg);
4996 gen_op_mov_reg_T0(ot, rm);
4997 } else {
4998 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
4999 gen_op_mov_TN_reg(ot, 0, reg);
5000 gen_op_ld_T1_A0(ot + s->mem_index);
5001 gen_op_addl_T0_T1();
5002 gen_op_st_T0_A0(ot + s->mem_index);
5003 gen_op_mov_reg_T1(ot, reg);
5005 gen_op_update2_cc();
5006 set_cc_op(s, CC_OP_ADDB + ot);
5007 break;
5008 case 0x1b0:
5009 case 0x1b1: /* cmpxchg Ev, Gv */
5010 {
5011 int label1, label2;
5012 TCGv t0, t1, t2, a0;
5014 if ((b & 1) == 0)
5015 ot = OT_BYTE;
5016 else
5017 ot = dflag + OT_WORD;
5018 modrm = cpu_ldub_code(env, s->pc++);
5019 reg = ((modrm >> 3) & 7) | rex_r;
5020 mod = (modrm >> 6) & 3;
5021 t0 = tcg_temp_local_new();
5022 t1 = tcg_temp_local_new();
5023 t2 = tcg_temp_local_new();
5024 a0 = tcg_temp_local_new();
5025 gen_op_mov_v_reg(ot, t1, reg);
5026 if (mod == 3) {
5027 rm = (modrm & 7) | REX_B(s);
5028 gen_op_mov_v_reg(ot, t0, rm);
5029 } else {
5030 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5031 tcg_gen_mov_tl(a0, cpu_A0);
5032 gen_op_ld_v(ot + s->mem_index, t0, a0);
5033 rm = 0; /* avoid warning */
5035 label1 = gen_new_label();
5036 tcg_gen_mov_tl(t2, cpu_regs[R_EAX]);
5037 gen_extu(ot, t0);
5038 gen_extu(ot, t2);
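/* branch to label1 if EAX == dest (success: write the new value);
   fall through on mismatch and load the old value into EAX */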
5039 tcg_gen_brcond_tl(TCG_COND_EQ, t2, t0, label1);
5040 label2 = gen_new_label();
5041 if (mod == 3) {
5042 gen_op_mov_reg_v(ot, R_EAX, t0);
5043 tcg_gen_br(label2);
5044 gen_set_label(label1);
5045 gen_op_mov_reg_v(ot, rm, t1);
5046 } else {
5047 /* perform no-op store cycle like physical cpu; must be
5048 before changing accumulator to ensure idempotency if
5049 the store faults and the instruction is restarted */
5050 gen_op_st_v(ot + s->mem_index, t0, a0);
5051 gen_op_mov_reg_v(ot, R_EAX, t0);
5052 tcg_gen_br(label2);
5053 gen_set_label(label1);
5054 gen_op_st_v(ot + s->mem_index, t1, a0);
5055 }
5056 gen_set_label(label2);
5057 tcg_gen_mov_tl(cpu_cc_src, t0);
5058 tcg_gen_mov_tl(cpu_cc_srcT, t2);
5059 tcg_gen_sub_tl(cpu_cc_dst, t2, t0);
5060 set_cc_op(s, CC_OP_SUBB + ot);
5061 tcg_temp_free(t0);
5062 tcg_temp_free(t1);
5063 tcg_temp_free(t2);
5064 tcg_temp_free(a0);
5065 }
5066 break;
5067 case 0x1c7: /* cmpxchg8b */
5068 modrm = cpu_ldub_code(env, s->pc++);
5069 mod = (modrm >> 6) & 3;
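/* cmpxchg8b/16b requires a memory operand with ModRM reg field /1 */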
5070 if ((mod == 3) || ((modrm & 0x38) != 0x8))
5071 goto illegal_op;
5072 #ifdef TARGET_X86_64
5073 if (dflag == 2) {
5074 if (!(s->cpuid_ext_features & CPUID_EXT_CX16))
5075 goto illegal_op;
5076 gen_jmp_im(pc_start - s->cs_base);
5077 gen_update_cc_op(s);
5078 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5079 gen_helper_cmpxchg16b(cpu_env, cpu_A0);
5080 } else
5081 #endif
5082 {
5083 if (!(s->cpuid_features & CPUID_CX8))
5084 goto illegal_op;
5085 gen_jmp_im(pc_start - s->cs_base);
5086 gen_update_cc_op(s);
5087 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5088 gen_helper_cmpxchg8b(cpu_env, cpu_A0);
5089 }
5090 set_cc_op(s, CC_OP_EFLAGS);
5091 break;
5093 /**************************/
5094 /* push/pop */
5095 case 0x50 ... 0x57: /* push */
5096 gen_op_mov_TN_reg(OT_LONG, 0, (b & 7) | REX_B(s));
5097 gen_push_T0(s);
5098 break;
5099 case 0x58 ... 0x5f: /* pop */
5100 if (CODE64(s)) {
5101 ot = dflag ? OT_QUAD : OT_WORD;
5102 } else {
5103 ot = dflag + OT_WORD;
5105 gen_pop_T0(s);
5106 /* NOTE: order is important for pop %sp */
5107 gen_pop_update(s);
5108 gen_op_mov_reg_T0(ot, (b & 7) | REX_B(s));
5109 break;
5110 case 0x60: /* pusha */
5111 if (CODE64(s))
5112 goto illegal_op;
5113 gen_pusha(s);
5114 break;
5115 case 0x61: /* popa */
5116 if (CODE64(s))
5117 goto illegal_op;
5118 gen_popa(s);
5119 break;
5120 case 0x68: /* push Iv */
5121 case 0x6a:
5122 if (CODE64(s)) {
5123 ot = dflag ? OT_QUAD : OT_WORD;
5124 } else {
5125 ot = dflag + OT_WORD;
5127 if (b == 0x68)
5128 val = insn_get(env, s, ot);
5129 else
5130 val = (int8_t)insn_get(env, s, OT_BYTE);
5131 gen_op_movl_T0_im(val);
5132 gen_push_T0(s);
5133 break;
5134 case 0x8f: /* pop Ev */
5135 if (CODE64(s)) {
5136 ot = dflag ? OT_QUAD : OT_WORD;
5137 } else {
5138 ot = dflag + OT_WORD;
5140 modrm = cpu_ldub_code(env, s->pc++);
5141 mod = (modrm >> 6) & 3;
5142 gen_pop_T0(s);
5143 if (mod == 3) {
5144 /* NOTE: order is important for pop %sp */
5145 gen_pop_update(s);
5146 rm = (modrm & 7) | REX_B(s);
5147 gen_op_mov_reg_T0(ot, rm);
5148 } else {
5149 /* NOTE: order is important too for MMU exceptions */
5150 s->popl_esp_hack = 1 << ot;
5151 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 1);
5152 s->popl_esp_hack = 0;
5153 gen_pop_update(s);
5155 break;
5156 case 0xc8: /* enter */
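/* ENTER imm16, imm8: imm16 is the stack frame size, imm8 the
   lexical nesting level */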
5157 {
5158 int level;
5159 val = cpu_lduw_code(env, s->pc);
5160 s->pc += 2;
5161 level = cpu_ldub_code(env, s->pc++);
5162 gen_enter(s, val, level);
5163 }
5164 break;
5165 case 0xc9: /* leave */
5166 /* XXX: exception not precise (ESP is updated before potential exception) */
5167 if (CODE64(s)) {
5168 gen_op_mov_TN_reg(OT_QUAD, 0, R_EBP);
5169 gen_op_mov_reg_T0(OT_QUAD, R_ESP);
5170 } else if (s->ss32) {
5171 gen_op_mov_TN_reg(OT_LONG, 0, R_EBP);
5172 gen_op_mov_reg_T0(OT_LONG, R_ESP);
5173 } else {
5174 gen_op_mov_TN_reg(OT_WORD, 0, R_EBP);
5175 gen_op_mov_reg_T0(OT_WORD, R_ESP);
5177 gen_pop_T0(s);
5178 if (CODE64(s)) {
5179 ot = dflag ? OT_QUAD : OT_WORD;
5180 } else {
5181 ot = dflag + OT_WORD;
5183 gen_op_mov_reg_T0(ot, R_EBP);
5184 gen_pop_update(s);
5185 break;
5186 case 0x06: /* push es */
5187 case 0x0e: /* push cs */
5188 case 0x16: /* push ss */
5189 case 0x1e: /* push ds */
5190 if (CODE64(s))
5191 goto illegal_op;
5192 gen_op_movl_T0_seg(b >> 3);
5193 gen_push_T0(s);
5194 break;
5195 case 0x1a0: /* push fs */
5196 case 0x1a8: /* push gs */
5197 gen_op_movl_T0_seg((b >> 3) & 7);
5198 gen_push_T0(s);
5199 break;
5200 case 0x07: /* pop es */
5201 case 0x17: /* pop ss */
5202 case 0x1f: /* pop ds */
5203 if (CODE64(s))
5204 goto illegal_op;
5205 reg = b >> 3;
5206 gen_pop_T0(s);
5207 gen_movl_seg_T0(s, reg, pc_start - s->cs_base);
5208 gen_pop_update(s);
5209 if (reg == R_SS) {
5210 /* if reg == SS, inhibit interrupts/trace. */
5211 /* If several consecutive instructions disable interrupts, only
5212 the first one takes effect. */
5213 if (!(s->tb->flags & HF_INHIBIT_IRQ_MASK))
5214 gen_helper_set_inhibit_irq(cpu_env);
5215 s->tf = 0;
5217 if (s->is_jmp) {
5218 gen_jmp_im(s->pc - s->cs_base);
5219 gen_eob(s);
5221 break;
5222 case 0x1a1: /* pop fs */
5223 case 0x1a9: /* pop gs */
5224 gen_pop_T0(s);
5225 gen_movl_seg_T0(s, (b >> 3) & 7, pc_start - s->cs_base);
5226 gen_pop_update(s);
5227 if (s->is_jmp) {
5228 gen_jmp_im(s->pc - s->cs_base);
5229 gen_eob(s);
5231 break;
5233 /**************************/
5234 /* mov */
5235 case 0x88:
5236 case 0x89: /* mov Gv, Ev */
5237 if ((b & 1) == 0)
5238 ot = OT_BYTE;
5239 else
5240 ot = dflag + OT_WORD;
5241 modrm = cpu_ldub_code(env, s->pc++);
5242 reg = ((modrm >> 3) & 7) | rex_r;
5244 /* generate a generic store */
5245 gen_ldst_modrm(env, s, modrm, ot, reg, 1);
5246 break;
5247 case 0xc6:
5248 case 0xc7: /* mov Ev, Iv */
5249 if ((b & 1) == 0)
5250 ot = OT_BYTE;
5251 else
5252 ot = dflag + OT_WORD;
5253 modrm = cpu_ldub_code(env, s->pc++);
5254 mod = (modrm >> 6) & 3;
5255 if (mod != 3) {
5256 s->rip_offset = insn_const_size(ot);
5257 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5259 val = insn_get(env, s, ot);
5260 gen_op_movl_T0_im(val);
5261 if (mod != 3)
5262 gen_op_st_T0_A0(ot + s->mem_index);
5263 else
5264 gen_op_mov_reg_T0(ot, (modrm & 7) | REX_B(s));
5265 break;
5266 case 0x8a:
5267 case 0x8b: /* mov Ev, Gv */
5268 if ((b & 1) == 0)
5269 ot = OT_BYTE;
5270 else
5271 ot = OT_WORD + dflag;
5272 modrm = cpu_ldub_code(env, s->pc++);
5273 reg = ((modrm >> 3) & 7) | rex_r;
5275 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
5276 gen_op_mov_reg_T0(ot, reg);
5277 break;
5278 case 0x8e: /* mov seg, Gv */
5279 modrm = cpu_ldub_code(env, s->pc++);
5280 reg = (modrm >> 3) & 7;
5281 if (reg >= 6 || reg == R_CS)
5282 goto illegal_op;
5283 gen_ldst_modrm(env, s, modrm, OT_WORD, OR_TMP0, 0);
5284 gen_movl_seg_T0(s, reg, pc_start - s->cs_base);
5285 if (reg == R_SS) {
5286 /* if reg == SS, inhibit interrupts/trace */
5287 /* If several consecutive instructions disable interrupts, only
5288 the first one takes effect. */
5289 if (!(s->tb->flags & HF_INHIBIT_IRQ_MASK))
5290 gen_helper_set_inhibit_irq(cpu_env);
5291 s->tf = 0;
5293 if (s->is_jmp) {
5294 gen_jmp_im(s->pc - s->cs_base);
5295 gen_eob(s);
5297 break;
5298 case 0x8c: /* mov Gv, seg */
5299 modrm = cpu_ldub_code(env, s->pc++);
5300 reg = (modrm >> 3) & 7;
5301 mod = (modrm >> 6) & 3;
5302 if (reg >= 6)
5303 goto illegal_op;
5304 gen_op_movl_T0_seg(reg);
5305 if (mod == 3)
5306 ot = OT_WORD + dflag;
5307 else
5308 ot = OT_WORD;
5309 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 1);
5310 break;
5312 case 0x1b6: /* movzbS Gv, Eb */
5313 case 0x1b7: /* movzwS Gv, Eb */
5314 case 0x1be: /* movsbS Gv, Eb */
5315 case 0x1bf: /* movswS Gv, Eb */
5317 int d_ot;
5318 /* d_ot is the size of destination */
5319 d_ot = dflag + OT_WORD;
5320 /* ot is the size of source */
5321 ot = (b & 1) + OT_BYTE;
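/* bit 3 of the opcode selects sign extension (movsx) vs zero
   extension (movzx) */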
5322 modrm = cpu_ldub_code(env, s->pc++);
5323 reg = ((modrm >> 3) & 7) | rex_r;
5324 mod = (modrm >> 6) & 3;
5325 rm = (modrm & 7) | REX_B(s);
5327 if (mod == 3) {
5328 gen_op_mov_TN_reg(ot, 0, rm);
5329 switch(ot | (b & 8)) {
5330 case OT_BYTE:
5331 tcg_gen_ext8u_tl(cpu_T[0], cpu_T[0]);
5332 break;
5333 case OT_BYTE | 8:
5334 tcg_gen_ext8s_tl(cpu_T[0], cpu_T[0]);
5335 break;
5336 case OT_WORD:
5337 tcg_gen_ext16u_tl(cpu_T[0], cpu_T[0]);
5338 break;
5339 default:
5340 case OT_WORD | 8:
5341 tcg_gen_ext16s_tl(cpu_T[0], cpu_T[0]);
5342 break;
5344 gen_op_mov_reg_T0(d_ot, reg);
5345 } else {
5346 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5347 if (b & 8) {
5348 gen_op_lds_T0_A0(ot + s->mem_index);
5349 } else {
5350 gen_op_ldu_T0_A0(ot + s->mem_index);
5352 gen_op_mov_reg_T0(d_ot, reg);
5355 break;
5357 case 0x8d: /* lea */
5358 ot = dflag + OT_WORD;
5359 modrm = cpu_ldub_code(env, s->pc++);
5360 mod = (modrm >> 6) & 3;
5361 if (mod == 3)
5362 goto illegal_op;
5363 reg = ((modrm >> 3) & 7) | rex_r;
5364 /* we must ensure that no segment is added */
5365 s->override = -1;
5366 val = s->addseg;
5367 s->addseg = 0;
5368 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5369 s->addseg = val;
5370 gen_op_mov_reg_A0(ot - OT_WORD, reg);
5371 break;
5373 case 0xa0: /* mov EAX, Ov */
5374 case 0xa1:
5375 case 0xa2: /* mov Ov, EAX */
5376 case 0xa3:
5378 target_ulong offset_addr;
5380 if ((b & 1) == 0)
5381 ot = OT_BYTE;
5382 else
5383 ot = dflag + OT_WORD;
5384 #ifdef TARGET_X86_64
5385 if (s->aflag == 2) {
5386 offset_addr = cpu_ldq_code(env, s->pc);
5387 s->pc += 8;
5388 gen_op_movq_A0_im(offset_addr);
5389 } else
5390 #endif
5392 if (s->aflag) {
5393 offset_addr = insn_get(env, s, OT_LONG);
5394 } else {
5395 offset_addr = insn_get(env, s, OT_WORD);
5397 gen_op_movl_A0_im(offset_addr);
5399 gen_add_A0_ds_seg(s);
5400 if ((b & 2) == 0) {
5401 gen_op_ld_T0_A0(ot + s->mem_index);
5402 gen_op_mov_reg_T0(ot, R_EAX);
5403 } else {
5404 gen_op_mov_TN_reg(ot, 0, R_EAX);
5405 gen_op_st_T0_A0(ot + s->mem_index);
5408 break;
5409 case 0xd7: /* xlat */
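/* XLAT: AL = [seg:rBX + unsigned AL], segment defaults to DS */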
5410 #ifdef TARGET_X86_64
5411 if (s->aflag == 2) {
5412 gen_op_movq_A0_reg(R_EBX);
5413 gen_op_mov_TN_reg(OT_QUAD, 0, R_EAX);
5414 tcg_gen_andi_tl(cpu_T[0], cpu_T[0], 0xff);
5415 tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_T[0]);
5416 } else
5417 #endif
5419 gen_op_movl_A0_reg(R_EBX);
5420 gen_op_mov_TN_reg(OT_LONG, 0, R_EAX);
5421 tcg_gen_andi_tl(cpu_T[0], cpu_T[0], 0xff);
5422 tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_T[0]);
5423 if (s->aflag == 0)
5424 gen_op_andl_A0_ffff();
5425 else
5426 tcg_gen_andi_tl(cpu_A0, cpu_A0, 0xffffffff);
5428 gen_add_A0_ds_seg(s);
5429 gen_op_ldu_T0_A0(OT_BYTE + s->mem_index);
5430 gen_op_mov_reg_T0(OT_BYTE, R_EAX);
5431 break;
5432 case 0xb0 ... 0xb7: /* mov R, Ib */
5433 val = insn_get(env, s, OT_BYTE);
5434 gen_op_movl_T0_im(val);
5435 gen_op_mov_reg_T0(OT_BYTE, (b & 7) | REX_B(s));
5436 break;
5437 case 0xb8 ... 0xbf: /* mov R, Iv */
5438 #ifdef TARGET_X86_64
5439 if (dflag == 2) {
5440 uint64_t tmp;
5441 /* 64 bit case */
5442 tmp = cpu_ldq_code(env, s->pc);
5443 s->pc += 8;
5444 reg = (b & 7) | REX_B(s);
5445 gen_movtl_T0_im(tmp);
5446 gen_op_mov_reg_T0(OT_QUAD, reg);
5447 } else
5448 #endif
5450 ot = dflag ? OT_LONG : OT_WORD;
5451 val = insn_get(env, s, ot);
5452 reg = (b & 7) | REX_B(s);
5453 gen_op_movl_T0_im(val);
5454 gen_op_mov_reg_T0(ot, reg);
5456 break;
5458 case 0x91 ... 0x97: /* xchg R, EAX */
5459 do_xchg_reg_eax:
5460 ot = dflag + OT_WORD;
5461 reg = (b & 7) | REX_B(s);
5462 rm = R_EAX;
5463 goto do_xchg_reg;
5464 case 0x86:
5465 case 0x87: /* xchg Ev, Gv */
5466 if ((b & 1) == 0)
5467 ot = OT_BYTE;
5468 else
5469 ot = dflag + OT_WORD;
5470 modrm = cpu_ldub_code(env, s->pc++);
5471 reg = ((modrm >> 3) & 7) | rex_r;
5472 mod = (modrm >> 6) & 3;
5473 if (mod == 3) {
5474 rm = (modrm & 7) | REX_B(s);
5475 do_xchg_reg:
5476 gen_op_mov_TN_reg(ot, 0, reg);
5477 gen_op_mov_TN_reg(ot, 1, rm);
5478 gen_op_mov_reg_T0(ot, rm);
5479 gen_op_mov_reg_T1(ot, reg);
5480 } else {
5481 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5482 gen_op_mov_TN_reg(ot, 0, reg);
5483 /* for xchg, lock is implicit */
5484 if (!(prefixes & PREFIX_LOCK))
5485 gen_helper_lock();
5486 gen_op_ld_T1_A0(ot + s->mem_index);
5487 gen_op_st_T0_A0(ot + s->mem_index);
5488 if (!(prefixes & PREFIX_LOCK))
5489 gen_helper_unlock();
5490 gen_op_mov_reg_T1(ot, reg);
5492 break;
5493 case 0xc4: /* les Gv */
5494 if (CODE64(s))
5495 goto illegal_op;
5496 op = R_ES;
5497 goto do_lxx;
5498 case 0xc5: /* lds Gv */
5499 if (CODE64(s))
5500 goto illegal_op;
5501 op = R_DS;
5502 goto do_lxx;
5503 case 0x1b2: /* lss Gv */
5504 op = R_SS;
5505 goto do_lxx;
5506 case 0x1b4: /* lfs Gv */
5507 op = R_FS;
5508 goto do_lxx;
5509 case 0x1b5: /* lgs Gv */
5510 op = R_GS;
5511 do_lxx:
5512 ot = dflag ? OT_LONG : OT_WORD;
5513 modrm = cpu_ldub_code(env, s->pc++);
5514 reg = ((modrm >> 3) & 7) | rex_r;
5515 mod = (modrm >> 6) & 3;
5516 if (mod == 3)
5517 goto illegal_op;
5518 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5519 gen_op_ld_T1_A0(ot + s->mem_index);
5520 gen_add_A0_im(s, 1 << (ot - OT_WORD + 1));
5521 /* load the segment first to handle exceptions properly */
5522 gen_op_ldu_T0_A0(OT_WORD + s->mem_index);
5523 gen_movl_seg_T0(s, op, pc_start - s->cs_base);
5524 /* then put the data */
5525 gen_op_mov_reg_T1(ot, reg);
5526 if (s->is_jmp) {
5527 gen_jmp_im(s->pc - s->cs_base);
5528 gen_eob(s);
5530 break;
5532 /************************/
5533 /* shifts */
5534 case 0xc0:
5535 case 0xc1:
5536 /* shift Ev,Ib */
5537 shift = 2;
5538 grp2:
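/* shift encodes the count source: 0 = CL, 1 = constant 1,
   2 = immediate byte read below */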
5540 if ((b & 1) == 0)
5541 ot = OT_BYTE;
5542 else
5543 ot = dflag + OT_WORD;
5545 modrm = cpu_ldub_code(env, s->pc++);
5546 mod = (modrm >> 6) & 3;
5547 op = (modrm >> 3) & 7;
5549 if (mod != 3) {
5550 if (shift == 2) {
5551 s->rip_offset = 1;
5553 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5554 opreg = OR_TMP0;
5555 } else {
5556 opreg = (modrm & 7) | REX_B(s);
5559 /* simpler op */
5560 if (shift == 0) {
5561 gen_shift(s, op, ot, opreg, OR_ECX);
5562 } else {
5563 if (shift == 2) {
5564 shift = cpu_ldub_code(env, s->pc++);
5566 gen_shifti(s, op, ot, opreg, shift);
5569 break;
5570 case 0xd0:
5571 case 0xd1:
5572 /* shift Ev,1 */
5573 shift = 1;
5574 goto grp2;
5575 case 0xd2:
5576 case 0xd3:
5577 /* shift Ev,cl */
5578 shift = 0;
5579 goto grp2;
5581 case 0x1a4: /* shld imm */
5582 op = 0;
5583 shift = 1;
5584 goto do_shiftd;
5585 case 0x1a5: /* shld cl */
5586 op = 0;
5587 shift = 0;
5588 goto do_shiftd;
5589 case 0x1ac: /* shrd imm */
5590 op = 1;
5591 shift = 1;
5592 goto do_shiftd;
5593 case 0x1ad: /* shrd cl */
5594 op = 1;
5595 shift = 0;
5596 do_shiftd:
5597 ot = dflag + OT_WORD;
5598 modrm = cpu_ldub_code(env, s->pc++);
5599 mod = (modrm >> 6) & 3;
5600 rm = (modrm & 7) | REX_B(s);
5601 reg = ((modrm >> 3) & 7) | rex_r;
5602 if (mod != 3) {
5603 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5604 opreg = OR_TMP0;
5605 } else {
5606 opreg = rm;
5608 gen_op_mov_TN_reg(ot, 1, reg);
5610 if (shift) {
5611 TCGv imm = tcg_const_tl(cpu_ldub_code(env, s->pc++));
5612 gen_shiftd_rm_T1(s, ot, opreg, op, imm);
5613 tcg_temp_free(imm);
5614 } else {
5615 gen_shiftd_rm_T1(s, ot, opreg, op, cpu_regs[R_ECX]);
5617 break;
5619 /************************/
5620 /* floats */
5621 case 0xd8 ... 0xdf:
5622 if (s->flags & (HF_EM_MASK | HF_TS_MASK)) {
5623 /* if CR0.EM or CR0.TS are set, generate an FPU exception */
5624 /* XXX: what to do on an illegal op? */
5625 gen_exception(s, EXCP07_PREX, pc_start - s->cs_base);
5626 break;
5628 modrm = cpu_ldub_code(env, s->pc++);
5629 mod = (modrm >> 6) & 3;
5630 rm = modrm & 7;
5631 op = ((b & 7) << 3) | ((modrm >> 3) & 7);
5632 if (mod != 3) {
5633 /* memory op */
5634 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5635 switch(op) {
5636 case 0x00 ... 0x07: /* fxxxs */
5637 case 0x10 ... 0x17: /* fixxxl */
5638 case 0x20 ... 0x27: /* fxxxl */
5639 case 0x30 ... 0x37: /* fixxx */
5641 int op1;
5642 op1 = op & 7;
5644 switch(op >> 4) {
5645 case 0:
5646 gen_op_ld_T0_A0(OT_LONG + s->mem_index);
5647 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
5648 gen_helper_flds_FT0(cpu_env, cpu_tmp2_i32);
5649 break;
5650 case 1:
5651 gen_op_ld_T0_A0(OT_LONG + s->mem_index);
5652 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
5653 gen_helper_fildl_FT0(cpu_env, cpu_tmp2_i32);
5654 break;
5655 case 2:
5656 tcg_gen_qemu_ld64(cpu_tmp1_i64, cpu_A0,
5657 (s->mem_index >> 2) - 1);
5658 gen_helper_fldl_FT0(cpu_env, cpu_tmp1_i64);
5659 break;
5660 case 3:
5661 default:
5662 gen_op_lds_T0_A0(OT_WORD + s->mem_index);
5663 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
5664 gen_helper_fildl_FT0(cpu_env, cpu_tmp2_i32);
5665 break;
5668 gen_helper_fp_arith_ST0_FT0(op1);
5669 if (op1 == 3) {
5670 /* fcomp needs pop */
5671 gen_helper_fpop(cpu_env);
5674 break;
5675 case 0x08: /* flds */
5676 case 0x0a: /* fsts */
5677 case 0x0b: /* fstps */
5678 case 0x18 ... 0x1b: /* fildl, fisttpl, fistl, fistpl */
5679 case 0x28 ... 0x2b: /* fldl, fisttpll, fstl, fstpl */
5680 case 0x38 ... 0x3b: /* filds, fisttps, fists, fistps */
5681 switch(op & 7) {
5682 case 0:
5683 switch(op >> 4) {
5684 case 0:
5685 gen_op_ld_T0_A0(OT_LONG + s->mem_index);
5686 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
5687 gen_helper_flds_ST0(cpu_env, cpu_tmp2_i32);
5688 break;
5689 case 1:
5690 gen_op_ld_T0_A0(OT_LONG + s->mem_index);
5691 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
5692 gen_helper_fildl_ST0(cpu_env, cpu_tmp2_i32);
5693 break;
5694 case 2:
5695 tcg_gen_qemu_ld64(cpu_tmp1_i64, cpu_A0,
5696 (s->mem_index >> 2) - 1);
5697 gen_helper_fldl_ST0(cpu_env, cpu_tmp1_i64);
5698 break;
5699 case 3:
5700 default:
5701 gen_op_lds_T0_A0(OT_WORD + s->mem_index);
5702 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
5703 gen_helper_fildl_ST0(cpu_env, cpu_tmp2_i32);
5704 break;
5706 break;
5707 case 1:
5708 /* XXX: the corresponding CPUID bit (SSE3, for fisttp) should be tested! */
5709 switch(op >> 4) {
5710 case 1:
5711 gen_helper_fisttl_ST0(cpu_tmp2_i32, cpu_env);
5712 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
5713 gen_op_st_T0_A0(OT_LONG + s->mem_index);
5714 break;
5715 case 2:
5716 gen_helper_fisttll_ST0(cpu_tmp1_i64, cpu_env);
5717 tcg_gen_qemu_st64(cpu_tmp1_i64, cpu_A0,
5718 (s->mem_index >> 2) - 1);
5719 break;
5720 case 3:
5721 default:
5722 gen_helper_fistt_ST0(cpu_tmp2_i32, cpu_env);
5723 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
5724 gen_op_st_T0_A0(OT_WORD + s->mem_index);
5725 break;
5727 gen_helper_fpop(cpu_env);
5728 break;
5729 default:
5730 switch(op >> 4) {
5731 case 0:
5732 gen_helper_fsts_ST0(cpu_tmp2_i32, cpu_env);
5733 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
5734 gen_op_st_T0_A0(OT_LONG + s->mem_index);
5735 break;
5736 case 1:
5737 gen_helper_fistl_ST0(cpu_tmp2_i32, cpu_env);
5738 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
5739 gen_op_st_T0_A0(OT_LONG + s->mem_index);
5740 break;
5741 case 2:
5742 gen_helper_fstl_ST0(cpu_tmp1_i64, cpu_env);
5743 tcg_gen_qemu_st64(cpu_tmp1_i64, cpu_A0,
5744 (s->mem_index >> 2) - 1);
5745 break;
5746 case 3:
5747 default:
5748 gen_helper_fist_ST0(cpu_tmp2_i32, cpu_env);
5749 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
5750 gen_op_st_T0_A0(OT_WORD + s->mem_index);
5751 break;
5753 if ((op & 7) == 3)
5754 gen_helper_fpop(cpu_env);
5755 break;
5757 break;
5758 case 0x0c: /* fldenv mem */
5759 gen_update_cc_op(s);
5760 gen_jmp_im(pc_start - s->cs_base);
5761 gen_helper_fldenv(cpu_env, cpu_A0, tcg_const_i32(s->dflag));
5762 break;
5763 case 0x0d: /* fldcw mem */
5764 gen_op_ld_T0_A0(OT_WORD + s->mem_index);
5765 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
5766 gen_helper_fldcw(cpu_env, cpu_tmp2_i32);
5767 break;
5768 case 0x0e: /* fnstenv mem */
5769 gen_update_cc_op(s);
5770 gen_jmp_im(pc_start - s->cs_base);
5771 gen_helper_fstenv(cpu_env, cpu_A0, tcg_const_i32(s->dflag));
5772 break;
5773 case 0x0f: /* fnstcw mem */
5774 gen_helper_fnstcw(cpu_tmp2_i32, cpu_env);
5775 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
5776 gen_op_st_T0_A0(OT_WORD + s->mem_index);
5777 break;
5778 case 0x1d: /* fldt mem */
5779 gen_update_cc_op(s);
5780 gen_jmp_im(pc_start - s->cs_base);
5781 gen_helper_fldt_ST0(cpu_env, cpu_A0);
5782 break;
5783 case 0x1f: /* fstpt mem */
5784 gen_update_cc_op(s);
5785 gen_jmp_im(pc_start - s->cs_base);
5786 gen_helper_fstt_ST0(cpu_env, cpu_A0);
5787 gen_helper_fpop(cpu_env);
5788 break;
5789 case 0x2c: /* frstor mem */
5790 gen_update_cc_op(s);
5791 gen_jmp_im(pc_start - s->cs_base);
5792 gen_helper_frstor(cpu_env, cpu_A0, tcg_const_i32(s->dflag));
5793 break;
5794 case 0x2e: /* fnsave mem */
5795 gen_update_cc_op(s);
5796 gen_jmp_im(pc_start - s->cs_base);
5797 gen_helper_fsave(cpu_env, cpu_A0, tcg_const_i32(s->dflag));
5798 break;
5799 case 0x2f: /* fnstsw mem */
5800 gen_helper_fnstsw(cpu_tmp2_i32, cpu_env);
5801 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
5802 gen_op_st_T0_A0(OT_WORD + s->mem_index);
5803 break;
5804 case 0x3c: /* fbld */
5805 gen_update_cc_op(s);
5806 gen_jmp_im(pc_start - s->cs_base);
5807 gen_helper_fbld_ST0(cpu_env, cpu_A0);
5808 break;
5809 case 0x3e: /* fbstp */
5810 gen_update_cc_op(s);
5811 gen_jmp_im(pc_start - s->cs_base);
5812 gen_helper_fbst_ST0(cpu_env, cpu_A0);
5813 gen_helper_fpop(cpu_env);
5814 break;
5815 case 0x3d: /* fildll */
5816 tcg_gen_qemu_ld64(cpu_tmp1_i64, cpu_A0,
5817 (s->mem_index >> 2) - 1);
5818 gen_helper_fildll_ST0(cpu_env, cpu_tmp1_i64);
5819 break;
5820 case 0x3f: /* fistpll */
5821 gen_helper_fistll_ST0(cpu_tmp1_i64, cpu_env);
5822 tcg_gen_qemu_st64(cpu_tmp1_i64, cpu_A0,
5823 (s->mem_index >> 2) - 1);
5824 gen_helper_fpop(cpu_env);
5825 break;
5826 default:
5827 goto illegal_op;
5829 } else {
5830 /* register float ops */
5831 opreg = rm;
5833 switch(op) {
5834 case 0x08: /* fld sti */
5835 gen_helper_fpush(cpu_env);
5836 gen_helper_fmov_ST0_STN(cpu_env,
5837 tcg_const_i32((opreg + 1) & 7));
5838 break;
5839 case 0x09: /* fxchg sti */
5840 case 0x29: /* fxchg4 sti, undocumented op */
5841 case 0x39: /* fxchg7 sti, undocumented op */
5842 gen_helper_fxchg_ST0_STN(cpu_env, tcg_const_i32(opreg));
5843 break;
5844 case 0x0a: /* grp d9/2 */
5845 switch(rm) {
5846 case 0: /* fnop */
5847 /* check exceptions (FreeBSD FPU probe) */
5848 gen_update_cc_op(s);
5849 gen_jmp_im(pc_start - s->cs_base);
5850 gen_helper_fwait(cpu_env);
5851 break;
5852 default:
5853 goto illegal_op;
5855 break;
5856 case 0x0c: /* grp d9/4 */
5857 switch(rm) {
5858 case 0: /* fchs */
5859 gen_helper_fchs_ST0(cpu_env);
5860 break;
5861 case 1: /* fabs */
5862 gen_helper_fabs_ST0(cpu_env);
5863 break;
5864 case 4: /* ftst */
5865 gen_helper_fldz_FT0(cpu_env);
5866 gen_helper_fcom_ST0_FT0(cpu_env);
5867 break;
5868 case 5: /* fxam */
5869 gen_helper_fxam_ST0(cpu_env);
5870 break;
5871 default:
5872 goto illegal_op;
5874 break;
5875 case 0x0d: /* grp d9/5 */
5877 switch(rm) {
5878 case 0:
5879 gen_helper_fpush(cpu_env);
5880 gen_helper_fld1_ST0(cpu_env);
5881 break;
5882 case 1:
5883 gen_helper_fpush(cpu_env);
5884 gen_helper_fldl2t_ST0(cpu_env);
5885 break;
5886 case 2:
5887 gen_helper_fpush(cpu_env);
5888 gen_helper_fldl2e_ST0(cpu_env);
5889 break;
5890 case 3:
5891 gen_helper_fpush(cpu_env);
5892 gen_helper_fldpi_ST0(cpu_env);
5893 break;
5894 case 4:
5895 gen_helper_fpush(cpu_env);
5896 gen_helper_fldlg2_ST0(cpu_env);
5897 break;
5898 case 5:
5899 gen_helper_fpush(cpu_env);
5900 gen_helper_fldln2_ST0(cpu_env);
5901 break;
5902 case 6:
5903 gen_helper_fpush(cpu_env);
5904 gen_helper_fldz_ST0(cpu_env);
5905 break;
5906 default:
5907 goto illegal_op;
5910 break;
5911 case 0x0e: /* grp d9/6 */
5912 switch(rm) {
5913 case 0: /* f2xm1 */
5914 gen_helper_f2xm1(cpu_env);
5915 break;
5916 case 1: /* fyl2x */
5917 gen_helper_fyl2x(cpu_env);
5918 break;
5919 case 2: /* fptan */
5920 gen_helper_fptan(cpu_env);
5921 break;
5922 case 3: /* fpatan */
5923 gen_helper_fpatan(cpu_env);
5924 break;
5925 case 4: /* fxtract */
5926 gen_helper_fxtract(cpu_env);
5927 break;
5928 case 5: /* fprem1 */
5929 gen_helper_fprem1(cpu_env);
5930 break;
5931 case 6: /* fdecstp */
5932 gen_helper_fdecstp(cpu_env);
5933 break;
5934 default:
5935 case 7: /* fincstp */
5936 gen_helper_fincstp(cpu_env);
5937 break;
5939 break;
5940 case 0x0f: /* grp d9/7 */
5941 switch(rm) {
5942 case 0: /* fprem */
5943 gen_helper_fprem(cpu_env);
5944 break;
5945 case 1: /* fyl2xp1 */
5946 gen_helper_fyl2xp1(cpu_env);
5947 break;
5948 case 2: /* fsqrt */
5949 gen_helper_fsqrt(cpu_env);
5950 break;
5951 case 3: /* fsincos */
5952 gen_helper_fsincos(cpu_env);
5953 break;
5954 case 5: /* fscale */
5955 gen_helper_fscale(cpu_env);
5956 break;
5957 case 4: /* frndint */
5958 gen_helper_frndint(cpu_env);
5959 break;
5960 case 6: /* fsin */
5961 gen_helper_fsin(cpu_env);
5962 break;
5963 default:
5964 case 7: /* fcos */
5965 gen_helper_fcos(cpu_env);
5966 break;
5968 break;
5969 case 0x00: case 0x01: case 0x04 ... 0x07: /* fxxx st, sti */
5970 case 0x20: case 0x21: case 0x24 ... 0x27: /* fxxx sti, st */
5971 case 0x30: case 0x31: case 0x34 ... 0x37: /* fxxxp sti, st */
5973 int op1;
5975 op1 = op & 7;
5976 if (op >= 0x20) {
5977 gen_helper_fp_arith_STN_ST0(op1, opreg);
5978 if (op >= 0x30)
5979 gen_helper_fpop(cpu_env);
5980 } else {
5981 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
5982 gen_helper_fp_arith_ST0_FT0(op1);
5985 break;
5986 case 0x02: /* fcom */
5987 case 0x22: /* fcom2, undocumented op */
5988 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
5989 gen_helper_fcom_ST0_FT0(cpu_env);
5990 break;
5991 case 0x03: /* fcomp */
5992 case 0x23: /* fcomp3, undocumented op */
5993 case 0x32: /* fcomp5, undocumented op */
5994 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
5995 gen_helper_fcom_ST0_FT0(cpu_env);
5996 gen_helper_fpop(cpu_env);
5997 break;
5998 case 0x15: /* da/5 */
5999 switch(rm) {
6000 case 1: /* fucompp */
6001 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(1));
6002 gen_helper_fucom_ST0_FT0(cpu_env);
6003 gen_helper_fpop(cpu_env);
6004 gen_helper_fpop(cpu_env);
6005 break;
6006 default:
6007 goto illegal_op;
6009 break;
6010 case 0x1c:
6011 switch(rm) {
6012 case 0: /* feni (287 only, just do nop here) */
6013 break;
6014 case 1: /* fdisi (287 only, just do nop here) */
6015 break;
6016 case 2: /* fclex */
6017 gen_helper_fclex(cpu_env);
6018 break;
6019 case 3: /* fninit */
6020 gen_helper_fninit(cpu_env);
6021 break;
6022 case 4: /* fsetpm (287 only, just do nop here) */
6023 break;
6024 default:
6025 goto illegal_op;
6027 break;
6028 case 0x1d: /* fucomi */
6029 gen_update_cc_op(s);
6030 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6031 gen_helper_fucomi_ST0_FT0(cpu_env);
6032 set_cc_op(s, CC_OP_EFLAGS);
6033 break;
6034 case 0x1e: /* fcomi */
6035 gen_update_cc_op(s);
6036 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6037 gen_helper_fcomi_ST0_FT0(cpu_env);
6038 set_cc_op(s, CC_OP_EFLAGS);
6039 break;
6040 case 0x28: /* ffree sti */
6041 gen_helper_ffree_STN(cpu_env, tcg_const_i32(opreg));
6042 break;
6043 case 0x2a: /* fst sti */
6044 gen_helper_fmov_STN_ST0(cpu_env, tcg_const_i32(opreg));
6045 break;
6046 case 0x2b: /* fstp sti */
6047 case 0x0b: /* fstp1 sti, undocumented op */
6048 case 0x3a: /* fstp8 sti, undocumented op */
6049 case 0x3b: /* fstp9 sti, undocumented op */
6050 gen_helper_fmov_STN_ST0(cpu_env, tcg_const_i32(opreg));
6051 gen_helper_fpop(cpu_env);
6052 break;
6053 case 0x2c: /* fucom st(i) */
6054 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6055 gen_helper_fucom_ST0_FT0(cpu_env);
6056 break;
6057 case 0x2d: /* fucomp st(i) */
6058 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6059 gen_helper_fucom_ST0_FT0(cpu_env);
6060 gen_helper_fpop(cpu_env);
6061 break;
6062 case 0x33: /* de/3 */
6063 switch(rm) {
6064 case 1: /* fcompp */
6065 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(1));
6066 gen_helper_fcom_ST0_FT0(cpu_env);
6067 gen_helper_fpop(cpu_env);
6068 gen_helper_fpop(cpu_env);
6069 break;
6070 default:
6071 goto illegal_op;
6073 break;
6074 case 0x38: /* ffreep sti, undocumented op */
6075 gen_helper_ffree_STN(cpu_env, tcg_const_i32(opreg));
6076 gen_helper_fpop(cpu_env);
6077 break;
6078 case 0x3c: /* df/4 */
6079 switch(rm) {
6080 case 0:
6081 gen_helper_fnstsw(cpu_tmp2_i32, cpu_env);
6082 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
6083 gen_op_mov_reg_T0(OT_WORD, R_EAX);
6084 break;
6085 default:
6086 goto illegal_op;
6088 break;
6089 case 0x3d: /* fucomip */
6090 gen_update_cc_op(s);
6091 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6092 gen_helper_fucomi_ST0_FT0(cpu_env);
6093 gen_helper_fpop(cpu_env);
6094 set_cc_op(s, CC_OP_EFLAGS);
6095 break;
6096 case 0x3e: /* fcomip */
6097 gen_update_cc_op(s);
6098 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6099 gen_helper_fcomi_ST0_FT0(cpu_env);
6100 gen_helper_fpop(cpu_env);
6101 set_cc_op(s, CC_OP_EFLAGS);
6102 break;
6103 case 0x10 ... 0x13: /* fcmovxx */
6104 case 0x18 ... 0x1b:
6105 {
6106 int op1, l1;
6107 static const uint8_t fcmov_cc[8] = {
6108 (JCC_B << 1),
6109 (JCC_Z << 1),
6110 (JCC_BE << 1),
6111 (JCC_P << 1),
6112 };
6113 op1 = fcmov_cc[op & 3] | (((op >> 3) & 1) ^ 1);
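/* table entries are (JCC_xx << 1); the low bit of op1 selects the
   negated condition.  Opcodes 0x10-0x13 (fcmovb/e/be/u) move when
   the condition holds, so the skip branch inverts it; 0x18-0x1b
   are the fcmovn* forms and use the condition directly. */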
6114 l1 = gen_new_label();
6115 gen_jcc1_noeob(s, op1, l1);
6116 gen_helper_fmov_ST0_STN(cpu_env, tcg_const_i32(opreg));
6117 gen_set_label(l1);
6118 }
6119 break;
6120 default:
6121 goto illegal_op;
6124 break;
6125 /************************/
6126 /* string ops */
6128 case 0xa4: /* movsS */
6129 case 0xa5:
6130 if ((b & 1) == 0)
6131 ot = OT_BYTE;
6132 else
6133 ot = dflag + OT_WORD;
6135 if (prefixes & (PREFIX_REPZ | PREFIX_REPNZ)) {
6136 gen_repz_movs(s, ot, pc_start - s->cs_base, s->pc - s->cs_base);
6137 } else {
6138 gen_movs(s, ot);
6140 break;
6142 case 0xaa: /* stosS */
6143 case 0xab:
6144 if ((b & 1) == 0)
6145 ot = OT_BYTE;
6146 else
6147 ot = dflag + OT_WORD;
6149 if (prefixes & (PREFIX_REPZ | PREFIX_REPNZ)) {
6150 gen_repz_stos(s, ot, pc_start - s->cs_base, s->pc - s->cs_base);
6151 } else {
6152 gen_stos(s, ot);
6154 break;
6155 case 0xac: /* lodsS */
6156 case 0xad:
6157 if ((b & 1) == 0)
6158 ot = OT_BYTE;
6159 else
6160 ot = dflag + OT_WORD;
6161 if (prefixes & (PREFIX_REPZ | PREFIX_REPNZ)) {
6162 gen_repz_lods(s, ot, pc_start - s->cs_base, s->pc - s->cs_base);
6163 } else {
6164 gen_lods(s, ot);
6166 break;
6167 case 0xae: /* scasS */
6168 case 0xaf:
6169 if ((b & 1) == 0)
6170 ot = OT_BYTE;
6171 else
6172 ot = dflag + OT_WORD;
6173 if (prefixes & PREFIX_REPNZ) {
6174 gen_repz_scas(s, ot, pc_start - s->cs_base, s->pc - s->cs_base, 1);
6175 } else if (prefixes & PREFIX_REPZ) {
6176 gen_repz_scas(s, ot, pc_start - s->cs_base, s->pc - s->cs_base, 0);
6177 } else {
6178 gen_scas(s, ot);
6180 break;
6182 case 0xa6: /* cmpsS */
6183 case 0xa7:
6184 if ((b & 1) == 0)
6185 ot = OT_BYTE;
6186 else
6187 ot = dflag + OT_WORD;
6188 if (prefixes & PREFIX_REPNZ) {
6189 gen_repz_cmps(s, ot, pc_start - s->cs_base, s->pc - s->cs_base, 1);
6190 } else if (prefixes & PREFIX_REPZ) {
6191 gen_repz_cmps(s, ot, pc_start - s->cs_base, s->pc - s->cs_base, 0);
6192 } else {
6193 gen_cmps(s, ot);
6195 break;
6196 case 0x6c: /* insS */
6197 case 0x6d:
6198 if ((b & 1) == 0)
6199 ot = OT_BYTE;
6200 else
6201 ot = dflag ? OT_LONG : OT_WORD;
6202 gen_op_mov_TN_reg(OT_WORD, 0, R_EDX);
6203 gen_op_andl_T0_ffff();
6204 gen_check_io(s, ot, pc_start - s->cs_base,
6205 SVM_IOIO_TYPE_MASK | svm_is_rep(prefixes) | 4);
6206 if (prefixes & (PREFIX_REPZ | PREFIX_REPNZ)) {
6207 gen_repz_ins(s, ot, pc_start - s->cs_base, s->pc - s->cs_base);
6208 } else {
6209 gen_ins(s, ot);
6210 if (use_icount) {
6211 gen_jmp(s, s->pc - s->cs_base);
6214 break;
6215 case 0x6e: /* outsS */
6216 case 0x6f:
6217 if ((b & 1) == 0)
6218 ot = OT_BYTE;
6219 else
6220 ot = dflag ? OT_LONG : OT_WORD;
6221 gen_op_mov_TN_reg(OT_WORD, 0, R_EDX);
6222 gen_op_andl_T0_ffff();
6223 gen_check_io(s, ot, pc_start - s->cs_base,
6224 svm_is_rep(prefixes) | 4);
6225 if (prefixes & (PREFIX_REPZ | PREFIX_REPNZ)) {
6226 gen_repz_outs(s, ot, pc_start - s->cs_base, s->pc - s->cs_base);
6227 } else {
6228 gen_outs(s, ot);
6229 if (use_icount) {
6230 gen_jmp(s, s->pc - s->cs_base);
6233 break;
6235 /************************/
6236 /* port I/O */
6238 case 0xe4:
6239 case 0xe5:
6240 if ((b & 1) == 0)
6241 ot = OT_BYTE;
6242 else
6243 ot = dflag ? OT_LONG : OT_WORD;
6244 val = cpu_ldub_code(env, s->pc++);
6245 gen_op_movl_T0_im(val);
6246 gen_check_io(s, ot, pc_start - s->cs_base,
6247 SVM_IOIO_TYPE_MASK | svm_is_rep(prefixes));
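/* with icount, bracket the I/O access with gen_io_start/gen_io_end
   and end the TB right after, so the instruction count stays exact */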
6248 if (use_icount)
6249 gen_io_start();
6250 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
6251 gen_helper_in_func(ot, cpu_T[1], cpu_tmp2_i32);
6252 gen_op_mov_reg_T1(ot, R_EAX);
6253 if (use_icount) {
6254 gen_io_end();
6255 gen_jmp(s, s->pc - s->cs_base);
6257 break;
6258 case 0xe6:
6259 case 0xe7:
6260 if ((b & 1) == 0)
6261 ot = OT_BYTE;
6262 else
6263 ot = dflag ? OT_LONG : OT_WORD;
6264 val = cpu_ldub_code(env, s->pc++);
6265 gen_op_movl_T0_im(val);
6266 gen_check_io(s, ot, pc_start - s->cs_base,
6267 svm_is_rep(prefixes));
6268 gen_op_mov_TN_reg(ot, 1, R_EAX);
6270 if (use_icount)
6271 gen_io_start();
6272 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
6273 tcg_gen_trunc_tl_i32(cpu_tmp3_i32, cpu_T[1]);
6274 gen_helper_out_func(ot, cpu_tmp2_i32, cpu_tmp3_i32);
6275 if (use_icount) {
6276 gen_io_end();
6277 gen_jmp(s, s->pc - s->cs_base);
6279 break;
6280 case 0xec:
6281 case 0xed:
6282 if ((b & 1) == 0)
6283 ot = OT_BYTE;
6284 else
6285 ot = dflag ? OT_LONG : OT_WORD;
6286 gen_op_mov_TN_reg(OT_WORD, 0, R_EDX);
6287 gen_op_andl_T0_ffff();
6288 gen_check_io(s, ot, pc_start - s->cs_base,
6289 SVM_IOIO_TYPE_MASK | svm_is_rep(prefixes));
6290 if (use_icount)
6291 gen_io_start();
6292 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
6293 gen_helper_in_func(ot, cpu_T[1], cpu_tmp2_i32);
6294 gen_op_mov_reg_T1(ot, R_EAX);
6295 if (use_icount) {
6296 gen_io_end();
6297 gen_jmp(s, s->pc - s->cs_base);
6299 break;
6300 case 0xee:
6301 case 0xef:
6302 if ((b & 1) == 0)
6303 ot = OT_BYTE;
6304 else
6305 ot = dflag ? OT_LONG : OT_WORD;
6306 gen_op_mov_TN_reg(OT_WORD, 0, R_EDX);
6307 gen_op_andl_T0_ffff();
6308 gen_check_io(s, ot, pc_start - s->cs_base,
6309 svm_is_rep(prefixes));
6310 gen_op_mov_TN_reg(ot, 1, R_EAX);
6312 if (use_icount)
6313 gen_io_start();
6314 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
6315 tcg_gen_trunc_tl_i32(cpu_tmp3_i32, cpu_T[1]);
6316 gen_helper_out_func(ot, cpu_tmp2_i32, cpu_tmp3_i32);
6317 if (use_icount) {
6318 gen_io_end();
6319 gen_jmp(s, s->pc - s->cs_base);
6321 break;
6323 /************************/
6324 /* control */
6325 case 0xc2: /* ret im */
6326 val = cpu_ldsw_code(env, s->pc);
6327 s->pc += 2;
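/* annotation: dflag is 0/1/2 for 16/32/64-bit operands, so the
   (2 << dflag) below is the operand size in bytes */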
6328 gen_pop_T0(s);
6329 if (CODE64(s) && s->dflag)
6330 s->dflag = 2;
6331 gen_stack_update(s, val + (2 << s->dflag));
6332 if (s->dflag == 0)
6333 gen_op_andl_T0_ffff();
6334 gen_op_jmp_T0();
6335 gen_eob(s);
6336 break;
6337 case 0xc3: /* ret */
6338 gen_pop_T0(s);
6339 gen_pop_update(s);
6340 if (s->dflag == 0)
6341 gen_op_andl_T0_ffff();
6342 gen_op_jmp_T0();
6343 gen_eob(s);
6344 break;
6345 case 0xca: /* lret im */
6346 val = cpu_ldsw_code(env, s->pc);
6347 s->pc += 2;
6348 do_lret:
6349 if (s->pe && !s->vm86) {
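/* annotation: in protected mode the far return must go through the
   helper, which performs the segment and privilege checks */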
6350 gen_update_cc_op(s);
6351 gen_jmp_im(pc_start - s->cs_base);
6352 gen_helper_lret_protected(cpu_env, tcg_const_i32(s->dflag),
6353 tcg_const_i32(val));
6354 } else {
6355 gen_stack_A0(s);
6356 /* pop offset */
6357 gen_op_ld_T0_A0(1 + s->dflag + s->mem_index);
6358 if (s->dflag == 0)
6359 gen_op_andl_T0_ffff();
6360 /* NOTE: keeping EIP updated is not a problem in case of
6361 exception */
6362 gen_op_jmp_T0();
6363 /* pop selector */
6364 gen_op_addl_A0_im(2 << s->dflag);
6365 gen_op_ld_T0_A0(1 + s->dflag + s->mem_index);
6366 gen_op_movl_seg_T0_vm(R_CS);
6367 /* add stack offset */
6368 gen_stack_update(s, val + (4 << s->dflag));
6370 gen_eob(s);
6371 break;
6372 case 0xcb: /* lret */
6373 val = 0;
6374 goto do_lret;
6375 case 0xcf: /* iret */
6376 gen_svm_check_intercept(s, pc_start, SVM_EXIT_IRET);
6377 if (!s->pe) {
6378 /* real mode */
6379 gen_helper_iret_real(cpu_env, tcg_const_i32(s->dflag));
6380 set_cc_op(s, CC_OP_EFLAGS);
6381 } else if (s->vm86) {
6382 if (s->iopl != 3) {
6383 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
6384 } else {
6385 gen_helper_iret_real(cpu_env, tcg_const_i32(s->dflag));
6386 set_cc_op(s, CC_OP_EFLAGS);
6388 } else {
6389 gen_update_cc_op(s);
6390 gen_jmp_im(pc_start - s->cs_base);
6391 gen_helper_iret_protected(cpu_env, tcg_const_i32(s->dflag),
6392 tcg_const_i32(s->pc - s->cs_base));
6393 set_cc_op(s, CC_OP_EFLAGS);
6395 gen_eob(s);
6396 break;
6397 case 0xe8: /* call im */
6399 if (dflag)
6400 tval = (int32_t)insn_get(env, s, OT_LONG);
6401 else
6402 tval = (int16_t)insn_get(env, s, OT_WORD);
6403 next_eip = s->pc - s->cs_base;
6404 tval += next_eip;
6405 if (s->dflag == 0)
6406 tval &= 0xffff;
6407 else if(!CODE64(s))
6408 tval &= 0xffffffff;
6409 gen_movtl_T0_im(next_eip);
6410 gen_push_T0(s);
6411 gen_jmp(s, tval);
6413 break;
6414 case 0x9a: /* lcall im */
6416 unsigned int selector, offset;
6418 if (CODE64(s))
6419 goto illegal_op;
6420 ot = dflag ? OT_LONG : OT_WORD;
6421 offset = insn_get(env, s, ot);
6422 selector = insn_get(env, s, OT_WORD);
6424 gen_op_movl_T0_im(selector);
6425 gen_op_movl_T1_imu(offset);
6427 goto do_lcall;
6428 case 0xe9: /* jmp im */
6429 if (dflag)
6430 tval = (int32_t)insn_get(env, s, OT_LONG);
6431 else
6432 tval = (int16_t)insn_get(env, s, OT_WORD);
6433 tval += s->pc - s->cs_base;
6434 if (s->dflag == 0)
6435 tval &= 0xffff;
6436 else if(!CODE64(s))
6437 tval &= 0xffffffff;
6438 gen_jmp(s, tval);
6439 break;
6440 case 0xea: /* ljmp im */
6442 unsigned int selector, offset;
6444 if (CODE64(s))
6445 goto illegal_op;
6446 ot = dflag ? OT_LONG : OT_WORD;
6447 offset = insn_get(env, s, ot);
6448 selector = insn_get(env, s, OT_WORD);
6450 gen_op_movl_T0_im(selector);
6451 gen_op_movl_T1_imu(offset);
6453 goto do_ljmp;
6454 case 0xeb: /* jmp Jb */
6455 tval = (int8_t)insn_get(env, s, OT_BYTE);
6456 tval += s->pc - s->cs_base;
6457 if (s->dflag == 0)
6458 tval &= 0xffff;
6459 gen_jmp(s, tval);
6460 break;
6461 case 0x70 ... 0x7f: /* jcc Jb */
6462 tval = (int8_t)insn_get(env, s, OT_BYTE);
6463 goto do_jcc;
6464 case 0x180 ... 0x18f: /* jcc Jv */
6465 if (dflag) {
6466 tval = (int32_t)insn_get(env, s, OT_LONG);
6467 } else {
6468 tval = (int16_t)insn_get(env, s, OT_WORD);
6470 do_jcc:
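/* annotation: tval is the branch target, next_eip the fall-through
   address passed to gen_jcc() */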
6471 next_eip = s->pc - s->cs_base;
6472 tval += next_eip;
6473 if (s->dflag == 0)
6474 tval &= 0xffff;
6475 gen_jcc(s, b, tval, next_eip);
6476 break;
6478 case 0x190 ... 0x19f: /* setcc Gv */
6479 modrm = cpu_ldub_code(env, s->pc++);
6480 gen_setcc1(s, b, cpu_T[0]);
6481 gen_ldst_modrm(env, s, modrm, OT_BYTE, OR_TMP0, 1);
6482 break;
6483 case 0x140 ... 0x14f: /* cmov Gv, Ev */
6484 ot = dflag + OT_WORD;
6485 modrm = cpu_ldub_code(env, s->pc++);
6486 reg = ((modrm >> 3) & 7) | rex_r;
6487 gen_cmovcc1(env, s, ot, b, modrm, reg);
6488 break;
6490 /************************/
6491 /* flags */
6492 case 0x9c: /* pushf */
6493 gen_svm_check_intercept(s, pc_start, SVM_EXIT_PUSHF);
6494 if (s->vm86 && s->iopl != 3) {
6495 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
6496 } else {
6497 gen_update_cc_op(s);
6498 gen_helper_read_eflags(cpu_T[0], cpu_env);
6499 gen_push_T0(s);
6501 break;
6502 case 0x9d: /* popf */
6503 gen_svm_check_intercept(s, pc_start, SVM_EXIT_POPF);
6504 if (s->vm86 && s->iopl != 3) {
6505 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
6506 } else {
6507 gen_pop_T0(s);
6508 if (s->cpl == 0) {
6509 if (s->dflag) {
6510 gen_helper_write_eflags(cpu_env, cpu_T[0],
6511 tcg_const_i32((TF_MASK | AC_MASK |
6512 ID_MASK | NT_MASK |
6513 IF_MASK |
6514 IOPL_MASK)));
6515 } else {
6516 gen_helper_write_eflags(cpu_env, cpu_T[0],
6517 tcg_const_i32((TF_MASK | AC_MASK |
6518 ID_MASK | NT_MASK |
6519 IF_MASK | IOPL_MASK)
6520 & 0xffff));
6522 } else {
6523 if (s->cpl <= s->iopl) {
6524 if (s->dflag) {
6525 gen_helper_write_eflags(cpu_env, cpu_T[0],
6526 tcg_const_i32((TF_MASK |
6527 AC_MASK |
6528 ID_MASK |
6529 NT_MASK |
6530 IF_MASK)));
6531 } else {
6532 gen_helper_write_eflags(cpu_env, cpu_T[0],
6533 tcg_const_i32((TF_MASK |
6534 AC_MASK |
6535 ID_MASK |
6536 NT_MASK |
6537 IF_MASK)
6538 & 0xffff));
6540 } else {
6541 if (s->dflag) {
6542 gen_helper_write_eflags(cpu_env, cpu_T[0],
6543 tcg_const_i32((TF_MASK | AC_MASK |
6544 ID_MASK | NT_MASK)));
6545 } else {
6546 gen_helper_write_eflags(cpu_env, cpu_T[0],
6547 tcg_const_i32((TF_MASK | AC_MASK |
6548 ID_MASK | NT_MASK)
6549 & 0xffff));
6553 gen_pop_update(s);
6554 set_cc_op(s, CC_OP_EFLAGS);
6555 /* abort translation because TF/AC flag may change */
6556 gen_jmp_im(s->pc - s->cs_base);
6557 gen_eob(s);
6559 break;
6560 case 0x9e: /* sahf */
6561 if (CODE64(s) && !(s->cpuid_ext3_features & CPUID_EXT3_LAHF_LM))
6562 goto illegal_op;
6563 gen_op_mov_TN_reg(OT_BYTE, 0, R_AH);
6564 gen_compute_eflags(s);
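/* annotation: keep only O in cc_src (it has no bit in AH), then
   merge S/Z/A/P/C in from AH */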
6565 tcg_gen_andi_tl(cpu_cc_src, cpu_cc_src, CC_O);
6566 tcg_gen_andi_tl(cpu_T[0], cpu_T[0], CC_S | CC_Z | CC_A | CC_P | CC_C);
6567 tcg_gen_or_tl(cpu_cc_src, cpu_cc_src, cpu_T[0]);
6568 break;
6569 case 0x9f: /* lahf */
6570 if (CODE64(s) && !(s->cpuid_ext3_features & CPUID_EXT3_LAHF_LM))
6571 goto illegal_op;
6572 gen_compute_eflags(s);
6573 /* Note: gen_compute_eflags() only gives the condition codes */
6574 tcg_gen_ori_tl(cpu_T[0], cpu_cc_src, 0x02);
6575 gen_op_mov_reg_T0(OT_BYTE, R_AH);
6576 break;
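/* annotation: for cmc/clc/stc below, gen_compute_eflags() makes the
   flags explicit in cc_src (CC_OP_EFLAGS), so the carry bit can then
   be toggled, cleared or set directly */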
6577 case 0xf5: /* cmc */
6578 gen_compute_eflags(s);
6579 tcg_gen_xori_tl(cpu_cc_src, cpu_cc_src, CC_C);
6580 break;
6581 case 0xf8: /* clc */
6582 gen_compute_eflags(s);
6583 tcg_gen_andi_tl(cpu_cc_src, cpu_cc_src, ~CC_C);
6584 break;
6585 case 0xf9: /* stc */
6586 gen_compute_eflags(s);
6587 tcg_gen_ori_tl(cpu_cc_src, cpu_cc_src, CC_C);
6588 break;
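/* annotation: the direction flag is stored as +1/-1 so the string op
   generators can simply shift it left by ot to get the ESI/EDI
   increment */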
6589 case 0xfc: /* cld */
6590 tcg_gen_movi_i32(cpu_tmp2_i32, 1);
6591 tcg_gen_st_i32(cpu_tmp2_i32, cpu_env, offsetof(CPUX86State, df));
6592 break;
6593 case 0xfd: /* std */
6594 tcg_gen_movi_i32(cpu_tmp2_i32, -1);
6595 tcg_gen_st_i32(cpu_tmp2_i32, cpu_env, offsetof(CPUX86State, df));
6596 break;
6598 /************************/
6599 /* bit operations */
6600 case 0x1ba: /* bt/bts/btr/btc Gv, im */
6601 ot = dflag + OT_WORD;
6602 modrm = cpu_ldub_code(env, s->pc++);
6603 op = (modrm >> 3) & 7;
6604 mod = (modrm >> 6) & 3;
6605 rm = (modrm & 7) | REX_B(s);
6606 if (mod != 3) {
6607 s->rip_offset = 1;
6608 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
6609 gen_op_ld_T0_A0(ot + s->mem_index);
6610 } else {
6611 gen_op_mov_TN_reg(ot, 0, rm);
6613 /* load shift */
6614 val = cpu_ldub_code(env, s->pc++);
6615 gen_op_movl_T1_im(val);
6616 if (op < 4)
6617 goto illegal_op;
6618 op -= 4;
6619 goto bt_op;
6620 case 0x1a3: /* bt Gv, Ev */
6621 op = 0;
6622 goto do_btx;
6623 case 0x1ab: /* bts */
6624 op = 1;
6625 goto do_btx;
6626 case 0x1b3: /* btr */
6627 op = 2;
6628 goto do_btx;
6629 case 0x1bb: /* btc */
6630 op = 3;
6631 do_btx:
6632 ot = dflag + OT_WORD;
6633 modrm = cpu_ldub_code(env, s->pc++);
6634 reg = ((modrm >> 3) & 7) | rex_r;
6635 mod = (modrm >> 6) & 3;
6636 rm = (modrm & 7) | REX_B(s);
6637 gen_op_mov_TN_reg(OT_LONG, 1, reg);
6638 if (mod != 3) {
6639 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
6640 /* specific case: we need to add a displacement */
6641 gen_exts(ot, cpu_T[1]);
6642 tcg_gen_sari_tl(cpu_tmp0, cpu_T[1], 3 + ot);
6643 tcg_gen_shli_tl(cpu_tmp0, cpu_tmp0, ot);
6644 tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
6645 gen_op_ld_T0_A0(ot + s->mem_index);
6646 } else {
6647 gen_op_mov_TN_reg(ot, 0, rm);
6649 bt_op:
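/* annotation: the operand shifted so that the tested bit sits in
   bit 0 ends up in cc_src; CC_OP_SARB + ot then derives CF from
   that bit */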
6650 tcg_gen_andi_tl(cpu_T[1], cpu_T[1], (1 << (3 + ot)) - 1);
6651 switch(op) {
6652 case 0:
6653 tcg_gen_shr_tl(cpu_cc_src, cpu_T[0], cpu_T[1]);
6654 tcg_gen_movi_tl(cpu_cc_dst, 0);
6655 break;
6656 case 1:
6657 tcg_gen_shr_tl(cpu_tmp4, cpu_T[0], cpu_T[1]);
6658 tcg_gen_movi_tl(cpu_tmp0, 1);
6659 tcg_gen_shl_tl(cpu_tmp0, cpu_tmp0, cpu_T[1]);
6660 tcg_gen_or_tl(cpu_T[0], cpu_T[0], cpu_tmp0);
6661 break;
6662 case 2:
6663 tcg_gen_shr_tl(cpu_tmp4, cpu_T[0], cpu_T[1]);
6664 tcg_gen_movi_tl(cpu_tmp0, 1);
6665 tcg_gen_shl_tl(cpu_tmp0, cpu_tmp0, cpu_T[1]);
6666 tcg_gen_not_tl(cpu_tmp0, cpu_tmp0);
6667 tcg_gen_and_tl(cpu_T[0], cpu_T[0], cpu_tmp0);
6668 break;
6669 default:
6670 case 3:
6671 tcg_gen_shr_tl(cpu_tmp4, cpu_T[0], cpu_T[1]);
6672 tcg_gen_movi_tl(cpu_tmp0, 1);
6673 tcg_gen_shl_tl(cpu_tmp0, cpu_tmp0, cpu_T[1]);
6674 tcg_gen_xor_tl(cpu_T[0], cpu_T[0], cpu_tmp0);
6675 break;
6677 set_cc_op(s, CC_OP_SARB + ot);
6678 if (op != 0) {
6679 if (mod != 3)
6680 gen_op_st_T0_A0(ot + s->mem_index);
6681 else
6682 gen_op_mov_reg_T0(ot, rm);
6683 tcg_gen_mov_tl(cpu_cc_src, cpu_tmp4);
6684 tcg_gen_movi_tl(cpu_cc_dst, 0);
6686 break;
6687 case 0x1bc: /* bsf */
6688 case 0x1bd: /* bsr */
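/* annotation: F3 0F BD with the ABM feature bit is LZCNT; plain
   bsf/bsr leave the destination unchanged on zero input and report
   it through ZF (signalled via cc_dst) */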
6690 int label1;
6691 TCGv t0;
6693 ot = dflag + OT_WORD;
6694 modrm = cpu_ldub_code(env, s->pc++);
6695 reg = ((modrm >> 3) & 7) | rex_r;
6694 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
6697 gen_extu(ot, cpu_T[0]);
6698 t0 = tcg_temp_local_new();
6699 tcg_gen_mov_tl(t0, cpu_T[0]);
6700 if ((b & 1) && (prefixes & PREFIX_REPZ) &&
6701 (s->cpuid_ext3_features & CPUID_EXT3_ABM)) {
6702 switch(ot) {
6703 case OT_WORD: gen_helper_lzcnt(cpu_T[0], t0,
6704 tcg_const_i32(16)); break;
6705 case OT_LONG: gen_helper_lzcnt(cpu_T[0], t0,
6706 tcg_const_i32(32)); break;
6707 case OT_QUAD: gen_helper_lzcnt(cpu_T[0], t0,
6708 tcg_const_i32(64)); break;
6710 gen_op_mov_reg_T0(ot, reg);
6711 } else {
6712 label1 = gen_new_label();
6713 tcg_gen_movi_tl(cpu_cc_dst, 0);
6714 tcg_gen_brcondi_tl(TCG_COND_EQ, t0, 0, label1);
6715 if (b & 1) {
6716 gen_helper_bsr(cpu_T[0], t0);
6717 } else {
6718 gen_helper_bsf(cpu_T[0], t0);
6720 gen_op_mov_reg_T0(ot, reg);
6721 tcg_gen_movi_tl(cpu_cc_dst, 1);
6722 gen_set_label(label1);
6723 set_cc_op(s, CC_OP_LOGICB + ot);
6725 tcg_temp_free(t0);
6727 break;
6728 /************************/
6729 /* bcd */
6730 case 0x27: /* daa */
6731 if (CODE64(s))
6732 goto illegal_op;
6733 gen_update_cc_op(s);
6734 gen_helper_daa(cpu_env);
6735 set_cc_op(s, CC_OP_EFLAGS);
6736 break;
6737 case 0x2f: /* das */
6738 if (CODE64(s))
6739 goto illegal_op;
6740 gen_update_cc_op(s);
6741 gen_helper_das(cpu_env);
6742 set_cc_op(s, CC_OP_EFLAGS);
6743 break;
6744 case 0x37: /* aaa */
6745 if (CODE64(s))
6746 goto illegal_op;
6747 gen_update_cc_op(s);
6748 gen_helper_aaa(cpu_env);
6749 set_cc_op(s, CC_OP_EFLAGS);
6750 break;
6751 case 0x3f: /* aas */
6752 if (CODE64(s))
6753 goto illegal_op;
6754 gen_update_cc_op(s);
6755 gen_helper_aas(cpu_env);
6756 set_cc_op(s, CC_OP_EFLAGS);
6757 break;
6758 case 0xd4: /* aam */
6759 if (CODE64(s))
6760 goto illegal_op;
6761 val = cpu_ldub_code(env, s->pc++);
6762 if (val == 0) {
6763 gen_exception(s, EXCP00_DIVZ, pc_start - s->cs_base);
6764 } else {
6765 gen_helper_aam(cpu_env, tcg_const_i32(val));
6766 set_cc_op(s, CC_OP_LOGICB);
6768 break;
6769 case 0xd5: /* aad */
6770 if (CODE64(s))
6771 goto illegal_op;
6772 val = cpu_ldub_code(env, s->pc++);
6773 gen_helper_aad(cpu_env, tcg_const_i32(val));
6774 set_cc_op(s, CC_OP_LOGICB);
6775 break;
6776 /************************/
6777 /* misc */
6778 case 0x90: /* nop */
6779 /* XXX: correct lock test for all insns */
6780 if (prefixes & PREFIX_LOCK) {
6781 goto illegal_op;
6783 /* If REX_B is set, then this is xchg eax, r8d, not a nop. */
6784 if (REX_B(s)) {
6785 goto do_xchg_reg_eax;
6787 if (prefixes & PREFIX_REPZ) {
6788 gen_svm_check_intercept(s, pc_start, SVM_EXIT_PAUSE);
6790 break;
6791 case 0x9b: /* fwait */
6792 if ((s->flags & (HF_MP_MASK | HF_TS_MASK)) ==
6793 (HF_MP_MASK | HF_TS_MASK)) {
6794 gen_exception(s, EXCP07_PREX, pc_start - s->cs_base);
6795 } else {
6796 gen_update_cc_op(s);
6797 gen_jmp_im(pc_start - s->cs_base);
6798 gen_helper_fwait(cpu_env);
6800 break;
6801 case 0xcc: /* int3 */
6802 gen_interrupt(s, EXCP03_INT3, pc_start - s->cs_base, s->pc - s->cs_base);
6803 break;
6804 case 0xcd: /* int N */
6805 val = cpu_ldub_code(env, s->pc++);
6806 if (s->vm86 && s->iopl != 3) {
6807 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
6808 } else {
6809 gen_interrupt(s, val, pc_start - s->cs_base, s->pc - s->cs_base);
6811 break;
6812 case 0xce: /* into */
6813 if (CODE64(s))
6814 goto illegal_op;
6815 gen_update_cc_op(s);
6816 gen_jmp_im(pc_start - s->cs_base);
6817 gen_helper_into(cpu_env, tcg_const_i32(s->pc - pc_start));
6818 break;
6819 #ifdef WANT_ICEBP
6820 case 0xf1: /* icebp (undocumented, exits to external debugger) */
6821 gen_svm_check_intercept(s, pc_start, SVM_EXIT_ICEBP);
6822 #if 1
6823 gen_debug(s, pc_start - s->cs_base);
6824 #else
6825 /* start debug */
6826 tb_flush(env);
6827 qemu_set_log(CPU_LOG_INT | CPU_LOG_TB_IN_ASM);
6828 #endif
6829 break;
6830 #endif
6831 case 0xfa: /* cli */
6832 if (!s->vm86) {
6833 if (s->cpl <= s->iopl) {
6834 gen_helper_cli(cpu_env);
6835 } else {
6836 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
6838 } else {
6839 if (s->iopl == 3) {
6840 gen_helper_cli(cpu_env);
6841 } else {
6842 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
6845 break;
6846 case 0xfb: /* sti */
6847 if (!s->vm86) {
6848 if (s->cpl <= s->iopl) {
6849 gen_sti:
6850 gen_helper_sti(cpu_env);
6851 /* interrupts are enabled only after the first insn following sti */
6852 /* if several consecutive instructions inhibit interrupts, only the
6853    _first_ one does it */
6854 if (!(s->tb->flags & HF_INHIBIT_IRQ_MASK))
6855 gen_helper_set_inhibit_irq(cpu_env);
6856 /* give a chance to handle pending irqs */
6857 gen_jmp_im(s->pc - s->cs_base);
6858 gen_eob(s);
6859 } else {
6860 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
6862 } else {
6863 if (s->iopl == 3) {
6864 goto gen_sti;
6865 } else {
6866 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
6869 break;
6870 case 0x62: /* bound */
6871 if (CODE64(s))
6872 goto illegal_op;
6873 ot = dflag ? OT_LONG : OT_WORD;
6874 modrm = cpu_ldub_code(env, s->pc++);
6875 reg = (modrm >> 3) & 7;
6876 mod = (modrm >> 6) & 3;
6877 if (mod == 3)
6878 goto illegal_op;
6879 gen_op_mov_TN_reg(ot, 0, reg);
6880 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
6881 gen_jmp_im(pc_start - s->cs_base);
6882 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
6883 if (ot == OT_WORD) {
6884 gen_helper_boundw(cpu_env, cpu_A0, cpu_tmp2_i32);
6885 } else {
6886 gen_helper_boundl(cpu_env, cpu_A0, cpu_tmp2_i32);
6888 break;
6889 case 0x1c8 ... 0x1cf: /* bswap reg */
6890 reg = (b & 7) | REX_B(s);
6891 #ifdef TARGET_X86_64
6892 if (dflag == 2) {
6893 gen_op_mov_TN_reg(OT_QUAD, 0, reg);
6894 tcg_gen_bswap64_i64(cpu_T[0], cpu_T[0]);
6895 gen_op_mov_reg_T0(OT_QUAD, reg);
6896 } else
6897 #endif
6899 gen_op_mov_TN_reg(OT_LONG, 0, reg);
6900 tcg_gen_ext32u_tl(cpu_T[0], cpu_T[0]);
6901 tcg_gen_bswap32_tl(cpu_T[0], cpu_T[0]);
6902 gen_op_mov_reg_T0(OT_LONG, reg);
6904 break;
6905 case 0xd6: /* salc */
6906 if (CODE64(s))
6907 goto illegal_op;
6908 gen_compute_eflags_c(s, cpu_T[0]);
6909 tcg_gen_neg_tl(cpu_T[0], cpu_T[0]);
6910 gen_op_mov_reg_T0(OT_BYTE, R_EAX);
6911 break;
6912 case 0xe0: /* loopnz */
6913 case 0xe1: /* loopz */
6914 case 0xe2: /* loop */
6915 case 0xe3: /* jecxz */
6917 int l1, l2, l3;
6919 tval = (int8_t)insn_get(env, s, OT_BYTE);
6920 next_eip = s->pc - s->cs_base;
6921 tval += next_eip;
6922 if (s->dflag == 0)
6923 tval &= 0xffff;
6925 l1 = gen_new_label();
6926 l2 = gen_new_label();
6927 l3 = gen_new_label();
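/* annotation: l1 = branch taken, l3 = branch not taken (falls
   through to next_eip), l2 = common exit */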
6928 b &= 3;
6929 switch(b) {
6930 case 0: /* loopnz */
6931 case 1: /* loopz */
6932 gen_op_add_reg_im(s->aflag, R_ECX, -1);
6933 gen_op_jz_ecx(s->aflag, l3);
6934 gen_jcc1(s, (JCC_Z << 1) | (b ^ 1), l1);
6935 break;
6936 case 2: /* loop */
6937 gen_op_add_reg_im(s->aflag, R_ECX, -1);
6938 gen_op_jnz_ecx(s->aflag, l1);
6939 break;
6940 default:
6941 case 3: /* jcxz */
6942 gen_op_jz_ecx(s->aflag, l1);
6943 break;
6946 gen_set_label(l3);
6947 gen_jmp_im(next_eip);
6948 tcg_gen_br(l2);
6950 gen_set_label(l1);
6951 gen_jmp_im(tval);
6952 gen_set_label(l2);
6953 gen_eob(s);
6955 break;
6956 case 0x130: /* wrmsr */
6957 case 0x132: /* rdmsr */
6958 if (s->cpl != 0) {
6959 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
6960 } else {
6961 gen_update_cc_op(s);
6962 gen_jmp_im(pc_start - s->cs_base);
6963 if (b & 2) {
6964 gen_helper_rdmsr(cpu_env);
6965 } else {
6966 gen_helper_wrmsr(cpu_env);
6969 break;
6970 case 0x131: /* rdtsc */
6971 gen_update_cc_op(s);
6972 gen_jmp_im(pc_start - s->cs_base);
6973 if (use_icount)
6974 gen_io_start();
6975 gen_helper_rdtsc(cpu_env);
6976 if (use_icount) {
6977 gen_io_end();
6978 gen_jmp(s, s->pc - s->cs_base);
6980 break;
6981 case 0x133: /* rdpmc */
6982 gen_update_cc_op(s);
6983 gen_jmp_im(pc_start - s->cs_base);
6984 gen_helper_rdpmc(cpu_env);
6985 break;
6986 case 0x134: /* sysenter */
6987 /* For Intel, SYSENTER is valid in 64-bit mode */
6988 if (CODE64(s) && env->cpuid_vendor1 != CPUID_VENDOR_INTEL_1)
6989 goto illegal_op;
6990 if (!s->pe) {
6991 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
6992 } else {
6993 gen_update_cc_op(s);
6994 gen_jmp_im(pc_start - s->cs_base);
6995 gen_helper_sysenter(cpu_env);
6996 gen_eob(s);
6998 break;
6999 case 0x135: /* sysexit */
7000 /* For Intel, SYSEXIT is valid in 64-bit mode */
7001 if (CODE64(s) && env->cpuid_vendor1 != CPUID_VENDOR_INTEL_1)
7002 goto illegal_op;
7003 if (!s->pe) {
7004 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7005 } else {
7006 gen_update_cc_op(s);
7007 gen_jmp_im(pc_start - s->cs_base);
7008 gen_helper_sysexit(cpu_env, tcg_const_i32(dflag));
7009 gen_eob(s);
7011 break;
7012 #ifdef TARGET_X86_64
7013 case 0x105: /* syscall */
7014 /* XXX: is it usable in real mode? */
7015 gen_update_cc_op(s);
7016 gen_jmp_im(pc_start - s->cs_base);
7017 gen_helper_syscall(cpu_env, tcg_const_i32(s->pc - pc_start));
7018 gen_eob(s);
7019 break;
7020 case 0x107: /* sysret */
7021 if (!s->pe) {
7022 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7023 } else {
7024 gen_update_cc_op(s);
7025 gen_jmp_im(pc_start - s->cs_base);
7026 gen_helper_sysret(cpu_env, tcg_const_i32(s->dflag));
7027 /* condition codes are modified only in long mode */
7028 if (s->lma) {
7029 set_cc_op(s, CC_OP_EFLAGS);
7031 gen_eob(s);
7033 break;
7034 #endif
7035 case 0x1a2: /* cpuid */
7036 gen_update_cc_op(s);
7037 gen_jmp_im(pc_start - s->cs_base);
7038 gen_helper_cpuid(cpu_env);
7039 break;
7040 case 0xf4: /* hlt */
7041 if (s->cpl != 0) {
7042 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7043 } else {
7044 gen_update_cc_op(s);
7045 gen_jmp_im(pc_start - s->cs_base);
7046 gen_helper_hlt(cpu_env, tcg_const_i32(s->pc - pc_start));
7047 s->is_jmp = DISAS_TB_JUMP;
7049 break;
7050 case 0x100:
7051 modrm = cpu_ldub_code(env, s->pc++);
7052 mod = (modrm >> 6) & 3;
7053 op = (modrm >> 3) & 7;
7054 switch(op) {
7055 case 0: /* sldt */
7056 if (!s->pe || s->vm86)
7057 goto illegal_op;
7058 gen_svm_check_intercept(s, pc_start, SVM_EXIT_LDTR_READ);
7059 tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,ldt.selector));
7060 ot = OT_WORD;
7061 if (mod == 3)
7062 ot += s->dflag;
7063 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 1);
7064 break;
7065 case 2: /* lldt */
7066 if (!s->pe || s->vm86)
7067 goto illegal_op;
7068 if (s->cpl != 0) {
7069 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7070 } else {
7071 gen_svm_check_intercept(s, pc_start, SVM_EXIT_LDTR_WRITE);
7072 gen_ldst_modrm(env, s, modrm, OT_WORD, OR_TMP0, 0);
7073 gen_jmp_im(pc_start - s->cs_base);
7074 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
7075 gen_helper_lldt(cpu_env, cpu_tmp2_i32);
7077 break;
7078 case 1: /* str */
7079 if (!s->pe || s->vm86)
7080 goto illegal_op;
7081 gen_svm_check_intercept(s, pc_start, SVM_EXIT_TR_READ);
7082 tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,tr.selector));
7083 ot = OT_WORD;
7084 if (mod == 3)
7085 ot += s->dflag;
7086 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 1);
7087 break;
7088 case 3: /* ltr */
7089 if (!s->pe || s->vm86)
7090 goto illegal_op;
7091 if (s->cpl != 0) {
7092 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7093 } else {
7094 gen_svm_check_intercept(s, pc_start, SVM_EXIT_TR_WRITE);
7095 gen_ldst_modrm(env, s, modrm, OT_WORD, OR_TMP0, 0);
7096 gen_jmp_im(pc_start - s->cs_base);
7097 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
7098 gen_helper_ltr(cpu_env, cpu_tmp2_i32);
7100 break;
7101 case 4: /* verr */
7102 case 5: /* verw */
7103 if (!s->pe || s->vm86)
7104 goto illegal_op;
7105 gen_ldst_modrm(env, s, modrm, OT_WORD, OR_TMP0, 0);
7106 gen_update_cc_op(s);
7107 if (op == 4) {
7108 gen_helper_verr(cpu_env, cpu_T[0]);
7109 } else {
7110 gen_helper_verw(cpu_env, cpu_T[0]);
7112 set_cc_op(s, CC_OP_EFLAGS);
7113 break;
7114 default:
7115 goto illegal_op;
7117 break;
7118 case 0x101:
7119 modrm = cpu_ldub_code(env, s->pc++);
7120 mod = (modrm >> 6) & 3;
7121 op = (modrm >> 3) & 7;
7122 rm = modrm & 7;
7123 switch(op) {
7124 case 0: /* sgdt */
7125 if (mod == 3)
7126 goto illegal_op;
7127 gen_svm_check_intercept(s, pc_start, SVM_EXIT_GDTR_READ);
7128 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7129 tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State, gdt.limit));
7130 gen_op_st_T0_A0(OT_WORD + s->mem_index);
7131 gen_add_A0_im(s, 2);
7132 tcg_gen_ld_tl(cpu_T[0], cpu_env, offsetof(CPUX86State, gdt.base));
7133 if (!s->dflag)
7134 gen_op_andl_T0_im(0xffffff);
7135 gen_op_st_T0_A0(CODE64(s) + OT_LONG + s->mem_index);
7136 break;
7137 case 1:
7138 if (mod == 3) {
7139 switch (rm) {
7140 case 0: /* monitor */
7141 if (!(s->cpuid_ext_features & CPUID_EXT_MONITOR) ||
7142 s->cpl != 0)
7143 goto illegal_op;
7144 gen_update_cc_op(s);
7145 gen_jmp_im(pc_start - s->cs_base);
7146 #ifdef TARGET_X86_64
7147 if (s->aflag == 2) {
7148 gen_op_movq_A0_reg(R_EAX);
7149 } else
7150 #endif
7152 gen_op_movl_A0_reg(R_EAX);
7153 if (s->aflag == 0)
7154 gen_op_andl_A0_ffff();
7156 gen_add_A0_ds_seg(s);
7157 gen_helper_monitor(cpu_env, cpu_A0);
7158 break;
7159 case 1: /* mwait */
7160 if (!(s->cpuid_ext_features & CPUID_EXT_MONITOR) ||
7161 s->cpl != 0)
7162 goto illegal_op;
7163 gen_update_cc_op(s);
7164 gen_jmp_im(pc_start - s->cs_base);
7165 gen_helper_mwait(cpu_env, tcg_const_i32(s->pc - pc_start));
7166 gen_eob(s);
7167 break;
7168 case 2: /* clac */
7169 if (!(s->cpuid_7_0_ebx_features & CPUID_7_0_EBX_SMAP) ||
7170 s->cpl != 0) {
7171 goto illegal_op;
7173 gen_helper_clac(cpu_env);
7174 gen_jmp_im(s->pc - s->cs_base);
7175 gen_eob(s);
7176 break;
7177 case 3: /* stac */
7178 if (!(s->cpuid_7_0_ebx_features & CPUID_7_0_EBX_SMAP) ||
7179 s->cpl != 0) {
7180 goto illegal_op;
7182 gen_helper_stac(cpu_env);
7183 gen_jmp_im(s->pc - s->cs_base);
7184 gen_eob(s);
7185 break;
7186 default:
7187 goto illegal_op;
7189 } else { /* sidt */
7190 gen_svm_check_intercept(s, pc_start, SVM_EXIT_IDTR_READ);
7191 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7192 tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State, idt.limit));
7193 gen_op_st_T0_A0(OT_WORD + s->mem_index);
7194 gen_add_A0_im(s, 2);
7195 tcg_gen_ld_tl(cpu_T[0], cpu_env, offsetof(CPUX86State, idt.base));
7196 if (!s->dflag)
7197 gen_op_andl_T0_im(0xffffff);
7198 gen_op_st_T0_A0(CODE64(s) + OT_LONG + s->mem_index);
7200 break;
7201 case 2: /* lgdt */
7202 case 3: /* lidt */
7203 if (mod == 3) {
7204 gen_update_cc_op(s);
7205 gen_jmp_im(pc_start - s->cs_base);
7206 switch(rm) {
7207 case 0: /* VMRUN */
7208 if (!(s->flags & HF_SVME_MASK) || !s->pe)
7209 goto illegal_op;
7210 if (s->cpl != 0) {
7211 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7212 break;
7213 } else {
7214 gen_helper_vmrun(cpu_env, tcg_const_i32(s->aflag),
7215 tcg_const_i32(s->pc - pc_start));
7216 tcg_gen_exit_tb(0);
7217 s->is_jmp = DISAS_TB_JUMP;
7219 break;
7220 case 1: /* VMMCALL */
7221 if (!(s->flags & HF_SVME_MASK))
7222 goto illegal_op;
7223 gen_helper_vmmcall(cpu_env);
7224 break;
7225 case 2: /* VMLOAD */
7226 if (!(s->flags & HF_SVME_MASK) || !s->pe)
7227 goto illegal_op;
7228 if (s->cpl != 0) {
7229 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7230 break;
7231 } else {
7232 gen_helper_vmload(cpu_env, tcg_const_i32(s->aflag));
7234 break;
7235 case 3: /* VMSAVE */
7236 if (!(s->flags & HF_SVME_MASK) || !s->pe)
7237 goto illegal_op;
7238 if (s->cpl != 0) {
7239 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7240 break;
7241 } else {
7242 gen_helper_vmsave(cpu_env, tcg_const_i32(s->aflag));
7244 break;
7245 case 4: /* STGI */
7246 if ((!(s->flags & HF_SVME_MASK) &&
7247 !(s->cpuid_ext3_features & CPUID_EXT3_SKINIT)) ||
7248 !s->pe)
7249 goto illegal_op;
7250 if (s->cpl != 0) {
7251 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7252 break;
7253 } else {
7254 gen_helper_stgi(cpu_env);
7256 break;
7257 case 5: /* CLGI */
7258 if (!(s->flags & HF_SVME_MASK) || !s->pe)
7259 goto illegal_op;
7260 if (s->cpl != 0) {
7261 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7262 break;
7263 } else {
7264 gen_helper_clgi(cpu_env);
7266 break;
7267 case 6: /* SKINIT */
7268 if ((!(s->flags & HF_SVME_MASK) &&
7269 !(s->cpuid_ext3_features & CPUID_EXT3_SKINIT)) ||
7270 !s->pe)
7271 goto illegal_op;
7272 gen_helper_skinit(cpu_env);
7273 break;
7274 case 7: /* INVLPGA */
7275 if (!(s->flags & HF_SVME_MASK) || !s->pe)
7276 goto illegal_op;
7277 if (s->cpl != 0) {
7278 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7279 break;
7280 } else {
7281 gen_helper_invlpga(cpu_env, tcg_const_i32(s->aflag));
7283 break;
7284 default:
7285 goto illegal_op;
7287 } else if (s->cpl != 0) {
7288 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7289 } else {
7290 gen_svm_check_intercept(s, pc_start,
7291 op==2 ? SVM_EXIT_GDTR_WRITE : SVM_EXIT_IDTR_WRITE);
7292 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7293 gen_op_ld_T1_A0(OT_WORD + s->mem_index);
7294 gen_add_A0_im(s, 2);
7295 gen_op_ld_T0_A0(CODE64(s) + OT_LONG + s->mem_index);
7296 if (!s->dflag)
7297 gen_op_andl_T0_im(0xffffff);
7298 if (op == 2) {
7299 tcg_gen_st_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,gdt.base));
7300 tcg_gen_st32_tl(cpu_T[1], cpu_env, offsetof(CPUX86State,gdt.limit));
7301 } else {
7302 tcg_gen_st_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,idt.base));
7303 tcg_gen_st32_tl(cpu_T[1], cpu_env, offsetof(CPUX86State,idt.limit));
7306 break;
7307 case 4: /* smsw */
7308 gen_svm_check_intercept(s, pc_start, SVM_EXIT_READ_CR0);
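/* annotation: load only the low 32 bits of CR0; on a big-endian
   host the low half of the 64-bit field lives at offset +4 */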
7309 #if defined TARGET_X86_64 && defined HOST_WORDS_BIGENDIAN
7310 tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,cr[0]) + 4);
7311 #else
7312 tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,cr[0]));
7313 #endif
7314 gen_ldst_modrm(env, s, modrm, OT_WORD, OR_TMP0, 1);
7315 break;
7316 case 6: /* lmsw */
7317 if (s->cpl != 0) {
7318 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7319 } else {
7320 gen_svm_check_intercept(s, pc_start, SVM_EXIT_WRITE_CR0);
7321 gen_ldst_modrm(env, s, modrm, OT_WORD, OR_TMP0, 0);
7322 gen_helper_lmsw(cpu_env, cpu_T[0]);
7323 gen_jmp_im(s->pc - s->cs_base);
7324 gen_eob(s);
7326 break;
7327 case 7:
7328 if (mod != 3) { /* invlpg */
7329 if (s->cpl != 0) {
7330 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7331 } else {
7332 gen_update_cc_op(s);
7333 gen_jmp_im(pc_start - s->cs_base);
7334 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7335 gen_helper_invlpg(cpu_env, cpu_A0);
7336 gen_jmp_im(s->pc - s->cs_base);
7337 gen_eob(s);
7339 } else {
7340 switch (rm) {
7341 case 0: /* swapgs */
7342 #ifdef TARGET_X86_64
7343 if (CODE64(s)) {
7344 if (s->cpl != 0) {
7345 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7346 } else {
7347 tcg_gen_ld_tl(cpu_T[0], cpu_env,
7348 offsetof(CPUX86State,segs[R_GS].base));
7349 tcg_gen_ld_tl(cpu_T[1], cpu_env,
7350 offsetof(CPUX86State,kernelgsbase));
7351 tcg_gen_st_tl(cpu_T[1], cpu_env,
7352 offsetof(CPUX86State,segs[R_GS].base));
7353 tcg_gen_st_tl(cpu_T[0], cpu_env,
7354 offsetof(CPUX86State,kernelgsbase));
7356 } else
7357 #endif
7359 goto illegal_op;
7361 break;
7362 case 1: /* rdtscp */
7363 if (!(s->cpuid_ext2_features & CPUID_EXT2_RDTSCP))
7364 goto illegal_op;
7365 gen_update_cc_op(s);
7366 gen_jmp_im(pc_start - s->cs_base);
7367 if (use_icount)
7368 gen_io_start();
7369 gen_helper_rdtscp(cpu_env);
7370 if (use_icount) {
7371 gen_io_end();
7372 gen_jmp(s, s->pc - s->cs_base);
7374 break;
7375 default:
7376 goto illegal_op;
7379 break;
7380 default:
7381 goto illegal_op;
7383 break;
7384 case 0x108: /* invd */
7385 case 0x109: /* wbinvd */
7386 if (s->cpl != 0) {
7387 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7388 } else {
7389 gen_svm_check_intercept(s, pc_start, (b & 2) ? SVM_EXIT_INVD : SVM_EXIT_WBINVD);
7390 /* nothing to do */
7392 break;
7393 case 0x63: /* arpl or movslS (x86_64) */
7394 #ifdef TARGET_X86_64
7395 if (CODE64(s)) {
7396 int d_ot;
7397 /* d_ot is the size of the destination */
7398 d_ot = dflag + OT_WORD;
7400 modrm = cpu_ldub_code(env, s->pc++);
7401 reg = ((modrm >> 3) & 7) | rex_r;
7402 mod = (modrm >> 6) & 3;
7403 rm = (modrm & 7) | REX_B(s);
7405 if (mod == 3) {
7406 gen_op_mov_TN_reg(OT_LONG, 0, rm);
7407 /* sign extend */
7408 if (d_ot == OT_QUAD)
7409 tcg_gen_ext32s_tl(cpu_T[0], cpu_T[0]);
7410 gen_op_mov_reg_T0(d_ot, reg);
7411 } else {
7412 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7413 if (d_ot == OT_QUAD) {
7414 gen_op_lds_T0_A0(OT_LONG + s->mem_index);
7415 } else {
7416 gen_op_ld_T0_A0(OT_LONG + s->mem_index);
7418 gen_op_mov_reg_T0(d_ot, reg);
7420 } else
7421 #endif
7423 int label1;
7424 TCGv t0, t1, t2, a0;
7426 if (!s->pe || s->vm86)
7427 goto illegal_op;
7428 t0 = tcg_temp_local_new();
7429 t1 = tcg_temp_local_new();
7430 t2 = tcg_temp_local_new();
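/* annotation: arpl — if the destination's RPL (low 2 bits) is below
   the source's, raise it to the source's RPL and set ZF; t2 carries
   the CC_Z bit that is merged into cc_src below */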
7431 ot = OT_WORD;
7432 modrm = cpu_ldub_code(env, s->pc++);
7433 reg = (modrm >> 3) & 7;
7434 mod = (modrm >> 6) & 3;
7435 rm = modrm & 7;
7436 if (mod != 3) {
7437 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7438 gen_op_ld_v(ot + s->mem_index, t0, cpu_A0);
7439 a0 = tcg_temp_local_new();
7440 tcg_gen_mov_tl(a0, cpu_A0);
7441 } else {
7442 gen_op_mov_v_reg(ot, t0, rm);
7443 TCGV_UNUSED(a0);
7445 gen_op_mov_v_reg(ot, t1, reg);
7446 tcg_gen_andi_tl(cpu_tmp0, t0, 3);
7447 tcg_gen_andi_tl(t1, t1, 3);
7448 tcg_gen_movi_tl(t2, 0);
7449 label1 = gen_new_label();
7450 tcg_gen_brcond_tl(TCG_COND_GE, cpu_tmp0, t1, label1);
7451 tcg_gen_andi_tl(t0, t0, ~3);
7452 tcg_gen_or_tl(t0, t0, t1);
7453 tcg_gen_movi_tl(t2, CC_Z);
7454 gen_set_label(label1);
7455 if (mod != 3) {
7456 gen_op_st_v(ot + s->mem_index, t0, a0);
7457 tcg_temp_free(a0);
7458 } else {
7459 gen_op_mov_reg_v(ot, rm, t0);
7461 gen_compute_eflags(s);
7462 tcg_gen_andi_tl(cpu_cc_src, cpu_cc_src, ~CC_Z);
7463 tcg_gen_or_tl(cpu_cc_src, cpu_cc_src, t2);
7464 tcg_temp_free(t0);
7465 tcg_temp_free(t1);
7466 tcg_temp_free(t2);
7468 break;
7469 case 0x102: /* lar */
7470 case 0x103: /* lsl */
7472 int label1;
7473 TCGv t0;
7474 if (!s->pe || s->vm86)
7475 goto illegal_op;
7476 ot = dflag ? OT_LONG : OT_WORD;
7477 modrm = cpu_ldub_code(env, s->pc++);
7478 reg = ((modrm >> 3) & 7) | rex_r;
7479 gen_ldst_modrm(env, s, modrm, OT_WORD, OR_TMP0, 0);
7480 t0 = tcg_temp_local_new();
7481 gen_update_cc_op(s);
7482 if (b == 0x102) {
7483 gen_helper_lar(t0, cpu_env, cpu_T[0]);
7484 } else {
7485 gen_helper_lsl(t0, cpu_env, cpu_T[0]);
7487 tcg_gen_andi_tl(cpu_tmp0, cpu_cc_src, CC_Z);
7488 label1 = gen_new_label();
7489 tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_tmp0, 0, label1);
7490 gen_op_mov_reg_v(ot, reg, t0);
7491 gen_set_label(label1);
7492 set_cc_op(s, CC_OP_EFLAGS);
7493 tcg_temp_free(t0);
7495 break;
7496 case 0x118:
7497 modrm = cpu_ldub_code(env, s->pc++);
7498 mod = (modrm >> 6) & 3;
7499 op = (modrm >> 3) & 7;
7500 switch(op) {
7501 case 0: /* prefetchnta */
7502 case 1: /* prefetcht0 */
7503 case 2: /* prefetcht1 */
7504 case 3: /* prefetcht2 */
7505 if (mod == 3)
7506 goto illegal_op;
7507 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7508 /* nothing more to do */
7509 break;
7510 default: /* nop (multi byte) */
7511 gen_nop_modrm(env, s, modrm);
7512 break;
7514 break;
7515 case 0x119 ... 0x11f: /* nop (multi byte) */
7516 modrm = cpu_ldub_code(env, s->pc++);
7517 gen_nop_modrm(env, s, modrm);
7518 break;
7519 case 0x120: /* mov reg, crN */
7520 case 0x122: /* mov crN, reg */
7521 if (s->cpl != 0) {
7522 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7523 } else {
7524 modrm = cpu_ldub_code(env, s->pc++);
7525 /* Ignore the mod bits (assume (modrm&0xc0)==0xc0).
7526 * AMD documentation (24594.pdf) and testing of
7527 * intel 386 and 486 processors all show that the mod bits
7528 * are assumed to be 1's, regardless of actual values.
7529 */
7530 rm = (modrm & 7) | REX_B(s);
7531 reg = ((modrm >> 3) & 7) | rex_r;
7532 if (CODE64(s))
7533 ot = OT_QUAD;
7534 else
7535 ot = OT_LONG;
7536 if ((prefixes & PREFIX_LOCK) && (reg == 0) &&
7537 (s->cpuid_ext3_features & CPUID_EXT3_CR8LEG)) {
7538 reg = 8;
7540 switch(reg) {
7541 case 0:
7542 case 2:
7543 case 3:
7544 case 4:
7545 case 8:
7546 gen_update_cc_op(s);
7547 gen_jmp_im(pc_start - s->cs_base);
7548 if (b & 2) {
7549 gen_op_mov_TN_reg(ot, 0, rm);
7550 gen_helper_write_crN(cpu_env, tcg_const_i32(reg),
7551 cpu_T[0]);
7552 gen_jmp_im(s->pc - s->cs_base);
7553 gen_eob(s);
7554 } else {
7555 gen_helper_read_crN(cpu_T[0], cpu_env, tcg_const_i32(reg));
7556 gen_op_mov_reg_T0(ot, rm);
7558 break;
7559 default:
7560 goto illegal_op;
7563 break;
7564 case 0x121: /* mov reg, drN */
7565 case 0x123: /* mov drN, reg */
7566 if (s->cpl != 0) {
7567 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7568 } else {
7569 modrm = cpu_ldub_code(env, s->pc++);
7570 /* Ignore the mod bits (assume (modrm&0xc0)==0xc0).
7571 * AMD documentation (24594.pdf) and testing of
7572 * intel 386 and 486 processors all show that the mod bits
7573 * are assumed to be 1's, regardless of actual values.
7574 */
7575 rm = (modrm & 7) | REX_B(s);
7576 reg = ((modrm >> 3) & 7) | rex_r;
7577 if (CODE64(s))
7578 ot = OT_QUAD;
7579 else
7580 ot = OT_LONG;
7581 /* XXX: do it dynamically with CR4.DE bit */
7582 if (reg == 4 || reg == 5 || reg >= 8)
7583 goto illegal_op;
7584 if (b & 2) {
7585 gen_svm_check_intercept(s, pc_start, SVM_EXIT_WRITE_DR0 + reg);
7586 gen_op_mov_TN_reg(ot, 0, rm);
7587 gen_helper_movl_drN_T0(cpu_env, tcg_const_i32(reg), cpu_T[0]);
7588 gen_jmp_im(s->pc - s->cs_base);
7589 gen_eob(s);
7590 } else {
7591 gen_svm_check_intercept(s, pc_start, SVM_EXIT_READ_DR0 + reg);
7592 tcg_gen_ld_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,dr[reg]));
7593 gen_op_mov_reg_T0(ot, rm);
7596 break;
7597 case 0x106: /* clts */
7598 if (s->cpl != 0) {
7599 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7600 } else {
7601 gen_svm_check_intercept(s, pc_start, SVM_EXIT_WRITE_CR0);
7602 gen_helper_clts(cpu_env);
7603 /* abort block because static cpu state changed */
7604 gen_jmp_im(s->pc - s->cs_base);
7605 gen_eob(s);
7607 break;
7608 /* MMX/3DNow!/SSE/SSE2/SSE3/SSSE3/SSE4 support */
7609 case 0x1c3: /* MOVNTI reg, mem */
7610 if (!(s->cpuid_features & CPUID_SSE2))
7611 goto illegal_op;
7612 ot = s->dflag == 2 ? OT_QUAD : OT_LONG;
7613 modrm = cpu_ldub_code(env, s->pc++);
7614 mod = (modrm >> 6) & 3;
7615 if (mod == 3)
7616 goto illegal_op;
7617 reg = ((modrm >> 3) & 7) | rex_r;
7618 /* generate a generic store */
7619 gen_ldst_modrm(env, s, modrm, ot, reg, 1);
7620 break;
7621 case 0x1ae:
7622 modrm = cpu_ldub_code(env, s->pc++);
7623 mod = (modrm >> 6) & 3;
7624 op = (modrm >> 3) & 7;
7625 switch(op) {
7626 case 0: /* fxsave */
7627 if (mod == 3 || !(s->cpuid_features & CPUID_FXSR) ||
7628 (s->prefix & PREFIX_LOCK))
7629 goto illegal_op;
7630 if ((s->flags & HF_EM_MASK) || (s->flags & HF_TS_MASK)) {
7631 gen_exception(s, EXCP07_PREX, pc_start - s->cs_base);
7632 break;
7634 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7635 gen_update_cc_op(s);
7636 gen_jmp_im(pc_start - s->cs_base);
7637 gen_helper_fxsave(cpu_env, cpu_A0, tcg_const_i32((s->dflag == 2)));
7638 break;
7639 case 1: /* fxrstor */
7640 if (mod == 3 || !(s->cpuid_features & CPUID_FXSR) ||
7641 (s->prefix & PREFIX_LOCK))
7642 goto illegal_op;
7643 if ((s->flags & HF_EM_MASK) || (s->flags & HF_TS_MASK)) {
7644 gen_exception(s, EXCP07_PREX, pc_start - s->cs_base);
7645 break;
7647 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7648 gen_update_cc_op(s);
7649 gen_jmp_im(pc_start - s->cs_base);
7650 gen_helper_fxrstor(cpu_env, cpu_A0,
7651 tcg_const_i32((s->dflag == 2)));
7652 break;
7653 case 2: /* ldmxcsr */
7654 case 3: /* stmxcsr */
7655 if (s->flags & HF_TS_MASK) {
7656 gen_exception(s, EXCP07_PREX, pc_start - s->cs_base);
7657 break;
7659 if ((s->flags & HF_EM_MASK) || !(s->flags & HF_OSFXSR_MASK) ||
7660 mod == 3)
7661 goto illegal_op;
7662 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7663 if (op == 2) {
7664 gen_op_ld_T0_A0(OT_LONG + s->mem_index);
7665 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
7666 gen_helper_ldmxcsr(cpu_env, cpu_tmp2_i32);
7667 } else {
7668 tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State, mxcsr));
7669 gen_op_st_T0_A0(OT_LONG + s->mem_index);
7671 break;
7672 case 5: /* lfence */
7673 case 6: /* mfence */
7674 if ((modrm & 0xc7) != 0xc0 || !(s->cpuid_features & CPUID_SSE2))
7675 goto illegal_op;
7676 break;
7677 case 7: /* sfence / clflush */
7678 if ((modrm & 0xc7) == 0xc0) {
7679 /* sfence */
7680 /* XXX: also check for cpuid_ext2_features & CPUID_EXT2_EMMX */
7681 if (!(s->cpuid_features & CPUID_SSE))
7682 goto illegal_op;
7683 } else {
7684 /* clflush */
7685 if (!(s->cpuid_features & CPUID_CLFLUSH))
7686 goto illegal_op;
7687 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7689 break;
7690 default:
7691 goto illegal_op;
7693 break;
7694 case 0x10d: /* 3DNow! prefetch(w) */
7695 modrm = cpu_ldub_code(env, s->pc++);
7696 mod = (modrm >> 6) & 3;
7697 if (mod == 3)
7698 goto illegal_op;
7699 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7700 /* ignore for now */
7701 break;
7702 case 0x1aa: /* rsm */
7703 gen_svm_check_intercept(s, pc_start, SVM_EXIT_RSM);
7704 if (!(s->flags & HF_SMM_MASK))
7705 goto illegal_op;
7706 gen_update_cc_op(s);
7707 gen_jmp_im(s->pc - s->cs_base);
7708 gen_helper_rsm(cpu_env);
7709 gen_eob(s);
7710 break;
7711 case 0x1b8: /* SSE4.2 popcnt */
7712 if ((prefixes & (PREFIX_REPZ | PREFIX_LOCK | PREFIX_REPNZ)) !=
7713 PREFIX_REPZ)
7714 goto illegal_op;
7715 if (!(s->cpuid_ext_features & CPUID_EXT_POPCNT))
7716 goto illegal_op;
7718 modrm = cpu_ldub_code(env, s->pc++);
7719 reg = ((modrm >> 3) & 7) | rex_r;
7721 if (s->prefix & PREFIX_DATA)
7722 ot = OT_WORD;
7723 else if (s->dflag != 2)
7724 ot = OT_LONG;
7725 else
7726 ot = OT_QUAD;
7728 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
7729 gen_helper_popcnt(cpu_T[0], cpu_env, cpu_T[0], tcg_const_i32(ot));
7730 gen_op_mov_reg_T0(ot, reg);
7732 set_cc_op(s, CC_OP_EFLAGS);
7733 break;
7734 case 0x10e ... 0x10f:
7735 /* 3DNow! instructions, ignore prefixes */
7736 s->prefix &= ~(PREFIX_REPZ | PREFIX_REPNZ | PREFIX_DATA);
7737 case 0x110 ... 0x117:
7738 case 0x128 ... 0x12f:
7739 case 0x138 ... 0x13a:
7740 case 0x150 ... 0x179:
7741 case 0x17c ... 0x17f:
7742 case 0x1c2:
7743 case 0x1c4 ... 0x1c6:
7744 case 0x1d0 ... 0x1fe:
7745 gen_sse(env, s, b, pc_start, rex_r);
7746 break;
7747 default:
7748 goto illegal_op;
7750 /* lock generation */
7751 if (s->prefix & PREFIX_LOCK)
7752 gen_helper_unlock();
7753 return s->pc;
7754 illegal_op:
7755 if (s->prefix & PREFIX_LOCK)
7756 gen_helper_unlock();
7757 /* XXX: ensure that no lock was generated */
7758 gen_exception(s, EXCP06_ILLOP, pc_start - s->cs_base);
7759 return s->pc;
7760 }
7762 void optimize_flags_init(void)
7763 {
7764 cpu_env = tcg_global_reg_new_ptr(TCG_AREG0, "env");
7765 cpu_cc_op = tcg_global_mem_new_i32(TCG_AREG0,
7766 offsetof(CPUX86State, cc_op), "cc_op");
7767 cpu_cc_dst = tcg_global_mem_new(TCG_AREG0, offsetof(CPUX86State, cc_dst),
7768 "cc_dst");
7769 cpu_cc_src = tcg_global_mem_new(TCG_AREG0, offsetof(CPUX86State, cc_src),
7770 "cc_src");
7771 cpu_cc_src2 = tcg_global_mem_new(TCG_AREG0, offsetof(CPUX86State, cc_src2),
7772 "cc_src2");
7774 #ifdef TARGET_X86_64
7775 cpu_regs[R_EAX] = tcg_global_mem_new_i64(TCG_AREG0,
7776 offsetof(CPUX86State, regs[R_EAX]), "rax");
7777 cpu_regs[R_ECX] = tcg_global_mem_new_i64(TCG_AREG0,
7778 offsetof(CPUX86State, regs[R_ECX]), "rcx");
7779 cpu_regs[R_EDX] = tcg_global_mem_new_i64(TCG_AREG0,
7780 offsetof(CPUX86State, regs[R_EDX]), "rdx");
7781 cpu_regs[R_EBX] = tcg_global_mem_new_i64(TCG_AREG0,
7782 offsetof(CPUX86State, regs[R_EBX]), "rbx");
7783 cpu_regs[R_ESP] = tcg_global_mem_new_i64(TCG_AREG0,
7784 offsetof(CPUX86State, regs[R_ESP]), "rsp");
7785 cpu_regs[R_EBP] = tcg_global_mem_new_i64(TCG_AREG0,
7786 offsetof(CPUX86State, regs[R_EBP]), "rbp");
7787 cpu_regs[R_ESI] = tcg_global_mem_new_i64(TCG_AREG0,
7788 offsetof(CPUX86State, regs[R_ESI]), "rsi");
7789 cpu_regs[R_EDI] = tcg_global_mem_new_i64(TCG_AREG0,
7790 offsetof(CPUX86State, regs[R_EDI]), "rdi");
7791 cpu_regs[8] = tcg_global_mem_new_i64(TCG_AREG0,
7792 offsetof(CPUX86State, regs[8]), "r8");
7793 cpu_regs[9] = tcg_global_mem_new_i64(TCG_AREG0,
7794 offsetof(CPUX86State, regs[9]), "r9");
7795 cpu_regs[10] = tcg_global_mem_new_i64(TCG_AREG0,
7796 offsetof(CPUX86State, regs[10]), "r10");
7797 cpu_regs[11] = tcg_global_mem_new_i64(TCG_AREG0,
7798 offsetof(CPUX86State, regs[11]), "r11");
7799 cpu_regs[12] = tcg_global_mem_new_i64(TCG_AREG0,
7800 offsetof(CPUX86State, regs[12]), "r12");
7801 cpu_regs[13] = tcg_global_mem_new_i64(TCG_AREG0,
7802 offsetof(CPUX86State, regs[13]), "r13");
7803 cpu_regs[14] = tcg_global_mem_new_i64(TCG_AREG0,
7804 offsetof(CPUX86State, regs[14]), "r14");
7805 cpu_regs[15] = tcg_global_mem_new_i64(TCG_AREG0,
7806 offsetof(CPUX86State, regs[15]), "r15");
7807 #else
7808 cpu_regs[R_EAX] = tcg_global_mem_new_i32(TCG_AREG0,
7809 offsetof(CPUX86State, regs[R_EAX]), "eax");
7810 cpu_regs[R_ECX] = tcg_global_mem_new_i32(TCG_AREG0,
7811 offsetof(CPUX86State, regs[R_ECX]), "ecx");
7812 cpu_regs[R_EDX] = tcg_global_mem_new_i32(TCG_AREG0,
7813 offsetof(CPUX86State, regs[R_EDX]), "edx");
7814 cpu_regs[R_EBX] = tcg_global_mem_new_i32(TCG_AREG0,
7815 offsetof(CPUX86State, regs[R_EBX]), "ebx");
7816 cpu_regs[R_ESP] = tcg_global_mem_new_i32(TCG_AREG0,
7817 offsetof(CPUX86State, regs[R_ESP]), "esp");
7818 cpu_regs[R_EBP] = tcg_global_mem_new_i32(TCG_AREG0,
7819 offsetof(CPUX86State, regs[R_EBP]), "ebp");
7820 cpu_regs[R_ESI] = tcg_global_mem_new_i32(TCG_AREG0,
7821 offsetof(CPUX86State, regs[R_ESI]), "esi");
7822 cpu_regs[R_EDI] = tcg_global_mem_new_i32(TCG_AREG0,
7823 offsetof(CPUX86State, regs[R_EDI]), "edi");
7824 #endif
7826 /* register helpers */
7827 #define GEN_HELPER 2
7828 #include "helper.h"
7831 /* generate intermediate code in gen_opc_buf and gen_opparam_buf for
7832 basic block 'tb'. If search_pc is TRUE, also generate PC
7833 information for each intermediate instruction. */
7834 static inline void gen_intermediate_code_internal(CPUX86State *env,
7835 TranslationBlock *tb,
7836 int search_pc)
7837 {
7838 DisasContext dc1, *dc = &dc1;
7839 target_ulong pc_ptr;
7840 uint16_t *gen_opc_end;
7841 CPUBreakpoint *bp;
7842 int j, lj;
7843 uint64_t flags;
7844 target_ulong pc_start;
7845 target_ulong cs_base;
7846 int num_insns;
7847 int max_insns;
7849 /* generate intermediate code */
7850 pc_start = tb->pc;
7851 cs_base = tb->cs_base;
7852 flags = tb->flags;
7854 dc->pe = (flags >> HF_PE_SHIFT) & 1;
7855 dc->code32 = (flags >> HF_CS32_SHIFT) & 1;
7856 dc->ss32 = (flags >> HF_SS32_SHIFT) & 1;
7857 dc->addseg = (flags >> HF_ADDSEG_SHIFT) & 1;
7858 dc->f_st = 0;
7859 dc->vm86 = (flags >> VM_SHIFT) & 1;
7860 dc->cpl = (flags >> HF_CPL_SHIFT) & 3;
7861 dc->iopl = (flags >> IOPL_SHIFT) & 3;
7862 dc->tf = (flags >> TF_SHIFT) & 1;
7863 dc->singlestep_enabled = env->singlestep_enabled;
7864 dc->cc_op = CC_OP_DYNAMIC;
7865 dc->cc_op_dirty = false;
7866 dc->cs_base = cs_base;
7867 dc->tb = tb;
7868 dc->popl_esp_hack = 0;
7869 /* select memory access functions */
7870 dc->mem_index = 0;
7871 if (flags & HF_SOFTMMU_MASK) {
7872 dc->mem_index = (cpu_mmu_index(env) + 1) << 2;
7873 }
7874 dc->cpuid_features = env->cpuid_features;
7875 dc->cpuid_ext_features = env->cpuid_ext_features;
7876 dc->cpuid_ext2_features = env->cpuid_ext2_features;
7877 dc->cpuid_ext3_features = env->cpuid_ext3_features;
7878 dc->cpuid_7_0_ebx_features = env->cpuid_7_0_ebx_features;
7879 #ifdef TARGET_X86_64
7880 dc->lma = (flags >> HF_LMA_SHIFT) & 1;
7881 dc->code64 = (flags >> HF_CS64_SHIFT) & 1;
7882 #endif
7883 dc->flags = flags;
7884 dc->jmp_opt = !(dc->tf || env->singlestep_enabled ||
7885 (flags & HF_INHIBIT_IRQ_MASK)
7886 #ifndef CONFIG_SOFTMMU
7887 || (flags & HF_SOFTMMU_MASK)
7888 #endif
7889 );
7890 #if 0
7891 /* check addseg logic */
7892 if (!dc->addseg && (dc->vm86 || !dc->pe || !dc->code32))
7893 printf("ERROR addseg\n");
7894 #endif
7896 cpu_T[0] = tcg_temp_new();
7897 cpu_T[1] = tcg_temp_new();
7898 cpu_A0 = tcg_temp_new();
7900 cpu_tmp0 = tcg_temp_new();
7901 cpu_tmp1_i64 = tcg_temp_new_i64();
7902 cpu_tmp2_i32 = tcg_temp_new_i32();
7903 cpu_tmp3_i32 = tcg_temp_new_i32();
7904 cpu_tmp4 = tcg_temp_new();
7905 cpu_tmp5 = tcg_temp_new();
7906 cpu_ptr0 = tcg_temp_new_ptr();
7907 cpu_ptr1 = tcg_temp_new_ptr();
7908 cpu_cc_srcT = tcg_temp_local_new();
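/* annotation: cc_srcT must keep its value across branches and labels
   within a TB, hence a local temp */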
7910 gen_opc_end = tcg_ctx.gen_opc_buf + OPC_MAX_SIZE;
7912 dc->is_jmp = DISAS_NEXT;
7913 pc_ptr = pc_start;
7914 lj = -1;
7915 num_insns = 0;
7916 max_insns = tb->cflags & CF_COUNT_MASK;
7917 if (max_insns == 0)
7918 max_insns = CF_COUNT_MASK;
7920 gen_icount_start();
7921 for(;;) {
7922 if (unlikely(!QTAILQ_EMPTY(&env->breakpoints))) {
7923 QTAILQ_FOREACH(bp, &env->breakpoints, entry) {
7924 if (bp->pc == pc_ptr &&
7925 !((bp->flags & BP_CPU) && (tb->flags & HF_RF_MASK))) {
7926 gen_debug(dc, pc_ptr - dc->cs_base);
7927 break;
7928 }
7929 }
7930 }
7931 if (search_pc) {
7932 j = tcg_ctx.gen_opc_ptr - tcg_ctx.gen_opc_buf;
7933 if (lj < j) {
7934 lj++;
7935 while (lj < j)
7936 tcg_ctx.gen_opc_instr_start[lj++] = 0;
7937 }
7938 tcg_ctx.gen_opc_pc[lj] = pc_ptr;
7939 gen_opc_cc_op[lj] = dc->cc_op;
7940 tcg_ctx.gen_opc_instr_start[lj] = 1;
7941 tcg_ctx.gen_opc_icount[lj] = num_insns;
7942 }
7943 if (num_insns + 1 == max_insns && (tb->cflags & CF_LAST_IO))
7944 gen_io_start();
7946 pc_ptr = disas_insn(env, dc, pc_ptr);
7947 num_insns++;
7948 /* stop translation if indicated */
7949 if (dc->is_jmp)
7950 break;
7951 /* in single-step mode, we generate only one instruction and
7952    then generate an exception */
7953 /* if irqs were inhibited with HF_INHIBIT_IRQ_MASK, we clear
7954    the flag and abort the translation to give the irqs a
7955    chance to happen */
7956 if (dc->tf || dc->singlestep_enabled ||
7957 (flags & HF_INHIBIT_IRQ_MASK)) {
7958 gen_jmp_im(pc_ptr - dc->cs_base);
7959 gen_eob(dc);
7960 break;
7961 }
7962 /* if too long translation, stop generation too */
7963 if (tcg_ctx.gen_opc_ptr >= gen_opc_end ||
7964 (pc_ptr - pc_start) >= (TARGET_PAGE_SIZE - 32) ||
7965 num_insns >= max_insns) {
7966 gen_jmp_im(pc_ptr - dc->cs_base);
7967 gen_eob(dc);
7968 break;
7969 }
7970 if (singlestep) {
7971 gen_jmp_im(pc_ptr - dc->cs_base);
7972 gen_eob(dc);
7973 break;
7974 }
7975 }
7976 if (tb->cflags & CF_LAST_IO)
7977 gen_io_end();
7978 gen_icount_end(tb, num_insns);
7979 *tcg_ctx.gen_opc_ptr = INDEX_op_end;
7980 /* make sure the last values are filled in */
7981 if (search_pc) {
7982 j = tcg_ctx.gen_opc_ptr - tcg_ctx.gen_opc_buf;
7983 lj++;
7984 while (lj <= j)
7985 tcg_ctx.gen_opc_instr_start[lj++] = 0;
7986 }
7988 #ifdef DEBUG_DISAS
7989 if (qemu_loglevel_mask(CPU_LOG_TB_IN_ASM)) {
7990 int disas_flags;
7991 qemu_log("----------------\n");
7992 qemu_log("IN: %s\n", lookup_symbol(pc_start));
7993 #ifdef TARGET_X86_64
7994 if (dc->code64)
7995 disas_flags = 2;
7996 else
7997 #endif
7998 disas_flags = !dc->code32;
7999 log_target_disas(env, pc_start, pc_ptr - pc_start, disas_flags);
8000 qemu_log("\n");
8002 #endif
8004 if (!search_pc) {
8005 tb->size = pc_ptr - pc_start;
8006 tb->icount = num_insns;
8007 }
8008 }
8010 void gen_intermediate_code(CPUX86State *env, TranslationBlock *tb)
8011 {
8012 gen_intermediate_code_internal(env, tb, 0);
8013 }
8015 void gen_intermediate_code_pc(CPUX86State *env, TranslationBlock *tb)
8016 {
8017 gen_intermediate_code_internal(env, tb, 1);
8018 }
8020 void restore_state_to_opc(CPUX86State *env, TranslationBlock *tb, int pc_pos)
8021 {
8022 int cc_op;
8023 #ifdef DEBUG_DISAS
8024 if (qemu_loglevel_mask(CPU_LOG_TB_OP)) {
8025 int i;
8026 qemu_log("RESTORE:\n");
8027 for (i = 0; i <= pc_pos; i++) {
8028 if (tcg_ctx.gen_opc_instr_start[i]) {
8029 qemu_log("0x%04x: " TARGET_FMT_lx "\n", i,
8030 tcg_ctx.gen_opc_pc[i]);
8031 }
8032 }
8033 qemu_log("pc_pos=0x%x eip=" TARGET_FMT_lx " cs_base=%x\n",
8034 pc_pos, tcg_ctx.gen_opc_pc[pc_pos] - tb->cs_base,
8035 (uint32_t)tb->cs_base);
8036 }
8037 #endif
8038 env->eip = tcg_ctx.gen_opc_pc[pc_pos] - tb->cs_base;
8039 cc_op = gen_opc_cc_op[pc_pos];
8040 if (cc_op != CC_OP_DYNAMIC)
8041 env->cc_op = cc_op;
8042 }