1 /* ----------------------------------------------------------------------- *
3 * Copyright 1996-2012 The NASM Authors - All Rights Reserved
4 * See the file AUTHORS included with the NASM distribution for
5 * the specific copyright holders.
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following
11 * * Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * * Redistributions in binary form must reproduce the above
14 * copyright notice, this list of conditions and the following
15 * disclaimer in the documentation and/or other materials provided
16 * with the distribution.
18 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
19 * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
20 * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
21 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
22 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
23 * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
24 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
25 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
26 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
28 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
29 * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
30 * EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32 * ----------------------------------------------------------------------- */
35 * disasm.c where all the _work_ gets done in the Netwide Disassembler
53 * Flags that go into the `segment' field of `insn' structures
56 #define SEG_RELATIVE 1
63 #define SEG_SIGNED 128
70 uint8_t osize
; /* Operand size */
71 uint8_t asize
; /* Address size */
72 uint8_t osp
; /* Operand size prefix present */
73 uint8_t asp
; /* Address size prefix present */
74 uint8_t rep
; /* Rep prefix present */
75 uint8_t seg
; /* Segment override prefix present */
76 uint8_t wait
; /* WAIT "prefix" present */
77 uint8_t lock
; /* Lock prefix present */
78 uint8_t vex
[3]; /* VEX prefix present */
79 uint8_t vex_c
; /* VEX "class" (VEX, XOP, ...) */
80 uint8_t vex_m
; /* VEX.M field */
82 uint8_t vex_lp
; /* VEX.LP fields */
83 uint32_t rex
; /* REX prefix present */
84 uint8_t evex
[3]; /* EVEX prefix present */
87 #define getu8(x) (*(uint8_t *)(x))
89 /* Littleendian CPU which can handle unaligned references */
90 #define getu16(x) (*(uint16_t *)(x))
91 #define getu32(x) (*(uint32_t *)(x))
92 #define getu64(x) (*(uint64_t *)(x))
94 static uint16_t getu16(uint8_t *data
)
96 return (uint16_t)data
[0] + ((uint16_t)data
[1] << 8);
98 static uint32_t getu32(uint8_t *data
)
100 return (uint32_t)getu16(data
) + ((uint32_t)getu16(data
+2) << 16);
102 static uint64_t getu64(uint8_t *data
)
104 return (uint64_t)getu32(data
) + ((uint64_t)getu32(data
+4) << 32);
108 #define gets8(x) ((int8_t)getu8(x))
109 #define gets16(x) ((int16_t)getu16(x))
110 #define gets32(x) ((int32_t)getu32(x))
111 #define gets64(x) ((int64_t)getu64(x))
113 /* Important: regval must already have been adjusted for rex extensions */
114 static enum reg_enum
whichreg(opflags_t regflags
, int regval
, int rex
)
118 static const struct {
121 } specific_registers
[] = {
147 if (!(regflags
& (REGISTER
|REGMEM
)))
148 return 0; /* Registers not permissible?! */
150 regflags
|= REGISTER
;
152 for (i
= 0; i
< ARRAY_SIZE(specific_registers
); i
++)
153 if (!(specific_registers
[i
].flags
& ~regflags
))
154 return specific_registers
[i
].reg
;
156 /* All the entries below look up regval in an 16-entry array */
157 if (regval
< 0 || regval
> (rex
& REX_EV
? 31 : 15))
160 if (!(REG8
& ~regflags
)) {
161 if (rex
& (REX_P
|REX_NH
))
162 return nasm_rd_reg8_rex
[regval
];
164 return nasm_rd_reg8
[regval
];
166 if (!(REG16
& ~regflags
))
167 return nasm_rd_reg16
[regval
];
168 if (!(REG32
& ~regflags
))
169 return nasm_rd_reg32
[regval
];
170 if (!(REG64
& ~regflags
))
171 return nasm_rd_reg64
[regval
];
172 if (!(REG_SREG
& ~regflags
))
173 return nasm_rd_sreg
[regval
& 7]; /* Ignore REX */
174 if (!(REG_CREG
& ~regflags
))
175 return nasm_rd_creg
[regval
];
176 if (!(REG_DREG
& ~regflags
))
177 return nasm_rd_dreg
[regval
];
178 if (!(REG_TREG
& ~regflags
)) {
180 return 0; /* TR registers are ill-defined with rex */
181 return nasm_rd_treg
[regval
];
183 if (!(FPUREG
& ~regflags
))
184 return nasm_rd_fpureg
[regval
& 7]; /* Ignore REX */
185 if (!(MMXREG
& ~regflags
))
186 return nasm_rd_mmxreg
[regval
& 7]; /* Ignore REX */
187 if (!(XMMREG
& ~regflags
))
188 return nasm_rd_xmmreg
[regval
];
189 if (!(YMMREG
& ~regflags
))
190 return nasm_rd_ymmreg
[regval
];
191 if (!(ZMMREG
& ~regflags
))
192 return nasm_rd_zmmreg
[regval
];
193 if (!(OPMASKREG
& ~regflags
))
194 return nasm_rd_opmaskreg
[regval
];
200 * Find N value for compressed displacement (disp8 * N)
202 static uint8_t get_disp8N(insn
*ins
)
204 const uint8_t fv_n
[2][2][VLMAX
] = {{{16, 32, 64}, {4, 4, 4}},
205 {{16, 32, 64}, {8, 8, 8}}};
206 const uint8_t hv_n
[2][VLMAX
] = {{8, 16, 32}, {4, 4, 4}};
207 const uint8_t dup_n
[VLMAX
] = {8, 32, 64};
209 bool evex_b
= (ins
->evex_p
[2] & EVEX_P2B
) >> 4;
210 enum ttypes tuple
= ins
->evex_tuple
;
211 /* vex_wlp composed as [wwllpp] */
212 enum vectlens vectlen
= (ins
->evex_p
[2] & EVEX_P2LL
) >> 5;
213 /* wig(=2) is treated as w0(=0) */
214 bool evex_w
= (ins
->evex_p
[1] & EVEX_P1W
) >> 7;
219 n
= fv_n
[evex_w
][evex_b
][vectlen
];
222 n
= hv_n
[evex_b
][vectlen
];
226 /* 16, 32, 64 for VL 128, 256, 512 respectively*/
227 n
= 1 << (vectlen
+ 4);
229 case T1S8
: /* N = 1 */
230 case T1S16
: /* N = 2 */
231 n
= tuple
- T1S8
+ 1;
234 /* N = 4 for 32bit, 8 for 64bit */
239 /* N = 4 for 32bit, 8 for 64bit */
240 n
= (tuple
== T1F32
? 4 : 8);
245 if (vectlen
+ 7 <= (evex_w
+ 5) + (tuple
- T2
+ 1))
248 n
= 1 << (tuple
- T2
+ evex_w
+ 3);
253 n
= 1 << (OVM
- tuple
+ vectlen
+ 1);
270 * Process an effective address (ModRM) specification.
272 static uint8_t *do_ea(uint8_t *data
, int modrm
, int asize
,
273 int segsize
, enum ea_type type
,
274 operand
*op
, insn
*ins
)
276 int mod
, rm
, scale
, index
, base
;
280 bool is_evex
= !!(ins
->rex
& REX_EV
);
282 mod
= (modrm
>> 6) & 03;
285 if (mod
!= 3 && asize
!= 16 && rm
== 4)
291 if (mod
== 3) { /* pure register version */
292 op
->basereg
= rm
+(rex
& REX_B
? 8 : 0);
293 op
->segment
|= SEG_RMREG
;
294 if (is_evex
&& segsize
== 64) {
295 op
->basereg
+= (evex
[0] & EVEX_P0X
? 0 : 16);
305 * <mod> specifies the displacement size (none, byte or
306 * word), and <rm> specifies the register combination.
307 * Exception: mod=0,rm=6 does not specify [BP] as one might
308 * expect, but instead specifies [disp16].
311 if (type
!= EA_SCALAR
)
314 op
->indexreg
= op
->basereg
= -1;
315 op
->scale
= 1; /* always, in 16 bits */
346 if (rm
== 6 && mod
== 0) { /* special case */
350 mod
= 2; /* fake disp16 */
354 op
->segment
|= SEG_NODISP
;
357 op
->segment
|= SEG_DISP8
;
358 if (ins
->evex_tuple
!= 0) {
359 op
->offset
= gets8(data
) * get_disp8N(ins
);
361 op
->offset
= gets8(data
);
366 op
->segment
|= SEG_DISP16
;
367 op
->offset
= *data
++;
368 op
->offset
|= ((unsigned)*data
++) << 8;
374 * Once again, <mod> specifies displacement size (this time
375 * none, byte or *dword*), while <rm> specifies the base
376 * register. Again, [EBP] is missing, replaced by a pure
377 * disp32 (this time that's mod=0,rm=*5*) in 32-bit mode,
378 * and RIP-relative addressing in 64-bit mode.
381 * indicates not a single base register, but instead the
382 * presence of a SIB byte...
384 int a64
= asize
== 64;
389 op
->basereg
= nasm_rd_reg64
[rm
| ((rex
& REX_B
) ? 8 : 0)];
391 op
->basereg
= nasm_rd_reg32
[rm
| ((rex
& REX_B
) ? 8 : 0)];
393 if (rm
== 5 && mod
== 0) {
395 op
->eaflags
|= EAF_REL
;
396 op
->segment
|= SEG_RELATIVE
;
397 mod
= 2; /* fake disp32 */
401 op
->disp_size
= asize
;
404 mod
= 2; /* fake disp32 */
408 if (rm
== 4) { /* process SIB */
410 scale
= (sib
>> 6) & 03;
411 index
= (sib
>> 3) & 07;
414 op
->scale
= 1 << scale
;
417 vsib_hi
= (rex
& REX_X
? 8 : 0) |
418 (evex
[2] & EVEX_P2VP
? 0 : 16);
421 if (type
== EA_XMMVSIB
)
422 op
->indexreg
= nasm_rd_xmmreg
[index
| vsib_hi
];
423 else if (type
== EA_YMMVSIB
)
424 op
->indexreg
= nasm_rd_ymmreg
[index
| vsib_hi
];
425 else if (type
== EA_ZMMVSIB
)
426 op
->indexreg
= nasm_rd_zmmreg
[index
| vsib_hi
];
427 else if (index
== 4 && !(rex
& REX_X
))
428 op
->indexreg
= -1; /* ESP/RSP cannot be an index */
430 op
->indexreg
= nasm_rd_reg64
[index
| ((rex
& REX_X
) ? 8 : 0)];
432 op
->indexreg
= nasm_rd_reg32
[index
| ((rex
& REX_X
) ? 8 : 0)];
434 if (base
== 5 && mod
== 0) {
436 mod
= 2; /* Fake disp32 */
438 op
->basereg
= nasm_rd_reg64
[base
| ((rex
& REX_B
) ? 8 : 0)];
440 op
->basereg
= nasm_rd_reg32
[base
| ((rex
& REX_B
) ? 8 : 0)];
444 } else if (type
!= EA_SCALAR
) {
445 /* Can't have VSIB without SIB */
451 op
->segment
|= SEG_NODISP
;
454 op
->segment
|= SEG_DISP8
;
455 if (ins
->evex_tuple
!= 0) {
456 op
->offset
= gets8(data
) * get_disp8N(ins
);
458 op
->offset
= gets8(data
);
463 op
->segment
|= SEG_DISP32
;
464 op
->offset
= gets32(data
);
473 * Determine whether the instruction template in t corresponds to the data
474 * stream in data. Return the number of bytes matched if so.
476 #define case4(x) case (x): case (x)+1: case (x)+2: case (x)+3
478 static int matches(const struct itemplate
*t
, uint8_t *data
,
479 const struct prefix_info
*prefix
, int segsize
, insn
*ins
)
481 uint8_t *r
= (uint8_t *)(t
->code
);
482 uint8_t *origdata
= data
;
483 bool a_used
= false, o_used
= false;
484 enum prefixes drep
= 0;
485 enum prefixes dwait
= 0;
486 uint8_t lock
= prefix
->lock
;
487 int osize
= prefix
->osize
;
488 int asize
= prefix
->asize
;
491 struct operand
*opx
, *opy
;
494 int regmask
= (segsize
== 64) ? 15 : 7;
495 enum ea_type eat
= EA_SCALAR
;
497 for (i
= 0; i
< MAX_OPERANDS
; i
++) {
498 ins
->oprs
[i
].segment
= ins
->oprs
[i
].disp_size
=
499 (segsize
== 64 ? SEG_64BIT
: segsize
== 32 ? SEG_32BIT
: 0);
503 ins
->rex
= prefix
->rex
;
504 memset(ins
->prefixes
, 0, sizeof ins
->prefixes
);
506 if (t
->flags
& (segsize
== 64 ? IF_NOLONG
: IF_LONG
))
509 if (prefix
->rep
== 0xF2)
510 drep
= (t
->flags
& IF_BND
? P_BND
: P_REPNE
);
511 else if (prefix
->rep
== 0xF3)
514 dwait
= prefix
->wait
? P_WAIT
: 0;
516 while ((c
= *r
++) != 0) {
517 op1
= (c
& 3) + ((opex
& 1) << 2);
518 op2
= ((c
>> 3) & 3) + ((opex
& 2) << 1);
519 opx
= &ins
->oprs
[op1
];
520 opy
= &ins
->oprs
[op2
];
541 int t
= *r
++, d
= *data
++;
542 if (d
< t
|| d
> t
+ 7)
545 opx
->basereg
= (d
-t
)+
546 (ins
->rex
& REX_B
? 8 : 0);
547 opx
->segment
|= SEG_RMREG
;
553 opx
->offset
= (int8_t)*data
++;
554 opx
->segment
|= SEG_SIGNED
;
558 opx
->offset
= *data
++;
562 opx
->offset
= *data
++;
566 opx
->offset
= getu16(data
);
572 opx
->offset
= getu32(data
);
575 opx
->offset
= getu16(data
);
578 if (segsize
!= asize
)
579 opx
->disp_size
= asize
;
583 opx
->offset
= getu32(data
);
588 opx
->offset
= gets32(data
);
595 opx
->offset
= getu16(data
);
601 opx
->offset
= getu32(data
);
607 opx
->offset
= getu64(data
);
615 opx
->offset
= gets8(data
++);
616 opx
->segment
|= SEG_RELATIVE
;
620 opx
->offset
= getu64(data
);
625 opx
->offset
= gets16(data
);
627 opx
->segment
|= SEG_RELATIVE
;
628 opx
->segment
&= ~SEG_32BIT
;
631 case4(064): /* rel */
632 opx
->segment
|= SEG_RELATIVE
;
633 /* In long mode rel is always 32 bits, sign extended. */
634 if (segsize
== 64 || osize
== 32) {
635 opx
->offset
= gets32(data
);
638 opx
->segment
|= SEG_32BIT
;
639 opx
->type
= (opx
->type
& ~SIZE_MASK
)
640 | (segsize
== 64 ? BITS64
: BITS32
);
642 opx
->offset
= gets16(data
);
644 opx
->segment
&= ~SEG_32BIT
;
645 opx
->type
= (opx
->type
& ~SIZE_MASK
) | BITS16
;
650 opx
->offset
= gets32(data
);
652 opx
->segment
|= SEG_32BIT
| SEG_RELATIVE
;
661 opx
->segment
|= SEG_RMREG
;
662 data
= do_ea(data
, modrm
, asize
, segsize
, eat
, opy
, ins
);
665 opx
->basereg
= ((modrm
>> 3) & 7) + (ins
->rex
& REX_R
? 8 : 0);
666 if ((ins
->rex
& REX_EV
) && (segsize
== 64))
667 opx
->basereg
+= (ins
->evex_p
[0] & EVEX_P0RP
? 0 : 16);
673 uint8_t ximm
= *data
++;
675 ins
->oprs
[c
>> 3].basereg
= (ximm
>> 4) & regmask
;
676 ins
->oprs
[c
>> 3].segment
|= SEG_RMREG
;
677 ins
->oprs
[c
& 7].offset
= ximm
& 15;
683 uint8_t ximm
= *data
++;
689 ins
->oprs
[c
>> 4].basereg
= (ximm
>> 4) & regmask
;
690 ins
->oprs
[c
>> 4].segment
|= SEG_RMREG
;
696 uint8_t ximm
= *data
++;
698 opx
->basereg
= (ximm
>> 4) & regmask
;
699 opx
->segment
|= SEG_RMREG
;
713 if (((modrm
>> 3) & 07) != (c
& 07))
714 return false; /* spare field doesn't match up */
715 data
= do_ea(data
, modrm
, asize
, segsize
, eat
, opy
, ins
);
724 uint8_t evexm
= *r
++;
725 uint8_t evexwlp
= *r
++;
726 ins
->evex_tuple
= *r
++ - 0300;
729 if ((prefix
->rex
& (REX_EV
|REX_V
|REX_P
)) != REX_EV
)
732 if ((evexm
& 0x1f) != prefix
->vex_m
)
735 switch (evexwlp
& 060) {
737 if (prefix
->rex
& REX_W
)
741 if (!(prefix
->rex
& REX_W
))
745 case 040: /* VEX.W is a don't care */
752 /* If EVEX.b is set, EVEX.L'L can be rounding control bits */
753 if ((evexwlp
^ prefix
->vex_lp
) &
754 ((prefix
->evex
[2] & EVEX_P2B
) ? 0x03 : 0x0f))
758 if ((prefix
->vex_v
!= 0) ||
759 (!(prefix
->evex
[2] & EVEX_P2VP
) &&
760 ((eat
< EA_XMMVSIB
) || (eat
> EA_ZMMVSIB
))))
763 opx
->segment
|= SEG_RMREG
;
764 opx
->basereg
= ((~prefix
->evex
[2] & EVEX_P2VP
) << (4 - 3) ) |
768 memcpy(ins
->evex_p
, prefix
->evex
, 3);
779 if ((prefix
->rex
& (REX_V
|REX_P
)) != REX_V
)
782 if ((vexm
& 0x1f) != prefix
->vex_m
)
785 switch (vexwlp
& 060) {
787 if (prefix
->rex
& REX_W
)
791 if (!(prefix
->rex
& REX_W
))
795 case 040: /* VEX.W is a don't care */
802 /* The 010 bit of vexwlp is set if VEX.L is ignored */
803 if ((vexwlp
^ prefix
->vex_lp
) & ((vexwlp
& 010) ? 03 : 07))
807 if (prefix
->vex_v
!= 0)
810 opx
->segment
|= SEG_RMREG
;
811 opx
->basereg
= prefix
->vex_v
;
818 if (prefix
->rep
== 0xF3)
823 if (prefix
->rep
== 0xF2)
825 else if (prefix
->rep
== 0xF3)
830 if (prefix
->lock
== 0xF0) {
831 if (prefix
->rep
== 0xF2)
833 else if (prefix
->rep
== 0xF3)
853 if (asize
!= segsize
)
867 if (prefix
->rex
& REX_B
)
872 if (prefix
->rex
& REX_X
)
877 if (prefix
->rex
& REX_R
)
882 if (prefix
->rex
& REX_W
)
901 if (osize
!= (segsize
== 16) ? 16 : 32)
908 ins
->rex
|= REX_W
; /* 64-bit only instruction */
925 int t
= *r
++, d
= *data
++;
926 if (d
< t
|| d
> t
+ 15)
929 ins
->condition
= d
- t
;
934 if (prefix
->rep
== 0xF3)
944 if (prefix
->rep
!= 0xF2)
950 if (prefix
->rep
!= 0xF3)
975 if (prefix
->wait
!= 0x9B)
981 if (prefix
->osp
|| prefix
->rep
)
986 if (!prefix
->osp
|| prefix
->rep
)
1030 return false; /* Unknown code */
1034 if (!vex_ok
&& (ins
->rex
& (REX_V
| REX_EV
)))
1037 /* REX cannot be combined with VEX */
1038 if ((ins
->rex
& REX_V
) && (prefix
->rex
& REX_P
))
1042 * Check for unused rep or a/o prefixes.
1044 for (i
= 0; i
< t
->operands
; i
++) {
1045 if (ins
->oprs
[i
].segment
!= SEG_RMREG
)
1050 if (ins
->prefixes
[PPS_LOCK
])
1052 ins
->prefixes
[PPS_LOCK
] = P_LOCK
;
1055 if (ins
->prefixes
[PPS_REP
])
1057 ins
->prefixes
[PPS_REP
] = drep
;
1059 ins
->prefixes
[PPS_WAIT
] = dwait
;
1061 if (osize
!= ((segsize
== 16) ? 16 : 32)) {
1062 enum prefixes pfx
= 0;
1076 if (ins
->prefixes
[PPS_OSIZE
])
1078 ins
->prefixes
[PPS_OSIZE
] = pfx
;
1081 if (!a_used
&& asize
!= segsize
) {
1082 if (ins
->prefixes
[PPS_ASIZE
])
1084 ins
->prefixes
[PPS_ASIZE
] = asize
== 16 ? P_A16
: P_A32
;
1087 /* Fix: check for redundant REX prefixes */
1089 return data
- origdata
;
1092 /* Condition names for disassembly, sorted by x86 code */
1093 static const char * const condition_name
[16] = {
1094 "o", "no", "c", "nc", "z", "nz", "na", "a",
1095 "s", "ns", "pe", "po", "l", "nl", "ng", "g"
1098 int32_t disasm(uint8_t *data
, char *output
, int outbufsize
, int segsize
,
1099 int32_t offset
, int autosync
, iflags_t prefer
)
1101 const struct itemplate
* const *p
, * const *best_p
;
1102 const struct disasm_index
*ix
;
1104 int length
, best_length
= 0;
1106 int i
, slen
, colon
, n
;
1110 iflags_t goodness
, best
, flags
;
1112 struct prefix_info prefix
;
1116 memset(&ins
, 0, sizeof ins
);
1119 * Scan for prefixes.
1121 memset(&prefix
, 0, sizeof prefix
);
1122 prefix
.asize
= segsize
;
1123 prefix
.osize
= (segsize
== 64) ? 32 : segsize
;
1130 while (!end_prefix
) {
1134 prefix
.rep
= *data
++;
1138 prefix
.wait
= *data
++;
1142 prefix
.lock
= *data
++;
1146 segover
= "cs", prefix
.seg
= *data
++;
1149 segover
= "ss", prefix
.seg
= *data
++;
1152 segover
= "ds", prefix
.seg
= *data
++;
1155 segover
= "es", prefix
.seg
= *data
++;
1158 segover
= "fs", prefix
.seg
= *data
++;
1161 segover
= "gs", prefix
.seg
= *data
++;
1165 prefix
.osize
= (segsize
== 16) ? 32 : 16;
1166 prefix
.osp
= *data
++;
1169 prefix
.asize
= (segsize
== 32) ? 16 : 32;
1170 prefix
.asp
= *data
++;
1175 if (segsize
== 64 || (data
[1] & 0xc0) == 0xc0) {
1176 prefix
.vex
[0] = *data
++;
1177 prefix
.vex
[1] = *data
++;
1180 prefix
.vex_c
= RV_VEX
;
1182 if (prefix
.vex
[0] == 0xc4) {
1183 prefix
.vex
[2] = *data
++;
1184 prefix
.rex
|= (~prefix
.vex
[1] >> 5) & 7; /* REX_RXB */
1185 prefix
.rex
|= (prefix
.vex
[2] >> (7-3)) & REX_W
;
1186 prefix
.vex_m
= prefix
.vex
[1] & 0x1f;
1187 prefix
.vex_v
= (~prefix
.vex
[2] >> 3) & 15;
1188 prefix
.vex_lp
= prefix
.vex
[2] & 7;
1190 prefix
.rex
|= (~prefix
.vex
[1] >> (7-2)) & REX_R
;
1192 prefix
.vex_v
= (~prefix
.vex
[1] >> 3) & 15;
1193 prefix
.vex_lp
= prefix
.vex
[1] & 7;
1196 ix
= itable_vex
[RV_VEX
][prefix
.vex_m
][prefix
.vex_lp
& 3];
1203 uint8_t evex_p0
= data
[1] & 0x0f;
1204 if (segsize
== 64 ||
1205 ((evex_p0
>= 0x01) && (evex_p0
<= 0x03))) {
1206 data
++; /* 62h EVEX prefix */
1207 prefix
.evex
[0] = *data
++;
1208 prefix
.evex
[1] = *data
++;
1209 prefix
.evex
[2] = *data
++;
1211 prefix
.rex
= REX_EV
;
1212 prefix
.vex_c
= RV_EVEX
;
1213 prefix
.rex
|= (~prefix
.evex
[0] >> 5) & 7; /* REX_RXB */
1214 prefix
.rex
|= (prefix
.evex
[1] >> (7-3)) & REX_W
;
1215 prefix
.vex_m
= prefix
.evex
[0] & EVEX_P0MM
;
1216 prefix
.vex_v
= (~prefix
.evex
[1] & EVEX_P1VVVV
) >> 3;
1217 prefix
.vex_lp
= ((prefix
.evex
[2] & EVEX_P2LL
) >> (5-2)) |
1218 (prefix
.evex
[1] & EVEX_P1PP
);
1220 ix
= itable_vex
[prefix
.vex_c
][prefix
.vex_m
][prefix
.vex_lp
& 3];
1227 if ((data
[1] & 030) != 0 &&
1228 (segsize
== 64 || (data
[1] & 0xc0) == 0xc0)) {
1229 prefix
.vex
[0] = *data
++;
1230 prefix
.vex
[1] = *data
++;
1231 prefix
.vex
[2] = *data
++;
1234 prefix
.vex_c
= RV_XOP
;
1236 prefix
.rex
|= (~prefix
.vex
[1] >> 5) & 7; /* REX_RXB */
1237 prefix
.rex
|= (prefix
.vex
[2] >> (7-3)) & REX_W
;
1238 prefix
.vex_m
= prefix
.vex
[1] & 0x1f;
1239 prefix
.vex_v
= (~prefix
.vex
[2] >> 3) & 15;
1240 prefix
.vex_lp
= prefix
.vex
[2] & 7;
1242 ix
= itable_vex
[RV_XOP
][prefix
.vex_m
][prefix
.vex_lp
& 3];
1263 if (segsize
== 64) {
1264 prefix
.rex
= *data
++;
1265 if (prefix
.rex
& REX_W
)
1277 best
= -1; /* Worst possible */
1279 best_pref
= INT_MAX
;
1282 return 0; /* No instruction table at all... */
1286 while (ix
->n
== -1) {
1287 ix
= (const struct disasm_index
*)ix
->p
+ *dp
++;
1290 p
= (const struct itemplate
* const *)ix
->p
;
1291 for (n
= ix
->n
; n
; n
--, p
++) {
1292 if ((length
= matches(*p
, data
, &prefix
, segsize
, &tmp_ins
))) {
1295 * Final check to make sure the types of r/m match up.
1296 * XXX: Need to make sure this is actually correct.
1298 for (i
= 0; i
< (*p
)->operands
; i
++) {
1300 /* If it's a mem-only EA but we have a
1302 ((tmp_ins
.oprs
[i
].segment
& SEG_RMREG
) &&
1303 is_class(MEMORY
, (*p
)->opd
[i
])) ||
1304 /* If it's a reg-only EA but we have a memory
1306 (!(tmp_ins
.oprs
[i
].segment
& SEG_RMREG
) &&
1307 !(REG_EA
& ~(*p
)->opd
[i
]) &&
1308 !((*p
)->opd
[i
] & REG_SMASK
)) ||
1309 /* Register type mismatch (eg FS vs REG_DESS):
1311 ((((*p
)->opd
[i
] & (REGISTER
| FPUREG
)) ||
1312 (tmp_ins
.oprs
[i
].segment
& SEG_RMREG
)) &&
1313 !whichreg((*p
)->opd
[i
],
1314 tmp_ins
.oprs
[i
].basereg
, tmp_ins
.rex
))
1322 * Note: we always prefer instructions which incorporate
1323 * prefixes in the instructions themselves. This is to allow
1324 * e.g. PAUSE to be preferred to REP NOP, and deal with
1325 * MMX/SSE instructions where prefixes are used to select
1326 * between MMX and SSE register sets or outright opcode
1331 goodness
= ((*p
)->flags
& IF_PFMASK
) ^ prefer
;
1333 for (i
= 0; i
< MAXPREFIX
; i
++)
1334 if (tmp_ins
.prefixes
[i
])
1336 if (nprefix
< best_pref
||
1337 (nprefix
== best_pref
&& goodness
< best
)) {
1338 /* This is the best one found so far */
1341 best_pref
= nprefix
;
1342 best_length
= length
;
1350 return 0; /* no instruction was matched */
1352 /* Pick the best match */
1354 length
= best_length
;
1355 flags
= (*p
)->flags
;
1359 /* TODO: snprintf returns the value that the string would have if
1360 * the buffer were long enough, and not the actual length of
1361 * the returned string, so each instance of using the return
1362 * value of snprintf should actually be checked to assure that
1363 * the return value is "sane." Maybe a macro wrapper could
1364 * be used for that purpose.
1366 for (i
= 0; i
< MAXPREFIX
; i
++) {
1367 const char *prefix
= prefix_name(ins
.prefixes
[i
]);
1369 slen
+= snprintf(output
+slen
, outbufsize
-slen
, "%s ", prefix
);
1373 if (i
>= FIRST_COND_OPCODE
)
1374 slen
+= snprintf(output
+ slen
, outbufsize
- slen
, "%s%s",
1375 nasm_insn_names
[i
], condition_name
[ins
.condition
]);
1377 slen
+= snprintf(output
+ slen
, outbufsize
- slen
, "%s",
1378 nasm_insn_names
[i
]);
1381 is_evex
= !!(ins
.rex
& REX_EV
);
1382 length
+= data
- origdata
; /* fix up for prefixes */
1383 for (i
= 0; i
< (*p
)->operands
; i
++) {
1384 opflags_t t
= (*p
)->opd
[i
];
1385 const operand
*o
= &ins
.oprs
[i
];
1388 output
[slen
++] = (colon
? ':' : i
== 0 ? ' ' : ',');
1391 if (o
->segment
& SEG_RELATIVE
) {
1392 offs
+= offset
+ length
;
1394 * sort out wraparound
1396 if (!(o
->segment
& (SEG_32BIT
|SEG_64BIT
)))
1398 else if (segsize
!= 64)
1402 * add sync marker, if autosync is on
1413 if ((t
& (REGISTER
| FPUREG
)) ||
1414 (o
->segment
& SEG_RMREG
)) {
1416 reg
= whichreg(t
, o
->basereg
, ins
.rex
);
1418 slen
+= snprintf(output
+ slen
, outbufsize
- slen
, "to ");
1419 slen
+= snprintf(output
+ slen
, outbufsize
- slen
, "%s",
1420 nasm_reg_names
[reg
-EXPR_REG_START
]);
1421 } else if (!(UNITY
& ~t
)) {
1422 output
[slen
++] = '1';
1423 } else if (t
& IMMEDIATE
) {
1426 snprintf(output
+ slen
, outbufsize
- slen
, "byte ");
1427 if (o
->segment
& SEG_SIGNED
) {
1430 output
[slen
++] = '-';
1432 output
[slen
++] = '+';
1434 } else if (t
& BITS16
) {
1436 snprintf(output
+ slen
, outbufsize
- slen
, "word ");
1437 } else if (t
& BITS32
) {
1439 snprintf(output
+ slen
, outbufsize
- slen
, "dword ");
1440 } else if (t
& BITS64
) {
1442 snprintf(output
+ slen
, outbufsize
- slen
, "qword ");
1443 } else if (t
& NEAR
) {
1445 snprintf(output
+ slen
, outbufsize
- slen
, "near ");
1446 } else if (t
& SHORT
) {
1448 snprintf(output
+ slen
, outbufsize
- slen
, "short ");
1451 snprintf(output
+ slen
, outbufsize
- slen
, "0x%"PRIx64
"",
1453 } else if (!(MEM_OFFS
& ~t
)) {
1455 snprintf(output
+ slen
, outbufsize
- slen
,
1456 "[%s%s%s0x%"PRIx64
"]",
1457 (segover
? segover
: ""),
1458 (segover
? ":" : ""),
1459 (o
->disp_size
== 64 ? "qword " :
1460 o
->disp_size
== 32 ? "dword " :
1461 o
->disp_size
== 16 ? "word " : ""), offs
);
1463 } else if (is_class(REGMEM
, t
)) {
1464 int started
= false;
1467 snprintf(output
+ slen
, outbufsize
- slen
, "byte ");
1470 snprintf(output
+ slen
, outbufsize
- slen
, "word ");
1473 snprintf(output
+ slen
, outbufsize
- slen
, "dword ");
1476 snprintf(output
+ slen
, outbufsize
- slen
, "qword ");
1479 snprintf(output
+ slen
, outbufsize
- slen
, "tword ");
1482 snprintf(output
+ slen
, outbufsize
- slen
, "oword ");
1485 snprintf(output
+ slen
, outbufsize
- slen
, "yword ");
1488 snprintf(output
+ slen
, outbufsize
- slen
, "zword ");
1490 slen
+= snprintf(output
+ slen
, outbufsize
- slen
, "far ");
1493 snprintf(output
+ slen
, outbufsize
- slen
, "near ");
1494 output
[slen
++] = '[';
1496 slen
+= snprintf(output
+ slen
, outbufsize
- slen
, "%s",
1497 (o
->disp_size
== 64 ? "qword " :
1498 o
->disp_size
== 32 ? "dword " :
1499 o
->disp_size
== 16 ? "word " :
1501 if (o
->eaflags
& EAF_REL
)
1502 slen
+= snprintf(output
+ slen
, outbufsize
- slen
, "rel ");
1505 snprintf(output
+ slen
, outbufsize
- slen
, "%s:",
1509 if (o
->basereg
!= -1) {
1510 slen
+= snprintf(output
+ slen
, outbufsize
- slen
, "%s",
1511 nasm_reg_names
[(o
->basereg
-EXPR_REG_START
)]);
1514 if (o
->indexreg
!= -1 && !(flags
& IF_MIB
)) {
1516 output
[slen
++] = '+';
1517 slen
+= snprintf(output
+ slen
, outbufsize
- slen
, "%s",
1518 nasm_reg_names
[(o
->indexreg
-EXPR_REG_START
)]);
1521 snprintf(output
+ slen
, outbufsize
- slen
, "*%d",
1527 if (o
->segment
& SEG_DISP8
) {
1530 uint32_t offset
= offs
;
1531 if ((int32_t)offset
< 0) {
1538 snprintf(output
+ slen
, outbufsize
- slen
, "%s0x%"PRIx32
"",
1542 uint8_t offset
= offs
;
1543 if ((int8_t)offset
< 0) {
1550 snprintf(output
+ slen
, outbufsize
- slen
, "%s0x%"PRIx8
"",
1553 } else if (o
->segment
& SEG_DISP16
) {
1555 uint16_t offset
= offs
;
1556 if ((int16_t)offset
< 0 && started
) {
1560 prefix
= started
? "+" : "";
1563 snprintf(output
+ slen
, outbufsize
- slen
,
1564 "%s0x%"PRIx16
"", prefix
, offset
);
1565 } else if (o
->segment
& SEG_DISP32
) {
1566 if (prefix
.asize
== 64) {
1568 uint64_t offset
= (int64_t)(int32_t)offs
;
1569 if ((int32_t)offs
< 0 && started
) {
1573 prefix
= started
? "+" : "";
1576 snprintf(output
+ slen
, outbufsize
- slen
,
1577 "%s0x%"PRIx64
"", prefix
, offset
);
1580 uint32_t offset
= offs
;
1581 if ((int32_t) offset
< 0 && started
) {
1585 prefix
= started
? "+" : "";
1588 snprintf(output
+ slen
, outbufsize
- slen
,
1589 "%s0x%"PRIx32
"", prefix
, offset
);
1593 if (o
->indexreg
!= -1 && (flags
& IF_MIB
)) {
1594 output
[slen
++] = ',';
1595 slen
+= snprintf(output
+ slen
, outbufsize
- slen
, "%s",
1596 nasm_reg_names
[(o
->indexreg
-EXPR_REG_START
)]);
1599 snprintf(output
+ slen
, outbufsize
- slen
, "*%d",
1604 output
[slen
++] = ']';
1607 snprintf(output
+ slen
, outbufsize
- slen
, "<operand%d>",
1611 output
[slen
] = '\0';
1612 if (segover
) { /* unused segment override */
1614 int count
= slen
+ 1;
1616 p
[count
+ 3] = p
[count
];
1617 strncpy(output
, segover
, 2);
1624 * This is called when we don't have a complete instruction. If it
1625 * is a standalone *single-byte* prefix show it as such, otherwise
1626 * print it as a literal.
1628 int32_t eatbyte(uint8_t *data
, char *output
, int outbufsize
, int segsize
)
1630 uint8_t byte
= *data
;
1631 const char *str
= NULL
;
1665 str
= (segsize
== 16) ? "o32" : "o16";
1668 str
= (segsize
== 32) ? "a16" : "a32";
1686 if (segsize
== 64) {
1687 snprintf(output
, outbufsize
, "rex%s%s%s%s%s",
1688 (byte
== REX_P
) ? "" : ".",
1689 (byte
& REX_W
) ? "w" : "",
1690 (byte
& REX_R
) ? "r" : "",
1691 (byte
& REX_X
) ? "x" : "",
1692 (byte
& REX_B
) ? "b" : "");
1695 /* else fall through */
1697 snprintf(output
, outbufsize
, "db 0x%02x", byte
);
1702 snprintf(output
, outbufsize
, "%s", str
);