1 /* assemble.c code generation for the Netwide Assembler
3 * The Netwide Assembler is copyright (C) 1996 Simon Tatham and
4 * Julian Hall. All rights reserved. The software is
5 * redistributable under the licence given in the file "Licence"
6 * distributed in the NASM archive.
8 * the actual codes (C syntax, i.e. octal):
9 * \0 - terminates the code. (Unless it's a literal of course.)
10 * \1, \2, \3 - that many literal bytes follow in the code stream
11 * \4, \6 - the POP/PUSH (respectively) codes for CS, DS, ES, SS
12 * (POP is never used for CS) depending on operand 0
13 * \5, \7 - the second byte of POP/PUSH codes for FS, GS, depending
15 * \10..\13 - a literal byte follows in the code stream, to be added
16 * to the register value of operand 0..3
17 * \14..\17 - a signed byte immediate operand, from operand 0..3
18 * \20..\23 - a byte immediate operand, from operand 0..3
19 * \24..\27 - an unsigned byte immediate operand, from operand 0..3
20 * \30..\33 - a word immediate operand, from operand 0..3
21 * \34..\37 - select between \3[0-3] and \4[0-3] depending on 16/32 bit
22 * assembly mode or the operand-size override on the operand
23 * \40..\43 - a long immediate operand, from operand 0..3
24 * \44..\47 - select between \3[0-3], \4[0-3] and \5[4-7]
25 * depending on the address size of the instruction.
26 * \50..\53 - a byte relative operand, from operand 0..3
27 * \54..\57 - a qword immediate operand, from operand 0..3
28 * \60..\63 - a word relative operand, from operand 0..3
29 * \64..\67 - select between \6[0-3] and \7[0-3] depending on 16/32 bit
30 * assembly mode or the operand-size override on the operand
31 * \70..\73 - a long relative operand, from operand 0..3
32 * \74..\77 - a word constant, from the _segment_ part of operand 0..3
33 * \1ab - a ModRM, calculated on EA in operand a, with the spare
34 * field the register value of operand b.
35 * \140..\143 - an immediate word or signed byte for operand 0..3
36 * \144..\147 - or 2 (s-field) into next opcode byte if operand 0..3
37 * is a signed byte rather than a word.
38 * \150..\153 - an immediate dword or signed byte for operand 0..3
39 * \154..\157 - or 2 (s-field) into next opcode byte if operand 0..3
40 * is a signed byte rather than a dword.
41 * \160..\163 - this instruction uses DREX rather than REX, with the
42 * OC0 field set to 0, and the dest field taken from
44 * \164..\167 - this instruction uses DREX rather than REX, with the
45 * OC0 field set to 1, and the dest field taken from
47 * \170 - encodes the literal byte 0. (Some compilers don't take
48 * kindly to a zero byte in the _middle_ of a compile time
49 * string constant, so I had to put this hack in.)
50 * \171 - placement of DREX suffix in the absence of an EA
51 * \2ab - a ModRM, calculated on EA in operand a, with the spare
52 * field equal to digit b.
53 * \310 - indicates fixed 16-bit address size, i.e. optional 0x67.
54 * \311 - indicates fixed 32-bit address size, i.e. optional 0x67.
55 * \312 - (disassembler only) marker on LOOP, LOOPxx instructions.
56 * \313 - indicates fixed 64-bit address size, 0x67 invalid.
57 * \320 - indicates fixed 16-bit operand size, i.e. optional 0x66.
58 * \321 - indicates fixed 32-bit operand size, i.e. optional 0x66.
59 * \322 - indicates that this instruction is only valid when the
60 * operand size is the default (instruction to disassembler,
61 * generates no code in the assembler)
62 * \323 - indicates fixed 64-bit operand size, REX on extensions only.
63 * \324 - indicates 64-bit operand size requiring REX prefix.
64 * \330 - a literal byte follows in the code stream, to be added
65 * to the condition code value of the instruction.
66 * \331 - instruction not valid with REP prefix. Hint for
67 * disassembler only; for SSE instructions.
68 * \332 - REP prefix (0xF2 byte) used as opcode extension.
69 * \333 - REP prefix (0xF3 byte) used as opcode extension.
70 * \334 - LOCK prefix used instead of REX.R
71 * \335 - disassemble a rep (0xF3 byte) prefix as repe not rep.
72 * \340 - reserve <operand 0> bytes of uninitialized storage.
73 * Operand 0 had better be a segmentless constant.
74 * \364 - operand-size prefix (0x66) not permitted
75 * \365 - address-size prefix (0x67) not permitted
76 * \366 - operand-size prefix (0x66) used as opcode extension
77 * \367 - address-size prefix (0x67) used as opcode extension
78 * \370,\371,\372 - match only if operand 0 meets byte jump criteria.
79 * 370 is used for Jcc, 371 is used for JMP.
80 * \373 - assemble 0x03 if bits==16, 0x05 if bits==32;
81 * used for conditional jump over longer jump
99 int sib_present
; /* is a SIB byte necessary? */
100 int bytes
; /* # of bytes of offset needed */
101 int size
; /* lazy - this is sib+bytes+1 */
102 uint8_t modrm
, sib
, rex
, rip
; /* the bytes themselves */
105 static uint32_t cpu
; /* cpu level received from nasm.c */
106 static efunc errfunc
;
107 static struct ofmt
*outfmt
;
108 static ListGen
*list
;
110 static int32_t calcsize(int32_t, int32_t, int, insn
*, const char *);
111 static void gencode(int32_t, int32_t, int, insn
*, const char *, int32_t);
112 static int matches(const struct itemplate
*, insn
*, int bits
);
113 static int32_t regflag(const operand
*);
114 static int32_t regval(const operand
*);
115 static int rexflags(int, int32_t, int);
116 static int op_rexflags(const operand
*, int);
117 static ea
*process_ea(operand
*, ea
*, int, int, int, int32_t, int);
118 static void add_asp(insn
*, int);
120 static int has_prefix(insn
* ins
, enum prefix_pos pos
, enum prefixes prefix
)
122 return ins
->prefixes
[pos
] == prefix
;
125 static void assert_no_prefix(insn
* ins
, enum prefix_pos pos
)
127 if (ins
->prefixes
[pos
])
128 errfunc(ERR_NONFATAL
, "invalid %s prefix",
129 prefix_name(ins
->prefixes
[pos
]));
132 static const char *size_name(int size
)
152 static void warn_overflow(int size
, int64_t data
)
155 int64_t lim
= (1 << (size
*8))-1;
157 if (data
< ~lim
|| data
> lim
)
158 errfunc(ERR_WARNING
, "%s data exceeds bounds", size_name(size
));
162 * This routine wrappers the real output format's output routine,
163 * in order to pass a copy of the data off to the listing file
164 * generator at the same time.
166 static void out(int32_t offset
, int32_t segto
, const void *data
,
167 uint32_t type
, int32_t segment
, int32_t wrt
)
169 static int32_t lineno
= 0; /* static!!! */
170 static char *lnfname
= NULL
;
172 if ((type
& OUT_TYPMASK
) == OUT_ADDRESS
) {
173 if (segment
!= NO_SEG
|| wrt
!= NO_SEG
) {
175 * This address is relocated. We must write it as
176 * OUT_ADDRESS, so there's no work to be done here.
178 list
->output(offset
, data
, type
);
180 uint8_t p
[8], *q
= p
;
182 * This is a non-relocated address, and we're going to
183 * convert it into RAWDATA format.
185 if ((type
& OUT_SIZMASK
) == 4) {
186 WRITELONG(q
, *(int32_t *)data
);
187 list
->output(offset
, p
, OUT_RAWDATA
+ 4);
188 } else if ((type
& OUT_SIZMASK
) == 8) {
189 WRITEDLONG(q
, *(int64_t *)data
);
190 list
->output(offset
, p
, OUT_RAWDATA
+ 8);
192 WRITESHORT(q
, *(int32_t *)data
);
193 list
->output(offset
, p
, OUT_RAWDATA
+ 2);
196 } else if ((type
& OUT_TYPMASK
) == OUT_RAWDATA
) {
197 list
->output(offset
, data
, type
);
198 } else if ((type
& OUT_TYPMASK
) == OUT_RESERVE
) {
199 list
->output(offset
, NULL
, type
);
200 } else if ((type
& OUT_TYPMASK
) == OUT_REL2ADR
||
201 (type
& OUT_TYPMASK
) == OUT_REL4ADR
) {
202 list
->output(offset
, data
, type
);
206 * this call to src_get determines when we call the
207 * debug-format-specific "linenum" function
208 * it updates lineno and lnfname to the current values
209 * returning 0 if "same as last time", -2 if lnfname
210 * changed, and the amount by which lineno changed,
211 * if it did. thus, these variables must be static
214 if (src_get(&lineno
, &lnfname
)) {
215 outfmt
->current_dfmt
->linenum(lnfname
, lineno
, segto
);
218 outfmt
->output(segto
, data
, type
, segment
, wrt
);
221 static int jmp_match(int32_t segment
, int32_t offset
, int bits
,
222 insn
* ins
, const char *code
)
227 if (c
!= 0370 && c
!= 0371)
229 if (ins
->oprs
[0].opflags
& OPFLAG_FORWARD
) {
230 if ((optimizing
< 0 || (ins
->oprs
[0].type
& STRICT
))
234 return (pass0
== 0); /* match a forward reference */
236 isize
= calcsize(segment
, offset
, bits
, ins
, code
);
237 if (ins
->oprs
[0].segment
!= segment
)
239 isize
= ins
->oprs
[0].offset
- offset
- isize
; /* isize is now the delta */
240 if (isize
>= -128L && isize
<= 127L)
241 return 1; /* it is byte size */
246 int32_t assemble(int32_t segment
, int32_t offset
, int bits
, uint32_t cp
,
247 insn
* instruction
, struct ofmt
*output
, efunc error
,
250 const struct itemplate
*temp
;
255 int32_t start
= offset
;
256 int32_t wsize
= 0; /* size for DB etc. */
258 errfunc
= error
; /* to pass to other functions */
260 outfmt
= output
; /* likewise */
261 list
= listgen
; /* and again */
263 switch (instruction
->opcode
) {
290 int32_t t
= instruction
->times
;
293 "instruction->times < 0 (%ld) in assemble()", t
);
295 while (t
--) { /* repeat TIMES times */
296 for (e
= instruction
->eops
; e
; e
= e
->next
) {
297 if (e
->type
== EOT_DB_NUMBER
) {
299 if (e
->segment
!= NO_SEG
)
300 errfunc(ERR_NONFATAL
,
301 "one-byte relocation attempted");
303 uint8_t out_byte
= e
->offset
;
304 out(offset
, segment
, &out_byte
,
305 OUT_RAWDATA
+ 1, NO_SEG
, NO_SEG
);
307 } else if (wsize
> 8) {
308 errfunc(ERR_NONFATAL
, "integer supplied to a DT or DO"
311 out(offset
, segment
, &e
->offset
,
312 OUT_ADDRESS
+ wsize
, e
->segment
, e
->wrt
);
314 } else if (e
->type
== EOT_DB_STRING
) {
317 out(offset
, segment
, e
->stringval
,
318 OUT_RAWDATA
+ e
->stringlen
, NO_SEG
, NO_SEG
);
319 align
= e
->stringlen
% wsize
;
322 align
= wsize
- align
;
323 out(offset
, segment
, "\0\0\0\0\0\0\0\0",
324 OUT_RAWDATA
+ align
, NO_SEG
, NO_SEG
);
326 offset
+= e
->stringlen
+ align
;
329 if (t
> 0 && t
== instruction
->times
- 1) {
331 * Dummy call to list->output to give the offset to the
334 list
->output(offset
, NULL
, OUT_RAWDATA
);
335 list
->uplevel(LIST_TIMES
);
338 if (instruction
->times
> 1)
339 list
->downlevel(LIST_TIMES
);
340 return offset
- start
;
343 if (instruction
->opcode
== I_INCBIN
) {
344 static char fname
[FILENAME_MAX
];
347 char *prefix
= "", *combine
;
348 char **pPrevPath
= NULL
;
350 len
= FILENAME_MAX
- 1;
351 if (len
> instruction
->eops
->stringlen
)
352 len
= instruction
->eops
->stringlen
;
353 strncpy(fname
, instruction
->eops
->stringval
, len
);
356 while (1) { /* added by alexfru: 'incbin' uses include paths */
357 combine
= nasm_malloc(strlen(prefix
) + len
+ 1);
358 strcpy(combine
, prefix
);
359 strcat(combine
, fname
);
361 if ((fp
= fopen(combine
, "rb")) != NULL
) {
367 pPrevPath
= pp_get_include_path_ptr(pPrevPath
);
368 if (pPrevPath
== NULL
)
374 error(ERR_NONFATAL
, "`incbin': unable to open file `%s'",
376 else if (fseek(fp
, 0L, SEEK_END
) < 0)
377 error(ERR_NONFATAL
, "`incbin': unable to seek on file `%s'",
380 static char buf
[2048];
381 int32_t t
= instruction
->times
;
385 if (instruction
->eops
->next
) {
386 base
= instruction
->eops
->next
->offset
;
388 if (instruction
->eops
->next
->next
&&
389 len
> instruction
->eops
->next
->next
->offset
)
390 len
= instruction
->eops
->next
->next
->offset
;
393 * Dummy call to list->output to give the offset to the
396 list
->output(offset
, NULL
, OUT_RAWDATA
);
397 list
->uplevel(LIST_INCBIN
);
401 fseek(fp
, base
, SEEK_SET
);
405 fread(buf
, 1, (l
> (int32_t) sizeof(buf
) ? (int32_t) sizeof(buf
) : l
),
409 * This shouldn't happen unless the file
410 * actually changes while we are reading
414 "`incbin': unexpected EOF while"
415 " reading file `%s'", fname
);
416 t
= 0; /* Try to exit cleanly */
419 out(offset
, segment
, buf
, OUT_RAWDATA
+ m
,
424 list
->downlevel(LIST_INCBIN
);
425 if (instruction
->times
> 1) {
427 * Dummy call to list->output to give the offset to the
430 list
->output(offset
, NULL
, OUT_RAWDATA
);
431 list
->uplevel(LIST_TIMES
);
432 list
->downlevel(LIST_TIMES
);
435 return instruction
->times
* len
;
437 return 0; /* if we're here, there's an error */
440 /* Check to see if we need an address-size prefix */
441 add_asp(instruction
, bits
);
445 for (temp
= nasm_instructions
[instruction
->opcode
]; temp
->opcode
!= -1; temp
++){
446 int m
= matches(temp
, instruction
, bits
);
449 m
+= jmp_match(segment
, offset
, bits
, instruction
, temp
->code
);
451 if (m
== 100) { /* matches! */
452 const char *codes
= temp
->code
;
453 int32_t insn_size
= calcsize(segment
, offset
, bits
,
455 itimes
= instruction
->times
;
456 if (insn_size
< 0) /* shouldn't be, on pass two */
457 error(ERR_PANIC
, "errors made it through from pass one");
460 for (j
= 0; j
< MAXPREFIX
; j
++) {
462 switch (instruction
->prefixes
[j
]) {
478 "cs segment base ignored in 64-bit mode");
485 "ds segment base ignored in 64-bit mode");
492 "es segment base ignored in 64-bit mode");
505 "ss segment base ignored in 64-bit mode");
512 "segr6 and segr7 cannot be used as prefixes");
517 "16-bit addressing is not supported "
519 } else if (bits
!= 16)
529 "64-bit addressing is only supported "
553 error(ERR_PANIC
, "invalid instruction prefix");
556 out(offset
, segment
, &c
, OUT_RAWDATA
+ 1,
561 insn_end
= offset
+ insn_size
;
562 gencode(segment
, offset
, bits
, instruction
, codes
,
565 if (itimes
> 0 && itimes
== instruction
->times
- 1) {
567 * Dummy call to list->output to give the offset to the
570 list
->output(offset
, NULL
, OUT_RAWDATA
);
571 list
->uplevel(LIST_TIMES
);
574 if (instruction
->times
> 1)
575 list
->downlevel(LIST_TIMES
);
576 return offset
- start
;
577 } else if (m
> 0 && m
> size_prob
) {
583 if (temp
->opcode
== -1) { /* didn't match any instruction */
586 error(ERR_NONFATAL
, "operation size not specified");
589 error(ERR_NONFATAL
, "mismatch in operand sizes");
592 error(ERR_NONFATAL
, "no instruction for this cpu level");
595 error(ERR_NONFATAL
, "instruction not supported in 64-bit mode");
599 "invalid combination of opcode and operands");
606 int32_t insn_size(int32_t segment
, int32_t offset
, int bits
, uint32_t cp
,
607 insn
* instruction
, efunc error
)
609 const struct itemplate
*temp
;
611 errfunc
= error
; /* to pass to other functions */
614 if (instruction
->opcode
== -1)
617 if (instruction
->opcode
== I_DB
|| instruction
->opcode
== I_DW
||
618 instruction
->opcode
== I_DD
|| instruction
->opcode
== I_DQ
||
619 instruction
->opcode
== I_DT
|| instruction
->opcode
== I_DO
) {
621 int32_t isize
, osize
, wsize
= 0; /* placate gcc */
624 switch (instruction
->opcode
) {
647 for (e
= instruction
->eops
; e
; e
= e
->next
) {
651 if (e
->type
== EOT_DB_NUMBER
)
653 else if (e
->type
== EOT_DB_STRING
)
654 osize
= e
->stringlen
;
656 align
= (-osize
) % wsize
;
659 isize
+= osize
+ align
;
661 return isize
* instruction
->times
;
664 if (instruction
->opcode
== I_INCBIN
) {
665 char fname
[FILENAME_MAX
];
668 char *prefix
= "", *combine
;
669 char **pPrevPath
= NULL
;
671 len
= FILENAME_MAX
- 1;
672 if (len
> instruction
->eops
->stringlen
)
673 len
= instruction
->eops
->stringlen
;
674 strncpy(fname
, instruction
->eops
->stringval
, len
);
677 /* added by alexfru: 'incbin' uses include paths */
679 combine
= nasm_malloc(strlen(prefix
) + len
+ 1);
680 strcpy(combine
, prefix
);
681 strcat(combine
, fname
);
683 if ((fp
= fopen(combine
, "rb")) != NULL
) {
689 pPrevPath
= pp_get_include_path_ptr(pPrevPath
);
690 if (pPrevPath
== NULL
)
696 error(ERR_NONFATAL
, "`incbin': unable to open file `%s'",
698 else if (fseek(fp
, 0L, SEEK_END
) < 0)
699 error(ERR_NONFATAL
, "`incbin': unable to seek on file `%s'",
704 if (instruction
->eops
->next
) {
705 len
-= instruction
->eops
->next
->offset
;
706 if (instruction
->eops
->next
->next
&&
707 len
> instruction
->eops
->next
->next
->offset
) {
708 len
= instruction
->eops
->next
->next
->offset
;
711 return instruction
->times
* len
;
713 return 0; /* if we're here, there's an error */
716 /* Check to see if we need an address-size prefix */
717 add_asp(instruction
, bits
);
719 for (temp
= nasm_instructions
[instruction
->opcode
]; temp
->opcode
!= -1; temp
++) {
720 int m
= matches(temp
, instruction
, bits
);
722 m
+= jmp_match(segment
, offset
, bits
, instruction
, temp
->code
);
725 /* we've matched an instruction. */
727 const char *codes
= temp
->code
;
730 isize
= calcsize(segment
, offset
, bits
, instruction
, codes
);
733 for (j
= 0; j
< MAXPREFIX
; j
++) {
734 switch (instruction
->prefixes
[j
]) {
760 return isize
* instruction
->times
;
763 return -1; /* didn't match any instruction */
766 /* check that opn[op] is a signed byte of size 16 or 32,
767 and return the signed value*/
768 static int is_sbyte(insn
* ins
, int op
, int size
)
773 ret
= !(ins
->forw_ref
&& ins
->oprs
[op
].opflags
) && /* dead in the water on forward reference or External */
775 !(ins
->oprs
[op
].type
& STRICT
) &&
776 ins
->oprs
[op
].wrt
== NO_SEG
&& ins
->oprs
[op
].segment
== NO_SEG
;
778 v
= ins
->oprs
[op
].offset
;
780 v
= (int16_t)v
; /* sign extend if 16 bits */
782 return ret
&& v
>= -128L && v
<= 127L;
785 static int32_t calcsize(int32_t segment
, int32_t offset
, int bits
,
786 insn
* ins
, const char *codes
)
791 ins
->rex
= 0; /* Ensure REX is reset */
793 if (ins
->prefixes
[PPS_OSIZE
] == P_O64
)
796 (void)segment
; /* Don't warn that this parameter is unused */
797 (void)offset
; /* Don't warn that this parameter is unused */
800 switch (c
= *codes
++) {
804 codes
+= c
, length
+= c
;
817 op_rexflags(&ins
->oprs
[c
- 010], REX_B
|REX_H
|REX_P
|REX_W
);
848 if (ins
->oprs
[c
- 034].type
& (BITS16
| BITS32
| BITS64
))
849 length
+= (ins
->oprs
[c
- 034].type
& BITS16
) ? 2 : 4;
851 length
+= (bits
== 16) ? 2 : 4;
863 length
+= ins
->addr_size
>> 3;
875 length
+= 8; /* MOV reg64/imm */
887 if (ins
->oprs
[c
- 064].type
& (BITS16
| BITS32
| BITS64
))
888 length
+= (ins
->oprs
[c
- 064].type
& BITS16
) ? 2 : 4;
890 length
+= (bits
== 16) ? 2 : 4;
908 length
+= is_sbyte(ins
, c
- 0140, 16) ? 1 : 2;
921 length
+= is_sbyte(ins
, c
- 0150, 32) ? 1 : 4;
936 ins
->drexdst
= regval(&ins
->oprs
[c
& 3]);
943 ins
->rex
|= REX_D
|REX_OC
;
944 ins
->drexdst
= regval(&ins
->oprs
[c
& 3]);
959 length
+= (bits
!= 16) && !has_prefix(ins
, PPS_ASIZE
, P_A16
);
962 length
+= (bits
!= 32) && !has_prefix(ins
, PPS_ASIZE
, P_A32
);
967 if (bits
!= 64 || has_prefix(ins
, PPS_ASIZE
, P_A16
) ||
968 has_prefix(ins
, PPS_ASIZE
, P_A32
))
972 length
+= (bits
!= 16);
975 length
+= (bits
== 16);
1002 if (ins
->oprs
[0].segment
!= NO_SEG
)
1003 errfunc(ERR_NONFATAL
, "attempt to reserve non-constant"
1004 " quantity of BSS space");
1006 length
+= ins
->oprs
[0].offset
<< (c
- 0340);
1022 default: /* can't do it by 'case' statements */
1023 if (c
>= 0100 && c
<= 0277) { /* it's an EA */
1027 ea_data
.rex
= 0; /* Ensure ea.REX is initially 0 */
1030 /* pick rfield from operand b */
1031 rflags
= regflag(&ins
->oprs
[c
& 7]);
1032 rfield
= regvals
[ins
->oprs
[c
& 7].basereg
];
1039 (&ins
->oprs
[(c
>> 3) & 7], &ea_data
, bits
,
1040 ins
->addr_size
, rfield
, rflags
, ins
->forw_ref
)) {
1041 errfunc(ERR_NONFATAL
, "invalid effective address");
1044 ins
->rex
|= ea_data
.rex
;
1045 length
+= ea_data
.size
;
1048 errfunc(ERR_PANIC
, "internal instruction table corrupt"
1049 ": instruction code 0x%02X given", c
);
1052 ins
->rex
&= rex_mask
;
1054 if (ins
->rex
& REX_D
) {
1055 if (ins
->rex
& REX_H
) {
1056 errfunc(ERR_NONFATAL
, "cannot use high register in drex instruction");
1059 if (bits
!= 64 && ((ins
->rex
& (REX_W
|REX_X
|REX_B
)) ||
1060 ins
->drexdst
> 7)) {
1061 errfunc(ERR_NONFATAL
, "invalid operands in non-64-bit mode");
1065 } else if (ins
->rex
& REX_REAL
) {
1066 if (ins
->rex
& REX_H
) {
1067 errfunc(ERR_NONFATAL
, "cannot use high register in rex instruction");
1069 } else if (bits
== 64) {
1071 } else if ((ins
->rex
& REX_L
) &&
1072 !(ins
->rex
& (REX_P
|REX_W
|REX_X
|REX_B
)) &&
1075 assert_no_prefix(ins
, PPS_LREP
);
1078 errfunc(ERR_NONFATAL
, "invalid operands in non-64-bit mode");
1086 #define EMIT_REX() \
1087 if (!(ins->rex & REX_D) && (ins->rex & REX_REAL) && (bits == 64)) { \
1088 ins->rex = (ins->rex & REX_REAL)|REX_P; \
1089 out(offset, segment, &ins->rex, OUT_RAWDATA+1, NO_SEG, NO_SEG); \
1094 static void gencode(int32_t segment
, int32_t offset
, int bits
,
1095 insn
* ins
, const char *codes
, int32_t insn_end
)
1097 static char condval
[] = { /* conditional opcodes */
1098 0x7, 0x3, 0x2, 0x6, 0x2, 0x4, 0xF, 0xD, 0xC, 0xE, 0x6, 0x2,
1099 0x3, 0x7, 0x3, 0x5, 0xE, 0xC, 0xD, 0xF, 0x1, 0xB, 0x9, 0x5,
1100 0x0, 0xA, 0xA, 0xB, 0x8, 0x4
1108 switch (c
= *codes
++) {
1113 out(offset
, segment
, codes
, OUT_RAWDATA
+ c
, NO_SEG
, NO_SEG
);
1120 switch (ins
->oprs
[0].basereg
) {
1122 bytes
[0] = 0x0E + (c
== 0x04 ? 1 : 0);
1125 bytes
[0] = 0x1E + (c
== 0x04 ? 1 : 0);
1128 bytes
[0] = 0x06 + (c
== 0x04 ? 1 : 0);
1131 bytes
[0] = 0x16 + (c
== 0x04 ? 1 : 0);
1135 "bizarre 8086 segment register received");
1137 out(offset
, segment
, bytes
, OUT_RAWDATA
+ 1, NO_SEG
, NO_SEG
);
1143 switch (ins
->oprs
[0].basereg
) {
1145 bytes
[0] = 0xA0 + (c
== 0x05 ? 1 : 0);
1148 bytes
[0] = 0xA8 + (c
== 0x05 ? 1 : 0);
1152 "bizarre 386 segment register received");
1154 out(offset
, segment
, bytes
, OUT_RAWDATA
+ 1, NO_SEG
, NO_SEG
);
1163 bytes
[0] = *codes
++ + ((regval(&ins
->oprs
[c
- 010])) & 7);
1164 out(offset
, segment
, bytes
, OUT_RAWDATA
+ 1, NO_SEG
, NO_SEG
);
1172 if (ins
->oprs
[c
- 014].offset
< -128
1173 || ins
->oprs
[c
- 014].offset
> 127) {
1174 errfunc(ERR_WARNING
, "signed byte value exceeds bounds");
1177 if (ins
->oprs
[c
- 014].segment
!= NO_SEG
) {
1178 data
= ins
->oprs
[c
- 014].offset
;
1179 out(offset
, segment
, &data
, OUT_ADDRESS
+ 1,
1180 ins
->oprs
[c
- 014].segment
, ins
->oprs
[c
- 014].wrt
);
1182 bytes
[0] = ins
->oprs
[c
- 014].offset
;
1183 out(offset
, segment
, bytes
, OUT_RAWDATA
+ 1, NO_SEG
,
1193 if (ins
->oprs
[c
- 020].offset
< -256
1194 || ins
->oprs
[c
- 020].offset
> 255) {
1195 errfunc(ERR_WARNING
, "byte value exceeds bounds");
1197 if (ins
->oprs
[c
- 020].segment
!= NO_SEG
) {
1198 data
= ins
->oprs
[c
- 020].offset
;
1199 out(offset
, segment
, &data
, OUT_ADDRESS
+ 1,
1200 ins
->oprs
[c
- 020].segment
, ins
->oprs
[c
- 020].wrt
);
1202 bytes
[0] = ins
->oprs
[c
- 020].offset
;
1203 out(offset
, segment
, bytes
, OUT_RAWDATA
+ 1, NO_SEG
,
1213 if (ins
->oprs
[c
- 024].offset
< 0
1214 || ins
->oprs
[c
- 024].offset
> 255)
1215 errfunc(ERR_WARNING
, "unsigned byte value exceeds bounds");
1216 if (ins
->oprs
[c
- 024].segment
!= NO_SEG
) {
1217 data
= ins
->oprs
[c
- 024].offset
;
1218 out(offset
, segment
, &data
, OUT_ADDRESS
+ 1,
1219 ins
->oprs
[c
- 024].segment
, ins
->oprs
[c
- 024].wrt
);
1221 bytes
[0] = ins
->oprs
[c
- 024].offset
;
1222 out(offset
, segment
, bytes
, OUT_RAWDATA
+ 1, NO_SEG
,
1232 data
= ins
->oprs
[c
- 030].offset
;
1233 if (ins
->oprs
[c
- 030].segment
== NO_SEG
&&
1234 ins
->oprs
[c
- 030].wrt
== NO_SEG
)
1235 warn_overflow(2, data
);
1236 out(offset
, segment
, &data
, OUT_ADDRESS
+ 2,
1237 ins
->oprs
[c
- 030].segment
, ins
->oprs
[c
- 030].wrt
);
1245 if (ins
->oprs
[c
- 034].type
& (BITS16
| BITS32
))
1246 size
= (ins
->oprs
[c
- 034].type
& BITS16
) ? 2 : 4;
1248 size
= (bits
== 16) ? 2 : 4;
1249 data
= ins
->oprs
[c
- 034].offset
;
1250 warn_overflow(size
, data
);
1251 out(offset
, segment
, &data
, OUT_ADDRESS
+ size
,
1252 ins
->oprs
[c
- 034].segment
, ins
->oprs
[c
- 034].wrt
);
1260 data
= ins
->oprs
[c
- 040].offset
;
1261 out(offset
, segment
, &data
, OUT_ADDRESS
+ 4,
1262 ins
->oprs
[c
- 040].segment
, ins
->oprs
[c
- 040].wrt
);
1270 data
= ins
->oprs
[c
- 044].offset
;
1271 size
= ins
->addr_size
>> 3;
1272 warn_overflow(size
, data
);
1273 out(offset
, segment
, &data
, OUT_ADDRESS
+ size
,
1274 ins
->oprs
[c
- 044].segment
, ins
->oprs
[c
- 044].wrt
);
1282 if (ins
->oprs
[c
- 050].segment
!= segment
)
1283 errfunc(ERR_NONFATAL
,
1284 "short relative jump outside segment");
1285 data
= ins
->oprs
[c
- 050].offset
- insn_end
;
1286 if (data
> 127 || data
< -128)
1287 errfunc(ERR_NONFATAL
, "short jump is out of range");
1289 out(offset
, segment
, bytes
, OUT_RAWDATA
+ 1, NO_SEG
, NO_SEG
);
1297 data
= (int64_t)ins
->oprs
[c
- 054].offset
;
1298 out(offset
, segment
, &data
, OUT_ADDRESS
+ 8,
1299 ins
->oprs
[c
- 054].segment
, ins
->oprs
[c
- 054].wrt
);
1307 if (ins
->oprs
[c
- 060].segment
!= segment
) {
1308 data
= ins
->oprs
[c
- 060].offset
;
1309 out(offset
, segment
, &data
,
1310 OUT_REL2ADR
+ insn_end
- offset
,
1311 ins
->oprs
[c
- 060].segment
, ins
->oprs
[c
- 060].wrt
);
1313 data
= ins
->oprs
[c
- 060].offset
- insn_end
;
1314 out(offset
, segment
, &data
,
1315 OUT_ADDRESS
+ 2, NO_SEG
, NO_SEG
);
1324 if (ins
->oprs
[c
- 064].type
& (BITS16
| BITS32
| BITS64
))
1325 size
= (ins
->oprs
[c
- 064].type
& BITS16
) ? 2 : 4;
1327 size
= (bits
== 16) ? 2 : 4;
1328 if (ins
->oprs
[c
- 064].segment
!= segment
) {
1329 int32_t reltype
= (size
== 2 ? OUT_REL2ADR
: OUT_REL4ADR
);
1330 data
= ins
->oprs
[c
- 064].offset
;
1331 out(offset
, segment
, &data
, reltype
+ insn_end
- offset
,
1332 ins
->oprs
[c
- 064].segment
, ins
->oprs
[c
- 064].wrt
);
1334 data
= ins
->oprs
[c
- 064].offset
- insn_end
;
1335 out(offset
, segment
, &data
,
1336 OUT_ADDRESS
+ size
, NO_SEG
, NO_SEG
);
1345 if (ins
->oprs
[c
- 070].segment
!= segment
) {
1346 data
= ins
->oprs
[c
- 070].offset
;
1347 out(offset
, segment
, &data
,
1348 OUT_REL4ADR
+ insn_end
- offset
,
1349 ins
->oprs
[c
- 070].segment
, ins
->oprs
[c
- 070].wrt
);
1351 data
= ins
->oprs
[c
- 070].offset
- insn_end
;
1352 out(offset
, segment
, &data
,
1353 OUT_ADDRESS
+ 4, NO_SEG
, NO_SEG
);
1362 if (ins
->oprs
[c
- 074].segment
== NO_SEG
)
1363 errfunc(ERR_NONFATAL
, "value referenced by FAR is not"
1366 out(offset
, segment
, &data
, OUT_ADDRESS
+ 2,
1367 outfmt
->segbase(1 + ins
->oprs
[c
- 074].segment
),
1368 ins
->oprs
[c
- 074].wrt
);
1376 data
= ins
->oprs
[c
- 0140].offset
;
1377 if (is_sbyte(ins
, c
- 0140, 16)) {
1379 out(offset
, segment
, bytes
, OUT_RAWDATA
+ 1, NO_SEG
,
1383 if (ins
->oprs
[c
- 0140].segment
== NO_SEG
&&
1384 ins
->oprs
[c
- 0140].wrt
== NO_SEG
)
1385 warn_overflow(2, data
);
1386 out(offset
, segment
, &data
, OUT_ADDRESS
+ 2,
1387 ins
->oprs
[c
- 0140].segment
, ins
->oprs
[c
- 0140].wrt
);
1398 bytes
[0] = *codes
++;
1399 if (is_sbyte(ins
, c
- 0144, 16))
1400 bytes
[0] |= 2; /* s-bit */
1401 out(offset
, segment
, bytes
, OUT_RAWDATA
+ 1, NO_SEG
, NO_SEG
);
1409 data
= ins
->oprs
[c
- 0150].offset
;
1410 if (is_sbyte(ins
, c
- 0150, 32)) {
1412 out(offset
, segment
, bytes
, OUT_RAWDATA
+ 1, NO_SEG
,
1416 out(offset
, segment
, &data
, OUT_ADDRESS
+ 4,
1417 ins
->oprs
[c
- 0150].segment
, ins
->oprs
[c
- 0150].wrt
);
1428 bytes
[0] = *codes
++;
1429 if (is_sbyte(ins
, c
- 0154, 32))
1430 bytes
[0] |= 2; /* s-bit */
1431 out(offset
, segment
, bytes
, OUT_RAWDATA
+ 1, NO_SEG
, NO_SEG
);
1448 out(offset
, segment
, bytes
, OUT_RAWDATA
+ 1, NO_SEG
, NO_SEG
);
1454 (ins
->drexdst
<< 4) |
1455 (ins
->rex
& REX_OC
? 0x08 : 0) |
1456 (ins
->rex
& (REX_R
|REX_X
|REX_B
));
1458 out(offset
, segment
, bytes
, OUT_RAWDATA
+ 1, NO_SEG
, NO_SEG
);
1469 if (bits
== 32 && !has_prefix(ins
, PPS_ASIZE
, P_A16
)) {
1471 out(offset
, segment
, bytes
,
1472 OUT_RAWDATA
+ 1, NO_SEG
, NO_SEG
);
1479 if (bits
!= 32 && !has_prefix(ins
, PPS_ASIZE
, P_A32
)) {
1481 out(offset
, segment
, bytes
,
1482 OUT_RAWDATA
+ 1, NO_SEG
, NO_SEG
);
1498 out(offset
, segment
, bytes
,
1499 OUT_RAWDATA
+ 1, NO_SEG
, NO_SEG
);
1508 out(offset
, segment
, bytes
,
1509 OUT_RAWDATA
+ 1, NO_SEG
, NO_SEG
);
1524 *bytes
= *codes
++ ^ condval
[ins
->condition
];
1525 out(offset
, segment
, bytes
, OUT_RAWDATA
+ 1, NO_SEG
, NO_SEG
);
1534 *bytes
= c
- 0332 + 0xF2;
1535 out(offset
, segment
, bytes
, OUT_RAWDATA
+ 1, NO_SEG
, NO_SEG
);
1540 if (ins
->rex
& REX_R
) {
1542 out(offset
, segment
, bytes
, OUT_RAWDATA
+ 1, NO_SEG
, NO_SEG
);
1545 ins
->rex
&= ~(REX_L
|REX_R
);
1554 if (ins
->oprs
[0].segment
!= NO_SEG
)
1555 errfunc(ERR_PANIC
, "non-constant BSS size in pass two");
1557 int32_t size
= ins
->oprs
[0].offset
<< (c
- 0340);
1559 out(offset
, segment
, NULL
,
1560 OUT_RESERVE
+ size
, NO_SEG
, NO_SEG
);
1571 *bytes
= c
- 0366 + 0x66;
1572 out(offset
, segment
, bytes
, OUT_RAWDATA
+ 1, NO_SEG
, NO_SEG
);
1582 *bytes
= bits
== 16 ? 3 : 5;
1583 out(offset
, segment
, bytes
, OUT_RAWDATA
+ 1, NO_SEG
, NO_SEG
);
1587 default: /* can't do it by 'case' statements */
1588 if (c
>= 0100 && c
<= 0277) { /* it's an EA */
1596 /* pick rfield from operand b */
1597 rflags
= regflag(&ins
->oprs
[c
& 7]);
1598 rfield
= regvals
[ins
->oprs
[c
& 7].basereg
];
1600 /* rfield is constant */
1606 (&ins
->oprs
[(c
>> 3) & 7], &ea_data
, bits
,
1607 ins
->addr_size
, rfield
, rflags
, ins
->forw_ref
)) {
1608 errfunc(ERR_NONFATAL
, "invalid effective address");
1612 *p
++ = ea_data
.modrm
;
1613 if (ea_data
.sib_present
)
1616 /* DREX suffixes come between the SIB and the displacement */
1617 if (ins
->rex
& REX_D
) {
1619 (ins
->drexdst
<< 4) |
1620 (ins
->rex
& REX_OC
? 0x08 : 0) |
1621 (ins
->rex
& (REX_R
|REX_X
|REX_B
));
1626 out(offset
, segment
, bytes
, OUT_RAWDATA
+ s
,
1629 switch (ea_data
.bytes
) {
1633 if (ins
->oprs
[(c
>> 3) & 7].segment
!= NO_SEG
) {
1634 data
= ins
->oprs
[(c
>> 3) & 7].offset
;
1635 out(offset
, segment
, &data
, OUT_ADDRESS
+ 1,
1636 ins
->oprs
[(c
>> 3) & 7].segment
,
1637 ins
->oprs
[(c
>> 3) & 7].wrt
);
1639 *bytes
= ins
->oprs
[(c
>> 3) & 7].offset
;
1640 out(offset
, segment
, bytes
, OUT_RAWDATA
+ 1,
1648 data
= ins
->oprs
[(c
>> 3) & 7].offset
;
1649 out(offset
, segment
, &data
,
1650 (ea_data
.rip
? OUT_REL4ADR
: OUT_ADDRESS
)
1652 ins
->oprs
[(c
>> 3) & 7].segment
,
1653 ins
->oprs
[(c
>> 3) & 7].wrt
);
1659 errfunc(ERR_PANIC
, "internal instruction table corrupt"
1660 ": instruction code 0x%02X given", c
);
1664 static int32_t regflag(const operand
* o
)
1666 if (o
->basereg
< EXPR_REG_START
|| o
->basereg
>= REG_ENUM_LIMIT
) {
1667 errfunc(ERR_PANIC
, "invalid operand passed to regflag()");
1669 return reg_flags
[o
->basereg
];
1672 static int32_t regval(const operand
* o
)
1674 if (o
->basereg
< EXPR_REG_START
|| o
->basereg
>= REG_ENUM_LIMIT
) {
1675 errfunc(ERR_PANIC
, "invalid operand passed to regval()");
1677 return regvals
[o
->basereg
];
1680 static int op_rexflags(const operand
* o
, int mask
)
1685 if (o
->basereg
< EXPR_REG_START
|| o
->basereg
>= REG_ENUM_LIMIT
) {
1686 errfunc(ERR_PANIC
, "invalid operand passed to op_rexflags()");
1689 flags
= reg_flags
[o
->basereg
];
1690 val
= regvals
[o
->basereg
];
1692 return rexflags(val
, flags
, mask
);
1695 static int rexflags(int val
, int32_t flags
, int mask
)
1700 rex
|= REX_B
|REX_X
|REX_R
;
1703 if (!(REG_HIGH
& ~flags
)) /* AH, CH, DH, BH */
1705 else if (!(REG8
& ~flags
) && val
>= 4) /* SPL, BPL, SIL, DIL */
1711 static int matches(const struct itemplate
*itemp
, insn
* instruction
, int bits
)
1713 int i
, size
[MAX_OPERANDS
], asize
, oprs
, ret
;
1720 if (itemp
->opcode
!= instruction
->opcode
)
1724 * Count the operands
1726 if (itemp
->operands
!= instruction
->operands
)
1730 * Check that no spurious colons or TOs are present
1732 for (i
= 0; i
< itemp
->operands
; i
++)
1733 if (instruction
->oprs
[i
].type
& ~itemp
->opd
[i
] & (COLON
| TO
))
1737 * Check that the operand flags all match up
1739 for (i
= 0; i
< itemp
->operands
; i
++) {
1740 if (itemp
->opd
[i
] & SAME_AS
) {
1741 int j
= itemp
->opd
[i
] & ~SAME_AS
;
1742 if (instruction
->oprs
[i
].type
!= instruction
->oprs
[j
].type
||
1743 instruction
->oprs
[i
].basereg
!= instruction
->oprs
[j
].basereg
)
1745 } else if (itemp
->opd
[i
] & ~instruction
->oprs
[i
].type
||
1746 ((itemp
->opd
[i
] & SIZE_MASK
) &&
1747 ((itemp
->opd
[i
] ^ instruction
->oprs
[i
].type
) & SIZE_MASK
))) {
1748 if ((itemp
->opd
[i
] & ~instruction
->oprs
[i
].type
& ~SIZE_MASK
) ||
1749 (instruction
->oprs
[i
].type
& SIZE_MASK
))
1757 * Check operand sizes
1759 if (itemp
->flags
& IF_ARMASK
) {
1760 memset(size
, 0, sizeof size
);
1762 switch (itemp
->flags
& IF_ARMASK
) {
1776 break; /* Shouldn't happen */
1778 switch (itemp
->flags
& IF_SMASK
) {
1799 switch (itemp
->flags
& IF_SMASK
) {
1802 oprs
= itemp
->operands
;
1806 oprs
= itemp
->operands
;
1810 oprs
= itemp
->operands
;
1814 oprs
= itemp
->operands
;
1818 oprs
= itemp
->operands
;
1823 for (i
= 0; i
< MAX_OPERANDS
; i
++)
1827 if (itemp
->flags
& (IF_SM
| IF_SM2
)) {
1828 oprs
= (itemp
->flags
& IF_SM2
? 2 : itemp
->operands
);
1830 for (i
= 0; i
< oprs
; i
++) {
1831 if ((asize
= itemp
->opd
[i
] & SIZE_MASK
) != 0) {
1833 for (j
= 0; j
< oprs
; j
++)
1839 oprs
= itemp
->operands
;
1842 for (i
= 0; i
< itemp
->operands
; i
++) {
1843 if (!(itemp
->opd
[i
] & SIZE_MASK
) &&
1844 (instruction
->oprs
[i
].type
& SIZE_MASK
& ~size
[i
]))
1849 * Check template is okay at the set cpu level
1851 if (((itemp
->flags
& IF_PLEVEL
) > cpu
))
1855 * Check if instruction is available in long mode
1857 if ((itemp
->flags
& IF_NOLONG
) && (bits
== 64))
1861 * Check if special handling needed for Jumps
1863 if ((uint8_t)(itemp
->code
[0]) >= 0370)
1869 static ea
*process_ea(operand
* input
, ea
* output
, int bits
,
1870 int addrbits
, int rfield
, int32_t rflags
, int forw_ref
)
1872 output
->rip
= false;
1874 /* REX flags for the rfield operand */
1875 output
->rex
|= rexflags(rfield
, rflags
, REX_R
|REX_P
|REX_W
|REX_H
);
1877 if (!(REGISTER
& ~input
->type
)) { /* register direct */
1881 if (input
->basereg
< EXPR_REG_START
/* Verify as Register */
1882 || input
->basereg
>= REG_ENUM_LIMIT
)
1885 i
= regvals
[input
->basereg
];
1888 return NULL
; /* Invalid EA register */
1890 output
->rex
|= op_rexflags(input
, REX_B
|REX_P
|REX_W
|REX_H
);
1892 output
->sib_present
= false; /* no SIB necessary */
1893 output
->bytes
= 0; /* no offset necessary either */
1894 output
->modrm
= 0xC0 | ((rfield
& 7) << 3) | (i
& 7);
1895 } else { /* it's a memory reference */
1896 if (input
->basereg
== -1
1897 && (input
->indexreg
== -1 || input
->scale
== 0)) {
1898 /* it's a pure offset */
1899 if (bits
== 64 && (~input
->type
& IP_REL
)) {
1900 int scale
, index
, base
;
1901 output
->sib_present
= true;
1905 output
->sib
= (scale
<< 6) | (index
<< 3) | base
;
1907 output
->modrm
= 4 | ((rfield
& 7) << 3);
1908 output
->rip
= false;
1910 output
->sib_present
= false;
1911 output
->bytes
= (addrbits
!= 16 ? 4 : 2);
1912 output
->modrm
= (addrbits
!= 16 ? 5 : 6) | ((rfield
& 7) << 3);
1913 output
->rip
= bits
== 64;
1915 } else { /* it's an indirection */
1916 int i
= input
->indexreg
, b
= input
->basereg
, s
= input
->scale
;
1917 int32_t o
= input
->offset
, seg
= input
->segment
;
1918 int hb
= input
->hintbase
, ht
= input
->hinttype
;
1921 int32_t ix
, bx
; /* register flags */
1924 i
= -1; /* make this easy, at least */
1926 if (i
>= EXPR_REG_START
&& i
< REG_ENUM_LIMIT
) {
1934 if (b
!= -1 && b
>= EXPR_REG_START
&& b
< REG_ENUM_LIMIT
) {
1942 /* check for a 32/64-bit memory reference... */
1943 if ((ix
|bx
) & (BITS32
|BITS64
)) {
1944 /* it must be a 32/64-bit memory reference. Firstly we have
1945 * to check that all registers involved are type E/Rxx. */
1946 int32_t sok
= BITS32
|BITS64
;
1949 if (!(REG64
& ~ix
) || !(REG32
& ~ix
))
1957 return NULL
; /* Invalid register */
1958 if (~sok
& bx
& SIZE_MASK
)
1959 return NULL
; /* Invalid size */
1963 /* While we're here, ensure the user didn't specify
1965 if (input
->disp_size
== 16 || input
->disp_size
== 64)
1968 if (addrbits
== 16 ||
1969 (addrbits
== 32 && !(sok
& BITS32
)) ||
1970 (addrbits
== 64 && !(sok
& BITS64
)))
1973 /* now reorganize base/index */
1974 if (s
== 1 && bt
!= it
&& bt
!= -1 && it
!= -1 &&
1975 ((hb
== b
&& ht
== EAH_NOTBASE
)
1976 || (hb
== i
&& ht
== EAH_MAKEBASE
))) {
1977 /* swap if hints say so */
1978 t
= bt
, bt
= it
, it
= t
;
1979 t
= bx
, bx
= ix
, ix
= t
;
1981 if (bt
== it
) /* convert EAX+2*EAX to 3*EAX */
1982 bt
= -1, bx
= 0, s
++;
1983 if (bt
== -1 && s
== 1 && !(hb
== it
&& ht
== EAH_NOTBASE
)) {
1984 /* make single reg base, unless hint */
1985 bt
= it
, bx
= ix
, it
= -1, ix
= 0;
1987 if (((s
== 2 && it
!= REG_NUM_ESP
1988 && !(input
->eaflags
& EAF_TIMESTWO
)) || s
== 3
1989 || s
== 5 || s
== 9) && bt
== -1)
1990 bt
= it
, bx
= ix
, s
--; /* convert 3*EAX to EAX+2*EAX */
1991 if (it
== -1 && (bt
& 7) != REG_NUM_ESP
1992 && (input
->eaflags
& EAF_TIMESTWO
))
1993 it
= bt
, ix
= bx
, bt
= -1, bx
= 0, s
= 1;
1994 /* convert [NOSPLIT EAX] to sib format with 0x0 displacement */
1995 if (s
== 1 && it
== REG_NUM_ESP
) {
1996 /* swap ESP into base if scale is 1 */
1997 t
= it
, it
= bt
, bt
= t
;
1998 t
= ix
, ix
= bx
, bx
= t
;
2000 if (it
== REG_NUM_ESP
2001 || (s
!= 1 && s
!= 2 && s
!= 4 && s
!= 8 && it
!= -1))
2002 return NULL
; /* wrong, for various reasons */
2004 output
->rex
|= rexflags(it
, ix
, REX_X
);
2005 output
->rex
|= rexflags(bt
, bx
, REX_B
);
2007 if (it
== -1 && (bt
& 7) != REG_NUM_ESP
) {
2016 if (rm
!= REG_NUM_EBP
&& o
== 0 &&
2017 seg
== NO_SEG
&& !forw_ref
&&
2019 (EAF_BYTEOFFS
| EAF_WORDOFFS
)))
2021 else if (input
->eaflags
& EAF_BYTEOFFS
||
2022 (o
>= -128 && o
<= 127 && seg
== NO_SEG
2024 && !(input
->eaflags
& EAF_WORDOFFS
)))
2030 output
->sib_present
= false;
2031 output
->bytes
= (bt
== -1 || mod
== 2 ? 4 : mod
);
2032 output
->modrm
= (mod
<< 6) | ((rfield
& 7) << 3) | rm
;
2035 int mod
, scale
, index
, base
;
2055 default: /* then what the smeg is it? */
2056 return NULL
; /* panic */
2064 if (base
!= REG_NUM_EBP
&& o
== 0 &&
2065 seg
== NO_SEG
&& !forw_ref
&&
2067 (EAF_BYTEOFFS
| EAF_WORDOFFS
)))
2069 else if (input
->eaflags
& EAF_BYTEOFFS
||
2070 (o
>= -128 && o
<= 127 && seg
== NO_SEG
2072 && !(input
->eaflags
& EAF_WORDOFFS
)))
2078 output
->sib_present
= true;
2079 output
->bytes
= (bt
== -1 || mod
== 2 ? 4 : mod
);
2080 output
->modrm
= (mod
<< 6) | ((rfield
& 7) << 3) | 4;
2081 output
->sib
= (scale
<< 6) | (index
<< 3) | base
;
2083 } else { /* it's 16-bit */
2086 /* check for 64-bit long mode */
2090 /* check all registers are BX, BP, SI or DI */
2091 if ((b
!= -1 && b
!= R_BP
&& b
!= R_BX
&& b
!= R_SI
2092 && b
!= R_DI
) || (i
!= -1 && i
!= R_BP
&& i
!= R_BX
2093 && i
!= R_SI
&& i
!= R_DI
))
2096 /* ensure the user didn't specify DWORD/QWORD */
2097 if (input
->disp_size
== 32 || input
->disp_size
== 64)
2100 if (s
!= 1 && i
!= -1)
2101 return NULL
; /* no can do, in 16-bit EA */
2102 if (b
== -1 && i
!= -1) {
2107 if ((b
== R_SI
|| b
== R_DI
) && i
!= -1) {
2112 /* have BX/BP as base, SI/DI index */
2114 return NULL
; /* shouldn't ever happen, in theory */
2115 if (i
!= -1 && b
!= -1 &&
2116 (i
== R_BP
|| i
== R_BX
|| b
== R_SI
|| b
== R_DI
))
2117 return NULL
; /* invalid combinations */
2118 if (b
== -1) /* pure offset: handled above */
2119 return NULL
; /* so if it gets to here, panic! */
2123 switch (i
* 256 + b
) {
2124 case R_SI
* 256 + R_BX
:
2127 case R_DI
* 256 + R_BX
:
2130 case R_SI
* 256 + R_BP
:
2133 case R_DI
* 256 + R_BP
:
2151 if (rm
== -1) /* can't happen, in theory */
2152 return NULL
; /* so panic if it does */
2154 if (o
== 0 && seg
== NO_SEG
&& !forw_ref
&& rm
!= 6 &&
2155 !(input
->eaflags
& (EAF_BYTEOFFS
| EAF_WORDOFFS
)))
2157 else if (input
->eaflags
& EAF_BYTEOFFS
||
2158 (o
>= -128 && o
<= 127 && seg
== NO_SEG
2160 && !(input
->eaflags
& EAF_WORDOFFS
)))
2165 output
->sib_present
= false; /* no SIB - it's 16-bit */
2166 output
->bytes
= mod
; /* bytes of offset needed */
2167 output
->modrm
= (mod
<< 6) | ((rfield
& 7) << 3) | rm
;
2172 output
->size
= 1 + output
->sib_present
+ output
->bytes
;
2176 static void add_asp(insn
*ins
, int addrbits
)
2181 valid
= (addrbits
== 64) ? 64|32 : 32|16;
2183 switch (ins
->prefixes
[PPS_ASIZE
]) {
2194 valid
&= (addrbits
== 32) ? 16 : 32;
2200 for (j
= 0; j
< ins
->operands
; j
++) {
2201 if (!(MEMORY
& ~ins
->oprs
[j
].type
)) {
2204 /* Verify as Register */
2205 if (ins
->oprs
[j
].indexreg
< EXPR_REG_START
2206 || ins
->oprs
[j
].indexreg
>= REG_ENUM_LIMIT
)
2209 i
= reg_flags
[ins
->oprs
[j
].indexreg
];
2211 /* Verify as Register */
2212 if (ins
->oprs
[j
].basereg
< EXPR_REG_START
2213 || ins
->oprs
[j
].basereg
>= REG_ENUM_LIMIT
)
2216 b
= reg_flags
[ins
->oprs
[j
].basereg
];
2218 if (ins
->oprs
[j
].scale
== 0)
2222 int ds
= ins
->oprs
[j
].disp_size
;
2223 if ((addrbits
!= 64 && ds
> 8) ||
2224 (addrbits
== 64 && ds
== 16))
2244 if (valid
& addrbits
) {
2245 ins
->addr_size
= addrbits
;
2246 } else if (valid
& ((addrbits
== 32) ? 16 : 32)) {
2247 /* Add an address size prefix */
2248 enum prefixes pref
= (addrbits
== 32) ? P_A16
: P_A32
;
2249 ins
->prefixes
[PPS_ASIZE
] = pref
;
2250 ins
->addr_size
= (addrbits
== 32) ? 16 : 32;
2253 errfunc(ERR_NONFATAL
, "impossible combination of address sizes");
2254 ins
->addr_size
= addrbits
; /* Error recovery */
2257 defdisp
= ins
->addr_size
== 16 ? 16 : 32;
2259 for (j
= 0; j
< ins
->operands
; j
++) {
2260 if (!(MEM_OFFS
& ~ins
->oprs
[j
].type
) &&
2261 (ins
->oprs
[j
].disp_size
? ins
->oprs
[j
].disp_size
: defdisp
)
2262 != ins
->addr_size
) {
2263 /* mem_offs sizes must match the address size; if not,
2264 strip the MEM_OFFS bit and match only EA instructions */
2265 ins
->oprs
[j
].type
&= ~(MEM_OFFS
& ~MEMORY
);