1 /* assemble.c code generation for the Netwide Assembler
3 * The Netwide Assembler is copyright (C) 1996 Simon Tatham and
4 * Julian Hall. All rights reserved. The software is
5 * redistributable under the license given in the file "LICENSE"
6 * distributed in the NASM archive.
8 * the actual codes (C syntax, i.e. octal):
9 * \0 - terminates the code. (Unless it's a literal of course.)
10 * \1..\4 - that many literal bytes follow in the code stream
11 * \5 - add 4 to the primary operand number (b, low octdigit)
12 * \6 - add 4 to the secondary operand number (a, middle octdigit)
13 * \7 - add 4 to both the primary and the secondary operand number
14 * \10..\13 - a literal byte follows in the code stream, to be added
15 * to the register value of operand 0..3
16 * \14..\17 - a signed byte immediate operand, from operand 0..3
17 * \20..\23 - a byte immediate operand, from operand 0..3
18 * \24..\27 - an unsigned byte immediate operand, from operand 0..3
19 * \30..\33 - a word immediate operand, from operand 0..3
20 * \34..\37 - select between \3[0-3] and \4[0-3] depending on 16/32 bit
21 * assembly mode or the operand-size override on the operand
22 * \40..\43 - a long immediate operand, from operand 0..3
23 * \44..\47 - select between \3[0-3], \4[0-3] and \5[4-7]
24 * depending on the address size of the instruction.
25 * \50..\53 - a byte relative operand, from operand 0..3
26 * \54..\57 - a qword immediate operand, from operand 0..3
27 * \60..\63 - a word relative operand, from operand 0..3
28 * \64..\67 - select between \6[0-3] and \7[0-3] depending on 16/32 bit
29 * assembly mode or the operand-size override on the operand
30 * \70..\73 - a long relative operand, from operand 0..3
31 * \74..\77 - a word constant, from the _segment_ part of operand 0..3
32 * \1ab - a ModRM, calculated on EA in operand a, with the spare
33 * field the register value of operand b.
34 * \140..\143 - an immediate word or signed byte for operand 0..3
35 * \144..\147 - or 2 (s-field) into opcode byte if operand 0..3
36 * is a signed byte rather than a word. Opcode byte follows.
37 * \150..\153 - an immediate dword or signed byte for operand 0..3
38 * \154..\157 - or 2 (s-field) into opcode byte if operand 0..3
39 * is a signed byte rather than a dword. Opcode byte follows.
40 * \160..\163 - this instruction uses DREX rather than REX, with the
41 * OC0 field set to 0, and the dest field taken from
43 * \164..\167 - this instruction uses DREX rather than REX, with the
44 * OC0 field set to 1, and the dest field taken from
46 * \171 - placement of DREX suffix in the absence of an EA
47 * \172\ab - the register number from operand a in bits 7..4, with
48 * the 4-bit immediate from operand b in bits 3..0.
49 * \173\xab - the register number from operand a in bits 7..4, with
50 * the value b in bits 3..0.
51 * \174\a - the register number from operand a in bits 7..4, and
52 * an arbitrary value in bits 3..0 (assembled as zero.)
53 * \2ab - a ModRM, calculated on EA in operand a, with the spare
54 * field equal to digit b.
55 * \250..\253 - same as \150..\153, except warn if the 64-bit operand
56 * is not equal to the truncated and sign-extended 32-bit
57 * operand; used for 32-bit immediates in 64-bit mode.
58 * \254..\257 - a signed 32-bit operand to be extended to 64 bits.
59 * \260..\263 - this instruction uses VEX/XOP rather than REX, with the
60 * V field taken from operand 0..3.
61 * \270 - this instruction uses VEX/XOP rather than REX, with the
62 * V field set to 1111b.
64 * VEX/XOP prefixes are followed by the sequence:
65 * \tmm\wlp where mm is the M field; and wlp is:
67 * [w0] ww = 0 for W = 0
68 * [w1] ww = 1 for W = 1
69 * [wx] ww = 2 for W don't care (always assembled as 0)
70 * [ww] ww = 3 for W used as REX.W
72 * t = 0 for VEX (C4/C5), t = 1 for XOP (8F).
74 * \274..\277 - a signed byte immediate operand, from operand 0..3,
75 * which is to be extended to the operand size.
76 * \310 - indicates fixed 16-bit address size, i.e. optional 0x67.
77 * \311 - indicates fixed 32-bit address size, i.e. optional 0x67.
78 * \312 - (disassembler only) marker on LOOP, LOOPxx instructions.
79 * \313 - indicates fixed 64-bit address size, 0x67 invalid.
80 * \314 - (disassembler only) invalid with REX.B
81 * \315 - (disassembler only) invalid with REX.X
82 * \316 - (disassembler only) invalid with REX.R
83 * \317 - (disassembler only) invalid with REX.W
84 * \320 - indicates fixed 16-bit operand size, i.e. optional 0x66.
85 * \321 - indicates fixed 32-bit operand size, i.e. optional 0x66.
86 * \322 - indicates that this instruction is only valid when the
87 * operand size is the default (instruction to disassembler,
88 * generates no code in the assembler)
89 * \323 - indicates fixed 64-bit operand size, REX on extensions only.
90 * \324 - indicates 64-bit operand size requiring REX prefix.
91 * \330 - a literal byte follows in the code stream, to be added
92 * to the condition code value of the instruction.
93 * \331 - instruction not valid with REP prefix. Hint for
94 * disassembler only; for SSE instructions.
95 * \332 - REP prefix (0xF2 byte) used as opcode extension.
96 * \333 - REP prefix (0xF3 byte) used as opcode extension.
97 * \334 - LOCK prefix used instead of REX.R
98 * \335 - disassemble a rep (0xF3 byte) prefix as repe not rep.
99 * \336 - force a REP(E) prefix (0xF2) even if not specified.
100 * \337 - force a REPNE prefix (0xF3) even if not specified.
101 * \336-\337 are still listed as prefixes in the disassembler.
102 * \340 - reserve <operand 0> bytes of uninitialized storage.
103 * Operand 0 had better be a segmentless constant.
104 * \341 - this instruction needs a WAIT "prefix"
105 * \344,\345 - the PUSH/POP (respectively) codes for CS, DS, ES, SS
106 * (POP is never used for CS) depending on operand 0
107 * \346,\347 - the second byte of PUSH/POP codes for FS, GS, depending
109 * \360 - no SSE prefix (== \364\331)
110 * \361 - 66 SSE prefix (== \366\331)
111 * \362 - F2 SSE prefix (== \364\332)
112 * \363 - F3 SSE prefix (== \364\333)
113 * \364 - operand-size prefix (0x66) not permitted
114 * \365 - address-size prefix (0x67) not permitted
115 * \366 - operand-size prefix (0x66) used as opcode extension
116 * \367 - address-size prefix (0x67) used as opcode extension
117 * \370,\371,\372 - match only if operand 0 meets byte jump criteria.
118 * 370 is used for Jcc, 371 is used for JMP.
119 * \373 - assemble 0x03 if bits==16, 0x05 if bits==32;
120 * used for conditional jump over longer jump
123 #include "compiler.h"
127 #include <inttypes.h>
131 #include "assemble.h"
136 int sib_present
; /* is a SIB byte necessary? */
137 int bytes
; /* # of bytes of offset needed */
138 int size
; /* lazy - this is sib+bytes+1 */
139 uint8_t modrm
, sib
, rex
, rip
; /* the bytes themselves */
142 static uint32_t cpu
; /* cpu level received from nasm.c */
143 static efunc errfunc
;
144 static struct ofmt
*outfmt
;
145 static ListGen
*list
;
147 static int64_t calcsize(int32_t, int64_t, int, insn
*, const uint8_t *);
148 static void gencode(int32_t segment
, int64_t offset
, int bits
,
149 insn
* ins
, const struct itemplate
*temp
,
151 static int matches(const struct itemplate
*, insn
*, int bits
);
152 static int32_t regflag(const operand
*);
153 static int32_t regval(const operand
*);
154 static int rexflags(int, int32_t, int);
155 static int op_rexflags(const operand
*, int);
156 static ea
*process_ea(operand
*, ea
*, int, int, int, int32_t);
157 static void add_asp(insn
*, int);
159 static int has_prefix(insn
* ins
, enum prefix_pos pos
, enum prefixes prefix
)
161 return ins
->prefixes
[pos
] == prefix
;
164 static void assert_no_prefix(insn
* ins
, enum prefix_pos pos
)
166 if (ins
->prefixes
[pos
])
167 errfunc(ERR_NONFATAL
, "invalid %s prefix",
168 prefix_name(ins
->prefixes
[pos
]));
171 static const char *size_name(int size
)
193 static void warn_overflow(int size
, const struct operand
*o
)
195 if (size
< 8 && o
->wrt
== NO_SEG
&& o
->segment
== NO_SEG
) {
196 int64_t lim
= ((int64_t)1 << (size
*8))-1;
197 int64_t data
= o
->offset
;
199 if (data
< ~lim
|| data
> lim
)
200 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
201 "%s data exceeds bounds", size_name(size
));
205 * This routine wrappers the real output format's output routine,
206 * in order to pass a copy of the data off to the listing file
207 * generator at the same time.
209 static void out(int64_t offset
, int32_t segto
, const void *data
,
210 enum out_type type
, uint64_t size
,
211 int32_t segment
, int32_t wrt
)
213 static int32_t lineno
= 0; /* static!!! */
214 static char *lnfname
= NULL
;
217 if (type
== OUT_ADDRESS
&& segment
== NO_SEG
&& wrt
== NO_SEG
) {
219 * This is a non-relocated address, and we're going to
220 * convert it into RAWDATA format.
225 errfunc(ERR_PANIC
, "OUT_ADDRESS with size > 8");
229 WRITEADDR(q
, *(int64_t *)data
, size
);
234 list
->output(offset
, data
, type
, size
);
237 * this call to src_get determines when we call the
238 * debug-format-specific "linenum" function
239 * it updates lineno and lnfname to the current values
240 * returning 0 if "same as last time", -2 if lnfname
241 * changed, and the amount by which lineno changed,
242 * if it did. thus, these variables must be static
245 if (src_get(&lineno
, &lnfname
)) {
246 outfmt
->current_dfmt
->linenum(lnfname
, lineno
, segto
);
249 outfmt
->output(segto
, data
, type
, size
, segment
, wrt
);
252 static bool jmp_match(int32_t segment
, int64_t offset
, int bits
,
253 insn
* ins
, const uint8_t *code
)
258 if ((c
!= 0370 && c
!= 0371) || (ins
->oprs
[0].type
& STRICT
))
262 if (optimizing
< 0 && c
== 0371)
265 isize
= calcsize(segment
, offset
, bits
, ins
, code
);
267 if (ins
->oprs
[0].opflags
& OPFLAG_UNKNOWN
)
268 /* Be optimistic in pass 1 */
271 if (ins
->oprs
[0].segment
!= segment
)
274 isize
= ins
->oprs
[0].offset
- offset
- isize
; /* isize is delta */
275 return (isize
>= -128 && isize
<= 127); /* is it byte size? */
278 int64_t assemble(int32_t segment
, int64_t offset
, int bits
, uint32_t cp
,
279 insn
* instruction
, struct ofmt
*output
, efunc error
,
282 const struct itemplate
*temp
;
287 int64_t start
= offset
;
288 int64_t wsize
= 0; /* size for DB etc. */
290 errfunc
= error
; /* to pass to other functions */
292 outfmt
= output
; /* likewise */
293 list
= listgen
; /* and again */
295 switch (instruction
->opcode
) {
325 int32_t t
= instruction
->times
;
328 "instruction->times < 0 (%ld) in assemble()", t
);
330 while (t
--) { /* repeat TIMES times */
331 for (e
= instruction
->eops
; e
; e
= e
->next
) {
332 if (e
->type
== EOT_DB_NUMBER
) {
334 if (e
->segment
!= NO_SEG
)
335 errfunc(ERR_NONFATAL
,
336 "one-byte relocation attempted");
338 uint8_t out_byte
= e
->offset
;
339 out(offset
, segment
, &out_byte
,
340 OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
342 } else if (wsize
> 8) {
343 errfunc(ERR_NONFATAL
,
344 "integer supplied to a DT, DO or DY"
347 out(offset
, segment
, &e
->offset
,
348 OUT_ADDRESS
, wsize
, e
->segment
, e
->wrt
);
350 } else if (e
->type
== EOT_DB_STRING
||
351 e
->type
== EOT_DB_STRING_FREE
) {
354 out(offset
, segment
, e
->stringval
,
355 OUT_RAWDATA
, e
->stringlen
, NO_SEG
, NO_SEG
);
356 align
= e
->stringlen
% wsize
;
359 align
= wsize
- align
;
360 out(offset
, segment
, zero_buffer
,
361 OUT_RAWDATA
, align
, NO_SEG
, NO_SEG
);
363 offset
+= e
->stringlen
+ align
;
366 if (t
> 0 && t
== instruction
->times
- 1) {
368 * Dummy call to list->output to give the offset to the
371 list
->output(offset
, NULL
, OUT_RAWDATA
, 0);
372 list
->uplevel(LIST_TIMES
);
375 if (instruction
->times
> 1)
376 list
->downlevel(LIST_TIMES
);
377 return offset
- start
;
380 if (instruction
->opcode
== I_INCBIN
) {
381 const char *fname
= instruction
->eops
->stringval
;
384 fp
= fopen(fname
, "rb");
386 error(ERR_NONFATAL
, "`incbin': unable to open file `%s'",
388 } else if (fseek(fp
, 0L, SEEK_END
) < 0) {
389 error(ERR_NONFATAL
, "`incbin': unable to seek on file `%s'",
392 static char buf
[4096];
393 size_t t
= instruction
->times
;
398 if (instruction
->eops
->next
) {
399 base
= instruction
->eops
->next
->offset
;
401 if (instruction
->eops
->next
->next
&&
402 len
> (size_t)instruction
->eops
->next
->next
->offset
)
403 len
= (size_t)instruction
->eops
->next
->next
->offset
;
406 * Dummy call to list->output to give the offset to the
409 list
->output(offset
, NULL
, OUT_RAWDATA
, 0);
410 list
->uplevel(LIST_INCBIN
);
414 fseek(fp
, base
, SEEK_SET
);
418 fread(buf
, 1, (l
> (int32_t) sizeof(buf
) ? (int32_t) sizeof(buf
) : l
),
422 * This shouldn't happen unless the file
423 * actually changes while we are reading
427 "`incbin': unexpected EOF while"
428 " reading file `%s'", fname
);
429 t
= 0; /* Try to exit cleanly */
432 out(offset
, segment
, buf
, OUT_RAWDATA
, m
,
437 list
->downlevel(LIST_INCBIN
);
438 if (instruction
->times
> 1) {
440 * Dummy call to list->output to give the offset to the
443 list
->output(offset
, NULL
, OUT_RAWDATA
, 0);
444 list
->uplevel(LIST_TIMES
);
445 list
->downlevel(LIST_TIMES
);
448 return instruction
->times
* len
;
450 return 0; /* if we're here, there's an error */
453 /* Check to see if we need an address-size prefix */
454 add_asp(instruction
, bits
);
458 for (temp
= nasm_instructions
[instruction
->opcode
]; temp
->opcode
!= -1; temp
++){
459 int m
= matches(temp
, instruction
, bits
);
461 (m
== 99 && jmp_match(segment
, offset
, bits
,
462 instruction
, temp
->code
))) {
464 int64_t insn_size
= calcsize(segment
, offset
, bits
,
465 instruction
, temp
->code
);
466 itimes
= instruction
->times
;
467 if (insn_size
< 0) /* shouldn't be, on pass two */
468 error(ERR_PANIC
, "errors made it through from pass one");
471 for (j
= 0; j
< MAXPREFIX
; j
++) {
473 switch (instruction
->prefixes
[j
]) {
491 error(ERR_WARNING
| ERR_PASS2
,
492 "cs segment base generated, but will be ignored in 64-bit mode");
498 error(ERR_WARNING
| ERR_PASS2
,
499 "ds segment base generated, but will be ignored in 64-bit mode");
505 error(ERR_WARNING
| ERR_PASS2
,
506 "es segment base generated, but will be ignored in 64-bit mode");
518 error(ERR_WARNING
| ERR_PASS2
,
519 "ss segment base generated, but will be ignored in 64-bit mode");
526 "segr6 and segr7 cannot be used as prefixes");
531 "16-bit addressing is not supported "
533 } else if (bits
!= 16)
543 "64-bit addressing is only supported "
567 error(ERR_PANIC
, "invalid instruction prefix");
570 out(offset
, segment
, &c
, OUT_RAWDATA
, 1,
575 insn_end
= offset
+ insn_size
;
576 gencode(segment
, offset
, bits
, instruction
,
579 if (itimes
> 0 && itimes
== instruction
->times
- 1) {
581 * Dummy call to list->output to give the offset to the
584 list
->output(offset
, NULL
, OUT_RAWDATA
, 0);
585 list
->uplevel(LIST_TIMES
);
588 if (instruction
->times
> 1)
589 list
->downlevel(LIST_TIMES
);
590 return offset
- start
;
591 } else if (m
> 0 && m
> size_prob
) {
596 if (temp
->opcode
== -1) { /* didn't match any instruction */
599 error(ERR_NONFATAL
, "operation size not specified");
602 error(ERR_NONFATAL
, "mismatch in operand sizes");
605 error(ERR_NONFATAL
, "no instruction for this cpu level");
608 error(ERR_NONFATAL
, "instruction not supported in %d-bit mode",
613 "invalid combination of opcode and operands");
620 int64_t insn_size(int32_t segment
, int64_t offset
, int bits
, uint32_t cp
,
621 insn
* instruction
, efunc error
)
623 const struct itemplate
*temp
;
625 errfunc
= error
; /* to pass to other functions */
628 if (instruction
->opcode
== -1)
631 if (instruction
->opcode
== I_DB
|| instruction
->opcode
== I_DW
||
632 instruction
->opcode
== I_DD
|| instruction
->opcode
== I_DQ
||
633 instruction
->opcode
== I_DT
|| instruction
->opcode
== I_DO
||
634 instruction
->opcode
== I_DY
) {
636 int32_t isize
, osize
, wsize
= 0; /* placate gcc */
639 switch (instruction
->opcode
) {
665 for (e
= instruction
->eops
; e
; e
= e
->next
) {
669 if (e
->type
== EOT_DB_NUMBER
)
671 else if (e
->type
== EOT_DB_STRING
||
672 e
->type
== EOT_DB_STRING_FREE
)
673 osize
= e
->stringlen
;
675 align
= (-osize
) % wsize
;
678 isize
+= osize
+ align
;
680 return isize
* instruction
->times
;
683 if (instruction
->opcode
== I_INCBIN
) {
684 const char *fname
= instruction
->eops
->stringval
;
688 fp
= fopen(fname
, "rb");
690 error(ERR_NONFATAL
, "`incbin': unable to open file `%s'",
692 else if (fseek(fp
, 0L, SEEK_END
) < 0)
693 error(ERR_NONFATAL
, "`incbin': unable to seek on file `%s'",
698 if (instruction
->eops
->next
) {
699 len
-= instruction
->eops
->next
->offset
;
700 if (instruction
->eops
->next
->next
&&
701 len
> (size_t)instruction
->eops
->next
->next
->offset
) {
702 len
= (size_t)instruction
->eops
->next
->next
->offset
;
705 return instruction
->times
* len
;
707 return 0; /* if we're here, there's an error */
710 /* Check to see if we need an address-size prefix */
711 add_asp(instruction
, bits
);
713 for (temp
= nasm_instructions
[instruction
->opcode
]; temp
->opcode
!= -1; temp
++) {
714 int m
= matches(temp
, instruction
, bits
);
716 (m
== 99 && jmp_match(segment
, offset
, bits
,
717 instruction
, temp
->code
))) {
718 /* we've matched an instruction. */
720 const uint8_t *codes
= temp
->code
;
723 isize
= calcsize(segment
, offset
, bits
, instruction
, codes
);
726 for (j
= 0; j
< MAXPREFIX
; j
++) {
727 switch (instruction
->prefixes
[j
]) {
753 return isize
* instruction
->times
;
756 return -1; /* didn't match any instruction */
759 static bool possible_sbyte(operand
*o
)
761 return o
->wrt
== NO_SEG
&& o
->segment
== NO_SEG
&&
762 !(o
->opflags
& OPFLAG_UNKNOWN
) &&
763 optimizing
>= 0 && !(o
->type
& STRICT
);
766 /* check that opn[op] is a signed byte of size 16 or 32 */
767 static bool is_sbyte16(operand
*o
)
771 if (!possible_sbyte(o
))
775 return v
>= -128 && v
<= 127;
778 static bool is_sbyte32(operand
*o
)
782 if (!possible_sbyte(o
))
786 return v
>= -128 && v
<= 127;
789 /* Common construct */
790 #define case4(x) case (x): case (x)+1: case (x)+2: case (x)+3
792 static int64_t calcsize(int32_t segment
, int64_t offset
, int bits
,
793 insn
* ins
, const uint8_t *codes
)
802 ins
->rex
= 0; /* Ensure REX is reset */
804 if (ins
->prefixes
[PPS_OSIZE
] == P_O64
)
807 (void)segment
; /* Don't warn that this parameter is unused */
808 (void)offset
; /* Don't warn that this parameter is unused */
812 op1
= (c
& 3) + ((opex
& 1) << 2);
813 op2
= ((c
>> 3) & 3) + ((opex
& 2) << 1);
814 opx
= &ins
->oprs
[op1
];
815 opex
= 0; /* For the next iteration */
822 codes
+= c
, length
+= c
;
833 op_rexflags(opx
, REX_B
|REX_H
|REX_P
|REX_W
);
848 if (opx
->type
& (BITS16
| BITS32
| BITS64
))
849 length
+= (opx
->type
& BITS16
) ? 2 : 4;
851 length
+= (bits
== 16) ? 2 : 4;
859 length
+= ins
->addr_size
>> 3;
867 length
+= 8; /* MOV reg64/imm */
875 if (opx
->type
& (BITS16
| BITS32
| BITS64
))
876 length
+= (opx
->type
& BITS16
) ? 2 : 4;
878 length
+= (bits
== 16) ? 2 : 4;
890 length
+= is_sbyte16(opx
) ? 1 : 2;
899 length
+= is_sbyte32(opx
) ? 1 : 4;
910 ins
->drexdst
= regval(opx
);
915 ins
->rex
|= REX_D
|REX_OC
;
916 ins
->drexdst
= regval(opx
);
930 length
+= is_sbyte32(opx
) ? 1 : 4;
939 ins
->drexdst
= regval(opx
);
940 ins
->vex_cm
= *codes
++;
941 ins
->vex_wlp
= *codes
++;
947 ins
->vex_cm
= *codes
++;
948 ins
->vex_wlp
= *codes
++;
961 length
+= (bits
!= 16) && !has_prefix(ins
, PPS_ASIZE
, P_A16
);
965 length
+= (bits
!= 32) && !has_prefix(ins
, PPS_ASIZE
, P_A32
);
972 if (bits
!= 64 || has_prefix(ins
, PPS_ASIZE
, P_A16
) ||
973 has_prefix(ins
, PPS_ASIZE
, P_A32
))
981 length
+= (bits
!= 16);
985 length
+= (bits
== 16);
1019 if (!ins
->prefixes
[PPS_LREP
])
1020 ins
->prefixes
[PPS_LREP
] = P_REP
;
1024 if (!ins
->prefixes
[PPS_LREP
])
1025 ins
->prefixes
[PPS_LREP
] = P_REPNE
;
1029 if (ins
->oprs
[0].segment
!= NO_SEG
)
1030 errfunc(ERR_NONFATAL
, "attempt to reserve non-constant"
1031 " quantity of BSS space");
1033 length
+= ins
->oprs
[0].offset
;
1037 if (!ins
->prefixes
[PPS_WAIT
])
1038 ins
->prefixes
[PPS_WAIT
] = P_WAIT
;
1088 struct operand
*opy
= &ins
->oprs
[op2
];
1090 ea_data
.rex
= 0; /* Ensure ea.REX is initially 0 */
1093 /* pick rfield from operand b (opx) */
1094 rflags
= regflag(opx
);
1095 rfield
= nasm_regvals
[opx
->basereg
];
1100 if (!process_ea(opy
, &ea_data
, bits
,
1101 ins
->addr_size
, rfield
, rflags
)) {
1102 errfunc(ERR_NONFATAL
, "invalid effective address");
1105 ins
->rex
|= ea_data
.rex
;
1106 length
+= ea_data
.size
;
1112 errfunc(ERR_PANIC
, "internal instruction table corrupt"
1113 ": instruction code \\%o (0x%02X) given", c
, c
);
1118 ins
->rex
&= rex_mask
;
1120 if (ins
->rex
& REX_V
) {
1121 int bad32
= REX_R
|REX_W
|REX_X
|REX_B
;
1123 if (ins
->rex
& REX_H
) {
1124 errfunc(ERR_NONFATAL
, "cannot use high register in vex instruction");
1127 switch (ins
->vex_wlp
& 030) {
1141 if (bits
!= 64 && ((ins
->rex
& bad32
) || ins
->drexdst
> 7)) {
1142 errfunc(ERR_NONFATAL
, "invalid operands in non-64-bit mode");
1145 if (ins
->vex_cm
!= 1 || (ins
->rex
& (REX_W
|REX_R
|REX_B
)))
1149 } else if (ins
->rex
& REX_D
) {
1150 if (ins
->rex
& REX_H
) {
1151 errfunc(ERR_NONFATAL
, "cannot use high register in drex instruction");
1154 if (bits
!= 64 && ((ins
->rex
& (REX_R
|REX_W
|REX_X
|REX_B
)) ||
1155 ins
->drexdst
> 7)) {
1156 errfunc(ERR_NONFATAL
, "invalid operands in non-64-bit mode");
1160 } else if (ins
->rex
& REX_REAL
) {
1161 if (ins
->rex
& REX_H
) {
1162 errfunc(ERR_NONFATAL
, "cannot use high register in rex instruction");
1164 } else if (bits
== 64) {
1166 } else if ((ins
->rex
& REX_L
) &&
1167 !(ins
->rex
& (REX_P
|REX_W
|REX_X
|REX_B
)) &&
1170 assert_no_prefix(ins
, PPS_LREP
);
1173 errfunc(ERR_NONFATAL
, "invalid operands in non-64-bit mode");
1181 #define EMIT_REX() \
1182 if (!(ins->rex & (REX_D|REX_V)) && (ins->rex & REX_REAL) && (bits == 64)) { \
1183 ins->rex = (ins->rex & REX_REAL)|REX_P; \
1184 out(offset, segment, &ins->rex, OUT_RAWDATA, 1, NO_SEG, NO_SEG); \
1189 static void gencode(int32_t segment
, int64_t offset
, int bits
,
1190 insn
* ins
, const struct itemplate
*temp
,
1193 static char condval
[] = { /* conditional opcodes */
1194 0x7, 0x3, 0x2, 0x6, 0x2, 0x4, 0xF, 0xD, 0xC, 0xE, 0x6, 0x2,
1195 0x3, 0x7, 0x3, 0x5, 0xE, 0xC, 0xD, 0xF, 0x1, 0xB, 0x9, 0x5,
1196 0x0, 0xA, 0xA, 0xB, 0x8, 0x4
1203 struct operand
*opx
;
1204 const uint8_t *codes
= temp
->code
;
1209 op1
= (c
& 3) + ((opex
& 1) << 2);
1210 op2
= ((c
>> 3) & 3) + ((opex
& 2) << 1);
1211 opx
= &ins
->oprs
[op1
];
1212 opex
= 0; /* For the next iteration */
1220 out(offset
, segment
, codes
, OUT_RAWDATA
, c
, NO_SEG
, NO_SEG
);
1233 bytes
[0] = *codes
++ + (regval(opx
) & 7);
1234 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1239 /* The test for BITS8 and SBYTE here is intended to avoid
1240 warning on optimizer actions due to SBYTE, while still
1241 warn on explicit BYTE directives. Also warn, obviously,
1242 if the optimizer isn't enabled. */
1243 if (((opx
->type
& BITS8
) ||
1244 !(opx
->type
& temp
->opd
[op1
] & BYTENESS
)) &&
1245 (opx
->offset
< -128 || opx
->offset
> 127)) {
1246 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1247 "signed byte value exceeds bounds");
1249 if (opx
->segment
!= NO_SEG
) {
1251 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1252 opx
->segment
, opx
->wrt
);
1254 bytes
[0] = opx
->offset
;
1255 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1262 if (opx
->offset
< -256 || opx
->offset
> 255) {
1263 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1264 "byte value exceeds bounds");
1266 if (opx
->segment
!= NO_SEG
) {
1268 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1269 opx
->segment
, opx
->wrt
);
1271 bytes
[0] = opx
->offset
;
1272 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1279 if (opx
->offset
< 0 || opx
->offset
> 255)
1280 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1281 "unsigned byte value exceeds bounds");
1282 if (opx
->segment
!= NO_SEG
) {
1284 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1285 opx
->segment
, opx
->wrt
);
1287 bytes
[0] = opx
->offset
;
1288 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1295 warn_overflow(2, opx
);
1297 out(offset
, segment
, &data
, OUT_ADDRESS
, 2,
1298 opx
->segment
, opx
->wrt
);
1303 if (opx
->type
& (BITS16
| BITS32
))
1304 size
= (opx
->type
& BITS16
) ? 2 : 4;
1306 size
= (bits
== 16) ? 2 : 4;
1307 warn_overflow(size
, opx
);
1309 out(offset
, segment
, &data
, OUT_ADDRESS
, size
,
1310 opx
->segment
, opx
->wrt
);
1315 warn_overflow(4, opx
);
1317 out(offset
, segment
, &data
, OUT_ADDRESS
, 4,
1318 opx
->segment
, opx
->wrt
);
1324 size
= ins
->addr_size
>> 3;
1325 warn_overflow(size
, opx
);
1326 out(offset
, segment
, &data
, OUT_ADDRESS
, size
,
1327 opx
->segment
, opx
->wrt
);
1332 if (opx
->segment
!= segment
)
1333 errfunc(ERR_NONFATAL
,
1334 "short relative jump outside segment");
1335 data
= opx
->offset
- insn_end
;
1336 if (data
> 127 || data
< -128)
1337 errfunc(ERR_NONFATAL
, "short jump is out of range");
1339 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1344 data
= (int64_t)opx
->offset
;
1345 out(offset
, segment
, &data
, OUT_ADDRESS
, 8,
1346 opx
->segment
, opx
->wrt
);
1351 if (opx
->segment
!= segment
) {
1353 out(offset
, segment
, &data
,
1354 OUT_REL2ADR
, insn_end
- offset
,
1355 opx
->segment
, opx
->wrt
);
1357 data
= opx
->offset
- insn_end
;
1358 out(offset
, segment
, &data
,
1359 OUT_ADDRESS
, 2, NO_SEG
, NO_SEG
);
1365 if (opx
->type
& (BITS16
| BITS32
| BITS64
))
1366 size
= (opx
->type
& BITS16
) ? 2 : 4;
1368 size
= (bits
== 16) ? 2 : 4;
1369 if (opx
->segment
!= segment
) {
1371 out(offset
, segment
, &data
,
1372 size
== 2 ? OUT_REL2ADR
: OUT_REL4ADR
,
1373 insn_end
- offset
, opx
->segment
, opx
->wrt
);
1375 data
= opx
->offset
- insn_end
;
1376 out(offset
, segment
, &data
,
1377 OUT_ADDRESS
, size
, NO_SEG
, NO_SEG
);
1383 if (opx
->segment
!= segment
) {
1385 out(offset
, segment
, &data
,
1386 OUT_REL4ADR
, insn_end
- offset
,
1387 opx
->segment
, opx
->wrt
);
1389 data
= opx
->offset
- insn_end
;
1390 out(offset
, segment
, &data
,
1391 OUT_ADDRESS
, 4, NO_SEG
, NO_SEG
);
1397 if (opx
->segment
== NO_SEG
)
1398 errfunc(ERR_NONFATAL
, "value referenced by FAR is not"
1401 out(offset
, segment
, &data
, OUT_ADDRESS
, 2,
1402 outfmt
->segbase(1 + opx
->segment
),
1409 warn_overflow(2, opx
);
1410 if (is_sbyte16(opx
)) {
1412 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1416 out(offset
, segment
, &data
, OUT_ADDRESS
, 2,
1417 opx
->segment
, opx
->wrt
);
1424 bytes
[0] = *codes
++;
1425 if (is_sbyte16(opx
))
1426 bytes
[0] |= 2; /* s-bit */
1427 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1433 warn_overflow(4, opx
);
1434 if (is_sbyte32(opx
)) {
1436 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1440 out(offset
, segment
, &data
, OUT_ADDRESS
, 4,
1441 opx
->segment
, opx
->wrt
);
1448 bytes
[0] = *codes
++;
1449 if (is_sbyte32(opx
))
1450 bytes
[0] |= 2; /* s-bit */
1451 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1461 (ins
->drexdst
<< 4) |
1462 (ins
->rex
& REX_OC
? 0x08 : 0) |
1463 (ins
->rex
& (REX_R
|REX_X
|REX_B
));
1465 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1471 opx
= &ins
->oprs
[c
>> 3];
1472 bytes
[0] = nasm_regvals
[opx
->basereg
] << 4;
1473 opx
= &ins
->oprs
[c
& 7];
1474 if (opx
->segment
!= NO_SEG
|| opx
->wrt
!= NO_SEG
) {
1475 errfunc(ERR_NONFATAL
,
1476 "non-absolute expression not permitted as argument %d",
1479 if (opx
->offset
& ~15) {
1480 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1481 "four-bit argument exceeds bounds");
1483 bytes
[0] |= opx
->offset
& 15;
1485 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1491 opx
= &ins
->oprs
[c
>> 4];
1492 bytes
[0] = nasm_regvals
[opx
->basereg
] << 4;
1494 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1500 opx
= &ins
->oprs
[c
];
1501 bytes
[0] = nasm_regvals
[opx
->basereg
] << 4;
1502 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1508 if (opx
->wrt
== NO_SEG
&& opx
->segment
== NO_SEG
&&
1509 (int32_t)data
!= (int64_t)data
) {
1510 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1511 "signed dword immediate exceeds bounds");
1513 if (is_sbyte32(opx
)) {
1515 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1519 out(offset
, segment
, &data
, OUT_ADDRESS
, 4,
1520 opx
->segment
, opx
->wrt
);
1527 if (opx
->wrt
== NO_SEG
&& opx
->segment
== NO_SEG
&&
1528 (int32_t)data
!= (int64_t)data
) {
1529 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1530 "signed dword immediate exceeds bounds");
1532 out(offset
, segment
, &data
, OUT_ADDRESS
, 4,
1533 opx
->segment
, opx
->wrt
);
1540 if (ins
->vex_cm
!= 1 || (ins
->rex
& (REX_W
|REX_X
|REX_B
))) {
1541 bytes
[0] = (ins
->vex_cm
>> 6) ? 0x8f : 0xc4;
1542 bytes
[1] = (ins
->vex_cm
& 31) | ((~ins
->rex
& 7) << 5);
1543 bytes
[2] = ((ins
->rex
& REX_W
) << (7-3)) |
1544 ((~ins
->drexdst
& 15)<< 3) | (ins
->vex_wlp
& 07);
1545 out(offset
, segment
, &bytes
, OUT_RAWDATA
, 3, NO_SEG
, NO_SEG
);
1549 bytes
[1] = ((~ins
->rex
& REX_R
) << (7-2)) |
1550 ((~ins
->drexdst
& 15) << 3) | (ins
->vex_wlp
& 07);
1551 out(offset
, segment
, &bytes
, OUT_RAWDATA
, 2, NO_SEG
, NO_SEG
);
1561 if (ins
->rex
& REX_W
)
1563 else if (ins
->prefixes
[PPS_OSIZE
] == P_O16
)
1565 else if (ins
->prefixes
[PPS_OSIZE
] == P_O32
)
1570 um
= (uint64_t)2 << (s
-1);
1573 if (uv
> 127 && uv
< (uint64_t)-128 &&
1574 (uv
< um
-128 || uv
> um
-1)) {
1575 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1576 "signed byte value exceeds bounds");
1578 if (opx
->segment
!= NO_SEG
) {
1580 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1581 opx
->segment
, opx
->wrt
);
1584 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1595 if (bits
== 32 && !has_prefix(ins
, PPS_ASIZE
, P_A16
)) {
1597 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1604 if (bits
!= 32 && !has_prefix(ins
, PPS_ASIZE
, P_A32
)) {
1606 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1625 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1634 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1649 *bytes
= *codes
++ ^ condval
[ins
->condition
];
1650 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1659 *bytes
= c
- 0332 + 0xF2;
1660 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1665 if (ins
->rex
& REX_R
) {
1667 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1670 ins
->rex
&= ~(REX_L
|REX_R
);
1681 if (ins
->oprs
[0].segment
!= NO_SEG
)
1682 errfunc(ERR_PANIC
, "non-constant BSS size in pass two");
1684 int64_t size
= ins
->oprs
[0].offset
;
1686 out(offset
, segment
, NULL
,
1687 OUT_RESERVE
, size
, NO_SEG
, NO_SEG
);
1698 switch (ins
->oprs
[0].basereg
) {
1713 "bizarre 8086 segment register received");
1715 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1722 switch (ins
->oprs
[0].basereg
) {
1731 "bizarre 386 segment register received");
1733 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1742 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1748 bytes
[0] = c
- 0362 + 0xf2;
1749 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1759 *bytes
= c
- 0366 + 0x66;
1760 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1770 *bytes
= bits
== 16 ? 3 : 5;
1771 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1794 struct operand
*opy
= &ins
->oprs
[op2
];
1797 /* pick rfield from operand b (opx) */
1798 rflags
= regflag(opx
);
1799 rfield
= nasm_regvals
[opx
->basereg
];
1801 /* rfield is constant */
1806 if (!process_ea(opy
, &ea_data
, bits
, ins
->addr_size
,
1808 errfunc(ERR_NONFATAL
, "invalid effective address");
1813 *p
++ = ea_data
.modrm
;
1814 if (ea_data
.sib_present
)
1817 /* DREX suffixes come between the SIB and the displacement */
1818 if (ins
->rex
& REX_D
) {
1819 *p
++ = (ins
->drexdst
<< 4) |
1820 (ins
->rex
& REX_OC
? 0x08 : 0) |
1821 (ins
->rex
& (REX_R
|REX_X
|REX_B
));
1826 out(offset
, segment
, bytes
, OUT_RAWDATA
, s
, NO_SEG
, NO_SEG
);
1829 * Make sure the address gets the right offset in case
1830 * the line breaks in the .lst file (BR 1197827)
1835 switch (ea_data
.bytes
) {
1843 warn_overflow(ea_data
.bytes
, opy
);
1846 if (opy
->segment
== segment
) {
1848 out(offset
, segment
, &data
, OUT_ADDRESS
,
1849 ea_data
.bytes
, NO_SEG
, NO_SEG
);
1851 out(offset
, segment
, &data
, OUT_REL4ADR
,
1852 insn_end
- offset
, opy
->segment
, opy
->wrt
);
1856 out(offset
, segment
, &data
, OUT_ADDRESS
,
1857 ea_data
.bytes
, opy
->segment
, opy
->wrt
);
1863 "Invalid amount of bytes (%d) for offset?!",
1872 errfunc(ERR_PANIC
, "internal instruction table corrupt"
1873 ": instruction code \\%o (0x%02X) given", c
, c
);
1879 static int32_t regflag(const operand
* o
)
1881 if (o
->basereg
< EXPR_REG_START
|| o
->basereg
>= REG_ENUM_LIMIT
) {
1882 errfunc(ERR_PANIC
, "invalid operand passed to regflag()");
1884 return nasm_reg_flags
[o
->basereg
];
1887 static int32_t regval(const operand
* o
)
1889 if (o
->basereg
< EXPR_REG_START
|| o
->basereg
>= REG_ENUM_LIMIT
) {
1890 errfunc(ERR_PANIC
, "invalid operand passed to regval()");
1892 return nasm_regvals
[o
->basereg
];
1895 static int op_rexflags(const operand
* o
, int mask
)
1900 if (o
->basereg
< EXPR_REG_START
|| o
->basereg
>= REG_ENUM_LIMIT
) {
1901 errfunc(ERR_PANIC
, "invalid operand passed to op_rexflags()");
1904 flags
= nasm_reg_flags
[o
->basereg
];
1905 val
= nasm_regvals
[o
->basereg
];
1907 return rexflags(val
, flags
, mask
);
1910 static int rexflags(int val
, int32_t flags
, int mask
)
1915 rex
|= REX_B
|REX_X
|REX_R
;
1918 if (!(REG_HIGH
& ~flags
)) /* AH, CH, DH, BH */
1920 else if (!(REG8
& ~flags
) && val
>= 4) /* SPL, BPL, SIL, DIL */
1926 static int matches(const struct itemplate
*itemp
, insn
* instruction
, int bits
)
1928 int i
, size
[MAX_OPERANDS
], asize
, oprs
, ret
;
1935 if (itemp
->opcode
!= instruction
->opcode
)
1939 * Count the operands
1941 if (itemp
->operands
!= instruction
->operands
)
1945 * Check that no spurious colons or TOs are present
1947 for (i
= 0; i
< itemp
->operands
; i
++)
1948 if (instruction
->oprs
[i
].type
& ~itemp
->opd
[i
] & (COLON
| TO
))
1952 * Process size flags
1954 if (itemp
->flags
& IF_ARMASK
) {
1955 memset(size
, 0, sizeof size
);
1957 i
= ((itemp
->flags
& IF_ARMASK
) >> IF_ARSHFT
) - 1;
1959 switch (itemp
->flags
& IF_SMASK
) {
1996 switch (itemp
->flags
& IF_SMASK
) {
2031 for (i
= 0; i
< MAX_OPERANDS
; i
++)
2036 * Check that the operand flags all match up
2038 for (i
= 0; i
< itemp
->operands
; i
++) {
2039 int32_t type
= instruction
->oprs
[i
].type
;
2040 if (!(type
& SIZE_MASK
))
2043 if (itemp
->opd
[i
] & SAME_AS
) {
2044 int j
= itemp
->opd
[i
] & ~SAME_AS
;
2045 if (type
!= instruction
->oprs
[j
].type
||
2046 instruction
->oprs
[i
].basereg
!= instruction
->oprs
[j
].basereg
)
2048 } else if (itemp
->opd
[i
] & ~type
||
2049 ((itemp
->opd
[i
] & SIZE_MASK
) &&
2050 ((itemp
->opd
[i
] ^ type
) & SIZE_MASK
))) {
2051 if ((itemp
->opd
[i
] & ~type
& ~SIZE_MASK
) ||
2060 * Check operand sizes
2062 if (itemp
->flags
& (IF_SM
| IF_SM2
)) {
2063 oprs
= (itemp
->flags
& IF_SM2
? 2 : itemp
->operands
);
2065 for (i
= 0; i
< oprs
; i
++) {
2066 if ((asize
= itemp
->opd
[i
] & SIZE_MASK
) != 0) {
2068 for (j
= 0; j
< oprs
; j
++)
2074 oprs
= itemp
->operands
;
2077 for (i
= 0; i
< itemp
->operands
; i
++) {
2078 if (!(itemp
->opd
[i
] & SIZE_MASK
) &&
2079 (instruction
->oprs
[i
].type
& SIZE_MASK
& ~size
[i
]))
2084 * Check template is okay at the set cpu level
2086 if (((itemp
->flags
& IF_PLEVEL
) > cpu
))
2090 * Verify the appropriate long mode flag.
2092 if ((itemp
->flags
& (bits
== 64 ? IF_NOLONG
: IF_LONG
)))
2096 * Check if special handling needed for Jumps
2098 if ((uint8_t)(itemp
->code
[0]) >= 0370)
2104 static ea
*process_ea(operand
* input
, ea
* output
, int bits
,
2105 int addrbits
, int rfield
, int32_t rflags
)
2107 bool forw_ref
= !!(input
->opflags
& OPFLAG_UNKNOWN
);
2109 output
->rip
= false;
2111 /* REX flags for the rfield operand */
2112 output
->rex
|= rexflags(rfield
, rflags
, REX_R
|REX_P
|REX_W
|REX_H
);
2114 if (!(REGISTER
& ~input
->type
)) { /* register direct */
2118 if (input
->basereg
< EXPR_REG_START
/* Verify as Register */
2119 || input
->basereg
>= REG_ENUM_LIMIT
)
2122 i
= nasm_regvals
[input
->basereg
];
2125 return NULL
; /* Invalid EA register */
2127 output
->rex
|= op_rexflags(input
, REX_B
|REX_P
|REX_W
|REX_H
);
2129 output
->sib_present
= false; /* no SIB necessary */
2130 output
->bytes
= 0; /* no offset necessary either */
2131 output
->modrm
= 0xC0 | ((rfield
& 7) << 3) | (i
& 7);
2132 } else { /* it's a memory reference */
2133 if (input
->basereg
== -1
2134 && (input
->indexreg
== -1 || input
->scale
== 0)) {
2135 /* it's a pure offset */
2136 if (bits
== 64 && (~input
->type
& IP_REL
)) {
2137 int scale
, index
, base
;
2138 output
->sib_present
= true;
2142 output
->sib
= (scale
<< 6) | (index
<< 3) | base
;
2144 output
->modrm
= 4 | ((rfield
& 7) << 3);
2145 output
->rip
= false;
2147 output
->sib_present
= false;
2148 output
->bytes
= (addrbits
!= 16 ? 4 : 2);
2149 output
->modrm
= (addrbits
!= 16 ? 5 : 6) | ((rfield
& 7) << 3);
2150 output
->rip
= bits
== 64;
2152 } else { /* it's an indirection */
2153 int i
= input
->indexreg
, b
= input
->basereg
, s
= input
->scale
;
2154 int32_t o
= input
->offset
, seg
= input
->segment
;
2155 int hb
= input
->hintbase
, ht
= input
->hinttype
;
2158 int32_t ix
, bx
; /* register flags */
2161 i
= -1; /* make this easy, at least */
2163 if (i
>= EXPR_REG_START
&& i
< REG_ENUM_LIMIT
) {
2164 it
= nasm_regvals
[i
];
2165 ix
= nasm_reg_flags
[i
];
2171 if (b
>= EXPR_REG_START
&& b
< REG_ENUM_LIMIT
) {
2172 bt
= nasm_regvals
[b
];
2173 bx
= nasm_reg_flags
[b
];
2179 /* check for a 32/64-bit memory reference... */
2180 if ((ix
|bx
) & (BITS32
|BITS64
)) {
2181 /* it must be a 32/64-bit memory reference. Firstly we have
2182 * to check that all registers involved are type E/Rxx. */
2183 int32_t sok
= BITS32
|BITS64
;
2186 if (!(REG64
& ~ix
) || !(REG32
& ~ix
))
2194 return NULL
; /* Invalid register */
2195 if (~sok
& bx
& SIZE_MASK
)
2196 return NULL
; /* Invalid size */
2200 /* While we're here, ensure the user didn't specify
2202 if (input
->disp_size
== 16 || input
->disp_size
== 64)
2205 if (addrbits
== 16 ||
2206 (addrbits
== 32 && !(sok
& BITS32
)) ||
2207 (addrbits
== 64 && !(sok
& BITS64
)))
2210 /* now reorganize base/index */
2211 if (s
== 1 && bt
!= it
&& bt
!= -1 && it
!= -1 &&
2212 ((hb
== b
&& ht
== EAH_NOTBASE
)
2213 || (hb
== i
&& ht
== EAH_MAKEBASE
))) {
2214 /* swap if hints say so */
2215 t
= bt
, bt
= it
, it
= t
;
2216 t
= bx
, bx
= ix
, ix
= t
;
2218 if (bt
== it
) /* convert EAX+2*EAX to 3*EAX */
2219 bt
= -1, bx
= 0, s
++;
2220 if (bt
== -1 && s
== 1 && !(hb
== it
&& ht
== EAH_NOTBASE
)) {
2221 /* make single reg base, unless hint */
2222 bt
= it
, bx
= ix
, it
= -1, ix
= 0;
2224 if (((s
== 2 && it
!= REG_NUM_ESP
2225 && !(input
->eaflags
& EAF_TIMESTWO
)) || s
== 3
2226 || s
== 5 || s
== 9) && bt
== -1)
2227 bt
= it
, bx
= ix
, s
--; /* convert 3*EAX to EAX+2*EAX */
2228 if (it
== -1 && (bt
& 7) != REG_NUM_ESP
2229 && (input
->eaflags
& EAF_TIMESTWO
))
2230 it
= bt
, ix
= bx
, bt
= -1, bx
= 0, s
= 1;
2231 /* convert [NOSPLIT EAX] to sib format with 0x0 displacement */
2232 if (s
== 1 && it
== REG_NUM_ESP
) {
2233 /* swap ESP into base if scale is 1 */
2234 t
= it
, it
= bt
, bt
= t
;
2235 t
= ix
, ix
= bx
, bx
= t
;
2237 if (it
== REG_NUM_ESP
2238 || (s
!= 1 && s
!= 2 && s
!= 4 && s
!= 8 && it
!= -1))
2239 return NULL
; /* wrong, for various reasons */
2241 output
->rex
|= rexflags(it
, ix
, REX_X
);
2242 output
->rex
|= rexflags(bt
, bx
, REX_B
);
2244 if (it
== -1 && (bt
& 7) != REG_NUM_ESP
) {
2253 if (rm
!= REG_NUM_EBP
&& o
== 0 &&
2254 seg
== NO_SEG
&& !forw_ref
&&
2256 (EAF_BYTEOFFS
| EAF_WORDOFFS
)))
2258 else if (input
->eaflags
& EAF_BYTEOFFS
||
2259 (o
>= -128 && o
<= 127 && seg
== NO_SEG
2261 && !(input
->eaflags
& EAF_WORDOFFS
)))
2267 output
->sib_present
= false;
2268 output
->bytes
= (bt
== -1 || mod
== 2 ? 4 : mod
);
2269 output
->modrm
= (mod
<< 6) | ((rfield
& 7) << 3) | rm
;
2272 int mod
, scale
, index
, base
;
2292 default: /* then what the smeg is it? */
2293 return NULL
; /* panic */
2301 if (base
!= REG_NUM_EBP
&& o
== 0 &&
2302 seg
== NO_SEG
&& !forw_ref
&&
2304 (EAF_BYTEOFFS
| EAF_WORDOFFS
)))
2306 else if (input
->eaflags
& EAF_BYTEOFFS
||
2307 (o
>= -128 && o
<= 127 && seg
== NO_SEG
2309 && !(input
->eaflags
& EAF_WORDOFFS
)))
2315 output
->sib_present
= true;
2316 output
->bytes
= (bt
== -1 || mod
== 2 ? 4 : mod
);
2317 output
->modrm
= (mod
<< 6) | ((rfield
& 7) << 3) | 4;
2318 output
->sib
= (scale
<< 6) | (index
<< 3) | base
;
2320 } else { /* it's 16-bit */
2323 /* check for 64-bit long mode */
2327 /* check all registers are BX, BP, SI or DI */
2328 if ((b
!= -1 && b
!= R_BP
&& b
!= R_BX
&& b
!= R_SI
2329 && b
!= R_DI
) || (i
!= -1 && i
!= R_BP
&& i
!= R_BX
2330 && i
!= R_SI
&& i
!= R_DI
))
2333 /* ensure the user didn't specify DWORD/QWORD */
2334 if (input
->disp_size
== 32 || input
->disp_size
== 64)
2337 if (s
!= 1 && i
!= -1)
2338 return NULL
; /* no can do, in 16-bit EA */
2339 if (b
== -1 && i
!= -1) {
2344 if ((b
== R_SI
|| b
== R_DI
) && i
!= -1) {
2349 /* have BX/BP as base, SI/DI index */
2351 return NULL
; /* shouldn't ever happen, in theory */
2352 if (i
!= -1 && b
!= -1 &&
2353 (i
== R_BP
|| i
== R_BX
|| b
== R_SI
|| b
== R_DI
))
2354 return NULL
; /* invalid combinations */
2355 if (b
== -1) /* pure offset: handled above */
2356 return NULL
; /* so if it gets to here, panic! */
2360 switch (i
* 256 + b
) {
2361 case R_SI
* 256 + R_BX
:
2364 case R_DI
* 256 + R_BX
:
2367 case R_SI
* 256 + R_BP
:
2370 case R_DI
* 256 + R_BP
:
2388 if (rm
== -1) /* can't happen, in theory */
2389 return NULL
; /* so panic if it does */
2391 if (o
== 0 && seg
== NO_SEG
&& !forw_ref
&& rm
!= 6 &&
2392 !(input
->eaflags
& (EAF_BYTEOFFS
| EAF_WORDOFFS
)))
2394 else if (input
->eaflags
& EAF_BYTEOFFS
||
2395 (o
>= -128 && o
<= 127 && seg
== NO_SEG
2397 && !(input
->eaflags
& EAF_WORDOFFS
)))
2402 output
->sib_present
= false; /* no SIB - it's 16-bit */
2403 output
->bytes
= mod
; /* bytes of offset needed */
2404 output
->modrm
= (mod
<< 6) | ((rfield
& 7) << 3) | rm
;
2409 output
->size
= 1 + output
->sib_present
+ output
->bytes
;
2413 static void add_asp(insn
*ins
, int addrbits
)
2418 valid
= (addrbits
== 64) ? 64|32 : 32|16;
2420 switch (ins
->prefixes
[PPS_ASIZE
]) {
2431 valid
&= (addrbits
== 32) ? 16 : 32;
2437 for (j
= 0; j
< ins
->operands
; j
++) {
2438 if (!(MEMORY
& ~ins
->oprs
[j
].type
)) {
2441 /* Verify as Register */
2442 if (ins
->oprs
[j
].indexreg
< EXPR_REG_START
2443 || ins
->oprs
[j
].indexreg
>= REG_ENUM_LIMIT
)
2446 i
= nasm_reg_flags
[ins
->oprs
[j
].indexreg
];
2448 /* Verify as Register */
2449 if (ins
->oprs
[j
].basereg
< EXPR_REG_START
2450 || ins
->oprs
[j
].basereg
>= REG_ENUM_LIMIT
)
2453 b
= nasm_reg_flags
[ins
->oprs
[j
].basereg
];
2455 if (ins
->oprs
[j
].scale
== 0)
2459 int ds
= ins
->oprs
[j
].disp_size
;
2460 if ((addrbits
!= 64 && ds
> 8) ||
2461 (addrbits
== 64 && ds
== 16))
2481 if (valid
& addrbits
) {
2482 ins
->addr_size
= addrbits
;
2483 } else if (valid
& ((addrbits
== 32) ? 16 : 32)) {
2484 /* Add an address size prefix */
2485 enum prefixes pref
= (addrbits
== 32) ? P_A16
: P_A32
;
2486 ins
->prefixes
[PPS_ASIZE
] = pref
;
2487 ins
->addr_size
= (addrbits
== 32) ? 16 : 32;
2490 errfunc(ERR_NONFATAL
, "impossible combination of address sizes");
2491 ins
->addr_size
= addrbits
; /* Error recovery */
2494 defdisp
= ins
->addr_size
== 16 ? 16 : 32;
2496 for (j
= 0; j
< ins
->operands
; j
++) {
2497 if (!(MEM_OFFS
& ~ins
->oprs
[j
].type
) &&
2498 (ins
->oprs
[j
].disp_size
? ins
->oprs
[j
].disp_size
: defdisp
)
2499 != ins
->addr_size
) {
2500 /* mem_offs sizes must match the address size; if not,
2501 strip the MEM_OFFS bit and match only EA instructions */
2502 ins
->oprs
[j
].type
&= ~(MEM_OFFS
& ~MEMORY
);