1 /* assemble.c code generation for the Netwide Assembler
3 * The Netwide Assembler is copyright (C) 1996 Simon Tatham and
4 * Julian Hall. All rights reserved. The software is
5 * redistributable under the license given in the file "LICENSE"
6 * distributed in the NASM archive.
8 * the actual codes (C syntax, i.e. octal):
9 * \0 - terminates the code. (Unless it's a literal of course.)
10 * \1, \2, \3 - that many literal bytes follow in the code stream
11 * \10..\13 - a literal byte follows in the code stream, to be added
12 * to the register value of operand 0..3
13 * \14..\17 - a signed byte immediate operand, from operand 0..3
14 * \20..\23 - a byte immediate operand, from operand 0..3
15 * \24..\27 - an unsigned byte immediate operand, from operand 0..3
16 * \30..\33 - a word immediate operand, from operand 0..3
17 * \34..\37 - select between \3[0-3] and \4[0-3] depending on 16/32 bit
18 * assembly mode or the operand-size override on the operand
19 * \40..\43 - a long immediate operand, from operand 0..3
20 * \44..\47 - select between \3[0-3], \4[0-3] and \5[4-7]
21 * depending on the address size of the instruction.
22 * \50..\53 - a byte relative operand, from operand 0..3
23 * \54..\57 - a qword immediate operand, from operand 0..3
24 * \60..\63 - a word relative operand, from operand 0..3
25 * \64..\67 - select between \6[0-3] and \7[0-3] depending on 16/32 bit
26 * assembly mode or the operand-size override on the operand
27 * \70..\73 - a long relative operand, from operand 0..3
28 * \74..\77 - a word constant, from the _segment_ part of operand 0..3
29 * \1ab - a ModRM, calculated on EA in operand a, with the spare
30 * field the register value of operand b.
31 * \140..\143 - an immediate word or signed byte for operand 0..3
32 * \144..\147 - or 2 (s-field) into opcode byte if operand 0..3
33 * is a signed byte rather than a word. Opcode byte follows.
34 * \150..\153 - an immediate dword or signed byte for operand 0..3
35 * \154..\157 - or 2 (s-field) into opcode byte if operand 0..3
36 * is a signed byte rather than a dword. Opcode byte follows.
37 * \160..\163 - this instruction uses DREX rather than REX, with the
38 * OC0 field set to 0, and the dest field taken from
40 * \164..\167 - this instruction uses DREX rather than REX, with the
41 * OC0 field set to 1, and the dest field taken from
43 * \171 - placement of DREX suffix in the absence of an EA
44 * \172\ab - the register number from operand a in bits 7..4, with
45 * the 4-bit immediate from operand b in bits 3..0.
46 * \173\xab - the register number from operand a in bits 7..4, with
47 * the value b in bits 3..0.
48 * \174\a - the register number from operand a in bits 7..4, and
49 * an arbitrary value in bits 3..0 (assembled as zero.)
50 * \2ab - a ModRM, calculated on EA in operand a, with the spare
51 * field equal to digit b.
52 * \250..\253 - same as \150..\153, except warn if the 64-bit operand
53 * is not equal to the truncated and sign-extended 32-bit
54 * operand; used for 32-bit immediates in 64-bit mode.
55 * \254..\257 - a signed 32-bit operand to be extended to 64 bits.
56 * \260..\263 - this instruction uses VEX rather than REX, with the
57 * V field taken from operand 0..3.
58 * \270 - this instruction uses VEX rather than REX, with the
59 * V field set to 1111b.
61 * VEX prefixes are followed by the sequence:
62 * \mm\wlp where mm is the M field; and wlp is:
64 * [w0] ww = 0 for W = 0
65 * [w1] ww = 1 for W = 1
66 * [wx] ww = 2 for W don't care (always assembled as 0)
67 * [ww] ww = 3 for W used as REX.W
70 * \274..\277 - a signed byte immediate operand, from operand 0..3,
71 * which is to be extended to the operand size.
72 * \310 - indicates fixed 16-bit address size, i.e. optional 0x67.
73 * \311 - indicates fixed 32-bit address size, i.e. optional 0x67.
74 * \312 - (disassembler only) marker on LOOP, LOOPxx instructions.
75 * \313 - indicates fixed 64-bit address size, 0x67 invalid.
76 * \314 - (disassembler only) invalid with REX.B
77 * \315 - (disassembler only) invalid with REX.X
78 * \316 - (disassembler only) invalid with REX.R
79 * \317 - (disassembler only) invalid with REX.W
80 * \320 - indicates fixed 16-bit operand size, i.e. optional 0x66.
81 * \321 - indicates fixed 32-bit operand size, i.e. optional 0x66.
82 * \322 - indicates that this instruction is only valid when the
83 * operand size is the default (instruction to disassembler,
84 * generates no code in the assembler)
85 * \323 - indicates fixed 64-bit operand size, REX on extensions only.
86 * \324 - indicates 64-bit operand size requiring REX prefix.
87 * \330 - a literal byte follows in the code stream, to be added
88 * to the condition code value of the instruction.
89 * \331 - instruction not valid with REP prefix. Hint for
90 * disassembler only; for SSE instructions.
91 * \332 - REP prefix (0xF2 byte) used as opcode extension.
92 * \333 - REP prefix (0xF3 byte) used as opcode extension.
93 * \334 - LOCK prefix used instead of REX.R
94 * \335 - disassemble a rep (0xF3 byte) prefix as repe not rep.
95 * \336 - force a REP(E) prefix (0xF2) even if not specified.
96 * \337 - force a REPNE prefix (0xF3) even if not specified.
97 * \336-\337 are still listed as prefixes in the disassembler.
98 * \340 - reserve <operand 0> bytes of uninitialized storage.
99 * Operand 0 had better be a segmentless constant.
100 * \344,\345 - the PUSH/POP (respectively) codes for CS, DS, ES, SS
101 * (POP is never used for CS) depending on operand 0
102 * \346,\347 - the second byte of PUSH/POP codes for FS, GS, depending
104 * \360 - no SSE prefix (== \364\331)
105 * \361 - 66 SSE prefix (== \366\331)
106 * \362 - F2 SSE prefix (== \364\332)
107 * \363 - F3 SSE prefix (== \364\333)
108 * \364 - operand-size prefix (0x66) not permitted
109 * \365 - address-size prefix (0x67) not permitted
110 * \366 - operand-size prefix (0x66) used as opcode extension
111 * \367 - address-size prefix (0x67) used as opcode extension
112 * \370,\371,\372 - match only if operand 0 meets byte jump criteria.
113 * 370 is used for Jcc, 371 is used for JMP.
114 * \373 - assemble 0x03 if bits==16, 0x05 if bits==32;
115 * used for conditional jump over longer jump
118 #include "compiler.h"
122 #include <inttypes.h>
126 #include "assemble.h"
130 /* Initialized to zero by the C standard */
131 static const uint8_t const_zero_buf
[256];
134 int sib_present
; /* is a SIB byte necessary? */
135 int bytes
; /* # of bytes of offset needed */
136 int size
; /* lazy - this is sib+bytes+1 */
137 uint8_t modrm
, sib
, rex
, rip
; /* the bytes themselves */
140 static uint32_t cpu
; /* cpu level received from nasm.c */
141 static efunc errfunc
;
142 static struct ofmt
*outfmt
;
143 static ListGen
*list
;
145 static int64_t calcsize(int32_t, int64_t, int, insn
*, const uint8_t *);
146 static void gencode(int32_t segment
, int64_t offset
, int bits
,
147 insn
* ins
, const struct itemplate
*temp
,
149 static int matches(const struct itemplate
*, insn
*, int bits
);
150 static int32_t regflag(const operand
*);
151 static int32_t regval(const operand
*);
152 static int rexflags(int, int32_t, int);
153 static int op_rexflags(const operand
*, int);
154 static ea
*process_ea(operand
*, ea
*, int, int, int, int32_t);
155 static void add_asp(insn
*, int);
157 static int has_prefix(insn
* ins
, enum prefix_pos pos
, enum prefixes prefix
)
159 return ins
->prefixes
[pos
] == prefix
;
162 static void assert_no_prefix(insn
* ins
, enum prefix_pos pos
)
164 if (ins
->prefixes
[pos
])
165 errfunc(ERR_NONFATAL
, "invalid %s prefix",
166 prefix_name(ins
->prefixes
[pos
]));
169 static const char *size_name(int size
)
191 static void warn_overflow(int size
, const struct operand
*o
)
193 if (size
< 8 && o
->wrt
== NO_SEG
&& o
->segment
== NO_SEG
) {
194 int64_t lim
= ((int64_t)1 << (size
*8))-1;
195 int64_t data
= o
->offset
;
197 if (data
< ~lim
|| data
> lim
)
198 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
199 "%s data exceeds bounds", size_name(size
));
203 * This routine wrappers the real output format's output routine,
204 * in order to pass a copy of the data off to the listing file
205 * generator at the same time.
207 static void out(int64_t offset
, int32_t segto
, const void *data
,
208 enum out_type type
, uint64_t size
,
209 int32_t segment
, int32_t wrt
)
211 static int32_t lineno
= 0; /* static!!! */
212 static char *lnfname
= NULL
;
215 if (type
== OUT_ADDRESS
&& segment
== NO_SEG
&& wrt
== NO_SEG
) {
217 * This is a non-relocated address, and we're going to
218 * convert it into RAWDATA format.
223 errfunc(ERR_PANIC
, "OUT_ADDRESS with size > 8");
227 WRITEADDR(q
, *(int64_t *)data
, size
);
232 list
->output(offset
, data
, type
, size
);
235 * this call to src_get determines when we call the
236 * debug-format-specific "linenum" function
237 * it updates lineno and lnfname to the current values
238 * returning 0 if "same as last time", -2 if lnfname
239 * changed, and the amount by which lineno changed,
240 * if it did. thus, these variables must be static
243 if (src_get(&lineno
, &lnfname
)) {
244 outfmt
->current_dfmt
->linenum(lnfname
, lineno
, segto
);
247 outfmt
->output(segto
, data
, type
, size
, segment
, wrt
);
250 static bool jmp_match(int32_t segment
, int64_t offset
, int bits
,
251 insn
* ins
, const uint8_t *code
)
256 if ((c
!= 0370 && c
!= 0371) || (ins
->oprs
[0].type
& STRICT
))
260 if (optimizing
< 0 && c
== 0371)
263 isize
= calcsize(segment
, offset
, bits
, ins
, code
);
264 if (ins
->oprs
[0].segment
!= segment
)
267 isize
= ins
->oprs
[0].offset
- offset
- isize
; /* isize is delta */
268 return (isize
>= -128 && isize
<= 127); /* is it byte size? */
271 int64_t assemble(int32_t segment
, int64_t offset
, int bits
, uint32_t cp
,
272 insn
* instruction
, struct ofmt
*output
, efunc error
,
275 const struct itemplate
*temp
;
280 int64_t start
= offset
;
281 int64_t wsize
= 0; /* size for DB etc. */
283 errfunc
= error
; /* to pass to other functions */
285 outfmt
= output
; /* likewise */
286 list
= listgen
; /* and again */
288 switch (instruction
->opcode
) {
318 int32_t t
= instruction
->times
;
321 "instruction->times < 0 (%ld) in assemble()", t
);
323 while (t
--) { /* repeat TIMES times */
324 for (e
= instruction
->eops
; e
; e
= e
->next
) {
325 if (e
->type
== EOT_DB_NUMBER
) {
327 if (e
->segment
!= NO_SEG
)
328 errfunc(ERR_NONFATAL
,
329 "one-byte relocation attempted");
331 uint8_t out_byte
= e
->offset
;
332 out(offset
, segment
, &out_byte
,
333 OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
335 } else if (wsize
> 8) {
336 errfunc(ERR_NONFATAL
,
337 "integer supplied to a DT, DO or DY"
340 out(offset
, segment
, &e
->offset
,
341 OUT_ADDRESS
, wsize
, e
->segment
, e
->wrt
);
343 } else if (e
->type
== EOT_DB_STRING
||
344 e
->type
== EOT_DB_STRING_FREE
) {
347 out(offset
, segment
, e
->stringval
,
348 OUT_RAWDATA
, e
->stringlen
, NO_SEG
, NO_SEG
);
349 align
= e
->stringlen
% wsize
;
352 align
= wsize
- align
;
353 out(offset
, segment
, const_zero_buf
,
354 OUT_RAWDATA
, align
, NO_SEG
, NO_SEG
);
356 offset
+= e
->stringlen
+ align
;
359 if (t
> 0 && t
== instruction
->times
- 1) {
361 * Dummy call to list->output to give the offset to the
364 list
->output(offset
, NULL
, OUT_RAWDATA
, 0);
365 list
->uplevel(LIST_TIMES
);
368 if (instruction
->times
> 1)
369 list
->downlevel(LIST_TIMES
);
370 return offset
- start
;
373 if (instruction
->opcode
== I_INCBIN
) {
374 const char *fname
= instruction
->eops
->stringval
;
377 fp
= fopen(fname
, "rb");
379 error(ERR_NONFATAL
, "`incbin': unable to open file `%s'",
381 } else if (fseek(fp
, 0L, SEEK_END
) < 0) {
382 error(ERR_NONFATAL
, "`incbin': unable to seek on file `%s'",
385 static char buf
[4096];
386 size_t t
= instruction
->times
;
391 if (instruction
->eops
->next
) {
392 base
= instruction
->eops
->next
->offset
;
394 if (instruction
->eops
->next
->next
&&
395 len
> (size_t)instruction
->eops
->next
->next
->offset
)
396 len
= (size_t)instruction
->eops
->next
->next
->offset
;
399 * Dummy call to list->output to give the offset to the
402 list
->output(offset
, NULL
, OUT_RAWDATA
, 0);
403 list
->uplevel(LIST_INCBIN
);
407 fseek(fp
, base
, SEEK_SET
);
411 fread(buf
, 1, (l
> (int32_t) sizeof(buf
) ? (int32_t) sizeof(buf
) : l
),
415 * This shouldn't happen unless the file
416 * actually changes while we are reading
420 "`incbin': unexpected EOF while"
421 " reading file `%s'", fname
);
422 t
= 0; /* Try to exit cleanly */
425 out(offset
, segment
, buf
, OUT_RAWDATA
, m
,
430 list
->downlevel(LIST_INCBIN
);
431 if (instruction
->times
> 1) {
433 * Dummy call to list->output to give the offset to the
436 list
->output(offset
, NULL
, OUT_RAWDATA
, 0);
437 list
->uplevel(LIST_TIMES
);
438 list
->downlevel(LIST_TIMES
);
441 return instruction
->times
* len
;
443 return 0; /* if we're here, there's an error */
446 /* Check to see if we need an address-size prefix */
447 add_asp(instruction
, bits
);
451 for (temp
= nasm_instructions
[instruction
->opcode
]; temp
->opcode
!= -1; temp
++){
452 int m
= matches(temp
, instruction
, bits
);
454 (m
== 99 && jmp_match(segment
, offset
, bits
,
455 instruction
, temp
->code
))) {
457 int64_t insn_size
= calcsize(segment
, offset
, bits
,
458 instruction
, temp
->code
);
459 itimes
= instruction
->times
;
460 if (insn_size
< 0) /* shouldn't be, on pass two */
461 error(ERR_PANIC
, "errors made it through from pass one");
464 for (j
= 0; j
< MAXPREFIX
; j
++) {
466 switch (instruction
->prefixes
[j
]) {
481 error(ERR_WARNING
| ERR_PASS2
,
482 "cs segment base generated, but will be ignored in 64-bit mode");
488 error(ERR_WARNING
| ERR_PASS2
,
489 "ds segment base generated, but will be ignored in 64-bit mode");
495 error(ERR_WARNING
| ERR_PASS2
,
496 "es segment base generated, but will be ignored in 64-bit mode");
508 error(ERR_WARNING
| ERR_PASS2
,
509 "ss segment base generated, but will be ignored in 64-bit mode");
516 "segr6 and segr7 cannot be used as prefixes");
521 "16-bit addressing is not supported "
523 } else if (bits
!= 16)
533 "64-bit addressing is only supported "
557 error(ERR_PANIC
, "invalid instruction prefix");
560 out(offset
, segment
, &c
, OUT_RAWDATA
, 1,
565 insn_end
= offset
+ insn_size
;
566 gencode(segment
, offset
, bits
, instruction
,
569 if (itimes
> 0 && itimes
== instruction
->times
- 1) {
571 * Dummy call to list->output to give the offset to the
574 list
->output(offset
, NULL
, OUT_RAWDATA
, 0);
575 list
->uplevel(LIST_TIMES
);
578 if (instruction
->times
> 1)
579 list
->downlevel(LIST_TIMES
);
580 return offset
- start
;
581 } else if (m
> 0 && m
> size_prob
) {
586 if (temp
->opcode
== -1) { /* didn't match any instruction */
589 error(ERR_NONFATAL
, "operation size not specified");
592 error(ERR_NONFATAL
, "mismatch in operand sizes");
595 error(ERR_NONFATAL
, "no instruction for this cpu level");
598 error(ERR_NONFATAL
, "instruction not supported in 64-bit mode");
602 "invalid combination of opcode and operands");
609 int64_t insn_size(int32_t segment
, int64_t offset
, int bits
, uint32_t cp
,
610 insn
* instruction
, efunc error
)
612 const struct itemplate
*temp
;
614 errfunc
= error
; /* to pass to other functions */
617 if (instruction
->opcode
== -1)
620 if (instruction
->opcode
== I_DB
|| instruction
->opcode
== I_DW
||
621 instruction
->opcode
== I_DD
|| instruction
->opcode
== I_DQ
||
622 instruction
->opcode
== I_DT
|| instruction
->opcode
== I_DO
||
623 instruction
->opcode
== I_DY
) {
625 int32_t isize
, osize
, wsize
= 0; /* placate gcc */
628 switch (instruction
->opcode
) {
654 for (e
= instruction
->eops
; e
; e
= e
->next
) {
658 if (e
->type
== EOT_DB_NUMBER
)
660 else if (e
->type
== EOT_DB_STRING
||
661 e
->type
== EOT_DB_STRING_FREE
)
662 osize
= e
->stringlen
;
664 align
= (-osize
) % wsize
;
667 isize
+= osize
+ align
;
669 return isize
* instruction
->times
;
672 if (instruction
->opcode
== I_INCBIN
) {
673 const char *fname
= instruction
->eops
->stringval
;
677 fp
= fopen(fname
, "rb");
679 error(ERR_NONFATAL
, "`incbin': unable to open file `%s'",
681 else if (fseek(fp
, 0L, SEEK_END
) < 0)
682 error(ERR_NONFATAL
, "`incbin': unable to seek on file `%s'",
687 if (instruction
->eops
->next
) {
688 len
-= instruction
->eops
->next
->offset
;
689 if (instruction
->eops
->next
->next
&&
690 len
> (size_t)instruction
->eops
->next
->next
->offset
) {
691 len
= (size_t)instruction
->eops
->next
->next
->offset
;
694 return instruction
->times
* len
;
696 return 0; /* if we're here, there's an error */
699 /* Check to see if we need an address-size prefix */
700 add_asp(instruction
, bits
);
702 for (temp
= nasm_instructions
[instruction
->opcode
]; temp
->opcode
!= -1; temp
++) {
703 int m
= matches(temp
, instruction
, bits
);
705 (m
== 99 && jmp_match(segment
, offset
, bits
,
706 instruction
, temp
->code
))) {
707 /* we've matched an instruction. */
709 const uint8_t *codes
= temp
->code
;
712 isize
= calcsize(segment
, offset
, bits
, instruction
, codes
);
715 for (j
= 0; j
< MAXPREFIX
; j
++) {
716 switch (instruction
->prefixes
[j
]) {
742 return isize
* instruction
->times
;
745 return -1; /* didn't match any instruction */
748 static bool possible_sbyte(operand
*o
)
750 return o
->wrt
== NO_SEG
&& o
->segment
== NO_SEG
&&
751 !(o
->opflags
& OPFLAG_FORWARD
) &&
752 optimizing
>= 0 && !(o
->type
& STRICT
);
755 /* check that opn[op] is a signed byte of size 16 or 32 */
756 static bool is_sbyte16(operand
*o
)
760 if (!possible_sbyte(o
))
764 return v
>= -128 && v
<= 127;
767 static bool is_sbyte32(operand
*o
)
771 if (!possible_sbyte(o
))
775 return v
>= -128 && v
<= 127;
778 /* Common construct */
779 #define case4(x) case (x): case (x)+1: case (x)+2: case (x)+3
781 static int64_t calcsize(int32_t segment
, int64_t offset
, int bits
,
782 insn
* ins
, const uint8_t *codes
)
789 ins
->rex
= 0; /* Ensure REX is reset */
791 if (ins
->prefixes
[PPS_OSIZE
] == P_O64
)
794 (void)segment
; /* Don't warn that this parameter is unused */
795 (void)offset
; /* Don't warn that this parameter is unused */
799 opx
= &ins
->oprs
[c
& 3];
804 codes
+= c
, length
+= c
;
809 op_rexflags(opx
, REX_B
|REX_H
|REX_P
|REX_W
);
824 if (opx
->type
& (BITS16
| BITS32
| BITS64
))
825 length
+= (opx
->type
& BITS16
) ? 2 : 4;
827 length
+= (bits
== 16) ? 2 : 4;
835 length
+= ins
->addr_size
>> 3;
843 length
+= 8; /* MOV reg64/imm */
851 if (opx
->type
& (BITS16
| BITS32
| BITS64
))
852 length
+= (opx
->type
& BITS16
) ? 2 : 4;
854 length
+= (bits
== 16) ? 2 : 4;
866 length
+= is_sbyte16(opx
) ? 1 : 2;
875 length
+= is_sbyte32(opx
) ? 1 : 4;
886 ins
->drexdst
= regval(opx
);
891 ins
->rex
|= REX_D
|REX_OC
;
892 ins
->drexdst
= regval(opx
);
906 length
+= is_sbyte32(opx
) ? 1 : 4;
915 ins
->drexdst
= regval(opx
);
916 ins
->vex_m
= *codes
++;
917 ins
->vex_wlp
= *codes
++;
923 ins
->vex_m
= *codes
++;
924 ins
->vex_wlp
= *codes
++;
937 length
+= (bits
!= 16) && !has_prefix(ins
, PPS_ASIZE
, P_A16
);
941 length
+= (bits
!= 32) && !has_prefix(ins
, PPS_ASIZE
, P_A32
);
948 if (bits
!= 64 || has_prefix(ins
, PPS_ASIZE
, P_A16
) ||
949 has_prefix(ins
, PPS_ASIZE
, P_A32
))
957 length
+= (bits
!= 16);
961 length
+= (bits
== 16);
995 if (!ins
->prefixes
[PPS_LREP
])
996 ins
->prefixes
[PPS_LREP
] = P_REP
;
1000 if (!ins
->prefixes
[PPS_LREP
])
1001 ins
->prefixes
[PPS_LREP
] = P_REPNE
;
1005 if (ins
->oprs
[0].segment
!= NO_SEG
)
1006 errfunc(ERR_NONFATAL
, "attempt to reserve non-constant"
1007 " quantity of BSS space");
1009 length
+= ins
->oprs
[0].offset
;
1059 ea_data
.rex
= 0; /* Ensure ea.REX is initially 0 */
1062 /* pick rfield from operand b */
1063 rflags
= regflag(&ins
->oprs
[c
& 7]);
1064 rfield
= nasm_regvals
[ins
->oprs
[c
& 7].basereg
];
1071 (&ins
->oprs
[(c
>> 3) & 7], &ea_data
, bits
,
1072 ins
->addr_size
, rfield
, rflags
)) {
1073 errfunc(ERR_NONFATAL
, "invalid effective address");
1076 ins
->rex
|= ea_data
.rex
;
1077 length
+= ea_data
.size
;
1083 errfunc(ERR_PANIC
, "internal instruction table corrupt"
1084 ": instruction code 0x%02X given", c
);
1089 ins
->rex
&= rex_mask
;
1091 if (ins
->rex
& REX_V
) {
1092 int bad32
= REX_R
|REX_W
|REX_X
|REX_B
;
1094 if (ins
->rex
& REX_H
) {
1095 errfunc(ERR_NONFATAL
, "cannot use high register in vex instruction");
1098 switch (ins
->vex_wlp
& 030) {
1112 if (bits
!= 64 && ((ins
->rex
& bad32
) || ins
->drexdst
> 7)) {
1113 errfunc(ERR_NONFATAL
, "invalid operands in non-64-bit mode");
1116 if (ins
->vex_m
!= 1 || (ins
->rex
& (REX_W
|REX_R
|REX_B
)))
1120 } else if (ins
->rex
& REX_D
) {
1121 if (ins
->rex
& REX_H
) {
1122 errfunc(ERR_NONFATAL
, "cannot use high register in drex instruction");
1125 if (bits
!= 64 && ((ins
->rex
& (REX_R
|REX_W
|REX_X
|REX_B
)) ||
1126 ins
->drexdst
> 7)) {
1127 errfunc(ERR_NONFATAL
, "invalid operands in non-64-bit mode");
1131 } else if (ins
->rex
& REX_REAL
) {
1132 if (ins
->rex
& REX_H
) {
1133 errfunc(ERR_NONFATAL
, "cannot use high register in rex instruction");
1135 } else if (bits
== 64) {
1137 } else if ((ins
->rex
& REX_L
) &&
1138 !(ins
->rex
& (REX_P
|REX_W
|REX_X
|REX_B
)) &&
1141 assert_no_prefix(ins
, PPS_LREP
);
1144 errfunc(ERR_NONFATAL
, "invalid operands in non-64-bit mode");
1152 #define EMIT_REX() \
1153 if (!(ins->rex & (REX_D|REX_V)) && (ins->rex & REX_REAL) && (bits == 64)) { \
1154 ins->rex = (ins->rex & REX_REAL)|REX_P; \
1155 out(offset, segment, &ins->rex, OUT_RAWDATA, 1, NO_SEG, NO_SEG); \
1160 static void gencode(int32_t segment
, int64_t offset
, int bits
,
1161 insn
* ins
, const struct itemplate
*temp
,
1164 static char condval
[] = { /* conditional opcodes */
1165 0x7, 0x3, 0x2, 0x6, 0x2, 0x4, 0xF, 0xD, 0xC, 0xE, 0x6, 0x2,
1166 0x3, 0x7, 0x3, 0x5, 0xE, 0xC, 0xD, 0xF, 0x1, 0xB, 0x9, 0x5,
1167 0x0, 0xA, 0xA, 0xB, 0x8, 0x4
1173 struct operand
*opx
;
1174 const uint8_t *codes
= temp
->code
;
1178 opx
= &ins
->oprs
[c
& 3];
1184 out(offset
, segment
, codes
, OUT_RAWDATA
, c
, NO_SEG
, NO_SEG
);
1191 bytes
[0] = *codes
++ + ((regval(opx
)) & 7);
1192 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1197 /* The test for BITS8 and SBYTE here is intended to avoid
1198 warning on optimizer actions due to SBYTE, while still
1199 warn on explicit BYTE directives. Also warn, obviously,
1200 if the optimizer isn't enabled. */
1201 if (((opx
->type
& BITS8
) ||
1202 !(opx
->type
& temp
->opd
[c
& 3] & BYTENESS
)) &&
1203 (opx
->offset
< -128 || opx
->offset
> 127)) {
1204 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1205 "signed byte value exceeds bounds");
1207 if (opx
->segment
!= NO_SEG
) {
1209 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1210 opx
->segment
, opx
->wrt
);
1212 bytes
[0] = opx
->offset
;
1213 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1220 if (opx
->offset
< -256 || opx
->offset
> 255) {
1221 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1222 "byte value exceeds bounds");
1224 if (opx
->segment
!= NO_SEG
) {
1226 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1227 opx
->segment
, opx
->wrt
);
1229 bytes
[0] = opx
->offset
;
1230 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1237 if (opx
->offset
< 0 || opx
->offset
> 255)
1238 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1239 "unsigned byte value exceeds bounds");
1240 if (opx
->segment
!= NO_SEG
) {
1242 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1243 opx
->segment
, opx
->wrt
);
1245 bytes
[0] = opx
->offset
;
1246 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1253 warn_overflow(2, opx
);
1255 out(offset
, segment
, &data
, OUT_ADDRESS
, 2,
1256 opx
->segment
, opx
->wrt
);
1261 if (opx
->type
& (BITS16
| BITS32
))
1262 size
= (opx
->type
& BITS16
) ? 2 : 4;
1264 size
= (bits
== 16) ? 2 : 4;
1265 warn_overflow(size
, opx
);
1267 out(offset
, segment
, &data
, OUT_ADDRESS
, size
,
1268 opx
->segment
, opx
->wrt
);
1273 warn_overflow(4, opx
);
1275 out(offset
, segment
, &data
, OUT_ADDRESS
, 4,
1276 opx
->segment
, opx
->wrt
);
1282 size
= ins
->addr_size
>> 3;
1283 warn_overflow(size
, opx
);
1284 out(offset
, segment
, &data
, OUT_ADDRESS
, size
,
1285 opx
->segment
, opx
->wrt
);
1290 if (opx
->segment
!= segment
)
1291 errfunc(ERR_NONFATAL
,
1292 "short relative jump outside segment");
1293 data
= opx
->offset
- insn_end
;
1294 if (data
> 127 || data
< -128)
1295 errfunc(ERR_NONFATAL
, "short jump is out of range");
1297 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1302 data
= (int64_t)opx
->offset
;
1303 out(offset
, segment
, &data
, OUT_ADDRESS
, 8,
1304 opx
->segment
, opx
->wrt
);
1309 if (opx
->segment
!= segment
) {
1311 out(offset
, segment
, &data
,
1312 OUT_REL2ADR
, insn_end
- offset
,
1313 opx
->segment
, opx
->wrt
);
1315 data
= opx
->offset
- insn_end
;
1316 out(offset
, segment
, &data
,
1317 OUT_ADDRESS
, 2, NO_SEG
, NO_SEG
);
1323 if (opx
->type
& (BITS16
| BITS32
| BITS64
))
1324 size
= (opx
->type
& BITS16
) ? 2 : 4;
1326 size
= (bits
== 16) ? 2 : 4;
1327 if (opx
->segment
!= segment
) {
1329 out(offset
, segment
, &data
,
1330 size
== 2 ? OUT_REL2ADR
: OUT_REL4ADR
,
1331 insn_end
- offset
, opx
->segment
, opx
->wrt
);
1333 data
= opx
->offset
- insn_end
;
1334 out(offset
, segment
, &data
,
1335 OUT_ADDRESS
, size
, NO_SEG
, NO_SEG
);
1341 if (opx
->segment
!= segment
) {
1343 out(offset
, segment
, &data
,
1344 OUT_REL4ADR
, insn_end
- offset
,
1345 opx
->segment
, opx
->wrt
);
1347 data
= opx
->offset
- insn_end
;
1348 out(offset
, segment
, &data
,
1349 OUT_ADDRESS
, 4, NO_SEG
, NO_SEG
);
1355 if (opx
->segment
== NO_SEG
)
1356 errfunc(ERR_NONFATAL
, "value referenced by FAR is not"
1359 out(offset
, segment
, &data
, OUT_ADDRESS
, 2,
1360 outfmt
->segbase(1 + opx
->segment
),
1367 warn_overflow(2, opx
);
1368 if (is_sbyte16(opx
)) {
1370 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1374 out(offset
, segment
, &data
, OUT_ADDRESS
, 2,
1375 opx
->segment
, opx
->wrt
);
1382 bytes
[0] = *codes
++;
1383 if (is_sbyte16(opx
))
1384 bytes
[0] |= 2; /* s-bit */
1385 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1391 warn_overflow(4, opx
);
1392 if (is_sbyte32(opx
)) {
1394 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1398 out(offset
, segment
, &data
, OUT_ADDRESS
, 4,
1399 opx
->segment
, opx
->wrt
);
1406 bytes
[0] = *codes
++;
1407 if (is_sbyte32(opx
))
1408 bytes
[0] |= 2; /* s-bit */
1409 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1419 (ins
->drexdst
<< 4) |
1420 (ins
->rex
& REX_OC
? 0x08 : 0) |
1421 (ins
->rex
& (REX_R
|REX_X
|REX_B
));
1423 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1429 opx
= &ins
->oprs
[c
>> 3];
1430 bytes
[0] = nasm_regvals
[opx
->basereg
] << 4;
1431 opx
= &ins
->oprs
[c
& 7];
1432 if (opx
->segment
!= NO_SEG
|| opx
->wrt
!= NO_SEG
) {
1433 errfunc(ERR_NONFATAL
,
1434 "non-absolute expression not permitted as argument %d",
1437 if (opx
->offset
& ~15) {
1438 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1439 "four-bit argument exceeds bounds");
1441 bytes
[0] |= opx
->offset
& 15;
1443 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1449 opx
= &ins
->oprs
[c
>> 4];
1450 bytes
[0] = nasm_regvals
[opx
->basereg
] << 4;
1452 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1458 opx
= &ins
->oprs
[c
];
1459 bytes
[0] = nasm_regvals
[opx
->basereg
] << 4;
1460 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1466 if (opx
->wrt
== NO_SEG
&& opx
->segment
== NO_SEG
&&
1467 (int32_t)data
!= (int64_t)data
) {
1468 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1469 "signed dword immediate exceeds bounds");
1471 if (is_sbyte32(opx
)) {
1473 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1477 out(offset
, segment
, &data
, OUT_ADDRESS
, 4,
1478 opx
->segment
, opx
->wrt
);
1485 if (opx
->wrt
== NO_SEG
&& opx
->segment
== NO_SEG
&&
1486 (int32_t)data
!= (int64_t)data
) {
1487 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1488 "signed dword immediate exceeds bounds");
1490 out(offset
, segment
, &data
, OUT_ADDRESS
, 4,
1491 opx
->segment
, opx
->wrt
);
1498 if (ins
->vex_m
!= 1 || (ins
->rex
& (REX_W
|REX_X
|REX_B
))) {
1500 bytes
[1] = ins
->vex_m
| ((~ins
->rex
& 7) << 5);
1501 bytes
[2] = ((ins
->rex
& REX_W
) << (7-3)) |
1502 ((~ins
->drexdst
& 15)<< 3) | (ins
->vex_wlp
& 07);
1503 out(offset
, segment
, &bytes
, OUT_RAWDATA
, 3, NO_SEG
, NO_SEG
);
1507 bytes
[1] = ((~ins
->rex
& REX_R
) << (7-2)) |
1508 ((~ins
->drexdst
& 15) << 3) | (ins
->vex_wlp
& 07);
1509 out(offset
, segment
, &bytes
, OUT_RAWDATA
, 2, NO_SEG
, NO_SEG
);
1519 if (ins
->rex
& REX_W
)
1521 else if (ins
->prefixes
[PPS_OSIZE
] == P_O16
)
1523 else if (ins
->prefixes
[PPS_OSIZE
] == P_O32
)
1528 um
= (uint64_t)2 << (s
-1);
1531 if (uv
> 127 && uv
< (uint64_t)-128 &&
1532 (uv
< um
-128 || uv
> um
-1)) {
1533 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1534 "signed byte value exceeds bounds");
1536 if (opx
->segment
!= NO_SEG
) {
1538 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1539 opx
->segment
, opx
->wrt
);
1542 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1553 if (bits
== 32 && !has_prefix(ins
, PPS_ASIZE
, P_A16
)) {
1555 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1562 if (bits
!= 32 && !has_prefix(ins
, PPS_ASIZE
, P_A32
)) {
1564 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1583 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1592 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1607 *bytes
= *codes
++ ^ condval
[ins
->condition
];
1608 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1617 *bytes
= c
- 0332 + 0xF2;
1618 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1623 if (ins
->rex
& REX_R
) {
1625 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1628 ins
->rex
&= ~(REX_L
|REX_R
);
1639 if (ins
->oprs
[0].segment
!= NO_SEG
)
1640 errfunc(ERR_PANIC
, "non-constant BSS size in pass two");
1642 int64_t size
= ins
->oprs
[0].offset
;
1644 out(offset
, segment
, NULL
,
1645 OUT_RESERVE
, size
, NO_SEG
, NO_SEG
);
1653 switch (ins
->oprs
[0].basereg
) {
1668 "bizarre 8086 segment register received");
1670 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1677 switch (ins
->oprs
[0].basereg
) {
1686 "bizarre 386 segment register received");
1688 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1697 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1703 bytes
[0] = c
- 0362 + 0xf2;
1704 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1714 *bytes
= c
- 0366 + 0x66;
1715 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1725 *bytes
= bits
== 16 ? 3 : 5;
1726 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1751 /* pick rfield from operand b */
1752 rflags
= regflag(&ins
->oprs
[c
& 7]);
1753 rfield
= nasm_regvals
[ins
->oprs
[c
& 7].basereg
];
1755 /* rfield is constant */
1761 (&ins
->oprs
[(c
>> 3) & 7], &ea_data
, bits
,
1762 ins
->addr_size
, rfield
, rflags
)) {
1763 errfunc(ERR_NONFATAL
, "invalid effective address");
1768 *p
++ = ea_data
.modrm
;
1769 if (ea_data
.sib_present
)
1772 /* DREX suffixes come between the SIB and the displacement */
1773 if (ins
->rex
& REX_D
) {
1775 (ins
->drexdst
<< 4) |
1776 (ins
->rex
& REX_OC
? 0x08 : 0) |
1777 (ins
->rex
& (REX_R
|REX_X
|REX_B
));
1782 out(offset
, segment
, bytes
, OUT_RAWDATA
, s
, NO_SEG
, NO_SEG
);
1785 * Make sure the address gets the right offset in case
1786 * the line breaks in the .lst file (BR 1197827)
1791 switch (ea_data
.bytes
) {
1795 if (ins
->oprs
[(c
>> 3) & 7].segment
!= NO_SEG
) {
1796 data
= ins
->oprs
[(c
>> 3) & 7].offset
;
1797 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1798 ins
->oprs
[(c
>> 3) & 7].segment
,
1799 ins
->oprs
[(c
>> 3) & 7].wrt
);
1801 *bytes
= ins
->oprs
[(c
>> 3) & 7].offset
;
1802 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1,
1810 data
= ins
->oprs
[(c
>> 3) & 7].offset
;
1811 warn_overflow(ea_data
.bytes
, opx
);
1814 data
-= insn_end
- (offset
+ea_data
.bytes
);
1819 out(offset
, segment
, &data
, type
, ea_data
.bytes
,
1820 ins
->oprs
[(c
>> 3) & 7].segment
,
1821 ins
->oprs
[(c
>> 3) & 7].wrt
);
1829 errfunc(ERR_PANIC
, "internal instruction table corrupt"
1830 ": instruction code 0x%02X given", c
);
1836 static int32_t regflag(const operand
* o
)
1838 if (o
->basereg
< EXPR_REG_START
|| o
->basereg
>= REG_ENUM_LIMIT
) {
1839 errfunc(ERR_PANIC
, "invalid operand passed to regflag()");
1841 return nasm_reg_flags
[o
->basereg
];
1844 static int32_t regval(const operand
* o
)
1846 if (o
->basereg
< EXPR_REG_START
|| o
->basereg
>= REG_ENUM_LIMIT
) {
1847 errfunc(ERR_PANIC
, "invalid operand passed to regval()");
1849 return nasm_regvals
[o
->basereg
];
1852 static int op_rexflags(const operand
* o
, int mask
)
1857 if (o
->basereg
< EXPR_REG_START
|| o
->basereg
>= REG_ENUM_LIMIT
) {
1858 errfunc(ERR_PANIC
, "invalid operand passed to op_rexflags()");
1861 flags
= nasm_reg_flags
[o
->basereg
];
1862 val
= nasm_regvals
[o
->basereg
];
1864 return rexflags(val
, flags
, mask
);
1867 static int rexflags(int val
, int32_t flags
, int mask
)
1872 rex
|= REX_B
|REX_X
|REX_R
;
1875 if (!(REG_HIGH
& ~flags
)) /* AH, CH, DH, BH */
1877 else if (!(REG8
& ~flags
) && val
>= 4) /* SPL, BPL, SIL, DIL */
1883 static int matches(const struct itemplate
*itemp
, insn
* instruction
, int bits
)
1885 int i
, size
[MAX_OPERANDS
], asize
, oprs
, ret
;
1892 if (itemp
->opcode
!= instruction
->opcode
)
1896 * Count the operands
1898 if (itemp
->operands
!= instruction
->operands
)
1902 * Check that no spurious colons or TOs are present
1904 for (i
= 0; i
< itemp
->operands
; i
++)
1905 if (instruction
->oprs
[i
].type
& ~itemp
->opd
[i
] & (COLON
| TO
))
1909 * Process size flags
1911 if (itemp
->flags
& IF_ARMASK
) {
1912 memset(size
, 0, sizeof size
);
1914 i
= ((itemp
->flags
& IF_ARMASK
) >> IF_ARSHFT
) - 1;
1916 switch (itemp
->flags
& IF_SMASK
) {
1953 switch (itemp
->flags
& IF_SMASK
) {
1988 for (i
= 0; i
< MAX_OPERANDS
; i
++)
1993 * Check that the operand flags all match up
1995 for (i
= 0; i
< itemp
->operands
; i
++) {
1996 int32_t type
= instruction
->oprs
[i
].type
;
1997 if (!(type
& SIZE_MASK
))
2000 if (itemp
->opd
[i
] & SAME_AS
) {
2001 int j
= itemp
->opd
[i
] & ~SAME_AS
;
2002 if (type
!= instruction
->oprs
[j
].type
||
2003 instruction
->oprs
[i
].basereg
!= instruction
->oprs
[j
].basereg
)
2005 } else if (itemp
->opd
[i
] & ~type
||
2006 ((itemp
->opd
[i
] & SIZE_MASK
) &&
2007 ((itemp
->opd
[i
] ^ type
) & SIZE_MASK
))) {
2008 if ((itemp
->opd
[i
] & ~type
& ~SIZE_MASK
) ||
2017 * Check operand sizes
2019 if (itemp
->flags
& (IF_SM
| IF_SM2
)) {
2020 oprs
= (itemp
->flags
& IF_SM2
? 2 : itemp
->operands
);
2022 for (i
= 0; i
< oprs
; i
++) {
2023 if ((asize
= itemp
->opd
[i
] & SIZE_MASK
) != 0) {
2025 for (j
= 0; j
< oprs
; j
++)
2031 oprs
= itemp
->operands
;
2034 for (i
= 0; i
< itemp
->operands
; i
++) {
2035 if (!(itemp
->opd
[i
] & SIZE_MASK
) &&
2036 (instruction
->oprs
[i
].type
& SIZE_MASK
& ~size
[i
]))
2041 * Check template is okay at the set cpu level
2043 if (((itemp
->flags
& IF_PLEVEL
) > cpu
))
2047 * Check if instruction is available in long mode
2049 if ((itemp
->flags
& IF_NOLONG
) && (bits
== 64))
2053 * Check if special handling needed for Jumps
2055 if ((uint8_t)(itemp
->code
[0]) >= 0370)
2061 static ea
*process_ea(operand
* input
, ea
* output
, int bits
,
2062 int addrbits
, int rfield
, int32_t rflags
)
2064 bool forw_ref
= !!(input
->opflags
& OPFLAG_FORWARD
);
2066 output
->rip
= false;
2068 /* REX flags for the rfield operand */
2069 output
->rex
|= rexflags(rfield
, rflags
, REX_R
|REX_P
|REX_W
|REX_H
);
2071 if (!(REGISTER
& ~input
->type
)) { /* register direct */
2075 if (input
->basereg
< EXPR_REG_START
/* Verify as Register */
2076 || input
->basereg
>= REG_ENUM_LIMIT
)
2079 i
= nasm_regvals
[input
->basereg
];
2082 return NULL
; /* Invalid EA register */
2084 output
->rex
|= op_rexflags(input
, REX_B
|REX_P
|REX_W
|REX_H
);
2086 output
->sib_present
= false; /* no SIB necessary */
2087 output
->bytes
= 0; /* no offset necessary either */
2088 output
->modrm
= 0xC0 | ((rfield
& 7) << 3) | (i
& 7);
2089 } else { /* it's a memory reference */
2090 if (input
->basereg
== -1
2091 && (input
->indexreg
== -1 || input
->scale
== 0)) {
2092 /* it's a pure offset */
2093 if (bits
== 64 && (~input
->type
& IP_REL
)) {
2094 int scale
, index
, base
;
2095 output
->sib_present
= true;
2099 output
->sib
= (scale
<< 6) | (index
<< 3) | base
;
2101 output
->modrm
= 4 | ((rfield
& 7) << 3);
2102 output
->rip
= false;
2104 output
->sib_present
= false;
2105 output
->bytes
= (addrbits
!= 16 ? 4 : 2);
2106 output
->modrm
= (addrbits
!= 16 ? 5 : 6) | ((rfield
& 7) << 3);
2107 output
->rip
= bits
== 64;
2109 } else { /* it's an indirection */
2110 int i
= input
->indexreg
, b
= input
->basereg
, s
= input
->scale
;
2111 int32_t o
= input
->offset
, seg
= input
->segment
;
2112 int hb
= input
->hintbase
, ht
= input
->hinttype
;
2115 int32_t ix
, bx
; /* register flags */
2118 i
= -1; /* make this easy, at least */
2120 if (i
>= EXPR_REG_START
&& i
< REG_ENUM_LIMIT
) {
2121 it
= nasm_regvals
[i
];
2122 ix
= nasm_reg_flags
[i
];
2128 if (b
>= EXPR_REG_START
&& b
< REG_ENUM_LIMIT
) {
2129 bt
= nasm_regvals
[b
];
2130 bx
= nasm_reg_flags
[b
];
2136 /* check for a 32/64-bit memory reference... */
2137 if ((ix
|bx
) & (BITS32
|BITS64
)) {
2138 /* it must be a 32/64-bit memory reference. Firstly we have
2139 * to check that all registers involved are type E/Rxx. */
2140 int32_t sok
= BITS32
|BITS64
;
2143 if (!(REG64
& ~ix
) || !(REG32
& ~ix
))
2151 return NULL
; /* Invalid register */
2152 if (~sok
& bx
& SIZE_MASK
)
2153 return NULL
; /* Invalid size */
2157 /* While we're here, ensure the user didn't specify
2159 if (input
->disp_size
== 16 || input
->disp_size
== 64)
2162 if (addrbits
== 16 ||
2163 (addrbits
== 32 && !(sok
& BITS32
)) ||
2164 (addrbits
== 64 && !(sok
& BITS64
)))
2167 /* now reorganize base/index */
2168 if (s
== 1 && bt
!= it
&& bt
!= -1 && it
!= -1 &&
2169 ((hb
== b
&& ht
== EAH_NOTBASE
)
2170 || (hb
== i
&& ht
== EAH_MAKEBASE
))) {
2171 /* swap if hints say so */
2172 t
= bt
, bt
= it
, it
= t
;
2173 t
= bx
, bx
= ix
, ix
= t
;
2175 if (bt
== it
) /* convert EAX+2*EAX to 3*EAX */
2176 bt
= -1, bx
= 0, s
++;
2177 if (bt
== -1 && s
== 1 && !(hb
== it
&& ht
== EAH_NOTBASE
)) {
2178 /* make single reg base, unless hint */
2179 bt
= it
, bx
= ix
, it
= -1, ix
= 0;
2181 if (((s
== 2 && it
!= REG_NUM_ESP
2182 && !(input
->eaflags
& EAF_TIMESTWO
)) || s
== 3
2183 || s
== 5 || s
== 9) && bt
== -1)
2184 bt
= it
, bx
= ix
, s
--; /* convert 3*EAX to EAX+2*EAX */
2185 if (it
== -1 && (bt
& 7) != REG_NUM_ESP
2186 && (input
->eaflags
& EAF_TIMESTWO
))
2187 it
= bt
, ix
= bx
, bt
= -1, bx
= 0, s
= 1;
2188 /* convert [NOSPLIT EAX] to sib format with 0x0 displacement */
2189 if (s
== 1 && it
== REG_NUM_ESP
) {
2190 /* swap ESP into base if scale is 1 */
2191 t
= it
, it
= bt
, bt
= t
;
2192 t
= ix
, ix
= bx
, bx
= t
;
2194 if (it
== REG_NUM_ESP
2195 || (s
!= 1 && s
!= 2 && s
!= 4 && s
!= 8 && it
!= -1))
2196 return NULL
; /* wrong, for various reasons */
2198 output
->rex
|= rexflags(it
, ix
, REX_X
);
2199 output
->rex
|= rexflags(bt
, bx
, REX_B
);
2201 if (it
== -1 && (bt
& 7) != REG_NUM_ESP
) {
2210 if (rm
!= REG_NUM_EBP
&& o
== 0 &&
2211 seg
== NO_SEG
&& !forw_ref
&&
2213 (EAF_BYTEOFFS
| EAF_WORDOFFS
)))
2215 else if (input
->eaflags
& EAF_BYTEOFFS
||
2216 (o
>= -128 && o
<= 127 && seg
== NO_SEG
2218 && !(input
->eaflags
& EAF_WORDOFFS
)))
2224 output
->sib_present
= false;
2225 output
->bytes
= (bt
== -1 || mod
== 2 ? 4 : mod
);
2226 output
->modrm
= (mod
<< 6) | ((rfield
& 7) << 3) | rm
;
2229 int mod
, scale
, index
, base
;
2249 default: /* then what the smeg is it? */
2250 return NULL
; /* panic */
2258 if (base
!= REG_NUM_EBP
&& o
== 0 &&
2259 seg
== NO_SEG
&& !forw_ref
&&
2261 (EAF_BYTEOFFS
| EAF_WORDOFFS
)))
2263 else if (input
->eaflags
& EAF_BYTEOFFS
||
2264 (o
>= -128 && o
<= 127 && seg
== NO_SEG
2266 && !(input
->eaflags
& EAF_WORDOFFS
)))
2272 output
->sib_present
= true;
2273 output
->bytes
= (bt
== -1 || mod
== 2 ? 4 : mod
);
2274 output
->modrm
= (mod
<< 6) | ((rfield
& 7) << 3) | 4;
2275 output
->sib
= (scale
<< 6) | (index
<< 3) | base
;
2277 } else { /* it's 16-bit */
2280 /* check for 64-bit long mode */
2284 /* check all registers are BX, BP, SI or DI */
2285 if ((b
!= -1 && b
!= R_BP
&& b
!= R_BX
&& b
!= R_SI
2286 && b
!= R_DI
) || (i
!= -1 && i
!= R_BP
&& i
!= R_BX
2287 && i
!= R_SI
&& i
!= R_DI
))
2290 /* ensure the user didn't specify DWORD/QWORD */
2291 if (input
->disp_size
== 32 || input
->disp_size
== 64)
2294 if (s
!= 1 && i
!= -1)
2295 return NULL
; /* no can do, in 16-bit EA */
2296 if (b
== -1 && i
!= -1) {
2301 if ((b
== R_SI
|| b
== R_DI
) && i
!= -1) {
2306 /* have BX/BP as base, SI/DI index */
2308 return NULL
; /* shouldn't ever happen, in theory */
2309 if (i
!= -1 && b
!= -1 &&
2310 (i
== R_BP
|| i
== R_BX
|| b
== R_SI
|| b
== R_DI
))
2311 return NULL
; /* invalid combinations */
2312 if (b
== -1) /* pure offset: handled above */
2313 return NULL
; /* so if it gets to here, panic! */
2317 switch (i
* 256 + b
) {
2318 case R_SI
* 256 + R_BX
:
2321 case R_DI
* 256 + R_BX
:
2324 case R_SI
* 256 + R_BP
:
2327 case R_DI
* 256 + R_BP
:
2345 if (rm
== -1) /* can't happen, in theory */
2346 return NULL
; /* so panic if it does */
2348 if (o
== 0 && seg
== NO_SEG
&& !forw_ref
&& rm
!= 6 &&
2349 !(input
->eaflags
& (EAF_BYTEOFFS
| EAF_WORDOFFS
)))
2351 else if (input
->eaflags
& EAF_BYTEOFFS
||
2352 (o
>= -128 && o
<= 127 && seg
== NO_SEG
2354 && !(input
->eaflags
& EAF_WORDOFFS
)))
2359 output
->sib_present
= false; /* no SIB - it's 16-bit */
2360 output
->bytes
= mod
; /* bytes of offset needed */
2361 output
->modrm
= (mod
<< 6) | ((rfield
& 7) << 3) | rm
;
2366 output
->size
= 1 + output
->sib_present
+ output
->bytes
;
2370 static void add_asp(insn
*ins
, int addrbits
)
2375 valid
= (addrbits
== 64) ? 64|32 : 32|16;
2377 switch (ins
->prefixes
[PPS_ASIZE
]) {
2388 valid
&= (addrbits
== 32) ? 16 : 32;
2394 for (j
= 0; j
< ins
->operands
; j
++) {
2395 if (!(MEMORY
& ~ins
->oprs
[j
].type
)) {
2398 /* Verify as Register */
2399 if (ins
->oprs
[j
].indexreg
< EXPR_REG_START
2400 || ins
->oprs
[j
].indexreg
>= REG_ENUM_LIMIT
)
2403 i
= nasm_reg_flags
[ins
->oprs
[j
].indexreg
];
2405 /* Verify as Register */
2406 if (ins
->oprs
[j
].basereg
< EXPR_REG_START
2407 || ins
->oprs
[j
].basereg
>= REG_ENUM_LIMIT
)
2410 b
= nasm_reg_flags
[ins
->oprs
[j
].basereg
];
2412 if (ins
->oprs
[j
].scale
== 0)
2416 int ds
= ins
->oprs
[j
].disp_size
;
2417 if ((addrbits
!= 64 && ds
> 8) ||
2418 (addrbits
== 64 && ds
== 16))
2438 if (valid
& addrbits
) {
2439 ins
->addr_size
= addrbits
;
2440 } else if (valid
& ((addrbits
== 32) ? 16 : 32)) {
2441 /* Add an address size prefix */
2442 enum prefixes pref
= (addrbits
== 32) ? P_A16
: P_A32
;
2443 ins
->prefixes
[PPS_ASIZE
] = pref
;
2444 ins
->addr_size
= (addrbits
== 32) ? 16 : 32;
2447 errfunc(ERR_NONFATAL
, "impossible combination of address sizes");
2448 ins
->addr_size
= addrbits
; /* Error recovery */
2451 defdisp
= ins
->addr_size
== 16 ? 16 : 32;
2453 for (j
= 0; j
< ins
->operands
; j
++) {
2454 if (!(MEM_OFFS
& ~ins
->oprs
[j
].type
) &&
2455 (ins
->oprs
[j
].disp_size
? ins
->oprs
[j
].disp_size
: defdisp
)
2456 != ins
->addr_size
) {
2457 /* mem_offs sizes must match the address size; if not,
2458 strip the MEM_OFFS bit and match only EA instructions */
2459 ins
->oprs
[j
].type
&= ~(MEM_OFFS
& ~MEMORY
);