1 /* assemble.c code generation for the Netwide Assembler
3 * The Netwide Assembler is copyright (C) 1996 Simon Tatham and
4 * Julian Hall. All rights reserved. The software is
5 * redistributable under the license given in the file "LICENSE"
6 * distributed in the NASM archive.
8 * the actual codes (C syntax, i.e. octal):
9 * \0 - terminates the code. (Unless it's a literal of course.)
10 * \1, \2, \3 - that many literal bytes follow in the code stream
11 * \10..\13 - a literal byte follows in the code stream, to be added
12 * to the register value of operand 0..3
13 * \14..\17 - a signed byte immediate operand, from operand 0..3
14 * \20..\23 - a byte immediate operand, from operand 0..3
15 * \24..\27 - an unsigned byte immediate operand, from operand 0..3
16 * \30..\33 - a word immediate operand, from operand 0..3
17 * \34..\37 - select between \3[0-3] and \4[0-3] depending on 16/32 bit
18 * assembly mode or the operand-size override on the operand
19 * \40..\43 - a long immediate operand, from operand 0..3
20 * \44..\47 - select between \3[0-3], \4[0-3] and \5[4-7]
21 * depending on the address size of the instruction.
22 * \50..\53 - a byte relative operand, from operand 0..3
23 * \54..\57 - a qword immediate operand, from operand 0..3
24 * \60..\63 - a word relative operand, from operand 0..3
25 * \64..\67 - select between \6[0-3] and \7[0-3] depending on 16/32 bit
26 * assembly mode or the operand-size override on the operand
27 * \70..\73 - a long relative operand, from operand 0..3
28 * \74..\77 - a word constant, from the _segment_ part of operand 0..3
29 * \1ab - a ModRM, calculated on EA in operand a, with the spare
30 * field the register value of operand b.
31 * \140..\143 - an immediate word or signed byte for operand 0..3
32 * \144..\147 - or 2 (s-field) into opcode byte if operand 0..3
33 * is a signed byte rather than a word. Opcode byte follows.
34 * \150..\153 - an immediate dword or signed byte for operand 0..3
35 * \154..\157 - or 2 (s-field) into opcode byte if operand 0..3
36 * is a signed byte rather than a dword. Opcode byte follows.
37 * \160..\163 - this instruction uses DREX rather than REX, with the
38 * OC0 field set to 0, and the dest field taken from
40 * \164..\167 - this instruction uses DREX rather than REX, with the
41 * OC0 field set to 1, and the dest field taken from
43 * \171 - placement of DREX suffix in the absence of an EA
44 * \172\ab - the register number from operand a in bits 7..4, with
45 * the 4-bit immediate from operand b in bits 3..0.
46 * \173\xab - the register number from operand a in bits 7..4, with
47 * the value b in bits 3..0.
48 * \174\a - the register number from operand a in bits 7..4, and
49 * an arbitrary value in bits 3..0 (assembled as zero.)
50 * \2ab - a ModRM, calculated on EA in operand a, with the spare
51 * field equal to digit b.
52 * \250..\253 - same as \150..\153, except warn if the 64-bit operand
53 * is not equal to the truncated and sign-extended 32-bit
54 * operand; used for 32-bit immediates in 64-bit mode.
55 * \254..\257 - a signed 32-bit operand to be extended to 64 bits.
56 * \260..\263 - this instruction uses VEX rather than REX, with the
57 * V field taken from operand 0..3.
58 * \270 - this instruction uses VEX rather than REX, with the
59 * V field set to 1111b.
61 * VEX prefixes are followed by the sequence:
62 * \mm\wlp where mm is the M field; and wlp is:
64 * [w0] ww = 0 for W = 0
65 * [w1] ww = 1 for W = 1
66 * [wx] ww = 2 for W don't care (always assembled as 0)
67 * [ww] ww = 3 for W used as REX.W
70 * \274..\277 - a signed byte immediate operand, from operand 0..3,
71 * which is to be extended to the operand size.
72 * \310 - indicates fixed 16-bit address size, i.e. optional 0x67.
73 * \311 - indicates fixed 32-bit address size, i.e. optional 0x67.
74 * \312 - (disassembler only) marker on LOOP, LOOPxx instructions.
75 * \313 - indicates fixed 64-bit address size, 0x67 invalid.
76 * \314 - (disassembler only) invalid with REX.B
77 * \315 - (disassembler only) invalid with REX.X
78 * \316 - (disassembler only) invalid with REX.R
79 * \317 - (disassembler only) invalid with REX.W
80 * \320 - indicates fixed 16-bit operand size, i.e. optional 0x66.
81 * \321 - indicates fixed 32-bit operand size, i.e. optional 0x66.
82 * \322 - indicates that this instruction is only valid when the
83 * operand size is the default (instruction to disassembler,
84 * generates no code in the assembler)
85 * \323 - indicates fixed 64-bit operand size, REX on extensions only.
86 * \324 - indicates 64-bit operand size requiring REX prefix.
87 * \330 - a literal byte follows in the code stream, to be added
88 * to the condition code value of the instruction.
89 * \331 - instruction not valid with REP prefix. Hint for
90 * disassembler only; for SSE instructions.
91 * \332 - REP prefix (0xF2 byte) used as opcode extension.
92 * \333 - REP prefix (0xF3 byte) used as opcode extension.
93 * \334 - LOCK prefix used instead of REX.R
94 * \335 - disassemble a rep (0xF3 byte) prefix as repe not rep.
95 * \336 - force a REP(E) prefix (0xF2) even if not specified.
96 * \337 - force a REPNE prefix (0xF3) even if not specified.
97 * \336-\337 are still listed as prefixes in the disassembler.
98 * \340 - reserve <operand 0> bytes of uninitialized storage.
99 * Operand 0 had better be a segmentless constant.
100 * \344,\345 - the PUSH/POP (respectively) codes for CS, DS, ES, SS
101 * (POP is never used for CS) depending on operand 0
102 * \346,\347 - the second byte of PUSH/POP codes for FS, GS, depending
104 * \360 - no SSE prefix (== \364\331)
105 * \361 - 66 SSE prefix (== \366\331)
106 * \362 - F2 SSE prefix (== \364\332)
107 * \363 - F3 SSE prefix (== \364\333)
108 * \364 - operand-size prefix (0x66) not permitted
109 * \365 - address-size prefix (0x67) not permitted
110 * \366 - operand-size prefix (0x66) used as opcode extension
111 * \367 - address-size prefix (0x67) used as opcode extension
112 * \370,\371,\372 - match only if operand 0 meets byte jump criteria.
113 * 370 is used for Jcc, 371 is used for JMP.
114 * \373 - assemble 0x03 if bits==16, 0x05 if bits==32;
115 * used for conditional jump over longer jump
118 #include "compiler.h"
122 #include <inttypes.h>
126 #include "assemble.h"
130 /* Initialized to zero by the C standard */
131 static const uint8_t const_zero_buf
[256];
134 int sib_present
; /* is a SIB byte necessary? */
135 int bytes
; /* # of bytes of offset needed */
136 int size
; /* lazy - this is sib+bytes+1 */
137 uint8_t modrm
, sib
, rex
, rip
; /* the bytes themselves */
140 static uint32_t cpu
; /* cpu level received from nasm.c */
141 static efunc errfunc
;
142 static struct ofmt
*outfmt
;
143 static ListGen
*list
;
145 static int64_t calcsize(int32_t, int64_t, int, insn
*, const uint8_t *);
146 static void gencode(int32_t segment
, int64_t offset
, int bits
,
147 insn
* ins
, const struct itemplate
*temp
,
149 static int matches(const struct itemplate
*, insn
*, int bits
);
150 static int32_t regflag(const operand
*);
151 static int32_t regval(const operand
*);
152 static int rexflags(int, int32_t, int);
153 static int op_rexflags(const operand
*, int);
154 static ea
*process_ea(operand
*, ea
*, int, int, int, int32_t);
155 static void add_asp(insn
*, int);
157 static int has_prefix(insn
* ins
, enum prefix_pos pos
, enum prefixes prefix
)
159 return ins
->prefixes
[pos
] == prefix
;
162 static void assert_no_prefix(insn
* ins
, enum prefix_pos pos
)
164 if (ins
->prefixes
[pos
])
165 errfunc(ERR_NONFATAL
, "invalid %s prefix",
166 prefix_name(ins
->prefixes
[pos
]));
169 static const char *size_name(int size
)
191 static void warn_overflow(int size
, const struct operand
*o
)
193 if (size
< 8 && o
->wrt
== NO_SEG
&& o
->segment
== NO_SEG
) {
194 int64_t lim
= ((int64_t)1 << (size
*8))-1;
195 int64_t data
= o
->offset
;
197 if (data
< ~lim
|| data
> lim
)
198 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
199 "%s data exceeds bounds", size_name(size
));
203 * This routine wrappers the real output format's output routine,
204 * in order to pass a copy of the data off to the listing file
205 * generator at the same time.
207 static void out(int64_t offset
, int32_t segto
, const void *data
,
208 enum out_type type
, uint64_t size
,
209 int32_t segment
, int32_t wrt
)
211 static int32_t lineno
= 0; /* static!!! */
212 static char *lnfname
= NULL
;
215 if (type
== OUT_ADDRESS
&& segment
== NO_SEG
&& wrt
== NO_SEG
) {
217 * This is a non-relocated address, and we're going to
218 * convert it into RAWDATA format.
223 errfunc(ERR_PANIC
, "OUT_ADDRESS with size > 8");
227 WRITEADDR(q
, *(int64_t *)data
, size
);
232 list
->output(offset
, data
, type
, size
);
235 * this call to src_get determines when we call the
236 * debug-format-specific "linenum" function
237 * it updates lineno and lnfname to the current values
238 * returning 0 if "same as last time", -2 if lnfname
239 * changed, and the amount by which lineno changed,
240 * if it did. thus, these variables must be static
243 if (src_get(&lineno
, &lnfname
)) {
244 outfmt
->current_dfmt
->linenum(lnfname
, lineno
, segto
);
247 outfmt
->output(segto
, data
, type
, size
, segment
, wrt
);
250 static bool jmp_match(int32_t segment
, int64_t offset
, int bits
,
251 insn
* ins
, const uint8_t *code
)
256 if ((c
!= 0370 && c
!= 0371) || (ins
->oprs
[0].type
& STRICT
))
260 if (optimizing
< 0 && c
== 0371)
263 isize
= calcsize(segment
, offset
, bits
, ins
, code
);
264 if (ins
->oprs
[0].segment
!= segment
)
267 isize
= ins
->oprs
[0].offset
- offset
- isize
; /* isize is delta */
268 return (isize
>= -128 && isize
<= 127); /* is it byte size? */
271 int64_t assemble(int32_t segment
, int64_t offset
, int bits
, uint32_t cp
,
272 insn
* instruction
, struct ofmt
*output
, efunc error
,
275 const struct itemplate
*temp
;
280 int64_t start
= offset
;
281 int64_t wsize
= 0; /* size for DB etc. */
283 errfunc
= error
; /* to pass to other functions */
285 outfmt
= output
; /* likewise */
286 list
= listgen
; /* and again */
288 switch (instruction
->opcode
) {
318 int32_t t
= instruction
->times
;
321 "instruction->times < 0 (%ld) in assemble()", t
);
323 while (t
--) { /* repeat TIMES times */
324 for (e
= instruction
->eops
; e
; e
= e
->next
) {
325 if (e
->type
== EOT_DB_NUMBER
) {
327 if (e
->segment
!= NO_SEG
)
328 errfunc(ERR_NONFATAL
,
329 "one-byte relocation attempted");
331 uint8_t out_byte
= e
->offset
;
332 out(offset
, segment
, &out_byte
,
333 OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
335 } else if (wsize
> 8) {
336 errfunc(ERR_NONFATAL
,
337 "integer supplied to a DT, DO or DY"
340 out(offset
, segment
, &e
->offset
,
341 OUT_ADDRESS
, wsize
, e
->segment
, e
->wrt
);
343 } else if (e
->type
== EOT_DB_STRING
||
344 e
->type
== EOT_DB_STRING_FREE
) {
347 out(offset
, segment
, e
->stringval
,
348 OUT_RAWDATA
, e
->stringlen
, NO_SEG
, NO_SEG
);
349 align
= e
->stringlen
% wsize
;
352 align
= wsize
- align
;
353 out(offset
, segment
, const_zero_buf
,
354 OUT_RAWDATA
, align
, NO_SEG
, NO_SEG
);
356 offset
+= e
->stringlen
+ align
;
359 if (t
> 0 && t
== instruction
->times
- 1) {
361 * Dummy call to list->output to give the offset to the
364 list
->output(offset
, NULL
, OUT_RAWDATA
, 0);
365 list
->uplevel(LIST_TIMES
);
368 if (instruction
->times
> 1)
369 list
->downlevel(LIST_TIMES
);
370 return offset
- start
;
373 if (instruction
->opcode
== I_INCBIN
) {
374 const char *fname
= instruction
->eops
->stringval
;
377 fp
= fopen(fname
, "rb");
379 error(ERR_NONFATAL
, "`incbin': unable to open file `%s'",
381 } else if (fseek(fp
, 0L, SEEK_END
) < 0) {
382 error(ERR_NONFATAL
, "`incbin': unable to seek on file `%s'",
385 static char buf
[4096];
386 size_t t
= instruction
->times
;
391 if (instruction
->eops
->next
) {
392 base
= instruction
->eops
->next
->offset
;
394 if (instruction
->eops
->next
->next
&&
395 len
> (size_t)instruction
->eops
->next
->next
->offset
)
396 len
= (size_t)instruction
->eops
->next
->next
->offset
;
399 * Dummy call to list->output to give the offset to the
402 list
->output(offset
, NULL
, OUT_RAWDATA
, 0);
403 list
->uplevel(LIST_INCBIN
);
407 fseek(fp
, base
, SEEK_SET
);
411 fread(buf
, 1, (l
> (int32_t) sizeof(buf
) ? (int32_t) sizeof(buf
) : l
),
415 * This shouldn't happen unless the file
416 * actually changes while we are reading
420 "`incbin': unexpected EOF while"
421 " reading file `%s'", fname
);
422 t
= 0; /* Try to exit cleanly */
425 out(offset
, segment
, buf
, OUT_RAWDATA
, m
,
430 list
->downlevel(LIST_INCBIN
);
431 if (instruction
->times
> 1) {
433 * Dummy call to list->output to give the offset to the
436 list
->output(offset
, NULL
, OUT_RAWDATA
, 0);
437 list
->uplevel(LIST_TIMES
);
438 list
->downlevel(LIST_TIMES
);
441 return instruction
->times
* len
;
443 return 0; /* if we're here, there's an error */
446 /* Check to see if we need an address-size prefix */
447 add_asp(instruction
, bits
);
451 for (temp
= nasm_instructions
[instruction
->opcode
]; temp
->opcode
!= -1; temp
++){
452 int m
= matches(temp
, instruction
, bits
);
454 (m
== 99 && jmp_match(segment
, offset
, bits
,
455 instruction
, temp
->code
))) {
457 int64_t insn_size
= calcsize(segment
, offset
, bits
,
458 instruction
, temp
->code
);
459 itimes
= instruction
->times
;
460 if (insn_size
< 0) /* shouldn't be, on pass two */
461 error(ERR_PANIC
, "errors made it through from pass one");
464 for (j
= 0; j
< MAXPREFIX
; j
++) {
466 switch (instruction
->prefixes
[j
]) {
481 error(ERR_WARNING
| ERR_PASS2
,
482 "cs segment base generated, but will be ignored in 64-bit mode");
488 error(ERR_WARNING
| ERR_PASS2
,
489 "ds segment base generated, but will be ignored in 64-bit mode");
495 error(ERR_WARNING
| ERR_PASS2
,
496 "es segment base generated, but will be ignored in 64-bit mode");
508 error(ERR_WARNING
| ERR_PASS2
,
509 "ss segment base generated, but will be ignored in 64-bit mode");
516 "segr6 and segr7 cannot be used as prefixes");
521 "16-bit addressing is not supported "
523 } else if (bits
!= 16)
533 "64-bit addressing is only supported "
557 error(ERR_PANIC
, "invalid instruction prefix");
560 out(offset
, segment
, &c
, OUT_RAWDATA
, 1,
565 insn_end
= offset
+ insn_size
;
566 gencode(segment
, offset
, bits
, instruction
,
569 if (itimes
> 0 && itimes
== instruction
->times
- 1) {
571 * Dummy call to list->output to give the offset to the
574 list
->output(offset
, NULL
, OUT_RAWDATA
, 0);
575 list
->uplevel(LIST_TIMES
);
578 if (instruction
->times
> 1)
579 list
->downlevel(LIST_TIMES
);
580 return offset
- start
;
581 } else if (m
> 0 && m
> size_prob
) {
586 if (temp
->opcode
== -1) { /* didn't match any instruction */
589 error(ERR_NONFATAL
, "operation size not specified");
592 error(ERR_NONFATAL
, "mismatch in operand sizes");
595 error(ERR_NONFATAL
, "no instruction for this cpu level");
598 error(ERR_NONFATAL
, "instruction not supported in 64-bit mode");
602 "invalid combination of opcode and operands");
609 int64_t insn_size(int32_t segment
, int64_t offset
, int bits
, uint32_t cp
,
610 insn
* instruction
, efunc error
)
612 const struct itemplate
*temp
;
614 errfunc
= error
; /* to pass to other functions */
617 if (instruction
->opcode
== -1)
620 if (instruction
->opcode
== I_DB
|| instruction
->opcode
== I_DW
||
621 instruction
->opcode
== I_DD
|| instruction
->opcode
== I_DQ
||
622 instruction
->opcode
== I_DT
|| instruction
->opcode
== I_DO
||
623 instruction
->opcode
== I_DY
) {
625 int32_t isize
, osize
, wsize
= 0; /* placate gcc */
628 switch (instruction
->opcode
) {
654 for (e
= instruction
->eops
; e
; e
= e
->next
) {
658 if (e
->type
== EOT_DB_NUMBER
)
660 else if (e
->type
== EOT_DB_STRING
||
661 e
->type
== EOT_DB_STRING_FREE
)
662 osize
= e
->stringlen
;
664 align
= (-osize
) % wsize
;
667 isize
+= osize
+ align
;
669 return isize
* instruction
->times
;
672 if (instruction
->opcode
== I_INCBIN
) {
673 const char *fname
= instruction
->eops
->stringval
;
677 fp
= fopen(fname
, "rb");
679 error(ERR_NONFATAL
, "`incbin': unable to open file `%s'",
681 else if (fseek(fp
, 0L, SEEK_END
) < 0)
682 error(ERR_NONFATAL
, "`incbin': unable to seek on file `%s'",
687 if (instruction
->eops
->next
) {
688 len
-= instruction
->eops
->next
->offset
;
689 if (instruction
->eops
->next
->next
&&
690 len
> (size_t)instruction
->eops
->next
->next
->offset
) {
691 len
= (size_t)instruction
->eops
->next
->next
->offset
;
694 return instruction
->times
* len
;
696 return 0; /* if we're here, there's an error */
699 /* Check to see if we need an address-size prefix */
700 add_asp(instruction
, bits
);
702 for (temp
= nasm_instructions
[instruction
->opcode
]; temp
->opcode
!= -1; temp
++) {
703 int m
= matches(temp
, instruction
, bits
);
705 (m
== 99 && jmp_match(segment
, offset
, bits
,
706 instruction
, temp
->code
))) {
707 /* we've matched an instruction. */
709 const uint8_t *codes
= temp
->code
;
712 isize
= calcsize(segment
, offset
, bits
, instruction
, codes
);
715 for (j
= 0; j
< MAXPREFIX
; j
++) {
716 switch (instruction
->prefixes
[j
]) {
742 return isize
* instruction
->times
;
745 return -1; /* didn't match any instruction */
748 static bool possible_sbyte(operand
*o
)
750 return o
->wrt
== NO_SEG
&& o
->segment
== NO_SEG
&&
751 !(o
->opflags
& OPFLAG_FORWARD
) &&
752 optimizing
>= 0 && !(o
->type
& STRICT
);
755 /* check that opn[op] is a signed byte of size 16 or 32 */
756 static bool is_sbyte16(operand
*o
)
760 if (!possible_sbyte(o
))
764 return v
>= -128 && v
<= 127;
767 static bool is_sbyte32(operand
*o
)
771 if (!possible_sbyte(o
))
775 return v
>= -128 && v
<= 127;
778 /* Common construct */
779 #define case4(x) case (x): case (x)+1: case (x)+2: case (x)+3
781 static int64_t calcsize(int32_t segment
, int64_t offset
, int bits
,
782 insn
* ins
, const uint8_t *codes
)
789 ins
->rex
= 0; /* Ensure REX is reset */
791 if (ins
->prefixes
[PPS_OSIZE
] == P_O64
)
794 (void)segment
; /* Don't warn that this parameter is unused */
795 (void)offset
; /* Don't warn that this parameter is unused */
799 opx
= &ins
->oprs
[c
& 3];
804 codes
+= c
, length
+= c
;
809 op_rexflags(opx
, REX_B
|REX_H
|REX_P
|REX_W
);
824 if (opx
->type
& (BITS16
| BITS32
| BITS64
))
825 length
+= (opx
->type
& BITS16
) ? 2 : 4;
827 length
+= (bits
== 16) ? 2 : 4;
835 length
+= ins
->addr_size
>> 3;
843 length
+= 8; /* MOV reg64/imm */
851 if (opx
->type
& (BITS16
| BITS32
| BITS64
))
852 length
+= (opx
->type
& BITS16
) ? 2 : 4;
854 length
+= (bits
== 16) ? 2 : 4;
866 length
+= is_sbyte16(opx
) ? 1 : 2;
875 length
+= is_sbyte32(opx
) ? 1 : 4;
886 ins
->drexdst
= regval(opx
);
891 ins
->rex
|= REX_D
|REX_OC
;
892 ins
->drexdst
= regval(opx
);
906 length
+= is_sbyte32(opx
) ? 1 : 4;
915 ins
->drexdst
= regval(opx
);
916 ins
->vex_m
= *codes
++;
917 ins
->vex_wlp
= *codes
++;
923 ins
->vex_m
= *codes
++;
924 ins
->vex_wlp
= *codes
++;
937 length
+= (bits
!= 16) && !has_prefix(ins
, PPS_ASIZE
, P_A16
);
941 length
+= (bits
!= 32) && !has_prefix(ins
, PPS_ASIZE
, P_A32
);
948 if (bits
!= 64 || has_prefix(ins
, PPS_ASIZE
, P_A16
) ||
949 has_prefix(ins
, PPS_ASIZE
, P_A32
))
957 length
+= (bits
!= 16);
961 length
+= (bits
== 16);
995 if (!ins
->prefixes
[PPS_LREP
])
996 ins
->prefixes
[PPS_LREP
] = P_REP
;
1000 if (!ins
->prefixes
[PPS_LREP
])
1001 ins
->prefixes
[PPS_LREP
] = P_REPNE
;
1005 if (ins
->oprs
[0].segment
!= NO_SEG
)
1006 errfunc(ERR_NONFATAL
, "attempt to reserve non-constant"
1007 " quantity of BSS space");
1009 length
+= ins
->oprs
[0].offset
;
1059 ea_data
.rex
= 0; /* Ensure ea.REX is initially 0 */
1062 /* pick rfield from operand b */
1063 rflags
= regflag(&ins
->oprs
[c
& 7]);
1064 rfield
= nasm_regvals
[ins
->oprs
[c
& 7].basereg
];
1071 (&ins
->oprs
[(c
>> 3) & 7], &ea_data
, bits
,
1072 ins
->addr_size
, rfield
, rflags
)) {
1073 errfunc(ERR_NONFATAL
, "invalid effective address");
1076 ins
->rex
|= ea_data
.rex
;
1077 length
+= ea_data
.size
;
1083 errfunc(ERR_PANIC
, "internal instruction table corrupt"
1084 ": instruction code 0x%02X given", c
);
1089 ins
->rex
&= rex_mask
;
1091 if (ins
->rex
& REX_V
) {
1092 int bad32
= REX_R
|REX_W
|REX_X
|REX_B
;
1094 if (ins
->rex
& REX_H
) {
1095 errfunc(ERR_NONFATAL
, "cannot use high register in vex instruction");
1098 switch (ins
->vex_wlp
& 030) {
1112 if (bits
!= 64 && ((ins
->rex
& bad32
) || ins
->drexdst
> 7)) {
1113 errfunc(ERR_NONFATAL
, "invalid operands in non-64-bit mode");
1116 if (ins
->vex_m
!= 1 || (ins
->rex
& (REX_W
|REX_R
|REX_B
)))
1120 } else if (ins
->rex
& REX_D
) {
1121 if (ins
->rex
& REX_H
) {
1122 errfunc(ERR_NONFATAL
, "cannot use high register in drex instruction");
1125 if (bits
!= 64 && ((ins
->rex
& (REX_R
|REX_W
|REX_X
|REX_B
)) ||
1126 ins
->drexdst
> 7)) {
1127 errfunc(ERR_NONFATAL
, "invalid operands in non-64-bit mode");
1131 } else if (ins
->rex
& REX_REAL
) {
1132 if (ins
->rex
& REX_H
) {
1133 errfunc(ERR_NONFATAL
, "cannot use high register in rex instruction");
1135 } else if (bits
== 64) {
1137 } else if ((ins
->rex
& REX_L
) &&
1138 !(ins
->rex
& (REX_P
|REX_W
|REX_X
|REX_B
)) &&
1141 assert_no_prefix(ins
, PPS_LREP
);
1144 errfunc(ERR_NONFATAL
, "invalid operands in non-64-bit mode");
1152 #define EMIT_REX() \
1153 if (!(ins->rex & (REX_D|REX_V)) && (ins->rex & REX_REAL) && (bits == 64)) { \
1154 ins->rex = (ins->rex & REX_REAL)|REX_P; \
1155 out(offset, segment, &ins->rex, OUT_RAWDATA, 1, NO_SEG, NO_SEG); \
1160 static void gencode(int32_t segment
, int64_t offset
, int bits
,
1161 insn
* ins
, const struct itemplate
*temp
,
1164 static char condval
[] = { /* conditional opcodes */
1165 0x7, 0x3, 0x2, 0x6, 0x2, 0x4, 0xF, 0xD, 0xC, 0xE, 0x6, 0x2,
1166 0x3, 0x7, 0x3, 0x5, 0xE, 0xC, 0xD, 0xF, 0x1, 0xB, 0x9, 0x5,
1167 0x0, 0xA, 0xA, 0xB, 0x8, 0x4
1173 struct operand
*opx
;
1174 const uint8_t *codes
= temp
->code
;
1178 opx
= &ins
->oprs
[c
& 3];
1184 out(offset
, segment
, codes
, OUT_RAWDATA
, c
, NO_SEG
, NO_SEG
);
1191 bytes
[0] = *codes
++ + ((regval(opx
)) & 7);
1192 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1197 /* The test for BITS8 and SBYTE here is intended to avoid
1198 warning on optimizer actions due to SBYTE, while still
1199 warn on explicit BYTE directives. Also warn, obviously,
1200 if the optimizer isn't enabled. */
1201 if (((opx
->type
& BITS8
) ||
1202 !(opx
->type
& temp
->opd
[c
& 3] & BYTENESS
)) &&
1203 (opx
->offset
< -128 || opx
->offset
> 127)) {
1204 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1205 "signed byte value exceeds bounds");
1207 if (opx
->segment
!= NO_SEG
) {
1209 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1210 opx
->segment
, opx
->wrt
);
1212 bytes
[0] = opx
->offset
;
1213 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1220 if (opx
->offset
< -256 || opx
->offset
> 255) {
1221 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1222 "byte value exceeds bounds");
1224 if (opx
->segment
!= NO_SEG
) {
1226 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1227 opx
->segment
, opx
->wrt
);
1229 bytes
[0] = opx
->offset
;
1230 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1237 if (opx
->offset
< 0 || opx
->offset
> 255)
1238 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1239 "unsigned byte value exceeds bounds");
1240 if (opx
->segment
!= NO_SEG
) {
1242 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1243 opx
->segment
, opx
->wrt
);
1245 bytes
[0] = opx
->offset
;
1246 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1253 warn_overflow(2, opx
);
1255 out(offset
, segment
, &data
, OUT_ADDRESS
, 2,
1256 opx
->segment
, opx
->wrt
);
1261 if (opx
->type
& (BITS16
| BITS32
))
1262 size
= (opx
->type
& BITS16
) ? 2 : 4;
1264 size
= (bits
== 16) ? 2 : 4;
1265 warn_overflow(size
, opx
);
1267 out(offset
, segment
, &data
, OUT_ADDRESS
, size
,
1268 opx
->segment
, opx
->wrt
);
1273 warn_overflow(4, opx
);
1275 out(offset
, segment
, &data
, OUT_ADDRESS
, 4,
1276 opx
->segment
, opx
->wrt
);
1282 size
= ins
->addr_size
>> 3;
1283 warn_overflow(size
, opx
);
1284 out(offset
, segment
, &data
, OUT_ADDRESS
, size
,
1285 opx
->segment
, opx
->wrt
);
1290 if (opx
->segment
!= segment
)
1291 errfunc(ERR_NONFATAL
,
1292 "short relative jump outside segment");
1293 data
= opx
->offset
- insn_end
;
1294 if (data
> 127 || data
< -128)
1295 errfunc(ERR_NONFATAL
, "short jump is out of range");
1297 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1302 data
= (int64_t)opx
->offset
;
1303 out(offset
, segment
, &data
, OUT_ADDRESS
, 8,
1304 opx
->segment
, opx
->wrt
);
1309 if (opx
->segment
!= segment
) {
1311 out(offset
, segment
, &data
,
1312 OUT_REL2ADR
, insn_end
- offset
,
1313 opx
->segment
, opx
->wrt
);
1315 data
= opx
->offset
- insn_end
;
1316 out(offset
, segment
, &data
,
1317 OUT_ADDRESS
, 2, NO_SEG
, NO_SEG
);
1323 if (opx
->type
& (BITS16
| BITS32
| BITS64
))
1324 size
= (opx
->type
& BITS16
) ? 2 : 4;
1326 size
= (bits
== 16) ? 2 : 4;
1327 if (opx
->segment
!= segment
) {
1329 out(offset
, segment
, &data
,
1330 size
== 2 ? OUT_REL2ADR
: OUT_REL4ADR
,
1331 insn_end
- offset
, opx
->segment
, opx
->wrt
);
1333 data
= opx
->offset
- insn_end
;
1334 out(offset
, segment
, &data
,
1335 OUT_ADDRESS
, size
, NO_SEG
, NO_SEG
);
1341 if (opx
->segment
!= segment
) {
1343 out(offset
, segment
, &data
,
1344 OUT_REL4ADR
, insn_end
- offset
,
1345 opx
->segment
, opx
->wrt
);
1347 data
= opx
->offset
- insn_end
;
1348 out(offset
, segment
, &data
,
1349 OUT_ADDRESS
, 4, NO_SEG
, NO_SEG
);
1355 if (opx
->segment
== NO_SEG
)
1356 errfunc(ERR_NONFATAL
, "value referenced by FAR is not"
1359 out(offset
, segment
, &data
, OUT_ADDRESS
, 2,
1360 outfmt
->segbase(1 + opx
->segment
),
1367 warn_overflow(2, opx
);
1368 if (is_sbyte16(opx
)) {
1370 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1374 out(offset
, segment
, &data
, OUT_ADDRESS
, 2,
1375 opx
->segment
, opx
->wrt
);
1382 bytes
[0] = *codes
++;
1383 if (is_sbyte16(opx
))
1384 bytes
[0] |= 2; /* s-bit */
1385 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1391 warn_overflow(4, opx
);
1392 if (is_sbyte32(opx
)) {
1394 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1398 out(offset
, segment
, &data
, OUT_ADDRESS
, 4,
1399 opx
->segment
, opx
->wrt
);
1406 bytes
[0] = *codes
++;
1407 if (is_sbyte32(opx
))
1408 bytes
[0] |= 2; /* s-bit */
1409 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1419 (ins
->drexdst
<< 4) |
1420 (ins
->rex
& REX_OC
? 0x08 : 0) |
1421 (ins
->rex
& (REX_R
|REX_X
|REX_B
));
1423 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1429 opx
= &ins
->oprs
[c
>> 3];
1430 bytes
[0] = nasm_regvals
[opx
->basereg
] << 4;
1431 opx
= &ins
->oprs
[c
& 7];
1432 if (opx
->segment
!= NO_SEG
|| opx
->wrt
!= NO_SEG
) {
1433 errfunc(ERR_NONFATAL
,
1434 "non-absolute expression not permitted as argument %d",
1437 if (opx
->offset
& ~15) {
1438 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1439 "four-bit argument exceeds bounds");
1441 bytes
[0] |= opx
->offset
& 15;
1443 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1449 opx
= &ins
->oprs
[c
>> 4];
1450 bytes
[0] = nasm_regvals
[opx
->basereg
] << 4;
1452 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1458 opx
= &ins
->oprs
[c
];
1459 bytes
[0] = nasm_regvals
[opx
->basereg
] << 4;
1460 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1466 if (opx
->wrt
== NO_SEG
&& opx
->segment
== NO_SEG
&&
1467 (int32_t)data
!= (int64_t)data
) {
1468 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1469 "signed dword immediate exceeds bounds");
1471 if (is_sbyte32(opx
)) {
1473 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1477 out(offset
, segment
, &data
, OUT_ADDRESS
, 4,
1478 opx
->segment
, opx
->wrt
);
1485 if (opx
->wrt
== NO_SEG
&& opx
->segment
== NO_SEG
&&
1486 (int32_t)data
!= (int64_t)data
) {
1487 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1488 "signed dword immediate exceeds bounds");
1490 out(offset
, segment
, &data
, OUT_ADDRESS
, 4,
1491 opx
->segment
, opx
->wrt
);
1498 if (ins
->vex_m
!= 1 || (ins
->rex
& (REX_W
|REX_X
|REX_B
))) {
1500 bytes
[1] = ins
->vex_m
| ((~ins
->rex
& 7) << 5);
1501 bytes
[2] = ((ins
->rex
& REX_W
) << (7-3)) |
1502 ((~ins
->drexdst
& 15)<< 3) | (ins
->vex_wlp
& 07);
1503 out(offset
, segment
, &bytes
, OUT_RAWDATA
, 3, NO_SEG
, NO_SEG
);
1507 bytes
[1] = ((~ins
->rex
& REX_R
) << (7-2)) |
1508 ((~ins
->drexdst
& 15) << 3) | (ins
->vex_wlp
& 07);
1509 out(offset
, segment
, &bytes
, OUT_RAWDATA
, 2, NO_SEG
, NO_SEG
);
1519 if (ins
->rex
& REX_W
)
1521 else if (ins
->prefixes
[PPS_OSIZE
] == P_O16
)
1523 else if (ins
->prefixes
[PPS_OSIZE
] == P_O32
)
1528 um
= (uint64_t)2 << (s
-1);
1531 if (uv
> 127 && uv
< (uint64_t)-128 &&
1532 (uv
< um
-128 || uv
> um
-1)) {
1533 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1534 "signed byte value exceeds bounds");
1536 if (opx
->segment
!= NO_SEG
) {
1538 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1539 opx
->segment
, opx
->wrt
);
1542 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1553 if (bits
== 32 && !has_prefix(ins
, PPS_ASIZE
, P_A16
)) {
1555 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1562 if (bits
!= 32 && !has_prefix(ins
, PPS_ASIZE
, P_A32
)) {
1564 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1583 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1592 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1607 *bytes
= *codes
++ ^ condval
[ins
->condition
];
1608 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1617 *bytes
= c
- 0332 + 0xF2;
1618 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1623 if (ins
->rex
& REX_R
) {
1625 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1628 ins
->rex
&= ~(REX_L
|REX_R
);
1639 if (ins
->oprs
[0].segment
!= NO_SEG
)
1640 errfunc(ERR_PANIC
, "non-constant BSS size in pass two");
1642 int64_t size
= ins
->oprs
[0].offset
;
1644 out(offset
, segment
, NULL
,
1645 OUT_RESERVE
, size
, NO_SEG
, NO_SEG
);
1653 switch (ins
->oprs
[0].basereg
) {
1668 "bizarre 8086 segment register received");
1670 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1677 switch (ins
->oprs
[0].basereg
) {
1686 "bizarre 386 segment register received");
1688 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1697 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1703 bytes
[0] = c
- 0362 + 0xf2;
1704 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1714 *bytes
= c
- 0366 + 0x66;
1715 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1725 *bytes
= bits
== 16 ? 3 : 5;
1726 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1751 /* pick rfield from operand b */
1752 rflags
= regflag(&ins
->oprs
[c
& 7]);
1753 rfield
= nasm_regvals
[ins
->oprs
[c
& 7].basereg
];
1755 /* rfield is constant */
1761 (&ins
->oprs
[(c
>> 3) & 7], &ea_data
, bits
,
1762 ins
->addr_size
, rfield
, rflags
)) {
1763 errfunc(ERR_NONFATAL
, "invalid effective address");
1768 *p
++ = ea_data
.modrm
;
1769 if (ea_data
.sib_present
)
1772 /* DREX suffixes come between the SIB and the displacement */
1773 if (ins
->rex
& REX_D
) {
1775 (ins
->drexdst
<< 4) |
1776 (ins
->rex
& REX_OC
? 0x08 : 0) |
1777 (ins
->rex
& (REX_R
|REX_X
|REX_B
));
1782 out(offset
, segment
, bytes
, OUT_RAWDATA
, s
, NO_SEG
, NO_SEG
);
1785 * Make sure the address gets the right offset in case
1786 * the line breaks in the .lst file (BR 1197827)
1791 switch (ea_data
.bytes
) {
1795 if (ins
->oprs
[(c
>> 3) & 7].segment
!= NO_SEG
) {
1796 data
= ins
->oprs
[(c
>> 3) & 7].offset
;
1797 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1798 ins
->oprs
[(c
>> 3) & 7].segment
,
1799 ins
->oprs
[(c
>> 3) & 7].wrt
);
1801 *bytes
= ins
->oprs
[(c
>> 3) & 7].offset
;
1802 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1,
1810 data
= ins
->oprs
[(c
>> 3) & 7].offset
;
1811 warn_overflow(ea_data
.bytes
, opx
);
1814 out(offset
, segment
, &data
,
1815 OUT_REL4ADR
, insn_end
- offset
,
1816 ins
->oprs
[(c
>> 3) & 7].segment
,
1817 ins
->oprs
[(c
>> 3) & 7].wrt
);
1820 out(offset
, segment
, &data
,
1821 OUT_ADDRESS
, ea_data
.bytes
,
1822 ins
->oprs
[(c
>> 3) & 7].segment
,
1823 ins
->oprs
[(c
>> 3) & 7].wrt
);
1832 errfunc(ERR_PANIC
, "internal instruction table corrupt"
1833 ": instruction code 0x%02X given", c
);
1839 static int32_t regflag(const operand
* o
)
1841 if (o
->basereg
< EXPR_REG_START
|| o
->basereg
>= REG_ENUM_LIMIT
) {
1842 errfunc(ERR_PANIC
, "invalid operand passed to regflag()");
1844 return nasm_reg_flags
[o
->basereg
];
1847 static int32_t regval(const operand
* o
)
1849 if (o
->basereg
< EXPR_REG_START
|| o
->basereg
>= REG_ENUM_LIMIT
) {
1850 errfunc(ERR_PANIC
, "invalid operand passed to regval()");
1852 return nasm_regvals
[o
->basereg
];
1855 static int op_rexflags(const operand
* o
, int mask
)
1860 if (o
->basereg
< EXPR_REG_START
|| o
->basereg
>= REG_ENUM_LIMIT
) {
1861 errfunc(ERR_PANIC
, "invalid operand passed to op_rexflags()");
1864 flags
= nasm_reg_flags
[o
->basereg
];
1865 val
= nasm_regvals
[o
->basereg
];
1867 return rexflags(val
, flags
, mask
);
1870 static int rexflags(int val
, int32_t flags
, int mask
)
1875 rex
|= REX_B
|REX_X
|REX_R
;
1878 if (!(REG_HIGH
& ~flags
)) /* AH, CH, DH, BH */
1880 else if (!(REG8
& ~flags
) && val
>= 4) /* SPL, BPL, SIL, DIL */
1886 static int matches(const struct itemplate
*itemp
, insn
* instruction
, int bits
)
1888 int i
, size
[MAX_OPERANDS
], asize
, oprs
, ret
;
1895 if (itemp
->opcode
!= instruction
->opcode
)
1899 * Count the operands
1901 if (itemp
->operands
!= instruction
->operands
)
1905 * Check that no spurious colons or TOs are present
1907 for (i
= 0; i
< itemp
->operands
; i
++)
1908 if (instruction
->oprs
[i
].type
& ~itemp
->opd
[i
] & (COLON
| TO
))
1912 * Process size flags
1914 if (itemp
->flags
& IF_ARMASK
) {
1915 memset(size
, 0, sizeof size
);
1917 i
= ((itemp
->flags
& IF_ARMASK
) >> IF_ARSHFT
) - 1;
1919 switch (itemp
->flags
& IF_SMASK
) {
1956 switch (itemp
->flags
& IF_SMASK
) {
1991 for (i
= 0; i
< MAX_OPERANDS
; i
++)
1996 * Check that the operand flags all match up
1998 for (i
= 0; i
< itemp
->operands
; i
++) {
1999 int32_t type
= instruction
->oprs
[i
].type
;
2000 if (!(type
& SIZE_MASK
))
2003 if (itemp
->opd
[i
] & SAME_AS
) {
2004 int j
= itemp
->opd
[i
] & ~SAME_AS
;
2005 if (type
!= instruction
->oprs
[j
].type
||
2006 instruction
->oprs
[i
].basereg
!= instruction
->oprs
[j
].basereg
)
2008 } else if (itemp
->opd
[i
] & ~type
||
2009 ((itemp
->opd
[i
] & SIZE_MASK
) &&
2010 ((itemp
->opd
[i
] ^ type
) & SIZE_MASK
))) {
2011 if ((itemp
->opd
[i
] & ~type
& ~SIZE_MASK
) ||
2020 * Check operand sizes
2022 if (itemp
->flags
& (IF_SM
| IF_SM2
)) {
2023 oprs
= (itemp
->flags
& IF_SM2
? 2 : itemp
->operands
);
2025 for (i
= 0; i
< oprs
; i
++) {
2026 if ((asize
= itemp
->opd
[i
] & SIZE_MASK
) != 0) {
2028 for (j
= 0; j
< oprs
; j
++)
2034 oprs
= itemp
->operands
;
2037 for (i
= 0; i
< itemp
->operands
; i
++) {
2038 if (!(itemp
->opd
[i
] & SIZE_MASK
) &&
2039 (instruction
->oprs
[i
].type
& SIZE_MASK
& ~size
[i
]))
2044 * Check template is okay at the set cpu level
2046 if (((itemp
->flags
& IF_PLEVEL
) > cpu
))
2050 * Check if instruction is available in long mode
2052 if ((itemp
->flags
& IF_NOLONG
) && (bits
== 64))
2056 * Check if special handling needed for Jumps
2058 if ((uint8_t)(itemp
->code
[0]) >= 0370)
2064 static ea
*process_ea(operand
* input
, ea
* output
, int bits
,
2065 int addrbits
, int rfield
, int32_t rflags
)
2067 bool forw_ref
= !!(input
->opflags
& OPFLAG_FORWARD
);
2069 output
->rip
= false;
2071 /* REX flags for the rfield operand */
2072 output
->rex
|= rexflags(rfield
, rflags
, REX_R
|REX_P
|REX_W
|REX_H
);
2074 if (!(REGISTER
& ~input
->type
)) { /* register direct */
2078 if (input
->basereg
< EXPR_REG_START
/* Verify as Register */
2079 || input
->basereg
>= REG_ENUM_LIMIT
)
2082 i
= nasm_regvals
[input
->basereg
];
2085 return NULL
; /* Invalid EA register */
2087 output
->rex
|= op_rexflags(input
, REX_B
|REX_P
|REX_W
|REX_H
);
2089 output
->sib_present
= false; /* no SIB necessary */
2090 output
->bytes
= 0; /* no offset necessary either */
2091 output
->modrm
= 0xC0 | ((rfield
& 7) << 3) | (i
& 7);
2092 } else { /* it's a memory reference */
2093 if (input
->basereg
== -1
2094 && (input
->indexreg
== -1 || input
->scale
== 0)) {
2095 /* it's a pure offset */
2096 if (bits
== 64 && (~input
->type
& IP_REL
)) {
2097 int scale
, index
, base
;
2098 output
->sib_present
= true;
2102 output
->sib
= (scale
<< 6) | (index
<< 3) | base
;
2104 output
->modrm
= 4 | ((rfield
& 7) << 3);
2105 output
->rip
= false;
2107 output
->sib_present
= false;
2108 output
->bytes
= (addrbits
!= 16 ? 4 : 2);
2109 output
->modrm
= (addrbits
!= 16 ? 5 : 6) | ((rfield
& 7) << 3);
2110 output
->rip
= bits
== 64;
2112 } else { /* it's an indirection */
2113 int i
= input
->indexreg
, b
= input
->basereg
, s
= input
->scale
;
2114 int32_t o
= input
->offset
, seg
= input
->segment
;
2115 int hb
= input
->hintbase
, ht
= input
->hinttype
;
2118 int32_t ix
, bx
; /* register flags */
2121 i
= -1; /* make this easy, at least */
2123 if (i
>= EXPR_REG_START
&& i
< REG_ENUM_LIMIT
) {
2124 it
= nasm_regvals
[i
];
2125 ix
= nasm_reg_flags
[i
];
2131 if (b
>= EXPR_REG_START
&& b
< REG_ENUM_LIMIT
) {
2132 bt
= nasm_regvals
[b
];
2133 bx
= nasm_reg_flags
[b
];
2139 /* check for a 32/64-bit memory reference... */
2140 if ((ix
|bx
) & (BITS32
|BITS64
)) {
2141 /* it must be a 32/64-bit memory reference. Firstly we have
2142 * to check that all registers involved are type E/Rxx. */
2143 int32_t sok
= BITS32
|BITS64
;
2146 if (!(REG64
& ~ix
) || !(REG32
& ~ix
))
2154 return NULL
; /* Invalid register */
2155 if (~sok
& bx
& SIZE_MASK
)
2156 return NULL
; /* Invalid size */
2160 /* While we're here, ensure the user didn't specify
2162 if (input
->disp_size
== 16 || input
->disp_size
== 64)
2165 if (addrbits
== 16 ||
2166 (addrbits
== 32 && !(sok
& BITS32
)) ||
2167 (addrbits
== 64 && !(sok
& BITS64
)))
2170 /* now reorganize base/index */
2171 if (s
== 1 && bt
!= it
&& bt
!= -1 && it
!= -1 &&
2172 ((hb
== b
&& ht
== EAH_NOTBASE
)
2173 || (hb
== i
&& ht
== EAH_MAKEBASE
))) {
2174 /* swap if hints say so */
2175 t
= bt
, bt
= it
, it
= t
;
2176 t
= bx
, bx
= ix
, ix
= t
;
2178 if (bt
== it
) /* convert EAX+2*EAX to 3*EAX */
2179 bt
= -1, bx
= 0, s
++;
2180 if (bt
== -1 && s
== 1 && !(hb
== it
&& ht
== EAH_NOTBASE
)) {
2181 /* make single reg base, unless hint */
2182 bt
= it
, bx
= ix
, it
= -1, ix
= 0;
2184 if (((s
== 2 && it
!= REG_NUM_ESP
2185 && !(input
->eaflags
& EAF_TIMESTWO
)) || s
== 3
2186 || s
== 5 || s
== 9) && bt
== -1)
2187 bt
= it
, bx
= ix
, s
--; /* convert 3*EAX to EAX+2*EAX */
2188 if (it
== -1 && (bt
& 7) != REG_NUM_ESP
2189 && (input
->eaflags
& EAF_TIMESTWO
))
2190 it
= bt
, ix
= bx
, bt
= -1, bx
= 0, s
= 1;
2191 /* convert [NOSPLIT EAX] to sib format with 0x0 displacement */
2192 if (s
== 1 && it
== REG_NUM_ESP
) {
2193 /* swap ESP into base if scale is 1 */
2194 t
= it
, it
= bt
, bt
= t
;
2195 t
= ix
, ix
= bx
, bx
= t
;
2197 if (it
== REG_NUM_ESP
2198 || (s
!= 1 && s
!= 2 && s
!= 4 && s
!= 8 && it
!= -1))
2199 return NULL
; /* wrong, for various reasons */
2201 output
->rex
|= rexflags(it
, ix
, REX_X
);
2202 output
->rex
|= rexflags(bt
, bx
, REX_B
);
2204 if (it
== -1 && (bt
& 7) != REG_NUM_ESP
) {
2213 if (rm
!= REG_NUM_EBP
&& o
== 0 &&
2214 seg
== NO_SEG
&& !forw_ref
&&
2216 (EAF_BYTEOFFS
| EAF_WORDOFFS
)))
2218 else if (input
->eaflags
& EAF_BYTEOFFS
||
2219 (o
>= -128 && o
<= 127 && seg
== NO_SEG
2221 && !(input
->eaflags
& EAF_WORDOFFS
)))
2227 output
->sib_present
= false;
2228 output
->bytes
= (bt
== -1 || mod
== 2 ? 4 : mod
);
2229 output
->modrm
= (mod
<< 6) | ((rfield
& 7) << 3) | rm
;
2232 int mod
, scale
, index
, base
;
2252 default: /* then what the smeg is it? */
2253 return NULL
; /* panic */
2261 if (base
!= REG_NUM_EBP
&& o
== 0 &&
2262 seg
== NO_SEG
&& !forw_ref
&&
2264 (EAF_BYTEOFFS
| EAF_WORDOFFS
)))
2266 else if (input
->eaflags
& EAF_BYTEOFFS
||
2267 (o
>= -128 && o
<= 127 && seg
== NO_SEG
2269 && !(input
->eaflags
& EAF_WORDOFFS
)))
2275 output
->sib_present
= true;
2276 output
->bytes
= (bt
== -1 || mod
== 2 ? 4 : mod
);
2277 output
->modrm
= (mod
<< 6) | ((rfield
& 7) << 3) | 4;
2278 output
->sib
= (scale
<< 6) | (index
<< 3) | base
;
2280 } else { /* it's 16-bit */
2283 /* check for 64-bit long mode */
2287 /* check all registers are BX, BP, SI or DI */
2288 if ((b
!= -1 && b
!= R_BP
&& b
!= R_BX
&& b
!= R_SI
2289 && b
!= R_DI
) || (i
!= -1 && i
!= R_BP
&& i
!= R_BX
2290 && i
!= R_SI
&& i
!= R_DI
))
2293 /* ensure the user didn't specify DWORD/QWORD */
2294 if (input
->disp_size
== 32 || input
->disp_size
== 64)
2297 if (s
!= 1 && i
!= -1)
2298 return NULL
; /* no can do, in 16-bit EA */
2299 if (b
== -1 && i
!= -1) {
2304 if ((b
== R_SI
|| b
== R_DI
) && i
!= -1) {
2309 /* have BX/BP as base, SI/DI index */
2311 return NULL
; /* shouldn't ever happen, in theory */
2312 if (i
!= -1 && b
!= -1 &&
2313 (i
== R_BP
|| i
== R_BX
|| b
== R_SI
|| b
== R_DI
))
2314 return NULL
; /* invalid combinations */
2315 if (b
== -1) /* pure offset: handled above */
2316 return NULL
; /* so if it gets to here, panic! */
2320 switch (i
* 256 + b
) {
2321 case R_SI
* 256 + R_BX
:
2324 case R_DI
* 256 + R_BX
:
2327 case R_SI
* 256 + R_BP
:
2330 case R_DI
* 256 + R_BP
:
2348 if (rm
== -1) /* can't happen, in theory */
2349 return NULL
; /* so panic if it does */
2351 if (o
== 0 && seg
== NO_SEG
&& !forw_ref
&& rm
!= 6 &&
2352 !(input
->eaflags
& (EAF_BYTEOFFS
| EAF_WORDOFFS
)))
2354 else if (input
->eaflags
& EAF_BYTEOFFS
||
2355 (o
>= -128 && o
<= 127 && seg
== NO_SEG
2357 && !(input
->eaflags
& EAF_WORDOFFS
)))
2362 output
->sib_present
= false; /* no SIB - it's 16-bit */
2363 output
->bytes
= mod
; /* bytes of offset needed */
2364 output
->modrm
= (mod
<< 6) | ((rfield
& 7) << 3) | rm
;
2369 output
->size
= 1 + output
->sib_present
+ output
->bytes
;
2373 static void add_asp(insn
*ins
, int addrbits
)
2378 valid
= (addrbits
== 64) ? 64|32 : 32|16;
2380 switch (ins
->prefixes
[PPS_ASIZE
]) {
2391 valid
&= (addrbits
== 32) ? 16 : 32;
2397 for (j
= 0; j
< ins
->operands
; j
++) {
2398 if (!(MEMORY
& ~ins
->oprs
[j
].type
)) {
2401 /* Verify as Register */
2402 if (ins
->oprs
[j
].indexreg
< EXPR_REG_START
2403 || ins
->oprs
[j
].indexreg
>= REG_ENUM_LIMIT
)
2406 i
= nasm_reg_flags
[ins
->oprs
[j
].indexreg
];
2408 /* Verify as Register */
2409 if (ins
->oprs
[j
].basereg
< EXPR_REG_START
2410 || ins
->oprs
[j
].basereg
>= REG_ENUM_LIMIT
)
2413 b
= nasm_reg_flags
[ins
->oprs
[j
].basereg
];
2415 if (ins
->oprs
[j
].scale
== 0)
2419 int ds
= ins
->oprs
[j
].disp_size
;
2420 if ((addrbits
!= 64 && ds
> 8) ||
2421 (addrbits
== 64 && ds
== 16))
2441 if (valid
& addrbits
) {
2442 ins
->addr_size
= addrbits
;
2443 } else if (valid
& ((addrbits
== 32) ? 16 : 32)) {
2444 /* Add an address size prefix */
2445 enum prefixes pref
= (addrbits
== 32) ? P_A16
: P_A32
;
2446 ins
->prefixes
[PPS_ASIZE
] = pref
;
2447 ins
->addr_size
= (addrbits
== 32) ? 16 : 32;
2450 errfunc(ERR_NONFATAL
, "impossible combination of address sizes");
2451 ins
->addr_size
= addrbits
; /* Error recovery */
2454 defdisp
= ins
->addr_size
== 16 ? 16 : 32;
2456 for (j
= 0; j
< ins
->operands
; j
++) {
2457 if (!(MEM_OFFS
& ~ins
->oprs
[j
].type
) &&
2458 (ins
->oprs
[j
].disp_size
? ins
->oprs
[j
].disp_size
: defdisp
)
2459 != ins
->addr_size
) {
2460 /* mem_offs sizes must match the address size; if not,
2461 strip the MEM_OFFS bit and match only EA instructions */
2462 ins
->oprs
[j
].type
&= ~(MEM_OFFS
& ~MEMORY
);