doc/Makefile.in: avoid deleting opt_var.txt, fix dependencies
[nasm.git] / assemble.c
blobf15b11a8d3d691f4ac605361190a3698811f6173
1 /* assemble.c code generation for the Netwide Assembler
3 * The Netwide Assembler is copyright (C) 1996 Simon Tatham and
4 * Julian Hall. All rights reserved. The software is
5 * redistributable under the license given in the file "LICENSE"
6 * distributed in the NASM archive.
8 * the actual codes (C syntax, i.e. octal):
9 * \0 - terminates the code. (Unless it's a literal of course.)
10 * \1, \2, \3 - that many literal bytes follow in the code stream
11 * \4, \6 - the POP/PUSH (respectively) codes for CS, DS, ES, SS
12 * (POP is never used for CS) depending on operand 0
13 * \5, \7 - the second byte of POP/PUSH codes for FS, GS, depending
14 * on operand 0
15 * \10..\13 - a literal byte follows in the code stream, to be added
16 * to the register value of operand 0..3
17 * \14..\17 - a signed byte immediate operand, from operand 0..3
18 * \20..\23 - a byte immediate operand, from operand 0..3
19 * \24..\27 - an unsigned byte immediate operand, from operand 0..3
20 * \30..\33 - a word immediate operand, from operand 0..3
21 * \34..\37 - select between \3[0-3] and \4[0-3] depending on 16/32 bit
22 * assembly mode or the operand-size override on the operand
23 * \40..\43 - a long immediate operand, from operand 0..3
24 * \44..\47 - select between \3[0-3], \4[0-3] and \5[4-7]
25 * depending on the address size of the instruction.
26 * \50..\53 - a byte relative operand, from operand 0..3
27 * \54..\57 - a qword immediate operand, from operand 0..3
28 * \60..\63 - a word relative operand, from operand 0..3
29 * \64..\67 - select between \6[0-3] and \7[0-3] depending on 16/32 bit
30 * assembly mode or the operand-size override on the operand
31 * \70..\73 - a long relative operand, from operand 0..3
32 * \74..\77 - a word constant, from the _segment_ part of operand 0..3
33 * \1ab - a ModRM, calculated on EA in operand a, with the spare
34 * field the register value of operand b.
35 * \140..\143 - an immediate word or signed byte for operand 0..3
36 * \144..\147 - or 2 (s-field) into opcode byte if operand 0..3
37 * is a signed byte rather than a word. Opcode byte follows.
38 * \150..\153 - an immediate dword or signed byte for operand 0..3
39 * \154..\157 - or 2 (s-field) into opcode byte if operand 0..3
40 * is a signed byte rather than a word. Opcode byte follows.
41 * \160..\163 - this instruction uses DREX rather than REX, with the
42 * OC0 field set to 0, and the dest field taken from
43 * operand 0..3.
44 * \164..\167 - this instruction uses DREX rather than REX, with the
45 * OC0 field set to 1, and the dest field taken from
46 * operand 0..3.
47 * \170 - encodes the literal byte 0. (Some compilers don't take
48 * kindly to a zero byte in the _middle_ of a compile time
49 * string constant, so I had to put this hack in.)
50 * \171 - placement of DREX suffix in the absence of an EA
51 * \2ab - a ModRM, calculated on EA in operand a, with the spare
52 * field equal to digit b.
53 * \310 - indicates fixed 16-bit address size, i.e. optional 0x67.
54 * \311 - indicates fixed 32-bit address size, i.e. optional 0x67.
55 * \312 - (disassembler only) marker on LOOP, LOOPxx instructions.
56 * \313 - indicates fixed 64-bit address size, 0x67 invalid.
57 * \314 - (disassembler only) invalid with REX.B
58 * \315 - (disassembler only) invalid with REX.X
59 * \316 - (disassembler only) invalid with REX.R
60 * \317 - (disassembler only) invalid with REX.W
61 * \320 - indicates fixed 16-bit operand size, i.e. optional 0x66.
62 * \321 - indicates fixed 32-bit operand size, i.e. optional 0x66.
63 * \322 - indicates that this instruction is only valid when the
64 * operand size is the default (instruction to disassembler,
65 * generates no code in the assembler)
66 * \323 - indicates fixed 64-bit operand size, REX on extensions only.
67 * \324 - indicates 64-bit operand size requiring REX prefix.
68 * \330 - a literal byte follows in the code stream, to be added
69 * to the condition code value of the instruction.
70 * \331 - instruction not valid with REP prefix. Hint for
71 * disassembler only; for SSE instructions.
72 * \332 - REP prefix (0xF2 byte) used as opcode extension.
73 * \333 - REP prefix (0xF3 byte) used as opcode extension.
74 * \334 - LOCK prefix used instead of REX.R
75 * \335 - disassemble a rep (0xF3 byte) prefix as repe not rep.
76 * \340 - reserve <operand 0> bytes of uninitialized storage.
77 * Operand 0 had better be a segmentless constant.
78 * \364 - operand-size prefix (0x66) not permitted
79 * \365 - address-size prefix (0x67) not permitted
80 * \366 - operand-size prefix (0x66) used as opcode extension
81 * \367 - address-size prefix (0x67) used as opcode extension
82 * \370,\371,\372 - match only if operand 0 meets byte jump criteria.
83 * 370 is used for Jcc, 371 is used for JMP.
84 * \373 - assemble 0x03 if bits==16, 0x05 if bits==32;
85 * used for conditional jump over longer jump
88 #include "compiler.h"
90 #include <stdio.h>
91 #include <string.h>
92 #include <inttypes.h>
94 #include "nasm.h"
95 #include "nasmlib.h"
96 #include "assemble.h"
97 #include "insns.h"
98 #include "preproc.h"
99 #include "regflags.c"
100 #include "regvals.c"
102 typedef struct {
103 int sib_present; /* is a SIB byte necessary? */
104 int bytes; /* # of bytes of offset needed */
105 int size; /* lazy - this is sib+bytes+1 */
106 uint8_t modrm, sib, rex, rip; /* the bytes themselves */
107 } ea;
109 static uint32_t cpu; /* cpu level received from nasm.c */
110 static efunc errfunc;
111 static struct ofmt *outfmt;
112 static ListGen *list;
114 static int64_t calcsize(int32_t, int64_t, int, insn *, const char *);
115 static void gencode(int32_t, int64_t, int, insn *, const char *, int64_t);
116 static int matches(const struct itemplate *, insn *, int bits);
117 static int32_t regflag(const operand *);
118 static int32_t regval(const operand *);
119 static int rexflags(int, int32_t, int);
120 static int op_rexflags(const operand *, int);
121 static ea *process_ea(operand *, ea *, int, int, int, int32_t, int);
122 static void add_asp(insn *, int);
124 static int has_prefix(insn * ins, enum prefix_pos pos, enum prefixes prefix)
126 return ins->prefixes[pos] == prefix;
129 static void assert_no_prefix(insn * ins, enum prefix_pos pos)
131 if (ins->prefixes[pos])
132 errfunc(ERR_NONFATAL, "invalid %s prefix",
133 prefix_name(ins->prefixes[pos]));
136 static const char *size_name(int size)
138 switch (size) {
139 case 1:
140 return "byte";
141 case 2:
142 return "word";
143 case 4:
144 return "dword";
145 case 8:
146 return "qword";
147 case 10:
148 return "tword";
149 case 16:
150 return "oword";
151 default:
152 return "???";
156 static void warn_overflow(int size, int64_t data)
158 if (size < 8) {
159 int64_t lim = ((int64_t)1 << (size*8))-1;
161 if (data < ~lim || data > lim)
162 errfunc(ERR_WARNING | ERR_WARN_NOV, "%s data exceeds bounds", size_name(size));
166 * This routine wrappers the real output format's output routine,
167 * in order to pass a copy of the data off to the listing file
168 * generator at the same time.
170 static void out(int64_t offset, int32_t segto, const void *data,
171 enum out_type type, uint64_t size,
172 int32_t segment, int32_t wrt)
174 static int32_t lineno = 0; /* static!!! */
175 static char *lnfname = NULL;
176 uint8_t p[8];
178 if (type == OUT_ADDRESS && segment == NO_SEG && wrt == NO_SEG) {
180 * This is a non-relocated address, and we're going to
181 * convert it into RAWDATA format.
183 uint8_t *q = p;
185 if (size > 8) {
186 errfunc(ERR_PANIC, "OUT_ADDRESS with size > 8");
187 return;
190 WRITEADDR(q, *(int64_t *)data, size);
191 data = p;
192 type = OUT_RAWDATA;
195 list->output(offset, data, type, size);
198 * this call to src_get determines when we call the
199 * debug-format-specific "linenum" function
200 * it updates lineno and lnfname to the current values
201 * returning 0 if "same as last time", -2 if lnfname
202 * changed, and the amount by which lineno changed,
203 * if it did. thus, these variables must be static
206 if (src_get(&lineno, &lnfname)) {
207 outfmt->current_dfmt->linenum(lnfname, lineno, segto);
210 outfmt->output(segto, data, type, size, segment, wrt);
213 static int jmp_match(int32_t segment, int64_t offset, int bits,
214 insn * ins, const char *code)
216 int64_t isize;
217 uint8_t c = code[0];
219 if (c != 0370 && c != 0371)
220 return 0;
221 if (ins->oprs[0].opflags & OPFLAG_FORWARD) {
222 if ((optimizing < 0 || (ins->oprs[0].type & STRICT))
223 && c == 0370)
224 return 1;
225 else
226 return (pass0 == 0); /* match a forward reference */
228 isize = calcsize(segment, offset, bits, ins, code);
229 if (ins->oprs[0].segment != segment)
230 return 0;
231 isize = ins->oprs[0].offset - offset - isize; /* isize is now the delta */
232 if (isize >= -128L && isize <= 127L)
233 return 1; /* it is byte size */
235 return 0;
238 int64_t assemble(int32_t segment, int64_t offset, int bits, uint32_t cp,
239 insn * instruction, struct ofmt *output, efunc error,
240 ListGen * listgen)
242 const struct itemplate *temp;
243 int j;
244 int size_prob;
245 int64_t insn_end;
246 int32_t itimes;
247 int64_t start = offset;
248 int64_t wsize = 0; /* size for DB etc. */
250 errfunc = error; /* to pass to other functions */
251 cpu = cp;
252 outfmt = output; /* likewise */
253 list = listgen; /* and again */
255 switch (instruction->opcode) {
256 case -1:
257 return 0;
258 case I_DB:
259 wsize = 1;
260 break;
261 case I_DW:
262 wsize = 2;
263 break;
264 case I_DD:
265 wsize = 4;
266 break;
267 case I_DQ:
268 wsize = 8;
269 break;
270 case I_DT:
271 wsize = 10;
272 break;
273 case I_DO:
274 wsize = 16;
275 break;
276 default:
277 break;
280 if (wsize) {
281 extop *e;
282 int32_t t = instruction->times;
283 if (t < 0)
284 errfunc(ERR_PANIC,
285 "instruction->times < 0 (%ld) in assemble()", t);
287 while (t--) { /* repeat TIMES times */
288 for (e = instruction->eops; e; e = e->next) {
289 if (e->type == EOT_DB_NUMBER) {
290 if (wsize == 1) {
291 if (e->segment != NO_SEG)
292 errfunc(ERR_NONFATAL,
293 "one-byte relocation attempted");
294 else {
295 uint8_t out_byte = e->offset;
296 out(offset, segment, &out_byte,
297 OUT_RAWDATA, 1, NO_SEG, NO_SEG);
299 } else if (wsize > 8) {
300 errfunc(ERR_NONFATAL, "integer supplied to a DT or DO"
301 " instruction");
302 } else
303 out(offset, segment, &e->offset,
304 OUT_ADDRESS, wsize, e->segment, e->wrt);
305 offset += wsize;
306 } else if (e->type == EOT_DB_STRING) {
307 int align;
309 out(offset, segment, e->stringval,
310 OUT_RAWDATA, e->stringlen, NO_SEG, NO_SEG);
311 align = e->stringlen % wsize;
313 if (align) {
314 align = wsize - align;
315 out(offset, segment, "\0\0\0\0\0\0\0\0",
316 OUT_RAWDATA, align, NO_SEG, NO_SEG);
318 offset += e->stringlen + align;
321 if (t > 0 && t == instruction->times - 1) {
323 * Dummy call to list->output to give the offset to the
324 * listing module.
326 list->output(offset, NULL, OUT_RAWDATA, 0);
327 list->uplevel(LIST_TIMES);
330 if (instruction->times > 1)
331 list->downlevel(LIST_TIMES);
332 return offset - start;
335 if (instruction->opcode == I_INCBIN) {
336 static char fname[FILENAME_MAX];
337 FILE *fp;
338 int32_t len;
339 char *prefix = "", *combine;
340 char **pPrevPath = NULL;
342 len = FILENAME_MAX - 1;
343 if (len > instruction->eops->stringlen)
344 len = instruction->eops->stringlen;
345 strncpy(fname, instruction->eops->stringval, len);
346 fname[len] = '\0';
348 while (1) { /* added by alexfru: 'incbin' uses include paths */
349 combine = nasm_malloc(strlen(prefix) + len + 1);
350 strcpy(combine, prefix);
351 strcat(combine, fname);
353 if ((fp = fopen(combine, "rb")) != NULL) {
354 nasm_free(combine);
355 break;
358 nasm_free(combine);
359 pPrevPath = pp_get_include_path_ptr(pPrevPath);
360 if (pPrevPath == NULL)
361 break;
362 prefix = *pPrevPath;
365 if (fp == NULL)
366 error(ERR_NONFATAL, "`incbin': unable to open file `%s'",
367 fname);
368 else if (fseek(fp, 0L, SEEK_END) < 0)
369 error(ERR_NONFATAL, "`incbin': unable to seek on file `%s'",
370 fname);
371 else {
372 static char buf[2048];
373 int32_t t = instruction->times;
374 int32_t base = 0;
376 len = ftell(fp);
377 if (instruction->eops->next) {
378 base = instruction->eops->next->offset;
379 len -= base;
380 if (instruction->eops->next->next &&
381 len > instruction->eops->next->next->offset)
382 len = instruction->eops->next->next->offset;
385 * Dummy call to list->output to give the offset to the
386 * listing module.
388 list->output(offset, NULL, OUT_RAWDATA, 0);
389 list->uplevel(LIST_INCBIN);
390 while (t--) {
391 int32_t l;
393 fseek(fp, base, SEEK_SET);
394 l = len;
395 while (l > 0) {
396 int32_t m =
397 fread(buf, 1, (l > (int32_t) sizeof(buf) ? (int32_t) sizeof(buf) : l),
398 fp);
399 if (!m) {
401 * This shouldn't happen unless the file
402 * actually changes while we are reading
403 * it.
405 error(ERR_NONFATAL,
406 "`incbin': unexpected EOF while"
407 " reading file `%s'", fname);
408 t = 0; /* Try to exit cleanly */
409 break;
411 out(offset, segment, buf, OUT_RAWDATA, m,
412 NO_SEG, NO_SEG);
413 l -= m;
416 list->downlevel(LIST_INCBIN);
417 if (instruction->times > 1) {
419 * Dummy call to list->output to give the offset to the
420 * listing module.
422 list->output(offset, NULL, OUT_RAWDATA, 0);
423 list->uplevel(LIST_TIMES);
424 list->downlevel(LIST_TIMES);
426 fclose(fp);
427 return instruction->times * len;
429 return 0; /* if we're here, there's an error */
432 /* Check to see if we need an address-size prefix */
433 add_asp(instruction, bits);
435 size_prob = false;
437 for (temp = nasm_instructions[instruction->opcode]; temp->opcode != -1; temp++){
438 int m = matches(temp, instruction, bits);
440 if (m == 99)
441 m += jmp_match(segment, offset, bits, instruction, temp->code);
443 if (m == 100) { /* matches! */
444 const char *codes = temp->code;
445 int64_t insn_size = calcsize(segment, offset, bits,
446 instruction, codes);
447 itimes = instruction->times;
448 if (insn_size < 0) /* shouldn't be, on pass two */
449 error(ERR_PANIC, "errors made it through from pass one");
450 else
451 while (itimes--) {
452 for (j = 0; j < MAXPREFIX; j++) {
453 uint8_t c = 0;
454 switch (instruction->prefixes[j]) {
455 case P_LOCK:
456 c = 0xF0;
457 break;
458 case P_REPNE:
459 case P_REPNZ:
460 c = 0xF2;
461 break;
462 case P_REPE:
463 case P_REPZ:
464 case P_REP:
465 c = 0xF3;
466 break;
467 case R_CS:
468 if (bits == 64) {
469 error(ERR_WARNING,
470 "cs segment base generated, but will be ignored in 64-bit mode");
472 c = 0x2E;
473 break;
474 case R_DS:
475 if (bits == 64) {
476 error(ERR_WARNING,
477 "ds segment base generated, but will be ignored in 64-bit mode");
479 c = 0x3E;
480 break;
481 case R_ES:
482 if (bits == 64) {
483 error(ERR_WARNING,
484 "es segment base generated, but will be ignored in 64-bit mode");
486 c = 0x26;
487 break;
488 case R_FS:
489 c = 0x64;
490 break;
491 case R_GS:
492 c = 0x65;
493 break;
494 case R_SS:
495 if (bits == 64) {
496 error(ERR_WARNING,
497 "ss segment base generated, but will be ignored in 64-bit mode");
499 c = 0x36;
500 break;
501 case R_SEGR6:
502 case R_SEGR7:
503 error(ERR_NONFATAL,
504 "segr6 and segr7 cannot be used as prefixes");
505 break;
506 case P_A16:
507 if (bits == 64) {
508 error(ERR_NONFATAL,
509 "16-bit addressing is not supported "
510 "in 64-bit mode");
511 } else if (bits != 16)
512 c = 0x67;
513 break;
514 case P_A32:
515 if (bits != 32)
516 c = 0x67;
517 break;
518 case P_A64:
519 if (bits != 64) {
520 error(ERR_NONFATAL,
521 "64-bit addressing is only supported "
522 "in 64-bit mode");
524 break;
525 case P_ASP:
526 c = 0x67;
527 break;
528 case P_O16:
529 if (bits != 16)
530 c = 0x66;
531 break;
532 case P_O32:
533 if (bits == 16)
534 c = 0x66;
535 break;
536 case P_O64:
537 /* REX.W */
538 break;
539 case P_OSP:
540 c = 0x66;
541 break;
542 case P_none:
543 break;
544 default:
545 error(ERR_PANIC, "invalid instruction prefix");
547 if (c != 0) {
548 out(offset, segment, &c, OUT_RAWDATA, 1,
549 NO_SEG, NO_SEG);
550 offset++;
553 insn_end = offset + insn_size;
554 gencode(segment, offset, bits, instruction, codes,
555 insn_end);
556 offset += insn_size;
557 if (itimes > 0 && itimes == instruction->times - 1) {
559 * Dummy call to list->output to give the offset to the
560 * listing module.
562 list->output(offset, NULL, OUT_RAWDATA, 0);
563 list->uplevel(LIST_TIMES);
566 if (instruction->times > 1)
567 list->downlevel(LIST_TIMES);
568 return offset - start;
569 } else if (m > 0 && m > size_prob) {
570 size_prob = m;
572 // temp++;
575 if (temp->opcode == -1) { /* didn't match any instruction */
576 switch (size_prob) {
577 case 1:
578 error(ERR_NONFATAL, "operation size not specified");
579 break;
580 case 2:
581 error(ERR_NONFATAL, "mismatch in operand sizes");
582 break;
583 case 3:
584 error(ERR_NONFATAL, "no instruction for this cpu level");
585 break;
586 case 4:
587 error(ERR_NONFATAL, "instruction not supported in 64-bit mode");
588 break;
589 default:
590 error(ERR_NONFATAL,
591 "invalid combination of opcode and operands");
592 break;
595 return 0;
598 int64_t insn_size(int32_t segment, int64_t offset, int bits, uint32_t cp,
599 insn * instruction, efunc error)
601 const struct itemplate *temp;
603 errfunc = error; /* to pass to other functions */
604 cpu = cp;
606 if (instruction->opcode == -1)
607 return 0;
609 if (instruction->opcode == I_DB || instruction->opcode == I_DW ||
610 instruction->opcode == I_DD || instruction->opcode == I_DQ ||
611 instruction->opcode == I_DT || instruction->opcode == I_DO) {
612 extop *e;
613 int32_t isize, osize, wsize = 0; /* placate gcc */
615 isize = 0;
616 switch (instruction->opcode) {
617 case I_DB:
618 wsize = 1;
619 break;
620 case I_DW:
621 wsize = 2;
622 break;
623 case I_DD:
624 wsize = 4;
625 break;
626 case I_DQ:
627 wsize = 8;
628 break;
629 case I_DT:
630 wsize = 10;
631 break;
632 case I_DO:
633 wsize = 16;
634 break;
635 default:
636 break;
639 for (e = instruction->eops; e; e = e->next) {
640 int32_t align;
642 osize = 0;
643 if (e->type == EOT_DB_NUMBER)
644 osize = 1;
645 else if (e->type == EOT_DB_STRING)
646 osize = e->stringlen;
648 align = (-osize) % wsize;
649 if (align < 0)
650 align += wsize;
651 isize += osize + align;
653 return isize * instruction->times;
656 if (instruction->opcode == I_INCBIN) {
657 char fname[FILENAME_MAX];
658 FILE *fp;
659 int32_t len;
660 char *prefix = "", *combine;
661 char **pPrevPath = NULL;
663 len = FILENAME_MAX - 1;
664 if (len > instruction->eops->stringlen)
665 len = instruction->eops->stringlen;
666 strncpy(fname, instruction->eops->stringval, len);
667 fname[len] = '\0';
669 /* added by alexfru: 'incbin' uses include paths */
670 while (1) {
671 combine = nasm_malloc(strlen(prefix) + len + 1);
672 strcpy(combine, prefix);
673 strcat(combine, fname);
675 if ((fp = fopen(combine, "rb")) != NULL) {
676 nasm_free(combine);
677 break;
680 nasm_free(combine);
681 pPrevPath = pp_get_include_path_ptr(pPrevPath);
682 if (pPrevPath == NULL)
683 break;
684 prefix = *pPrevPath;
687 if (fp == NULL)
688 error(ERR_NONFATAL, "`incbin': unable to open file `%s'",
689 fname);
690 else if (fseek(fp, 0L, SEEK_END) < 0)
691 error(ERR_NONFATAL, "`incbin': unable to seek on file `%s'",
692 fname);
693 else {
694 len = ftell(fp);
695 fclose(fp);
696 if (instruction->eops->next) {
697 len -= instruction->eops->next->offset;
698 if (instruction->eops->next->next &&
699 len > instruction->eops->next->next->offset) {
700 len = instruction->eops->next->next->offset;
703 return instruction->times * len;
705 return 0; /* if we're here, there's an error */
708 /* Check to see if we need an address-size prefix */
709 add_asp(instruction, bits);
711 for (temp = nasm_instructions[instruction->opcode]; temp->opcode != -1; temp++) {
712 int m = matches(temp, instruction, bits);
713 if (m == 99)
714 m += jmp_match(segment, offset, bits, instruction, temp->code);
716 if (m == 100) {
717 /* we've matched an instruction. */
718 int64_t isize;
719 const char *codes = temp->code;
720 int j;
722 isize = calcsize(segment, offset, bits, instruction, codes);
723 if (isize < 0)
724 return -1;
725 for (j = 0; j < MAXPREFIX; j++) {
726 switch (instruction->prefixes[j]) {
727 case P_A16:
728 if (bits != 16)
729 isize++;
730 break;
731 case P_A32:
732 if (bits != 32)
733 isize++;
734 break;
735 case P_O16:
736 if (bits != 16)
737 isize++;
738 break;
739 case P_O32:
740 if (bits == 16)
741 isize++;
742 break;
743 case P_A64:
744 case P_O64:
745 case P_none:
746 break;
747 default:
748 isize++;
749 break;
752 return isize * instruction->times;
755 return -1; /* didn't match any instruction */
758 /* check that opn[op] is a signed byte of size 16 or 32,
759 and return the signed value*/
760 static int is_sbyte(insn * ins, int op, int size)
762 int32_t v;
763 int ret;
765 ret = !(ins->forw_ref && ins->oprs[op].opflags) && /* dead in the water on forward reference or External */
766 optimizing >= 0 &&
767 !(ins->oprs[op].type & STRICT) &&
768 ins->oprs[op].wrt == NO_SEG && ins->oprs[op].segment == NO_SEG;
770 v = ins->oprs[op].offset;
771 if (size == 16)
772 v = (int16_t)v; /* sign extend if 16 bits */
774 return ret && v >= -128L && v <= 127L;
777 static int64_t calcsize(int32_t segment, int64_t offset, int bits,
778 insn * ins, const char *codes)
780 int64_t length = 0;
781 uint8_t c;
782 int rex_mask = ~0;
783 struct operand *opx;
785 ins->rex = 0; /* Ensure REX is reset */
787 if (ins->prefixes[PPS_OSIZE] == P_O64)
788 ins->rex |= REX_W;
790 (void)segment; /* Don't warn that this parameter is unused */
791 (void)offset; /* Don't warn that this parameter is unused */
793 while (*codes) {
794 c = *codes++;
795 opx = &ins->oprs[c & 3];
796 switch (c) {
797 case 01:
798 case 02:
799 case 03:
800 codes += c, length += c;
801 break;
802 case 04:
803 case 05:
804 case 06:
805 case 07:
806 length++;
807 break;
808 case 010:
809 case 011:
810 case 012:
811 case 013:
812 ins->rex |=
813 op_rexflags(opx, REX_B|REX_H|REX_P|REX_W);
814 codes++, length++;
815 break;
816 case 014:
817 case 015:
818 case 016:
819 case 017:
820 length++;
821 break;
822 case 020:
823 case 021:
824 case 022:
825 case 023:
826 length++;
827 break;
828 case 024:
829 case 025:
830 case 026:
831 case 027:
832 length++;
833 break;
834 case 030:
835 case 031:
836 case 032:
837 case 033:
838 length += 2;
839 break;
840 case 034:
841 case 035:
842 case 036:
843 case 037:
844 if (opx->type & (BITS16 | BITS32 | BITS64))
845 length += (opx->type & BITS16) ? 2 : 4;
846 else
847 length += (bits == 16) ? 2 : 4;
848 break;
849 case 040:
850 case 041:
851 case 042:
852 case 043:
853 length += 4;
854 break;
855 case 044:
856 case 045:
857 case 046:
858 case 047:
859 length += ins->addr_size >> 3;
860 break;
861 case 050:
862 case 051:
863 case 052:
864 case 053:
865 length++;
866 break;
867 case 054:
868 case 055:
869 case 056:
870 case 057:
871 length += 8; /* MOV reg64/imm */
872 break;
873 case 060:
874 case 061:
875 case 062:
876 case 063:
877 length += 2;
878 break;
879 case 064:
880 case 065:
881 case 066:
882 case 067:
883 if (opx->type & (BITS16 | BITS32 | BITS64))
884 length += (opx->type & BITS16) ? 2 : 4;
885 else
886 length += (bits == 16) ? 2 : 4;
887 break;
888 case 070:
889 case 071:
890 case 072:
891 case 073:
892 length += 4;
893 break;
894 case 074:
895 case 075:
896 case 076:
897 case 077:
898 length += 2;
899 break;
900 case 0140:
901 case 0141:
902 case 0142:
903 case 0143:
904 length += is_sbyte(ins, c & 3, 16) ? 1 : 2;
905 break;
906 case 0144:
907 case 0145:
908 case 0146:
909 case 0147:
910 codes++;
911 length++;
912 break;
913 case 0150:
914 case 0151:
915 case 0152:
916 case 0153:
917 length += is_sbyte(ins, c & 3, 32) ? 1 : 4;
918 break;
919 case 0154:
920 case 0155:
921 case 0156:
922 case 0157:
923 codes++;
924 length++;
925 break;
926 case 0160:
927 case 0161:
928 case 0162:
929 case 0163:
930 length++;
931 ins->rex |= REX_D;
932 ins->drexdst = regval(&ins->oprs[c & 3]);
933 break;
934 case 0164:
935 case 0165:
936 case 0166:
937 case 0167:
938 length++;
939 ins->rex |= REX_D|REX_OC;
940 ins->drexdst = regval(&ins->oprs[c & 3]);
941 break;
942 case 0170:
943 length++;
944 break;
945 case 0171:
946 break;
947 case 0300:
948 case 0301:
949 case 0302:
950 case 0303:
951 break;
952 case 0310:
953 if (bits == 64)
954 return -1;
955 length += (bits != 16) && !has_prefix(ins, PPS_ASIZE, P_A16);
956 break;
957 case 0311:
958 length += (bits != 32) && !has_prefix(ins, PPS_ASIZE, P_A32);
959 break;
960 case 0312:
961 break;
962 case 0313:
963 if (bits != 64 || has_prefix(ins, PPS_ASIZE, P_A16) ||
964 has_prefix(ins, PPS_ASIZE, P_A32))
965 return -1;
966 break;
967 case 0314:
968 case 0315:
969 case 0316:
970 case 0317:
971 break;
972 case 0320:
973 length += (bits != 16);
974 break;
975 case 0321:
976 length += (bits == 16);
977 break;
978 case 0322:
979 break;
980 case 0323:
981 rex_mask &= ~REX_W;
982 break;
983 case 0324:
984 ins->rex |= REX_W;
985 break;
986 case 0330:
987 codes++, length++;
988 break;
989 case 0331:
990 break;
991 case 0332:
992 case 0333:
993 length++;
994 break;
995 case 0334:
996 ins->rex |= REX_L;
997 break;
998 case 0335:
999 break;
1000 case 0340:
1001 if (ins->oprs[0].segment != NO_SEG)
1002 errfunc(ERR_NONFATAL, "attempt to reserve non-constant"
1003 " quantity of BSS space");
1004 else
1005 length += ins->oprs[0].offset;
1006 break;
1007 case 0364:
1008 case 0365:
1009 break;
1010 case 0366:
1011 case 0367:
1012 length++;
1013 break;
1014 case 0370:
1015 case 0371:
1016 case 0372:
1017 break;
1018 case 0373:
1019 length++;
1020 break;
1021 default: /* can't do it by 'case' statements */
1022 if (c >= 0100 && c <= 0277) { /* it's an EA */
1023 ea ea_data;
1024 int rfield;
1025 int32_t rflags;
1026 ea_data.rex = 0; /* Ensure ea.REX is initially 0 */
1028 if (c <= 0177) {
1029 /* pick rfield from operand b */
1030 rflags = regflag(&ins->oprs[c & 7]);
1031 rfield = regvals[ins->oprs[c & 7].basereg];
1032 } else {
1033 rflags = 0;
1034 rfield = c & 7;
1037 if (!process_ea
1038 (&ins->oprs[(c >> 3) & 7], &ea_data, bits,
1039 ins->addr_size, rfield, rflags, ins->forw_ref)) {
1040 errfunc(ERR_NONFATAL, "invalid effective address");
1041 return -1;
1042 } else {
1043 ins->rex |= ea_data.rex;
1044 length += ea_data.size;
1046 } else {
1047 errfunc(ERR_PANIC, "internal instruction table corrupt"
1048 ": instruction code 0x%02X given", c);
1053 ins->rex &= rex_mask;
1055 if (ins->rex & REX_D) {
1056 if (ins->rex & REX_H) {
1057 errfunc(ERR_NONFATAL, "cannot use high register in drex instruction");
1058 return -1;
1060 if (bits != 64 && ((ins->rex & (REX_W|REX_X|REX_B)) ||
1061 ins->drexdst > 7)) {
1062 errfunc(ERR_NONFATAL, "invalid operands in non-64-bit mode");
1063 return -1;
1065 length++;
1066 } else if (ins->rex & REX_REAL) {
1067 if (ins->rex & REX_H) {
1068 errfunc(ERR_NONFATAL, "cannot use high register in rex instruction");
1069 return -1;
1070 } else if (bits == 64) {
1071 length++;
1072 } else if ((ins->rex & REX_L) &&
1073 !(ins->rex & (REX_P|REX_W|REX_X|REX_B)) &&
1074 cpu >= IF_X86_64) {
1075 /* LOCK-as-REX.R */
1076 assert_no_prefix(ins, PPS_LREP);
1077 length++;
1078 } else {
1079 errfunc(ERR_NONFATAL, "invalid operands in non-64-bit mode");
1080 return -1;
1084 return length;
1087 #define EMIT_REX() \
1088 if (!(ins->rex & REX_D) && (ins->rex & REX_REAL) && (bits == 64)) { \
1089 ins->rex = (ins->rex & REX_REAL)|REX_P; \
1090 out(offset, segment, &ins->rex, OUT_RAWDATA, 1, NO_SEG, NO_SEG); \
1091 ins->rex = 0; \
1092 offset += 1; \
1095 static void gencode(int32_t segment, int64_t offset, int bits,
1096 insn * ins, const char *codes, int64_t insn_end)
1098 static char condval[] = { /* conditional opcodes */
1099 0x7, 0x3, 0x2, 0x6, 0x2, 0x4, 0xF, 0xD, 0xC, 0xE, 0x6, 0x2,
1100 0x3, 0x7, 0x3, 0x5, 0xE, 0xC, 0xD, 0xF, 0x1, 0xB, 0x9, 0x5,
1101 0x0, 0xA, 0xA, 0xB, 0x8, 0x4
1103 uint8_t c;
1104 uint8_t bytes[4];
1105 int64_t size;
1106 int64_t data;
1107 struct operand *opx;
1109 while (*codes) {
1110 c = *codes++;
1111 opx = &ins->oprs[c & 3];
1112 switch (c) {
1113 case 01:
1114 case 02:
1115 case 03:
1116 EMIT_REX();
1117 out(offset, segment, codes, OUT_RAWDATA, c, NO_SEG, NO_SEG);
1118 codes += c;
1119 offset += c;
1120 break;
1122 case 04:
1123 case 06:
1124 switch (ins->oprs[0].basereg) {
1125 case R_CS:
1126 bytes[0] = 0x0E + (c == 0x04 ? 1 : 0);
1127 break;
1128 case R_DS:
1129 bytes[0] = 0x1E + (c == 0x04 ? 1 : 0);
1130 break;
1131 case R_ES:
1132 bytes[0] = 0x06 + (c == 0x04 ? 1 : 0);
1133 break;
1134 case R_SS:
1135 bytes[0] = 0x16 + (c == 0x04 ? 1 : 0);
1136 break;
1137 default:
1138 errfunc(ERR_PANIC,
1139 "bizarre 8086 segment register received");
1141 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1142 offset++;
1143 break;
1145 case 05:
1146 case 07:
1147 switch (ins->oprs[0].basereg) {
1148 case R_FS:
1149 bytes[0] = 0xA0 + (c == 0x05 ? 1 : 0);
1150 break;
1151 case R_GS:
1152 bytes[0] = 0xA8 + (c == 0x05 ? 1 : 0);
1153 break;
1154 default:
1155 errfunc(ERR_PANIC,
1156 "bizarre 386 segment register received");
1158 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1159 offset++;
1160 break;
1162 case 010:
1163 case 011:
1164 case 012:
1165 case 013:
1166 EMIT_REX();
1167 bytes[0] = *codes++ + ((regval(opx)) & 7);
1168 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1169 offset += 1;
1170 break;
1172 case 014:
1173 case 015:
1174 case 016:
1175 case 017:
1176 if (opx->offset < -128 || opx->offset > 127) {
1177 errfunc(ERR_WARNING | ERR_WARN_NOV,
1178 "signed byte value exceeds bounds");
1181 if (opx->segment != NO_SEG) {
1182 data = opx->offset;
1183 out(offset, segment, &data, OUT_ADDRESS, 1,
1184 opx->segment, opx->wrt);
1185 } else {
1186 bytes[0] = opx->offset;
1187 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG,
1188 NO_SEG);
1190 offset += 1;
1191 break;
1193 case 020:
1194 case 021:
1195 case 022:
1196 case 023:
1197 if (opx->offset < -256 || opx->offset > 255) {
1198 errfunc(ERR_WARNING | ERR_WARN_NOV,
1199 "byte value exceeds bounds");
1201 if (opx->segment != NO_SEG) {
1202 data = opx->offset;
1203 out(offset, segment, &data, OUT_ADDRESS, 1,
1204 opx->segment, opx->wrt);
1205 } else {
1206 bytes[0] = opx->offset;
1207 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG,
1208 NO_SEG);
1210 offset += 1;
1211 break;
1213 case 024:
1214 case 025:
1215 case 026:
1216 case 027:
1217 if (opx->offset < 0 || opx->offset > 255)
1218 errfunc(ERR_WARNING | ERR_WARN_NOV,
1219 "unsigned byte value exceeds bounds");
1220 if (opx->segment != NO_SEG) {
1221 data = opx->offset;
1222 out(offset, segment, &data, OUT_ADDRESS, 1,
1223 opx->segment, opx->wrt);
1224 } else {
1225 bytes[0] = opx->offset;
1226 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG,
1227 NO_SEG);
1229 offset += 1;
1230 break;
1232 case 030:
1233 case 031:
1234 case 032:
1235 case 033:
1236 data = opx->offset;
1237 if (opx->segment == NO_SEG && opx->wrt == NO_SEG)
1238 warn_overflow(2, data);
1239 out(offset, segment, &data, OUT_ADDRESS, 2,
1240 opx->segment, opx->wrt);
1241 offset += 2;
1242 break;
1244 case 034:
1245 case 035:
1246 case 036:
1247 case 037:
1248 if (opx->type & (BITS16 | BITS32))
1249 size = (opx->type & BITS16) ? 2 : 4;
1250 else
1251 size = (bits == 16) ? 2 : 4;
1252 data = opx->offset;
1253 if (opx->segment == NO_SEG && opx->wrt == NO_SEG)
1254 warn_overflow(size, data);
1255 out(offset, segment, &data, OUT_ADDRESS, size,
1256 opx->segment, opx->wrt);
1257 offset += size;
1258 break;
1260 case 040:
1261 case 041:
1262 case 042:
1263 case 043:
1264 data = opx->offset;
1265 if (opx->segment == NO_SEG && opx->wrt == NO_SEG)
1266 warn_overflow(4, data);
1267 out(offset, segment, &data, OUT_ADDRESS, 4,
1268 opx->segment, opx->wrt);
1269 offset += 4;
1270 break;
1272 case 044:
1273 case 045:
1274 case 046:
1275 case 047:
1276 data = opx->offset;
1277 size = ins->addr_size >> 3;
1278 if (opx->segment == NO_SEG &&
1279 opx->wrt == NO_SEG)
1280 warn_overflow(size, data);
1281 out(offset, segment, &data, OUT_ADDRESS, size,
1282 opx->segment, opx->wrt);
1283 offset += size;
1284 break;
1286 case 050:
1287 case 051:
1288 case 052:
1289 case 053:
1290 if (opx->segment != segment)
1291 errfunc(ERR_NONFATAL,
1292 "short relative jump outside segment");
1293 data = opx->offset - insn_end;
1294 if (data > 127 || data < -128)
1295 errfunc(ERR_NONFATAL, "short jump is out of range");
1296 bytes[0] = data;
1297 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1298 offset += 1;
1299 break;
1301 case 054:
1302 case 055:
1303 case 056:
1304 case 057:
1305 data = (int64_t)opx->offset;
1306 out(offset, segment, &data, OUT_ADDRESS, 8,
1307 opx->segment, opx->wrt);
1308 offset += 8;
1309 break;
1311 case 060:
1312 case 061:
1313 case 062:
1314 case 063:
1315 if (opx->segment != segment) {
1316 data = opx->offset;
1317 out(offset, segment, &data,
1318 OUT_REL2ADR, insn_end - offset,
1319 opx->segment, opx->wrt);
1320 } else {
1321 data = opx->offset - insn_end;
1322 out(offset, segment, &data,
1323 OUT_ADDRESS, 2, NO_SEG, NO_SEG);
1325 offset += 2;
1326 break;
1328 case 064:
1329 case 065:
1330 case 066:
1331 case 067:
1332 if (opx->type & (BITS16 | BITS32 | BITS64))
1333 size = (opx->type & BITS16) ? 2 : 4;
1334 else
1335 size = (bits == 16) ? 2 : 4;
1336 if (opx->segment != segment) {
1337 data = opx->offset;
1338 out(offset, segment, &data,
1339 size == 2 ? OUT_REL2ADR : OUT_REL4ADR,
1340 insn_end - offset, opx->segment, opx->wrt);
1341 } else {
1342 data = opx->offset - insn_end;
1343 out(offset, segment, &data,
1344 OUT_ADDRESS, size, NO_SEG, NO_SEG);
1346 offset += size;
1347 break;
1349 case 070:
1350 case 071:
1351 case 072:
1352 case 073:
1353 if (opx->segment != segment) {
1354 data = opx->offset;
1355 out(offset, segment, &data,
1356 OUT_REL4ADR, insn_end - offset,
1357 opx->segment, opx->wrt);
1358 } else {
1359 data = opx->offset - insn_end;
1360 out(offset, segment, &data,
1361 OUT_ADDRESS, 4, NO_SEG, NO_SEG);
1363 offset += 4;
1364 break;
1366 case 074:
1367 case 075:
1368 case 076:
1369 case 077:
1370 if (opx->segment == NO_SEG)
1371 errfunc(ERR_NONFATAL, "value referenced by FAR is not"
1372 " relocatable");
1373 data = 0L;
1374 out(offset, segment, &data, OUT_ADDRESS, 2,
1375 outfmt->segbase(1 + opx->segment),
1376 opx->wrt);
1377 offset += 2;
1378 break;
1380 case 0140:
1381 case 0141:
1382 case 0142:
1383 case 0143:
1384 data = opx->offset;
1385 if (is_sbyte(ins, c & 3, 16)) {
1386 bytes[0] = data;
1387 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG,
1388 NO_SEG);
1389 offset++;
1390 } else {
1391 if (opx->segment == NO_SEG &&
1392 opx->wrt == NO_SEG)
1393 warn_overflow(2, data);
1394 out(offset, segment, &data, OUT_ADDRESS, 2,
1395 opx->segment, opx->wrt);
1396 offset += 2;
1398 break;
1400 case 0144:
1401 case 0145:
1402 case 0146:
1403 case 0147:
1404 EMIT_REX();
1405 bytes[0] = *codes++;
1406 if (is_sbyte(ins, c & 3, 16))
1407 bytes[0] |= 2; /* s-bit */
1408 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1409 offset++;
1410 break;
1412 case 0150:
1413 case 0151:
1414 case 0152:
1415 case 0153:
1416 data = opx->offset;
1417 if (is_sbyte(ins, c & 3, 32)) {
1418 bytes[0] = data;
1419 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG,
1420 NO_SEG);
1421 offset++;
1422 } else {
1423 out(offset, segment, &data, OUT_ADDRESS, 4,
1424 opx->segment, opx->wrt);
1425 offset += 4;
1427 break;
1429 case 0154:
1430 case 0155:
1431 case 0156:
1432 case 0157:
1433 EMIT_REX();
1434 bytes[0] = *codes++;
1435 if (is_sbyte(ins, c & 3, 32))
1436 bytes[0] |= 2; /* s-bit */
1437 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1438 offset++;
1439 break;
1441 case 0160:
1442 case 0161:
1443 case 0162:
1444 case 0163:
1445 case 0164:
1446 case 0165:
1447 case 0166:
1448 case 0167:
1449 break;
1451 case 0170:
1452 EMIT_REX();
1453 bytes[0] = 0;
1454 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1455 offset += 1;
1456 break;
1458 case 0171:
1459 bytes[0] =
1460 (ins->drexdst << 4) |
1461 (ins->rex & REX_OC ? 0x08 : 0) |
1462 (ins->rex & (REX_R|REX_X|REX_B));
1463 ins->rex = 0;
1464 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1465 offset++;
1466 break;
1468 case 0300:
1469 case 0301:
1470 case 0302:
1471 case 0303:
1472 break;
1474 case 0310:
1475 if (bits == 32 && !has_prefix(ins, PPS_ASIZE, P_A16)) {
1476 *bytes = 0x67;
1477 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1478 offset += 1;
1479 } else
1480 offset += 0;
1481 break;
1483 case 0311:
1484 if (bits != 32 && !has_prefix(ins, PPS_ASIZE, P_A32)) {
1485 *bytes = 0x67;
1486 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1487 offset += 1;
1488 } else
1489 offset += 0;
1490 break;
1492 case 0312:
1493 break;
1495 case 0313:
1496 ins->rex = 0;
1497 break;
1499 case 0314:
1500 case 0315:
1501 case 0316:
1502 case 0317:
1503 break;
1505 case 0320:
1506 if (bits != 16) {
1507 *bytes = 0x66;
1508 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1509 offset += 1;
1510 } else
1511 offset += 0;
1512 break;
1514 case 0321:
1515 if (bits == 16) {
1516 *bytes = 0x66;
1517 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1518 offset += 1;
1519 } else
1520 offset += 0;
1521 break;
1523 case 0322:
1524 case 0323:
1525 break;
1527 case 0324:
1528 ins->rex |= REX_W;
1529 break;
1531 case 0330:
1532 *bytes = *codes++ ^ condval[ins->condition];
1533 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1534 offset += 1;
1535 break;
1537 case 0331:
1538 break;
1540 case 0332:
1541 case 0333:
1542 *bytes = c - 0332 + 0xF2;
1543 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1544 offset += 1;
1545 break;
1547 case 0334:
1548 if (ins->rex & REX_R) {
1549 *bytes = 0xF0;
1550 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1551 offset += 1;
1553 ins->rex &= ~(REX_L|REX_R);
1554 break;
1556 case 0335:
1557 break;
1559 case 0340:
1560 if (ins->oprs[0].segment != NO_SEG)
1561 errfunc(ERR_PANIC, "non-constant BSS size in pass two");
1562 else {
1563 int64_t size = ins->oprs[0].offset;
1564 if (size > 0)
1565 out(offset, segment, NULL,
1566 OUT_RESERVE, size, NO_SEG, NO_SEG);
1567 offset += size;
1569 break;
1571 case 0364:
1572 case 0365:
1573 break;
1575 case 0366:
1576 case 0367:
1577 *bytes = c - 0366 + 0x66;
1578 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1579 offset += 1;
1580 break;
1582 case 0370:
1583 case 0371:
1584 case 0372:
1585 break;
1587 case 0373:
1588 *bytes = bits == 16 ? 3 : 5;
1589 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1590 offset += 1;
1591 break;
1593 default: /* can't do it by 'case' statements */
1594 if (c >= 0100 && c <= 0277) { /* it's an EA */
1595 ea ea_data;
1596 int rfield;
1597 int32_t rflags;
1598 uint8_t *p;
1599 int32_t s;
1601 if (c <= 0177) {
1602 /* pick rfield from operand b */
1603 rflags = regflag(&ins->oprs[c & 7]);
1604 rfield = regvals[ins->oprs[c & 7].basereg];
1605 } else {
1606 /* rfield is constant */
1607 rflags = 0;
1608 rfield = c & 7;
1611 if (!process_ea
1612 (&ins->oprs[(c >> 3) & 7], &ea_data, bits,
1613 ins->addr_size, rfield, rflags, ins->forw_ref)) {
1614 errfunc(ERR_NONFATAL, "invalid effective address");
1618 p = bytes;
1619 *p++ = ea_data.modrm;
1620 if (ea_data.sib_present)
1621 *p++ = ea_data.sib;
1623 /* DREX suffixes come between the SIB and the displacement */
1624 if (ins->rex & REX_D) {
1625 *p++ =
1626 (ins->drexdst << 4) |
1627 (ins->rex & REX_OC ? 0x08 : 0) |
1628 (ins->rex & (REX_R|REX_X|REX_B));
1629 ins->rex = 0;
1632 s = p - bytes;
1633 out(offset, segment, bytes, OUT_RAWDATA, s, NO_SEG, NO_SEG);
1635 switch (ea_data.bytes) {
1636 case 0:
1637 break;
1638 case 1:
1639 if (ins->oprs[(c >> 3) & 7].segment != NO_SEG) {
1640 data = ins->oprs[(c >> 3) & 7].offset;
1641 out(offset, segment, &data, OUT_ADDRESS, 1,
1642 ins->oprs[(c >> 3) & 7].segment,
1643 ins->oprs[(c >> 3) & 7].wrt);
1644 } else {
1645 *bytes = ins->oprs[(c >> 3) & 7].offset;
1646 out(offset, segment, bytes, OUT_RAWDATA, 1,
1647 NO_SEG, NO_SEG);
1649 s++;
1650 break;
1651 case 8:
1652 case 2:
1653 case 4:
1654 data = ins->oprs[(c >> 3) & 7].offset;
1655 warn_overflow(ea_data.bytes, data);
1656 out(offset, segment, &data,
1657 ea_data.rip ? OUT_REL4ADR : OUT_ADDRESS,
1658 ea_data.bytes,
1659 ins->oprs[(c >> 3) & 7].segment,
1660 ins->oprs[(c >> 3) & 7].wrt);
1661 s += ea_data.bytes;
1662 break;
1664 offset += s;
1665 } else {
1666 errfunc(ERR_PANIC, "internal instruction table corrupt"
1667 ": instruction code 0x%02X given", c);
1673 static int32_t regflag(const operand * o)
1675 if (o->basereg < EXPR_REG_START || o->basereg >= REG_ENUM_LIMIT) {
1676 errfunc(ERR_PANIC, "invalid operand passed to regflag()");
1678 return reg_flags[o->basereg];
1681 static int32_t regval(const operand * o)
1683 if (o->basereg < EXPR_REG_START || o->basereg >= REG_ENUM_LIMIT) {
1684 errfunc(ERR_PANIC, "invalid operand passed to regval()");
1686 return regvals[o->basereg];
1689 static int op_rexflags(const operand * o, int mask)
1691 int32_t flags;
1692 int val;
1694 if (o->basereg < EXPR_REG_START || o->basereg >= REG_ENUM_LIMIT) {
1695 errfunc(ERR_PANIC, "invalid operand passed to op_rexflags()");
1698 flags = reg_flags[o->basereg];
1699 val = regvals[o->basereg];
1701 return rexflags(val, flags, mask);
1704 static int rexflags(int val, int32_t flags, int mask)
1706 int rex = 0;
1708 if (val >= 8)
1709 rex |= REX_B|REX_X|REX_R;
1710 if (flags & BITS64)
1711 rex |= REX_W;
1712 if (!(REG_HIGH & ~flags)) /* AH, CH, DH, BH */
1713 rex |= REX_H;
1714 else if (!(REG8 & ~flags) && val >= 4) /* SPL, BPL, SIL, DIL */
1715 rex |= REX_P;
1717 return rex & mask;
1720 static int matches(const struct itemplate *itemp, insn * instruction, int bits)
1722 int i, size[MAX_OPERANDS], asize, oprs, ret;
1724 ret = 100;
1727 * Check the opcode
1729 if (itemp->opcode != instruction->opcode)
1730 return 0;
1733 * Count the operands
1735 if (itemp->operands != instruction->operands)
1736 return 0;
1739 * Check that no spurious colons or TOs are present
1741 for (i = 0; i < itemp->operands; i++)
1742 if (instruction->oprs[i].type & ~itemp->opd[i] & (COLON | TO))
1743 return 0;
1746 * Check that the operand flags all match up
1748 for (i = 0; i < itemp->operands; i++) {
1749 if (itemp->opd[i] & SAME_AS) {
1750 int j = itemp->opd[i] & ~SAME_AS;
1751 if (instruction->oprs[i].type != instruction->oprs[j].type ||
1752 instruction->oprs[i].basereg != instruction->oprs[j].basereg)
1753 return 0;
1754 } else if (itemp->opd[i] & ~instruction->oprs[i].type ||
1755 ((itemp->opd[i] & SIZE_MASK) &&
1756 ((itemp->opd[i] ^ instruction->oprs[i].type) & SIZE_MASK))) {
1757 if ((itemp->opd[i] & ~instruction->oprs[i].type & ~SIZE_MASK) ||
1758 (instruction->oprs[i].type & SIZE_MASK))
1759 return 0;
1760 else
1761 return 1;
1766 * Check operand sizes
1768 if (itemp->flags & IF_ARMASK) {
1769 memset(size, 0, sizeof size);
1771 switch (itemp->flags & IF_ARMASK) {
1772 case IF_AR0:
1773 i = 0;
1774 break;
1775 case IF_AR1:
1776 i = 1;
1777 break;
1778 case IF_AR2:
1779 i = 2;
1780 break;
1781 case IF_AR3:
1782 i = 3;
1783 break;
1784 default:
1785 break; /* Shouldn't happen */
1787 switch (itemp->flags & IF_SMASK) {
1788 case IF_SB:
1789 size[i] = BITS8;
1790 break;
1791 case IF_SW:
1792 size[i] = BITS16;
1793 break;
1794 case IF_SD:
1795 size[i] = BITS32;
1796 break;
1797 case IF_SQ:
1798 size[i] = BITS64;
1799 break;
1800 case IF_SO:
1801 size[i] = BITS128;
1802 break;
1803 default:
1804 break;
1806 } else {
1807 asize = 0;
1808 switch (itemp->flags & IF_SMASK) {
1809 case IF_SB:
1810 asize = BITS8;
1811 oprs = itemp->operands;
1812 break;
1813 case IF_SW:
1814 asize = BITS16;
1815 oprs = itemp->operands;
1816 break;
1817 case IF_SD:
1818 asize = BITS32;
1819 oprs = itemp->operands;
1820 break;
1821 case IF_SQ:
1822 asize = BITS64;
1823 oprs = itemp->operands;
1824 break;
1825 case IF_SO:
1826 asize = BITS128;
1827 oprs = itemp->operands;
1828 break;
1829 default:
1830 break;
1832 for (i = 0; i < MAX_OPERANDS; i++)
1833 size[i] = asize;
1836 if (itemp->flags & (IF_SM | IF_SM2)) {
1837 oprs = (itemp->flags & IF_SM2 ? 2 : itemp->operands);
1838 asize = 0;
1839 for (i = 0; i < oprs; i++) {
1840 if ((asize = itemp->opd[i] & SIZE_MASK) != 0) {
1841 int j;
1842 for (j = 0; j < oprs; j++)
1843 size[j] = asize;
1844 break;
1847 } else {
1848 oprs = itemp->operands;
1851 for (i = 0; i < itemp->operands; i++) {
1852 if (!(itemp->opd[i] & SIZE_MASK) &&
1853 (instruction->oprs[i].type & SIZE_MASK & ~size[i]))
1854 return 2;
1858 * Check template is okay at the set cpu level
1860 if (((itemp->flags & IF_PLEVEL) > cpu))
1861 return 3;
1864 * Check if instruction is available in long mode
1866 if ((itemp->flags & IF_NOLONG) && (bits == 64))
1867 return 4;
1870 * Check if special handling needed for Jumps
1872 if ((uint8_t)(itemp->code[0]) >= 0370)
1873 return 99;
1875 return ret;
1878 static ea *process_ea(operand * input, ea * output, int bits,
1879 int addrbits, int rfield, int32_t rflags, int forw_ref)
1881 output->rip = false;
1883 /* REX flags for the rfield operand */
1884 output->rex |= rexflags(rfield, rflags, REX_R|REX_P|REX_W|REX_H);
1886 if (!(REGISTER & ~input->type)) { /* register direct */
1887 int i;
1888 int32_t f;
1890 if (input->basereg < EXPR_REG_START /* Verify as Register */
1891 || input->basereg >= REG_ENUM_LIMIT)
1892 return NULL;
1893 f = regflag(input);
1894 i = regvals[input->basereg];
1896 if (REG_EA & ~f)
1897 return NULL; /* Invalid EA register */
1899 output->rex |= op_rexflags(input, REX_B|REX_P|REX_W|REX_H);
1901 output->sib_present = false; /* no SIB necessary */
1902 output->bytes = 0; /* no offset necessary either */
1903 output->modrm = 0xC0 | ((rfield & 7) << 3) | (i & 7);
1904 } else { /* it's a memory reference */
1905 if (input->basereg == -1
1906 && (input->indexreg == -1 || input->scale == 0)) {
1907 /* it's a pure offset */
1908 if (bits == 64 && (~input->type & IP_REL)) {
1909 int scale, index, base;
1910 output->sib_present = true;
1911 scale = 0;
1912 index = 4;
1913 base = 5;
1914 output->sib = (scale << 6) | (index << 3) | base;
1915 output->bytes = 4;
1916 output->modrm = 4 | ((rfield & 7) << 3);
1917 output->rip = false;
1918 } else {
1919 output->sib_present = false;
1920 output->bytes = (addrbits != 16 ? 4 : 2);
1921 output->modrm = (addrbits != 16 ? 5 : 6) | ((rfield & 7) << 3);
1922 output->rip = bits == 64;
1924 } else { /* it's an indirection */
1925 int i = input->indexreg, b = input->basereg, s = input->scale;
1926 int32_t o = input->offset, seg = input->segment;
1927 int hb = input->hintbase, ht = input->hinttype;
1928 int t;
1929 int it, bt;
1930 int32_t ix, bx; /* register flags */
1932 if (s == 0)
1933 i = -1; /* make this easy, at least */
1935 if (i >= EXPR_REG_START && i < REG_ENUM_LIMIT) {
1936 it = regvals[i];
1937 ix = reg_flags[i];
1938 } else {
1939 it = -1;
1940 ix = 0;
1943 if (b >= EXPR_REG_START && b < REG_ENUM_LIMIT) {
1944 bt = regvals[b];
1945 bx = reg_flags[b];
1946 } else {
1947 bt = -1;
1948 bx = 0;
1951 /* check for a 32/64-bit memory reference... */
1952 if ((ix|bx) & (BITS32|BITS64)) {
1953 /* it must be a 32/64-bit memory reference. Firstly we have
1954 * to check that all registers involved are type E/Rxx. */
1955 int32_t sok = BITS32|BITS64;
1957 if (it != -1) {
1958 if (!(REG64 & ~ix) || !(REG32 & ~ix))
1959 sok &= ix;
1960 else
1961 return NULL;
1964 if (bt != -1) {
1965 if (REG_GPR & ~bx)
1966 return NULL; /* Invalid register */
1967 if (~sok & bx & SIZE_MASK)
1968 return NULL; /* Invalid size */
1969 sok &= bx;
1972 /* While we're here, ensure the user didn't specify
1973 WORD or QWORD. */
1974 if (input->disp_size == 16 || input->disp_size == 64)
1975 return NULL;
1977 if (addrbits == 16 ||
1978 (addrbits == 32 && !(sok & BITS32)) ||
1979 (addrbits == 64 && !(sok & BITS64)))
1980 return NULL;
1982 /* now reorganize base/index */
1983 if (s == 1 && bt != it && bt != -1 && it != -1 &&
1984 ((hb == b && ht == EAH_NOTBASE)
1985 || (hb == i && ht == EAH_MAKEBASE))) {
1986 /* swap if hints say so */
1987 t = bt, bt = it, it = t;
1988 t = bx, bx = ix, ix = t;
1990 if (bt == it) /* convert EAX+2*EAX to 3*EAX */
1991 bt = -1, bx = 0, s++;
1992 if (bt == -1 && s == 1 && !(hb == it && ht == EAH_NOTBASE)) {
1993 /* make single reg base, unless hint */
1994 bt = it, bx = ix, it = -1, ix = 0;
1996 if (((s == 2 && it != REG_NUM_ESP
1997 && !(input->eaflags & EAF_TIMESTWO)) || s == 3
1998 || s == 5 || s == 9) && bt == -1)
1999 bt = it, bx = ix, s--; /* convert 3*EAX to EAX+2*EAX */
2000 if (it == -1 && (bt & 7) != REG_NUM_ESP
2001 && (input->eaflags & EAF_TIMESTWO))
2002 it = bt, ix = bx, bt = -1, bx = 0, s = 1;
2003 /* convert [NOSPLIT EAX] to sib format with 0x0 displacement */
2004 if (s == 1 && it == REG_NUM_ESP) {
2005 /* swap ESP into base if scale is 1 */
2006 t = it, it = bt, bt = t;
2007 t = ix, ix = bx, bx = t;
2009 if (it == REG_NUM_ESP
2010 || (s != 1 && s != 2 && s != 4 && s != 8 && it != -1))
2011 return NULL; /* wrong, for various reasons */
2013 output->rex |= rexflags(it, ix, REX_X);
2014 output->rex |= rexflags(bt, bx, REX_B);
2016 if (it == -1 && (bt & 7) != REG_NUM_ESP) {
2017 /* no SIB needed */
2018 int mod, rm;
2020 if (bt == -1) {
2021 rm = 5;
2022 mod = 0;
2023 } else {
2024 rm = (bt & 7);
2025 if (rm != REG_NUM_EBP && o == 0 &&
2026 seg == NO_SEG && !forw_ref &&
2027 !(input->eaflags &
2028 (EAF_BYTEOFFS | EAF_WORDOFFS)))
2029 mod = 0;
2030 else if (input->eaflags & EAF_BYTEOFFS ||
2031 (o >= -128 && o <= 127 && seg == NO_SEG
2032 && !forw_ref
2033 && !(input->eaflags & EAF_WORDOFFS)))
2034 mod = 1;
2035 else
2036 mod = 2;
2039 output->sib_present = false;
2040 output->bytes = (bt == -1 || mod == 2 ? 4 : mod);
2041 output->modrm = (mod << 6) | ((rfield & 7) << 3) | rm;
2042 } else {
2043 /* we need a SIB */
2044 int mod, scale, index, base;
2046 if (it == -1)
2047 index = 4, s = 1;
2048 else
2049 index = (it & 7);
2051 switch (s) {
2052 case 1:
2053 scale = 0;
2054 break;
2055 case 2:
2056 scale = 1;
2057 break;
2058 case 4:
2059 scale = 2;
2060 break;
2061 case 8:
2062 scale = 3;
2063 break;
2064 default: /* then what the smeg is it? */
2065 return NULL; /* panic */
2068 if (bt == -1) {
2069 base = 5;
2070 mod = 0;
2071 } else {
2072 base = (bt & 7);
2073 if (base != REG_NUM_EBP && o == 0 &&
2074 seg == NO_SEG && !forw_ref &&
2075 !(input->eaflags &
2076 (EAF_BYTEOFFS | EAF_WORDOFFS)))
2077 mod = 0;
2078 else if (input->eaflags & EAF_BYTEOFFS ||
2079 (o >= -128 && o <= 127 && seg == NO_SEG
2080 && !forw_ref
2081 && !(input->eaflags & EAF_WORDOFFS)))
2082 mod = 1;
2083 else
2084 mod = 2;
2087 output->sib_present = true;
2088 output->bytes = (bt == -1 || mod == 2 ? 4 : mod);
2089 output->modrm = (mod << 6) | ((rfield & 7) << 3) | 4;
2090 output->sib = (scale << 6) | (index << 3) | base;
2092 } else { /* it's 16-bit */
2093 int mod, rm;
2095 /* check for 64-bit long mode */
2096 if (addrbits == 64)
2097 return NULL;
2099 /* check all registers are BX, BP, SI or DI */
2100 if ((b != -1 && b != R_BP && b != R_BX && b != R_SI
2101 && b != R_DI) || (i != -1 && i != R_BP && i != R_BX
2102 && i != R_SI && i != R_DI))
2103 return NULL;
2105 /* ensure the user didn't specify DWORD/QWORD */
2106 if (input->disp_size == 32 || input->disp_size == 64)
2107 return NULL;
2109 if (s != 1 && i != -1)
2110 return NULL; /* no can do, in 16-bit EA */
2111 if (b == -1 && i != -1) {
2112 int tmp = b;
2113 b = i;
2114 i = tmp;
2115 } /* swap */
2116 if ((b == R_SI || b == R_DI) && i != -1) {
2117 int tmp = b;
2118 b = i;
2119 i = tmp;
2121 /* have BX/BP as base, SI/DI index */
2122 if (b == i)
2123 return NULL; /* shouldn't ever happen, in theory */
2124 if (i != -1 && b != -1 &&
2125 (i == R_BP || i == R_BX || b == R_SI || b == R_DI))
2126 return NULL; /* invalid combinations */
2127 if (b == -1) /* pure offset: handled above */
2128 return NULL; /* so if it gets to here, panic! */
2130 rm = -1;
2131 if (i != -1)
2132 switch (i * 256 + b) {
2133 case R_SI * 256 + R_BX:
2134 rm = 0;
2135 break;
2136 case R_DI * 256 + R_BX:
2137 rm = 1;
2138 break;
2139 case R_SI * 256 + R_BP:
2140 rm = 2;
2141 break;
2142 case R_DI * 256 + R_BP:
2143 rm = 3;
2144 break;
2145 } else
2146 switch (b) {
2147 case R_SI:
2148 rm = 4;
2149 break;
2150 case R_DI:
2151 rm = 5;
2152 break;
2153 case R_BP:
2154 rm = 6;
2155 break;
2156 case R_BX:
2157 rm = 7;
2158 break;
2160 if (rm == -1) /* can't happen, in theory */
2161 return NULL; /* so panic if it does */
2163 if (o == 0 && seg == NO_SEG && !forw_ref && rm != 6 &&
2164 !(input->eaflags & (EAF_BYTEOFFS | EAF_WORDOFFS)))
2165 mod = 0;
2166 else if (input->eaflags & EAF_BYTEOFFS ||
2167 (o >= -128 && o <= 127 && seg == NO_SEG
2168 && !forw_ref
2169 && !(input->eaflags & EAF_WORDOFFS)))
2170 mod = 1;
2171 else
2172 mod = 2;
2174 output->sib_present = false; /* no SIB - it's 16-bit */
2175 output->bytes = mod; /* bytes of offset needed */
2176 output->modrm = (mod << 6) | ((rfield & 7) << 3) | rm;
2181 output->size = 1 + output->sib_present + output->bytes;
2182 return output;
2185 static void add_asp(insn *ins, int addrbits)
2187 int j, valid;
2188 int defdisp;
2190 valid = (addrbits == 64) ? 64|32 : 32|16;
2192 switch (ins->prefixes[PPS_ASIZE]) {
2193 case P_A16:
2194 valid &= 16;
2195 break;
2196 case P_A32:
2197 valid &= 32;
2198 break;
2199 case P_A64:
2200 valid &= 64;
2201 break;
2202 case P_ASP:
2203 valid &= (addrbits == 32) ? 16 : 32;
2204 break;
2205 default:
2206 break;
2209 for (j = 0; j < ins->operands; j++) {
2210 if (!(MEMORY & ~ins->oprs[j].type)) {
2211 int32_t i, b;
2213 /* Verify as Register */
2214 if (ins->oprs[j].indexreg < EXPR_REG_START
2215 || ins->oprs[j].indexreg >= REG_ENUM_LIMIT)
2216 i = 0;
2217 else
2218 i = reg_flags[ins->oprs[j].indexreg];
2220 /* Verify as Register */
2221 if (ins->oprs[j].basereg < EXPR_REG_START
2222 || ins->oprs[j].basereg >= REG_ENUM_LIMIT)
2223 b = 0;
2224 else
2225 b = reg_flags[ins->oprs[j].basereg];
2227 if (ins->oprs[j].scale == 0)
2228 i = 0;
2230 if (!i && !b) {
2231 int ds = ins->oprs[j].disp_size;
2232 if ((addrbits != 64 && ds > 8) ||
2233 (addrbits == 64 && ds == 16))
2234 valid &= ds;
2235 } else {
2236 if (!(REG16 & ~b))
2237 valid &= 16;
2238 if (!(REG32 & ~b))
2239 valid &= 32;
2240 if (!(REG64 & ~b))
2241 valid &= 64;
2243 if (!(REG16 & ~i))
2244 valid &= 16;
2245 if (!(REG32 & ~i))
2246 valid &= 32;
2247 if (!(REG64 & ~i))
2248 valid &= 64;
2253 if (valid & addrbits) {
2254 ins->addr_size = addrbits;
2255 } else if (valid & ((addrbits == 32) ? 16 : 32)) {
2256 /* Add an address size prefix */
2257 enum prefixes pref = (addrbits == 32) ? P_A16 : P_A32;
2258 ins->prefixes[PPS_ASIZE] = pref;
2259 ins->addr_size = (addrbits == 32) ? 16 : 32;
2260 } else {
2261 /* Impossible... */
2262 errfunc(ERR_NONFATAL, "impossible combination of address sizes");
2263 ins->addr_size = addrbits; /* Error recovery */
2266 defdisp = ins->addr_size == 16 ? 16 : 32;
2268 for (j = 0; j < ins->operands; j++) {
2269 if (!(MEM_OFFS & ~ins->oprs[j].type) &&
2270 (ins->oprs[j].disp_size ? ins->oprs[j].disp_size : defdisp)
2271 != ins->addr_size) {
2272 /* mem_offs sizes must match the address size; if not,
2273 strip the MEM_OFFS bit and match only EA instructions */
2274 ins->oprs[j].type &= ~(MEM_OFFS & ~MEMORY);