assemble.c

   1 /* assemble.c   code generation for the Netwide Assembler
   2  *
   3  * The Netwide Assembler is copyright (C) 1996 Simon Tatham and
   4  * Julian Hall. All rights reserved. The software is
   5  * redistributable under the license given in the file "LICENSE"
   6  * distributed in the NASM archive.
   7  *
   8  * the actual codes (C syntax, i.e. octal):
   9  * \0            - terminates the code. (Unless it's a literal of course.)
  10  * \1, \2, \3    - that many literal bytes follow in the code stream
  11  * \4, \6        - the POP/PUSH (respectively) codes for CS, DS, ES, SS
  12  *                 (POP is never used for CS) depending on operand 0
  13  * \5, \7        - the second byte of POP/PUSH codes for FS, GS, depending
  14  *                 on operand 0
  15  * \10..\13      - a literal byte follows in the code stream, to be added
  16  *                 to the register value of operand 0..3
  17  * \14..\17      - a signed byte immediate operand, from operand 0..3
  18  * \20..\23      - a byte immediate operand, from operand 0..3
  19  * \24..\27      - an unsigned byte immediate operand, from operand 0..3
  20  * \30..\33      - a word immediate operand, from operand 0..3
  21  * \34..\37      - select between \3[0-3] and \4[0-3] depending on 16/32 bit
  22  *                 assembly mode or the operand-size override on the operand
  23  * \40..\43      - a long immediate operand, from operand 0..3
  24  * \44..\47      - select between \3[0-3], \4[0-3] and \5[4-7]
  25  *                 depending on the address size of the instruction.
  26  * \50..\53      - a byte relative operand, from operand 0..3
  27  * \54..\57      - a qword immediate operand, from operand 0..3
  28  * \60..\63      - a word relative operand, from operand 0..3
  29  * \64..\67      - select between \6[0-3] and \7[0-3] depending on 16/32 bit
  30  *                 assembly mode or the operand-size override on the operand
  31  * \70..\73      - a long relative operand, from operand 0..3
  32  * \74..\77       - a word constant, from the _segment_ part of operand 0..3
  33  * \1ab          - a ModRM, calculated on EA in operand a, with the spare
  34  *                 field the register value of operand b.
  35  * \140..\143    - an immediate word or signed byte for operand 0..3
  36  * \144..\147    - or 2 (s-field) into opcode byte if operand 0..3
  37  *                  is a signed byte rather than a word.  Opcode byte follows.
  38  * \150..\153     - an immediate dword or signed byte for operand 0..3
  39  * \154..\157    - or 2 (s-field) into opcode byte if operand 0..3
  40  *                  is a signed byte rather than a word.  Opcode byte follows.
  41  * \160..\163    - this instruction uses DREX rather than REX, with the
  42  *                 OC0 field set to 0, and the dest field taken from
  43  *                 operand 0..3.
  44  * \164..\167    - this instruction uses DREX rather than REX, with the
  45  *                 OC0 field set to 1, and the dest field taken from
  46  *                 operand 0..3.
  47  * \170          - encodes the literal byte 0. (Some compilers don't take
  48  *                 kindly to a zero byte in the _middle_ of a compile time
  49  *                 string constant, so I had to put this hack in.)
  50  * \171          - placement of DREX suffix in the absence of an EA
  51  * \2ab          - a ModRM, calculated on EA in operand a, with the spare
  52  *                 field equal to digit b.
  53  * \310          - indicates fixed 16-bit address size, i.e. optional 0x67.
  54  * \311          - indicates fixed 32-bit address size, i.e. optional 0x67.
  55  * \312          - (disassembler only) marker on LOOP, LOOPxx instructions.
  56  * \313          - indicates fixed 64-bit address size, 0x67 invalid.
  57  * \314          - (disassembler only) invalid with REX.B
  58  * \315          - (disassembler only) invalid with REX.X
  59  * \316          - (disassembler only) invalid with REX.R
  60  * \317          - (disassembler only) invalid with REX.W
  61  * \320          - indicates fixed 16-bit operand size, i.e. optional 0x66.
  62  * \321          - indicates fixed 32-bit operand size, i.e. optional 0x66.
  63  * \322          - indicates that this instruction is only valid when the
  64  *                 operand size is the default (instruction to disassembler,
  65  *                 generates no code in the assembler)
  66  * \323          - indicates fixed 64-bit operand size, REX on extensions only.
  67  * \324          - indicates 64-bit operand size requiring REX prefix.
  68  * \330          - a literal byte follows in the code stream, to be added
  69  *                 to the condition code value of the instruction.
  70  * \331          - instruction not valid with REP prefix.  Hint for
  71  *                 disassembler only; for SSE instructions.
  72  * \332          - REP prefix (0xF2 byte) used as opcode extension.
  73  * \333          - REP prefix (0xF3 byte) used as opcode extension.
  74  * \334          - LOCK prefix used instead of REX.R
  75  * \335          - disassemble a rep (0xF3 byte) prefix as repe not rep.
  76  * \340          - reserve <operand 0> bytes of uninitialized storage.
  77  *                 Operand 0 had better be a segmentless constant.
  78  * \364          - operand-size prefix (0x66) not permitted
  79  * \365          - address-size prefix (0x67) not permitted
  80  * \366          - operand-size prefix (0x66) used as opcode extension
  81  * \367          - address-size prefix (0x67) used as opcode extension
  82  * \370,\371,\372 - match only if operand 0 meets byte jump criteria.
  83  *                 370 is used for Jcc, 371 is used for JMP.
  84  * \373          - assemble 0x03 if bits==16, 0x05 if bits==32;
  85  *                 used for conditional jump over longer jump
  86  */
  87
  88 #include "compiler.h"
  89
  90 #include <stdio.h>
  91 #include <string.h>
  92 #include <inttypes.h>
  93
  94 #include "nasm.h"
  95 #include "nasmlib.h"
  96 #include "assemble.h"
  97 #include "insns.h"
  98 #include "preproc.h"
  99 #include "regflags.c"
 100 #include "regvals.c"
 101
 102 typedef struct {
 103     int sib_present;                 /* is a SIB byte necessary? */
 104     int bytes;                       /* # of bytes of offset needed */
 105     int size;                        /* lazy - this is sib+bytes+1 */
 106     uint8_t modrm, sib, rex, rip;    /* the bytes themselves */
 107 } ea;
 108
 109 static uint32_t cpu;            /* cpu level received from nasm.c */
 110 static efunc errfunc;
 111 static struct ofmt *outfmt;
 112 static ListGen *list;
 113
 114 static int64_t calcsize(int32_t, int64_t, int, insn *, const char *);
 115 static void gencode(int32_t, int64_t, int, insn *, const char *, int64_t);
 116 static int matches(const struct itemplate *, insn *, int bits);
 117 static int32_t regflag(const operand *);
 118 static int32_t regval(const operand *);
 119 static int rexflags(int, int32_t, int);
 120 static int op_rexflags(const operand *, int);
 121 static ea *process_ea(operand *, ea *, int, int, int, int32_t, int);
 122 static void add_asp(insn *, int);
 123
 124 static int has_prefix(insn * ins, enum prefix_pos pos, enum prefixes prefix)
 125 {
 126     return ins->prefixes[pos] == prefix;
 127 }
 128
 129 static void assert_no_prefix(insn * ins, enum prefix_pos pos)
 130 {
 131     if (ins->prefixes[pos])
 132         errfunc(ERR_NONFATAL, "invalid %s prefix",
 133                 prefix_name(ins->prefixes[pos]));
 134 }
 135
 136 static const char *size_name(int size)
 137 {
 138     switch (size) {
 139     case 1:
 140         return "byte";
 141     case 2:
 142         return "word";
 143     case 4:
 144         return "dword";
 145     case 8:
 146         return "qword";
 147     case 10:
 148         return "tword";
 149     case 16:
 150         return "oword";
 151     default:
 152         return "???";
 153     }
 154 }
 155
 156 static void warn_overflow(int size, int64_t data)
 157 {
 158     if (size < 8) {
 159         int64_t lim = ((int64_t)1 << (size*8))-1;
 160
 161         if (data < ~lim || data > lim)
 162             errfunc(ERR_WARNING | ERR_WARN_NOV, "%s data exceeds bounds", size_name(size));
 163     }
 164 }
 165 /*
 166  * This routine wrappers the real output format's output routine,
 167  * in order to pass a copy of the data off to the listing file
 168  * generator at the same time.
 169  */
 170 static void out(int64_t offset, int32_t segto, const void *data,
 171                 enum out_type type, uint64_t size,
 172                 int32_t segment, int32_t wrt)
 173 {
 174     static int32_t lineno = 0;     /* static!!! */
 175     static char *lnfname = NULL;
 176     uint8_t p[8];
 177
 178     if (type == OUT_ADDRESS && segment == NO_SEG && wrt == NO_SEG) {
 179         /*
 180          * This is a non-relocated address, and we're going to
 181          * convert it into RAWDATA format.
 182          */
 183         uint8_t *q = p;
 184
 185         if (size > 8) {
 186             errfunc(ERR_PANIC, "OUT_ADDRESS with size > 8");
 187             return;
 188         }
 189
 190         WRITEADDR(q, *(int64_t *)data, size);
 191         data = p;
 192         type = OUT_RAWDATA;
 193     }
 194
 195     list->output(offset, data, type, size);
 196
 197     /*
 198      * this call to src_get determines when we call the
 199      * debug-format-specific "linenum" function
 200      * it updates lineno and lnfname to the current values
 201      * returning 0 if "same as last time", -2 if lnfname
 202      * changed, and the amount by which lineno changed,
 203      * if it did. thus, these variables must be static
 204      */
 205
 206     if (src_get(&lineno, &lnfname)) {
 207         outfmt->current_dfmt->linenum(lnfname, lineno, segto);
 208     }
 209
 210     outfmt->output(segto, data, type, size, segment, wrt);
 211 }
 212
 213 static int jmp_match(int32_t segment, int64_t offset, int bits,
 214                      insn * ins, const char *code)
 215 {
 216     int64_t isize;
 217     uint8_t c = code[0];
 218
 219     if (c != 0370 && c != 0371)
 220         return 0;
 221     if (ins->oprs[0].opflags & OPFLAG_FORWARD) {
 222         if ((optimizing < 0 || (ins->oprs[0].type & STRICT))
 223             && c == 0370)
 224             return 1;
 225         else
 226             return (pass0 == 0);        /* match a forward reference */
 227     }
 228     isize = calcsize(segment, offset, bits, ins, code);
 229     if (ins->oprs[0].segment != segment)
 230         return 0;
 231     isize = ins->oprs[0].offset - offset - isize;       /* isize is now the delta */
 232     if (isize >= -128L && isize <= 127L)
 233         return 1;               /* it is byte size */
 234
 235     return 0;
 236 }
 237
 238 int64_t assemble(int32_t segment, int64_t offset, int bits, uint32_t cp,
 239               insn * instruction, struct ofmt *output, efunc error,
 240               ListGen * listgen)
 241 {
 242     const struct itemplate *temp;
 243     int j;
 244     int size_prob;
 245     int64_t insn_end;
 246     int32_t itimes;
 247     int64_t start = offset;
 248     int64_t wsize = 0;             /* size for DB etc. */
 249
 250     errfunc = error;            /* to pass to other functions */
 251     cpu = cp;
 252     outfmt = output;            /* likewise */
 253     list = listgen;             /* and again */
 254
 255     switch (instruction->opcode) {
 256     case -1:
 257         return 0;
 258     case I_DB:
 259         wsize = 1;
 260         break;
 261     case I_DW:
 262         wsize = 2;
 263         break;
 264     case I_DD:
 265         wsize = 4;
 266         break;
 267     case I_DQ:
 268         wsize = 8;
 269         break;
 270     case I_DT:
 271         wsize = 10;
 272         break;
 273     case I_DO:
 274         wsize = 16;
 275         break;
 276     default:
 277         break;
 278     }
 279
 280     if (wsize) {
 281         extop *e;
 282         int32_t t = instruction->times;
 283         if (t < 0)
 284             errfunc(ERR_PANIC,
 285                     "instruction->times < 0 (%ld) in assemble()", t);
 286
 287         while (t--) {           /* repeat TIMES times */
 288             for (e = instruction->eops; e; e = e->next) {
 289                 if (e->type == EOT_DB_NUMBER) {
 290                     if (wsize == 1) {
 291                         if (e->segment != NO_SEG)
 292                             errfunc(ERR_NONFATAL,
 293                                     "one-byte relocation attempted");
 294                         else {
 295                             uint8_t out_byte = e->offset;
 296                             out(offset, segment, &out_byte,
 297                                 OUT_RAWDATA, 1, NO_SEG, NO_SEG);
 298                         }
 299                     } else if (wsize > 8) {
 300                         errfunc(ERR_NONFATAL, "integer supplied to a DT or DO"
 301                                 " instruction");
 302                     } else
 303                         out(offset, segment, &e->offset,
 304                             OUT_ADDRESS, wsize, e->segment, e->wrt);
 305                     offset += wsize;
 306                 } else if (e->type == EOT_DB_STRING) {
 307                     int align;
 308
 309                     out(offset, segment, e->stringval,
 310                         OUT_RAWDATA, e->stringlen, NO_SEG, NO_SEG);
 311                     align = e->stringlen % wsize;
 312
 313                     if (align) {
 314                         align = wsize - align;
 315                         out(offset, segment, "\0\0\0\0\0\0\0\0",
 316                             OUT_RAWDATA, align, NO_SEG, NO_SEG);
 317                     }
 318                     offset += e->stringlen + align;
 319                 }
 320             }
 321             if (t > 0 && t == instruction->times - 1) {
 322                 /*
 323                  * Dummy call to list->output to give the offset to the
 324                  * listing module.
 325                  */
 326                 list->output(offset, NULL, OUT_RAWDATA, 0);
 327                 list->uplevel(LIST_TIMES);
 328             }
 329         }
 330         if (instruction->times > 1)
 331             list->downlevel(LIST_TIMES);
 332         return offset - start;
 333     }
 334
 335     if (instruction->opcode == I_INCBIN) {
 336         static char fname[FILENAME_MAX];
 337         FILE *fp;
 338         int32_t len;
 339         char *prefix = "", *combine;
 340         char **pPrevPath = NULL;
 341
 342         len = FILENAME_MAX - 1;
 343         if (len > instruction->eops->stringlen)
 344             len = instruction->eops->stringlen;
 345         strncpy(fname, instruction->eops->stringval, len);
 346         fname[len] = '\0';
 347
 348         while (1) {         /* added by alexfru: 'incbin' uses include paths */
 349             combine = nasm_malloc(strlen(prefix) + len + 1);
 350             strcpy(combine, prefix);
 351             strcat(combine, fname);
 352
 353             if ((fp = fopen(combine, "rb")) != NULL) {
 354                 nasm_free(combine);
 355                 break;
 356             }
 357
 358             nasm_free(combine);
 359             pPrevPath = pp_get_include_path_ptr(pPrevPath);
 360             if (pPrevPath == NULL)
 361                 break;
 362             prefix = *pPrevPath;
 363         }
 364
 365         if (fp == NULL)
 366             error(ERR_NONFATAL, "`incbin': unable to open file `%s'",
 367                   fname);
 368         else if (fseek(fp, 0L, SEEK_END) < 0)
 369             error(ERR_NONFATAL, "`incbin': unable to seek on file `%s'",
 370                   fname);
 371         else {
 372             static char buf[2048];
 373             int32_t t = instruction->times;
 374             int32_t base = 0;
 375
 376             len = ftell(fp);
 377             if (instruction->eops->next) {
 378                 base = instruction->eops->next->offset;
 379                 len -= base;
 380                 if (instruction->eops->next->next &&
 381                     len > instruction->eops->next->next->offset)
 382                     len = instruction->eops->next->next->offset;
 383             }
 384             /*
 385              * Dummy call to list->output to give the offset to the
 386              * listing module.
 387              */
 388             list->output(offset, NULL, OUT_RAWDATA, 0);
 389             list->uplevel(LIST_INCBIN);
 390             while (t--) {
 391                 int32_t l;
 392
 393                 fseek(fp, base, SEEK_SET);
 394                 l = len;
 395                 while (l > 0) {
 396                     int32_t m =
 397                         fread(buf, 1, (l > (int32_t) sizeof(buf) ? (int32_t) sizeof(buf) : l),
 398                               fp);
 399                     if (!m) {
 400                         /*
 401                          * This shouldn't happen unless the file
 402                          * actually changes while we are reading
 403                          * it.
 404                          */
 405                         error(ERR_NONFATAL,
 406                               "`incbin': unexpected EOF while"
 407                               " reading file `%s'", fname);
 408                         t = 0;  /* Try to exit cleanly */
 409                         break;
 410                     }
 411                     out(offset, segment, buf, OUT_RAWDATA, m,
 412                         NO_SEG, NO_SEG);
 413                     l -= m;
 414                 }
 415             }
 416             list->downlevel(LIST_INCBIN);
 417             if (instruction->times > 1) {
 418                 /*
 419                  * Dummy call to list->output to give the offset to the
 420                  * listing module.
 421                  */
 422                 list->output(offset, NULL, OUT_RAWDATA, 0);
 423                 list->uplevel(LIST_TIMES);
 424                 list->downlevel(LIST_TIMES);
 425             }
 426             fclose(fp);
 427             return instruction->times * len;
 428         }
 429         return 0;               /* if we're here, there's an error */
 430     }
 431
 432     /* Check to see if we need an address-size prefix */
 433     add_asp(instruction, bits);
 434
 435     size_prob = false;
 436
 437     for (temp = nasm_instructions[instruction->opcode]; temp->opcode != -1; temp++){
 438         int m = matches(temp, instruction, bits);
 439
 440         if (m == 99)
 441             m += jmp_match(segment, offset, bits, instruction, temp->code);
 442
 443         if (m == 100) {         /* matches! */
 444             const char *codes = temp->code;
 445             int64_t insn_size = calcsize(segment, offset, bits,
 446                                       instruction, codes);
 447             itimes = instruction->times;
 448             if (insn_size < 0)  /* shouldn't be, on pass two */
 449                 error(ERR_PANIC, "errors made it through from pass one");
 450             else
 451                 while (itimes--) {
 452                     for (j = 0; j < MAXPREFIX; j++) {
 453                         uint8_t c = 0;
 454                         switch (instruction->prefixes[j]) {
 455                         case P_LOCK:
 456                             c = 0xF0;
 457                             break;
 458                         case P_REPNE:
 459                         case P_REPNZ:
 460                             c = 0xF2;
 461                             break;
 462                         case P_REPE:
 463                         case P_REPZ:
 464                         case P_REP:
 465                             c = 0xF3;
 466                             break;
 467                         case R_CS:
 468                             if (bits == 64) {
 469                                 error(ERR_WARNING,
 470                                       "cs segment base generated, but will be ignored in 64-bit mode");
 471                             }
 472                             c = 0x2E;
 473                             break;
 474                         case R_DS:
 475                             if (bits == 64) {
 476                                 error(ERR_WARNING,
 477                                       "ds segment base generated, but will be ignored in 64-bit mode");
 478                             }
 479                             c = 0x3E;
 480                             break;
 481                         case R_ES:
 482                            if (bits == 64) {
 483                                 error(ERR_WARNING,
 484                                       "es segment base generated, but will be ignored in 64-bit mode");
 485                            }
 486                             c = 0x26;
 487                             break;
 488                         case R_FS:
 489                             c = 0x64;
 490                             break;
 491                         case R_GS:
 492                             c = 0x65;
 493                             break;
 494                         case R_SS:
 495                             if (bits == 64) {
 496                                 error(ERR_WARNING,
 497                                       "ss segment base generated, but will be ignored in 64-bit mode");
 498                             }
 499                             c = 0x36;
 500                             break;
 501                         case R_SEGR6:
 502                         case R_SEGR7:
 503                             error(ERR_NONFATAL,
 504                                   "segr6 and segr7 cannot be used as prefixes");
 505                             break;
 506                         case P_A16:
 507                             if (bits == 64) {
 508                                 error(ERR_NONFATAL,
 509                                       "16-bit addressing is not supported "
 510                                       "in 64-bit mode");
 511                             } else if (bits != 16)
 512                                 c = 0x67;
 513                             break;
 514                         case P_A32:
 515                             if (bits != 32)
 516                                 c = 0x67;
 517                             break;
 518                         case P_A64:
 519                             if (bits != 64) {
 520                                 error(ERR_NONFATAL,
 521                                       "64-bit addressing is only supported "
 522                                       "in 64-bit mode");
 523                             }
 524                             break;
 525                         case P_ASP:
 526                             c = 0x67;
 527                             break;
 528                         case P_O16:
 529                             if (bits != 16)
 530                                 c = 0x66;
 531                             break;
 532                         case P_O32:
 533                             if (bits == 16)
 534                                 c = 0x66;
 535                             break;
 536                         case P_O64:
 537                             /* REX.W */
 538                             break;
 539                         case P_OSP:
 540                             c = 0x66;
 541                             break;
 542                         case P_none:
 543                             break;
 544                         default:
 545                             error(ERR_PANIC, "invalid instruction prefix");
 546                         }
 547                         if (c != 0) {
 548                             out(offset, segment, &c, OUT_RAWDATA, 1,
 549                                 NO_SEG, NO_SEG);
 550                             offset++;
 551                         }
 552                     }
 553                     insn_end = offset + insn_size;
 554                     gencode(segment, offset, bits, instruction, codes,
 555                             insn_end);
 556                     offset += insn_size;
 557                     if (itimes > 0 && itimes == instruction->times - 1) {
 558                         /*
 559                          * Dummy call to list->output to give the offset to the
 560                          * listing module.
 561                          */
 562                         list->output(offset, NULL, OUT_RAWDATA, 0);
 563                         list->uplevel(LIST_TIMES);
 564                     }
 565                 }
 566             if (instruction->times > 1)
 567                 list->downlevel(LIST_TIMES);
 568             return offset - start;
 569         } else if (m > 0 && m > size_prob) {
 570             size_prob = m;
 571         }
 572 //        temp++;
 573     }
 574
 575     if (temp->opcode == -1) {   /* didn't match any instruction */
 576         switch (size_prob) {
 577         case 1:
 578             error(ERR_NONFATAL, "operation size not specified");
 579             break;
 580         case 2:
 581             error(ERR_NONFATAL, "mismatch in operand sizes");
 582             break;
 583         case 3:
 584             error(ERR_NONFATAL, "no instruction for this cpu level");
 585             break;
 586         case 4:
 587             error(ERR_NONFATAL, "instruction not supported in 64-bit mode");
 588             break;
 589         default:
 590             error(ERR_NONFATAL,
 591                   "invalid combination of opcode and operands");
 592             break;
 593         }
 594     }
 595     return 0;
 596 }
 597
 598 int64_t insn_size(int32_t segment, int64_t offset, int bits, uint32_t cp,
 599                insn * instruction, efunc error)
 600 {
 601     const struct itemplate *temp;
 602
 603     errfunc = error;            /* to pass to other functions */
 604     cpu = cp;
 605
 606     if (instruction->opcode == -1)
 607         return 0;
 608
 609     if (instruction->opcode == I_DB || instruction->opcode == I_DW ||
 610         instruction->opcode == I_DD || instruction->opcode == I_DQ ||
 611         instruction->opcode == I_DT || instruction->opcode == I_DO) {
 612         extop *e;
 613         int32_t isize, osize, wsize = 0;   /* placate gcc */
 614
 615         isize = 0;
 616         switch (instruction->opcode) {
 617         case I_DB:
 618             wsize = 1;
 619             break;
 620         case I_DW:
 621             wsize = 2;
 622             break;
 623         case I_DD:
 624             wsize = 4;
 625             break;
 626         case I_DQ:
 627             wsize = 8;
 628             break;
 629         case I_DT:
 630             wsize = 10;
 631             break;
 632         case I_DO:
 633             wsize = 16;
 634             break;
 635         default:
 636             break;
 637         }
 638
 639         for (e = instruction->eops; e; e = e->next) {
 640             int32_t align;
 641
 642             osize = 0;
 643             if (e->type == EOT_DB_NUMBER)
 644                 osize = 1;
 645             else if (e->type == EOT_DB_STRING)
 646                 osize = e->stringlen;
 647
 648             align = (-osize) % wsize;
 649             if (align < 0)
 650                 align += wsize;
 651             isize += osize + align;
 652         }
 653         return isize * instruction->times;
 654     }
 655
 656     if (instruction->opcode == I_INCBIN) {
 657         char fname[FILENAME_MAX];
 658         FILE *fp;
 659         int32_t len;
 660         char *prefix = "", *combine;
 661         char **pPrevPath = NULL;
 662
 663         len = FILENAME_MAX - 1;
 664         if (len > instruction->eops->stringlen)
 665             len = instruction->eops->stringlen;
 666         strncpy(fname, instruction->eops->stringval, len);
 667         fname[len] = '\0';
 668
 669         /* added by alexfru: 'incbin' uses include paths */
 670         while (1) {
 671             combine = nasm_malloc(strlen(prefix) + len + 1);
 672             strcpy(combine, prefix);
 673             strcat(combine, fname);
 674
 675             if ((fp = fopen(combine, "rb")) != NULL) {
 676                 nasm_free(combine);
 677                 break;
 678             }
 679
 680             nasm_free(combine);
 681             pPrevPath = pp_get_include_path_ptr(pPrevPath);
 682             if (pPrevPath == NULL)
 683                 break;
 684             prefix = *pPrevPath;
 685         }
 686
 687         if (fp == NULL)
 688             error(ERR_NONFATAL, "`incbin': unable to open file `%s'",
 689                   fname);
 690         else if (fseek(fp, 0L, SEEK_END) < 0)
 691             error(ERR_NONFATAL, "`incbin': unable to seek on file `%s'",
 692                   fname);
 693         else {
 694             len = ftell(fp);
 695             fclose(fp);
 696             if (instruction->eops->next) {
 697                 len -= instruction->eops->next->offset;
 698                 if (instruction->eops->next->next &&
 699                     len > instruction->eops->next->next->offset) {
 700                     len = instruction->eops->next->next->offset;
 701                 }
 702             }
 703             return instruction->times * len;
 704         }
 705         return 0;               /* if we're here, there's an error */
 706     }
 707
 708     /* Check to see if we need an address-size prefix */
 709     add_asp(instruction, bits);
 710
 711     for (temp = nasm_instructions[instruction->opcode]; temp->opcode != -1; temp++) {
 712         int m = matches(temp, instruction, bits);
 713         if (m == 99)
 714             m += jmp_match(segment, offset, bits, instruction, temp->code);
 715
 716         if (m == 100) {
 717             /* we've matched an instruction. */
 718             int64_t isize;
 719             const char *codes = temp->code;
 720             int j;
 721
 722             isize = calcsize(segment, offset, bits, instruction, codes);
 723             if (isize < 0)
 724                 return -1;
 725             for (j = 0; j < MAXPREFIX; j++) {
 726                 switch (instruction->prefixes[j]) {
 727                 case P_A16:
 728                     if (bits != 16)
 729                         isize++;
 730                     break;
 731                 case P_A32:
 732                     if (bits != 32)
 733                         isize++;
 734                     break;
 735                 case P_O16:
 736                     if (bits != 16)
 737                         isize++;
 738                     break;
 739                 case P_O32:
 740                     if (bits == 16)
 741                         isize++;
 742                     break;
 743                 case P_A64:
 744                 case P_O64:
 745                 case P_none:
 746                     break;
 747                 default:
 748                     isize++;
 749                     break;
 750                 }
 751             }
 752             return isize * instruction->times;
 753         }
 754     }
 755     return -1;                  /* didn't match any instruction */
 756 }
 757
 758 /* check that  opn[op]  is a signed byte of size 16 or 32,
 759                                         and return the signed value*/
 760 static int is_sbyte(insn * ins, int op, int size)
 761 {
 762     int32_t v;
 763     int ret;
 764
 765     ret = !(ins->forw_ref && ins->oprs[op].opflags) &&  /* dead in the water on forward reference or External */
 766         optimizing >= 0 &&
 767         !(ins->oprs[op].type & STRICT) &&
 768         ins->oprs[op].wrt == NO_SEG && ins->oprs[op].segment == NO_SEG;
 769
 770     v = ins->oprs[op].offset;
 771     if (size == 16)
 772         v = (int16_t)v;    /* sign extend if 16 bits */
 773
 774     return ret && v >= -128L && v <= 127L;
 775 }
 776
 777 static int64_t calcsize(int32_t segment, int64_t offset, int bits,
 778                      insn * ins, const char *codes)
 779 {
 780     int64_t length = 0;
 781     uint8_t c;
 782     int rex_mask = ~0;
 783     struct operand *opx;
 784
 785     ins->rex = 0;               /* Ensure REX is reset */
 786
 787     if (ins->prefixes[PPS_OSIZE] == P_O64)
 788         ins->rex |= REX_W;
 789
 790     (void)segment;              /* Don't warn that this parameter is unused */
 791     (void)offset;               /* Don't warn that this parameter is unused */
 792
 793     while (*codes) {
 794         c = *codes++;
 795         opx = &ins->oprs[c & 3];
 796         switch (c) {
 797         case 01:
 798         case 02:
 799         case 03:
 800             codes += c, length += c;
 801             break;
 802         case 04:
 803         case 05:
 804         case 06:
 805         case 07:
 806             length++;
 807             break;
 808         case 010:
 809         case 011:
 810         case 012:
 811         case 013:
 812             ins->rex |=
 813                 op_rexflags(opx, REX_B|REX_H|REX_P|REX_W);
 814             codes++, length++;
 815             break;
 816         case 014:
 817         case 015:
 818         case 016:
 819         case 017:
 820             length++;
 821             break;
 822         case 020:
 823         case 021:
 824         case 022:
 825         case 023:
 826             length++;
 827             break;
 828         case 024:
 829         case 025:
 830         case 026:
 831         case 027:
 832             length++;
 833             break;
 834         case 030:
 835         case 031:
 836         case 032:
 837         case 033:
 838             length += 2;
 839             break;
 840         case 034:
 841         case 035:
 842         case 036:
 843         case 037:
 844             if (opx->type & (BITS16 | BITS32 | BITS64))
 845                 length += (opx->type & BITS16) ? 2 : 4;
 846             else
 847                 length += (bits == 16) ? 2 : 4;
 848             break;
 849         case 040:
 850         case 041:
 851         case 042:
 852         case 043:
 853             length += 4;
 854             break;
 855         case 044:
 856         case 045:
 857         case 046:
 858         case 047:
 859             length += ins->addr_size >> 3;
 860             break;
 861         case 050:
 862         case 051:
 863         case 052:
 864         case 053:
 865             length++;
 866             break;
 867         case 054:
 868         case 055:
 869         case 056:
 870         case 057:
 871             length += 8; /* MOV reg64/imm */
 872             break;
 873         case 060:
 874         case 061:
 875         case 062:
 876         case 063:
 877             length += 2;
 878             break;
 879         case 064:
 880         case 065:
 881         case 066:
 882         case 067:
 883             if (opx->type & (BITS16 | BITS32 | BITS64))
 884                 length += (opx->type & BITS16) ? 2 : 4;
 885             else
 886                 length += (bits == 16) ? 2 : 4;
 887             break;
 888         case 070:
 889         case 071:
 890         case 072:
 891         case 073:
 892             length += 4;
 893             break;
 894         case 074:
 895         case 075:
 896         case 076:
 897         case 077:
 898             length += 2;
 899             break;
 900         case 0140:
 901         case 0141:
 902         case 0142:
 903         case 0143:
 904             length += is_sbyte(ins, c & 3, 16) ? 1 : 2;
 905             break;
 906         case 0144:
 907         case 0145:
 908         case 0146:
 909         case 0147:
 910             codes++;
 911             length++;
 912             break;
 913         case 0150:
 914         case 0151:
 915         case 0152:
 916         case 0153:
 917             length += is_sbyte(ins, c & 3, 32) ? 1 : 4;
 918             break;
 919         case 0154:
 920         case 0155:
 921         case 0156:
 922         case 0157:
 923             codes++;
 924             length++;
 925             break;
 926         case 0160:
 927         case 0161:
 928         case 0162:
 929         case 0163:
 930             length++;
 931             ins->rex |= REX_D;
 932             ins->drexdst = regval(&ins->oprs[c & 3]);
 933             break;
 934         case 0164:
 935         case 0165:
 936         case 0166:
 937         case 0167:
 938             length++;
 939             ins->rex |= REX_D|REX_OC;
 940             ins->drexdst = regval(&ins->oprs[c & 3]);
 941             break;
 942         case 0170:
 943             length++;
 944             break;
 945         case 0171:
 946             break;
 947         case 0300:
 948         case 0301:
 949         case 0302:
 950         case 0303:
 951             break;
 952         case 0310:
 953             if (bits == 64)
 954                 return -1;
 955             length += (bits != 16) && !has_prefix(ins, PPS_ASIZE, P_A16);
 956             break;
 957         case 0311:
 958             length += (bits != 32) && !has_prefix(ins, PPS_ASIZE, P_A32);
 959             break;
 960         case 0312:
 961             break;
 962         case 0313:
 963             if (bits != 64 || has_prefix(ins, PPS_ASIZE, P_A16) ||
 964                 has_prefix(ins, PPS_ASIZE, P_A32))
 965                 return -1;
 966             break;
 967         case 0314:
 968         case 0315:
 969         case 0316:
 970         case 0317:
 971             break;
 972         case 0320:
 973             length += (bits != 16);
 974             break;
 975         case 0321:
 976             length += (bits == 16);
 977             break;
 978         case 0322:
 979             break;
 980         case 0323:
 981             rex_mask &= ~REX_W;
 982             break;
 983         case 0324:
 984             ins->rex |= REX_W;
 985             break;
 986         case 0330:
 987             codes++, length++;
 988             break;
 989         case 0331:
 990             break;
 991         case 0332:
 992         case 0333:
 993             length++;
 994             break;
 995         case 0334:
 996             ins->rex |= REX_L;
 997             break;
 998         case 0335:
 999             break;
1000         case 0340:
1001             if (ins->oprs[0].segment != NO_SEG)
1002                 errfunc(ERR_NONFATAL, "attempt to reserve non-constant"
1003                         " quantity of BSS space");
1004             else
1005                 length += ins->oprs[0].offset;
1006             break;
1007         case 0364:
1008         case 0365:
1009             break;
1010         case 0366:
1011         case 0367:
1012             length++;
1013             break;
1014         case 0370:
1015         case 0371:
1016         case 0372:
1017             break;
1018         case 0373:
1019             length++;
1020             break;
1021         default:               /* can't do it by 'case' statements */
1022             if (c >= 0100 && c <= 0277) {       /* it's an EA */
1023                 ea ea_data;
1024                 int rfield;
1025                 int32_t rflags;
1026                 ea_data.rex = 0;           /* Ensure ea.REX is initially 0 */
1027
1028                 if (c <= 0177) {
1029                     /* pick rfield from operand b */
1030                     rflags = regflag(&ins->oprs[c & 7]);
1031                     rfield = regvals[ins->oprs[c & 7].basereg];
1032                 } else {
1033                     rflags = 0;
1034                     rfield = c & 7;
1035                 }
1036
1037                 if (!process_ea
1038                     (&ins->oprs[(c >> 3) & 7], &ea_data, bits,
1039                      ins->addr_size, rfield, rflags, ins->forw_ref)) {
1040                     errfunc(ERR_NONFATAL, "invalid effective address");
1041                     return -1;
1042                 } else {
1043                     ins->rex |= ea_data.rex;
1044                     length += ea_data.size;
1045                 }
1046             } else {
1047                 errfunc(ERR_PANIC, "internal instruction table corrupt"
1048                         ": instruction code 0x%02X given", c);
1049             }
1050         }
1051     }
1052
1053     ins->rex &= rex_mask;
1054
1055     if (ins->rex & REX_D) {
1056         if (ins->rex & REX_H) {
1057             errfunc(ERR_NONFATAL, "cannot use high register in drex instruction");
1058             return -1;
1059         }
1060         if (bits != 64 && ((ins->rex & (REX_W|REX_X|REX_B)) ||
1061                            ins->drexdst > 7)) {
1062             errfunc(ERR_NONFATAL, "invalid operands in non-64-bit mode");
1063             return -1;
1064         }
1065         length++;
1066     } else if (ins->rex & REX_REAL) {
1067         if (ins->rex & REX_H) {
1068             errfunc(ERR_NONFATAL, "cannot use high register in rex instruction");
1069             return -1;
1070         } else if (bits == 64) {
1071             length++;
1072         } else if ((ins->rex & REX_L) &&
1073                    !(ins->rex & (REX_P|REX_W|REX_X|REX_B)) &&
1074                    cpu >= IF_X86_64) {
1075             /* LOCK-as-REX.R */
1076             assert_no_prefix(ins, PPS_LREP);
1077             length++;
1078         } else {
1079             errfunc(ERR_NONFATAL, "invalid operands in non-64-bit mode");
1080             return -1;
1081         }
1082     }
1083
1084     return length;
1085 }
1086
1087 #define EMIT_REX()                                                      \
1088     if (!(ins->rex & REX_D) && (ins->rex & REX_REAL) && (bits == 64)) { \
1089         ins->rex = (ins->rex & REX_REAL)|REX_P;                         \
1090         out(offset, segment, &ins->rex, OUT_RAWDATA, 1, NO_SEG, NO_SEG); \
1091         ins->rex = 0;                                                   \
1092         offset += 1; \
1093     }
1094
1095 static void gencode(int32_t segment, int64_t offset, int bits,
1096                     insn * ins, const char *codes, int64_t insn_end)
1097 {
1098     static char condval[] = {   /* conditional opcodes */
1099         0x7, 0x3, 0x2, 0x6, 0x2, 0x4, 0xF, 0xD, 0xC, 0xE, 0x6, 0x2,
1100         0x3, 0x7, 0x3, 0x5, 0xE, 0xC, 0xD, 0xF, 0x1, 0xB, 0x9, 0x5,
1101         0x0, 0xA, 0xA, 0xB, 0x8, 0x4
1102     };
1103     uint8_t c;
1104     uint8_t bytes[4];
1105     int64_t size;
1106     int64_t data;
1107     struct operand *opx;
1108
1109     while (*codes) {
1110         c = *codes++;
1111         opx = &ins->oprs[c & 3];
1112         switch (c) {
1113         case 01:
1114         case 02:
1115         case 03:
1116             EMIT_REX();
1117             out(offset, segment, codes, OUT_RAWDATA, c, NO_SEG, NO_SEG);
1118             codes += c;
1119             offset += c;
1120             break;
1121
1122         case 04:
1123         case 06:
1124             switch (ins->oprs[0].basereg) {
1125             case R_CS:
1126                 bytes[0] = 0x0E + (c == 0x04 ? 1 : 0);
1127                 break;
1128             case R_DS:
1129                 bytes[0] = 0x1E + (c == 0x04 ? 1 : 0);
1130                 break;
1131             case R_ES:
1132                 bytes[0] = 0x06 + (c == 0x04 ? 1 : 0);
1133                 break;
1134             case R_SS:
1135                 bytes[0] = 0x16 + (c == 0x04 ? 1 : 0);
1136                 break;
1137             default:
1138                 errfunc(ERR_PANIC,
1139                         "bizarre 8086 segment register received");
1140             }
1141             out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1142             offset++;
1143             break;
1144
1145         case 05:
1146         case 07:
1147             switch (ins->oprs[0].basereg) {
1148             case R_FS:
1149                 bytes[0] = 0xA0 + (c == 0x05 ? 1 : 0);
1150                 break;
1151             case R_GS:
1152                 bytes[0] = 0xA8 + (c == 0x05 ? 1 : 0);
1153                 break;
1154             default:
1155                 errfunc(ERR_PANIC,
1156                         "bizarre 386 segment register received");
1157             }
1158             out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1159             offset++;
1160             break;
1161
1162         case 010:
1163         case 011:
1164         case 012:
1165         case 013:
1166             EMIT_REX();
1167             bytes[0] = *codes++ + ((regval(opx)) & 7);
1168             out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1169             offset += 1;
1170             break;
1171
1172         case 014:
1173         case 015:
1174         case 016:
1175         case 017:
1176             if (opx->offset < -128 || opx->offset > 127) {
1177                 errfunc(ERR_WARNING | ERR_WARN_NOV,
1178                         "signed byte value exceeds bounds");
1179             }
1180
1181             if (opx->segment != NO_SEG) {
1182                 data = opx->offset;
1183                 out(offset, segment, &data, OUT_ADDRESS, 1,
1184                     opx->segment, opx->wrt);
1185             } else {
1186                 bytes[0] = opx->offset;
1187                 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG,
1188                     NO_SEG);
1189             }
1190             offset += 1;
1191             break;
1192
1193         case 020:
1194         case 021:
1195         case 022:
1196         case 023:
1197             if (opx->offset < -256 || opx->offset > 255) {
1198                 errfunc(ERR_WARNING | ERR_WARN_NOV,
1199                         "byte value exceeds bounds");
1200             }
1201             if (opx->segment != NO_SEG) {
1202                 data = opx->offset;
1203                 out(offset, segment, &data, OUT_ADDRESS, 1,
1204                     opx->segment, opx->wrt);
1205             } else {
1206                 bytes[0] = opx->offset;
1207                 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG,
1208                     NO_SEG);
1209             }
1210             offset += 1;
1211             break;
1212
1213         case 024:
1214         case 025:
1215         case 026:
1216         case 027:
1217             if (opx->offset < 0 || opx->offset > 255)
1218                 errfunc(ERR_WARNING | ERR_WARN_NOV,
1219                         "unsigned byte value exceeds bounds");
1220             if (opx->segment != NO_SEG) {
1221                 data = opx->offset;
1222                 out(offset, segment, &data, OUT_ADDRESS, 1,
1223                     opx->segment, opx->wrt);
1224             } else {
1225                 bytes[0] = opx->offset;
1226                 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG,
1227                     NO_SEG);
1228             }
1229             offset += 1;
1230             break;
1231
1232         case 030:
1233         case 031:
1234         case 032:
1235         case 033:
1236             data = opx->offset;
1237             if (opx->segment == NO_SEG && opx->wrt == NO_SEG)
1238                 warn_overflow(2, data);
1239             out(offset, segment, &data, OUT_ADDRESS, 2,
1240                 opx->segment, opx->wrt);
1241             offset += 2;
1242             break;
1243
1244         case 034:
1245         case 035:
1246         case 036:
1247         case 037:
1248             if (opx->type & (BITS16 | BITS32))
1249                 size = (opx->type & BITS16) ? 2 : 4;
1250             else
1251                 size = (bits == 16) ? 2 : 4;
1252             data = opx->offset;
1253             if (opx->segment == NO_SEG && opx->wrt == NO_SEG)
1254                 warn_overflow(size, data);
1255             out(offset, segment, &data, OUT_ADDRESS, size,
1256                 opx->segment, opx->wrt);
1257             offset += size;
1258             break;
1259
1260         case 040:
1261         case 041:
1262         case 042:
1263         case 043:
1264             data = opx->offset;
1265             if (opx->segment == NO_SEG && opx->wrt == NO_SEG)
1266                 warn_overflow(4, data);
1267             out(offset, segment, &data, OUT_ADDRESS, 4,
1268                 opx->segment, opx->wrt);
1269             offset += 4;
1270             break;
1271
1272         case 044:
1273         case 045:
1274         case 046:
1275         case 047:
1276             data = opx->offset;
1277             size = ins->addr_size >> 3;
1278             if (opx->segment == NO_SEG &&
1279                 opx->wrt == NO_SEG)
1280                 warn_overflow(size, data);
1281             out(offset, segment, &data, OUT_ADDRESS, size,
1282                 opx->segment, opx->wrt);
1283             offset += size;
1284             break;
1285
1286         case 050:
1287         case 051:
1288         case 052:
1289         case 053:
1290             if (opx->segment != segment)
1291                 errfunc(ERR_NONFATAL,
1292                         "short relative jump outside segment");
1293             data = opx->offset - insn_end;
1294             if (data > 127 || data < -128)
1295                 errfunc(ERR_NONFATAL, "short jump is out of range");
1296             bytes[0] = data;
1297             out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1298             offset += 1;
1299             break;
1300
1301         case 054:
1302         case 055:
1303         case 056:
1304         case 057:
1305             data = (int64_t)opx->offset;
1306             out(offset, segment, &data, OUT_ADDRESS, 8,
1307                 opx->segment, opx->wrt);
1308             offset += 8;
1309             break;
1310
1311         case 060:
1312         case 061:
1313         case 062:
1314         case 063:
1315             if (opx->segment != segment) {
1316                 data = opx->offset;
1317                 out(offset, segment, &data,
1318                     OUT_REL2ADR, insn_end - offset,
1319                     opx->segment, opx->wrt);
1320             } else {
1321                 data = opx->offset - insn_end;
1322                 out(offset, segment, &data,
1323                     OUT_ADDRESS, 2, NO_SEG, NO_SEG);
1324             }
1325             offset += 2;
1326             break;
1327
1328         case 064:
1329         case 065:
1330         case 066:
1331         case 067:
1332             if (opx->type & (BITS16 | BITS32 | BITS64))
1333                 size = (opx->type & BITS16) ? 2 : 4;
1334             else
1335                 size = (bits == 16) ? 2 : 4;
1336             if (opx->segment != segment) {
1337                 data = opx->offset;
1338                 out(offset, segment, &data,
1339                     size == 2 ? OUT_REL2ADR : OUT_REL4ADR,
1340                     insn_end - offset, opx->segment, opx->wrt);
1341             } else {
1342                 data = opx->offset - insn_end;
1343                 out(offset, segment, &data,
1344                     OUT_ADDRESS, size, NO_SEG, NO_SEG);
1345             }
1346             offset += size;
1347             break;
1348
1349         case 070:
1350         case 071:
1351         case 072:
1352         case 073:
1353             if (opx->segment != segment) {
1354                 data = opx->offset;
1355                 out(offset, segment, &data,
1356                     OUT_REL4ADR, insn_end - offset,
1357                     opx->segment, opx->wrt);
1358             } else {
1359                 data = opx->offset - insn_end;
1360                 out(offset, segment, &data,
1361                     OUT_ADDRESS, 4, NO_SEG, NO_SEG);
1362             }
1363             offset += 4;
1364             break;
1365
1366         case 074:
1367         case 075:
1368         case 076:
1369         case 077:
1370             if (opx->segment == NO_SEG)
1371                 errfunc(ERR_NONFATAL, "value referenced by FAR is not"
1372                         " relocatable");
1373             data = 0L;
1374             out(offset, segment, &data, OUT_ADDRESS, 2,
1375                 outfmt->segbase(1 + opx->segment),
1376                 opx->wrt);
1377             offset += 2;
1378             break;
1379
1380         case 0140:
1381         case 0141:
1382         case 0142:
1383         case 0143:
1384             data = opx->offset;
1385             if (is_sbyte(ins, c & 3, 16)) {
1386                 bytes[0] = data;
1387                 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG,
1388                     NO_SEG);
1389                 offset++;
1390             } else {
1391                 if (opx->segment == NO_SEG &&
1392                     opx->wrt == NO_SEG)
1393                     warn_overflow(2, data);
1394                 out(offset, segment, &data, OUT_ADDRESS, 2,
1395                     opx->segment, opx->wrt);
1396                 offset += 2;
1397             }
1398             break;
1399
1400         case 0144:
1401         case 0145:
1402         case 0146:
1403         case 0147:
1404             EMIT_REX();
1405             bytes[0] = *codes++;
1406             if (is_sbyte(ins, c & 3, 16))
1407                 bytes[0] |= 2;  /* s-bit */
1408             out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1409             offset++;
1410             break;
1411
1412         case 0150:
1413         case 0151:
1414         case 0152:
1415         case 0153:
1416             data = opx->offset;
1417             if (is_sbyte(ins, c & 3, 32)) {
1418                 bytes[0] = data;
1419                 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG,
1420                     NO_SEG);
1421                 offset++;
1422             } else {
1423                 out(offset, segment, &data, OUT_ADDRESS, 4,
1424                     opx->segment, opx->wrt);
1425                 offset += 4;
1426             }
1427             break;
1428
1429         case 0154:
1430         case 0155:
1431         case 0156:
1432         case 0157:
1433             EMIT_REX();
1434             bytes[0] = *codes++;
1435             if (is_sbyte(ins, c & 3, 32))
1436                 bytes[0] |= 2;  /* s-bit */
1437             out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1438             offset++;
1439             break;
1440
1441         case 0160:
1442         case 0161:
1443         case 0162:
1444         case 0163:
1445         case 0164:
1446         case 0165:
1447         case 0166:
1448         case 0167:
1449             break;
1450
1451         case 0170:
1452             EMIT_REX();
1453             bytes[0] = 0;
1454             out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1455             offset += 1;
1456             break;
1457
1458         case 0171:
1459             bytes[0] =
1460                 (ins->drexdst << 4) |
1461                 (ins->rex & REX_OC ? 0x08 : 0) |
1462                 (ins->rex & (REX_R|REX_X|REX_B));
1463             ins->rex = 0;
1464             out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1465             offset++;
1466             break;
1467
1468         case 0300:
1469         case 0301:
1470         case 0302:
1471         case 0303:
1472             break;
1473
1474         case 0310:
1475             if (bits == 32 && !has_prefix(ins, PPS_ASIZE, P_A16)) {
1476                 *bytes = 0x67;
1477                 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1478                 offset += 1;
1479             } else
1480                 offset += 0;
1481             break;
1482
1483         case 0311:
1484             if (bits != 32 && !has_prefix(ins, PPS_ASIZE, P_A32)) {
1485                 *bytes = 0x67;
1486                 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1487                 offset += 1;
1488             } else
1489                 offset += 0;
1490             break;
1491
1492         case 0312:
1493             break;
1494
1495         case 0313:
1496             ins->rex = 0;
1497             break;
1498
1499         case 0314:
1500         case 0315:
1501         case 0316:
1502         case 0317:
1503             break;
1504
1505         case 0320:
1506             if (bits != 16) {
1507                 *bytes = 0x66;
1508                 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1509                 offset += 1;
1510             } else
1511                 offset += 0;
1512             break;
1513
1514         case 0321:
1515             if (bits == 16) {
1516                 *bytes = 0x66;
1517                 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1518                 offset += 1;
1519             } else
1520                 offset += 0;
1521             break;
1522
1523         case 0322:
1524         case 0323:
1525             break;
1526
1527         case 0324:
1528             ins->rex |= REX_W;
1529             break;
1530
1531         case 0330:
1532             *bytes = *codes++ ^ condval[ins->condition];
1533             out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1534             offset += 1;
1535             break;
1536
1537         case 0331:
1538             break;
1539
1540         case 0332:
1541         case 0333:
1542             *bytes = c - 0332 + 0xF2;
1543             out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1544             offset += 1;
1545             break;
1546
1547         case 0334:
1548             if (ins->rex & REX_R) {
1549                 *bytes = 0xF0;
1550                 out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1551                 offset += 1;
1552             }
1553             ins->rex &= ~(REX_L|REX_R);
1554             break;
1555
1556         case 0335:
1557             break;
1558
1559         case 0340:
1560             if (ins->oprs[0].segment != NO_SEG)
1561                 errfunc(ERR_PANIC, "non-constant BSS size in pass two");
1562             else {
1563                 int64_t size = ins->oprs[0].offset;
1564                 if (size > 0)
1565                     out(offset, segment, NULL,
1566                         OUT_RESERVE, size, NO_SEG, NO_SEG);
1567                 offset += size;
1568             }
1569             break;
1570
1571         case 0364:
1572         case 0365:
1573             break;
1574
1575         case 0366:
1576         case 0367:
1577             *bytes = c - 0366 + 0x66;
1578             out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1579             offset += 1;
1580             break;
1581
1582         case 0370:
1583         case 0371:
1584         case 0372:
1585             break;
1586
1587         case 0373:
1588             *bytes = bits == 16 ? 3 : 5;
1589             out(offset, segment, bytes, OUT_RAWDATA, 1, NO_SEG, NO_SEG);
1590             offset += 1;
1591             break;
1592
1593         default:               /* can't do it by 'case' statements */
1594             if (c >= 0100 && c <= 0277) {       /* it's an EA */
1595                 ea ea_data;
1596                 int rfield;
1597                 int32_t rflags;
1598                 uint8_t *p;
1599                 int32_t s;
1600
1601                 if (c <= 0177) {
1602                     /* pick rfield from operand b */
1603                     rflags = regflag(&ins->oprs[c & 7]);
1604                     rfield = regvals[ins->oprs[c & 7].basereg];
1605                 } else {
1606                     /* rfield is constant */
1607                     rflags = 0;
1608                     rfield = c & 7;
1609                 }
1610
1611                 if (!process_ea
1612                     (&ins->oprs[(c >> 3) & 7], &ea_data, bits,
1613                      ins->addr_size, rfield, rflags, ins->forw_ref)) {
1614                     errfunc(ERR_NONFATAL, "invalid effective address");
1615                 }
1616
1617
1618                 p = bytes;
1619                 *p++ = ea_data.modrm;
1620                 if (ea_data.sib_present)
1621                     *p++ = ea_data.sib;
1622
1623                 /* DREX suffixes come between the SIB and the displacement */
1624                 if (ins->rex & REX_D) {
1625                     *p++ =
1626                         (ins->drexdst << 4) |
1627                         (ins->rex & REX_OC ? 0x08 : 0) |
1628                         (ins->rex & (REX_R|REX_X|REX_B));
1629                     ins->rex = 0;
1630                 }
1631
1632                 s = p - bytes;
1633                 out(offset, segment, bytes, OUT_RAWDATA, s, NO_SEG, NO_SEG);
1634
1635                 switch (ea_data.bytes) {
1636                 case 0:
1637                     break;
1638                 case 1:
1639                     if (ins->oprs[(c >> 3) & 7].segment != NO_SEG) {
1640                         data = ins->oprs[(c >> 3) & 7].offset;
1641                         out(offset, segment, &data, OUT_ADDRESS, 1,
1642                             ins->oprs[(c >> 3) & 7].segment,
1643                             ins->oprs[(c >> 3) & 7].wrt);
1644                     } else {
1645                         *bytes = ins->oprs[(c >> 3) & 7].offset;
1646                         out(offset, segment, bytes, OUT_RAWDATA, 1,
1647                             NO_SEG, NO_SEG);
1648                     }
1649                     s++;
1650                     break;
1651                 case 8:
1652                 case 2:
1653                 case 4:
1654                     data = ins->oprs[(c >> 3) & 7].offset;
1655                     warn_overflow(ea_data.bytes, data);
1656                     out(offset, segment, &data,
1657                         ea_data.rip ?  OUT_REL4ADR : OUT_ADDRESS,
1658                         ea_data.bytes,
1659                         ins->oprs[(c >> 3) & 7].segment,
1660                         ins->oprs[(c >> 3) & 7].wrt);
1661                     s += ea_data.bytes;
1662                     break;
1663                 }
1664                 offset += s;
1665             } else {
1666                 errfunc(ERR_PANIC, "internal instruction table corrupt"
1667                         ": instruction code 0x%02X given", c);
1668             }
1669         }
1670     }
1671 }
1672
1673 static int32_t regflag(const operand * o)
1674 {
1675     if (o->basereg < EXPR_REG_START || o->basereg >= REG_ENUM_LIMIT) {
1676         errfunc(ERR_PANIC, "invalid operand passed to regflag()");
1677     }
1678     return reg_flags[o->basereg];
1679 }
1680
1681 static int32_t regval(const operand * o)
1682 {
1683     if (o->basereg < EXPR_REG_START || o->basereg >= REG_ENUM_LIMIT) {
1684         errfunc(ERR_PANIC, "invalid operand passed to regval()");
1685     }
1686     return regvals[o->basereg];
1687 }
1688
1689 static int op_rexflags(const operand * o, int mask)
1690 {
1691     int32_t flags;
1692     int val;
1693
1694     if (o->basereg < EXPR_REG_START || o->basereg >= REG_ENUM_LIMIT) {
1695         errfunc(ERR_PANIC, "invalid operand passed to op_rexflags()");
1696     }
1697
1698     flags = reg_flags[o->basereg];
1699     val = regvals[o->basereg];
1700
1701     return rexflags(val, flags, mask);
1702 }
1703
1704 static int rexflags(int val, int32_t flags, int mask)
1705 {
1706     int rex = 0;
1707
1708     if (val >= 8)
1709         rex |= REX_B|REX_X|REX_R;
1710     if (flags & BITS64)
1711         rex |= REX_W;
1712     if (!(REG_HIGH & ~flags))   /* AH, CH, DH, BH */
1713         rex |= REX_H;
1714     else if (!(REG8 & ~flags) && val >= 4) /* SPL, BPL, SIL, DIL */
1715         rex |= REX_P;
1716
1717     return rex & mask;
1718 }
1719
1720 static int matches(const struct itemplate *itemp, insn * instruction, int bits)
1721 {
1722     int i, size[MAX_OPERANDS], asize, oprs, ret;
1723
1724     ret = 100;
1725
1726     /*
1727      * Check the opcode
1728      */
1729     if (itemp->opcode != instruction->opcode)
1730         return 0;
1731
1732     /*
1733      * Count the operands
1734      */
1735     if (itemp->operands != instruction->operands)
1736         return 0;
1737
1738     /*
1739      * Check that no spurious colons or TOs are present
1740      */
1741     for (i = 0; i < itemp->operands; i++)
1742         if (instruction->oprs[i].type & ~itemp->opd[i] & (COLON | TO))
1743             return 0;
1744
1745     /*
1746      * Check that the operand flags all match up
1747      */
1748     for (i = 0; i < itemp->operands; i++) {
1749         if (itemp->opd[i] & SAME_AS) {
1750             int j = itemp->opd[i] & ~SAME_AS;
1751             if (instruction->oprs[i].type != instruction->oprs[j].type ||
1752                 instruction->oprs[i].basereg != instruction->oprs[j].basereg)
1753                 return 0;
1754         } else  if (itemp->opd[i] & ~instruction->oprs[i].type ||
1755             ((itemp->opd[i] & SIZE_MASK) &&
1756              ((itemp->opd[i] ^ instruction->oprs[i].type) & SIZE_MASK))) {
1757             if ((itemp->opd[i] & ~instruction->oprs[i].type & ~SIZE_MASK) ||
1758                 (instruction->oprs[i].type & SIZE_MASK))
1759                 return 0;
1760             else
1761                 return 1;
1762         }
1763     }
1764
1765     /*
1766      * Check operand sizes
1767      */
1768     if (itemp->flags & IF_ARMASK) {
1769         memset(size, 0, sizeof size);
1770
1771         switch (itemp->flags & IF_ARMASK) {
1772         case IF_AR0:
1773             i = 0;
1774             break;
1775         case IF_AR1:
1776             i = 1;
1777             break;
1778         case IF_AR2:
1779             i = 2;
1780             break;
1781         case IF_AR3:
1782             i = 3;
1783             break;
1784         default:
1785             break;              /* Shouldn't happen */
1786         }
1787         switch (itemp->flags & IF_SMASK) {
1788         case IF_SB:
1789             size[i] = BITS8;
1790             break;
1791         case IF_SW:
1792             size[i] = BITS16;
1793             break;
1794         case IF_SD:
1795             size[i] = BITS32;
1796             break;
1797         case IF_SQ:
1798             size[i] = BITS64;
1799             break;
1800         case IF_SO:
1801             size[i] = BITS128;
1802             break;
1803         default:
1804             break;
1805         }
1806     } else {
1807         asize = 0;
1808         switch (itemp->flags & IF_SMASK) {
1809         case IF_SB:
1810             asize = BITS8;
1811             oprs = itemp->operands;
1812             break;
1813         case IF_SW:
1814             asize = BITS16;
1815             oprs = itemp->operands;
1816             break;
1817         case IF_SD:
1818             asize = BITS32;
1819             oprs = itemp->operands;
1820             break;
1821         case IF_SQ:
1822             asize = BITS64;
1823             oprs = itemp->operands;
1824             break;
1825         case IF_SO:
1826             asize = BITS128;
1827             oprs = itemp->operands;
1828             break;
1829         default:
1830             break;
1831         }
1832         for (i = 0; i < MAX_OPERANDS; i++)
1833             size[i] = asize;
1834     }
1835
1836     if (itemp->flags & (IF_SM | IF_SM2)) {
1837         oprs = (itemp->flags & IF_SM2 ? 2 : itemp->operands);
1838         asize = 0;
1839         for (i = 0; i < oprs; i++) {
1840             if ((asize = itemp->opd[i] & SIZE_MASK) != 0) {
1841                 int j;
1842                 for (j = 0; j < oprs; j++)
1843                     size[j] = asize;
1844                 break;
1845             }
1846         }
1847     } else {
1848         oprs = itemp->operands;
1849     }
1850
1851     for (i = 0; i < itemp->operands; i++) {
1852         if (!(itemp->opd[i] & SIZE_MASK) &&
1853             (instruction->oprs[i].type & SIZE_MASK & ~size[i]))
1854             return 2;
1855     }
1856
1857     /*
1858      * Check template is okay at the set cpu level
1859      */
1860     if (((itemp->flags & IF_PLEVEL) > cpu))
1861         return 3;
1862
1863     /*
1864      * Check if instruction is available in long mode
1865      */
1866     if ((itemp->flags & IF_NOLONG) && (bits == 64))
1867         return 4;
1868
1869     /*
1870      * Check if special handling needed for Jumps
1871      */
1872     if ((uint8_t)(itemp->code[0]) >= 0370)
1873         return 99;
1874
1875     return ret;
1876 }
1877
1878 static ea *process_ea(operand * input, ea * output, int bits,
1879                       int addrbits, int rfield, int32_t rflags, int forw_ref)
1880 {
1881     output->rip = false;
1882
1883     /* REX flags for the rfield operand */
1884     output->rex |= rexflags(rfield, rflags, REX_R|REX_P|REX_W|REX_H);
1885
1886     if (!(REGISTER & ~input->type)) {   /* register direct */
1887         int i;
1888         int32_t f;
1889
1890         if (input->basereg < EXPR_REG_START /* Verify as Register */
1891             || input->basereg >= REG_ENUM_LIMIT)
1892             return NULL;
1893         f = regflag(input);
1894         i = regvals[input->basereg];
1895
1896         if (REG_EA & ~f)
1897             return NULL;        /* Invalid EA register */
1898
1899         output->rex |= op_rexflags(input, REX_B|REX_P|REX_W|REX_H);
1900
1901         output->sib_present = false;             /* no SIB necessary */
1902         output->bytes = 0;  /* no offset necessary either */
1903         output->modrm = 0xC0 | ((rfield & 7) << 3) | (i & 7);
1904     } else {                    /* it's a memory reference */
1905         if (input->basereg == -1
1906             && (input->indexreg == -1 || input->scale == 0)) {
1907             /* it's a pure offset */
1908             if (bits == 64 && (~input->type & IP_REL)) {
1909               int scale, index, base;
1910               output->sib_present = true;
1911               scale = 0;
1912               index = 4;
1913               base = 5;
1914               output->sib = (scale << 6) | (index << 3) | base;
1915               output->bytes = 4;
1916               output->modrm = 4 | ((rfield & 7) << 3);
1917               output->rip = false;
1918             } else {
1919               output->sib_present = false;
1920               output->bytes = (addrbits != 16 ? 4 : 2);
1921               output->modrm = (addrbits != 16 ? 5 : 6) | ((rfield & 7) << 3);
1922               output->rip = bits == 64;
1923             }
1924         } else {                /* it's an indirection */
1925             int i = input->indexreg, b = input->basereg, s = input->scale;
1926             int32_t o = input->offset, seg = input->segment;
1927             int hb = input->hintbase, ht = input->hinttype;
1928             int t;
1929             int it, bt;
1930             int32_t ix, bx;     /* register flags */
1931
1932             if (s == 0)
1933                 i = -1;         /* make this easy, at least */
1934
1935             if (i >= EXPR_REG_START && i < REG_ENUM_LIMIT) {
1936                 it = regvals[i];
1937                 ix = reg_flags[i];
1938             } else {
1939                 it = -1;
1940                 ix = 0;
1941             }
1942
1943             if (b >= EXPR_REG_START && b < REG_ENUM_LIMIT) {
1944                 bt = regvals[b];
1945                 bx = reg_flags[b];
1946             } else {
1947                 bt = -1;
1948                 bx = 0;
1949             }
1950
1951             /* check for a 32/64-bit memory reference... */
1952             if ((ix|bx) & (BITS32|BITS64)) {
1953                 /* it must be a 32/64-bit memory reference. Firstly we have
1954                  * to check that all registers involved are type E/Rxx. */
1955                 int32_t sok = BITS32|BITS64;
1956
1957                 if (it != -1) {
1958                     if (!(REG64 & ~ix) || !(REG32 & ~ix))
1959                         sok &= ix;
1960                     else
1961                         return NULL;
1962                 }
1963
1964                 if (bt != -1) {
1965                     if (REG_GPR & ~bx)
1966                         return NULL; /* Invalid register */
1967                     if (~sok & bx & SIZE_MASK)
1968                         return NULL; /* Invalid size */
1969                     sok &= bx;
1970                 }
1971
1972                 /* While we're here, ensure the user didn't specify
1973                    WORD or QWORD. */
1974                 if (input->disp_size == 16 || input->disp_size == 64)
1975                     return NULL;
1976
1977                 if (addrbits == 16 ||
1978                     (addrbits == 32 && !(sok & BITS32)) ||
1979                     (addrbits == 64 && !(sok & BITS64)))
1980                     return NULL;
1981
1982                 /* now reorganize base/index */
1983                 if (s == 1 && bt != it && bt != -1 && it != -1 &&
1984                     ((hb == b && ht == EAH_NOTBASE)
1985                      || (hb == i && ht == EAH_MAKEBASE))) {
1986                     /* swap if hints say so */
1987                     t = bt, bt = it, it = t;
1988                     t = bx, bx = ix, ix = t;
1989                 }
1990                 if (bt == it)     /* convert EAX+2*EAX to 3*EAX */
1991                     bt = -1, bx = 0, s++;
1992                 if (bt == -1 && s == 1 && !(hb == it && ht == EAH_NOTBASE)) {
1993                     /* make single reg base, unless hint */
1994                     bt = it, bx = ix, it = -1, ix = 0;
1995                 }
1996                 if (((s == 2 && it != REG_NUM_ESP
1997                       && !(input->eaflags & EAF_TIMESTWO)) || s == 3
1998                      || s == 5 || s == 9) && bt == -1)
1999                     bt = it, bx = ix, s--; /* convert 3*EAX to EAX+2*EAX */
2000                 if (it == -1 && (bt & 7) != REG_NUM_ESP
2001                     && (input->eaflags & EAF_TIMESTWO))
2002                     it = bt, ix = bx, bt = -1, bx = 0, s = 1;
2003                 /* convert [NOSPLIT EAX] to sib format with 0x0 displacement */
2004                 if (s == 1 && it == REG_NUM_ESP) {
2005                     /* swap ESP into base if scale is 1 */
2006                     t = it, it = bt, bt = t;
2007                     t = ix, ix = bx, bx = t;
2008                 }
2009                 if (it == REG_NUM_ESP
2010                     || (s != 1 && s != 2 && s != 4 && s != 8 && it != -1))
2011                     return NULL;        /* wrong, for various reasons */
2012
2013                 output->rex |= rexflags(it, ix, REX_X);
2014                 output->rex |= rexflags(bt, bx, REX_B);
2015
2016                 if (it == -1 && (bt & 7) != REG_NUM_ESP) {
2017                     /* no SIB needed */
2018                     int mod, rm;
2019
2020                     if (bt == -1) {
2021                         rm = 5;
2022                         mod = 0;
2023                     } else {
2024                         rm = (bt & 7);
2025                         if (rm != REG_NUM_EBP && o == 0 &&
2026                                 seg == NO_SEG && !forw_ref &&
2027                                 !(input->eaflags &
2028                                   (EAF_BYTEOFFS | EAF_WORDOFFS)))
2029                             mod = 0;
2030                         else if (input->eaflags & EAF_BYTEOFFS ||
2031                                  (o >= -128 && o <= 127 && seg == NO_SEG
2032                                   && !forw_ref
2033                                   && !(input->eaflags & EAF_WORDOFFS)))
2034                             mod = 1;
2035                         else
2036                             mod = 2;
2037                     }
2038
2039                     output->sib_present = false;
2040                     output->bytes = (bt == -1 || mod == 2 ? 4 : mod);
2041                     output->modrm = (mod << 6) | ((rfield & 7) << 3) | rm;
2042                 } else {
2043                     /* we need a SIB */
2044                     int mod, scale, index, base;
2045
2046                     if (it == -1)
2047                         index = 4, s = 1;
2048                     else
2049                         index = (it & 7);
2050
2051                     switch (s) {
2052                     case 1:
2053                         scale = 0;
2054                         break;
2055                     case 2:
2056                         scale = 1;
2057                         break;
2058                     case 4:
2059                         scale = 2;
2060                         break;
2061                     case 8:
2062                         scale = 3;
2063                         break;
2064                     default:   /* then what the smeg is it? */
2065                         return NULL;    /* panic */
2066                     }
2067
2068                     if (bt == -1) {
2069                         base = 5;
2070                         mod = 0;
2071                     } else {
2072                         base = (bt & 7);
2073                         if (base != REG_NUM_EBP && o == 0 &&
2074                                     seg == NO_SEG && !forw_ref &&
2075                                     !(input->eaflags &
2076                                       (EAF_BYTEOFFS | EAF_WORDOFFS)))
2077                             mod = 0;
2078                         else if (input->eaflags & EAF_BYTEOFFS ||
2079                                  (o >= -128 && o <= 127 && seg == NO_SEG
2080                                   && !forw_ref
2081                                   && !(input->eaflags & EAF_WORDOFFS)))
2082                             mod = 1;
2083                         else
2084                             mod = 2;
2085                     }
2086
2087                     output->sib_present = true;
2088                     output->bytes =  (bt == -1 || mod == 2 ? 4 : mod);
2089                     output->modrm = (mod << 6) | ((rfield & 7) << 3) | 4;
2090                     output->sib = (scale << 6) | (index << 3) | base;
2091                 }
2092             } else {            /* it's 16-bit */
2093                 int mod, rm;
2094
2095                 /* check for 64-bit long mode */
2096                 if (addrbits == 64)
2097                     return NULL;
2098
2099                 /* check all registers are BX, BP, SI or DI */
2100                 if ((b != -1 && b != R_BP && b != R_BX && b != R_SI
2101                      && b != R_DI) || (i != -1 && i != R_BP && i != R_BX
2102                                        && i != R_SI && i != R_DI))
2103                     return NULL;
2104
2105                 /* ensure the user didn't specify DWORD/QWORD */
2106                 if (input->disp_size == 32 || input->disp_size == 64)
2107                     return NULL;
2108
2109                 if (s != 1 && i != -1)
2110                     return NULL;        /* no can do, in 16-bit EA */
2111                 if (b == -1 && i != -1) {
2112                     int tmp = b;
2113                     b = i;
2114                     i = tmp;
2115                 }               /* swap */
2116                 if ((b == R_SI || b == R_DI) && i != -1) {
2117                     int tmp = b;
2118                     b = i;
2119                     i = tmp;
2120                 }
2121                 /* have BX/BP as base, SI/DI index */
2122                 if (b == i)
2123                     return NULL;        /* shouldn't ever happen, in theory */
2124                 if (i != -1 && b != -1 &&
2125                     (i == R_BP || i == R_BX || b == R_SI || b == R_DI))
2126                     return NULL;        /* invalid combinations */
2127                 if (b == -1)    /* pure offset: handled above */
2128                     return NULL;        /* so if it gets to here, panic! */
2129
2130                 rm = -1;
2131                 if (i != -1)
2132                     switch (i * 256 + b) {
2133                     case R_SI * 256 + R_BX:
2134                         rm = 0;
2135                         break;
2136                     case R_DI * 256 + R_BX:
2137                         rm = 1;
2138                         break;
2139                     case R_SI * 256 + R_BP:
2140                         rm = 2;
2141                         break;
2142                     case R_DI * 256 + R_BP:
2143                         rm = 3;
2144                         break;
2145                 } else
2146                     switch (b) {
2147                     case R_SI:
2148                         rm = 4;
2149                         break;
2150                     case R_DI:
2151                         rm = 5;
2152                         break;
2153                     case R_BP:
2154                         rm = 6;
2155                         break;
2156                     case R_BX:
2157                         rm = 7;
2158                         break;
2159                     }
2160                 if (rm == -1)   /* can't happen, in theory */
2161                     return NULL;        /* so panic if it does */
2162
2163                 if (o == 0 && seg == NO_SEG && !forw_ref && rm != 6 &&
2164                     !(input->eaflags & (EAF_BYTEOFFS | EAF_WORDOFFS)))
2165                     mod = 0;
2166                 else if (input->eaflags & EAF_BYTEOFFS ||
2167                          (o >= -128 && o <= 127 && seg == NO_SEG
2168                           && !forw_ref
2169                           && !(input->eaflags & EAF_WORDOFFS)))
2170                     mod = 1;
2171                 else
2172                     mod = 2;
2173
2174                 output->sib_present = false;    /* no SIB - it's 16-bit */
2175                 output->bytes = mod;    /* bytes of offset needed */
2176                 output->modrm = (mod << 6) | ((rfield & 7) << 3) | rm;
2177             }
2178         }
2179     }
2180
2181     output->size = 1 + output->sib_present + output->bytes;
2182     return output;
2183 }
2184
2185 static void add_asp(insn *ins, int addrbits)
2186 {
2187     int j, valid;
2188     int defdisp;
2189
2190     valid = (addrbits == 64) ? 64|32 : 32|16;
2191
2192     switch (ins->prefixes[PPS_ASIZE]) {
2193     case P_A16:
2194         valid &= 16;
2195         break;
2196     case P_A32:
2197         valid &= 32;
2198         break;
2199     case P_A64:
2200         valid &= 64;
2201         break;
2202     case P_ASP:
2203         valid &= (addrbits == 32) ? 16 : 32;
2204         break;
2205     default:
2206         break;
2207     }
2208
2209     for (j = 0; j < ins->operands; j++) {
2210         if (!(MEMORY & ~ins->oprs[j].type)) {
2211             int32_t i, b;
2212
2213             /* Verify as Register */
2214             if (ins->oprs[j].indexreg < EXPR_REG_START
2215                 || ins->oprs[j].indexreg >= REG_ENUM_LIMIT)
2216                 i = 0;
2217             else
2218                 i = reg_flags[ins->oprs[j].indexreg];
2219
2220             /* Verify as Register */
2221             if (ins->oprs[j].basereg < EXPR_REG_START
2222                 || ins->oprs[j].basereg >= REG_ENUM_LIMIT)
2223                 b = 0;
2224             else
2225                 b = reg_flags[ins->oprs[j].basereg];
2226
2227             if (ins->oprs[j].scale == 0)
2228                 i = 0;
2229
2230             if (!i && !b) {
2231                 int ds = ins->oprs[j].disp_size;
2232                 if ((addrbits != 64 && ds > 8) ||
2233                     (addrbits == 64 && ds == 16))
2234                     valid &= ds;
2235             } else {
2236                 if (!(REG16 & ~b))
2237                     valid &= 16;
2238                 if (!(REG32 & ~b))
2239                     valid &= 32;
2240                 if (!(REG64 & ~b))
2241                     valid &= 64;
2242
2243                 if (!(REG16 & ~i))
2244                     valid &= 16;
2245                 if (!(REG32 & ~i))
2246                     valid &= 32;
2247                 if (!(REG64 & ~i))
2248                     valid &= 64;
2249             }
2250         }
2251     }
2252
2253     if (valid & addrbits) {
2254         ins->addr_size = addrbits;
2255     } else if (valid & ((addrbits == 32) ? 16 : 32)) {
2256         /* Add an address size prefix */
2257         enum prefixes pref = (addrbits == 32) ? P_A16 : P_A32;
2258         ins->prefixes[PPS_ASIZE] = pref;
2259         ins->addr_size = (addrbits == 32) ? 16 : 32;
2260     } else {
2261         /* Impossible... */
2262         errfunc(ERR_NONFATAL, "impossible combination of address sizes");
2263         ins->addr_size = addrbits; /* Error recovery */
2264     }
2265
2266     defdisp = ins->addr_size == 16 ? 16 : 32;
2267
2268     for (j = 0; j < ins->operands; j++) {
2269         if (!(MEM_OFFS & ~ins->oprs[j].type) &&
2270             (ins->oprs[j].disp_size ? ins->oprs[j].disp_size : defdisp)
2271             != ins->addr_size) {
2272             /* mem_offs sizes must match the address size; if not,
2273                strip the MEM_OFFS bit and match only EA instructions */
2274             ins->oprs[j].type &= ~(MEM_OFFS & ~MEMORY);
2275         }
2276     }
2277 }