preproc.c

   1 /* preproc.c   macro preprocessor for the Netwide Assembler
   2  *
   3  * The Netwide Assembler is copyright (C) 1996 Simon Tatham and
   4  * Julian Hall. All rights reserved. The software is
   5  * redistributable under the license given in the file "LICENSE"
   6  * distributed in the NASM archive.
   7  *
   8  * initial version 18/iii/97 by Simon Tatham
   9  */
  10
  11 /* Typical flow of text through preproc
  12  *
  13  * pp_getline gets tokenized lines, either
  14  *
  15  *   from a macro expansion
  16  *
  17  * or
  18  *   {
  19  *   read_line  gets raw text from stdmacpos, or predef, or current input file
  20  *   tokenize   converts to tokens
  21  *   }
  22  *
  23  * expand_mmac_params is used to expand %1 etc., unless a macro is being
  24  * defined or a false conditional is being processed
  25  * (%0, %1, %+1, %-1, %%foo)
  26  *
  27  * do_directive checks for directives
  28  *
  29  * expand_smacro is used to expand single line macros
  30  *
  31  * expand_mmacro is used to expand multi-line macros
  32  *
  33  * detoken is used to convert the line back to text
  34  */
  35
  36 #include "compiler.h"
  37
  38 #include <stdio.h>
  39 #include <stdarg.h>
  40 #include <stdlib.h>
  41 #include <stddef.h>
  42 #include <string.h>
  43 #include <ctype.h>
  44 #include <limits.h>
  45 #include <inttypes.h>
  46
  47 #include "nasm.h"
  48 #include "nasmlib.h"
  49 #include "preproc.h"
  50 #include "hashtbl.h"
  51 #include "stdscan.h"
  52 #include "tokens.h"
  53
  54 typedef struct SMacro SMacro;       /* single-line macro definition */
  55 typedef struct MMacro MMacro;       /* multi-line macro, or a %rep block */
  56 typedef struct Context Context;     /* entry on the context stack */
  57 typedef struct Token Token;         /* one token of a tokenized line */
  58 typedef struct Blocks Blocks;       /* node tracking one managed memory chunk */
  59 typedef struct Line Line;           /* one line of tokens, or an end-of-expansion marker */
  60 typedef struct Include Include;     /* entry on the file inclusion stack */
  61 typedef struct Cond Cond;           /* entry on a conditional-assembly stack */
  62 typedef struct IncPath IncPath;     /* entry in the include search path */
  63
  64 /*
  65  * Note on the storage of both SMacro and MMacros: the hash table
  66  * indexes them case-insensitively, and we then have to go through a
  67  * linked list of potential case aliases (and, for MMacros, parameter
  68  * ranges); this is to preserve the matching semantics of the earlier
  69  * code.  If the number of case aliases for a specific macro is a
  70  * performance issue, you may want to reconsider your coding style.
  71  */
  72
  73 /*
  74  * Store the definition of a single-line macro.
  75  */
  76 struct SMacro {
  77     SMacro *next;               /* next macro on the same list (hash-bucket aliases, or a context's local macros) */
  78     char *name;                 /* macro name; released with nasm_free() */
  79     bool casesense;             /* presumably: name is matched case-sensitively -- confirm */
  80     bool in_progress;           /* presumably: set while this macro is being expanded -- confirm */
  81     unsigned int nparam;        /* presumably: number of parameters taken -- confirm */
  82     Token *expansion;           /* replacement token list; released with free_tlist() */
  83 };
  84
  85 /*
  86  * Store the definition of a multi-line macro. This is also used to
  87  * store the interiors of `%rep...%endrep' blocks, which are
  88  * effectively self-re-invoking multi-line macros which simply
  89  * don't have a name or bother to appear in the hash tables. %rep
  90  * blocks are signified by having a NULL `name' field.
  91  *
  92  * In a MMacro describing a `%rep' block, the `in_progress' field
  93  * isn't merely boolean, but gives the number of repeats left to
  94  * run.
  95  *
  96  * The `next' field is used for storing MMacros in hash tables; the
  97  * `next_active' field is for stacking them on istk entries.
  98  *
  99  * When a MMacro is being expanded, `params', `iline', `nparam',
 100  * `paramlen', `rotate' and `unique' are local to the invocation.
 101  */
 102 struct MMacro {
 103     MMacro *next;               /* hash-table chain of macros sharing a key */
 104     char *name;                 /* macro name; NULL for a %rep block */
 105     int nparam_min, nparam_max; /* presumably: accepted parameter-count range -- confirm */
 106     bool casesense;             /* presumably: name is matched case-sensitively -- confirm */
 107     bool plus;                   /* is the last parameter greedy? */
 108     bool nolist;                 /* is this macro listing-inhibited? */
 109     int64_t in_progress;        /* for a %rep block: number of repeats left to run */
 110     Token *dlist;               /* All defaults as one list */
 111     Token **defaults;           /* Parameter default pointers */
 112     int ndefs;                  /* number of default parameters */
 113     Line *expansion;            /* body lines, stored in reverse order (see struct Line) */
 114
     /* The fields below are per-invocation state (see the comment above) */
 115     MMacro *next_active;        /* links macros stacked on an istk entry */
 116     MMacro *rep_nest;           /* used for nesting %rep */
 117     Token **params;             /* actual parameters */
 118     Token *iline;               /* invocation line */
 119     unsigned int nparam, rotate;
 120     int *paramlen;
 121     uint64_t unique;
 122     int lineno;                 /* Current line number on expansion */
 123 };
 124
 125 /*
 126  * The context stack is composed of a linked list of these.
 127  */
 128 struct Context {
 129     Context *next;              /* next context down the stack */
 130     SMacro *localmac;           /* context-local single-line macros; freed by ctx_pop() */
 131     char *name;                 /* context name; freed by ctx_pop() */
 132     uint32_t number;            /* NOTE(review): presumably the ctxnum used in ..@ctxnum.xxx names -- confirm */
 133 };
 134
 135 /*
 136  * This is the internal form which we break input lines up into.
 137  * Typically stored in linked lists.
 138  *
 139  * Note that `type' serves a double meaning: TOK_SMAC_PARAM is not
 140  * necessarily used as-is, but is intended to denote the number of
 141  * the substituted parameter. So in the definition
 142  *
 143  *     %define a(x,y) ( (x) & ~(y) )
 144  *
 145  * the token representing `x' will have its type changed to
 146  * TOK_SMAC_PARAM, but the one representing `y' will be
 147  * TOK_SMAC_PARAM+1.
 148  *
 149  * TOK_INTERNAL_STRING is a dirty hack: it's a single string token
 150  * which doesn't need quotes around it. Used in the pre-include
 151  * mechanism as an alternative to trying to find a sensible type of
 152  * quote to use on the filename we were passed.
 153  */
 154 enum pp_token_type {
 155     TOK_NONE = 0, TOK_WHITESPACE, TOK_COMMENT, TOK_ID,
 156     TOK_PREPROC_ID, TOK_STRING,
 157     TOK_NUMBER, TOK_FLOAT, TOK_SMAC_END, TOK_OTHER, TOK_SMAC_PARAM,
     /*
      * TOK_SMAC_PARAM is a base value: TOK_SMAC_PARAM+n denotes parameter n.
      * NOTE(review): with this ordering TOK_SMAC_PARAM+1 has the same
      * numeric value as TOK_INTERNAL_STRING -- confirm the two can never
      * meet in the same token list.
      */
 158     TOK_INTERNAL_STRING
 159 };
 160
 161 struct Token {
 162     Token *next;                /* next token on the line, or next entry on the free list */
 163     char *text;                 /* heap copy of the token text; NULL for TOK_WHITESPACE */
 164     SMacro *mac;                /* associated macro for TOK_SMAC_END */
 165     enum pp_token_type type;    /* token class; may be TOK_SMAC_PARAM+n (see above) */
 166 };
 167
 168 /*
 169  * Multi-line macro definitions are stored as a linked list of
 170  * these, which is essentially a container to allow several linked
 171  * lists of Tokens.
 172  *
 173  * Note that in this module, linked lists are treated as stacks
 174  * wherever possible. For this reason, Lines are _pushed_ on to the
 175  * `expansion' field in MMacro structures, so that the linked list,
 176  * if walked, would give the macro lines in reverse order; this
 177  * means that we can walk the list when expanding a macro, and thus
 178  * push the lines on to the `expansion' field in _istk_ in reverse
 179  * order (so that when popped back off they are in the right
 180  * order). It may seem cockeyed, and it relies on my design having
 181  * an even number of steps in, but it works...
 182  *
 183  * Some of these structures, rather than being actual lines, are
 184  * markers delimiting the end of the expansion of a given macro.
 185  * This is for use in the cycle-tracking and %rep-handling code.
 186  * Such structures have `finishes' non-NULL, and `first' NULL. All
 187  * others have `finishes' NULL, but `first' may still be NULL if
 188  * the line is blank.
 189  */
 190 struct Line {
 191     Line *next;                 /* next line on the stack */
 192     MMacro *finishes;           /* non-NULL only on an end-of-expansion marker */
 193     Token *first;               /* tokens of the line; NULL for markers and blank lines */
 194 };
 195
 196 /*
 197  * To handle an arbitrary level of file inclusion, we maintain a
 198  * stack (ie linked list) of these things.
 199  */
 200 struct Include {
 201     Include *next;              /* enclosing (including) file */
 202     FILE *fp;                   /* stream that read_line() reads from */
 203     Cond *conds;                /* conditional-assembly stack for this inclusion level */
 204     Line *expansion;            /* stack of pending lines (e.g. the pushed `predef' lines) */
 205     char *fname;                /* presumably the file name -- confirm */
 206     int lineno, lineinc;        /* lineinc is the per-line increment read_line() applies to the source line number */
 207     MMacro *mstk;               /* stack of active macros/reps */
 208 };
 209
 210 /*
 211  * Include search path. This is simply a list of strings which get
 212  * prepended, in turn, to the name of an include file, in an
 213  * attempt to find the file if it's not in the current directory.
 214  */
 215 struct IncPath {
 216     IncPath *next;              /* next directory to try */
 217     char *path;                 /* string prepended to the include file name */
 218 };
 219
 220 /*
 221  * Conditional assembly: we maintain a separate stack of these for
 222  * each level of file inclusion. (The only reason we keep the
 223  * stacks separate is to ensure that a stray `%endif' in a file
 224  * included from within the true branch of a `%if' won't terminate
 225  * it and cause confusion: instead, rightly, it'll cause an error.)
 226  */
 227 struct Cond {
 228     Cond *next;                 /* enclosing conditional */
 229     int state;                  /* presumably one of the COND_* values below -- confirm */
 230 };
 231 enum {
 232     /*
 233      * These states are for use just after %if or %elif: IF_TRUE
 234      * means the condition has evaluated to truth so we are
 235      * currently emitting, whereas IF_FALSE means we are not
 236      * currently emitting but will start doing so if a %else comes
 237      * up. In these states, all directives are admissible: %elif,
 238      * %else and %endif. (And of course %if.)
 239      */
 240     COND_IF_TRUE, COND_IF_FALSE,
 241     /*
 242      * These states come up after a %else: ELSE_TRUE means we're
 243      * emitting, and ELSE_FALSE means we're not. In ELSE_* states,
 244      * any %elif or %else will cause an error.
 245      */
 246     COND_ELSE_TRUE, COND_ELSE_FALSE,
 247     /*
 248      * This state means that we're not emitting now, and also that
 249      * nothing until %endif will be emitted at all. It's for use in
 250      * two circumstances: (i) when we've had our moment of emission
 251      * and have now started seeing %elifs, and (ii) when the
 252      * condition construct in question is contained within a
 253      * non-emitting branch of a larger condition construct.
 254      */
 255     COND_NEVER
 256 };
/*
 * True for the two states in which lines are being emitted.  The
 * argument is evaluated twice, so it must have no side effects.
 */
 257 #define emitting(x) ( (x) == COND_IF_TRUE || (x) == COND_ELSE_TRUE )
 258
 259 /*
 260  * These defines are used as the possible return values for do_directive
 261  */
 262 #define NO_DIRECTIVE_FOUND  0   /* per the name: the line was not a directive */
 263 #define DIRECTIVE_FOUND     1   /* per the name: the line was a directive */
 264
 265 /*
 266  * Condition codes. Note that we use c_ prefix not C_ because C_ is
 267  * used in nasm.h for the "real" condition codes. At _this_ level,
 268  * we treat CXZ and ECXZ as condition codes, albeit non-invertible
 269  * ones, so we need a different enum...
 270  */
 271 static const char * const conditions[] = {
 272     "a", "ae", "b", "be", "c", "cxz", "e", "ecxz", "g", "ge", "l", "le",
 273     "na", "nae", "nb", "nbe", "nc", "ne", "ng", "nge", "nl", "nle", "no",
 274     "np", "ns", "nz", "o", "p", "pe", "po", "rcxz", "s", "z"
 275 };
 276 enum pp_conds {
 277     c_A, c_AE, c_B, c_BE, c_C, c_CXZ, c_E, c_ECXZ, c_G, c_GE, c_L, c_LE,
 278     c_NA, c_NAE, c_NB, c_NBE, c_NC, c_NE, c_NG, c_NGE, c_NL, c_NLE, c_NO,
 279     c_NP, c_NS, c_NZ, c_O, c_P, c_PE, c_PO, c_RCXZ, c_S, c_Z,
 280     c_none = -1
 281 };
 282 static const enum pp_conds inverse_ccs[] = {
 283     c_NA, c_NAE, c_NB, c_NBE, c_NC, -1, c_NE, -1, c_NG, c_NGE, c_NL, c_NLE,
 284     c_A, c_AE, c_B, c_BE, c_C, c_E, c_G, c_GE, c_L, c_LE, c_O, c_P, c_S,
 285     c_Z, c_NO, c_NP, c_PO, c_PE, -1, c_NS, c_NZ
 286 };
 287
 288 /*
 289  * Directive names.
 290  */
 291 /* If this is a an IF, ELIF, ELSE or ENDIF keyword */
 292 static int is_condition(enum preproc_token arg)
 293 {
 294     return PP_IS_COND(arg) || (arg == PP_ELSE) || (arg == PP_ENDIF);
 295 }
 296
 297 /* For TASM compatibility we need to be able to recognise TASM compatible
 298  * conditional compilation directives. Using the NASM pre-processor does
 299  * not work, so we look for them specifically from the following list and
 300  * then jam in the equivalent NASM directive into the input stream.
 301  */
 302
 303 enum {
 304     TM_ARG, TM_ELIF, TM_ELSE, TM_ENDIF, TM_IF, TM_IFDEF, TM_IFDIFI,
 305     TM_IFNDEF, TM_INCLUDE, TM_LOCAL
 306 };
 307
 308 static const char * const tasm_directives[] = {
 309     "arg", "elif", "else", "endif", "if", "ifdef", "ifdifi",
 310     "ifndef", "include", "local"
 311 };
 312
 313 static int StackSize = 4;          /* NOTE(review): these four look like stack-frame */
 314 static char *StackPointer = "ebp"; /* settings for the TASM-style arg/local          */
 315 static int ArgOffset = 8;          /* directives listed above -- confirm against     */
 316 static int LocalOffset = 0;        /* their users, which are not shown here          */
 317
 318 static Context *cstk;           /* top of the context stack (popped by ctx_pop) */
 319 static Include *istk;           /* top of the file inclusion stack; read_line reads istk->fp */
 320 static IncPath *ipath = NULL;   /* head of the include search path list */
 321
 322 static efunc _error;            /* Pointer to client-provided error reporting function */
 323 static evalfunc evaluate;       /* presumably the client-provided expression evaluator -- confirm */
 324
 325 static int pass;                /* HACK: pass 0 = generate dependencies only */
 326
 327 static uint64_t unique;    /* unique identifier numbers */
 328
 329 static Line *predef = NULL;     /* pre-include/pre-define lines; read_line copies them onto istk->expansion */
 330
 331 static ListGen *list;           /* listing generator; read_line reports each raw line via list->line() */
 332
 333 /*
 334  * The current set of multi-line macros we have defined.
 335  */
 336 static struct hash_table *mmacros;      /* created by init_macros, destroyed by free_macros */
 337
 338 /*
 339  * The current set of single-line macros we have defined.
 340  */
 341 static struct hash_table *smacros;      /* created by init_macros, destroyed by free_macros */
 342
 343 /*
 344  * The multi-line macro we are currently defining, or the %rep
 345  * block we are currently reading, if any.
 346  */
 347 static MMacro *defining;
 348
 349 /*
 350  * The number of macro parameters to allocate space for at a time.
 351  */
 352 #define PARAM_DELTA 16
 353
 354 /*
 355  * The standard macro set: defined as `static char *stdmac[]'. Also
 356  * gives our position in the macro set, when we're processing it.
 * read_line() hands out the lines at stdmacpos before reading any
 * file, and sets stdmacpos to NULL once the set is exhausted.
 357  */
 358 #include "macros.c"
 359 static const char * const *stdmacpos;
 360
 361 /*
 362  * The extra standard macros that come from the object format, if
 363  * any.
 * While any_extrastdmac is set, read_line() continues with extrastdmac
 * after the last standard macro line and then clears the flag.
 * NOTE(review): any_extrastdmac is not static, so it is presumably
 * referenced from another file -- confirm before changing its linkage.
 364  */
 365 static const char * const *extrastdmac = NULL;
 366 bool any_extrastdmac;
 367
 368 /*
 369  * Tokens are allocated in blocks to improve speed
 * TOKEN_BLOCKSIZE is the number of Tokens new_Token() requests from
 * new_Block() at a time.  freeTokens heads the list of unused Tokens:
 * new_Token() takes from it and delete_Token() returns to it.
 370  */
 371 #define TOKEN_BLOCKSIZE 4096
 372 static Token *freeTokens = NULL;
 373 struct Blocks {
 374     Blocks *next;               /* next node; the last node is an empty spare */
 375     void *chunk;                /* memory handed out by new_Block(), or NULL */
 376 };
 377
 378 static Blocks blocks = { NULL, NULL };  /* static list head: never heap-allocated, never freed */
 379
 380 /*
 381  * Forward declarations.
 382  */
 383 static Token *expand_mmac_params(Token * tline);       /* expands %1 etc. */
 384 static Token *expand_smacro(Token * tline);            /* expands single-line macros */
 385 static Token *expand_id(Token * tline);
 386 static Context *get_ctx(char *name, bool all_contexts);
 387 static void make_tok_num(Token * tok, int64_t val);
 388 static void error(int severity, const char *fmt, ...); /* printf-style reporting, e.g. error(ERR_WARNING, ...) */
 389 static void *new_Block(size_t size);                   /* allocate a managed chunk */
 390 static void delete_Blocks(void);                       /* free every managed chunk */
 391 static Token *new_Token(Token * next, enum pp_token_type type, char *text, int txtlen);
 392 static Token *delete_Token(Token * t);                 /* recycles t, returns t->next */
 393
 394 /*
 395  * Macros for safe checking of token pointers, avoid *(NULL)
 396  */
 397 #define tok_type_(x,t) ((x) && (x)->type == (t))
 398 #define skip_white_(x) if (tok_type_((x), TOK_WHITESPACE)) (x)=(x)->next
 399 #define tok_is_(x,v) (tok_type_((x), TOK_OTHER) && !strcmp((x)->text,(v)))
 400 #define tok_isnt_(x,v) ((x) && ((x)->type!=TOK_OTHER || strcmp((x)->text,(v))))
 401
 402 /* Handle TASM specific directives, which do not contain a % in
 403  * front of them. We do it here because I could not find any other
 404  * place to do it for the moment, and it is a hack (ideally it would
 405  * be nice to be able to use the NASM pre-processor to do it).
 406  */
 407 static char *check_tasm_directive(char *line)
 408 {
 409     int32_t i, j, k, m, len;
 410     char *p = line, *oldline, oldchar;
 411
 412     /* Skip whitespace */
 413     while (isspace(*p) && *p != 0)
 414         p++;
 415
 416     /* Binary search for the directive name */
 417     i = -1;
 418     j = elements(tasm_directives);
 419     len = 0;
 420     while (!isspace(p[len]) && p[len] != 0)
 421         len++;
 422     if (len) {
 423         oldchar = p[len];
 424         p[len] = 0;
 425         while (j - i > 1) {
 426             k = (j + i) / 2;
 427             m = nasm_stricmp(p, tasm_directives[k]);
 428             if (m == 0) {
 429                 /* We have found a directive, so jam a % in front of it
 430                  * so that NASM will then recognise it as one if it's own.
 431                  */
 432                 p[len] = oldchar;
 433                 len = strlen(p);
 434                 oldline = line;
 435                 line = nasm_malloc(len + 2);
 436                 line[0] = '%';
 437                 if (k == TM_IFDIFI) {
 438                     /* NASM does not recognise IFDIFI, so we convert it to
 439                      * %ifdef BOGUS. This is not used in NASM comaptible
 440                      * code, but does need to parse for the TASM macro
 441                      * package.
 442                      */
 443                     strcpy(line + 1, "ifdef BOGUS");
 444                 } else {
 445                     memcpy(line + 1, p, len + 1);
 446                 }
 447                 nasm_free(oldline);
 448                 return line;
 449             } else if (m < 0) {
 450                 j = k;
 451             } else
 452                 i = k;
 453         }
 454         p[len] = oldchar;
 455     }
 456     return line;
 457 }
 458
 459 /*
 460  * The pre-preprocessing stage... This function translates line
 461  * number indications as they emerge from GNU cpp (`# lineno "file"
 462  * flags') into NASM preprocessor line number indications (`%line
 463  * lineno file').
 464  */
 465 static char *prepreproc(char *line)
 466 {
 467     int lineno, fnlen;
 468     char *fname, *oldline;
 469
 470     if (line[0] == '#' && line[1] == ' ') {
 471         oldline = line;
 472         fname = oldline + 2;
 473         lineno = atoi(fname);
 474         fname += strspn(fname, "0123456789 ");
 475         if (*fname == '"')
 476             fname++;
 477         fnlen = strcspn(fname, "\"");
 478         line = nasm_malloc(20 + fnlen);
 479         snprintf(line, 20 + fnlen, "%%line %d %.*s", lineno, fnlen, fname);
 480         nasm_free(oldline);
 481     }
 482     if (tasm_compatible_mode)
 483         return check_tasm_directive(line);
 484     return line;
 485 }
 486
 487 /*
 488  * Free a linked list of tokens.
 489  */
 490 static void free_tlist(Token * list)
 491 {
 492     while (list) {
 493         list = delete_Token(list);
 494     }
 495 }
 496
 497 /*
 498  * Free a linked list of lines.
 499  */
 500 static void free_llist(Line * list)
 501 {
 502     Line *l;
 503     while (list) {
 504         l = list;
 505         list = list->next;
 506         free_tlist(l->first);
 507         nasm_free(l);
 508     }
 509 }
 510
 511 /*
 512  * Free an MMacro
 513  */
 514 static void free_mmacro(MMacro * m)
 515 {
 516     nasm_free(m->name);
 517     free_tlist(m->dlist);
 518     nasm_free(m->defaults);
 519     free_llist(m->expansion);
 520     nasm_free(m);
 521 }
 522
 523 /*
 524  * Free all currently defined macros, and free the hash tables
 525  */
 526 static void free_macros(void)
 527 {
 528     struct hash_tbl_node *it;
 529     const char *key;
 530     SMacro *s;
 531     MMacro *m;
 532
 533     it = NULL;
 534     while ((s = hash_iterate(smacros, &it, &key)) != NULL) {
 535         nasm_free((void *)key);
 536         while (s) {
 537             SMacro *ns = s->next;
 538             nasm_free(s->name);
 539             free_tlist(s->expansion);
 540             nasm_free(s);
 541             s = ns;
 542         }
 543     }
 544     hash_free(smacros);
 545
 546     it = NULL;
 547     while ((m = hash_iterate(mmacros, &it, &key)) != NULL) {
 548         nasm_free((void *)key);
 549         while (m) {
 550             MMacro *nm = m->next;
 551             free_mmacro(m);
 552             m = nm;
 553         }
 554     }
 555     hash_free(mmacros);
 556 }
 557
 558 /*
 559  * Initialize the hash tables
 560  */
 561 static void init_macros(void)
 562 {
 563     smacros = hash_init();
 564     mmacros = hash_init();
 565 }
 566
 567 /*
 568  * Pop the context stack.
 569  */
 570 static void ctx_pop(void)
 571 {
 572     Context *c = cstk;
 573     SMacro *smac, *s;
 574
 575     cstk = cstk->next;
 576     smac = c->localmac;
 577     while (smac) {
 578         s = smac;
 579         smac = smac->next;
 580         nasm_free(s->name);
 581         free_tlist(s->expansion);
 582         nasm_free(s);
 583     }
 584     nasm_free(c->name);
 585     nasm_free(c);
 586 }
 587
 588 #define BUF_DELTA 512
 589 /*
 590  * Read a line from the top file in istk, handling multiple CR/LFs
 591  * at the end of the line read, and handling spurious ^Zs. Will
 592  * return lines from the standard macro set if this has not already
 593  * been done.
 594  */
 595 static char *read_line(void)
 596 {
 597     char *buffer, *p, *q;
 598     int bufsize, continued_count;
 599
 600     if (stdmacpos) {
 601         if (*stdmacpos) {
 602             char *ret = nasm_strdup(*stdmacpos++);
 603             if (!*stdmacpos && any_extrastdmac) {
 604                 stdmacpos = extrastdmac;
 605                 any_extrastdmac = false;
 606                 return ret;
 607             }
 608             /*
 609              * Nasty hack: here we push the contents of `predef' on
 610              * to the top-level expansion stack, since this is the
 611              * most convenient way to implement the pre-include and
 612              * pre-define features.
 613              */
 614             if (!*stdmacpos) {
 615                 Line *pd, *l;
 616                 Token *head, **tail, *t;
 617
 618                 for (pd = predef; pd; pd = pd->next) {
 619                     head = NULL;
 620                     tail = &head;
 621                     for (t = pd->first; t; t = t->next) {
 622                         *tail = new_Token(NULL, t->type, t->text, 0);
 623                         tail = &(*tail)->next;
 624                     }
 625                     l = nasm_malloc(sizeof(Line));
 626                     l->next = istk->expansion;
 627                     l->first = head;
 628                     l->finishes = false;
 629                     istk->expansion = l;
 630                 }
 631             }
 632             return ret;
 633         } else {
 634             stdmacpos = NULL;
 635         }
 636     }
 637
 638     bufsize = BUF_DELTA;
 639     buffer = nasm_malloc(BUF_DELTA);
 640     p = buffer;
 641     continued_count = 0;
 642     while (1) {
 643         q = fgets(p, bufsize - (p - buffer), istk->fp);
 644         if (!q)
 645             break;
 646         p += strlen(p);
 647         if (p > buffer && p[-1] == '\n') {
 648             /* Convert backslash-CRLF line continuation sequences into
 649                nothing at all (for DOS and Windows) */
 650             if (((p - 2) > buffer) && (p[-3] == '\\') && (p[-2] == '\r')) {
 651                 p -= 3;
 652                 *p = 0;
 653                 continued_count++;
 654             }
 655             /* Also convert backslash-LF line continuation sequences into
 656                nothing at all (for Unix) */
 657             else if (((p - 1) > buffer) && (p[-2] == '\\')) {
 658                 p -= 2;
 659                 *p = 0;
 660                 continued_count++;
 661             } else {
 662                 break;
 663             }
 664         }
 665         if (p - buffer > bufsize - 10) {
 666             int32_t offset = p - buffer;
 667             bufsize += BUF_DELTA;
 668             buffer = nasm_realloc(buffer, bufsize);
 669             p = buffer + offset;        /* prevent stale-pointer problems */
 670         }
 671     }
 672
 673     if (!q && p == buffer) {
 674         nasm_free(buffer);
 675         return NULL;
 676     }
 677
 678     src_set_linnum(src_get_linnum() + istk->lineinc +
 679                    (continued_count * istk->lineinc));
 680
 681     /*
 682      * Play safe: remove CRs as well as LFs, if any of either are
 683      * present at the end of the line.
 684      */
 685     while (--p >= buffer && (*p == '\n' || *p == '\r'))
 686         *p = '\0';
 687
 688     /*
 689      * Handle spurious ^Z, which may be inserted into source files
 690      * by some file transfer utilities.
 691      */
 692     buffer[strcspn(buffer, "\032")] = '\0';
 693
 694     list->line(LIST_READ, buffer);
 695
 696     return buffer;
 697 }
 698
 699 /*
 700  * Tokenize a line of text. This is a very simple process since we
 701  * don't need to parse the value out of e.g. numeric tokens: we
 702  * simply split one string into many.
 *
 * `line' is a NUL-terminated string. It may be modified in place: a
 * `%{name}' reference is rewritten so that the token text reads
 * `%name'. Token text is copied by new_Token(), so the returned list
 * does not point into `line'.
 *
 * Returns the head of a singly linked Token list in source order, or
 * NULL if the line yields no tokens. Comments, and whitespace that
 * directly precedes a comment or the end of the line, produce no
 * token. An unterminated string is reported with a warning and kept as
 * a TOK_STRING that runs to the end of the line.
 703  */
 704 static Token *tokenize(char *line)
 705 {
 706     char *p = line;
 707     enum pp_token_type type;
 708     Token *list = NULL;
 709     Token *t, **tail = &list;
 710
     /* Each pass: `line' is the start of the next token, `p' scans to its end */
 711     while (*line) {
 712         p = line;
 713         if (*p == '%') {
 714             p++;
             /* %<digits>, %+<digits>, %-<digits>, or a lone %+ */
 715             if (isdigit(*p) ||
 716                 ((*p == '-' || *p == '+') && isdigit(p[1])) ||
 717                 ((*p == '+') && (isspace(p[1]) || !p[1]))) {
 718                 do {
 719                     p++;
 720                 }
 721                 while (isdigit(*p));
 722                 type = TOK_PREPROC_ID;
 723             } else if (*p == '{') {
                 /*
                  * %{name}: slide the name one place to the left, over
                  * the `{', and terminate it there. new_Token() copies
                  * with strncpy, which stops at that NUL.
                  */
 724                 p++;
 725                 while (*p && *p != '}') {
 726                     p[-1] = *p;
 727                     p++;
 728                 }
 729                 p[-1] = '\0';
                 /* step over the closing brace, if there was one */
 730                 if (*p)
 731                     p++;
 732                 type = TOK_PREPROC_ID;
 733             } else if (isidchar(*p) ||
 734                        ((*p == '!' || *p == '%' || *p == '$') &&
 735                         isidchar(p[1]))) {
                 /* %name, %!name, %%name or %$name */
 736                 do {
 737                     p++;
 738                 }
 739                 while (isidchar(*p));
 740                 type = TOK_PREPROC_ID;
 741             } else {
                 /* a plain `%' or `%%' operator */
 742                 type = TOK_OTHER;
 743                 if (*p == '%')
 744                     p++;
 745             }
 746         } else if (isidstart(*p) || (*p == '$' && isidstart(p[1]))) {
 747             type = TOK_ID;
 748             p++;
 749             while (*p && isidchar(*p))
 750                 p++;
 751         } else if (*p == '\'' || *p == '"') {
 752             /*
 753              * A string token.
 * It ends at the next occurrence of the opening quote character;
 * no escape sequences are recognised here.
 754              */
 755             char c = *p;
 756             p++;
 757             type = TOK_STRING;
 758             while (*p && *p != c)
 759                 p++;
 760
 761             if (*p) {
 762                 p++;
 763             } else {
 764                 error(ERR_WARNING, "unterminated string");
 765                 /* Handling unterminated strings by UNV */
 766                 /* type = -1; */
 767             }
 768         } else if (isnumstart(*p)) {
 769             bool is_hex = false;
 770             bool is_float = false;
 771             bool has_e = false;
 772             char c, *r;
 773
 774             /*
 775              * A numeric token.
 776              */
 777
 778             if (*p == '$') {
 779                 p++;
 780                 is_hex = true;
 781             }
 782
             /* The loop always reads one character too many; see the p-- below */
 783             for (;;) {
 784                 c = *p++;
 785
 786                 if (!is_hex && (c == 'e' || c == 'E')) {
 787                     has_e = true;
 788                     if (*p == '+' || *p == '-') {
 789                         /* e can only be followed by +/- if it is either a
 790                            prefixed hex number or a floating-point number */
 791                         p++;
 792                         is_float = true;
 793                     }
 794                 } else if (c == 'H' || c == 'h' || c == 'X' || c == 'x') {
 795                     is_hex = true;
 796                 } else if (c == 'P' || c == 'p') {
 797                     is_float = true;
 798                     if (*p == '+' || *p == '-')
 799                         p++;
 800                 } else if (isnumchar(c) || c == '_')
 801                     ; /* just advance */
 802                 else if (c == '.') {
 803                     /* we need to deal with consequences of the legacy
 804                        parser, like "1.nolist" being two tokens
 805                        (TOK_NUMBER, TOK_ID) here; at least give it
 806                        a shot for now.  In the future, we probably need
 807                        a flex-based scanner with proper pattern matching
 808                        to do it as well as it can be done.  Nothing in
 809                        the world is going to help the person who wants
 810                        0x123.p16 interpreted as two tokens, though. */
 811                     r = p;
 812                     while (*r == '_')
 813                         r++;
 814
 815                     if (isdigit(*r) || (is_hex && isxdigit(*r)) ||
 816                         (!is_hex && (*r == 'e' || *r == 'E')) ||
 817                         (*r == 'p' || *r == 'P')) {
 818                         p = r;
 819                         is_float = true;
 820                     } else
 821                         break;  /* Terminate the token */
 822                 } else
 823                     break;
 824             }
 825             p--;        /* Point to first character beyond number */
 826
 827             if (has_e && !is_hex) {
 828                 /* 1e13 is floating-point, but 1e13h is not */
 829                 is_float = true;
 830             }
 831
 832             type = is_float ? TOK_FLOAT : TOK_NUMBER;
 833         } else if (isspace(*p)) {
 834             type = TOK_WHITESPACE;
 835             p++;
 836             while (*p && isspace(*p))
 837                 p++;
 838             /*
 839              * Whitespace just before end-of-line is discarded by
 840              * pretending it's a comment; whitespace just before a
 841              * comment gets lumped into the comment.
 842              */
 843             if (!*p || *p == ';') {
 844                 type = TOK_COMMENT;
 845                 while (*p)
 846                     p++;
 847             }
 848         } else if (*p == ';') {
             /* a comment runs to the end of the line */
 849             type = TOK_COMMENT;
 850             while (*p)
 851                 p++;
 852         } else {
 853             /*
 854              * Anything else is an operator of some kind. We check
 855              * for all the double-character operators (>>, <<, //,
 856              * %%, <=, >=, ==, !=, <>, &&, ||, ^^), but anything
 857              * else is a single-character operator.
 858              */
 859             type = TOK_OTHER;
 860             if ((p[0] == '>' && p[1] == '>') ||
 861                 (p[0] == '<' && p[1] == '<') ||
 862                 (p[0] == '/' && p[1] == '/') ||
 863                 (p[0] == '<' && p[1] == '=') ||
 864                 (p[0] == '>' && p[1] == '=') ||
 865                 (p[0] == '=' && p[1] == '=') ||
 866                 (p[0] == '!' && p[1] == '=') ||
 867                 (p[0] == '<' && p[1] == '>') ||
 868                 (p[0] == '&' && p[1] == '&') ||
 869                 (p[0] == '|' && p[1] == '|') ||
 870                 (p[0] == '^' && p[1] == '^')) {
 871                 p++;
 872             }
 873             p++;
 874         }
 875
 876         /* Handling unterminated string by UNV */
 877         /*if (type == -1)
 878            {
 879            *tail = t = new_Token(NULL, TOK_STRING, line, p-line+1);
 880            t->text[p-line] = *line;
 881            tail = &t->next;
 882            }
 883            else */
         /* Comments are dropped; every other token is appended to the list */
 884         if (type != TOK_COMMENT) {
 885             *tail = t = new_Token(NULL, type, line, p - line);
 886             tail = &t->next;
 887         }
 888         line = p;
 889     }
 890     return list;
 891 }
 892
 893 /*
 894  * this function allocates a new managed block of memory and
 895  * returns a pointer to the block.  The managed blocks are
 896  * deleted only all at once by the delete_Blocks function.
 897  */
 898 static void *new_Block(size_t size)
 899 {
 900     Blocks *b = &blocks;
 901
 902     /* first, get to the end of the linked list */
 903     while (b->next)
 904         b = b->next;
 905     /* now allocate the requested chunk */
 906     b->chunk = nasm_malloc(size);
 907
 908     /* now allocate a new block for the next request */
 909     b->next = nasm_malloc(sizeof(Blocks));
 910     /* and initialize the contents of the new block */
 911     b->next->next = NULL;
 912     b->next->chunk = NULL;
 913     return b->chunk;
 914 }
 915
 916 /*
 917  * this function deletes all managed blocks of memory
 918  */
 919 static void delete_Blocks(void)
 920 {
 921     Blocks *a, *b = &blocks;
 922
 923     /*
 924      * keep in mind that the first block, pointed to by blocks
 925      * is a static and not dynamically allocated, so we don't
 926      * free it.
 927      */
 928     while (b) {
 929         if (b->chunk)
 930             nasm_free(b->chunk);
 931         a = b;
 932         b = b->next;
 933         if (a != &blocks)
 934             nasm_free(a);
 935     }
 936 }
 937
 938 /*
 939  *  this function creates a new Token and passes a pointer to it
 940  *  back to the caller.  It sets the type and text elements, and
 941  *  also the mac and next elements to NULL.
 942  */
 943 static Token *new_Token(Token * next, enum pp_token_type type, char *text, int txtlen)
 944 {
 945     Token *t;
 946     int i;
 947
 948     if (freeTokens == NULL) {
 949         freeTokens = (Token *) new_Block(TOKEN_BLOCKSIZE * sizeof(Token));
 950         for (i = 0; i < TOKEN_BLOCKSIZE - 1; i++)
 951             freeTokens[i].next = &freeTokens[i + 1];
 952         freeTokens[i].next = NULL;
 953     }
 954     t = freeTokens;
 955     freeTokens = t->next;
 956     t->next = next;
 957     t->mac = NULL;
 958     t->type = type;
 959     if (type == TOK_WHITESPACE || text == NULL) {
 960         t->text = NULL;
 961     } else {
 962         if (txtlen == 0)
 963             txtlen = strlen(text);
 964         t->text = nasm_malloc(1 + txtlen);
 965         strncpy(t->text, text, txtlen);
 966         t->text[txtlen] = '\0';
 967     }
 968     return t;
 969 }
 970
 971 static Token *delete_Token(Token * t)
 972 {
 973     Token *next = t->next;
 974     nasm_free(t->text);
 975     t->next = freeTokens;
 976     freeTokens = t;
 977     return next;
 978 }
 979
 980 /*
 981  * Convert a line of tokens back into text.
 982  * If expand_locals is not zero, identifiers of the form "%$*xxx"
 983  * will be transformed into ..@ctxnum.xxx
 984  */
 985 static char *detoken(Token * tlist, int expand_locals)
 986 {
 987     Token *t;
 988     int len;
 989     char *line, *p;
 990     const char *q;
 991
 992     len = 0;
 993     for (t = tlist; t; t = t->next) {
 994         if (t->type == TOK_PREPROC_ID && t->text[1] == '!') {
 995             char *p = getenv(t->text + 2);
 996             nasm_free(t->text);
 997             if (p)
 998                 t->text = nasm_strdup(p);
 999             else
1000                 t->text = NULL;
1001         }
1002         /* Expand local macros here and not during preprocessing */
1003         if (expand_locals &&
1004             t->type == TOK_PREPROC_ID && t->text &&
1005             t->text[0] == '%' && t->text[1] == '$') {
1006             Context *ctx = get_ctx(t->text, false);
1007             if (ctx) {
1008                 char buffer[40];
1009                 char *p, *q = t->text + 2;
1010
1011                 q += strspn(q, "$");
1012                 snprintf(buffer, sizeof(buffer), "..@%"PRIu32".", ctx->number);
1013                 p = nasm_strcat(buffer, q);
1014                 nasm_free(t->text);
1015                 t->text = p;
1016             }
1017         }
1018         if (t->type == TOK_WHITESPACE) {
1019             len++;
1020         } else if (t->text) {
1021             len += strlen(t->text);
1022         }
1023     }
1024     p = line = nasm_malloc(len + 1);
1025     for (t = tlist; t; t = t->next) {
1026         if (t->type == TOK_WHITESPACE) {
1027             *p++ = ' ';
1028         } else if (t->text) {
1029             q = t->text;
1030             while (*q)
1031                 *p++ = *q++;
1032         }
1033     }
1034     *p = '\0';
1035     return line;
1036 }
1037
1038 /*
1039  * A scanner, suitable for use by the expression evaluator, which
1040  * operates on a line of Tokens. Expects a pointer to a pointer to
1041  * the first token in the line to be passed in as its private_data
1042  * field.
1043  *
1044  * FIX: This really needs to be unified with stdscan.
1045  */
1046 static int ppscan(void *private_data, struct tokenval *tokval)
1047 {
1048     Token **tlineptr = private_data;
1049     Token *tline;
1050     char ourcopy[MAX_KEYWORD+1], *p, *r, *s;
1051
1052     do {
1053         tline = *tlineptr;
1054         *tlineptr = tline ? tline->next : NULL;
1055     }
1056     while (tline && (tline->type == TOK_WHITESPACE ||
1057                      tline->type == TOK_COMMENT));
1058
1059     if (!tline)
1060         return tokval->t_type = TOKEN_EOS;
1061
1062     tokval->t_charptr = tline->text;
1063
1064     if (tline->text[0] == '$' && !tline->text[1])
1065         return tokval->t_type = TOKEN_HERE;
1066     if (tline->text[0] == '$' && tline->text[1] == '$' && !tline->text[2])
1067         return tokval->t_type = TOKEN_BASE;
1068
1069     if (tline->type == TOK_ID) {
1070         p = tokval->t_charptr = tline->text;
1071         if (p[0] == '$') {
1072             tokval->t_charptr++;
1073             return tokval->t_type = TOKEN_ID;
1074         }
1075
1076         for (r = p, s = ourcopy; *r; r++) {
1077             if (r > p+MAX_KEYWORD)
1078                 return tokval->t_type = TOKEN_ID; /* Not a keyword */
1079             *s++ = tolower(*r);
1080         }
1081         *s = '\0';
1082         /* right, so we have an identifier sitting in temp storage. now,
1083          * is it actually a register or instruction name, or what? */
1084         return nasm_token_hash(ourcopy, tokval);
1085     }
1086
1087     if (tline->type == TOK_NUMBER) {
1088         bool rn_error;
1089         tokval->t_integer = readnum(tline->text, &rn_error);
1090         if (rn_error)
1091             return tokval->t_type = TOKEN_ERRNUM;   /* some malformation occurred */
1092         tokval->t_charptr = tline->text;
1093         return tokval->t_type = TOKEN_NUM;
1094     }
1095
1096     if (tline->type == TOK_FLOAT) {
1097         return tokval->t_type = TOKEN_FLOAT;
1098     }
1099
1100     if (tline->type == TOK_STRING) {
1101         bool rn_warn;
1102         char q, *r;
1103         int l;
1104
1105         r = tline->text;
1106         q = *r++;
1107         l = strlen(r);
1108
1109         if (l == 0 || r[l - 1] != q)
1110             return tokval->t_type = TOKEN_ERRNUM;
1111         tokval->t_integer = readstrnum(r, l - 1, &rn_warn);
1112         if (rn_warn)
1113             error(ERR_WARNING | ERR_PASS1, "character constant too long");
1114         tokval->t_charptr = NULL;
1115         return tokval->t_type = TOKEN_NUM;
1116     }
1117
1118     if (tline->type == TOK_OTHER) {
1119         if (!strcmp(tline->text, "<<"))
1120             return tokval->t_type = TOKEN_SHL;
1121         if (!strcmp(tline->text, ">>"))
1122             return tokval->t_type = TOKEN_SHR;
1123         if (!strcmp(tline->text, "//"))
1124             return tokval->t_type = TOKEN_SDIV;
1125         if (!strcmp(tline->text, "%%"))
1126             return tokval->t_type = TOKEN_SMOD;
1127         if (!strcmp(tline->text, "=="))
1128             return tokval->t_type = TOKEN_EQ;
1129         if (!strcmp(tline->text, "<>"))
1130             return tokval->t_type = TOKEN_NE;
1131         if (!strcmp(tline->text, "!="))
1132             return tokval->t_type = TOKEN_NE;
1133         if (!strcmp(tline->text, "<="))
1134             return tokval->t_type = TOKEN_LE;
1135         if (!strcmp(tline->text, ">="))
1136             return tokval->t_type = TOKEN_GE;
1137         if (!strcmp(tline->text, "&&"))
1138             return tokval->t_type = TOKEN_DBL_AND;
1139         if (!strcmp(tline->text, "^^"))
1140             return tokval->t_type = TOKEN_DBL_XOR;
1141         if (!strcmp(tline->text, "||"))
1142             return tokval->t_type = TOKEN_DBL_OR;
1143     }
1144
1145     /*
1146      * We have no other options: just return the first character of
1147      * the token text.
1148      */
1149     return tokval->t_type = tline->text[0];
1150 }
1151
/*
 * Compare string `p' with the macro name `q'.  The comparison is
 * done with strcmp when `casesense' is true and with nasm_stricmp
 * otherwise; the result of whichever was called is returned.
 */
static int mstrcmp(const char *p, const char *q, bool casesense)
{
    if (casesense)
        return strcmp(p, q);

    return nasm_stricmp(p, q);
}
1161
1162 /*
1163  * Return the Context structure associated with a %$ token. Return
1164  * NULL, having _already_ reported an error condition, if the
1165  * context stack isn't deep enough for the supplied number of $
1166  * signs.
1167  * If all_contexts == true, contexts that enclose current are
1168  * also scanned for such smacro, until it is found; if not -
1169  * only the context that directly results from the number of $'s
1170  * in variable's name.
1171  */
1172 static Context *get_ctx(char *name, bool all_contexts)
1173 {
1174     Context *ctx;
1175     SMacro *m;
1176     int i;
1177
1178     if (!name || name[0] != '%' || name[1] != '$')
1179         return NULL;
1180
1181     if (!cstk) {
1182         error(ERR_NONFATAL, "`%s': context stack is empty", name);
1183         return NULL;
1184     }
1185
1186     for (i = strspn(name + 2, "$"), ctx = cstk; (i > 0) && ctx; i--) {
1187         ctx = ctx->next;
1188 /*        i--;  Lino - 02/25/02 */
1189     }
1190     if (!ctx) {
1191         error(ERR_NONFATAL, "`%s': context stack is only"
1192               " %d level%s deep", name, i - 1, (i == 2 ? "" : "s"));
1193         return NULL;
1194     }
1195     if (!all_contexts)
1196         return ctx;
1197
1198     do {
1199         /* Search for this smacro in found context */
1200         m = ctx->localmac;
1201         while (m) {
1202             if (!mstrcmp(m->name, name, m->casesense))
1203                 return ctx;
1204             m = m->next;
1205         }
1206         ctx = ctx->next;
1207     }
1208     while (ctx);
1209     return NULL;
1210 }
1211
1212 /*
1213  * Open an include file. This routine must always return a valid
1214  * file pointer if it returns - it's responsible for throwing an
1215  * ERR_FATAL and bombing out completely if not. It should also try
1216  * the include path one by one until it finds the file or reaches
1217  * the end of the path.
1218  */
1219 static FILE *inc_fopen(char *file)
1220 {
1221     FILE *fp;
1222     char *prefix = "", *combine;
1223     IncPath *ip = ipath;
1224     static int namelen = 0;
1225     int len = strlen(file);
1226
1227     while (1) {
1228         combine = nasm_malloc(strlen(prefix) + len + 1);
1229         strcpy(combine, prefix);
1230         strcat(combine, file);
1231         fp = fopen(combine, "r");
1232         if (pass == 0 && fp) {
1233             namelen += strlen(combine) + 1;
1234             if (namelen > 62) {
1235                 printf(" \\\n  ");
1236                 namelen = 2;
1237             }
1238             printf(" %s", combine);
1239         }
1240         nasm_free(combine);
1241         if (fp)
1242             return fp;
1243         if (!ip)
1244             break;
1245         prefix = ip->path;
1246         ip = ip->next;
1247
1248         if (!prefix) {
1249                 /* -MG given and file not found */
1250                 if (pass == 0) {
1251                         namelen += strlen(file) + 1;
1252                         if (namelen > 62) {
1253                                 printf(" \\\n  ");
1254                                 namelen = 2;
1255                         }
1256                         printf(" %s", file);
1257                 }
1258             return NULL;
1259         }
1260     }
1261
1262     error(ERR_FATAL, "unable to open include file `%s'", file);
1263     return NULL;                /* never reached - placate compilers */
1264 }
1265
1266 /*
1267  * Search for a key in the hash index; adding it if necessary
1268  * (in which case we initialize the data pointer to NULL.)
1269  */
1270 static void **
1271 hash_findi_add(struct hash_table *hash, const char *str)
1272 {
1273     struct hash_insert hi;
1274     void **r;
1275     char *strx;
1276
1277     r = hash_findi(hash, str, &hi);
1278     if (r)
1279         return r;
1280
1281     strx = nasm_strdup(str);    /* Use a more efficient allocator here? */
1282     return hash_add(&hi, strx, NULL);
1283 }
1284
/*
 * Like hash_findi, but hands back the data element itself instead
 * of a pointer to it, or NULL when the key is not found.  It never
 * adds an element, which is why hash_findi is given NULL as its
 * third argument.
 */
static void *
hash_findix(struct hash_table *hash, const char *str)
{
    void **slot = hash_findi(hash, str, NULL);

    if (!slot)
        return NULL;

    return *slot;
}
1298
1299 /*
1300  * Determine if we should warn on defining a single-line macro of
1301  * name `name', with `nparam' parameters. If nparam is 0 or -1, will
1302  * return true if _any_ single-line macro of that name is defined.
1303  * Otherwise, will return true if a single-line macro with either
1304  * `nparam' or no parameters is defined.
1305  *
1306  * If a macro with precisely the right number of parameters is
1307  * defined, or nparam is -1, the address of the definition structure
1308  * will be returned in `defn'; otherwise NULL will be returned. If `defn'
1309  * is NULL, no action will be taken regarding its contents, and no
1310  * error will occur.
1311  *
1312  * Note that this is also called with nparam zero to resolve
1313  * `ifdef'.
1314  *
1315  * If you already know which context macro belongs to, you can pass
1316  * the context pointer as first parameter; if you won't but name begins
1317  * with %$ the context will be automatically computed. If all_contexts
1318  * is true, macro will be searched in outer contexts as well.
1319  */
1320 static bool
1321 smacro_defined(Context * ctx, char *name, int nparam, SMacro ** defn,
1322                bool nocase)
1323 {
1324     SMacro *m;
1325
1326     if (ctx) {
1327         m = ctx->localmac;
1328     } else if (name[0] == '%' && name[1] == '$') {
1329         if (cstk)
1330             ctx = get_ctx(name, false);
1331         if (!ctx)
1332             return false;       /* got to return _something_ */
1333         m = ctx->localmac;
1334     } else {
1335         m = (SMacro *) hash_findix(smacros, name);
1336     }
1337
1338     while (m) {
1339         if (!mstrcmp(m->name, name, m->casesense && nocase) &&
1340             (nparam <= 0 || m->nparam == 0 || nparam == (int) m->nparam)) {
1341             if (defn) {
1342                 if (nparam == (int) m->nparam || nparam == -1)
1343                     *defn = m;
1344                 else
1345                     *defn = NULL;
1346             }
1347             return true;
1348         }
1349         m = m->next;
1350     }
1351
1352     return false;
1353 }
1354
1355 /*
1356  * Count and mark off the parameters in a multi-line macro call.
1357  * This is called both from within the multi-line macro expansion
1358  * code, and also to mark off the default parameters when provided
1359  * in a %macro definition line.
1360  */
1361 static void count_mmac_params(Token * t, int *nparam, Token *** params)
1362 {
1363     int paramsize, brace;
1364
1365     *nparam = paramsize = 0;
1366     *params = NULL;
1367     while (t) {
1368         if (*nparam >= paramsize) {
1369             paramsize += PARAM_DELTA;
1370             *params = nasm_realloc(*params, sizeof(**params) * paramsize);
1371         }
1372         skip_white_(t);
1373         brace = false;
1374         if (tok_is_(t, "{"))
1375             brace = true;
1376         (*params)[(*nparam)++] = t;
1377         while (tok_isnt_(t, brace ? "}" : ","))
1378             t = t->next;
1379         if (t) {                /* got a comma/brace */
1380             t = t->next;
1381             if (brace) {
1382                 /*
1383                  * Now we've found the closing brace, look further
1384                  * for the comma.
1385                  */
1386                 skip_white_(t);
1387                 if (tok_isnt_(t, ",")) {
1388                     error(ERR_NONFATAL,
1389                           "braces do not enclose all of macro parameter");
1390                     while (tok_isnt_(t, ","))
1391                         t = t->next;
1392                 }
1393                 if (t)
1394                     t = t->next;        /* eat the comma */
1395             }
1396         }
1397     }
1398 }
1399
1400 /*
1401  * Determine whether one of the various `if' conditions is true or
1402  * not.
1403  *
1404  * We must free the tline we get passed.
1405  */
1406 static bool if_condition(Token * tline, enum preproc_token ct)
1407 {
1408     enum pp_conditional i = PP_COND(ct);
1409     bool j;
1410     Token *t, *tt, **tptr, *origline;
1411     struct tokenval tokval;
1412     expr *evalresult;
1413     enum pp_token_type needtype;
1414
1415     origline = tline;
1416
1417     switch (i) {
1418     case PPC_IFCTX:
1419         j = false;              /* have we matched yet? */
1420         while (cstk && tline) {
1421             skip_white_(tline);
1422             if (!tline || tline->type != TOK_ID) {
1423                 error(ERR_NONFATAL,
1424                       "`%s' expects context identifiers", pp_directives[ct]);
1425                 free_tlist(origline);
1426                 return -1;
1427             }
1428             if (!nasm_stricmp(tline->text, cstk->name))
1429                 j = true;
1430             tline = tline->next;
1431         }
1432         break;
1433
1434     case PPC_IFDEF:
1435         j = false;              /* have we matched yet? */
1436         while (tline) {
1437             skip_white_(tline);
1438             if (!tline || (tline->type != TOK_ID &&
1439                            (tline->type != TOK_PREPROC_ID ||
1440                             tline->text[1] != '$'))) {
1441                 error(ERR_NONFATAL,
1442                       "`%s' expects macro identifiers", pp_directives[ct]);
1443                 goto fail;
1444             }
1445             if (smacro_defined(NULL, tline->text, 0, NULL, true))
1446                 j = true;
1447             tline = tline->next;
1448         }
1449         break;
1450
1451     case PPC_IFIDN:
1452     case PPC_IFIDNI:
1453         tline = expand_smacro(tline);
1454         t = tt = tline;
1455         while (tok_isnt_(tt, ","))
1456             tt = tt->next;
1457         if (!tt) {
1458             error(ERR_NONFATAL,
1459                   "`%s' expects two comma-separated arguments",
1460                   pp_directives[ct]);
1461             goto fail;
1462         }
1463         tt = tt->next;
1464         j = true;               /* assume equality unless proved not */
1465         while ((t->type != TOK_OTHER || strcmp(t->text, ",")) && tt) {
1466             if (tt->type == TOK_OTHER && !strcmp(tt->text, ",")) {
1467                 error(ERR_NONFATAL, "`%s': more than one comma on line",
1468                       pp_directives[ct]);
1469                 goto fail;
1470             }
1471             if (t->type == TOK_WHITESPACE) {
1472                 t = t->next;
1473                 continue;
1474             }
1475             if (tt->type == TOK_WHITESPACE) {
1476                 tt = tt->next;
1477                 continue;
1478             }
1479             if (tt->type != t->type) {
1480                 j = false;      /* found mismatching tokens */
1481                 break;
1482             }
1483             /* Unify surrounding quotes for strings */
1484             if (t->type == TOK_STRING) {
1485                 tt->text[0] = t->text[0];
1486                 tt->text[strlen(tt->text) - 1] = t->text[0];
1487             }
1488             if (mstrcmp(tt->text, t->text, i == PPC_IFIDN) != 0) {
1489                 j = false;      /* found mismatching tokens */
1490                 break;
1491             }
1492
1493             t = t->next;
1494             tt = tt->next;
1495         }
1496         if ((t->type != TOK_OTHER || strcmp(t->text, ",")) || tt)
1497             j = false;          /* trailing gunk on one end or other */
1498         break;
1499
1500     case PPC_IFMACRO:
1501         {
1502             bool found = false;
1503             MMacro searching, *mmac;
1504
1505             tline = tline->next;
1506             skip_white_(tline);
1507             tline = expand_id(tline);
1508             if (!tok_type_(tline, TOK_ID)) {
1509                 error(ERR_NONFATAL,
1510                       "`%s' expects a macro name", pp_directives[ct]);
1511                 goto fail;
1512             }
1513             searching.name = nasm_strdup(tline->text);
1514             searching.casesense = true;
1515             searching.plus = false;
1516             searching.nolist = false;
1517             searching.in_progress = 0;
1518             searching.rep_nest = NULL;
1519             searching.nparam_min = 0;
1520             searching.nparam_max = INT_MAX;
1521             tline = expand_smacro(tline->next);
1522             skip_white_(tline);
1523             if (!tline) {
1524             } else if (!tok_type_(tline, TOK_NUMBER)) {
1525                 error(ERR_NONFATAL,
1526                       "`%s' expects a parameter count or nothing",
1527                       pp_directives[ct]);
1528             } else {
1529                 searching.nparam_min = searching.nparam_max =
1530                     readnum(tline->text, &j);
1531                 if (j)
1532                     error(ERR_NONFATAL,
1533                           "unable to parse parameter count `%s'",
1534                           tline->text);
1535             }
1536             if (tline && tok_is_(tline->next, "-")) {
1537                 tline = tline->next->next;
1538                 if (tok_is_(tline, "*"))
1539                     searching.nparam_max = INT_MAX;
1540                 else if (!tok_type_(tline, TOK_NUMBER))
1541                     error(ERR_NONFATAL,
1542                           "`%s' expects a parameter count after `-'",
1543                           pp_directives[ct]);
1544                 else {
1545                     searching.nparam_max = readnum(tline->text, &j);
1546                     if (j)
1547                         error(ERR_NONFATAL,
1548                               "unable to parse parameter count `%s'",
1549                               tline->text);
1550                     if (searching.nparam_min > searching.nparam_max)
1551                         error(ERR_NONFATAL,
1552                               "minimum parameter count exceeds maximum");
1553                 }
1554             }
1555             if (tline && tok_is_(tline->next, "+")) {
1556                 tline = tline->next;
1557                 searching.plus = true;
1558             }
1559             mmac = (MMacro *) hash_findix(mmacros, searching.name);
1560             while (mmac) {
1561                 if (!strcmp(mmac->name, searching.name) &&
1562                     (mmac->nparam_min <= searching.nparam_max
1563                      || searching.plus)
1564                     && (searching.nparam_min <= mmac->nparam_max
1565                         || mmac->plus)) {
1566                     found = true;
1567                     break;
1568                 }
1569                 mmac = mmac->next;
1570             }
1571             nasm_free(searching.name);
1572             j = found;
1573             break;
1574         }
1575
1576     case PPC_IFID:
1577         needtype = TOK_ID;
1578         goto iftype;
1579     case PPC_IFNUM:
1580         needtype = TOK_NUMBER;
1581         goto iftype;
1582     case PPC_IFSTR:
1583         needtype = TOK_STRING;
1584         goto iftype;
1585
1586     iftype:
1587         tline = expand_smacro(tline);
1588         t = tline;
1589
1590         while (tok_type_(t, TOK_WHITESPACE) ||
1591                (needtype == TOK_NUMBER &&
1592                 tok_type_(t, TOK_OTHER) &&
1593                 (t->text[0] == '-' || t->text[0] == '+') &&
1594                 !t->text[1]))
1595             t = t->next;
1596
1597         j = t && t->type == needtype;
1598         break;
1599
1600     case PPC_IF:
1601         t = tline = expand_smacro(tline);
1602         tptr = &t;
1603         tokval.t_type = TOKEN_INVALID;
1604         evalresult = evaluate(ppscan, tptr, &tokval,
1605                               NULL, pass | CRITICAL, error, NULL);
1606         if (!evalresult)
1607             return -1;
1608         if (tokval.t_type)
1609             error(ERR_WARNING,
1610                   "trailing garbage after expression ignored");
1611         if (!is_simple(evalresult)) {
1612             error(ERR_NONFATAL,
1613                   "non-constant value given to `%s'", pp_directives[ct]);
1614             goto fail;
1615         }
1616         j = reloc_value(evalresult) != 0;
1617         return j;
1618
1619     default:
1620         error(ERR_FATAL,
1621               "preprocessor directive `%s' not yet implemented",
1622               pp_directives[ct]);
1623         goto fail;
1624     }
1625
1626     free_tlist(origline);
1627     return j ^ PP_NEGATIVE(ct);
1628
1629 fail:
1630     free_tlist(origline);
1631     return -1;
1632 }
1633
1634 /*
1635  * Expand macros in a string. Used in %error and %include directives.
1636  * First tokenize the string, apply "expand_smacro" and then de-tokenize back.
1637  * The returned variable should ALWAYS be freed after usage.
1638  */
1639 void expand_macros_in_string(char **p)
1640 {
1641     Token *line = tokenize(*p);
1642     line = expand_smacro(line);
1643     *p = detoken(line, false);
1644 }
1645
1646 /*
1647  * Common code for defining an smacro
1648  */
1649 static bool define_smacro(Context *ctx, char *mname, bool casesense,
1650                           int nparam, Token *expansion)
1651 {
1652     SMacro *smac, **smhead;
1653
1654     if (smacro_defined(ctx, mname, nparam, &smac, casesense)) {
1655         if (!smac) {
1656             error(ERR_WARNING,
1657                   "single-line macro `%s' defined both with and"
1658                   " without parameters", mname);
1659
1660             /* Some instances of the old code considered this a failure,
1661                some others didn't.  What is the right thing to do here? */
1662             free_tlist(expansion);
1663             return false;       /* Failure */
1664         } else {
1665             /*
1666              * We're redefining, so we have to take over an
1667              * existing SMacro structure. This means freeing
1668              * what was already in it.
1669              */
1670             nasm_free(smac->name);
1671             free_tlist(smac->expansion);
1672         }
1673     } else {
1674         if (!ctx)
1675             smhead = (SMacro **) hash_findi_add(smacros, mname);
1676         else
1677             smhead = &ctx->localmac;
1678
1679         smac = nasm_malloc(sizeof(SMacro));
1680         smac->next = *smhead;
1681         *smhead = smac;
1682     }
1683     smac->name = nasm_strdup(mname);
1684     smac->casesense = casesense;
1685     smac->nparam = nparam;
1686     smac->expansion = expansion;
1687     smac->in_progress = false;
1688     return true;                /* Success */
1689 }
1690
1691 /*
1692  * Undefine an smacro
1693  */
1694 static void undef_smacro(Context *ctx, const char *mname)
1695 {
1696     SMacro **smhead, *s, **sp;
1697
1698     if (!ctx)
1699         smhead = (SMacro **) hash_findi(smacros, mname, NULL);
1700     else
1701         smhead = &ctx->localmac;
1702
1703     if (smhead) {
1704         /*
1705          * We now have a macro name... go hunt for it.
1706          */
1707         sp = smhead;
1708         while ((s = *sp) != NULL) {
1709             if (!mstrcmp(s->name, mname, s->casesense)) {
1710                 *sp = s->next;
1711                 nasm_free(s->name);
1712                 free_tlist(s->expansion);
1713                 nasm_free(s);
1714             } else {
1715                 sp = &s->next;
1716             }
1717         }
1718     }
1719 }
1720
/*
 * Decode a size directive: translate a size name into the value
 * paired with it in the tables below.  The index returned by bsii
 * is offset by one, so sizes[0] is the result when bsii returns -1
 * (presumably its "no match" value - confirm against bsii).
 */
static int parse_size(const char *str) {
    /* size_names[k] is paired with sizes[k + 1] */
    static const char *size_names[] = {
        "byte", "dword", "oword", "qword", "tword", "word"
    };
    static const int sizes[] = {
        0, 1, 4, 16, 8, 10, 2
    };
    int idx;

    idx = bsii(str, size_names, elements(size_names));
    return sizes[idx + 1];
}
1732
1733 /**
1734  * find and process preprocessor directive in passed line
1735  * Find out if a line contains a preprocessor directive, and deal
1736  * with it if so.
1737  *
1738  * If a directive _is_ found, it is the responsibility of this routine
1739  * (and not the caller) to free_tlist() the line.
1740  *
 * @param tline a pointer to the current tokenized line linked list
1742  * @return DIRECTIVE_FOUND or NO_DIRECTIVE_FOUND
1743  *
1744  */
1745 static int do_directive(Token * tline)
1746 {
1747     enum preproc_token i;
1748     int j;
1749     bool err;
1750     int nparam;
1751     bool nolist;
1752     bool casesense;
1753     int k, m;
1754     int offset;
1755     char *p, *mname;
1756     Include *inc;
1757     Context *ctx;
1758     Cond *cond;
1759     MMacro *mmac, **mmhead;
1760     Token *t, *tt, *param_start, *macro_start, *last, **tptr, *origline;
1761     Line *l;
1762     struct tokenval tokval;
1763     expr *evalresult;
1764     MMacro *tmp_defining;       /* Used when manipulating rep_nest */
1765     int64_t count;
1766
1767     origline = tline;
1768
1769     skip_white_(tline);
1770     if (!tok_type_(tline, TOK_PREPROC_ID) ||
1771         (tline->text[1] == '%' || tline->text[1] == '$'
1772          || tline->text[1] == '!'))
1773         return NO_DIRECTIVE_FOUND;
1774
1775     i = pp_token_hash(tline->text);
1776
1777     /*
1778      * If we're in a non-emitting branch of a condition construct,
1779      * or walking to the end of an already terminated %rep block,
1780      * we should ignore all directives except for condition
1781      * directives.
1782      */
1783     if (((istk->conds && !emitting(istk->conds->state)) ||
1784          (istk->mstk && !istk->mstk->in_progress)) && !is_condition(i)) {
1785         return NO_DIRECTIVE_FOUND;
1786     }
1787
1788     /*
1789      * If we're defining a macro or reading a %rep block, we should
1790      * ignore all directives except for %macro/%imacro (which
1791      * generate an error), %endm/%endmacro, and (only if we're in a
1792      * %rep block) %endrep. If we're in a %rep block, another %rep
1793      * causes an error, so should be let through.
1794      */
1795     if (defining && i != PP_MACRO && i != PP_IMACRO &&
1796         i != PP_ENDMACRO && i != PP_ENDM &&
1797         (defining->name || (i != PP_ENDREP && i != PP_REP))) {
1798         return NO_DIRECTIVE_FOUND;
1799     }
1800
1801     switch (i) {
1802     case PP_INVALID:
1803         error(ERR_NONFATAL, "unknown preprocessor directive `%s'",
1804               tline->text);
1805         return NO_DIRECTIVE_FOUND;      /* didn't get it */
1806
1807     case PP_STACKSIZE:
1808         /* Directive to tell NASM what the default stack size is. The
1809          * default is for a 16-bit stack, and this can be overriden with
1810          * %stacksize large.
1811          * the following form:
1812          *
1813          *      ARG arg1:WORD, arg2:DWORD, arg4:QWORD
1814          */
1815         tline = tline->next;
1816         if (tline && tline->type == TOK_WHITESPACE)
1817             tline = tline->next;
1818         if (!tline || tline->type != TOK_ID) {
1819             error(ERR_NONFATAL, "`%%stacksize' missing size parameter");
1820             free_tlist(origline);
1821             return DIRECTIVE_FOUND;
1822         }
1823         if (nasm_stricmp(tline->text, "flat") == 0) {
1824             /* All subsequent ARG directives are for a 32-bit stack */
1825             StackSize = 4;
1826             StackPointer = "ebp";
1827             ArgOffset = 8;
1828             LocalOffset = 0;
1829         } else if (nasm_stricmp(tline->text, "flat64") == 0) {
1830             /* All subsequent ARG directives are for a 64-bit stack */
1831             StackSize = 8;
1832             StackPointer = "rbp";
1833             ArgOffset = 8;
1834             LocalOffset = 0;
1835         } else if (nasm_stricmp(tline->text, "large") == 0) {
1836             /* All subsequent ARG directives are for a 16-bit stack,
1837              * far function call.
1838              */
1839             StackSize = 2;
1840             StackPointer = "bp";
1841             ArgOffset = 4;
1842             LocalOffset = 0;
1843         } else if (nasm_stricmp(tline->text, "small") == 0) {
1844             /* All subsequent ARG directives are for a 16-bit stack,
1845              * far function call. We don't support near functions.
1846              */
1847             StackSize = 2;
1848             StackPointer = "bp";
1849             ArgOffset = 6;
1850             LocalOffset = 0;
1851         } else {
1852             error(ERR_NONFATAL, "`%%stacksize' invalid size type");
1853             free_tlist(origline);
1854             return DIRECTIVE_FOUND;
1855         }
1856         free_tlist(origline);
1857         return DIRECTIVE_FOUND;
1858
1859     case PP_ARG:
1860         /* TASM like ARG directive to define arguments to functions, in
1861          * the following form:
1862          *
1863          *      ARG arg1:WORD, arg2:DWORD, arg4:QWORD
1864          */
1865         offset = ArgOffset;
1866         do {
1867             char *arg, directive[256];
1868             int size = StackSize;
1869
1870             /* Find the argument name */
1871             tline = tline->next;
1872             if (tline && tline->type == TOK_WHITESPACE)
1873                 tline = tline->next;
1874             if (!tline || tline->type != TOK_ID) {
1875                 error(ERR_NONFATAL, "`%%arg' missing argument parameter");
1876                 free_tlist(origline);
1877                 return DIRECTIVE_FOUND;
1878             }
1879             arg = tline->text;
1880
1881             /* Find the argument size type */
1882             tline = tline->next;
1883             if (!tline || tline->type != TOK_OTHER
1884                 || tline->text[0] != ':') {
1885                 error(ERR_NONFATAL,
1886                       "Syntax error processing `%%arg' directive");
1887                 free_tlist(origline);
1888                 return DIRECTIVE_FOUND;
1889             }
1890             tline = tline->next;
1891             if (!tline || tline->type != TOK_ID) {
1892                 error(ERR_NONFATAL, "`%%arg' missing size type parameter");
1893                 free_tlist(origline);
1894                 return DIRECTIVE_FOUND;
1895             }
1896
1897             /* Allow macro expansion of type parameter */
1898             tt = tokenize(tline->text);
1899             tt = expand_smacro(tt);
1900             size = parse_size(tt->text);
1901             if (!size) {
1902                 error(ERR_NONFATAL,
1903                       "Invalid size type for `%%arg' missing directive");
1904                 free_tlist(tt);
1905                 free_tlist(origline);
1906                 return DIRECTIVE_FOUND;
1907             }
1908             free_tlist(tt);
1909
1910             /* Round up to even stack slots */
1911             size = (size+StackSize-1) & ~(StackSize-1);
1912
1913             /* Now define the macro for the argument */
1914             snprintf(directive, sizeof(directive), "%%define %s (%s+%d)",
1915                      arg, StackPointer, offset);
1916             do_directive(tokenize(directive));
1917             offset += size;
1918
1919             /* Move to the next argument in the list */
1920             tline = tline->next;
1921             if (tline && tline->type == TOK_WHITESPACE)
1922                 tline = tline->next;
1923         } while (tline && tline->type == TOK_OTHER && tline->text[0] == ',');
1924         ArgOffset = offset;
1925         free_tlist(origline);
1926         return DIRECTIVE_FOUND;
1927
1928     case PP_LOCAL:
1929         /* TASM like LOCAL directive to define local variables for a
1930          * function, in the following form:
1931          *
1932          *      LOCAL local1:WORD, local2:DWORD, local4:QWORD = LocalSize
1933          *
1934          * The '= LocalSize' at the end is ignored by NASM, but is
1935          * required by TASM to define the local parameter size (and used
1936          * by the TASM macro package).
1937          */
1938         offset = LocalOffset;
1939         do {
1940             char *local, directive[256];
1941             int size = StackSize;
1942
1943             /* Find the argument name */
1944             tline = tline->next;
1945             if (tline && tline->type == TOK_WHITESPACE)
1946                 tline = tline->next;
1947             if (!tline || tline->type != TOK_ID) {
1948                 error(ERR_NONFATAL,
1949                       "`%%local' missing argument parameter");
1950                 free_tlist(origline);
1951                 return DIRECTIVE_FOUND;
1952             }
1953             local = tline->text;
1954
1955             /* Find the argument size type */
1956             tline = tline->next;
1957             if (!tline || tline->type != TOK_OTHER
1958                 || tline->text[0] != ':') {
1959                 error(ERR_NONFATAL,
1960                       "Syntax error processing `%%local' directive");
1961                 free_tlist(origline);
1962                 return DIRECTIVE_FOUND;
1963             }
1964             tline = tline->next;
1965             if (!tline || tline->type != TOK_ID) {
1966                 error(ERR_NONFATAL,
1967                       "`%%local' missing size type parameter");
1968                 free_tlist(origline);
1969                 return DIRECTIVE_FOUND;
1970             }
1971
1972             /* Allow macro expansion of type parameter */
1973             tt = tokenize(tline->text);
1974             tt = expand_smacro(tt);
1975             size = parse_size(tt->text);
1976             if (!size) {
1977                 error(ERR_NONFATAL,
1978                       "Invalid size type for `%%local' missing directive");
1979                 free_tlist(tt);
1980                 free_tlist(origline);
1981                 return DIRECTIVE_FOUND;
1982             }
1983             free_tlist(tt);
1984
1985             /* Round up to even stack slots */
1986             size = (size+StackSize-1) & ~(StackSize-1);
1987
1988             offset += size;     /* Negative offset, increment before */
1989
1990             /* Now define the macro for the argument */
1991             snprintf(directive, sizeof(directive), "%%define %s (%s-%d)",
1992                      local, StackPointer, offset);
1993             do_directive(tokenize(directive));
1994
1995             /* Now define the assign to setup the enter_c macro correctly */
1996             snprintf(directive, sizeof(directive),
1997                      "%%assign %%$localsize %%$localsize+%d", size);
1998             do_directive(tokenize(directive));
1999
2000             /* Move to the next argument in the list */
2001             tline = tline->next;
2002             if (tline && tline->type == TOK_WHITESPACE)
2003                 tline = tline->next;
2004         } while (tline && tline->type == TOK_OTHER && tline->text[0] == ',');
2005         LocalOffset = offset;
2006         free_tlist(origline);
2007         return DIRECTIVE_FOUND;
2008
2009     case PP_CLEAR:
2010         if (tline->next)
2011             error(ERR_WARNING, "trailing garbage after `%%clear' ignored");
2012         free_macros();
2013         init_macros();
2014         free_tlist(origline);
2015         return DIRECTIVE_FOUND;
2016
2017     case PP_INCLUDE:
2018         tline = tline->next;
2019         skip_white_(tline);
2020         if (!tline || (tline->type != TOK_STRING &&
2021                        tline->type != TOK_INTERNAL_STRING)) {
2022             error(ERR_NONFATAL, "`%%include' expects a file name");
2023             free_tlist(origline);
2024             return DIRECTIVE_FOUND;     /* but we did _something_ */
2025         }
2026         if (tline->next)
2027             error(ERR_WARNING,
2028                   "trailing garbage after `%%include' ignored");
2029         if (tline->type != TOK_INTERNAL_STRING) {
2030             p = tline->text + 1;        /* point past the quote to the name */
2031             p[strlen(p) - 1] = '\0';    /* remove the trailing quote */
2032         } else
2033             p = tline->text;    /* internal_string is easier */
2034         expand_macros_in_string(&p);
2035         inc = nasm_malloc(sizeof(Include));
2036         inc->next = istk;
2037         inc->conds = NULL;
2038         inc->fp = inc_fopen(p);
2039         if (!inc->fp && pass == 0) {
2040             /* -MG given but file not found */
2041             nasm_free(inc);
2042         } else {
2043             inc->fname = src_set_fname(p);
2044             inc->lineno = src_set_linnum(0);
2045             inc->lineinc = 1;
2046             inc->expansion = NULL;
2047             inc->mstk = NULL;
2048             istk = inc;
2049             list->uplevel(LIST_INCLUDE);
2050         }
2051         free_tlist(origline);
2052         return DIRECTIVE_FOUND;
2053
2054     case PP_PUSH:
2055         tline = tline->next;
2056         skip_white_(tline);
2057         tline = expand_id(tline);
2058         if (!tok_type_(tline, TOK_ID)) {
2059             error(ERR_NONFATAL, "`%%push' expects a context identifier");
2060             free_tlist(origline);
2061             return DIRECTIVE_FOUND;     /* but we did _something_ */
2062         }
2063         if (tline->next)
2064             error(ERR_WARNING, "trailing garbage after `%%push' ignored");
2065         ctx = nasm_malloc(sizeof(Context));
2066         ctx->next = cstk;
2067         ctx->localmac = NULL;
2068         ctx->name = nasm_strdup(tline->text);
2069         ctx->number = unique++;
2070         cstk = ctx;
2071         free_tlist(origline);
2072         break;
2073
2074     case PP_REPL:
2075         tline = tline->next;
2076         skip_white_(tline);
2077         tline = expand_id(tline);
2078         if (!tok_type_(tline, TOK_ID)) {
2079             error(ERR_NONFATAL, "`%%repl' expects a context identifier");
2080             free_tlist(origline);
2081             return DIRECTIVE_FOUND;     /* but we did _something_ */
2082         }
2083         if (tline->next)
2084             error(ERR_WARNING, "trailing garbage after `%%repl' ignored");
2085         if (!cstk)
2086             error(ERR_NONFATAL, "`%%repl': context stack is empty");
2087         else {
2088             nasm_free(cstk->name);
2089             cstk->name = nasm_strdup(tline->text);
2090         }
2091         free_tlist(origline);
2092         break;
2093
2094     case PP_POP:
2095         if (tline->next)
2096             error(ERR_WARNING, "trailing garbage after `%%pop' ignored");
2097         if (!cstk)
2098             error(ERR_NONFATAL, "`%%pop': context stack is already empty");
2099         else
2100             ctx_pop();
2101         free_tlist(origline);
2102         break;
2103
2104     case PP_ERROR:
2105         tline->next = expand_smacro(tline->next);
2106         tline = tline->next;
2107         skip_white_(tline);
2108         if (tok_type_(tline, TOK_STRING)) {
2109             p = tline->text + 1;        /* point past the quote to the name */
2110             p[strlen(p) - 1] = '\0';    /* remove the trailing quote */
2111             expand_macros_in_string(&p);
2112             error(ERR_NONFATAL, "%s", p);
2113             nasm_free(p);
2114         } else {
2115             p = detoken(tline, false);
2116             error(ERR_WARNING, "%s", p);
2117             nasm_free(p);
2118         }
2119         free_tlist(origline);
2120         break;
2121
2122     CASE_PP_IF:
2123         if (istk->conds && !emitting(istk->conds->state))
2124             j = COND_NEVER;
2125         else {
2126             j = if_condition(tline->next, i);
2127             tline->next = NULL; /* it got freed */
2128             j = j < 0 ? COND_NEVER : j ? COND_IF_TRUE : COND_IF_FALSE;
2129         }
2130         cond = nasm_malloc(sizeof(Cond));
2131         cond->next = istk->conds;
2132         cond->state = j;
2133         istk->conds = cond;
2134         free_tlist(origline);
2135         return DIRECTIVE_FOUND;
2136
2137     CASE_PP_ELIF:
2138         if (!istk->conds)
2139             error(ERR_FATAL, "`%s': no matching `%%if'", pp_directives[i]);
2140         if (emitting(istk->conds->state)
2141             || istk->conds->state == COND_NEVER)
2142             istk->conds->state = COND_NEVER;
2143         else {
2144             /*
2145              * IMPORTANT: In the case of %if, we will already have
2146              * called expand_mmac_params(); however, if we're
2147              * processing an %elif we must have been in a
2148              * non-emitting mode, which would have inhibited
2149              * the normal invocation of expand_mmac_params().  Therefore,
2150              * we have to do it explicitly here.
2151              */
2152             j = if_condition(expand_mmac_params(tline->next), i);
2153             tline->next = NULL; /* it got freed */
2154             istk->conds->state =
2155                 j < 0 ? COND_NEVER : j ? COND_IF_TRUE : COND_IF_FALSE;
2156         }
2157         free_tlist(origline);
2158         return DIRECTIVE_FOUND;
2159
2160     case PP_ELSE:
2161         if (tline->next)
2162             error(ERR_WARNING, "trailing garbage after `%%else' ignored");
2163         if (!istk->conds)
2164             error(ERR_FATAL, "`%%else': no matching `%%if'");
2165         if (emitting(istk->conds->state)
2166             || istk->conds->state == COND_NEVER)
2167             istk->conds->state = COND_ELSE_FALSE;
2168         else
2169             istk->conds->state = COND_ELSE_TRUE;
2170         free_tlist(origline);
2171         return DIRECTIVE_FOUND;
2172
2173     case PP_ENDIF:
2174         if (tline->next)
2175             error(ERR_WARNING, "trailing garbage after `%%endif' ignored");
2176         if (!istk->conds)
2177             error(ERR_FATAL, "`%%endif': no matching `%%if'");
2178         cond = istk->conds;
2179         istk->conds = cond->next;
2180         nasm_free(cond);
2181         free_tlist(origline);
2182         return DIRECTIVE_FOUND;
2183
2184     case PP_MACRO:
2185     case PP_IMACRO:
2186         if (defining)
2187             error(ERR_FATAL,
2188                   "`%%%smacro': already defining a macro",
2189                   (i == PP_IMACRO ? "i" : ""));
2190         tline = tline->next;
2191         skip_white_(tline);
2192         tline = expand_id(tline);
2193         if (!tok_type_(tline, TOK_ID)) {
2194             error(ERR_NONFATAL,
2195                   "`%%%smacro' expects a macro name",
2196                   (i == PP_IMACRO ? "i" : ""));
2197             return DIRECTIVE_FOUND;
2198         }
2199         defining = nasm_malloc(sizeof(MMacro));
2200         defining->name = nasm_strdup(tline->text);
2201         defining->casesense = (i == PP_MACRO);
2202         defining->plus = false;
2203         defining->nolist = false;
2204         defining->in_progress = 0;
2205         defining->rep_nest = NULL;
2206         tline = expand_smacro(tline->next);
2207         skip_white_(tline);
2208         if (!tok_type_(tline, TOK_NUMBER)) {
2209             error(ERR_NONFATAL,
2210                   "`%%%smacro' expects a parameter count",
2211                   (i == PP_IMACRO ? "i" : ""));
2212             defining->nparam_min = defining->nparam_max = 0;
2213         } else {
2214             defining->nparam_min = defining->nparam_max =
2215                 readnum(tline->text, &err);
2216             if (err)
2217                 error(ERR_NONFATAL,
2218                       "unable to parse parameter count `%s'", tline->text);
2219         }
2220         if (tline && tok_is_(tline->next, "-")) {
2221             tline = tline->next->next;
2222             if (tok_is_(tline, "*"))
2223                 defining->nparam_max = INT_MAX;
2224             else if (!tok_type_(tline, TOK_NUMBER))
2225                 error(ERR_NONFATAL,
2226                       "`%%%smacro' expects a parameter count after `-'",
2227                       (i == PP_IMACRO ? "i" : ""));
2228             else {
2229                 defining->nparam_max = readnum(tline->text, &err);
2230                 if (err)
2231                     error(ERR_NONFATAL,
2232                           "unable to parse parameter count `%s'",
2233                           tline->text);
2234                 if (defining->nparam_min > defining->nparam_max)
2235                     error(ERR_NONFATAL,
2236                           "minimum parameter count exceeds maximum");
2237             }
2238         }
2239         if (tline && tok_is_(tline->next, "+")) {
2240             tline = tline->next;
2241             defining->plus = true;
2242         }
2243         if (tline && tok_type_(tline->next, TOK_ID) &&
2244             !nasm_stricmp(tline->next->text, ".nolist")) {
2245             tline = tline->next;
2246             defining->nolist = true;
2247         }
2248         mmac = (MMacro *) hash_findix(mmacros, defining->name);
2249         while (mmac) {
2250             if (!strcmp(mmac->name, defining->name) &&
2251                 (mmac->nparam_min <= defining->nparam_max
2252                  || defining->plus)
2253                 && (defining->nparam_min <= mmac->nparam_max
2254                     || mmac->plus)) {
2255                 error(ERR_WARNING,
2256                       "redefining multi-line macro `%s'", defining->name);
2257                 break;
2258             }
2259             mmac = mmac->next;
2260         }
2261         /*
2262          * Handle default parameters.
2263          */
2264         if (tline && tline->next) {
2265             defining->dlist = tline->next;
2266             tline->next = NULL;
2267             count_mmac_params(defining->dlist, &defining->ndefs,
2268                               &defining->defaults);
2269         } else {
2270             defining->dlist = NULL;
2271             defining->defaults = NULL;
2272         }
2273         defining->expansion = NULL;
2274         free_tlist(origline);
2275         return DIRECTIVE_FOUND;
2276
2277     case PP_ENDM:
2278     case PP_ENDMACRO:
2279         if (!defining) {
2280             error(ERR_NONFATAL, "`%s': not defining a macro", tline->text);
2281             return DIRECTIVE_FOUND;
2282         }
2283         mmhead = (MMacro **) hash_findi_add(mmacros, defining->name);
2284         defining->next = *mmhead;
2285         *mmhead = defining;
2286         defining = NULL;
2287         free_tlist(origline);
2288         return DIRECTIVE_FOUND;
2289
2290     case PP_ROTATE:
2291         if (tline->next && tline->next->type == TOK_WHITESPACE)
2292             tline = tline->next;
2293         if (tline->next == NULL) {
2294             free_tlist(origline);
2295             error(ERR_NONFATAL, "`%%rotate' missing rotate count");
2296             return DIRECTIVE_FOUND;
2297         }
2298         t = expand_smacro(tline->next);
2299         tline->next = NULL;
2300         free_tlist(origline);
2301         tline = t;
2302         tptr = &t;
2303         tokval.t_type = TOKEN_INVALID;
2304         evalresult =
2305             evaluate(ppscan, tptr, &tokval, NULL, pass, error, NULL);
2306         free_tlist(tline);
2307         if (!evalresult)
2308             return DIRECTIVE_FOUND;
2309         if (tokval.t_type)
2310             error(ERR_WARNING,
2311                   "trailing garbage after expression ignored");
2312         if (!is_simple(evalresult)) {
2313             error(ERR_NONFATAL, "non-constant value given to `%%rotate'");
2314             return DIRECTIVE_FOUND;
2315         }
2316         mmac = istk->mstk;
2317         while (mmac && !mmac->name)     /* avoid mistaking %reps for macros */
2318             mmac = mmac->next_active;
2319         if (!mmac) {
2320             error(ERR_NONFATAL, "`%%rotate' invoked outside a macro call");
2321         } else if (mmac->nparam == 0) {
2322             error(ERR_NONFATAL,
2323                   "`%%rotate' invoked within macro without parameters");
2324         } else {
2325             int rotate = mmac->rotate + reloc_value(evalresult);
2326
2327             rotate %= (int)mmac->nparam;
2328             if (rotate < 0)
2329                 rotate += mmac->nparam;
2330
2331             mmac->rotate = rotate;
2332         }
2333         return DIRECTIVE_FOUND;
2334
2335     case PP_REP:
2336         nolist = false;
2337         do {
2338             tline = tline->next;
2339         } while (tok_type_(tline, TOK_WHITESPACE));
2340
2341         if (tok_type_(tline, TOK_ID) &&
2342             nasm_stricmp(tline->text, ".nolist") == 0) {
2343             nolist = true;
2344             do {
2345                 tline = tline->next;
2346             } while (tok_type_(tline, TOK_WHITESPACE));
2347         }
2348
2349         if (tline) {
2350             t = expand_smacro(tline);
2351             tptr = &t;
2352             tokval.t_type = TOKEN_INVALID;
2353             evalresult =
2354                 evaluate(ppscan, tptr, &tokval, NULL, pass, error, NULL);
2355             if (!evalresult) {
2356                 free_tlist(origline);
2357                 return DIRECTIVE_FOUND;
2358             }
2359             if (tokval.t_type)
2360                 error(ERR_WARNING,
2361                       "trailing garbage after expression ignored");
2362             if (!is_simple(evalresult)) {
2363                 error(ERR_NONFATAL, "non-constant value given to `%%rep'");
2364                 return DIRECTIVE_FOUND;
2365             }
2366             count = reloc_value(evalresult) + 1;
2367         } else {
2368             error(ERR_NONFATAL, "`%%rep' expects a repeat count");
2369             count = 0;
2370         }
2371         free_tlist(origline);
2372
2373         tmp_defining = defining;
2374         defining = nasm_malloc(sizeof(MMacro));
2375         defining->name = NULL;  /* flags this macro as a %rep block */
2376         defining->casesense = false;
2377         defining->plus = false;
2378         defining->nolist = nolist;
2379         defining->in_progress = count;
2380         defining->nparam_min = defining->nparam_max = 0;
2381         defining->defaults = NULL;
2382         defining->dlist = NULL;
2383         defining->expansion = NULL;
2384         defining->next_active = istk->mstk;
2385         defining->rep_nest = tmp_defining;
2386         return DIRECTIVE_FOUND;
2387
2388     case PP_ENDREP:
2389         if (!defining || defining->name) {
2390             error(ERR_NONFATAL, "`%%endrep': no matching `%%rep'");
2391             return DIRECTIVE_FOUND;
2392         }
2393
2394         /*
2395          * Now we have a "macro" defined - although it has no name
2396          * and we won't be entering it in the hash tables - we must
2397          * push a macro-end marker for it on to istk->expansion.
2398          * After that, it will take care of propagating itself (a
2399          * macro-end marker line for a macro which is really a %rep
2400          * block will cause the macro to be re-expanded, complete
2401          * with another macro-end marker to ensure the process
2402          * continues) until the whole expansion is forcibly removed
2403          * from istk->expansion by a %exitrep.
2404          */
2405         l = nasm_malloc(sizeof(Line));
2406         l->next = istk->expansion;
2407         l->finishes = defining;
2408         l->first = NULL;
2409         istk->expansion = l;
2410
2411         istk->mstk = defining;
2412
2413         list->uplevel(defining->nolist ? LIST_MACRO_NOLIST : LIST_MACRO);
2414         tmp_defining = defining;
2415         defining = defining->rep_nest;
2416         free_tlist(origline);
2417         return DIRECTIVE_FOUND;
2418
2419     case PP_EXITREP:
2420         /*
2421          * We must search along istk->expansion until we hit a
2422          * macro-end marker for a macro with no name. Then we set
2423          * its `in_progress' flag to 0.
2424          */
2425         for (l = istk->expansion; l; l = l->next)
2426             if (l->finishes && !l->finishes->name)
2427                 break;
2428
2429         if (l)
2430             l->finishes->in_progress = 0;
2431         else
2432             error(ERR_NONFATAL, "`%%exitrep' not within `%%rep' block");
2433         free_tlist(origline);
2434         return DIRECTIVE_FOUND;
2435
2436     case PP_XDEFINE:
2437     case PP_IXDEFINE:
2438     case PP_DEFINE:
2439     case PP_IDEFINE:
2440         casesense = (i == PP_DEFINE || i == PP_XDEFINE);
2441
2442         tline = tline->next;
2443         skip_white_(tline);
2444         tline = expand_id(tline);
2445         if (!tline || (tline->type != TOK_ID &&
2446                        (tline->type != TOK_PREPROC_ID ||
2447                         tline->text[1] != '$'))) {
2448             error(ERR_NONFATAL, "`%s' expects a macro identifier",
2449                   pp_directives[i]);
2450             free_tlist(origline);
2451             return DIRECTIVE_FOUND;
2452         }
2453
2454         ctx = get_ctx(tline->text, false);
2455
2456         mname = tline->text;
2457         last = tline;
2458         param_start = tline = tline->next;
2459         nparam = 0;
2460
2461         /* Expand the macro definition now for %xdefine and %ixdefine */
2462         if ((i == PP_XDEFINE) || (i == PP_IXDEFINE))
2463             tline = expand_smacro(tline);
2464
2465         if (tok_is_(tline, "(")) {
2466             /*
2467              * This macro has parameters.
2468              */
2469
2470             tline = tline->next;
2471             while (1) {
2472                 skip_white_(tline);
2473                 if (!tline) {
2474                     error(ERR_NONFATAL, "parameter identifier expected");
2475                     free_tlist(origline);
2476                     return DIRECTIVE_FOUND;
2477                 }
2478                 if (tline->type != TOK_ID) {
2479                     error(ERR_NONFATAL,
2480                           "`%s': parameter identifier expected",
2481                           tline->text);
2482                     free_tlist(origline);
2483                     return DIRECTIVE_FOUND;
2484                 }
2485                 tline->type = TOK_SMAC_PARAM + nparam++;
2486                 tline = tline->next;
2487                 skip_white_(tline);
2488                 if (tok_is_(tline, ",")) {
2489                     tline = tline->next;
2490                     continue;
2491                 }
2492                 if (!tok_is_(tline, ")")) {
2493                     error(ERR_NONFATAL,
2494                           "`)' expected to terminate macro template");
2495                     free_tlist(origline);
2496                     return DIRECTIVE_FOUND;
2497                 }
2498                 break;
2499             }
2500             last = tline;
2501             tline = tline->next;
2502         }
2503         if (tok_type_(tline, TOK_WHITESPACE))
2504             last = tline, tline = tline->next;
2505         macro_start = NULL;
2506         last->next = NULL;
2507         t = tline;
2508         while (t) {
2509             if (t->type == TOK_ID) {
2510                 for (tt = param_start; tt; tt = tt->next)
2511                     if (tt->type >= TOK_SMAC_PARAM &&
2512                         !strcmp(tt->text, t->text))
2513                         t->type = tt->type;
2514             }
2515             tt = t->next;
2516             t->next = macro_start;
2517             macro_start = t;
2518             t = tt;
2519         }
2520         /*
2521          * Good. We now have a macro name, a parameter count, and a
2522          * token list (in reverse order) for an expansion. We ought
2523          * to be OK just to create an SMacro, store it, and let
2524          * free_tlist have the rest of the line (which we have
2525          * carefully re-terminated after chopping off the expansion
2526          * from the end).
2527          */
2528         define_smacro(ctx, mname, casesense, nparam, macro_start);
2529         free_tlist(origline);
2530         return DIRECTIVE_FOUND;
2531
2532     case PP_UNDEF:
2533         tline = tline->next;
2534         skip_white_(tline);
2535         tline = expand_id(tline);
2536         if (!tline || (tline->type != TOK_ID &&
2537                        (tline->type != TOK_PREPROC_ID ||
2538                         tline->text[1] != '$'))) {
2539             error(ERR_NONFATAL, "`%%undef' expects a macro identifier");
2540             free_tlist(origline);
2541             return DIRECTIVE_FOUND;
2542         }
2543         if (tline->next) {
2544             error(ERR_WARNING,
2545                   "trailing garbage after macro name ignored");
2546         }
2547
2548         /* Find the context that symbol belongs to */
2549         ctx = get_ctx(tline->text, false);
2550         undef_smacro(ctx, tline->text);
2551         free_tlist(origline);
2552         return DIRECTIVE_FOUND;
2553
2554     case PP_STRLEN:
2555         casesense = true;
2556
2557         tline = tline->next;
2558         skip_white_(tline);
2559         tline = expand_id(tline);
2560         if (!tline || (tline->type != TOK_ID &&
2561                        (tline->type != TOK_PREPROC_ID ||
2562                         tline->text[1] != '$'))) {
2563             error(ERR_NONFATAL,
2564                   "`%%strlen' expects a macro identifier as first parameter");
2565             free_tlist(origline);
2566             return DIRECTIVE_FOUND;
2567         }
2568         ctx = get_ctx(tline->text, false);
2569
2570         mname = tline->text;
2571         last = tline;
2572         tline = expand_smacro(tline->next);
2573         last->next = NULL;
2574
2575         t = tline;
2576         while (tok_type_(t, TOK_WHITESPACE))
2577             t = t->next;
2578         /* t should now point to the string */
2579         if (t->type != TOK_STRING) {
2580             error(ERR_NONFATAL,
2581                   "`%%strlen` requires string as second parameter");
2582             free_tlist(tline);
2583             free_tlist(origline);
2584             return DIRECTIVE_FOUND;
2585         }
2586
2587         macro_start = nasm_malloc(sizeof(*macro_start));
2588         macro_start->next = NULL;
2589         make_tok_num(macro_start, strlen(t->text) - 2);
2590         macro_start->mac = NULL;
2591
2592         /*
2593          * We now have a macro name, an implicit parameter count of
2594          * zero, and a numeric token to use as an expansion. Create
2595          * and store an SMacro.
2596          */
2597         define_smacro(ctx, mname, casesense, 0, macro_start);
2598         free_tlist(tline);
2599         free_tlist(origline);
2600         return DIRECTIVE_FOUND;
2601
2602     case PP_SUBSTR:
2603         casesense = true;
2604
2605         tline = tline->next;
2606         skip_white_(tline);
2607         tline = expand_id(tline);
2608         if (!tline || (tline->type != TOK_ID &&
2609                        (tline->type != TOK_PREPROC_ID ||
2610                         tline->text[1] != '$'))) {
2611             error(ERR_NONFATAL,
2612                   "`%%substr' expects a macro identifier as first parameter");
2613             free_tlist(origline);
2614             return DIRECTIVE_FOUND;
2615         }
2616         ctx = get_ctx(tline->text, false);
2617
2618         mname = tline->text;
2619         last = tline;
2620         tline = expand_smacro(tline->next);
2621         last->next = NULL;
2622
2623         t = tline->next;
2624         while (tok_type_(t, TOK_WHITESPACE))
2625             t = t->next;
2626
2627         /* t should now point to the string */
2628         if (t->type != TOK_STRING) {
2629             error(ERR_NONFATAL,
2630                   "`%%substr` requires string as second parameter");
2631             free_tlist(tline);
2632             free_tlist(origline);
2633             return DIRECTIVE_FOUND;
2634         }
2635
2636         tt = t->next;
2637         tptr = &tt;
2638         tokval.t_type = TOKEN_INVALID;
2639         evalresult =
2640             evaluate(ppscan, tptr, &tokval, NULL, pass, error, NULL);
2641         if (!evalresult) {
2642             free_tlist(tline);
2643             free_tlist(origline);
2644             return DIRECTIVE_FOUND;
2645         }
2646         if (!is_simple(evalresult)) {
2647             error(ERR_NONFATAL, "non-constant value given to `%%substr`");
2648             free_tlist(tline);
2649             free_tlist(origline);
2650             return DIRECTIVE_FOUND;
2651         }
2652
2653         macro_start = nasm_malloc(sizeof(*macro_start));
2654         macro_start->next = NULL;
2655         macro_start->text = nasm_strdup("'''");
2656         if (evalresult->value > 0
2657             && evalresult->value < (int) strlen(t->text) - 1) {
2658             macro_start->text[1] = t->text[evalresult->value];
2659         } else {
2660             macro_start->text[2] = '\0';
2661         }
2662         macro_start->type = TOK_STRING;
2663         macro_start->mac = NULL;
2664
2665         /*
2666          * We now have a macro name, an implicit parameter count of
2667          * zero, and a numeric token to use as an expansion. Create
2668          * and store an SMacro.
2669          */
2670         define_smacro(ctx, mname, casesense, 0, macro_start);
2671         free_tlist(tline);
2672         free_tlist(origline);
2673         return DIRECTIVE_FOUND;
2674
2675     case PP_ASSIGN:
2676     case PP_IASSIGN:
2677         casesense = (i == PP_ASSIGN);
2678
2679         tline = tline->next;
2680         skip_white_(tline);
2681         tline = expand_id(tline);
2682         if (!tline || (tline->type != TOK_ID &&
2683                        (tline->type != TOK_PREPROC_ID ||
2684                         tline->text[1] != '$'))) {
2685             error(ERR_NONFATAL,
2686                   "`%%%sassign' expects a macro identifier",
2687                   (i == PP_IASSIGN ? "i" : ""));
2688             free_tlist(origline);
2689             return DIRECTIVE_FOUND;
2690         }
2691         ctx = get_ctx(tline->text, false);
2692
2693         mname = tline->text;
2694         last = tline;
2695         tline = expand_smacro(tline->next);
2696         last->next = NULL;
2697
2698         t = tline;
2699         tptr = &t;
2700         tokval.t_type = TOKEN_INVALID;
2701         evalresult =
2702             evaluate(ppscan, tptr, &tokval, NULL, pass, error, NULL);
2703         free_tlist(tline);
2704         if (!evalresult) {
2705             free_tlist(origline);
2706             return DIRECTIVE_FOUND;
2707         }
2708
2709         if (tokval.t_type)
2710             error(ERR_WARNING,
2711                   "trailing garbage after expression ignored");
2712
2713         if (!is_simple(evalresult)) {
2714             error(ERR_NONFATAL,
2715                   "non-constant value given to `%%%sassign'",
2716                   (i == PP_IASSIGN ? "i" : ""));
2717             free_tlist(origline);
2718             return DIRECTIVE_FOUND;
2719         }
2720
2721         macro_start = nasm_malloc(sizeof(*macro_start));
2722         macro_start->next = NULL;
2723         make_tok_num(macro_start, reloc_value(evalresult));
2724         macro_start->mac = NULL;
2725
2726         /*
2727          * We now have a macro name, an implicit parameter count of
2728          * zero, and a numeric token to use as an expansion. Create
2729          * and store an SMacro.
2730          */
2731         define_smacro(ctx, mname, casesense, 0, macro_start);
2732         free_tlist(origline);
2733         return DIRECTIVE_FOUND;
2734
2735     case PP_LINE:
2736         /*
2737          * Syntax is `%line nnn[+mmm] [filename]'
2738          */
2739         tline = tline->next;
2740         skip_white_(tline);
2741         if (!tok_type_(tline, TOK_NUMBER)) {
2742             error(ERR_NONFATAL, "`%%line' expects line number");
2743             free_tlist(origline);
2744             return DIRECTIVE_FOUND;
2745         }
2746         k = readnum(tline->text, &err);
2747         m = 1;
2748         tline = tline->next;
2749         if (tok_is_(tline, "+")) {
2750             tline = tline->next;
2751             if (!tok_type_(tline, TOK_NUMBER)) {
2752                 error(ERR_NONFATAL, "`%%line' expects line increment");
2753                 free_tlist(origline);
2754                 return DIRECTIVE_FOUND;
2755             }
2756             m = readnum(tline->text, &err);
2757             tline = tline->next;
2758         }
2759         skip_white_(tline);
2760         src_set_linnum(k);
2761         istk->lineinc = m;
2762         if (tline) {
2763             nasm_free(src_set_fname(detoken(tline, false)));
2764         }
2765         free_tlist(origline);
2766         return DIRECTIVE_FOUND;
2767
2768     default:
2769         error(ERR_FATAL,
2770               "preprocessor directive `%s' not yet implemented",
2771               pp_directives[i]);
2772         break;
2773     }
2774     return DIRECTIVE_FOUND;
2775 }
2776
2777 /*
2778  * Check that macro parameter `t' consists of a single condition code,
2779  * optionally followed by a `,' token (whitespace before each is skipped).
2780  * Returns the index of the code in conditions[], or -1 if it is not one.
2781  */
2782 static int find_cc(Token * t)
2783 {
2784     Token *tt;
2785     int lo, hi, mid, cmp;
2786
2787     if (!t)
2788         return -1;              /* Probably a %+ without a space */
2789
2790     skip_white_(t);
2791     if (!t || t->type != TOK_ID)        /* skip_white_ may leave t NULL */
2792         return -1;
2793     tt = t->next;
2794     skip_white_(tt);
2795     if (tt && (tt->type != TOK_OTHER || strcmp(tt->text, ",")))
2796         return -1;              /* something other than `,' follows */
2797
2798     /*
2799      * Case-insensitive binary search: a match, if any, lies strictly
2800      * between lo and hi (assumes conditions[] is sorted -- confirm).
2801      */
2802     lo = -1;
2803     hi = elements(conditions);
2804     while (hi - lo > 1) {
2805         mid = (lo + hi) / 2;
2806         cmp = nasm_stricmp(t->text, conditions[mid]);
2807         if (cmp == 0)
2808             return mid;
2809         if (cmp < 0)
2810             hi = mid;
2811         else
2812             lo = mid;
2813     }
2814     return -1;
2815 }
2816
2817 /*
2818  * Expand MMacro-local things: parameter references (%0, %n, %+n,
2819  * %-n) and MMacro-local identifiers (%%foo).
      *
      * The tokens of `tline' are moved onto a new list, which is returned.
      * Tokens that are not MMacro-local references are relinked unchanged
      * apart from having their `mac' field cleared. The macro consulted is
      * the first entry with a name reached from istk->mstk by following
      * next_active; if there is none, an error is reported and the
      * reference is dropped from the line.
      *
      * Once the whole line has been processed, a second pass glues
      * together neighbouring tokens that substitution has left adjacent:
      * whitespace + whitespace, identifier + identifier/number and
      * number + number.
2820  */
2821 static Token *expand_mmac_params(Token * tline)
2822 {
2823     Token *t, *tt, **tail, *thead;
2824
2825     tail = &thead;              /* where the next output token gets linked */
2826     thead = NULL;
2827
2828     while (tline) {
              /* %+x or %-x (something must follow the sign), %%..., %<digit>... */
2829         if (tline->type == TOK_PREPROC_ID &&
2830             (((tline->text[1] == '+' || tline->text[1] == '-')
2831               && tline->text[2]) || tline->text[1] == '%'
2832              || (tline->text[1] >= '0' && tline->text[1] <= '9'))) {
2833             char *text = NULL;  /* replacement text; NULL means "drop t" */
2834             int type = 0, cc;   /* type = 0 to placate optimisers */
2835             char tmpbuf[30];
2836             unsigned int n;     /* zero-based parameter index */
2837             int i;
2838             MMacro *mac;
2839
2840             t = tline;          /* t is the reference being replaced */
2841             tline = tline->next;
2842
2843             mac = istk->mstk;
2844             while (mac && !mac->name)   /* avoid mistaking %reps for macros */
2845                 mac = mac->next_active;
2846             if (!mac)
2847                 error(ERR_NONFATAL, "`%s': not in a macro call", t->text);
2848             else
2849                 switch (t->text[1]) {
2850                     /*
2851                      * We have to make a substitution of one of the
2852                      * forms %1, %-1, %+1, %%foo, %0.
2853                      */
2854                 case '0':
                          /* %0: the macro's parameter count, as a number token */
2855                     type = TOK_NUMBER;
2856                     snprintf(tmpbuf, sizeof(tmpbuf), "%d", mac->nparam);
2857                     text = nasm_strdup(tmpbuf);
2858                     break;
2859                 case '%':
                          /* %%foo: becomes the identifier ..@<mac->unique>.foo */
2860                     type = TOK_ID;
2861                     snprintf(tmpbuf, sizeof(tmpbuf), "..@%"PRIu64".",
2862                              mac->unique);
2863                     text = nasm_strcat(tmpbuf, t->text + 2);
2864                     break;
2865                 case '-':
                          /*
                           * %-n: the inverse of the condition code held in
                           * parameter n. n is unsigned, so a parsed value of
                           * 0 wraps around and fails the range check below.
                           */
2866                     n = atoi(t->text + 2) - 1;
2867                     if (n >= mac->nparam)
2868                         tt = NULL;
2869                     else {
                              /* apply the macro's current rotation */
2870                         if (mac->nparam > 1)
2871                             n = (n + mac->rotate) % mac->nparam;
2872                         tt = mac->params[n];
2873                     }
2874                     cc = find_cc(tt);
2875                     if (cc == -1) {
                              /* note: for an in-range n this is the rotated index */
2876                         error(ERR_NONFATAL,
2877                               "macro parameter %d is not a condition code",
2878                               n + 1);
2879                         text = NULL;
2880                     } else {
2881                         type = TOK_ID;
2882                         if (inverse_ccs[cc] == -1) {
2883                             error(ERR_NONFATAL,
2884                                   "condition code `%s' is not invertible",
2885                                   conditions[cc]);
2886                             text = NULL;
2887                         } else
2888                             text =
2889                                 nasm_strdup(conditions[inverse_ccs[cc]]);
2890                     }
2891                     break;
2892                 case '+':
                          /* %+n: the condition code held in parameter n */
2893                     n = atoi(t->text + 2) - 1;
2894                     if (n >= mac->nparam)
2895                         tt = NULL;
2896                     else {
2897                         if (mac->nparam > 1)
2898                             n = (n + mac->rotate) % mac->nparam;
2899                         tt = mac->params[n];
2900                     }
2901                     cc = find_cc(tt);
2902                     if (cc == -1) {
2903                         error(ERR_NONFATAL,
2904                               "macro parameter %d is not a condition code",
2905                               n + 1);
2906                         text = NULL;
2907                     } else {
2908                         type = TOK_ID;
2909                         text = nasm_strdup(conditions[cc]);
2910                     }
2911                     break;
2912                 default:
                          /*
                           * %n: append copies of the mac->paramlen[n] tokens
                           * of parameter n directly to the output list. An
                           * out-of-range n expands to nothing.
                           */
2913                     n = atoi(t->text + 1) - 1;
2914                     if (n >= mac->nparam)
2915                         tt = NULL;
2916                     else {
2917                         if (mac->nparam > 1)
2918                             n = (n + mac->rotate) % mac->nparam;
2919                         tt = mac->params[n];
2920                     }
2921                     if (tt) {
2922                         for (i = 0; i < mac->paramlen[n]; i++) {
2923                             *tail = new_Token(NULL, tt->type, tt->text, 0);
2924                             tail = &(*tail)->next;
2925                             tt = tt->next;
2926                         }
2927                     }
2928                     text = NULL;        /* we've done it here */
2929                     break;
2930                 }
                  /*
                   * Either discard the reference token, or recycle it as the
                   * replacement by swapping in the new type and text.
                   */
2931             if (!text) {
2932                 delete_Token(t);
2933             } else {
2934                 *tail = t;
2935                 tail = &t->next;
2936                 t->type = type;
2937                 nasm_free(t->text);
2938                 t->text = text;
2939                 t->mac = NULL;
2940             }
2941             continue;
2942         } else {
                  /* Ordinary token: move it to the output list as it is */
2943             t = *tail = tline;
2944             tline = tline->next;
2945             t->mac = NULL;
2946             tail = &t->next;
2947         }
2948     }
2949     *tail = NULL;
          /*
           * Second pass: merge each token with its successor where the pair
           * is whitespace+whitespace, ID+ID, ID+NUMBER or NUMBER+NUMBER.
           * NOTE(review): the loop advances after a merge as well, so a
           * merged token does not seem to be compared with its new
           * successor -- confirm that this is intended.
           */
2950     t = thead;
2951     for (; t && (tt = t->next) != NULL; t = t->next)
2952         switch (t->type) {
2953         case TOK_WHITESPACE:
2954             if (tt->type == TOK_WHITESPACE) {
2955                 t->next = delete_Token(tt);
2956             }
2957             break;
2958         case TOK_ID:
2959             if (tt->type == TOK_ID || tt->type == TOK_NUMBER) {
2960                 char *tmp = nasm_strcat(t->text, tt->text);
2961                 nasm_free(t->text);
2962                 t->text = tmp;
2963                 t->next = delete_Token(tt);
2964             }
2965             break;
2966         case TOK_NUMBER:
2967             if (tt->type == TOK_NUMBER) {
2968                 char *tmp = nasm_strcat(t->text, tt->text);
2969                 nasm_free(t->text);
2970                 t->text = tmp;
2971                 t->next = delete_Token(tt);
2972             }
2973             break;
2974         default:
2975             break;
2976         }
2977
2978     return thead;
2979 }
2980
2981 /*
2982  * Expand all single-line macro calls made in the given line.
2983  * Return the expanded version of the line. The original is deemed
2984  * to be destroyed in the process. (In reality we'll just move
2985  * Tokens from input to output a lot of the time, rather than
2986  * actually bothering to destroy and replicate.)
      *
      * When tline is non-NULL the value returned is tline itself: the
      * first Token structure is overwritten in place with the head of
      * the expanded list (or turned into a lone TOK_WHITESPACE token
      * with no text if the line expands to nothing). A NULL tline
      * yields NULL.
      *
      * DEADMAN_LIMIT bounds the number of main-loop iterations for one
      * call; the counter is not reset when the line is re-scanned. When
      * it runs out, "interminable macro recursion" is reported, the main
      * loop is left, and the tokens not yet processed are not added to
      * the result.
2987  */
2988 #define DEADMAN_LIMIT (1 << 20)
2989
2990 static Token *expand_smacro(Token * tline)
2991 {
2992     Token *t, *tt, *mstart, **tail, *thead;
2993     SMacro *head = NULL, *m;
2994     Token **params;             /* params[i]: first token of argument i */
2995     int *paramsize;             /* paramsize[i]: token count of argument i */
2996     unsigned int nparam, sparam;        /* arguments seen / slots allocated */
2997     int brackets, rescan;
2998     Token *org_tline = tline;
2999     Context *ctx;
3000     char *mname;
3001     int deadman = DEADMAN_LIMIT;
3002
3003     /*
3004      * Trick: we should avoid changing the start token pointer since it can
3005      * be contained in "next" field of other token. Because of this
3006      * we allocate a copy of first token and work with it; at the end of
3007      * routine we copy it back
3008      */
3009     if (org_tline) {
3010         tline =
3011             new_Token(org_tline->next, org_tline->type, org_tline->text,
3012                       0);
3013         tline->mac = org_tline->mac;
3014         nasm_free(org_tline->text);
3015         org_tline->text = NULL;
3016     }
3017
3018 again:
          /* (Re)start with an empty output list; tline is the to-do list */
3019     tail = &thead;
3020     thead = NULL;
3021
3022     while (tline) {             /* main token loop */
3023         if (!--deadman) {
3024             error(ERR_NONFATAL, "interminable macro recursion");
3025             break;
3026         }
3027
3028         if ((mname = tline->text)) {
3029             /* if this token is a local macro, look in local context */
3030             if (tline->type == TOK_ID || tline->type == TOK_PREPROC_ID)
3031                 ctx = get_ctx(mname, true);
3032             else
3033                 ctx = NULL;
3034             if (!ctx) {
3035                 head = (SMacro *) hash_findix(smacros, mname);
3036             } else {
3037                 head = ctx->localmac;
3038             }
3039             /*
3040              * We've hit an identifier. As in is_mmacro below, we first
3041              * check whether the identifier is a single-line macro at
3042              * all, then think about checking for parameters if
3043              * necessary.
3044              */
3045             for (m = head; m; m = m->next)
3046                 if (!mstrcmp(m->name, mname, m->casesense))
3047                     break;
3048             if (m) {
3049                 mstart = tline; /* first token of the (putative) call */
3050                 params = NULL;
3051                 paramsize = NULL;
3052                 if (m->nparam == 0) {
3053                     /*
3054                      * Simple case: the macro is parameterless. Discard the
3055                      * one token that the macro call took, and push the
3056                      * expansion back on the to-do stack.
3057                      */
3058                     if (!m->expansion) {
                              /*
                               * No expansion list: __FILE__, __LINE__ and
                               * __BITS__ are computed here by rewriting the
                               * token in place (it is then looked at again
                               * by the main loop); any other such macro
                               * expands to nothing, so the token is dropped.
                               */
3059                         if (!strcmp("__FILE__", m->name)) {
3060                             int32_t num = 0;
3061                             src_get(&num, &(tline->text));
3062                             nasm_quote(&(tline->text));
3063                             tline->type = TOK_STRING;
3064                             continue;
3065                         }
3066                         if (!strcmp("__LINE__", m->name)) {
3067                             nasm_free(tline->text);
3068                             make_tok_num(tline, src_get_linnum());
3069                             continue;
3070                         }
3071                         if (!strcmp("__BITS__", m->name)) {
3072                             nasm_free(tline->text);
3073                             make_tok_num(tline, globalbits);
3074                             continue;
3075                         }
3076                         tline = delete_Token(tline);
3077                         continue;
3078                     }
3079                 } else {
3080                     /*
3081                      * Complicated case: at least one macro with this name
3082                      * exists and takes parameters. We must find the
3083                      * parameters in the call, count them, find the SMacro
3084                      * that corresponds to that form of the macro call, and
3085                      * substitute for the parameters when we expand. What a
3086                      * pain.
3087                      */
3088                     /*tline = tline->next;
3089                        skip_white_(tline); */
                          /*
                           * Step to the next non-whitespace token. Any
                           * TOK_SMAC_END markers met on the way are removed
                           * and the macros they belong to are released from
                           * their in_progress state.
                           */
3090                     do {
3091                         t = tline->next;
3092                         while (tok_type_(t, TOK_SMAC_END)) {
3093                             t->mac->in_progress = false;
3094                             t->text = NULL;
3095                             t = tline->next = delete_Token(t);
3096                         }
3097                         tline = t;
3098                     } while (tok_type_(tline, TOK_WHITESPACE));
3099                     if (!tok_is_(tline, "(")) {
3100                         /*
3101                          * This macro wasn't called with parameters: ignore
3102                          * the call. (Behaviour borrowed from gnu cpp.)
3103                          */
3104                         tline = mstart;
3105                         m = NULL;
3106                     } else {
                              /*
                               * paren:    nesting depth of ( ) inside the call
                               * white:    whitespace tokens seen since the last
                               *           counted token of this argument; they
                               *           are only added to its size if another
                               *           token follows, so trailing whitespace
                               *           is not counted
                               * brackets: > 0 inside { }, -1 right after the
                               *           closing brace of a braced argument
                               */
3107                         int paren = 0;
3108                         int white = 0;
3109                         brackets = 0;
3110                         nparam = 0;
3111                         sparam = PARAM_DELTA;
3112                         params = nasm_malloc(sparam * sizeof(Token *));
3113                         params[0] = tline->next;
3114                         paramsize = nasm_malloc(sparam * sizeof(int));
3115                         paramsize[0] = 0;
3116                         while (true) {  /* parameter loop */
3117                             /*
3118                              * For some unusual expansions
3119                              * which concatenates function call
3120                              */
3121                             t = tline->next;
3122                             while (tok_type_(t, TOK_SMAC_END)) {
3123                                 t->mac->in_progress = false;
3124                                 t->text = NULL;
3125                                 t = tline->next = delete_Token(t);
3126                             }
3127                             tline = t;
3128
3129                             if (!tline) {
3130                                 error(ERR_NONFATAL,
3131                                       "macro call expects terminating `)'");
3132                                 break;
3133                             }
                                  /*
                                   * Whitespace outside braces: skipped if the
                                   * argument has not started yet, otherwise
                                   * held back in `white'.
                                   */
3134                             if (tline->type == TOK_WHITESPACE
3135                                 && brackets <= 0) {
3136                                 if (paramsize[nparam])
3137                                     white++;
3138                                 else
3139                                     params[nparam] = tline->next;
3140                                 continue;       /* parameter loop */
3141                             }
3142                             if (tline->type == TOK_OTHER
3143                                 && tline->text[1] == 0) {
3144                                 char ch = tline->text[0];
                                      /* A top-level comma starts the next argument */
3145                                 if (ch == ',' && !paren && brackets <= 0) {
3146                                     if (++nparam >= sparam) {
3147                                         sparam += PARAM_DELTA;
3148                                         params = nasm_realloc(params,
3149                                                               sparam *
3150                                                               sizeof(Token
3151                                                                      *));
3152                                         paramsize =
3153                                             nasm_realloc(paramsize,
3154                                                          sparam *
3155                                                          sizeof(int));
3156                                     }
3157                                     params[nparam] = tline->next;
3158                                     paramsize[nparam] = 0;
3159                                     white = 0;
3160                                     continue;   /* parameter loop */
3161                                 }
                                      /*
                                       * An opening brace counts as a delimiter
                                       * only as the first token of an argument;
                                       * nested braces are kept in the argument.
                                       */
3162                                 if (ch == '{' &&
3163                                     (brackets > 0 || (brackets == 0 &&
3164                                                       !paramsize[nparam])))
3165                                 {
3166                                     if (!(brackets++)) {
3167                                         params[nparam] = tline->next;
3168                                         continue;       /* parameter loop */
3169                                     }
3170                                 }
3171                                 if (ch == '}' && brackets > 0)
3172                                     if (--brackets == 0) {
3173                                         brackets = -1;
3174                                         continue;       /* parameter loop */
3175                                     }
3176                                 if (ch == '(' && !brackets)
3177                                     paren++;
                                      /* The unmatched `)' ends the call */
3178                                 if (ch == ')' && brackets <= 0)
3179                                     if (--paren < 0)
3180                                         break;
3181                             }
                                  /* A token after the closing brace of an argument */
3182                             if (brackets < 0) {
3183                                 brackets = 0;
3184                                 error(ERR_NONFATAL, "braces do not "
3185                                       "enclose all of macro parameter");
3186                             }
3187                             paramsize[nparam] += white + 1;
3188                             white = 0;
3189                         }       /* parameter loop */
3190                         nparam++;
                              /*
                               * Look for the definition of this name that
                               * takes exactly the number of arguments found.
                               */
3191                         while (m && (m->nparam != nparam ||
3192                                      mstrcmp(m->name, mname,
3193                                              m->casesense)))
3194                             m = m->next;
3195                         if (!m)
3196                             error(ERR_WARNING | ERR_WARN_MNP,
3197                                   "macro `%s' exists, "
3198                                   "but not taking %d parameters",
3199                                   mstart->text, nparam);
3200                     }
3201                 }
                      /* Cycle removal: a macro being expanded is not expanded again */
3202                 if (m && m->in_progress)
3203                     m = NULL;
3204                 if (!m) {       /* in progress or didn't find '(' or wrong nparam */
3205                     /*
3206                      * Design question: should we handle !tline, which
3207                      * indicates missing ')' here, or expand those
3208                      * macros anyway, which requires the (t) test a few
3209                      * lines down?
3210                      */
3211                     nasm_free(params);
3212                     nasm_free(paramsize);
3213                     tline = mstart;
3214                 } else {
3215                     /*
3216                      * Expand the macro: we are placed on the last token of the
3217                      * call, so that we can easily split the call from the
3218                      * following tokens. We also start by pushing an SMAC_END
3219                      * token for the cycle removal.
3220                      */
3221                     t = tline;
3222                     if (t) {
3223                         tline = t->next;
3224                         t->next = NULL;
3225                     }
3226                     tt = new_Token(tline, TOK_SMAC_END, NULL, 0);
3227                     tt->mac = m;
3228                     m->in_progress = true;
3229                     tline = tt;
                          /*
                           * Copy the expansion onto the front of the to-do
                           * list. Each copy is pushed in front of the previous
                           * one, so the copies end up in the reverse of the
                           * order in which m->expansion links them (presumably
                           * the expansion is stored back to front -- confirm
                           * where SMacros are defined). A TOK_SMAC_PARAM + i
                           * token is replaced by copies of the tokens of
                           * argument i, kept in their original order.
                           */
3230                     for (t = m->expansion; t; t = t->next) {
3231                         if (t->type >= TOK_SMAC_PARAM) {
3232                             Token *pcopy = tline, **ptail = &pcopy;
3233                             Token *ttt, *pt;
3234                             int i;
3235
3236                             ttt = params[t->type - TOK_SMAC_PARAM];
3237                             for (i = paramsize[t->type - TOK_SMAC_PARAM];
3238                                  --i >= 0;) {
3239                                 pt = *ptail =
3240                                     new_Token(tline, ttt->type, ttt->text,
3241                                               0);
3242                                 ptail = &pt->next;
3243                                 ttt = ttt->next;
3244                             }
3245                             tline = pcopy;
3246                         } else {
3247                             tt = new_Token(tline, t->type, t->text, 0);
3248                             tline = tt;
3249                         }
3250                     }
3251
3252                     /*
3253                      * Having done that, get rid of the macro call, and clean
3254                      * up the parameters.
3255                      */
3256                     nasm_free(params);
3257                     nasm_free(paramsize);
3258                     free_tlist(mstart);
3259                     continue;   /* main token loop */
3260                 }
3261             }
3262         }
3263
              /*
               * Not a macro call that we expand: an SMAC_END marker ends
               * the in_progress state of its macro and is removed; any
               * other token is moved to the output list.
               */
3264         if (tline->type == TOK_SMAC_END) {
3265             tline->mac->in_progress = false;
3266             tline = delete_Token(tline);
3267         } else {
3268             t = *tail = tline;
3269             tline = tline->next;
3270             t->mac = NULL;
3271             t->next = NULL;
3272             tail = &t->next;
3273         }
3274     }
3275
3276     /*
3277      * Now scan the entire line and look for successive TOK_IDs that resulted
3278      * after expansion (they can't be produced by tokenize()). The successive
3279      * TOK_IDs should be concatenated.
3280      * Also we look for %+ tokens and concatenate the tokens before and after
3281      * them (without white spaces in between).
3282      */
3283     t = thead;
3284     rescan = 0;
3285     while (t) {
              /* Find the next identifier that still has a successor */
3286         while (t && t->type != TOK_ID && t->type != TOK_PREPROC_ID)
3287             t = t->next;
3288         if (!t || !t->next)
3289             break;
3290         if (t->next->type == TOK_ID ||
3291             t->next->type == TOK_PREPROC_ID ||
3292             t->next->type == TOK_NUMBER) {
                  /* Paste the successor onto t; t is examined again next time round */
3293             char *p = nasm_strcat(t->text, t->next->text);
3294             nasm_free(t->text);
3295             t->next = delete_Token(t->next);
3296             t->text = p;
3297             rescan = 1;
3298         } else if (t->next->type == TOK_WHITESPACE && t->next->next &&
3299                    t->next->next->type == TOK_PREPROC_ID &&
3300                    strcmp(t->next->next->text, "%+") == 0) {
3301             /* free the next whitespace, the %+ token and next whitespace */
3302             int i;
3303             for (i = 1; i <= 3; i++) {
3304                 if (!t->next
3305                     || (i != 2 && t->next->type != TOK_WHITESPACE))
3306                     break;
3307                 t->next = delete_Token(t->next);
3308             }                   /* endfor */
3309         } else
3310             t = t->next;
3311     }
3312     /* If we concatenated something, re-scan the line for macros */
3313     if (rescan) {
3314         tline = thead;
3315         goto again;
3316     }
3317
          /*
           * Copy the head of the result back into the caller's first
           * token, so that the pointer passed in still heads the line.
           */
3318     if (org_tline) {
3319         if (thead) {
3320             *org_tline = *thead;
3321             /* since we just gave text to org_line, don't free it */
3322             thead->text = NULL;
3323             delete_Token(thead);
3324         } else {
3325             /* the expression expanded to empty line;
3326                we can't return NULL for some reasons
3327                we just set the line to a single WHITESPACE token. */
3328             memset(org_tline, 0, sizeof(*org_tline));
3329             org_tline->text = NULL;
3330             org_tline->type = TOK_WHITESPACE;
3331         }
3332         thead = org_tline;
3333     }
3334
3335     return thead;
3336 }
3337
3338 /*
3339  * A cut-down relative of expand_smacro, applied to the macro name
3340  * that a directive is about to consume. Such a name may be written
3341  * as several adjacent tokens. A name made of a single token is left
3342  * untouched, so that the directive sees exactly what the user wrote:
3343  *
3344  *      %define %$abc cde
3345  *
3346  * Here %$abc is handed to %define as-is and becomes the name being
3347  * defined. A name made of two or more adjacent tokens, e.g.
3348  *
3349  *      %define _%$abc cde
3350  *
3351  * is taken as a request to expand the pieces *before* the directive
3352  * runs: the run of identifier/number tokens is passed through
3353  * expand_smacro (a piece with no macro value stays as it is) and
3354  * the result, in which adjacent identifiers have been joined, is
3355  * spliced back in front of the rest of the line.
3356  */
3357 static Token *expand_id(Token * tline)
3358 {
3359     Token *last, *rest;
3360
3361     /* Nothing to do for an empty line or a lone token */
3362     if (!tline || !tline->next)
3363         return tline;
3364
3365     /* Walk to the last token of the leading ID/PREPROC_ID/NUMBER run */
3366     for (last = tline; last->next; last = last->next) {
3367         Token *nxt = last->next;
3368
3369         if (nxt->type != TOK_ID && nxt->type != TOK_PREPROC_ID &&
3370             nxt->type != TOK_NUMBER)
3371             break;
3372     }
3373
3374     /* A name made of a single token must reach the caller unexpanded */
3375     if (last == tline)
3376         return tline;
3377
3378     /* Cut the line after the name so that only the name is expanded */
3379     rest = last->next;
3380     last->next = NULL;
3381
3382     tline = expand_smacro(tline);
3383
3384     /* The list may have been rebuilt: find its new end and re-attach */
3385     last = tline;
3386     while (last && last->next)
3387         last = last->next;
3388     if (last)
3389         last->next = rest;
3390
3391     return tline;
3392 }
3393
3394 /*
3395  * Determine whether the given line constitutes a multi-line macro
3396  * call, and return the MMacro structure called if so. Doesn't have
3397  * to check for an initial label - that's taken care of in
3398  * expand_mmacro - but must check numbers of parameters. Guaranteed
3399  * to be called with tline->type == TOK_ID, so the putative macro
3400  * name is easy to find.
3401  */
3402 static MMacro *is_mmacro(Token * tline, Token *** params_array)
3403 {
3404     MMacro *head, *m;
3405     Token **params;
3406     int nparam;
3407
3408     head = (MMacro *) hash_findix(mmacros, tline->text);
3409
3410     /*
3411      * Efficiency: first we see if any macro exists with the given
3412      * name. If not, we can return NULL immediately. _Then_ we
3413      * count the parameters, and then we look further along the
3414      * list if necessary to find the proper MMacro.
3415      */
3416     for (m = head; m; m = m->next)
3417         if (!mstrcmp(m->name, tline->text, m->casesense))
3418             break;
3419     if (!m)
3420         return NULL;
3421
3422     /*
3423      * OK, we have a potential macro. Count and demarcate the
3424      * parameters.
3425      */
3426     count_mmac_params(tline->next, &nparam, &params);
3427
3428     /*
3429      * So we know how many parameters we've got. Find the MMacro
3430      * structure that handles this number.
3431      */
3432     while (m) {
3433         if (m->nparam_min <= nparam
3434             && (m->plus || nparam <= m->nparam_max)) {
3435             /*
3436              * This one is right. Just check if cycle removal
3437              * prohibits us using it before we actually celebrate...
3438              */
3439             if (m->in_progress) {
3440 #if 0
3441                 error(ERR_NONFATAL,
3442                       "self-reference in multi-line macro `%s'", m->name);
3443 #endif
3444                 nasm_free(params);
3445                 return NULL;
3446             }
3447             /*
3448              * It's right, and we can use it. Add its default
3449              * parameters to the end of our list if necessary.
3450              */
3451             if (m->defaults && nparam < m->nparam_min + m->ndefs) {
3452                 params =
3453                     nasm_realloc(params,
3454                                  ((m->nparam_min + m->ndefs +
3455                                    1) * sizeof(*params)));
3456                 while (nparam < m->nparam_min + m->ndefs) {
3457                     params[nparam] = m->defaults[nparam - m->nparam_min];
3458                     nparam++;
3459                 }
3460             }
3461             /*
3462              * If we've gone over the maximum parameter count (and
3463              * we're in Plus mode), ignore parameters beyond
3464              * nparam_max.
3465              */
3466             if (m->plus && nparam > m->nparam_max)
3467                 nparam = m->nparam_max;
3468             /*
3469              * Then terminate the parameter list, and leave.
3470              */
3471             if (!params) {      /* need this special case */
3472                 params = nasm_malloc(sizeof(*params));
3473                 nparam = 0;
3474             }
3475             params[nparam] = NULL;
3476             *params_array = params;
3477             return m;
3478         }
3479         /*
3480          * This one wasn't right: look for the next one with the
3481          * same name.
3482          */
3483         for (m = m->next; m; m = m->next)
3484             if (!mstrcmp(m->name, tline->text, m->casesense))
3485                 break;
3486     }
3487
3488     /*
3489      * After all that, we didn't find one with the right number of
3490      * parameters. Issue a warning, and fail to expand the macro.
3491      */
3492     error(ERR_WARNING | ERR_WARN_MNP,
3493           "macro `%s' exists, but not taking %d parameters",
3494           tline->text, nparam);
3495     nasm_free(params);
3496     return NULL;
3497 }
3498
3499 /*
3500  * Expand the multi-line macro call made by the given line, if
3501  * there is one to be expanded. If there is, push the expansion on
3502  * istk->expansion and return 1. Otherwise return 0.
3503  */
3504 static int expand_mmacro(Token * tline)
3505 {
3506     Token *startline = tline;
3507     Token *label = NULL;
3508     int dont_prepend = 0;
3509     Token **params, *t, *tt;
3510     MMacro *m;
3511     Line *l, *ll;
3512     int i, nparam, *paramlen;
3513
3514     t = tline;
3515     skip_white_(t);
3516 /*    if (!tok_type_(t, TOK_ID))  Lino 02/25/02 */
3517     if (!tok_type_(t, TOK_ID) && !tok_type_(t, TOK_PREPROC_ID))
3518         return 0;
3519     m = is_mmacro(t, &params);
3520     if (!m) {
3521         Token *last;
3522         /*
3523          * We have an id which isn't a macro call. We'll assume
3524          * it might be a label; we'll also check to see if a
3525          * colon follows it. Then, if there's another id after
3526          * that lot, we'll check it again for macro-hood.
3527          */
3528         label = last = t;
3529         t = t->next;
3530         if (tok_type_(t, TOK_WHITESPACE))
3531             last = t, t = t->next;
3532         if (tok_is_(t, ":")) {
3533             dont_prepend = 1;
3534             last = t, t = t->next;
3535             if (tok_type_(t, TOK_WHITESPACE))
3536                 last = t, t = t->next;
3537         }
3538         if (!tok_type_(t, TOK_ID) || (m = is_mmacro(t, &params)) == NULL)
3539             return 0;
3540         last->next = NULL;
3541         tline = t;
3542     }
3543
3544     /*
3545      * Fix up the parameters: this involves stripping leading and
3546      * trailing whitespace, then stripping braces if they are
3547      * present.
3548      */
3549     for (nparam = 0; params[nparam]; nparam++) ;
3550     paramlen = nparam ? nasm_malloc(nparam * sizeof(*paramlen)) : NULL;
3551
3552     for (i = 0; params[i]; i++) {
3553         int brace = false;
3554         int comma = (!m->plus || i < nparam - 1);
3555
3556         t = params[i];
3557         skip_white_(t);
3558         if (tok_is_(t, "{"))
3559             t = t->next, brace = true, comma = false;
3560         params[i] = t;
3561         paramlen[i] = 0;
3562         while (t) {
3563             if (comma && t->type == TOK_OTHER && !strcmp(t->text, ","))
3564                 break;          /* ... because we have hit a comma */
3565             if (comma && t->type == TOK_WHITESPACE
3566                 && tok_is_(t->next, ","))
3567                 break;          /* ... or a space then a comma */
3568             if (brace && t->type == TOK_OTHER && !strcmp(t->text, "}"))
3569                 break;          /* ... or a brace */
3570             t = t->next;
3571             paramlen[i]++;
3572         }
3573     }
3574
3575     /*
3576      * OK, we have a MMacro structure together with a set of
3577      * parameters. We must now go through the expansion and push
3578      * copies of each Line on to istk->expansion. Substitution of
3579      * parameter tokens and macro-local tokens doesn't get done
3580      * until the single-line macro substitution process; this is
3581      * because delaying them allows us to change the semantics
3582      * later through %rotate.
3583      *
3584      * First, push an end marker on to istk->expansion, mark this
3585      * macro as in progress, and set up its invocation-specific
3586      * variables.
3587      */
3588     ll = nasm_malloc(sizeof(Line));
3589     ll->next = istk->expansion;
3590     ll->finishes = m;
3591     ll->first = NULL;
3592     istk->expansion = ll;
3593
3594     m->in_progress = true;
3595     m->params = params;
3596     m->iline = tline;
3597     m->nparam = nparam;
3598     m->rotate = 0;
3599     m->paramlen = paramlen;
3600     m->unique = unique++;
3601     m->lineno = 0;
3602
3603     m->next_active = istk->mstk;
3604     istk->mstk = m;
3605
3606     for (l = m->expansion; l; l = l->next) {
3607         Token **tail;
3608
3609         ll = nasm_malloc(sizeof(Line));
3610         ll->finishes = NULL;
3611         ll->next = istk->expansion;
3612         istk->expansion = ll;
3613         tail = &ll->first;
3614
3615         for (t = l->first; t; t = t->next) {
3616             Token *x = t;
3617             if (t->type == TOK_PREPROC_ID &&
3618                 t->text[1] == '0' && t->text[2] == '0') {
3619                 dont_prepend = -1;
3620                 x = label;
3621                 if (!x)
3622                     continue;
3623             }
3624             tt = *tail = new_Token(NULL, x->type, x->text, 0);
3625             tail = &tt->next;
3626         }
3627         *tail = NULL;
3628     }
3629
3630     /*
3631      * If we had a label, push it on as the first line of
3632      * the macro expansion.
3633      */
3634     if (label) {
3635         if (dont_prepend < 0)
3636             free_tlist(startline);
3637         else {
3638             ll = nasm_malloc(sizeof(Line));
3639             ll->finishes = NULL;
3640             ll->next = istk->expansion;
3641             istk->expansion = ll;
3642             ll->first = startline;
3643             if (!dont_prepend) {
3644                 while (label->next)
3645                     label = label->next;
3646                 label->next = tt = new_Token(NULL, TOK_OTHER, ":", 0);
3647             }
3648         }
3649     }
3650
3651     list->uplevel(m->nolist ? LIST_MACRO_NOLIST : LIST_MACRO);
3652
3653     return 1;
3654 }
3655
3656 /*
3657  * Since preprocessor always operate only on the line that didn't
3658  * arrived yet, we should always use ERR_OFFBY1. Also since user
3659  * won't want to see same error twice (preprocessing is done once
3660  * per pass) we will want to show errors only during pass one.
3661  */
3662 static void error(int severity, const char *fmt, ...)
3663 {
3664     va_list arg;
3665     char buff[1024];
3666
3667     /* If we're in a dead branch of IF or something like it, ignore the error */
3668     if (istk && istk->conds && !emitting(istk->conds->state))
3669         return;
3670
3671     va_start(arg, fmt);
3672     vsnprintf(buff, sizeof(buff), fmt, arg);
3673     va_end(arg);
3674
3675     if (istk && istk->mstk && istk->mstk->name)
3676         _error(severity | ERR_PASS1, "(%s:%d) %s", istk->mstk->name,
3677                istk->mstk->lineno, buff);
3678     else
3679         _error(severity | ERR_PASS1, "%s", buff);
3680 }
3681
3682 static void
3683 pp_reset(char *file, int apass, efunc errfunc, evalfunc eval,
3684          ListGen * listgen)
3685 {
3686     _error = errfunc;
3687     cstk = NULL;
3688     istk = nasm_malloc(sizeof(Include));
3689     istk->next = NULL;
3690     istk->conds = NULL;
3691     istk->expansion = NULL;
3692     istk->mstk = NULL;
3693     istk->fp = fopen(file, "r");
3694     istk->fname = NULL;
3695     src_set_fname(nasm_strdup(file));
3696     src_set_linnum(0);
3697     istk->lineinc = 1;
3698     if (!istk->fp)
3699         error(ERR_FATAL | ERR_NOFILE, "unable to open input file `%s'",
3700               file);
3701     defining = NULL;
3702     init_macros();
3703     unique = 0;
3704     if (tasm_compatible_mode) {
3705         stdmacpos = stdmac;
3706     } else {
3707         stdmacpos = &stdmac[TASM_MACRO_COUNT];
3708     }
3709     any_extrastdmac = (extrastdmac != NULL);
3710     list = listgen;
3711     evaluate = eval;
3712     pass = apass;
3713 }
3714
3715 static char *pp_getline(void)
3716 {
3717     char *line;
3718     Token *tline;
3719
3720     while (1) {
3721         /*
3722          * Fetch a tokenized line, either from the macro-expansion
3723          * buffer or from the input file.
3724          */
3725         tline = NULL;
3726         while (istk->expansion && istk->expansion->finishes) {
3727             Line *l = istk->expansion;
3728             if (!l->finishes->name && l->finishes->in_progress > 1) {
3729                 Line *ll;
3730
3731                 /*
3732                  * This is a macro-end marker for a macro with no
3733                  * name, which means it's not really a macro at all
3734                  * but a %rep block, and the `in_progress' field is
3735                  * more than 1, meaning that we still need to
3736                  * repeat. (1 means the natural last repetition; 0
3737                  * means termination by %exitrep.) We have
3738                  * therefore expanded up to the %endrep, and must
3739                  * push the whole block on to the expansion buffer
3740                  * again. We don't bother to remove the macro-end
3741                  * marker: we'd only have to generate another one
3742                  * if we did.
3743                  */
3744                 l->finishes->in_progress--;
3745                 for (l = l->finishes->expansion; l; l = l->next) {
3746                     Token *t, *tt, **tail;
3747
3748                     ll = nasm_malloc(sizeof(Line));
3749                     ll->next = istk->expansion;
3750                     ll->finishes = NULL;
3751                     ll->first = NULL;
3752                     tail = &ll->first;
3753
3754                     for (t = l->first; t; t = t->next) {
3755                         if (t->text || t->type == TOK_WHITESPACE) {
3756                             tt = *tail =
3757                                 new_Token(NULL, t->type, t->text, 0);
3758                             tail = &tt->next;
3759                         }
3760                     }
3761
3762                     istk->expansion = ll;
3763                 }
3764             } else {
3765                 /*
3766                  * Check whether a `%rep' was started and not ended
3767                  * within this macro expansion. This can happen and
3768                  * should be detected. It's a fatal error because
3769                  * I'm too confused to work out how to recover
3770                  * sensibly from it.
3771                  */
3772                 if (defining) {
3773                     if (defining->name)
3774                         error(ERR_PANIC,
3775                               "defining with name in expansion");
3776                     else if (istk->mstk->name)
3777                         error(ERR_FATAL,
3778                               "`%%rep' without `%%endrep' within"
3779                               " expansion of macro `%s'",
3780                               istk->mstk->name);
3781                 }
3782
3783                 /*
3784                  * FIXME:  investigate the relationship at this point between
3785                  * istk->mstk and l->finishes
3786                  */
3787                 {
3788                     MMacro *m = istk->mstk;
3789                     istk->mstk = m->next_active;
3790                     if (m->name) {
3791                         /*
3792                          * This was a real macro call, not a %rep, and
3793                          * therefore the parameter information needs to
3794                          * be freed.
3795                          */
3796                         nasm_free(m->params);
3797                         free_tlist(m->iline);
3798                         nasm_free(m->paramlen);
3799                         l->finishes->in_progress = false;
3800                     } else
3801                         free_mmacro(m);
3802                 }
3803                 istk->expansion = l->next;
3804                 nasm_free(l);
3805                 list->downlevel(LIST_MACRO);
3806             }
3807         }
3808         while (1) {             /* until we get a line we can use */
3809
3810             if (istk->expansion) {      /* from a macro expansion */
3811                 char *p;
3812                 Line *l = istk->expansion;
3813                 if (istk->mstk)
3814                     istk->mstk->lineno++;
3815                 tline = l->first;
3816                 istk->expansion = l->next;
3817                 nasm_free(l);
3818                 p = detoken(tline, false);
3819                 list->line(LIST_MACRO, p);
3820                 nasm_free(p);
3821                 break;
3822             }
3823             line = read_line();
3824             if (line) {         /* from the current input file */
3825                 line = prepreproc(line);
3826                 tline = tokenize(line);
3827                 nasm_free(line);
3828                 break;
3829             }
3830             /*
3831              * The current file has ended; work down the istk
3832              */
3833             {
3834                 Include *i = istk;
3835                 fclose(i->fp);
3836                 if (i->conds)
3837                     error(ERR_FATAL,
3838                           "expected `%%endif' before end of file");
3839                 /* only set line and file name if there's a next node */
3840                 if (i->next) {
3841                     src_set_linnum(i->lineno);
3842                     nasm_free(src_set_fname(i->fname));
3843                 }
3844                 istk = i->next;
3845                 list->downlevel(LIST_INCLUDE);
3846                 nasm_free(i);
3847                 if (!istk)
3848                     return NULL;
3849             }
3850         }
3851
3852         /*
3853          * We must expand MMacro parameters and MMacro-local labels
3854          * _before_ we plunge into directive processing, to cope
3855          * with things like `%define something %1' such as STRUC
3856          * uses. Unless we're _defining_ a MMacro, in which case
3857          * those tokens should be left alone to go into the
3858          * definition; and unless we're in a non-emitting
3859          * condition, in which case we don't want to meddle with
3860          * anything.
3861          */
3862         if (!defining && !(istk->conds && !emitting(istk->conds->state)))
3863             tline = expand_mmac_params(tline);
3864
3865         /*
3866          * Check the line to see if it's a preprocessor directive.
3867          */
3868         if (do_directive(tline) == DIRECTIVE_FOUND) {
3869             continue;
3870         } else if (defining) {
3871             /*
3872              * We're defining a multi-line macro. We emit nothing
3873              * at all, and just
3874              * shove the tokenized line on to the macro definition.
3875              */
3876             Line *l = nasm_malloc(sizeof(Line));
3877             l->next = defining->expansion;
3878             l->first = tline;
3879             l->finishes = false;
3880             defining->expansion = l;
3881             continue;
3882         } else if (istk->conds && !emitting(istk->conds->state)) {
3883             /*
3884              * We're in a non-emitting branch of a condition block.
3885              * Emit nothing at all, not even a blank line: when we
3886              * emerge from the condition we'll give a line-number
3887              * directive so we keep our place correctly.
3888              */
3889             free_tlist(tline);
3890             continue;
3891         } else if (istk->mstk && !istk->mstk->in_progress) {
3892             /*
3893              * We're in a %rep block which has been terminated, so
3894              * we're walking through to the %endrep without
3895              * emitting anything. Emit nothing at all, not even a
3896              * blank line: when we emerge from the %rep block we'll
3897              * give a line-number directive so we keep our place
3898              * correctly.
3899              */
3900             free_tlist(tline);
3901             continue;
3902         } else {
3903             tline = expand_smacro(tline);
3904             if (!expand_mmacro(tline)) {
3905                 /*
3906                  * De-tokenize the line again, and emit it.
3907                  */
3908                 line = detoken(tline, true);
3909                 free_tlist(tline);
3910                 break;
3911             } else {
3912                 continue;       /* expand_mmacro calls free_tlist */
3913             }
3914         }
3915     }
3916
3917     return line;
3918 }
3919
3920 static void pp_cleanup(int pass)
3921 {
3922     if (defining) {
3923         error(ERR_NONFATAL, "end of file while still defining macro `%s'",
3924               defining->name);
3925         free_mmacro(defining);
3926     }
3927     while (cstk)
3928         ctx_pop();
3929     free_macros();
3930     while (istk) {
3931         Include *i = istk;
3932         istk = istk->next;
3933         fclose(i->fp);
3934         nasm_free(i->fname);
3935         nasm_free(i);
3936     }
3937     while (cstk)
3938         ctx_pop();
3939     if (pass == 0) {
3940         free_llist(predef);
3941         delete_Blocks();
3942     }
3943 }
3944
3945 void pp_include_path(char *path)
3946 {
3947     IncPath *i;
3948
3949     i = nasm_malloc(sizeof(IncPath));
3950     i->path = path ? nasm_strdup(path) : NULL;
3951     i->next = NULL;
3952
3953     if (ipath != NULL) {
3954         IncPath *j = ipath;
3955         while (j->next != NULL)
3956             j = j->next;
3957         j->next = i;
3958     } else {
3959         ipath = i;
3960     }
3961 }
3962
3963 /*
3964  * added by alexfru:
3965  *
3966  * This function is used to "export" the include paths, e.g.
3967  * the paths specified in the '-I' command switch.
3968  * The need for such exporting is due to the 'incbin' directive,
3969  * which includes raw binary files (unlike '%include', which
3970  * includes text source files). It would be real nice to be
3971  * able to specify paths to search for incbin'ned files also.
3972  * So, this is a simple workaround.
3973  *
3974  * The function use is simple:
3975  *
3976  * The 1st call (with NULL argument) returns a pointer to the 1st path
3977  * (char** type) or NULL if none include paths available.
3978  *
3979  * All subsequent calls take as argument the value returned by this
3980  * function last. The return value is either the next path
3981  * (char** type) or NULL if the end of the paths list is reached.
3982  *
3983  * It is maybe not the best way to do things, but I didn't want
3984  * to export too much, just one or two functions and no types or
3985  * variables exported.
3986  *
3987  * Can't say I like the current situation with e.g. this path list either,
3988  * it seems to be never deallocated after creation...
3989  */
3990 char **pp_get_include_path_ptr(char **pPrevPath)
3991 {
3992 /*   This macro returns offset of a member of a structure */
3993 #define GetMemberOffset(StructType,MemberName)\
3994   ((size_t)&((StructType*)0)->MemberName)
3995     IncPath *i;
3996
3997     if (pPrevPath == NULL) {
3998         if (ipath != NULL)
3999             return &ipath->path;
4000         else
4001             return NULL;
4002     }
4003     i = (IncPath *) ((char *)pPrevPath - GetMemberOffset(IncPath, path));
4004     i = i->next;
4005     if (i != NULL)
4006         return &i->path;
4007     else
4008         return NULL;
4009 #undef GetMemberOffset
4010 }
4011
4012 void pp_pre_include(char *fname)
4013 {
4014     Token *inc, *space, *name;
4015     Line *l;
4016
4017     name = new_Token(NULL, TOK_INTERNAL_STRING, fname, 0);
4018     space = new_Token(name, TOK_WHITESPACE, NULL, 0);
4019     inc = new_Token(space, TOK_PREPROC_ID, "%include", 0);
4020
4021     l = nasm_malloc(sizeof(Line));
4022     l->next = predef;
4023     l->first = inc;
4024     l->finishes = false;
4025     predef = l;
4026 }
4027
4028 void pp_pre_define(char *definition)
4029 {
4030     Token *def, *space;
4031     Line *l;
4032     char *equals;
4033
4034     equals = strchr(definition, '=');
4035     space = new_Token(NULL, TOK_WHITESPACE, NULL, 0);
4036     def = new_Token(space, TOK_PREPROC_ID, "%define", 0);
4037     if (equals)
4038         *equals = ' ';
4039     space->next = tokenize(definition);
4040     if (equals)
4041         *equals = '=';
4042
4043     l = nasm_malloc(sizeof(Line));
4044     l->next = predef;
4045     l->first = def;
4046     l->finishes = false;
4047     predef = l;
4048 }
4049
4050 void pp_pre_undefine(char *definition)
4051 {
4052     Token *def, *space;
4053     Line *l;
4054
4055     space = new_Token(NULL, TOK_WHITESPACE, NULL, 0);
4056     def = new_Token(space, TOK_PREPROC_ID, "%undef", 0);
4057     space->next = tokenize(definition);
4058
4059     l = nasm_malloc(sizeof(Line));
4060     l->next = predef;
4061     l->first = def;
4062     l->finishes = false;
4063     predef = l;
4064 }
4065
4066 /*
4067  * Added by Keith Kanios:
4068  *
4069  * This function is used to assist with "runtime" preprocessor
4070  * directives. (e.g. pp_runtime("%define __BITS__ 64");)
4071  *
4072  * ERRORS ARE IGNORED HERE, SO MAKE COMPLETELY SURE THAT YOU
4073  * PASS A VALID STRING TO THIS FUNCTION!!!!!
4074  */
4075
4076 void pp_runtime(char *definition)
4077 {
4078     Token *def;
4079
4080     def = tokenize(definition);
4081     if(do_directive(def) == NO_DIRECTIVE_FOUND)
4082         free_tlist(def);
4083
4084 }
4085
4086 void pp_extra_stdmac(const char **macros)
4087 {
4088     extrastdmac = macros;
4089 }
4090
4091 static void make_tok_num(Token * tok, int64_t val)
4092 {
4093     char numbuf[20];
4094     snprintf(numbuf, sizeof(numbuf), "%"PRId64"", val);
4095     tok->text = nasm_strdup(numbuf);
4096     tok->type = TOK_NUMBER;
4097 }
4098
/*
 * The preprocessor's exported interface: the reset, get-line and
 * cleanup entry points defined in this file, given positionally.
 * NOTE(review): assumes the members of Preproc are declared in this
 * same order; confirm against its declaration.
 */
Preproc nasmpp = {
    pp_reset,                   /* start a pass over an input file */
    pp_getline,                 /* fetch the next preprocessed line */
    pp_cleanup                  /* release state at the end of a pass */
};