preproc.c

   1 /* preproc.c   macro preprocessor for the Netwide Assembler
   2  *
   3  * The Netwide Assembler is copyright (C) 1996 Simon Tatham and
   4  * Julian Hall. All rights reserved. The software is
   5  * redistributable under the license given in the file "LICENSE"
   6  * distributed in the NASM archive.
   7  *
   8  * initial version 18/iii/97 by Simon Tatham
   9  */
  10
  11 /* Typical flow of text through preproc
  12  *
  13  * pp_getline gets tokenized lines, either
  14  *
  15  *   from a macro expansion
  16  *
  17  * or
  18  *   {
  19  *   read_line  gets raw text from stdmacpos, or predef, or current input file
  20  *   tokenize   converts to tokens
  21  *   }
  22  *
  23  * expand_mmac_params is used to expand %1 etc., unless a macro is being
  24  * defined or a false conditional is being processed
   25  * (%0, %1, %+1, %-1, %%foo)
  26  *
  27  * do_directive checks for directives
  28  *
  29  * expand_smacro is used to expand single line macros
  30  *
  31  * expand_mmacro is used to expand multi-line macros
  32  *
  33  * detoken is used to convert the line back to text
  34  */
  35
  36 #include "compiler.h"
  37
  38 #include <stdio.h>
  39 #include <stdarg.h>
  40 #include <stdlib.h>
  41 #include <stddef.h>
  42 #include <string.h>
  43 #include <ctype.h>
  44 #include <limits.h>
  45 #include <inttypes.h>
  46
  47 #include "nasm.h"
  48 #include "nasmlib.h"
  49 #include "preproc.h"
  50 #include "hashtbl.h"
  51 #include "quote.h"
  52 #include "stdscan.h"
  53 #include "tokens.h"
  54 #include "tables.h"
  55
/*
 * Short names for the structure types used throughout this file.
 * They are declared up front so that the structure definitions
 * below can hold pointers to one another.
 */
typedef struct SMacro SMacro;
typedef struct MMacro MMacro;
typedef struct Context Context;
typedef struct Token Token;
typedef struct Blocks Blocks;
typedef struct Line Line;
typedef struct Include Include;
typedef struct Cond Cond;
typedef struct IncPath IncPath;
  65
  66 /*
  67  * Note on the storage of both SMacro and MMacros: the hash table
  68  * indexes them case-insensitively, and we then have to go through a
  69  * linked list of potential case aliases (and, for MMacros, parameter
  70  * ranges); this is to preserve the matching semantics of the earlier
  71  * code.  If the number of case aliases for a specific macro is a
  72  * performance issue, you may want to reconsider your coding style.
  73  */
  74
/*
 * Store the definition of a single-line macro.
 *
 * Entries that share a hash key are chained through `next';
 * free_smacro_table() walks that chain and releases `name',
 * `expansion' and the structure itself.
 */
struct SMacro {
    SMacro *next;               /* next macro chained under the same hash key */
    char *name;                 /* macro name; released with nasm_free() */
    bool casesense;             /* NOTE(review): presumably "name is matched case-sensitively" -- confirm */
    bool in_progress;           /* NOTE(review): presumably set while the macro is being expanded -- confirm */
    unsigned int nparam;        /* parameter count */
    Token *expansion;           /* token list making up the body; released with free_tlist() */
};
  86
/*
 * Store the definition of a multi-line macro. This is also used to
 * store the interiors of `%rep...%endrep' blocks, which are
 * effectively self-re-invoking multi-line macros which simply
 * don't have a name or bother to appear in the hash tables. %rep
 * blocks are signified by having a NULL `name' field.
 *
 * In a MMacro describing a `%rep' block, the `in_progress' field
 * isn't merely boolean, but gives the number of repeats left to
 * run.
 *
 * The `next' field is used for storing MMacros in hash tables; the
 * `next_active' field is for stacking them on istk entries.
 *
 * When a MMacro is being expanded, `params', `iline', `nparam',
 * `paramlen', `rotate' and `unique' are local to the invocation.
 *
 * free_mmacro() releases `name', `dlist', `defaults', `expansion'
 * and the structure itself; it does not touch the per-invocation
 * fields.
 */
struct MMacro {
    MMacro *next;               /* hash-table chain link */
    char *name;                 /* macro name, or NULL for a %rep block */
    int nparam_min, nparam_max; /* NOTE(review): presumably the accepted parameter-count range -- confirm */
    bool casesense;             /* NOTE(review): presumably "name is matched case-sensitively" -- confirm */
    bool plus;                   /* is the last parameter greedy? */
    bool nolist;                 /* is this macro listing-inhibited? */
    int64_t in_progress;        /* for %rep: repeats left to run (see above) */
    Token *dlist;               /* All defaults as one list */
    Token **defaults;           /* Parameter default pointers */
    int ndefs;                  /* number of default parameters */
    Line *expansion;            /* body lines, pushed so the list is in reverse order */

    MMacro *next_active;        /* link used when stacked on an istk entry */
    MMacro *rep_nest;           /* used for nesting %rep */
    Token **params;             /* actual parameters */
    Token *iline;               /* invocation line */
    unsigned int nparam, rotate;        /* per-invocation (see above) */
    int *paramlen;              /* per-invocation (see above) */
    uint64_t unique;            /* per-invocation (see above) */
    int lineno;                 /* Current line number on expansion */
};
 126
/*
 * The context stack is composed of a linked list of these.
 * ctx_pop() unlinks the top entry and releases `localmac' (as a
 * single-line macro table) and `name'.
 */
struct Context {
    Context *next;              /* next entry down the context stack */
    char *name;                 /* context name; released with nasm_free() */
    struct hash_table localmac; /* single-line macros belonging to this context */
    uint32_t number;            /* NOTE(review): presumably a per-context identifier -- confirm */
};
 136
/*
 * This is the internal form which we break input lines up into.
 * Typically stored in linked lists.
 *
 * Note that `type' serves a double meaning: TOK_SMAC_PARAM is not
 * necessarily used as-is, but is intended to denote the number of
 * the substituted parameter. So in the definition
 *
 *     %define a(x,y) ( (x) & ~(y) )
 *
 * the token representing `x' will have its type changed to
 * TOK_SMAC_PARAM, but the one representing `y' will be
 * TOK_SMAC_PARAM+1.
 *
 * TOK_INTERNAL_STRING is a dirty hack: it's a single string token
 * which doesn't need quotes around it. Used in the pre-include
 * mechanism as an alternative to trying to find a sensible type of
 * quote to use on the filename we were passed.
 *
 * tokenize() produces TOK_PREPROC_Q for `%?' and TOK_PREPROC_QQ
 * for `%??'; it never emits TOK_COMMENT tokens (comments are
 * dropped from the list).
 */
enum pp_token_type {
    TOK_NONE = 0, TOK_WHITESPACE, TOK_COMMENT, TOK_ID,
    TOK_PREPROC_ID, TOK_STRING,
    TOK_NUMBER, TOK_FLOAT, TOK_SMAC_END, TOK_OTHER,
    TOK_INTERNAL_STRING,
    TOK_PREPROC_Q, TOK_PREPROC_QQ,
    TOK_SMAC_PARAM,             /* MUST BE LAST IN THE LIST!!! */
    TOK_MAX = INT_MAX           /* Keep compiler from reducing the range */
};
 165
/*
 * One lexical token of a source line; tokens of a line are chained
 * through `next'.
 */
struct Token {
    Token *next;                /* following token on the line, or NULL */
    char *text;                 /* token text */
    union {
        SMacro *mac;            /* associated macro for TOK_SMAC_END */
        size_t len;             /* scratch length field */
    } a;                        /* Auxiliary data */
    enum pp_token_type type;    /* token class (may be TOK_SMAC_PARAM + n) */
};
 175
/*
 * Multi-line macro definitions are stored as a linked list of
 * these, which is essentially a container to allow several linked
 * lists of Tokens.
 *
 * Note that in this module, linked lists are treated as stacks
 * wherever possible. For this reason, Lines are _pushed_ on to the
 * `expansion' field in MMacro structures, so that the linked list,
 * if walked, would give the macro lines in reverse order; this
 * means that we can walk the list when expanding a macro, and thus
 * push the lines on to the `expansion' field in _istk_ in reverse
 * order (so that when popped back off they are in the right
 * order). It may seem cockeyed, and it relies on my design having
 * an even number of steps in, but it works...
 *
 * Some of these structures, rather than being actual lines, are
 * markers delimiting the end of the expansion of a given macro.
 * This is for use in the cycle-tracking and %rep-handling code.
 * Such structures have `finishes' non-NULL, and `first' NULL. All
 * others have `finishes' NULL, but `first' may still be NULL if
 * the line is blank.
 */
struct Line {
    Line *next;                 /* next line in the (stack-like) list */
    MMacro *finishes;           /* non-NULL only for end-of-expansion markers */
    Token *first;               /* first token of the line; NULL if blank or a marker */
};
 203
/*
 * To handle an arbitrary level of file inclusion, we maintain a
 * stack (ie linked list) of these things.
 */
struct Include {
    Include *next;              /* next entry down the inclusion stack */
    FILE *fp;                   /* stream read_line() fetches raw lines from */
    Cond *conds;                /* conditional-assembly stack for this inclusion level */
    Line *expansion;            /* lines waiting to be processed (read_line() pushes predefs here) */
    char *fname;                /* NOTE(review): presumably the file name for this level -- confirm */
    int lineno, lineinc;        /* lineinc is added to the line number per physical line read */
    MMacro *mstk;               /* stack of active macros/reps */
};
 217
/*
 * Include search path. This is simply a list of strings which get
 * prepended, in turn, to the name of an include file, in an
 * attempt to find the file if it's not in the current directory.
 */
struct IncPath {
    IncPath *next;              /* next search-path entry */
    char *path;                 /* prefix prepended to the include file name */
};
 227
/*
 * Conditional assembly: we maintain a separate stack of these for
 * each level of file inclusion. (The only reason we keep the
 * stacks separate is to ensure that a stray `%endif' in a file
 * included from within the true branch of a `%if' won't terminate
 * it and cause confusion: instead, rightly, it'll cause an error.)
 */
struct Cond {
    Cond *next;                 /* enclosing conditional, next entry down the stack */
    int state;                  /* NOTE(review): presumably one of the COND_* states defined next -- confirm */
};
/*
 * States of a conditional-assembly construct. Only the two *_TRUE
 * states count as emitting (see the emitting() macro after this enum).
 */
enum {
    /*
     * These states are for use just after %if or %elif: IF_TRUE
     * means the condition has evaluated to truth so we are
     * currently emitting, whereas IF_FALSE means we are not
     * currently emitting but will start doing so if a %else comes
     * up. In these states, all directives are admissible: %elif,
     * %else and %endif. (And of course %if.)
     */
    COND_IF_TRUE, COND_IF_FALSE,
    /*
     * These states come up after a %else: ELSE_TRUE means we're
     * emitting, and ELSE_FALSE means we're not. In ELSE_* states,
     * any %elif or %else will cause an error.
     */
    COND_ELSE_TRUE, COND_ELSE_FALSE,
    /*
     * These states mean that we're not emitting now, and also that
     * nothing until %endif will be emitted at all. COND_DONE is
     * used when we've had our moment of emission
     * and have now started seeing %elifs. COND_NEVER is used when
     * the condition construct in question is contained within a
     * non-emitting branch of a larger condition construct,
     * or if there is an error.
     */
    COND_DONE, COND_NEVER
};
/* True when state x is one in which lines are emitted. Evaluates x twice. */
#define emitting(x) ( (x) == COND_IF_TRUE || (x) == COND_ELSE_TRUE )
 267
/*
 * These defines are used as the possible return values for do_directive
 */
#define NO_DIRECTIVE_FOUND  0   /* NOTE(review): presumably "line was not a directive" -- confirm in do_directive */
#define DIRECTIVE_FOUND     1   /* NOTE(review): presumably "line was handled as a directive" -- confirm in do_directive */
 273
 274 /*
 275  * Condition codes. Note that we use c_ prefix not C_ because C_ is
 276  * used in nasm.h for the "real" condition codes. At _this_ level,
 277  * we treat CXZ and ECXZ as condition codes, albeit non-invertible
 278  * ones, so we need a different enum...
 279  */
 280 static const char * const conditions[] = {
 281     "a", "ae", "b", "be", "c", "cxz", "e", "ecxz", "g", "ge", "l", "le",
 282     "na", "nae", "nb", "nbe", "nc", "ne", "ng", "nge", "nl", "nle", "no",
 283     "np", "ns", "nz", "o", "p", "pe", "po", "rcxz", "s", "z"
 284 };
 285 enum pp_conds {
 286     c_A, c_AE, c_B, c_BE, c_C, c_CXZ, c_E, c_ECXZ, c_G, c_GE, c_L, c_LE,
 287     c_NA, c_NAE, c_NB, c_NBE, c_NC, c_NE, c_NG, c_NGE, c_NL, c_NLE, c_NO,
 288     c_NP, c_NS, c_NZ, c_O, c_P, c_PE, c_PO, c_RCXZ, c_S, c_Z,
 289     c_none = -1
 290 };
 291 static const enum pp_conds inverse_ccs[] = {
 292     c_NA, c_NAE, c_NB, c_NBE, c_NC, -1, c_NE, -1, c_NG, c_NGE, c_NL, c_NLE,
 293     c_A, c_AE, c_B, c_BE, c_C, c_E, c_G, c_GE, c_L, c_LE, c_O, c_P, c_S,
 294     c_Z, c_NO, c_NP, c_PO, c_PE, -1, c_NS, c_NZ
 295 };
 296
 297 /*
 298  * Directive names.
 299  */
 300 /* If this is a an IF, ELIF, ELSE or ENDIF keyword */
 301 static int is_condition(enum preproc_token arg)
 302 {
 303     return PP_IS_COND(arg) || (arg == PP_ELSE) || (arg == PP_ENDIF);
 304 }
 305
 306 /* For TASM compatibility we need to be able to recognise TASM compatible
 307  * conditional compilation directives. Using the NASM pre-processor does
 308  * not work, so we look for them specifically from the following list and
 309  * then jam in the equivalent NASM directive into the input stream.
 310  */
 311
 312 enum {
 313     TM_ARG, TM_ELIF, TM_ELSE, TM_ENDIF, TM_IF, TM_IFDEF, TM_IFDIFI,
 314     TM_IFNDEF, TM_INCLUDE, TM_LOCAL
 315 };
 316
 317 static const char * const tasm_directives[] = {
 318     "arg", "elif", "else", "endif", "if", "ifdef", "ifdifi",
 319     "ifndef", "include", "local"
 320 };
 321
/*
 * NOTE(review): the next four look like the stack-frame parameters
 * used by the TASM-style `arg'/`local' support (32-bit defaults) --
 * confirm against the directives that read them.
 */
static int StackSize = 4;
static char *StackPointer = "ebp";
static int ArgOffset = 8;
static int LocalOffset = 0;

static Context *cstk;           /* top of the context stack (popped by ctx_pop) */
static Include *istk;           /* top of the include stack (read_line reads istk->fp) */
static IncPath *ipath = NULL;   /* head of the include search path list */

static efunc _error;            /* Pointer to client-provided error reporting function */
static evalfunc evaluate;       /* NOTE(review): presumably the client-provided expression evaluator -- confirm */

static int pass;                /* HACK: pass 0 = generate dependencies only */
static StrList **dephead, **deptail; /* Dependency list */

static uint64_t unique;    /* unique identifier numbers */

static Line *predef = NULL;     /* pre-define/pre-include lines pushed by read_line() */
static bool do_predef;          /* true until read_line() has pushed `predef' */

static ListGen *list;           /* listing generator; read_line() reports each line to it */

/*
 * The current set of multi-line macros we have defined.
 */
static struct hash_table mmacros;

/*
 * The current set of single-line macros we have defined.
 */
static struct hash_table smacros;

/*
 * The multi-line macro we are currently defining, or the %rep
 * block we are currently reading, if any.
 */
static MMacro *defining;

/* NOTE(review): presumably nesting-depth counters for %macro and %rep -- confirm */
static uint64_t nested_mac_count;
static uint64_t nested_rep_count;

/*
 * The number of macro parameters to allocate space for at a time.
 */
#define PARAM_DELTA 16

/*
 * The standard macro set: defined in macros.c in the array nasm_stdmac.
 * This gives our position in the macro set, when we're processing it.
 * read_line() sets it to NULL once the set has been exhausted.
 */
static macros_t *stdmacpos;

/*
 * The extra standard macros that come from the object format, if
 * any. read_line() switches to them after the standard set when
 * any_extrastdmac is true, and then clears that flag.
 */
static macros_t *extrastdmac = NULL;
static bool any_extrastdmac;
 380
/*
 * Tokens are allocated in blocks to improve speed
 */
#define TOKEN_BLOCKSIZE 4096
static Token *freeTokens = NULL;        /* NOTE(review): presumably the list of recycled Tokens -- confirm */
/* One node in the list of allocated memory chunks. */
struct Blocks {
    Blocks *next;               /* next node in the list */
    void *chunk;                /* the memory chunk this node tracks */
};

/* Statically allocated first node of the chunk list; starts out empty. */
static Blocks blocks = { NULL, NULL };
 392
/*
 * Forward declarations.
 *
 * All of these are file-local (static) and are used before their
 * definitions appear.
 */
/* Expansion passes (see the flow description at the top of the file). */
static Token *expand_mmac_params(Token * tline);
static Token *expand_smacro(Token * tline);
static Token *expand_id(Token * tline);
static Context *get_ctx(const char *name, bool all_contexts);
static void make_tok_num(Token * tok, int64_t val);
/* printf-style diagnostics. */
static void error(int severity, const char *fmt, ...);
static void error_precond(int severity, const char *fmt, ...);
/* Block and token allocation. */
static void *new_Block(size_t size);
static void delete_Blocks(void);
static Token *new_Token(Token * next, enum pp_token_type type,
                        const char *text, int txtlen);
/* The return value is used by free_tlist() as the next token to delete. */
static Token *delete_Token(Token * t);
 408
 409 /*
 410  * Macros for safe checking of token pointers, avoid *(NULL)
 411  */
 412 #define tok_type_(x,t) ((x) && (x)->type == (t))
 413 #define skip_white_(x) if (tok_type_((x), TOK_WHITESPACE)) (x)=(x)->next
 414 #define tok_is_(x,v) (tok_type_((x), TOK_OTHER) && !strcmp((x)->text,(v)))
 415 #define tok_isnt_(x,v) ((x) && ((x)->type!=TOK_OTHER || strcmp((x)->text,(v))))
 416
 417 /* Handle TASM specific directives, which do not contain a % in
 418  * front of them. We do it here because I could not find any other
 419  * place to do it for the moment, and it is a hack (ideally it would
 420  * be nice to be able to use the NASM pre-processor to do it).
 421  */
 422 static char *check_tasm_directive(char *line)
 423 {
 424     int32_t i, j, k, m, len;
 425     char *p = line, *oldline, oldchar;
 426
 427     /* Skip whitespace */
 428     while (nasm_isspace(*p) && *p != 0)
 429         p++;
 430
 431     /* Binary search for the directive name */
 432     i = -1;
 433     j = elements(tasm_directives);
 434     len = 0;
 435     while (!nasm_isspace(p[len]) && p[len] != 0)
 436         len++;
 437     if (len) {
 438         oldchar = p[len];
 439         p[len] = 0;
 440         while (j - i > 1) {
 441             k = (j + i) / 2;
 442             m = nasm_stricmp(p, tasm_directives[k]);
 443             if (m == 0) {
 444                 /* We have found a directive, so jam a % in front of it
 445                  * so that NASM will then recognise it as one if it's own.
 446                  */
 447                 p[len] = oldchar;
 448                 len = strlen(p);
 449                 oldline = line;
 450                 line = nasm_malloc(len + 2);
 451                 line[0] = '%';
 452                 if (k == TM_IFDIFI) {
 453                     /* NASM does not recognise IFDIFI, so we convert it to
 454                      * %ifdef BOGUS. This is not used in NASM comaptible
 455                      * code, but does need to parse for the TASM macro
 456                      * package.
 457                      */
 458                     strcpy(line + 1, "ifdef BOGUS");
 459                 } else {
 460                     memcpy(line + 1, p, len + 1);
 461                 }
 462                 nasm_free(oldline);
 463                 return line;
 464             } else if (m < 0) {
 465                 j = k;
 466             } else
 467                 i = k;
 468         }
 469         p[len] = oldchar;
 470     }
 471     return line;
 472 }
 473
 474 /*
 475  * The pre-preprocessing stage... This function translates line
 476  * number indications as they emerge from GNU cpp (`# lineno "file"
 477  * flags') into NASM preprocessor line number indications (`%line
 478  * lineno file').
 479  */
 480 static char *prepreproc(char *line)
 481 {
 482     int lineno, fnlen;
 483     char *fname, *oldline;
 484
 485     if (line[0] == '#' && line[1] == ' ') {
 486         oldline = line;
 487         fname = oldline + 2;
 488         lineno = atoi(fname);
 489         fname += strspn(fname, "0123456789 ");
 490         if (*fname == '"')
 491             fname++;
 492         fnlen = strcspn(fname, "\"");
 493         line = nasm_malloc(20 + fnlen);
 494         snprintf(line, 20 + fnlen, "%%line %d %.*s", lineno, fnlen, fname);
 495         nasm_free(oldline);
 496     }
 497     if (tasm_compatible_mode)
 498         return check_tasm_directive(line);
 499     return line;
 500 }
 501
 502 /*
 503  * Free a linked list of tokens.
 504  */
 505 static void free_tlist(Token * list)
 506 {
 507     while (list) {
 508         list = delete_Token(list);
 509     }
 510 }
 511
 512 /*
 513  * Free a linked list of lines.
 514  */
 515 static void free_llist(Line * list)
 516 {
 517     Line *l;
 518     while (list) {
 519         l = list;
 520         list = list->next;
 521         free_tlist(l->first);
 522         nasm_free(l);
 523     }
 524 }
 525
/*
 * Free an MMacro
 *
 * Releases the definition data (name, default-parameter tokens and
 * pointer array, body lines) and then the structure itself. The
 * per-invocation fields (`params', `iline', `paramlen') are not
 * touched here.
 */
static void free_mmacro(MMacro * m)
{
    nasm_free(m->name);
    free_tlist(m->dlist);       /* the default-parameter tokens */
    nasm_free(m->defaults);     /* only the pointer array */
    free_llist(m->expansion);
    nasm_free(m);
}
 537
 538 /*
 539  * Free all currently defined macros, and free the hash tables
 540  */
 541 static void free_smacro_table(struct hash_table *smt)
 542 {
 543     SMacro *s;
 544     const char *key;
 545     struct hash_tbl_node *it = NULL;
 546
 547     while ((s = hash_iterate(smt, &it, &key)) != NULL) {
 548         nasm_free((void *)key);
 549         while (s) {
 550             SMacro *ns = s->next;
 551             nasm_free(s->name);
 552             free_tlist(s->expansion);
 553             nasm_free(s);
 554             s = ns;
 555         }
 556     }
 557     hash_free(smt);
 558 }
 559
 560 static void free_mmacro_table(struct hash_table *mmt)
 561 {
 562     MMacro *m;
 563     const char *key;
 564     struct hash_tbl_node *it = NULL;
 565
 566     it = NULL;
 567     while ((m = hash_iterate(mmt, &it, &key)) != NULL) {
 568         nasm_free((void *)key);
 569         while (m) {
 570             MMacro *nm = m->next;
 571             free_mmacro(m);
 572             m = nm;
 573         }
 574     }
 575     hash_free(mmt);
 576 }
 577
/*
 * Free all currently defined global macros (single-line, then
 * multi-line) together with their hash tables.
 */
static void free_macros(void)
{
    free_smacro_table(&smacros);
    free_mmacro_table(&mmacros);
}
 583
/*
 * Initialize the hash tables
 *
 * Both global macro tables (`smacros' and `mmacros') are set up
 * with the HASH_LARGE size hint.
 */
static void init_macros(void)
{
    hash_init(&smacros, HASH_LARGE);
    hash_init(&mmacros, HASH_LARGE);
}
 592
 593 /*
 594  * Pop the context stack.
 595  */
 596 static void ctx_pop(void)
 597 {
 598     Context *c = cstk;
 599
 600     cstk = cstk->next;
 601     free_smacro_table(&c->localmac);
 602     nasm_free(c->name);
 603     nasm_free(c);
 604 }
 605
 606 /*
 607  * Search for a key in the hash index; adding it if necessary
 608  * (in which case we initialize the data pointer to NULL.)
 609  */
 610 static void **
 611 hash_findi_add(struct hash_table *hash, const char *str)
 612 {
 613     struct hash_insert hi;
 614     void **r;
 615     char *strx;
 616
 617     r = hash_findi(hash, str, &hi);
 618     if (r)
 619         return r;
 620
 621     strx = nasm_strdup(str);    /* Use a more efficient allocator here? */
 622     return hash_add(&hi, strx, NULL);
 623 }
 624
 625 /*
 626  * Like hash_findi, but returns the data element rather than a pointer
 627  * to it.  Used only when not adding a new element, hence no third
 628  * argument.
 629  */
 630 static void *
 631 hash_findix(struct hash_table *hash, const char *str)
 632 {
 633     void **p;
 634
 635     p = hash_findi(hash, str, NULL);
 636     return p ? *p : NULL;
 637 }
 638
 639 #define BUF_DELTA 512
 640 /*
 641  * Read a line from the top file in istk, handling multiple CR/LFs
 642  * at the end of the line read, and handling spurious ^Zs. Will
 643  * return lines from the standard macro set if this has not already
 644  * been done.
 645  */
 646 static char *read_line(void)
 647 {
 648     char *buffer, *p, *q;
 649     int bufsize, continued_count;
 650
 651     if (stdmacpos) {
 652         unsigned char c;
 653         const unsigned char *p = stdmacpos;
 654         char *ret, *q;
 655         size_t len = 0;
 656         while ((c = *p++)) {
 657             if (c >= 0x80)
 658                 len += pp_directives_len[c-0x80]+1;
 659             else
 660                 len++;
 661         }
 662         ret = nasm_malloc(len+1);
 663         q = ret;
 664         while ((c = *stdmacpos++)) {
 665             if (c >= 0x80) {
 666                 memcpy(q, pp_directives[c-0x80], pp_directives_len[c-0x80]);
 667                 q += pp_directives_len[c-0x80];
 668                 *q++ = ' ';
 669             } else {
 670                 *q++ = c;
 671             }
 672         }
 673         stdmacpos = p;
 674         *q = '\0';
 675
 676         if (!*stdmacpos) {
 677             /* This was the last of the standard macro chain... */
 678             stdmacpos = NULL;
 679             if (any_extrastdmac) {
 680                 stdmacpos = extrastdmac;
 681                 any_extrastdmac = false;
 682             } else if (do_predef) {
 683                 Line *pd, *l;
 684                 Token *head, **tail, *t;
 685
 686                 /*
 687                  * Nasty hack: here we push the contents of
 688                  * `predef' on to the top-level expansion stack,
 689                  * since this is the most convenient way to
 690                  * implement the pre-include and pre-define
 691                  * features.
 692                  */
 693                 for (pd = predef; pd; pd = pd->next) {
 694                     head = NULL;
 695                     tail = &head;
 696                     for (t = pd->first; t; t = t->next) {
 697                         *tail = new_Token(NULL, t->type, t->text, 0);
 698                         tail = &(*tail)->next;
 699                     }
 700                     l = nasm_malloc(sizeof(Line));
 701                     l->next = istk->expansion;
 702                     l->first = head;
 703                     l->finishes = NULL;
 704                     istk->expansion = l;
 705                 }
 706                 do_predef = false;
 707             }
 708         }
 709         return ret;
 710     }
 711
 712     bufsize = BUF_DELTA;
 713     buffer = nasm_malloc(BUF_DELTA);
 714     p = buffer;
 715     continued_count = 0;
 716     while (1) {
 717         q = fgets(p, bufsize - (p - buffer), istk->fp);
 718         if (!q)
 719             break;
 720         p += strlen(p);
 721         if (p > buffer && p[-1] == '\n') {
 722             /* Convert backslash-CRLF line continuation sequences into
 723                nothing at all (for DOS and Windows) */
 724             if (((p - 2) > buffer) && (p[-3] == '\\') && (p[-2] == '\r')) {
 725                 p -= 3;
 726                 *p = 0;
 727                 continued_count++;
 728             }
 729             /* Also convert backslash-LF line continuation sequences into
 730                nothing at all (for Unix) */
 731             else if (((p - 1) > buffer) && (p[-2] == '\\')) {
 732                 p -= 2;
 733                 *p = 0;
 734                 continued_count++;
 735             } else {
 736                 break;
 737             }
 738         }
 739         if (p - buffer > bufsize - 10) {
 740             int32_t offset = p - buffer;
 741             bufsize += BUF_DELTA;
 742             buffer = nasm_realloc(buffer, bufsize);
 743             p = buffer + offset;        /* prevent stale-pointer problems */
 744         }
 745     }
 746
 747     if (!q && p == buffer) {
 748         nasm_free(buffer);
 749         return NULL;
 750     }
 751
 752     src_set_linnum(src_get_linnum() + istk->lineinc +
 753                    (continued_count * istk->lineinc));
 754
 755     /*
 756      * Play safe: remove CRs as well as LFs, if any of either are
 757      * present at the end of the line.
 758      */
 759     while (--p >= buffer && (*p == '\n' || *p == '\r'))
 760         *p = '\0';
 761
 762     /*
 763      * Handle spurious ^Z, which may be inserted into source files
 764      * by some file transfer utilities.
 765      */
 766     buffer[strcspn(buffer, "\032")] = '\0';
 767
 768     list->line(LIST_READ, buffer);
 769
 770     return buffer;
 771 }
 772
/*
 * Tokenize a line of text. This is a very simple process since we
 * don't need to parse the value out of e.g. numeric tokens: we
 * simply split one string into many.
 *
 * `line' is a NUL-terminated string; it is modified in place when
 * a `%{...}' construct is found (the braces are squeezed out).
 *
 * Returns the head of a newly built token list in source order, or
 * NULL if the line produced no tokens. Comments, and whitespace
 * that runs up to a comment or to the end of the line, produce no
 * token at all.
 */
static Token *tokenize(char *line)
{
    char *p = line;
    enum pp_token_type type;
    Token *list = NULL;
    Token *t, **tail = &list;   /* tail: where the next token gets linked in */

    /* Each iteration scans one token: `line' is its start, `p' ends up just past it */
    while (*line) {
        p = line;
        if (*p == '%') {
            p++;
            /* %<digits>, %+<digits>, %-<digits>, or a lone %+ before whitespace/end of line */
            if (nasm_isdigit(*p) ||
                ((*p == '-' || *p == '+') && nasm_isdigit(p[1])) ||
                ((*p == '+') && (nasm_isspace(p[1]) || !p[1]))) {
                do {
                    p++;
                }
                while (nasm_isdigit(*p));
                type = TOK_PREPROC_ID;
            } else if (*p == '{') {
                /*
                 * %{name}: shift the name one place to the left, over
                 * the '{', and NUL-terminate it, so that the token
                 * text reads "%name". A missing '}' is tolerated.
                 */
                p++;
                while (*p && *p != '}') {
                    p[-1] = *p;
                    p++;
                }
                p[-1] = '\0';
                if (*p)
                    p++;
                type = TOK_PREPROC_ID;
            } else if (*p == '?') {
                type = TOK_PREPROC_Q; /* %? */
                p++;
                if (*p == '?') {
                    type = TOK_PREPROC_QQ; /* %?? */
                    p++;
                }
            } else if (isidchar(*p) ||
                       ((*p == '!' || *p == '%' || *p == '$') &&
                        isidchar(p[1]))) {
                /* %name, or %!name, %%name, %$name */
                do {
                    p++;
                }
                while (isidchar(*p));
                type = TOK_PREPROC_ID;
            } else {
                /* A bare % operator, or %% */
                type = TOK_OTHER;
                if (*p == '%')
                    p++;
            }
        } else if (isidstart(*p) || (*p == '$' && isidstart(p[1]))) {
            /* An identifier, optionally prefixed with $ */
            type = TOK_ID;
            p++;
            while (*p && isidchar(*p))
                p++;
        } else if (*p == '\'' || *p == '"' || *p == '`') {
            /*
             * A string token.
             */
            type = TOK_STRING;
            p = nasm_skip_string(p);

            if (*p) {
                p++;
            } else {
                /* Ran off the end of the line: the token is kept, without a closing quote */
                error(ERR_WARNING|ERR_PASS1, "unterminated string");
                /* Handling unterminated strings by UNV */
                /* type = -1; */
            }
        } else if (isnumstart(*p)) {
            bool is_hex = false;
            bool is_float = false;
            bool has_e = false;
            char c, *r;

            /*
             * A numeric token.
             */

            if (*p == '$') {
                p++;
                is_hex = true;
            }

            /* Consume characters until one that cannot be part of the number */
            for (;;) {
                c = *p++;

                if (!is_hex && (c == 'e' || c == 'E')) {
                    has_e = true;
                    if (*p == '+' || *p == '-') {
                        /* e can only be followed by +/- if it is either a
                           prefixed hex number or a floating-point number */
                        p++;
                        is_float = true;
                    }
                } else if (c == 'H' || c == 'h' || c == 'X' || c == 'x') {
                    is_hex = true;
                } else if (c == 'P' || c == 'p') {
                    is_float = true;
                    if (*p == '+' || *p == '-')
                        p++;
                } else if (isnumchar(c) || c == '_')
                    ; /* just advance */
                else if (c == '.') {
                    /* we need to deal with consequences of the legacy
                       parser, like "1.nolist" being two tokens
                       (TOK_NUMBER, TOK_ID) here; at least give it
                       a shot for now.  In the future, we probably need
                       a flex-based scanner with proper pattern matching
                       to do it as well as it can be done.  Nothing in
                       the world is going to help the person who wants
                       0x123.p16 interpreted as two tokens, though. */
                    r = p;
                    while (*r == '_')
                        r++;

                    if (nasm_isdigit(*r) || (is_hex && nasm_isxdigit(*r)) ||
                        (!is_hex && (*r == 'e' || *r == 'E')) ||
                        (*r == 'p' || *r == 'P')) {
                        p = r;
                        is_float = true;
                    } else
                        break;  /* Terminate the token */
                } else
                    break;
            }
            p--;        /* Point to first character beyond number */

            if (has_e && !is_hex) {
                /* 1e13 is floating-point, but 1e13h is not */
                is_float = true;
            }

            type = is_float ? TOK_FLOAT : TOK_NUMBER;
        } else if (nasm_isspace(*p)) {
            type = TOK_WHITESPACE;
            p++;
            while (*p && nasm_isspace(*p))
                p++;
            /*
             * Whitespace just before end-of-line is discarded by
             * pretending it's a comment; whitespace just before a
             * comment gets lumped into the comment.
             */
            if (!*p || *p == ';') {
                type = TOK_COMMENT;
                while (*p)
                    p++;
            }
        } else if (*p == ';') {
            /* A comment runs to the end of the line */
            type = TOK_COMMENT;
            while (*p)
                p++;
        } else {
            /*
             * Anything else is an operator of some kind. We check
             * for all the double-character operators (>>, <<, //,
             * %%, <=, >=, ==, !=, <>, &&, ||, ^^), but anything
             * else is a single-character operator.
             * (%% never reaches this branch: anything starting with
             * '%' is handled by the first branch above.)
             */
            type = TOK_OTHER;
            if ((p[0] == '>' && p[1] == '>') ||
                (p[0] == '<' && p[1] == '<') ||
                (p[0] == '/' && p[1] == '/') ||
                (p[0] == '<' && p[1] == '=') ||
                (p[0] == '>' && p[1] == '=') ||
                (p[0] == '=' && p[1] == '=') ||
                (p[0] == '!' && p[1] == '=') ||
                (p[0] == '<' && p[1] == '>') ||
                (p[0] == '&' && p[1] == '&') ||
                (p[0] == '|' && p[1] == '|') ||
                (p[0] == '^' && p[1] == '^')) {
                p++;
            }
            p++;
        }

        /* Handling unterminated string by UNV */
        /*if (type == -1)
           {
           *tail = t = new_Token(NULL, TOK_STRING, line, p-line+1);
           t->text[p-line] = *line;
           tail = &t->next;
           }
           else */
        /* Comments are dropped; everything else is appended to the list */
        if (type != TOK_COMMENT) {
            *tail = t = new_Token(NULL, type, line, p - line);
            tail = &t->next;
        }
        line = p;
    }
    return list;
}
 970
 971 /*
 972  * this function allocates a new managed block of memory and
 973  * returns a pointer to the block.  The managed blocks are
 974  * deleted only all at once by the delete_Blocks function.
 975  */
 976 static void *new_Block(size_t size)
 977 {
 978     Blocks *b = &blocks;
 979
 980     /* first, get to the end of the linked list */
 981     while (b->next)
 982         b = b->next;
 983     /* now allocate the requested chunk */
 984     b->chunk = nasm_malloc(size);
 985
 986     /* now allocate a new block for the next request */
 987     b->next = nasm_malloc(sizeof(Blocks));
 988     /* and initialize the contents of the new block */
 989     b->next->next = NULL;
 990     b->next->chunk = NULL;
 991     return b->chunk;
 992 }
 993
 994 /*
 995  * this function deletes all managed blocks of memory
 996  */
 997 static void delete_Blocks(void)
 998 {
 999     Blocks *a, *b = &blocks;
1000
1001     /*
1002      * keep in mind that the first block, pointed to by blocks
1003      * is a static and not dynamically allocated, so we don't
1004      * free it.
1005      */
1006     while (b) {
1007         if (b->chunk)
1008             nasm_free(b->chunk);
1009         a = b;
1010         b = b->next;
1011         if (a != &blocks)
1012             nasm_free(a);
1013     }
1014 }
1015
1016 /*
1017  *  this function creates a new Token and passes a pointer to it
1018  *  back to the caller.  It sets the type and text elements, and
1019  *  also the a.mac and next elements to NULL.
1020  */
1021 static Token *new_Token(Token * next, enum pp_token_type type,
1022                         const char *text, int txtlen)
1023 {
1024     Token *t;
1025     int i;
1026
1027     if (freeTokens == NULL) {
1028         freeTokens = (Token *) new_Block(TOKEN_BLOCKSIZE * sizeof(Token));
1029         for (i = 0; i < TOKEN_BLOCKSIZE - 1; i++)
1030             freeTokens[i].next = &freeTokens[i + 1];
1031         freeTokens[i].next = NULL;
1032     }
1033     t = freeTokens;
1034     freeTokens = t->next;
1035     t->next = next;
1036     t->a.mac = NULL;
1037     t->type = type;
1038     if (type == TOK_WHITESPACE || text == NULL) {
1039         t->text = NULL;
1040     } else {
1041         if (txtlen == 0)
1042             txtlen = strlen(text);
1043         t->text = nasm_malloc(txtlen+1);
1044         memcpy(t->text, text, txtlen);
1045         t->text[txtlen] = '\0';
1046     }
1047     return t;
1048 }
1049
1050 static Token *delete_Token(Token * t)
1051 {
1052     Token *next = t->next;
1053     nasm_free(t->text);
1054     t->next = freeTokens;
1055     freeTokens = t;
1056     return next;
1057 }
1058
1059 /*
1060  * Convert a line of tokens back into text.
1061  * If expand_locals is not zero, identifiers of the form "%$*xxx"
1062  * will be transformed into ..@ctxnum.xxx
1063  */
1064 static char *detoken(Token * tlist, bool expand_locals)
1065 {
1066     Token *t;
1067     int len;
1068     char *line, *p;
1069     const char *q;
1070
1071     len = 0;
1072     for (t = tlist; t; t = t->next) {
1073         if (t->type == TOK_PREPROC_ID && t->text[1] == '!') {
1074             char *p = getenv(t->text + 2);
1075             nasm_free(t->text);
1076             if (p)
1077                 t->text = nasm_strdup(p);
1078             else
1079                 t->text = NULL;
1080         }
1081         /* Expand local macros here and not during preprocessing */
1082         if (expand_locals &&
1083             t->type == TOK_PREPROC_ID && t->text &&
1084             t->text[0] == '%' && t->text[1] == '$') {
1085             Context *ctx = get_ctx(t->text, false);
1086             if (ctx) {
1087                 char buffer[40];
1088                 char *p, *q = t->text + 2;
1089
1090                 q += strspn(q, "$");
1091                 snprintf(buffer, sizeof(buffer), "..@%"PRIu32".", ctx->number);
1092                 p = nasm_strcat(buffer, q);
1093                 nasm_free(t->text);
1094                 t->text = p;
1095             }
1096         }
1097         if (t->type == TOK_WHITESPACE) {
1098             len++;
1099         } else if (t->text) {
1100             len += strlen(t->text);
1101         }
1102     }
1103     p = line = nasm_malloc(len + 1);
1104     for (t = tlist; t; t = t->next) {
1105         if (t->type == TOK_WHITESPACE) {
1106             *p++ = ' ';
1107         } else if (t->text) {
1108             q = t->text;
1109             while (*q)
1110                 *p++ = *q++;
1111         }
1112     }
1113     *p = '\0';
1114     return line;
1115 }
1116
1117 /*
1118  * A scanner, suitable for use by the expression evaluator, which
1119  * operates on a line of Tokens. Expects a pointer to a pointer to
1120  * the first token in the line to be passed in as its private_data
1121  * field.
1122  *
1123  * FIX: This really needs to be unified with stdscan.
1124  */
1125 static int ppscan(void *private_data, struct tokenval *tokval)
1126 {
1127     Token **tlineptr = private_data;
1128     Token *tline;
1129     char ourcopy[MAX_KEYWORD+1], *p, *r, *s;
1130
1131     do {
1132         tline = *tlineptr;
1133         *tlineptr = tline ? tline->next : NULL;
1134     }
1135     while (tline && (tline->type == TOK_WHITESPACE ||
1136                      tline->type == TOK_COMMENT));
1137
1138     if (!tline)
1139         return tokval->t_type = TOKEN_EOS;
1140
1141     tokval->t_charptr = tline->text;
1142
1143     if (tline->text[0] == '$' && !tline->text[1])
1144         return tokval->t_type = TOKEN_HERE;
1145     if (tline->text[0] == '$' && tline->text[1] == '$' && !tline->text[2])
1146         return tokval->t_type = TOKEN_BASE;
1147
1148     if (tline->type == TOK_ID) {
1149         p = tokval->t_charptr = tline->text;
1150         if (p[0] == '$') {
1151             tokval->t_charptr++;
1152             return tokval->t_type = TOKEN_ID;
1153         }
1154
1155         for (r = p, s = ourcopy; *r; r++) {
1156             if (r >= p+MAX_KEYWORD)
1157                 return tokval->t_type = TOKEN_ID; /* Not a keyword */
1158             *s++ = nasm_tolower(*r);
1159         }
1160         *s = '\0';
1161         /* right, so we have an identifier sitting in temp storage. now,
1162          * is it actually a register or instruction name, or what? */
1163         return nasm_token_hash(ourcopy, tokval);
1164     }
1165
1166     if (tline->type == TOK_NUMBER) {
1167         bool rn_error;
1168         tokval->t_integer = readnum(tline->text, &rn_error);
1169         tokval->t_charptr = tline->text;
1170         if (rn_error)
1171             return tokval->t_type = TOKEN_ERRNUM;
1172         else
1173             return tokval->t_type = TOKEN_NUM;
1174     }
1175
1176     if (tline->type == TOK_FLOAT) {
1177         return tokval->t_type = TOKEN_FLOAT;
1178     }
1179
1180     if (tline->type == TOK_STRING) {
1181         char bq, *ep;
1182
1183         bq = tline->text[0];
1184         tokval->t_charptr = tline->text;
1185         tokval->t_inttwo = nasm_unquote(tline->text, &ep);
1186
1187         if (ep[0] != bq || ep[1] != '\0')
1188             return tokval->t_type = TOKEN_ERRSTR;
1189         else
1190             return tokval->t_type = TOKEN_STR;
1191     }
1192
1193     if (tline->type == TOK_OTHER) {
1194         if (!strcmp(tline->text, "<<"))
1195             return tokval->t_type = TOKEN_SHL;
1196         if (!strcmp(tline->text, ">>"))
1197             return tokval->t_type = TOKEN_SHR;
1198         if (!strcmp(tline->text, "//"))
1199             return tokval->t_type = TOKEN_SDIV;
1200         if (!strcmp(tline->text, "%%"))
1201             return tokval->t_type = TOKEN_SMOD;
1202         if (!strcmp(tline->text, "=="))
1203             return tokval->t_type = TOKEN_EQ;
1204         if (!strcmp(tline->text, "<>"))
1205             return tokval->t_type = TOKEN_NE;
1206         if (!strcmp(tline->text, "!="))
1207             return tokval->t_type = TOKEN_NE;
1208         if (!strcmp(tline->text, "<="))
1209             return tokval->t_type = TOKEN_LE;
1210         if (!strcmp(tline->text, ">="))
1211             return tokval->t_type = TOKEN_GE;
1212         if (!strcmp(tline->text, "&&"))
1213             return tokval->t_type = TOKEN_DBL_AND;
1214         if (!strcmp(tline->text, "^^"))
1215             return tokval->t_type = TOKEN_DBL_XOR;
1216         if (!strcmp(tline->text, "||"))
1217             return tokval->t_type = TOKEN_DBL_OR;
1218     }
1219
1220     /*
1221      * We have no other options: just return the first character of
1222      * the token text.
1223      */
1224     return tokval->t_type = tline->text[0];
1225 }
1226
/*
 * String comparison used when matching macro names: strcmp when
 * `casesense' is true, nasm_stricmp otherwise.  The result is that
 * of whichever function was called.
 */
static int mstrcmp(const char *p, const char *q, bool casesense)
{
    if (casesense)
        return strcmp(p, q);

    return nasm_stricmp(p, q);
}
1236
/*
 * Length-limited counterpart of mstrcmp: compare the first `l' bytes
 * of two buffers with memcmp when `casesense' is true, and with
 * nasm_memicmp otherwise.  The result is that of whichever function
 * was called.
 */
static int mmemcmp(const char *p, const char *q, size_t l, bool casesense)
{
    if (casesense)
        return memcmp(p, q, l);

    return nasm_memicmp(p, q, l);
}
1246
1247 /*
1248  * Return the Context structure associated with a %$ token. Return
1249  * NULL, having _already_ reported an error condition, if the
1250  * context stack isn't deep enough for the supplied number of $
1251  * signs.
1252  * If all_contexts == true, contexts that enclose current are
1253  * also scanned for such smacro, until it is found; if not -
1254  * only the context that directly results from the number of $'s
1255  * in variable's name.
1256  */
1257 static Context *get_ctx(const char *name, bool all_contexts)
1258 {
1259     Context *ctx;
1260     SMacro *m;
1261     int i;
1262
1263     if (!name || name[0] != '%' || name[1] != '$')
1264         return NULL;
1265
1266     if (!cstk) {
1267         error(ERR_NONFATAL, "`%s': context stack is empty", name);
1268         return NULL;
1269     }
1270
1271     for (i = strspn(name + 2, "$"), ctx = cstk; (i > 0) && ctx; i--) {
1272         ctx = ctx->next;
1273 /*        i--;  Lino - 02/25/02 */
1274     }
1275     if (!ctx) {
1276         error(ERR_NONFATAL, "`%s': context stack is only"
1277               " %d level%s deep", name, i - 1, (i == 2 ? "" : "s"));
1278         return NULL;
1279     }
1280     if (!all_contexts)
1281         return ctx;
1282
1283     do {
1284         /* Search for this smacro in found context */
1285         m = hash_findix(&ctx->localmac, name);
1286         while (m) {
1287             if (!mstrcmp(m->name, name, m->casesense))
1288                 return ctx;
1289             m = m->next;
1290         }
1291         ctx = ctx->next;
1292     }
1293     while (ctx);
1294     return NULL;
1295 }
1296
1297 /*
1298  * Check to see if a file is already in a string list
1299  */
1300 static bool in_list(const StrList *list, const char *str)
1301 {
1302     while (list) {
1303         if (!strcmp(list->str, str))
1304             return true;
1305         list = list->next;
1306     }
1307     return false;
1308 }
1309
1310 /*
1311  * Open an include file. This routine must always return a valid
1312  * file pointer if it returns - it's responsible for throwing an
1313  * ERR_FATAL and bombing out completely if not. It should also try
1314  * the include path one by one until it finds the file or reaches
1315  * the end of the path.
1316  */
1317 static FILE *inc_fopen(const char *file, StrList **dhead, StrList ***dtail,
1318                        bool missing_ok)
1319 {
1320     FILE *fp;
1321     char *prefix = "";
1322     IncPath *ip = ipath;
1323     int len = strlen(file);
1324     size_t prefix_len = 0;
1325     StrList *sl;
1326
1327     while (1) {
1328         sl = nasm_malloc(prefix_len+len+1+sizeof sl->next);
1329         memcpy(sl->str, prefix, prefix_len);
1330         memcpy(sl->str+prefix_len, file, len+1);
1331         fp = fopen(sl->str, "r");
1332         if (fp && dhead && !in_list(*dhead, sl->str)) {
1333             sl->next = NULL;
1334             **dtail = sl;
1335             *dtail = &sl->next;
1336         } else {
1337             nasm_free(sl);
1338         }
1339         if (fp)
1340             return fp;
1341         if (!ip) {
1342             if (!missing_ok)
1343                 break;
1344             prefix = NULL;
1345         } else {
1346             prefix = ip->path;
1347             ip = ip->next;
1348         }
1349         if (prefix) {
1350             prefix_len = strlen(prefix);
1351         } else {
1352             /* -MG given and file not found */
1353             if (dhead && !in_list(*dhead, file)) {
1354                 sl = nasm_malloc(len+1+sizeof sl->next);
1355                 sl->next = NULL;
1356                 strcpy(sl->str, file);
1357                 **dtail = sl;
1358                 *dtail = &sl->next;
1359             }
1360             return NULL;
1361         }
1362     }
1363
1364     error(ERR_FATAL, "unable to open include file `%s'", file);
1365     return NULL;                /* never reached - placate compilers */
1366 }
1367
1368 /*
1369  * Determine if we should warn on defining a single-line macro of
1370  * name `name', with `nparam' parameters. If nparam is 0 or -1, will
1371  * return true if _any_ single-line macro of that name is defined.
1372  * Otherwise, will return true if a single-line macro with either
1373  * `nparam' or no parameters is defined.
1374  *
1375  * If a macro with precisely the right number of parameters is
1376  * defined, or nparam is -1, the address of the definition structure
1377  * will be returned in `defn'; otherwise NULL will be returned. If `defn'
1378  * is NULL, no action will be taken regarding its contents, and no
1379  * error will occur.
1380  *
1381  * Note that this is also called with nparam zero to resolve
1382  * `ifdef'.
1383  *
1384  * If you already know which context macro belongs to, you can pass
1385  * the context pointer as first parameter; if you won't but name begins
1386  * with %$ the context will be automatically computed. If all_contexts
1387  * is true, macro will be searched in outer contexts as well.
1388  */
1389 static bool
1390 smacro_defined(Context * ctx, const char *name, int nparam, SMacro ** defn,
1391                bool nocase)
1392 {
1393     struct hash_table *smtbl;
1394     SMacro *m;
1395
1396     if (ctx) {
1397         smtbl = &ctx->localmac;
1398     } else if (name[0] == '%' && name[1] == '$') {
1399         if (cstk)
1400             ctx = get_ctx(name, false);
1401         if (!ctx)
1402             return false;       /* got to return _something_ */
1403         smtbl = &ctx->localmac;
1404     } else {
1405         smtbl = &smacros;
1406     }
1407     m = (SMacro *) hash_findix(smtbl, name);
1408
1409     while (m) {
1410         if (!mstrcmp(m->name, name, m->casesense && nocase) &&
1411             (nparam <= 0 || m->nparam == 0 || nparam == (int) m->nparam)) {
1412             if (defn) {
1413                 if (nparam == (int) m->nparam || nparam == -1)
1414                     *defn = m;
1415                 else
1416                     *defn = NULL;
1417             }
1418             return true;
1419         }
1420         m = m->next;
1421     }
1422
1423     return false;
1424 }
1425
1426 /*
1427  * Count and mark off the parameters in a multi-line macro call.
1428  * This is called both from within the multi-line macro expansion
1429  * code, and also to mark off the default parameters when provided
1430  * in a %macro definition line.
1431  */
1432 static void count_mmac_params(Token * t, int *nparam, Token *** params)
1433 {
1434     int paramsize, brace;
1435
1436     *nparam = paramsize = 0;
1437     *params = NULL;
1438     while (t) {
1439         /* +1: we need space for the final NULL */
1440         if (*nparam+1 >= paramsize) {
1441             paramsize += PARAM_DELTA;
1442             *params = nasm_realloc(*params, sizeof(**params) * paramsize);
1443         }
1444         skip_white_(t);
1445         brace = false;
1446         if (tok_is_(t, "{"))
1447             brace = true;
1448         (*params)[(*nparam)++] = t;
1449         while (tok_isnt_(t, brace ? "}" : ","))
1450             t = t->next;
1451         if (t) {                /* got a comma/brace */
1452             t = t->next;
1453             if (brace) {
1454                 /*
1455                  * Now we've found the closing brace, look further
1456                  * for the comma.
1457                  */
1458                 skip_white_(t);
1459                 if (tok_isnt_(t, ",")) {
1460                     error(ERR_NONFATAL,
1461                           "braces do not enclose all of macro parameter");
1462                     while (tok_isnt_(t, ","))
1463                         t = t->next;
1464                 }
1465                 if (t)
1466                     t = t->next;        /* eat the comma */
1467             }
1468         }
1469     }
1470 }
1471
1472 /*
1473  * Determine whether one of the various `if' conditions is true or
1474  * not.
1475  *
1476  * We must free the tline we get passed.
1477  */
1478 static bool if_condition(Token * tline, enum preproc_token ct)
1479 {
1480     enum pp_conditional i = PP_COND(ct);
1481     bool j;
1482     Token *t, *tt, **tptr, *origline;
1483     struct tokenval tokval;
1484     expr *evalresult;
1485     enum pp_token_type needtype;
1486
1487     origline = tline;
1488
1489     switch (i) {
1490     case PPC_IFCTX:
1491         j = false;              /* have we matched yet? */
1492         while (true) {
1493             skip_white_(tline);
1494             if (!tline)
1495                 break;
1496             if (tline->type != TOK_ID) {
1497                 error(ERR_NONFATAL,
1498                       "`%s' expects context identifiers", pp_directives[ct]);
1499                 free_tlist(origline);
1500                 return -1;
1501             }
1502             if (cstk && cstk->name && !nasm_stricmp(tline->text, cstk->name))
1503                 j = true;
1504             tline = tline->next;
1505         }
1506         break;
1507
1508     case PPC_IFDEF:
1509         j = false;              /* have we matched yet? */
1510         while (tline) {
1511             skip_white_(tline);
1512             if (!tline || (tline->type != TOK_ID &&
1513                            (tline->type != TOK_PREPROC_ID ||
1514                             tline->text[1] != '$'))) {
1515                 error(ERR_NONFATAL,
1516                       "`%s' expects macro identifiers", pp_directives[ct]);
1517                 goto fail;
1518             }
1519             if (smacro_defined(NULL, tline->text, 0, NULL, true))
1520                 j = true;
1521             tline = tline->next;
1522         }
1523         break;
1524
1525     case PPC_IFIDN:
1526     case PPC_IFIDNI:
1527         tline = expand_smacro(tline);
1528         t = tt = tline;
1529         while (tok_isnt_(tt, ","))
1530             tt = tt->next;
1531         if (!tt) {
1532             error(ERR_NONFATAL,
1533                   "`%s' expects two comma-separated arguments",
1534                   pp_directives[ct]);
1535             goto fail;
1536         }
1537         tt = tt->next;
1538         j = true;               /* assume equality unless proved not */
1539         while ((t->type != TOK_OTHER || strcmp(t->text, ",")) && tt) {
1540             if (tt->type == TOK_OTHER && !strcmp(tt->text, ",")) {
1541                 error(ERR_NONFATAL, "`%s': more than one comma on line",
1542                       pp_directives[ct]);
1543                 goto fail;
1544             }
1545             if (t->type == TOK_WHITESPACE) {
1546                 t = t->next;
1547                 continue;
1548             }
1549             if (tt->type == TOK_WHITESPACE) {
1550                 tt = tt->next;
1551                 continue;
1552             }
1553             if (tt->type != t->type) {
1554                 j = false;      /* found mismatching tokens */
1555                 break;
1556             }
1557             /* When comparing strings, need to unquote them first */
1558             if (t->type == TOK_STRING) {
1559                 size_t l1 = nasm_unquote(t->text, NULL);
1560                 size_t l2 = nasm_unquote(tt->text, NULL);
1561
1562                 if (l1 != l2) {
1563                     j = false;
1564                     break;
1565                 }
1566                 if (mmemcmp(t->text, tt->text, l1, i == PPC_IFIDN)) {
1567                     j = false;
1568                     break;
1569                 }
1570             } else if (mstrcmp(tt->text, t->text, i == PPC_IFIDN) != 0) {
1571                 j = false;      /* found mismatching tokens */
1572                 break;
1573             }
1574
1575             t = t->next;
1576             tt = tt->next;
1577         }
1578         if ((t->type != TOK_OTHER || strcmp(t->text, ",")) || tt)
1579             j = false;          /* trailing gunk on one end or other */
1580         break;
1581
1582     case PPC_IFMACRO:
1583         {
1584             bool found = false;
1585             MMacro searching, *mmac;
1586
1587             tline = tline->next;
1588             skip_white_(tline);
1589             tline = expand_id(tline);
1590             if (!tok_type_(tline, TOK_ID)) {
1591                 error(ERR_NONFATAL,
1592                       "`%s' expects a macro name", pp_directives[ct]);
1593                 goto fail;
1594             }
1595             searching.name = nasm_strdup(tline->text);
1596             searching.casesense = true;
1597             searching.plus = false;
1598             searching.nolist = false;
1599             searching.in_progress = 0;
1600             searching.rep_nest = NULL;
1601             searching.nparam_min = 0;
1602             searching.nparam_max = INT_MAX;
1603             tline = expand_smacro(tline->next);
1604             skip_white_(tline);
1605             if (!tline) {
1606             } else if (!tok_type_(tline, TOK_NUMBER)) {
1607                 error(ERR_NONFATAL,
1608                       "`%s' expects a parameter count or nothing",
1609                       pp_directives[ct]);
1610             } else {
1611                 searching.nparam_min = searching.nparam_max =
1612                     readnum(tline->text, &j);
1613                 if (j)
1614                     error(ERR_NONFATAL,
1615                           "unable to parse parameter count `%s'",
1616                           tline->text);
1617             }
1618             if (tline && tok_is_(tline->next, "-")) {
1619                 tline = tline->next->next;
1620                 if (tok_is_(tline, "*"))
1621                     searching.nparam_max = INT_MAX;
1622                 else if (!tok_type_(tline, TOK_NUMBER))
1623                     error(ERR_NONFATAL,
1624                           "`%s' expects a parameter count after `-'",
1625                           pp_directives[ct]);
1626                 else {
1627                     searching.nparam_max = readnum(tline->text, &j);
1628                     if (j)
1629                         error(ERR_NONFATAL,
1630                               "unable to parse parameter count `%s'",
1631                               tline->text);
1632                     if (searching.nparam_min > searching.nparam_max)
1633                         error(ERR_NONFATAL,
1634                               "minimum parameter count exceeds maximum");
1635                 }
1636             }
1637             if (tline && tok_is_(tline->next, "+")) {
1638                 tline = tline->next;
1639                 searching.plus = true;
1640             }
1641             mmac = (MMacro *) hash_findix(&mmacros, searching.name);
1642             while (mmac) {
1643                 if (!strcmp(mmac->name, searching.name) &&
1644                     (mmac->nparam_min <= searching.nparam_max
1645                      || searching.plus)
1646                     && (searching.nparam_min <= mmac->nparam_max
1647                         || mmac->plus)) {
1648                     found = true;
1649                     break;
1650                 }
1651                 mmac = mmac->next;
1652             }
1653             if(tline && tline->next)
1654                 error(ERR_WARNING|ERR_PASS1,
1655                       "trailing garbage after %%ifmacro ignored");
1656             nasm_free(searching.name);
1657             j = found;
1658             break;
1659         }
1660
1661     case PPC_IFID:
1662         needtype = TOK_ID;
1663         goto iftype;
1664     case PPC_IFNUM:
1665         needtype = TOK_NUMBER;
1666         goto iftype;
1667     case PPC_IFSTR:
1668         needtype = TOK_STRING;
1669         goto iftype;
1670
1671     iftype:
1672         t = tline = expand_smacro(tline);
1673
1674         while (tok_type_(t, TOK_WHITESPACE) ||
1675                (needtype == TOK_NUMBER &&
1676                 tok_type_(t, TOK_OTHER) &&
1677                 (t->text[0] == '-' || t->text[0] == '+') &&
1678                 !t->text[1]))
1679             t = t->next;
1680
1681         j = tok_type_(t, needtype);
1682         break;
1683
1684     case PPC_IFTOKEN:
1685         t = tline = expand_smacro(tline);
1686         while (tok_type_(t, TOK_WHITESPACE))
1687             t = t->next;
1688
1689         j = false;
1690         if (t) {
1691             t = t->next;        /* Skip the actual token */
1692             while (tok_type_(t, TOK_WHITESPACE))
1693                 t = t->next;
1694             j = !t;             /* Should be nothing left */
1695         }
1696         break;
1697
1698     case PPC_IFEMPTY:
1699         t = tline = expand_smacro(tline);
1700         while (tok_type_(t, TOK_WHITESPACE))
1701             t = t->next;
1702
1703         j = !t;                 /* Should be empty */
1704         break;
1705
1706     case PPC_IF:
1707         t = tline = expand_smacro(tline);
1708         tptr = &t;
1709         tokval.t_type = TOKEN_INVALID;
1710         evalresult = evaluate(ppscan, tptr, &tokval,
1711                               NULL, pass | CRITICAL, error, NULL);
1712         if (!evalresult)
1713             return -1;
1714         if (tokval.t_type)
1715             error(ERR_WARNING|ERR_PASS1,
1716                   "trailing garbage after expression ignored");
1717         if (!is_simple(evalresult)) {
1718             error(ERR_NONFATAL,
1719                   "non-constant value given to `%s'", pp_directives[ct]);
1720             goto fail;
1721         }
1722         j = reloc_value(evalresult) != 0;
1723         break;
1724
1725     default:
1726         error(ERR_FATAL,
1727               "preprocessor directive `%s' not yet implemented",
1728               pp_directives[ct]);
1729         goto fail;
1730     }
1731
1732     free_tlist(origline);
1733     return j ^ PP_NEGATIVE(ct);
1734
1735 fail:
1736     free_tlist(origline);
1737     return -1;
1738 }
1739
1740 /*
1741  * Common code for defining an smacro
1742  */
1743 static bool define_smacro(Context *ctx, char *mname, bool casesense,
1744                           int nparam, Token *expansion)
1745 {
1746     SMacro *smac, **smhead;
1747     struct hash_table *smtbl;
1748
1749     if (smacro_defined(ctx, mname, nparam, &smac, casesense)) {
1750         if (!smac) {
1751             error(ERR_WARNING|ERR_PASS1,
1752                   "single-line macro `%s' defined both with and"
1753                   " without parameters", mname);
1754
1755             /* Some instances of the old code considered this a failure,
1756                some others didn't.  What is the right thing to do here? */
1757             free_tlist(expansion);
1758             return false;       /* Failure */
1759         } else {
1760             /*
1761              * We're redefining, so we have to take over an
1762              * existing SMacro structure. This means freeing
1763              * what was already in it.
1764              */
1765             nasm_free(smac->name);
1766             free_tlist(smac->expansion);
1767         }
1768     } else {
1769         smtbl  = ctx ? &ctx->localmac : &smacros;
1770         smhead = (SMacro **) hash_findi_add(smtbl, mname);
1771         smac = nasm_malloc(sizeof(SMacro));
1772         smac->next = *smhead;
1773         *smhead = smac;
1774     }
1775     smac->name = nasm_strdup(mname);
1776     smac->casesense = casesense;
1777     smac->nparam = nparam;
1778     smac->expansion = expansion;
1779     smac->in_progress = false;
1780     return true;                /* Success */
1781 }
1782
1783 /*
1784  * Undefine an smacro
1785  */
1786 static void undef_smacro(Context *ctx, const char *mname)
1787 {
1788     SMacro **smhead, *s, **sp;
1789     struct hash_table *smtbl;
1790
1791     smtbl = ctx ? &ctx->localmac : &smacros;
1792     smhead = (SMacro **)hash_findi(smtbl, mname, NULL);
1793
1794     if (smhead) {
1795         /*
1796          * We now have a macro name... go hunt for it.
1797          */
1798         sp = smhead;
1799         while ((s = *sp) != NULL) {
1800             if (!mstrcmp(s->name, mname, s->casesense)) {
1801                 *sp = s->next;
1802                 nasm_free(s->name);
1803                 free_tlist(s->expansion);
1804                 nasm_free(s);
1805             } else {
1806                 sp = &s->next;
1807             }
1808         }
1809     }
1810 }
1811
1812 /*
1813  * Parse a mmacro specification.
1814  */
1815 static bool parse_mmacro_spec(Token *tline, MMacro *def, const char *directive)
1816 {
1817     bool err;
1818
1819     tline = tline->next;
1820     skip_white_(tline);
1821     tline = expand_id(tline);
1822     if (!tok_type_(tline, TOK_ID)) {
1823         error(ERR_NONFATAL, "`%s' expects a macro name", directive);
1824         return false;
1825     }
1826
1827     def->name = nasm_strdup(tline->text);
1828     def->plus = false;
1829     def->nolist = false;
1830     def->in_progress = 0;
1831     def->rep_nest = NULL;
1832     def->nparam_min = 0;
1833     def->nparam_max = 0;
1834
1835     tline = expand_smacro(tline->next);
1836     skip_white_(tline);
1837     if (!tok_type_(tline, TOK_NUMBER)) {
1838         error(ERR_NONFATAL, "`%s' expects a parameter count", directive);
1839     } else {
1840         def->nparam_min = def->nparam_max =
1841             readnum(tline->text, &err);
1842         if (err)
1843             error(ERR_NONFATAL,
1844                   "unable to parse parameter count `%s'", tline->text);
1845     }
1846     if (tline && tok_is_(tline->next, "-")) {
1847         tline = tline->next->next;
1848         if (tok_is_(tline, "*")) {
1849             def->nparam_max = INT_MAX;
1850         } else if (!tok_type_(tline, TOK_NUMBER)) {
1851             error(ERR_NONFATAL,
1852                   "`%s' expects a parameter count after `-'", directive);
1853         } else {
1854             def->nparam_max = readnum(tline->text, &err);
1855             if (err) {
1856                 error(ERR_NONFATAL, "unable to parse parameter count `%s'",
1857                       tline->text);
1858             }
1859             if (def->nparam_min > def->nparam_max) {
1860                 error(ERR_NONFATAL, "minimum parameter count exceeds maximum");
1861             }
1862         }
1863     }
1864     if (tline && tok_is_(tline->next, "+")) {
1865         tline = tline->next;
1866         def->plus = true;
1867     }
1868     if (tline && tok_type_(tline->next, TOK_ID) &&
1869         !nasm_stricmp(tline->next->text, ".nolist")) {
1870         tline = tline->next;
1871         def->nolist = true;
1872     }
1873
1874     /*
1875      * Handle default parameters.
1876      */
1877     if (tline && tline->next) {
1878         def->dlist = tline->next;
1879         tline->next = NULL;
1880         count_mmac_params(def->dlist, &def->ndefs, &def->defaults);
1881     } else {
1882         def->dlist = NULL;
1883         def->defaults = NULL;
1884     }
1885     def->expansion = NULL;
1886
1887         if(def->defaults &&
1888            def->ndefs > def->nparam_max - def->nparam_min &&
1889            !def->plus)
1890          error(ERR_WARNING|ERR_PASS1|ERR_WARN_MDP,
1891                "too many default macro parameters");
1892
1893     return true;
1894 }
1895
1896
/*
 * Decode a size directive.
 *
 * Looks `str' up among the known size keywords with bsii() and returns
 * the matching size (byte = 1, word = 2, dword = 4, qword = 8,
 * tword = 10, oword = 16, yword = 32).  Returns 0 when the keyword is
 * not found.
 */
static int parse_size(const char *str)
{
    /*
     * The keywords are listed alphabetically -- presumably a requirement
     * of the bsii() search; keep the order (and the parallel table of
     * sizes below) in step when adding entries.
     */
    static const char *keywords[] =
        { "byte", "dword", "oword", "qword", "tword", "word", "yword" };
    static const int widths[] =
        { 1, 4, 16, 8, 10, 2, 32 };
    int which = bsii(str, keywords, elements(keywords));

    if (which < 0)
        return 0;               /* not a recognised size keyword */

    return widths[which];
}
1908
1909 /**
1910  * find and process preprocessor directive in passed line
1911  * Find out if a line contains a preprocessor directive, and deal
1912  * with it if so.
1913  *
1914  * If a directive _is_ found, it is the responsibility of this routine
1915  * (and not the caller) to free_tlist() the line.
1916  *
1917  * @param tline a pointer to the current tokenized line linked list
1918  * @return DIRECTIVE_FOUND or NO_DIRECTIVE_FOUND
1919  *
1920  */
1921 static int do_directive(Token * tline)
1922 {
1923     enum preproc_token i;
1924     int j;
1925     bool err;
1926     int nparam;
1927     bool nolist;
1928     bool casesense;
1929     int k, m;
1930     int offset;
1931     char *p, *pp, *mname;
1932     Include *inc;
1933     Context *ctx;
1934     Cond *cond;
1935     MMacro *mmac, **mmhead;
1936     Token *t, *tt, *param_start, *macro_start, *last, **tptr, *origline;
1937     Line *l;
1938     struct tokenval tokval;
1939     expr *evalresult;
1940     MMacro *tmp_defining;       /* Used when manipulating rep_nest */
1941     int64_t count;
1942     size_t len;
1943     int severity;
1944
1945     origline = tline;
1946
1947     skip_white_(tline);
1948     if (!tline || !tok_type_(tline, TOK_PREPROC_ID) ||
1949         (tline->text[1] == '%' || tline->text[1] == '$'
1950          || tline->text[1] == '!'))
1951         return NO_DIRECTIVE_FOUND;
1952
1953     i = pp_token_hash(tline->text);
1954
1955     /*
1956      * If we're in a non-emitting branch of a condition construct,
1957      * or walking to the end of an already terminated %rep block,
1958      * we should ignore all directives except for condition
1959      * directives.
1960      */
1961     if (((istk->conds && !emitting(istk->conds->state)) ||
1962          (istk->mstk && !istk->mstk->in_progress)) && !is_condition(i)) {
1963         return NO_DIRECTIVE_FOUND;
1964     }
1965
1966     /*
1967      * If we're defining a macro or reading a %rep block, we should
1968      * ignore all directives except for %macro/%imacro (which nest),
1969      * %endm/%endmacro, and (only if we're in a %rep block) %endrep.
1970      * If we're in a %rep block, another %rep nests, so should be let through.
1971      */
1972     if (defining && i != PP_MACRO && i != PP_IMACRO &&
1973         i != PP_ENDMACRO && i != PP_ENDM &&
1974         (defining->name || (i != PP_ENDREP && i != PP_REP))) {
1975         return NO_DIRECTIVE_FOUND;
1976     }
1977
1978     if (defining) {
1979         if (i == PP_MACRO || i == PP_IMACRO) {
1980             nested_mac_count++;
1981             return NO_DIRECTIVE_FOUND;
1982         } else if (nested_mac_count > 0) {
1983             if (i == PP_ENDMACRO) {
1984                 nested_mac_count--;
1985                 return NO_DIRECTIVE_FOUND;
1986             }
1987         }
1988         if (!defining->name) {
1989             if (i == PP_REP) {
1990                 nested_rep_count++;
1991                 return NO_DIRECTIVE_FOUND;
1992             } else if (nested_rep_count > 0) {
1993                 if (i == PP_ENDREP) {
1994                     nested_rep_count--;
1995                     return NO_DIRECTIVE_FOUND;
1996                 }
1997             }
1998         }
1999     }
2000
2001     switch (i) {
2002     case PP_INVALID:
2003         error(ERR_NONFATAL, "unknown preprocessor directive `%s'",
2004               tline->text);
2005         return NO_DIRECTIVE_FOUND;      /* didn't get it */
2006
2007     case PP_STACKSIZE:
2008         /* Directive to tell NASM what the default stack size is. The
2009          * default is for a 16-bit stack, and this can be overriden with
2010          * %stacksize large.
2011          * the following form:
2012          *
2013          *      ARG arg1:WORD, arg2:DWORD, arg4:QWORD
2014          */
2015         tline = tline->next;
2016         if (tline && tline->type == TOK_WHITESPACE)
2017             tline = tline->next;
2018         if (!tline || tline->type != TOK_ID) {
2019             error(ERR_NONFATAL, "`%%stacksize' missing size parameter");
2020             free_tlist(origline);
2021             return DIRECTIVE_FOUND;
2022         }
2023         if (nasm_stricmp(tline->text, "flat") == 0) {
2024             /* All subsequent ARG directives are for a 32-bit stack */
2025             StackSize = 4;
2026             StackPointer = "ebp";
2027             ArgOffset = 8;
2028             LocalOffset = 0;
2029         } else if (nasm_stricmp(tline->text, "flat64") == 0) {
2030             /* All subsequent ARG directives are for a 64-bit stack */
2031             StackSize = 8;
2032             StackPointer = "rbp";
2033             ArgOffset = 8;
2034             LocalOffset = 0;
2035         } else if (nasm_stricmp(tline->text, "large") == 0) {
2036             /* All subsequent ARG directives are for a 16-bit stack,
2037              * far function call.
2038              */
2039             StackSize = 2;
2040             StackPointer = "bp";
2041             ArgOffset = 4;
2042             LocalOffset = 0;
2043         } else if (nasm_stricmp(tline->text, "small") == 0) {
2044             /* All subsequent ARG directives are for a 16-bit stack,
2045              * far function call. We don't support near functions.
2046              */
2047             StackSize = 2;
2048             StackPointer = "bp";
2049             ArgOffset = 6;
2050             LocalOffset = 0;
2051         } else {
2052             error(ERR_NONFATAL, "`%%stacksize' invalid size type");
2053             free_tlist(origline);
2054             return DIRECTIVE_FOUND;
2055         }
2056         free_tlist(origline);
2057         return DIRECTIVE_FOUND;
2058
2059     case PP_ARG:
2060         /* TASM like ARG directive to define arguments to functions, in
2061          * the following form:
2062          *
2063          *      ARG arg1:WORD, arg2:DWORD, arg4:QWORD
2064          */
2065         offset = ArgOffset;
2066         do {
2067             char *arg, directive[256];
2068             int size = StackSize;
2069
2070             /* Find the argument name */
2071             tline = tline->next;
2072             if (tline && tline->type == TOK_WHITESPACE)
2073                 tline = tline->next;
2074             if (!tline || tline->type != TOK_ID) {
2075                 error(ERR_NONFATAL, "`%%arg' missing argument parameter");
2076                 free_tlist(origline);
2077                 return DIRECTIVE_FOUND;
2078             }
2079             arg = tline->text;
2080
2081             /* Find the argument size type */
2082             tline = tline->next;
2083             if (!tline || tline->type != TOK_OTHER
2084                 || tline->text[0] != ':') {
2085                 error(ERR_NONFATAL,
2086                       "Syntax error processing `%%arg' directive");
2087                 free_tlist(origline);
2088                 return DIRECTIVE_FOUND;
2089             }
2090             tline = tline->next;
2091             if (!tline || tline->type != TOK_ID) {
2092                 error(ERR_NONFATAL, "`%%arg' missing size type parameter");
2093                 free_tlist(origline);
2094                 return DIRECTIVE_FOUND;
2095             }
2096
2097             /* Allow macro expansion of type parameter */
2098             tt = tokenize(tline->text);
2099             tt = expand_smacro(tt);
2100             size = parse_size(tt->text);
2101             if (!size) {
2102                 error(ERR_NONFATAL,
2103                       "Invalid size type for `%%arg' missing directive");
2104                 free_tlist(tt);
2105                 free_tlist(origline);
2106                 return DIRECTIVE_FOUND;
2107             }
2108             free_tlist(tt);
2109
2110             /* Round up to even stack slots */
2111             size = (size+StackSize-1) & ~(StackSize-1);
2112
2113             /* Now define the macro for the argument */
2114             snprintf(directive, sizeof(directive), "%%define %s (%s+%d)",
2115                      arg, StackPointer, offset);
2116             do_directive(tokenize(directive));
2117             offset += size;
2118
2119             /* Move to the next argument in the list */
2120             tline = tline->next;
2121             if (tline && tline->type == TOK_WHITESPACE)
2122                 tline = tline->next;
2123         } while (tline && tline->type == TOK_OTHER && tline->text[0] == ',');
2124         ArgOffset = offset;
2125         free_tlist(origline);
2126         return DIRECTIVE_FOUND;
2127
2128     case PP_LOCAL:
2129         /* TASM like LOCAL directive to define local variables for a
2130          * function, in the following form:
2131          *
2132          *      LOCAL local1:WORD, local2:DWORD, local4:QWORD = LocalSize
2133          *
2134          * The '= LocalSize' at the end is ignored by NASM, but is
2135          * required by TASM to define the local parameter size (and used
2136          * by the TASM macro package).
2137          */
2138         offset = LocalOffset;
2139         do {
2140             char *local, directive[256];
2141             int size = StackSize;
2142
2143             /* Find the argument name */
2144             tline = tline->next;
2145             if (tline && tline->type == TOK_WHITESPACE)
2146                 tline = tline->next;
2147             if (!tline || tline->type != TOK_ID) {
2148                 error(ERR_NONFATAL,
2149                       "`%%local' missing argument parameter");
2150                 free_tlist(origline);
2151                 return DIRECTIVE_FOUND;
2152             }
2153             local = tline->text;
2154
2155             /* Find the argument size type */
2156             tline = tline->next;
2157             if (!tline || tline->type != TOK_OTHER
2158                 || tline->text[0] != ':') {
2159                 error(ERR_NONFATAL,
2160                       "Syntax error processing `%%local' directive");
2161                 free_tlist(origline);
2162                 return DIRECTIVE_FOUND;
2163             }
2164             tline = tline->next;
2165             if (!tline || tline->type != TOK_ID) {
2166                 error(ERR_NONFATAL,
2167                       "`%%local' missing size type parameter");
2168                 free_tlist(origline);
2169                 return DIRECTIVE_FOUND;
2170             }
2171
2172             /* Allow macro expansion of type parameter */
2173             tt = tokenize(tline->text);
2174             tt = expand_smacro(tt);
2175             size = parse_size(tt->text);
2176             if (!size) {
2177                 error(ERR_NONFATAL,
2178                       "Invalid size type for `%%local' missing directive");
2179                 free_tlist(tt);
2180                 free_tlist(origline);
2181                 return DIRECTIVE_FOUND;
2182             }
2183             free_tlist(tt);
2184
2185             /* Round up to even stack slots */
2186             size = (size+StackSize-1) & ~(StackSize-1);
2187
2188             offset += size;     /* Negative offset, increment before */
2189
2190             /* Now define the macro for the argument */
2191             snprintf(directive, sizeof(directive), "%%define %s (%s-%d)",
2192                      local, StackPointer, offset);
2193             do_directive(tokenize(directive));
2194
2195             /* Now define the assign to setup the enter_c macro correctly */
2196             snprintf(directive, sizeof(directive),
2197                      "%%assign %%$localsize %%$localsize+%d", size);
2198             do_directive(tokenize(directive));
2199
2200             /* Move to the next argument in the list */
2201             tline = tline->next;
2202             if (tline && tline->type == TOK_WHITESPACE)
2203                 tline = tline->next;
2204         } while (tline && tline->type == TOK_OTHER && tline->text[0] == ',');
2205         LocalOffset = offset;
2206         free_tlist(origline);
2207         return DIRECTIVE_FOUND;
2208
2209     case PP_CLEAR:
2210         if (tline->next)
2211             error(ERR_WARNING|ERR_PASS1,
2212                   "trailing garbage after `%%clear' ignored");
2213         free_macros();
2214         init_macros();
2215         free_tlist(origline);
2216         return DIRECTIVE_FOUND;
2217
2218     case PP_DEPEND:
2219         t = tline->next = expand_smacro(tline->next);
2220         skip_white_(t);
2221         if (!t || (t->type != TOK_STRING &&
2222                        t->type != TOK_INTERNAL_STRING)) {
2223             error(ERR_NONFATAL, "`%%depend' expects a file name");
2224             free_tlist(origline);
2225             return DIRECTIVE_FOUND;     /* but we did _something_ */
2226         }
2227         if (t->next)
2228             error(ERR_WARNING|ERR_PASS1,
2229                   "trailing garbage after `%%depend' ignored");
2230         p = t->text;
2231         if (t->type != TOK_INTERNAL_STRING)
2232             nasm_unquote(p, NULL);
2233         if (dephead && !in_list(*dephead, p)) {
2234             StrList *sl = nasm_malloc(strlen(p)+1+sizeof sl->next);
2235             sl->next = NULL;
2236             strcpy(sl->str, p);
2237             *deptail = sl;
2238             deptail = &sl->next;
2239         }
2240         free_tlist(origline);
2241         return DIRECTIVE_FOUND;
2242
2243     case PP_INCLUDE:
2244         t = tline->next = expand_smacro(tline->next);
2245         skip_white_(t);
2246
2247         if (!t || (t->type != TOK_STRING &&
2248                        t->type != TOK_INTERNAL_STRING)) {
2249             error(ERR_NONFATAL, "`%%include' expects a file name");
2250             free_tlist(origline);
2251             return DIRECTIVE_FOUND;     /* but we did _something_ */
2252         }
2253         if (t->next)
2254             error(ERR_WARNING|ERR_PASS1,
2255                   "trailing garbage after `%%include' ignored");
2256         p = t->text;
2257         if (t->type != TOK_INTERNAL_STRING)
2258             nasm_unquote(p, NULL);
2259         inc = nasm_malloc(sizeof(Include));
2260         inc->next = istk;
2261         inc->conds = NULL;
2262         inc->fp = inc_fopen(p, dephead, &deptail, pass == 0);
2263         if (!inc->fp) {
2264             /* -MG given but file not found */
2265             nasm_free(inc);
2266         } else {
2267             inc->fname = src_set_fname(nasm_strdup(p));
2268             inc->lineno = src_set_linnum(0);
2269             inc->lineinc = 1;
2270             inc->expansion = NULL;
2271             inc->mstk = NULL;
2272             istk = inc;
2273             list->uplevel(LIST_INCLUDE);
2274         }
2275         free_tlist(origline);
2276         return DIRECTIVE_FOUND;
2277
2278     case PP_USE:
2279     {
2280         static macros_t *use_pkg;
2281         const char *pkg_macro;
2282
2283         t = tline->next = expand_smacro(tline->next);
2284         skip_white_(t);
2285
2286         if (!t || (t->type != TOK_STRING &&
2287                    t->type != TOK_INTERNAL_STRING &&
2288                    t->type != TOK_ID)) {
2289             error(ERR_NONFATAL, "`%%use' expects a package name");
2290             free_tlist(origline);
2291             return DIRECTIVE_FOUND;     /* but we did _something_ */
2292         }
2293         if (t->next)
2294             error(ERR_WARNING|ERR_PASS1,
2295                   "trailing garbage after `%%use' ignored");
2296         if (t->type == TOK_STRING)
2297             nasm_unquote(t->text, NULL);
2298         use_pkg = nasm_stdmac_find_package(t->text);
2299         if (!use_pkg)
2300             error(ERR_NONFATAL, "unknown `%%use' package: %s", t->text);
2301         /* The first string will be <%define>__USE_*__ */
2302         pkg_macro = (char *)use_pkg + 1;
2303         if (!smacro_defined(NULL, pkg_macro, 0, NULL, true)) {
2304             /* Not already included, go ahead and include it */
2305             stdmacpos = use_pkg;
2306         }
2307         free_tlist(origline);
2308         return DIRECTIVE_FOUND;
2309     }
2310     case PP_PUSH:
2311         tline = tline->next;
2312         skip_white_(tline);
2313         tline = expand_id(tline);
2314         if (tline) {
2315             if (!tok_type_(tline, TOK_ID)) {
2316                 error(ERR_NONFATAL, "`%%push' expects a context identifier");
2317                 free_tlist(origline);
2318                 return DIRECTIVE_FOUND;     /* but we did _something_ */
2319             }
2320             if (tline->next)
2321                 error(ERR_WARNING|ERR_PASS1,
2322                       "trailing garbage after `%%push' ignored");
2323             p = nasm_strdup(tline->text);
2324         } else {
2325             p = NULL;           /* Anonymous context */
2326         }
2327         ctx = nasm_malloc(sizeof(Context));
2328         ctx->next = cstk;
2329         hash_init(&ctx->localmac, HASH_SMALL);
2330         ctx->name = p;
2331         ctx->number = unique++;
2332         cstk = ctx;
2333         free_tlist(origline);
2334         return DIRECTIVE_FOUND;
2335
2336     case PP_REPL:
2337         tline = tline->next;
2338         skip_white_(tline);
2339         tline = expand_id(tline);
2340         if (tline) {
2341             if (!tok_type_(tline, TOK_ID)) {
2342                 error(ERR_NONFATAL, "`%%repl' expects a context identifier");
2343                 free_tlist(origline);
2344                 return DIRECTIVE_FOUND;     /* but we did _something_ */
2345             }
2346             if (tline->next)
2347                 error(ERR_WARNING|ERR_PASS1,
2348                       "trailing garbage after `%%repl' ignored");
2349             p = nasm_strdup(tline->text);
2350         } else {
2351             p = NULL;
2352         }
2353         if (!cstk)
2354             error(ERR_NONFATAL, "`%%repl': context stack is empty");
2355         else {
2356             nasm_free(cstk->name);
2357             cstk->name = p;
2358         }
2359         free_tlist(origline);
2360         return DIRECTIVE_FOUND;
2361
2362     case PP_POP:
2363         if (tline->next)
2364             error(ERR_WARNING|ERR_PASS1,
2365                   "trailing garbage after `%%pop' ignored");
2366         if (!cstk)
2367             error(ERR_NONFATAL, "`%%pop': context stack is already empty");
2368         else
2369             ctx_pop();
2370         free_tlist(origline);
2371         return DIRECTIVE_FOUND;
2372
2373     case PP_FATAL:
2374         severity = ERR_FATAL|ERR_NO_SEVERITY;
2375         goto issue_error;
2376     case PP_ERROR:
2377         severity = ERR_NONFATAL|ERR_NO_SEVERITY;
2378         goto issue_error;
2379     case PP_WARNING:
2380         severity = ERR_WARNING|ERR_NO_SEVERITY|ERR_WARN_USER;
2381         goto issue_error;
2382
2383     issue_error:
2384     {
2385         /* Only error out if this is the final pass */
2386         if (pass != 2 && i != PP_FATAL)
2387             return DIRECTIVE_FOUND;
2388
2389         tline->next = expand_smacro(tline->next);
2390         tline = tline->next;
2391         skip_white_(tline);
2392         t = tline ? tline->next : NULL;
2393         skip_white_(t);
2394         if (tok_type_(tline, TOK_STRING) && !t) {
2395             /* The line contains only a quoted string */
2396             p = tline->text;
2397             nasm_unquote(p, NULL);
2398             error(severity, "%s: %s",  pp_directives[i], p);
2399         } else {
2400             /* Not a quoted string, or more than a quoted string */
2401             p = detoken(tline, false);
2402             error(severity, "%s: %s",  pp_directives[i], p);
2403             nasm_free(p);
2404         }
2405         free_tlist(origline);
2406         return DIRECTIVE_FOUND;
2407     }
2408
2409     CASE_PP_IF:
2410         if (istk->conds && !emitting(istk->conds->state))
2411             j = COND_NEVER;
2412         else {
2413             j = if_condition(tline->next, i);
2414             tline->next = NULL; /* it got freed */
2415             j = j < 0 ? COND_NEVER : j ? COND_IF_TRUE : COND_IF_FALSE;
2416         }
2417         cond = nasm_malloc(sizeof(Cond));
2418         cond->next = istk->conds;
2419         cond->state = j;
2420         istk->conds = cond;
2421         free_tlist(origline);
2422         return DIRECTIVE_FOUND;
2423
2424     CASE_PP_ELIF:
2425         if (!istk->conds)
2426             error(ERR_FATAL, "`%s': no matching `%%if'", pp_directives[i]);
2427         switch(istk->conds->state) {
2428             case COND_IF_TRUE:
2429                 istk->conds->state = COND_DONE;
2430                 break;
2431
2432             case COND_DONE:
2433             case COND_NEVER:
2434                 break;
2435
2436             case COND_ELSE_TRUE:
2437             case COND_ELSE_FALSE:
2438                 error_precond(ERR_WARNING|ERR_PASS1,
2439                               "`%%elif' after `%%else' ignored");
2440                 istk->conds->state = COND_NEVER;
2441                 break;
2442
2443             case COND_IF_FALSE:
2444                 /*
2445                  * IMPORTANT: In the case of %if, we will already have
2446                  * called expand_mmac_params(); however, if we're
2447                  * processing an %elif we must have been in a
2448                  * non-emitting mode, which would have inhibited
2449                  * the normal invocation of expand_mmac_params().  Therefore,
2450                  * we have to do it explicitly here.
2451                  */
2452                 j = if_condition(expand_mmac_params(tline->next), i);
2453                 tline->next = NULL; /* it got freed */
2454                 istk->conds->state =
2455                     j < 0 ? COND_NEVER : j ? COND_IF_TRUE : COND_IF_FALSE;
2456                 break;
2457         }
2458         free_tlist(origline);
2459         return DIRECTIVE_FOUND;
2460
2461     case PP_ELSE:
2462         if (tline->next)
2463             error_precond(ERR_WARNING|ERR_PASS1,
2464                           "trailing garbage after `%%else' ignored");
2465         if (!istk->conds)
2466             error(ERR_FATAL, "`%%else': no matching `%%if'");
2467         switch(istk->conds->state) {
2468             case COND_IF_TRUE:
2469             case COND_DONE:
2470                 istk->conds->state = COND_ELSE_FALSE;
2471                 break;
2472
2473             case COND_NEVER:
2474                 break;
2475
2476             case COND_IF_FALSE:
2477                 istk->conds->state = COND_ELSE_TRUE;
2478                 break;
2479
2480             case COND_ELSE_TRUE:
2481             case COND_ELSE_FALSE:
2482                 error_precond(ERR_WARNING|ERR_PASS1,
2483                               "`%%else' after `%%else' ignored.");
2484                 istk->conds->state = COND_NEVER;
2485                 break;
2486         }
2487         free_tlist(origline);
2488         return DIRECTIVE_FOUND;
2489
2490     case PP_ENDIF:
2491         if (tline->next)
2492             error_precond(ERR_WARNING|ERR_PASS1,
2493                           "trailing garbage after `%%endif' ignored");
2494         if (!istk->conds)
2495             error(ERR_FATAL, "`%%endif': no matching `%%if'");
2496         cond = istk->conds;
2497         istk->conds = cond->next;
2498         nasm_free(cond);
2499         free_tlist(origline);
2500         return DIRECTIVE_FOUND;
2501
2502     case PP_MACRO:
2503     case PP_IMACRO:
2504         if (defining) {
2505             error(ERR_FATAL,
2506                   "`%%%smacro': already defining a macro",
2507                   (i == PP_IMACRO ? "i" : ""));
2508             return DIRECTIVE_FOUND;
2509         }
2510         defining = nasm_malloc(sizeof(MMacro));
2511         defining->casesense = (i == PP_MACRO);
2512         if (!parse_mmacro_spec(tline, defining, pp_directives[i])) {
2513             nasm_free(defining);
2514             defining = NULL;
2515             return DIRECTIVE_FOUND;
2516         }
2517
2518         mmac = (MMacro *) hash_findix(&mmacros, defining->name);
2519         while (mmac) {
2520             if (!strcmp(mmac->name, defining->name) &&
2521                 (mmac->nparam_min <= defining->nparam_max
2522                  || defining->plus)
2523                 && (defining->nparam_min <= mmac->nparam_max
2524                     || mmac->plus)) {
2525                 error(ERR_WARNING|ERR_PASS1,
2526                       "redefining multi-line macro `%s'", defining->name);
2527                 return DIRECTIVE_FOUND;
2528             }
2529             mmac = mmac->next;
2530         }
2531         free_tlist(origline);
2532         return DIRECTIVE_FOUND;
2533
2534     case PP_ENDM:
2535     case PP_ENDMACRO:
2536         if (! (defining && defining->name)) {
2537             error(ERR_NONFATAL, "`%s': not defining a macro", tline->text);
2538             return DIRECTIVE_FOUND;
2539         }
2540         mmhead = (MMacro **) hash_findi_add(&mmacros, defining->name);
2541         defining->next = *mmhead;
2542         *mmhead = defining;
2543         defining = NULL;
2544         free_tlist(origline);
2545         return DIRECTIVE_FOUND;
2546
2547     case PP_UNMACRO:
2548     case PP_UNIMACRO:
2549     {
2550         MMacro **mmac_p;
2551         MMacro spec;
2552
2553         spec.casesense = (i == PP_UNMACRO);
2554         if (!parse_mmacro_spec(tline, &spec, pp_directives[i])) {
2555             return DIRECTIVE_FOUND;
2556         }
2557         mmac_p = (MMacro **) hash_findi(&mmacros, spec.name, NULL);
2558         while (mmac_p && *mmac_p) {
2559             mmac = *mmac_p;
2560             if (mmac->casesense == spec.casesense &&
2561                 !mstrcmp(mmac->name, spec.name, spec.casesense) &&
2562                 mmac->nparam_min == spec.nparam_min &&
2563                 mmac->nparam_max == spec.nparam_max &&
2564                 mmac->plus == spec.plus) {
2565                 *mmac_p = mmac->next;
2566                 free_mmacro(mmac);
2567             } else {
2568                 mmac_p = &mmac->next;
2569             }
2570         }
2571         free_tlist(origline);
2572         free_tlist(spec.dlist);
2573         return DIRECTIVE_FOUND;
2574     }
2575
2576     case PP_ROTATE:
2577         if (tline->next && tline->next->type == TOK_WHITESPACE)
2578             tline = tline->next;
2579         if (tline->next == NULL) {
2580             free_tlist(origline);
2581             error(ERR_NONFATAL, "`%%rotate' missing rotate count");
2582             return DIRECTIVE_FOUND;
2583         }
2584         t = expand_smacro(tline->next);
2585         tline->next = NULL;
2586         free_tlist(origline);
2587         tline = t;
2588         tptr = &t;
2589         tokval.t_type = TOKEN_INVALID;
2590         evalresult =
2591             evaluate(ppscan, tptr, &tokval, NULL, pass, error, NULL);
2592         free_tlist(tline);
2593         if (!evalresult)
2594             return DIRECTIVE_FOUND;
2595         if (tokval.t_type)
2596             error(ERR_WARNING|ERR_PASS1,
2597                   "trailing garbage after expression ignored");
2598         if (!is_simple(evalresult)) {
2599             error(ERR_NONFATAL, "non-constant value given to `%%rotate'");
2600             return DIRECTIVE_FOUND;
2601         }
2602         mmac = istk->mstk;
2603         while (mmac && !mmac->name)     /* avoid mistaking %reps for macros */
2604             mmac = mmac->next_active;
2605         if (!mmac) {
2606             error(ERR_NONFATAL, "`%%rotate' invoked outside a macro call");
2607         } else if (mmac->nparam == 0) {
2608             error(ERR_NONFATAL,
2609                   "`%%rotate' invoked within macro without parameters");
2610         } else {
2611             int rotate = mmac->rotate + reloc_value(evalresult);
2612
2613             rotate %= (int)mmac->nparam;
2614             if (rotate < 0)
2615                 rotate += mmac->nparam;
2616
2617             mmac->rotate = rotate;
2618         }
2619         return DIRECTIVE_FOUND;
2620
2621     case PP_REP:
2622         nolist = false;
2623         do {
2624             tline = tline->next;
2625         } while (tok_type_(tline, TOK_WHITESPACE));
2626
2627         if (tok_type_(tline, TOK_ID) &&
2628             nasm_stricmp(tline->text, ".nolist") == 0) {
2629             nolist = true;
2630             do {
2631                 tline = tline->next;
2632             } while (tok_type_(tline, TOK_WHITESPACE));
2633         }
2634
2635         if (tline) {
2636             t = expand_smacro(tline);
2637             tptr = &t;
2638             tokval.t_type = TOKEN_INVALID;
2639             evalresult =
2640                 evaluate(ppscan, tptr, &tokval, NULL, pass, error, NULL);
2641             if (!evalresult) {
2642                 free_tlist(origline);
2643                 return DIRECTIVE_FOUND;
2644             }
2645             if (tokval.t_type)
2646                 error(ERR_WARNING|ERR_PASS1,
2647                       "trailing garbage after expression ignored");
2648             if (!is_simple(evalresult)) {
2649                 error(ERR_NONFATAL, "non-constant value given to `%%rep'");
2650                 return DIRECTIVE_FOUND;
2651             }
2652             count = reloc_value(evalresult) + 1;
2653         } else {
2654             error(ERR_NONFATAL, "`%%rep' expects a repeat count");
2655             count = 0;
2656         }
2657         free_tlist(origline);
2658
2659         tmp_defining = defining;
2660         defining = nasm_malloc(sizeof(MMacro));
2661         defining->name = NULL;  /* flags this macro as a %rep block */
2662         defining->casesense = false;
2663         defining->plus = false;
2664         defining->nolist = nolist;
2665         defining->in_progress = count;
2666         defining->nparam_min = defining->nparam_max = 0;
2667         defining->defaults = NULL;
2668         defining->dlist = NULL;
2669         defining->expansion = NULL;
2670         defining->next_active = istk->mstk;
2671         defining->rep_nest = tmp_defining;
2672         return DIRECTIVE_FOUND;
2673
2674     case PP_ENDREP:
2675         if (!defining || defining->name) {
2676             error(ERR_NONFATAL, "`%%endrep': no matching `%%rep'");
2677             return DIRECTIVE_FOUND;
2678         }
2679
2680         /*
2681          * Now we have a "macro" defined - although it has no name
2682          * and we won't be entering it in the hash tables - we must
2683          * push a macro-end marker for it on to istk->expansion.
2684          * After that, it will take care of propagating itself (a
2685          * macro-end marker line for a macro which is really a %rep
2686          * block will cause the macro to be re-expanded, complete
2687          * with another macro-end marker to ensure the process
2688          * continues) until the whole expansion is forcibly removed
2689          * from istk->expansion by a %exitrep.
2690          */
2691         l = nasm_malloc(sizeof(Line));
2692         l->next = istk->expansion;
2693         l->finishes = defining;
2694         l->first = NULL;
2695         istk->expansion = l;
2696
2697         istk->mstk = defining;
2698
2699         list->uplevel(defining->nolist ? LIST_MACRO_NOLIST : LIST_MACRO);
2700         tmp_defining = defining;
2701         defining = defining->rep_nest;
2702         free_tlist(origline);
2703         return DIRECTIVE_FOUND;
2704
2705     case PP_EXITREP:
2706         /*
2707          * We must search along istk->expansion until we hit a
2708          * macro-end marker for a macro with no name. Then we set
2709          * its `in_progress' flag to 0.
2710          */
2711         for (l = istk->expansion; l; l = l->next)
2712             if (l->finishes && !l->finishes->name)
2713                 break;
2714
2715         if (l)
2716             l->finishes->in_progress = 1;
2717         else
2718             error(ERR_NONFATAL, "`%%exitrep' not within `%%rep' block");
2719         free_tlist(origline);
2720         return DIRECTIVE_FOUND;
2721
2722     case PP_XDEFINE:
2723     case PP_IXDEFINE:
2724     case PP_DEFINE:
2725     case PP_IDEFINE:
2726         casesense = (i == PP_DEFINE || i == PP_XDEFINE);
2727
2728         tline = tline->next;
2729         skip_white_(tline);
2730         tline = expand_id(tline);
2731         if (!tline || (tline->type != TOK_ID &&
2732                        (tline->type != TOK_PREPROC_ID ||
2733                         tline->text[1] != '$'))) {
2734             error(ERR_NONFATAL, "`%s' expects a macro identifier",
2735                   pp_directives[i]);
2736             free_tlist(origline);
2737             return DIRECTIVE_FOUND;
2738         }
2739
2740         ctx = get_ctx(tline->text, false);
2741
2742         mname = tline->text;
2743         last = tline;
2744         param_start = tline = tline->next;
2745         nparam = 0;
2746
2747         /* Expand the macro definition now for %xdefine and %ixdefine */
2748         if ((i == PP_XDEFINE) || (i == PP_IXDEFINE))
2749             tline = expand_smacro(tline);
2750
2751         if (tok_is_(tline, "(")) {
2752             /*
2753              * This macro has parameters.
2754              */
2755
2756             tline = tline->next;
2757             while (1) {
2758                 skip_white_(tline);
2759                 if (!tline) {
2760                     error(ERR_NONFATAL, "parameter identifier expected");
2761                     free_tlist(origline);
2762                     return DIRECTIVE_FOUND;
2763                 }
2764                 if (tline->type != TOK_ID) {
2765                     error(ERR_NONFATAL,
2766                           "`%s': parameter identifier expected",
2767                           tline->text);
2768                     free_tlist(origline);
2769                     return DIRECTIVE_FOUND;
2770                 }
2771                 tline->type = TOK_SMAC_PARAM + nparam++;
2772                 tline = tline->next;
2773                 skip_white_(tline);
2774                 if (tok_is_(tline, ",")) {
2775                     tline = tline->next;
2776                 } else {
2777                     if (!tok_is_(tline, ")")) {
2778                         error(ERR_NONFATAL,
2779                               "`)' expected to terminate macro template");
2780                         free_tlist(origline);
2781                         return DIRECTIVE_FOUND;
2782                     }
2783                     break;
2784                 }
2785             }
2786             last = tline;
2787             tline = tline->next;
2788         }
2789         if (tok_type_(tline, TOK_WHITESPACE))
2790             last = tline, tline = tline->next;
2791         macro_start = NULL;
2792         last->next = NULL;
2793         t = tline;
2794         while (t) {
2795             if (t->type == TOK_ID) {
2796                 for (tt = param_start; tt; tt = tt->next)
2797                     if (tt->type >= TOK_SMAC_PARAM &&
2798                         !strcmp(tt->text, t->text))
2799                         t->type = tt->type;
2800             }
2801             tt = t->next;
2802             t->next = macro_start;
2803             macro_start = t;
2804             t = tt;
2805         }
2806         /*
2807          * Good. We now have a macro name, a parameter count, and a
2808          * token list (in reverse order) for an expansion. We ought
2809          * to be OK just to create an SMacro, store it, and let
2810          * free_tlist have the rest of the line (which we have
2811          * carefully re-terminated after chopping off the expansion
2812          * from the end).
2813          */
2814         define_smacro(ctx, mname, casesense, nparam, macro_start);
2815         free_tlist(origline);
2816         return DIRECTIVE_FOUND;
2817
2818     case PP_UNDEF:
2819         tline = tline->next;
2820         skip_white_(tline);
2821         tline = expand_id(tline);
2822         if (!tline || (tline->type != TOK_ID &&
2823                        (tline->type != TOK_PREPROC_ID ||
2824                         tline->text[1] != '$'))) {
2825             error(ERR_NONFATAL, "`%%undef' expects a macro identifier");
2826             free_tlist(origline);
2827             return DIRECTIVE_FOUND;
2828         }
2829         if (tline->next) {
2830             error(ERR_WARNING|ERR_PASS1,
2831                   "trailing garbage after macro name ignored");
2832         }
2833
2834         /* Find the context that symbol belongs to */
2835         ctx = get_ctx(tline->text, false);
2836         undef_smacro(ctx, tline->text);
2837         free_tlist(origline);
2838         return DIRECTIVE_FOUND;
2839
2840     case PP_DEFSTR:
2841     case PP_IDEFSTR:
2842         casesense = (i == PP_DEFSTR);
2843
2844         tline = tline->next;
2845         skip_white_(tline);
2846         tline = expand_id(tline);
2847         if (!tline || (tline->type != TOK_ID &&
2848                        (tline->type != TOK_PREPROC_ID ||
2849                         tline->text[1] != '$'))) {
2850             error(ERR_NONFATAL, "`%s' expects a macro identifier",
2851                   pp_directives[i]);
2852             free_tlist(origline);
2853             return DIRECTIVE_FOUND;
2854         }
2855
2856         ctx = get_ctx(tline->text, false);
2857
2858         mname = tline->text;
2859         last = tline;
2860         tline = expand_smacro(tline->next);
2861         last->next = NULL;
2862
2863         while (tok_type_(tline, TOK_WHITESPACE))
2864             tline = delete_Token(tline);
2865
2866         p = detoken(tline, false);
2867         macro_start = nasm_malloc(sizeof(*macro_start));
2868         macro_start->next = NULL;
2869         macro_start->text = nasm_quote(p, strlen(p));
2870         macro_start->type = TOK_STRING;
2871         macro_start->a.mac = NULL;
2872         nasm_free(p);
2873
2874         /*
2875          * We now have a macro name, an implicit parameter count of
2876          * zero, and a string token to use as an expansion. Create
2877          * and store an SMacro.
2878          */
2879         define_smacro(ctx, mname, casesense, 0, macro_start);
2880         free_tlist(origline);
2881         return DIRECTIVE_FOUND;
2882
2883     case PP_PATHSEARCH:
2884     {
2885         FILE *fp;
2886         StrList *xsl = NULL;
2887         StrList **xst = &xsl;
2888
2889         casesense = true;
2890
2891         tline = tline->next;
2892         skip_white_(tline);
2893         tline = expand_id(tline);
2894         if (!tline || (tline->type != TOK_ID &&
2895                        (tline->type != TOK_PREPROC_ID ||
2896                         tline->text[1] != '$'))) {
2897             error(ERR_NONFATAL,
2898                   "`%%pathsearch' expects a macro identifier as first parameter");
2899             free_tlist(origline);
2900             return DIRECTIVE_FOUND;
2901         }
2902         ctx = get_ctx(tline->text, false);
2903
2904         mname = tline->text;
2905         last = tline;
2906         tline = expand_smacro(tline->next);
2907         last->next = NULL;
2908
2909         t = tline;
2910         while (tok_type_(t, TOK_WHITESPACE))
2911             t = t->next;
2912
2913         if (!t || (t->type != TOK_STRING &&
2914                    t->type != TOK_INTERNAL_STRING)) {
2915             error(ERR_NONFATAL, "`%%pathsearch' expects a file name");
2916             free_tlist(tline);
2917             free_tlist(origline);
2918             return DIRECTIVE_FOUND;     /* but we did _something_ */
2919         }
2920         if (t->next)
2921             error(ERR_WARNING|ERR_PASS1,
2922                   "trailing garbage after `%%pathsearch' ignored");
2923         p = t->text;
2924         if (t->type != TOK_INTERNAL_STRING)
2925             nasm_unquote(p, NULL);
2926
2927         fp = inc_fopen(p, &xsl, &xst, true);
2928         if (fp) {
2929             p = xsl->str;
2930             fclose(fp);         /* Don't actually care about the file */
2931         }
2932         macro_start = nasm_malloc(sizeof(*macro_start));
2933         macro_start->next = NULL;
2934         macro_start->text = nasm_quote(p, strlen(p));
2935         macro_start->type = TOK_STRING;
2936         macro_start->a.mac = NULL;
2937         if (xsl)
2938             nasm_free(xsl);
2939
2940         /*
2941          * We now have a macro name, an implicit parameter count of
2942          * zero, and a string token to use as an expansion. Create
2943          * and store an SMacro.
2944          */
2945         define_smacro(ctx, mname, casesense, 0, macro_start);
2946         free_tlist(tline);
2947         free_tlist(origline);
2948         return DIRECTIVE_FOUND;
2949     }
2950
2951     case PP_STRLEN:
2952         casesense = true;
2953
2954         tline = tline->next;
2955         skip_white_(tline);
2956         tline = expand_id(tline);
2957         if (!tline || (tline->type != TOK_ID &&
2958                        (tline->type != TOK_PREPROC_ID ||
2959                         tline->text[1] != '$'))) {
2960             error(ERR_NONFATAL,
2961                   "`%%strlen' expects a macro identifier as first parameter");
2962             free_tlist(origline);
2963             return DIRECTIVE_FOUND;
2964         }
2965         ctx = get_ctx(tline->text, false);
2966
2967         mname = tline->text;
2968         last = tline;
2969         tline = expand_smacro(tline->next);
2970         last->next = NULL;
2971
2972         t = tline;
2973         while (tok_type_(t, TOK_WHITESPACE))
2974             t = t->next;
2975         /* t should now point to the string */
2976         if (t->type != TOK_STRING) {
2977             error(ERR_NONFATAL,
2978                   "`%%strlen` requires string as second parameter");
2979             free_tlist(tline);
2980             free_tlist(origline);
2981             return DIRECTIVE_FOUND;
2982         }
2983
2984         macro_start = nasm_malloc(sizeof(*macro_start));
2985         macro_start->next = NULL;
2986         make_tok_num(macro_start, nasm_unquote(t->text, NULL));
2987         macro_start->a.mac = NULL;
2988
2989         /*
2990          * We now have a macro name, an implicit parameter count of
2991          * zero, and a numeric token to use as an expansion. Create
2992          * and store an SMacro.
2993          */
2994         define_smacro(ctx, mname, casesense, 0, macro_start);
2995         free_tlist(tline);
2996         free_tlist(origline);
2997         return DIRECTIVE_FOUND;
2998
2999     case PP_STRCAT:
3000         casesense = true;
3001
3002         tline = tline->next;
3003         skip_white_(tline);
3004         tline = expand_id(tline);
3005         if (!tline || (tline->type != TOK_ID &&
3006                        (tline->type != TOK_PREPROC_ID ||
3007                         tline->text[1] != '$'))) {
3008             error(ERR_NONFATAL,
3009                   "`%%strcat' expects a macro identifier as first parameter");
3010             free_tlist(origline);
3011             return DIRECTIVE_FOUND;
3012         }
3013         ctx = get_ctx(tline->text, false);
3014
3015         mname = tline->text;
3016         last = tline;
3017         tline = expand_smacro(tline->next);
3018         last->next = NULL;
3019
3020         len = 0;
3021         for (t = tline; t; t = t->next) {
3022             switch (t->type) {
3023             case TOK_WHITESPACE:
3024                 break;
3025             case TOK_STRING:
3026                 len += t->a.len = nasm_unquote(t->text, NULL);
3027                 break;
3028             case TOK_OTHER:
3029                 if (!strcmp(t->text, ",")) /* permit comma separators */
3030                     break;
3031                 /* else fall through */
3032             default:
3033                 error(ERR_NONFATAL,
3034                       "non-string passed to `%%strcat' (%d)", t->type);
3035                 free_tlist(tline);
3036                 free_tlist(origline);
3037                 return DIRECTIVE_FOUND;
3038             }
3039         }
3040
3041         p = pp = nasm_malloc(len);
3042         t = tline;
3043         for (t = tline; t; t = t->next) {
3044             if (t->type == TOK_STRING) {
3045                 memcpy(p, t->text, t->a.len);
3046                 p += t->a.len;
3047             }
3048         }
3049
3050         /*
3051          * We now have a macro name, an implicit parameter count of
3052          * zero, and a numeric token to use as an expansion. Create
3053          * and store an SMacro.
3054          */
3055         macro_start = new_Token(NULL, TOK_STRING, NULL, 0);
3056         macro_start->text = nasm_quote(pp, len);
3057         nasm_free(pp);
3058         define_smacro(ctx, mname, casesense, 0, macro_start);
3059         free_tlist(tline);
3060         free_tlist(origline);
3061         return DIRECTIVE_FOUND;
3062
3063     case PP_SUBSTR:
3064     {
3065         int64_t a1, a2;
3066         size_t len;
3067
3068         casesense = true;
3069
3070         tline = tline->next;
3071         skip_white_(tline);
3072         tline = expand_id(tline);
3073         if (!tline || (tline->type != TOK_ID &&
3074                        (tline->type != TOK_PREPROC_ID ||
3075                         tline->text[1] != '$'))) {
3076             error(ERR_NONFATAL,
3077                   "`%%substr' expects a macro identifier as first parameter");
3078             free_tlist(origline);
3079             return DIRECTIVE_FOUND;
3080         }
3081         ctx = get_ctx(tline->text, false);
3082
3083         mname = tline->text;
3084         last = tline;
3085         tline = expand_smacro(tline->next);
3086         last->next = NULL;
3087
3088         t = tline->next;
3089         while (tok_type_(t, TOK_WHITESPACE))
3090             t = t->next;
3091
3092         /* t should now point to the string */
3093         if (t->type != TOK_STRING) {
3094             error(ERR_NONFATAL,
3095                   "`%%substr` requires string as second parameter");
3096             free_tlist(tline);
3097             free_tlist(origline);
3098             return DIRECTIVE_FOUND;
3099         }
3100
3101         tt = t->next;
3102         tptr = &tt;
3103         tokval.t_type = TOKEN_INVALID;
3104         evalresult = evaluate(ppscan, tptr, &tokval, NULL,
3105                               pass, error, NULL);
3106         if (!evalresult) {
3107             free_tlist(tline);
3108             free_tlist(origline);
3109             return DIRECTIVE_FOUND;
3110         } else if (!is_simple(evalresult)) {
3111             error(ERR_NONFATAL, "non-constant value given to `%%substr`");
3112             free_tlist(tline);
3113             free_tlist(origline);
3114             return DIRECTIVE_FOUND;
3115         }
3116         a1 = evalresult->value-1;
3117
3118         while (tok_type_(tt, TOK_WHITESPACE))
3119             tt = tt->next;
3120         if (!tt) {
3121             a2 = 1;             /* Backwards compatibility: one character */
3122         } else {
3123             tokval.t_type = TOKEN_INVALID;
3124             evalresult = evaluate(ppscan, tptr, &tokval, NULL,
3125                                   pass, error, NULL);
3126             if (!evalresult) {
3127                 free_tlist(tline);
3128                 free_tlist(origline);
3129                 return DIRECTIVE_FOUND;
3130             } else if (!is_simple(evalresult)) {
3131                 error(ERR_NONFATAL, "non-constant value given to `%%substr`");
3132                 free_tlist(tline);
3133                 free_tlist(origline);
3134                 return DIRECTIVE_FOUND;
3135             }
3136             a2 = evalresult->value;
3137         }
3138
3139         len = nasm_unquote(t->text, NULL);
3140         if (a2 < 0)
3141             a2 = a2+1+len-a1;
3142         if (a1+a2 > (int64_t)len)
3143             a2 = len-a1;
3144
3145         macro_start = nasm_malloc(sizeof(*macro_start));
3146         macro_start->next = NULL;
3147         macro_start->text = nasm_quote((a1 < 0) ? "" : t->text+a1, a2);
3148         macro_start->type = TOK_STRING;
3149         macro_start->a.mac = NULL;
3150
3151         /*
3152          * We now have a macro name, an implicit parameter count of
3153          * zero, and a numeric token to use as an expansion. Create
3154          * and store an SMacro.
3155          */
3156         define_smacro(ctx, mname, casesense, 0, macro_start);
3157         free_tlist(tline);
3158         free_tlist(origline);
3159         return DIRECTIVE_FOUND;
3160     }
3161
3162     case PP_ASSIGN:
3163     case PP_IASSIGN:
3164         casesense = (i == PP_ASSIGN);
3165
3166         tline = tline->next;
3167         skip_white_(tline);
3168         tline = expand_id(tline);
3169         if (!tline || (tline->type != TOK_ID &&
3170                        (tline->type != TOK_PREPROC_ID ||
3171                         tline->text[1] != '$'))) {
3172             error(ERR_NONFATAL,
3173                   "`%%%sassign' expects a macro identifier",
3174                   (i == PP_IASSIGN ? "i" : ""));
3175             free_tlist(origline);
3176             return DIRECTIVE_FOUND;
3177         }
3178         ctx = get_ctx(tline->text, false);
3179
3180         mname = tline->text;
3181         last = tline;
3182         tline = expand_smacro(tline->next);
3183         last->next = NULL;
3184
3185         t = tline;
3186         tptr = &t;
3187         tokval.t_type = TOKEN_INVALID;
3188         evalresult =
3189             evaluate(ppscan, tptr, &tokval, NULL, pass, error, NULL);
3190         free_tlist(tline);
3191         if (!evalresult) {
3192             free_tlist(origline);
3193             return DIRECTIVE_FOUND;
3194         }
3195
3196         if (tokval.t_type)
3197             error(ERR_WARNING|ERR_PASS1,
3198                   "trailing garbage after expression ignored");
3199
3200         if (!is_simple(evalresult)) {
3201             error(ERR_NONFATAL,
3202                   "non-constant value given to `%%%sassign'",
3203                   (i == PP_IASSIGN ? "i" : ""));
3204             free_tlist(origline);
3205             return DIRECTIVE_FOUND;
3206         }
3207
3208         macro_start = nasm_malloc(sizeof(*macro_start));
3209         macro_start->next = NULL;
3210         make_tok_num(macro_start, reloc_value(evalresult));
3211         macro_start->a.mac = NULL;
3212
3213         /*
3214          * We now have a macro name, an implicit parameter count of
3215          * zero, and a numeric token to use as an expansion. Create
3216          * and store an SMacro.
3217          */
3218         define_smacro(ctx, mname, casesense, 0, macro_start);
3219         free_tlist(origline);
3220         return DIRECTIVE_FOUND;
3221
3222     case PP_LINE:
3223         /*
3224          * Syntax is `%line nnn[+mmm] [filename]'
3225          */
3226         tline = tline->next;
3227         skip_white_(tline);
3228         if (!tok_type_(tline, TOK_NUMBER)) {
3229             error(ERR_NONFATAL, "`%%line' expects line number");
3230             free_tlist(origline);
3231             return DIRECTIVE_FOUND;
3232         }
3233         k = readnum(tline->text, &err);
3234         m = 1;
3235         tline = tline->next;
3236         if (tok_is_(tline, "+")) {
3237             tline = tline->next;
3238             if (!tok_type_(tline, TOK_NUMBER)) {
3239                 error(ERR_NONFATAL, "`%%line' expects line increment");
3240                 free_tlist(origline);
3241                 return DIRECTIVE_FOUND;
3242             }
3243             m = readnum(tline->text, &err);
3244             tline = tline->next;
3245         }
3246         skip_white_(tline);
3247         src_set_linnum(k);
3248         istk->lineinc = m;
3249         if (tline) {
3250             nasm_free(src_set_fname(detoken(tline, false)));
3251         }
3252         free_tlist(origline);
3253         return DIRECTIVE_FOUND;
3254
3255     default:
3256         error(ERR_FATAL,
3257               "preprocessor directive `%s' not yet implemented",
3258               pp_directives[i]);
3259         return DIRECTIVE_FOUND;
3260     }
3261 }
3262
3263 /*
3264  * Ensure that a macro parameter contains a condition code and
3265  * nothing else. Return the condition code index if so, or -1
3266  * otherwise.
3267  */
3268 static int find_cc(Token * t)
3269 {
3270     Token *tt;
3271     int i, j, k, m;
3272
3273     if (!t)
3274             return -1;          /* Probably a %+ without a space */
3275
3276     skip_white_(t);
3277     if (t->type != TOK_ID)
3278         return -1;
3279     tt = t->next;
3280     skip_white_(tt);
3281     if (tt && (tt->type != TOK_OTHER || strcmp(tt->text, ",")))
3282         return -1;
3283
3284     i = -1;
3285     j = elements(conditions);
3286     while (j - i > 1) {
3287         k = (j + i) / 2;
3288         m = nasm_stricmp(t->text, conditions[k]);
3289         if (m == 0) {
3290             i = k;
3291             j = -2;
3292             break;
3293         } else if (m < 0) {
3294             j = k;
3295         } else
3296             i = k;
3297     }
3298     if (j != -2)
3299         return -1;
3300     return i;
3301 }
3302
3303 /*
3304  * Expand MMacro-local things: parameter references (%0, %n, %+n,
3305  * %-n) and MMacro-local identifiers (%%foo).
3306  */
3307 static Token *expand_mmac_params(Token * tline)
3308 {
3309     Token *t, *tt, **tail, *thead;
3310
3311     tail = &thead;
3312     thead = NULL;
3313
3314     while (tline) {
3315         if (tline->type == TOK_PREPROC_ID &&
3316             (((tline->text[1] == '+' || tline->text[1] == '-')
3317               && tline->text[2]) || tline->text[1] == '%'
3318              || (tline->text[1] >= '0' && tline->text[1] <= '9'))) {
3319             char *text = NULL;
3320             int type = 0, cc;   /* type = 0 to placate optimisers */
3321             char tmpbuf[30];
3322             unsigned int n;
3323             int i;
3324             MMacro *mac;
3325
3326             t = tline;
3327             tline = tline->next;
3328
3329             mac = istk->mstk;
3330             while (mac && !mac->name)   /* avoid mistaking %reps for macros */
3331                 mac = mac->next_active;
3332             if (!mac)
3333                 error(ERR_NONFATAL, "`%s': not in a macro call", t->text);
3334             else
3335                 switch (t->text[1]) {
3336                     /*
3337                      * We have to make a substitution of one of the
3338                      * forms %1, %-1, %+1, %%foo, %0.
3339                      */
3340                 case '0':
3341                     type = TOK_NUMBER;
3342                     snprintf(tmpbuf, sizeof(tmpbuf), "%d", mac->nparam);
3343                     text = nasm_strdup(tmpbuf);
3344                     break;
3345                 case '%':
3346                     type = TOK_ID;
3347                     snprintf(tmpbuf, sizeof(tmpbuf), "..@%"PRIu64".",
3348                              mac->unique);
3349                     text = nasm_strcat(tmpbuf, t->text + 2);
3350                     break;
3351                 case '-':
3352                     n = atoi(t->text + 2) - 1;
3353                     if (n >= mac->nparam)
3354                         tt = NULL;
3355                     else {
3356                         if (mac->nparam > 1)
3357                             n = (n + mac->rotate) % mac->nparam;
3358                         tt = mac->params[n];
3359                     }
3360                     cc = find_cc(tt);
3361                     if (cc == -1) {
3362                         error(ERR_NONFATAL,
3363                               "macro parameter %d is not a condition code",
3364                               n + 1);
3365                         text = NULL;
3366                     } else {
3367                         type = TOK_ID;
3368                         if (inverse_ccs[cc] == -1) {
3369                             error(ERR_NONFATAL,
3370                                   "condition code `%s' is not invertible",
3371                                   conditions[cc]);
3372                             text = NULL;
3373                         } else
3374                             text =
3375                                 nasm_strdup(conditions[inverse_ccs[cc]]);
3376                     }
3377                     break;
3378                 case '+':
3379                     n = atoi(t->text + 2) - 1;
3380                     if (n >= mac->nparam)
3381                         tt = NULL;
3382                     else {
3383                         if (mac->nparam > 1)
3384                             n = (n + mac->rotate) % mac->nparam;
3385                         tt = mac->params[n];
3386                     }
3387                     cc = find_cc(tt);
3388                     if (cc == -1) {
3389                         error(ERR_NONFATAL,
3390                               "macro parameter %d is not a condition code",
3391                               n + 1);
3392                         text = NULL;
3393                     } else {
3394                         type = TOK_ID;
3395                         text = nasm_strdup(conditions[cc]);
3396                     }
3397                     break;
3398                 default:
3399                     n = atoi(t->text + 1) - 1;
3400                     if (n >= mac->nparam)
3401                         tt = NULL;
3402                     else {
3403                         if (mac->nparam > 1)
3404                             n = (n + mac->rotate) % mac->nparam;
3405                         tt = mac->params[n];
3406                     }
3407                     if (tt) {
3408                         for (i = 0; i < mac->paramlen[n]; i++) {
3409                             *tail = new_Token(NULL, tt->type, tt->text, 0);
3410                             tail = &(*tail)->next;
3411                             tt = tt->next;
3412                         }
3413                     }
3414                     text = NULL;        /* we've done it here */
3415                     break;
3416                 }
3417             if (!text) {
3418                 delete_Token(t);
3419             } else {
3420                 *tail = t;
3421                 tail = &t->next;
3422                 t->type = type;
3423                 nasm_free(t->text);
3424                 t->text = text;
3425                 t->a.mac = NULL;
3426             }
3427             continue;
3428         } else {
3429             t = *tail = tline;
3430             tline = tline->next;
3431             t->a.mac = NULL;
3432             tail = &t->next;
3433         }
3434     }
3435     *tail = NULL;
3436     t = thead;
3437     for (; t && (tt = t->next) != NULL; t = t->next)
3438         switch (t->type) {
3439         case TOK_WHITESPACE:
3440             if (tt->type == TOK_WHITESPACE) {
3441                 t->next = delete_Token(tt);
3442             }
3443             break;
3444         case TOK_ID:
3445             if (tt->type == TOK_ID || tt->type == TOK_NUMBER) {
3446                 char *tmp = nasm_strcat(t->text, tt->text);
3447                 nasm_free(t->text);
3448                 t->text = tmp;
3449                 t->next = delete_Token(tt);
3450             }
3451             break;
3452         case TOK_NUMBER:
3453             if (tt->type == TOK_NUMBER) {
3454                 char *tmp = nasm_strcat(t->text, tt->text);
3455                 nasm_free(t->text);
3456                 t->text = tmp;
3457                 t->next = delete_Token(tt);
3458             }
3459             break;
3460         default:
3461             break;
3462         }
3463
3464     return thead;
3465 }
3466
3467 /*
3468  * Expand all single-line macro calls made in the token list `tline'
3469  * and return the head of the expanded list. The input list is consumed:
3470  * tokens are moved to the output, or freed and replaced by copies of a
3471  * macro body. A non-NULL input keeps its head Token structure, which is
3472  * overwritten in place, so pointers to it held elsewhere stay valid.
3473  */
3474 #define DEADMAN_LIMIT (1 << 20)   /* cap on main token loop iterations */
3475
3476 static Token *expand_smacro(Token * tline)
3477 {
3478     Token *t, *tt, *mstart, **tail, *thead;
3479     struct hash_table *smtbl;
3480     SMacro *head = NULL, *m;
3481     Token **params;             /* first token of each call argument */
3482     int *paramsize;             /* number of tokens in each argument */
3483     unsigned int nparam, sparam;
3484     int brackets, rescan;
3485     Token *org_tline = tline;
3486     Context *ctx;
3487     char *mname;
3488     int deadman = DEADMAN_LIMIT;
3489
3490     /*
3491      * Trick: the head token's address must not change, because another
3492      * token's "next" field may point at it. So we work on a copy of the
3493      * first token (the original text is freed below, so new_Token is
3494      * assumed to copy it) and copy the result back at the very end.
3495      */
3496     if (org_tline) {
3497         tline =
3498             new_Token(org_tline->next, org_tline->type, org_tline->text,
3499                       0);
3500         tline->a.mac = org_tline->a.mac;
3501         nasm_free(org_tline->text);
3502         org_tline->text = NULL;
3503     }
3504
3505 again:
3506     tail = &thead;
3507     thead = NULL;
3508
3509     while (tline) {             /* main token loop */
3510         if (!--deadman) {
3511             error(ERR_NONFATAL, "interminable macro recursion");
3512             break;
3513         }
3514
3515         if ((mname = tline->text)) {
3516             /* if this token is a local macro, look in local context */
3517             ctx = NULL;
3518             smtbl = &smacros;
3519             if (tline->type == TOK_ID || tline->type == TOK_PREPROC_ID) {
3520                 ctx = get_ctx(mname, true);
3521                 if (ctx)
3522                     smtbl = &ctx->localmac;
3523             }
3524             head = (SMacro *) hash_findix(smtbl, mname);
3525
3526             /*
3527              * We've hit an identifier. As in is_mmacro below, we first
3528              * check whether the identifier is a single-line macro at
3529              * all, then think about checking for parameters if
3530              * necessary.
3531              */
3532             for (m = head; m; m = m->next)
3533                 if (!mstrcmp(m->name, mname, m->casesense))
3534                     break;
3535             if (m) {
3536                 mstart = tline;
3537                 params = NULL;
3538                 paramsize = NULL;
3539                 if (m->nparam == 0) {
3540                     /*
3541                      * Simple case: the macro is parameterless. Discard the
3542                      * one token that the macro call took, and push the
3543                      * expansion back on the to-do stack.
3544                      */
3545                     if (!m->expansion) {   /* no body: built-in or empty */
3546                         if (!strcmp("__FILE__", m->name)) {
3547                             int32_t num = 0;    /* NOTE(review): old text */
3548                             char *file = NULL;  /* is not freed - leak?   */
3549                             src_get(&num, &file);
3550                             tline->text = nasm_quote(file, strlen(file));
3551                             tline->type = TOK_STRING;
3552                             nasm_free(file);
3553                             continue;
3554                         }
3555                         if (!strcmp("__LINE__", m->name)) {
3556                             nasm_free(tline->text);
3557                             make_tok_num(tline, src_get_linnum());
3558                             continue;
3559                         }
3560                         if (!strcmp("__BITS__", m->name)) {
3561                             nasm_free(tline->text);
3562                             make_tok_num(tline, globalbits);
3563                             continue;
3564                         }
3565                         tline = delete_Token(tline);   /* empty macro */
3566                         continue;
3567                     }
3568                 } else {
3569                     /*
3570                      * Complicated case: at least one macro with this name
3571                      * exists and takes parameters. We must find the
3572                      * parameters in the call, count them, find the SMacro
3573                      * that corresponds to that form of the macro call, and
3574                      * substitute for the parameters when we expand. What a
3575                      * pain.
3576                      */
3577                     /* Skip whitespace after the name, retiring any
3578                        SMAC_END markers that are met on the way. */
3579                     do {
3580                         t = tline->next;
3581                         while (tok_type_(t, TOK_SMAC_END)) {
3582                             t->a.mac->in_progress = false;
3583                             t->text = NULL;
3584                             t = tline->next = delete_Token(t);
3585                         }
3586                         tline = t;
3587                     } while (tok_type_(tline, TOK_WHITESPACE));
3588                     if (!tok_is_(tline, "(")) {
3589                         /*
3590                          * This macro wasn't called with parameters: ignore
3591                          * the call. (Behaviour borrowed from gnu cpp.)
3592                          */
3593                         tline = mstart;
3594                         m = NULL;
3595                     } else {
3596                         int paren = 0;  /* depth of nested ( ) */
3597                         int white = 0;  /* whitespace not yet counted */
3598                         brackets = 0;   /* >0 inside { }, -1 just after } */
3599                         nparam = 0;
3600                         sparam = PARAM_DELTA;
3601                         params = nasm_malloc(sparam * sizeof(Token *));
3602                         params[0] = tline->next;
3603                         paramsize = nasm_malloc(sparam * sizeof(int));
3604                         paramsize[0] = 0;
3605                         while (true) {  /* parameter loop */
3606                             /*
3607                              * Step to the next token, discarding SMAC_END
3608                              * markers (unusual expansions can build a call).
3609                              */
3610                             t = tline->next;
3611                             while (tok_type_(t, TOK_SMAC_END)) {
3612                                 t->a.mac->in_progress = false;
3613                                 t->text = NULL;
3614                                 t = tline->next = delete_Token(t);
3615                             }
3616                             tline = t;
3617
3618                             if (!tline) {
3619                                 error(ERR_NONFATAL,
3620                                       "macro call expects terminating `)'");
3621                                 break;
3622                             }
3623                             if (tline->type == TOK_WHITESPACE
3624                                 && brackets <= 0) {
3625                                 if (paramsize[nparam])
3626                                     white++;
3627                                 else
3628                                     params[nparam] = tline->next;
3629                                 continue;       /* parameter loop */
3630                             }
3631                             if (tline->type == TOK_OTHER
3632                                 && tline->text[1] == 0) {
3633                                 char ch = tline->text[0];
3634                                 if (ch == ',' && !paren && brackets <= 0) {
3635                                     if (++nparam >= sparam) {
3636                                         sparam += PARAM_DELTA;
3637                                         params = nasm_realloc(params,
3638                                                               sparam *
3639                                                               sizeof(Token
3640                                                                      *));
3641                                         paramsize =
3642                                             nasm_realloc(paramsize,
3643                                                          sparam *
3644                                                          sizeof(int));
3645                                     }
3646                                     params[nparam] = tline->next;
3647                                     paramsize[nparam] = 0;
3648                                     white = 0;
3649                                     continue;   /* parameter loop */
3650                                 }
3651                                 if (ch == '{' &&
3652                                     (brackets > 0 || (brackets == 0 &&
3653                                                       !paramsize[nparam])))
3654                                 {
3655                                     if (!(brackets++)) {
3656                                         params[nparam] = tline->next;
3657                                         continue;       /* parameter loop */
3658                                     }
3659                                 }
3660                                 if (ch == '}' && brackets > 0)
3661                                     if (--brackets == 0) {
3662                                         brackets = -1;
3663                                         continue;       /* parameter loop */
3664                                     }
3665                                 if (ch == '(' && !brackets)
3666                                     paren++;
3667                                 if (ch == ')' && brackets <= 0)
3668                                     if (--paren < 0)
3669                                         break;
3670                             }
3671                             if (brackets < 0) {
3672                                 brackets = 0;
3673                                 error(ERR_NONFATAL, "braces do not "
3674                                       "enclose all of macro parameter");
3675                             }
3676                             paramsize[nparam] += white + 1;
3677                             white = 0;
3678                         }       /* parameter loop */
3679                         nparam++;       /* last index -> argument count */
3680                         while (m && (m->nparam != nparam ||
3681                                      mstrcmp(m->name, mname,
3682                                              m->casesense)))
3683                             m = m->next;
3684                         if (!m)
3685                             error(ERR_WARNING|ERR_PASS1|ERR_WARN_MNP,
3686                                   "macro `%s' exists, "
3687                                   "but not taking %d parameters",
3688                                   mstart->text, nparam);
3689                     }
3690                 }
3691                 if (m && m->in_progress)
3692                     m = NULL;
3693                 if (!m) {       /* in progress or didn't find '(' or wrong nparam */
3694                     /*
3695                      * Design question: should we handle !tline, which
3696                      * indicates missing ')' here, or expand those
3697                      * macros anyway, which requires the (t) test a few
3698                      * lines down?
3699                      */
3700                     nasm_free(params);
3701                     nasm_free(paramsize);
3702                     tline = mstart;
3703                 } else {
3704                     /*
3705                      * Expand the macro: we are placed on the last token of the
3706                      * call, so that we can easily split the call from the
3707                      * following tokens. We also start by pushing an SMAC_END
3708                      * token for the cycle removal.
3709                      */
3710                     t = tline;
3711                     if (t) {
3712                         tline = t->next;
3713                         t->next = NULL;
3714                     }
3715                     tt = new_Token(tline, TOK_SMAC_END, NULL, 0);
3716                     tt->a.mac = m;
3717                     m->in_progress = true;
3718                     tline = tt;
3719                     for (t = m->expansion; t; t = t->next) {
3720                         if (t->type >= TOK_SMAC_PARAM) {
3721                             Token *pcopy = tline, **ptail = &pcopy;
3722                             Token *ttt, *pt;
3723                             int i;
3724                             /* copy the argument's tokens in front of tline */
3725                             ttt = params[t->type - TOK_SMAC_PARAM];
3726                             for (i = paramsize[t->type - TOK_SMAC_PARAM];
3727                                  --i >= 0;) {
3728                                 pt = *ptail =
3729                                     new_Token(tline, ttt->type, ttt->text,
3730                                               0);
3731                                 ptail = &pt->next;
3732                                 ttt = ttt->next;
3733                             }
3734                             tline = pcopy;
3735                         } else if (t->type == TOK_PREPROC_Q) {
3736                             tt = new_Token(tline, TOK_ID, mname, 0);
3737                             tline = tt;
3738                         } else if (t->type == TOK_PREPROC_QQ) {
3739                             tt = new_Token(tline, TOK_ID, m->name, 0);
3740                             tline = tt;
3741                         } else {
3742                             tt = new_Token(tline, t->type, t->text, 0);
3743                             tline = tt;
3744                         }
3745                     }
3746
3747                     /*
3748                      * Having done that, get rid of the macro call, and clean
3749                      * up the parameters.
3750                      */
3751                     nasm_free(params);
3752                     nasm_free(paramsize);
3753                     free_tlist(mstart);
3754                     continue;   /* main token loop */
3755                 }
3756             }
3757         }
3758         /* Nothing expanded: retire an end marker or emit the token */
3759         if (tline->type == TOK_SMAC_END) {
3760             tline->a.mac->in_progress = false;
3761             tline = delete_Token(tline);
3762         } else {
3763             t = *tail = tline;
3764             tline = tline->next;
3765             t->a.mac = NULL;
3766             t->next = NULL;
3767             tail = &t->next;
3768         }
3769     }
3770
3771     /*
3772      * Now scan the entire line and look for successive TOK_IDs that resulted
3773      * after expansion (they can't be produced by tokenize()). The successive
3774      * TOK_IDs should be concatenated.
3775      * Also we look for %+ tokens and concatenate the tokens before and after
3776      * them (without white spaces in between).
3777      */
3778     t = thead;
3779     rescan = 0;
3780     while (t) {
3781         while (t && t->type != TOK_ID && t->type != TOK_PREPROC_ID)
3782             t = t->next;
3783         if (!t || !t->next)
3784             break;
3785         if (t->next->type == TOK_ID ||
3786             t->next->type == TOK_PREPROC_ID ||
3787             t->next->type == TOK_NUMBER) {
3788             char *p = nasm_strcat(t->text, t->next->text);
3789             nasm_free(t->text);
3790             t->next = delete_Token(t->next);
3791             t->text = p;
3792             rescan = 1;
3793         } else if (t->next->type == TOK_WHITESPACE && t->next->next &&
3794                    t->next->next->type == TOK_PREPROC_ID &&
3795                    strcmp(t->next->next->text, "%+") == 0) {
3796             /* free the next whitespace, the %+ token and next whitespace */
3797             int i;
3798             for (i = 1; i <= 3; i++) {
3799                 if (!t->next
3800                     || (i != 2 && t->next->type != TOK_WHITESPACE))
3801                     break;
3802                 t->next = delete_Token(t->next);
3803             }                   /* endfor */
3804         } else
3805             t = t->next;
3806     }
3807     /* If we concatenated something, re-scan the line for macros */
3808     if (rescan) {
3809         tline = thead;
3810         goto again;
3811     }
3812
3813     if (org_tline) {
3814         if (thead) {
3815             *org_tline = *thead;
3816             /* since we just gave text to org_tline, don't free it */
3817             thead->text = NULL;
3818             delete_Token(thead);
3819         } else {
3820             /* The line expanded to nothing. The head token has to stay
3821                (see the trick at the top), so instead of returning NULL
3822                we turn it into a single WHITESPACE token. */
3823             memset(org_tline, 0, sizeof(*org_tline));
3824             org_tline->text = NULL;
3825             org_tline->type = TOK_WHITESPACE;
3826         }
3827         thead = org_tline;
3828     }
3829
3830     return thead;
3831 }
3832
3833 /*
3834  * Variant of expand_smacro meant for macro identifiers, applied right
3835  * before they are fetched. A name may be written as several
3836  * adjacent tokens; only in that case is it expanded. Example:
3837  *
3838  *      %define %$abc cde
3839  *
3840  * Here %$abc is a single token and is returned untouched, so that
3841  * %define receives the name itself. Whereas in
3842  *
3843  *      %define _%$abc cde
3844  *
3845  * the name spans two tokens: %$abc is expanded first (or kept as is if
3846  * it has no value) and the adjacent pieces are joined into one name.
3847  *
3848  * Only the first token together with the ID, PREPROC_ID and NUMBER
3849  * tokens directly following it is passed to expand_smacro; the rest
3850  * of the line is detached for the duration of the call and hooked
3851  * back on to the end of the result afterwards.
3852  */
3853 static Token *expand_id(Token * tline)
3854 {
3855     Token *last, *rest, *p;
3856
3857     if (tline == NULL || tline->next == NULL)
3858         return tline;
3859
3860     /* Find the last token of the run that makes up the name */
3861     for (last = tline; last->next != NULL; last = last->next) {
3862         int kind = last->next->type;
3863
3864         if (kind != TOK_ID && kind != TOK_PREPROC_ID && kind != TOK_NUMBER)
3865             break;
3866     }
3867
3868     /* A name made of a single token is left alone */
3869     if (last == tline)
3870         return tline;
3871
3872     /* Cut the list after the name so that expand_smacro stops there */
3873     rest = last->next;
3874     last->next = NULL;
3875
3876     tline = expand_smacro(tline);
3877
3878     /* The list may have changed: find its new end and re-join the tail */
3879     for (p = tline; p != NULL; p = p->next) {
3880         if (p->next == NULL) {
3881             p->next = rest;
3882             break;
3883         }
3884     }
3885
3886     return tline;
3887 }
3888
3889 /*
3890  * True if multi-line macro `m' can be called with `nparam' arguments:
3891  * at least nparam_min, and at most nparam_max unless it is a Plus macro.
3892  */
3893 static int mmac_takes(const MMacro *m, int nparam)
3894 {
3895     return m->nparam_min <= nparam
3896         && (m->plus || nparam <= m->nparam_max);
3897 }
3898
3899 /*
3900  * Decide whether the line starting at `tline' is a call to a multi-line
3901  * macro. `tline' is the token holding the candidate name; an initial
3902  * label is not handled here but by expand_mmacro.
3903  *
3904  * On success the matching MMacro is returned and *params_array receives
3905  * a NULL-terminated array of pointers to the first token of each
3906  * argument, with the macro's default arguments appended where the call
3907  * supplied fewer than nparam_min + ndefs. The array is heap-allocated.
3908  *
3909  * NULL is returned, and *params_array left untouched, when no macro has
3910  * that name, when the macro accepting this argument count is already in
3911  * progress, or when no same-named macro accepts this argument count; in
3912  * the last case a warning is issued as well.
3913  */
3914 static MMacro *is_mmacro(Token * tline, Token *** params_array)
3915 {
3916     MMacro *m;
3917     Token **params;
3918     int nparam;
3919
3920     /*
3921      * Cheap test first: walk the hash chain for a macro of this name,
3922      * and give up before counting anything if there is none.
3923      */
3924     m = (MMacro *) hash_findix(&mmacros, tline->text);
3925     while (m && mstrcmp(m->name, tline->text, m->casesense))
3926         m = m->next;
3927     if (!m)
3928         return NULL;
3929
3930     /*
3931      * Count and demarcate the arguments that follow the name.
3932      */
3933     count_mmac_params(tline->next, &nparam, &params);
3934
3935     /*
3936      * Try each same-named macro in turn until the count fits.
3937      */
3938     while (!mmac_takes(m, nparam)) {
3939         do {
3940             m = m->next;
3941         } while (m && mstrcmp(m->name, tline->text, m->casesense));
3942
3943         if (!m) {
3944             /* The name exists, but never with this many arguments */
3945             error(ERR_WARNING|ERR_PASS1|ERR_WARN_MNP,
3946                   "macro `%s' exists, but not taking %d parameters",
3947                   tline->text, nparam);
3948             nasm_free(params);
3949             return NULL;
3950         }
3951     }
3952
3953     /*
3954      * Cycle removal: a macro that is in progress is not expanded again.
3955      */
3956     if (m->in_progress) {
3957         nasm_free(params);
3958         return NULL;
3959     }
3960
3961     /*
3962      * Top the list up with default arguments if the call was short.
3963      */
3964     if (m->defaults && nparam < m->nparam_min + m->ndefs) {
3965         params = nasm_realloc(params,
3966                               (m->nparam_min + m->ndefs + 1)
3967                               * sizeof(*params));
3968         for (; nparam < m->nparam_min + m->ndefs; nparam++)
3969             params[nparam] = m->defaults[nparam - m->nparam_min];
3970     }
3971
3972     /*
3973      * In Plus mode, arguments beyond nparam_max are not counted.
3974      */
3975     if (m->plus && nparam > m->nparam_max)
3976         nparam = m->nparam_max;
3977
3978     /*
3979      * Special case: no array came back at all, so make a minimal one.
3980      */
3981     if (!params) {
3982         params = nasm_malloc(sizeof(*params));
3983         nparam = 0;
3984     }
3985
3986     /*
3987      * Terminate the list and hand it over.
3988      */
3989     params[nparam] = NULL;
3990     *params_array = params;
3991     return m;
3992 }
3993
3994 /*
3995  * If `tline' is a multi-line macro call, optionally preceded by a label
3996  * (and a colon), push a copy of the macro body on istk->expansion, mark
3997  * the macro as in progress and return 1. Otherwise return 0.
3998  */
3999 static int expand_mmacro(Token * tline)
4000 {
4001     Token *startline = tline;
4002     Token *label = NULL;
4003     int dont_prepend = 0;       /* 1: label had a colon; -1: body uses %00 */
4004     Token **params, *t, *mtok, *tt;
4005     MMacro *m;
4006     Line *l, *ll;
4007     int i, nparam, *paramlen;
4008     const char *mname;
4009
4010     t = tline;
4011     skip_white_(t);
4012     /* The first name may be an ordinary or a preprocessor identifier */
4013     if (!tok_type_(t, TOK_ID) && !tok_type_(t, TOK_PREPROC_ID))
4014         return 0;
4015     mtok = t;                   /* NOTE(review): never read afterwards */
4016     m = is_mmacro(t, &params);
4017     if (m) {
4018         mname = t->text;
4019     } else {
4020         Token *last;
4021         /*
4022          * We have an id which isn't a macro call. We'll assume
4023          * it might be a label; we'll also check to see if a
4024          * colon follows it. Then, if there's another id after
4025          * that lot, we'll check it again for macro-hood.
4026          */
4027         label = last = t;
4028         t = t->next;
4029         if (tok_type_(t, TOK_WHITESPACE))
4030             last = t, t = t->next;
4031         if (tok_is_(t, ":")) {
4032             dont_prepend = 1;
4033             last = t, t = t->next;
4034             if (tok_type_(t, TOK_WHITESPACE))
4035                 last = t, t = t->next;
4036         }
4037         if (!tok_type_(t, TOK_ID) || (m = is_mmacro(t, &params)) == NULL)
4038             return 0;
4039         last->next = NULL;      /* cut the label part off the call */
4040         mname = t->text;
4041         tline = t;
4042     }
4043
4044     /*
4045      * Fix up the parameters: this involves stripping leading and
4046      * trailing whitespace, then stripping braces if they are
4047      * present.
4048      */
4049     for (nparam = 0; params[nparam]; nparam++) ;        /* count them */
4050     paramlen = nparam ? nasm_malloc(nparam * sizeof(*paramlen)) : NULL;
4051
4052     for (i = 0; params[i]; i++) {
4053         int brace = false;
4054         int comma = (!m->plus || i < nparam - 1);  /* does a comma end it? */
4055
4056         t = params[i];
4057         skip_white_(t);
4058         if (tok_is_(t, "{"))
4059             t = t->next, brace = true, comma = false;
4060         params[i] = t;
4061         paramlen[i] = 0;
4062         while (t) {
4063             if (comma && t->type == TOK_OTHER && !strcmp(t->text, ","))
4064                 break;          /* ... because we have hit a comma */
4065             if (comma && t->type == TOK_WHITESPACE
4066                 && tok_is_(t->next, ","))
4067                 break;          /* ... or a space then a comma */
4068             if (brace && t->type == TOK_OTHER && !strcmp(t->text, "}"))
4069                 break;          /* ... or a brace */
4070             t = t->next;
4071             paramlen[i]++;
4072         }
4073     }
4074
4075     /*
4076      * OK, we have a MMacro structure together with a set of
4077      * parameters. We must now go through the expansion and push
4078      * copies of each Line on to istk->expansion. Substitution of
4079      * parameter tokens and macro-local tokens doesn't get done
4080      * until the single-line macro substitution process; this is
4081      * because delaying them allows us to change the semantics
4082      * later through %rotate.
4083      *
4084      * First, push an end marker on to istk->expansion, mark this
4085      * macro as in progress, and set up its invocation-specific
4086      * variables.
4087      */
4088     ll = nasm_malloc(sizeof(Line));
4089     ll->next = istk->expansion;
4090     ll->finishes = m;
4091     ll->first = NULL;
4092     istk->expansion = ll;
4093
4094     m->in_progress = true;
4095     m->params = params;
4096     m->iline = tline;
4097     m->nparam = nparam;
4098     m->rotate = 0;
4099     m->paramlen = paramlen;
4100     m->unique = unique++;
4101     m->lineno = 0;
4102     /* link m in at the head of the istk->mstk list */
4103     m->next_active = istk->mstk;
4104     istk->mstk = m;
4105     /* Push copies of the body lines; m->expansion is presumably reversed */
4106     for (l = m->expansion; l; l = l->next) {
4107         Token **tail;
4108
4109         ll = nasm_malloc(sizeof(Line));
4110         ll->finishes = NULL;
4111         ll->next = istk->expansion;
4112         istk->expansion = ll;
4113         tail = &ll->first;
4114
4115         for (t = l->first; t; t = t->next) {
4116             Token *x = t;
4117             switch (t->type) {
4118             case TOK_PREPROC_Q:
4119                 tt = *tail = new_Token(NULL, TOK_ID, mname, 0);
4120                 break;
4121             case TOK_PREPROC_QQ:
4122                 tt = *tail = new_Token(NULL, TOK_ID, m->name, 0);
4123                 break;
4124             case TOK_PREPROC_ID:
4125                 if (t->text[1] == '0' && t->text[2] == '0') {   /* %00 */
4126                     dont_prepend = -1;
4127                     x = label;  /* substitute the label, if there is one */
4128                     if (!x)
4129                         continue;
4130                 }
4131                 /* fall through */
4132             default:
4133                 tt = *tail = new_Token(NULL, x->type, x->text, 0);
4134                 break;
4135             }
4136             tail = &tt->next;
4137         }
4138         *tail = NULL;
4139     }
4140
4141     /*
4142      * If we had a label, push it on as the first line of
4143      * the macro expansion.
4144      */
4145     if (label) {
4146         if (dont_prepend < 0)   /* the body placed the label via %00 */
4147             free_tlist(startline);
4148         else {
4149             ll = nasm_malloc(sizeof(Line));
4150             ll->finishes = NULL;
4151             ll->next = istk->expansion;
4152             istk->expansion = ll;
4153             ll->first = startline;
4154             if (!dont_prepend) {        /* no colon was given: add one */
4155                 while (label->next)
4156                     label = label->next;
4157                 label->next = tt = new_Token(NULL, TOK_OTHER, ":", 0);
4158             }
4159         }
4160     }
4161
4162     list->uplevel(m->nolist ? LIST_MACRO_NOLIST : LIST_MACRO);
4163
4164     return 1;
4165 }
4166
4167 /* Format a diagnostic; prefix it with the macro at istk->mstk, if named */
4168 static void verror(int severity, const char *fmt, va_list arg)
4169 {
4170     char msg[1024];
4171     MMacro *mac = istk ? istk->mstk : NULL;
4172
4173     vsnprintf(msg, sizeof msg, fmt, arg);
4174     if (!mac || !mac->name) {
4175         _error(severity, "%s", msg);
4176         return;
4177     }
4178     _error(severity, "(%s:%d) %s", mac->name, mac->lineno, msg);
4179 }
4180
4181 /*
4182  * Report a preprocessor diagnostic through verror(). Nothing is printed
4183  * while the conditional at the head of istk->conds is not emitting,
4184  * i.e. when the offending line sits in a skipped branch.
4185  */
4186 static void error(int severity, const char *fmt, ...)
4187 {
4188     va_list ap;
4189     int muted = istk && istk->conds && !emitting(istk->conds->state);
4190
4191     if (!muted) {
4192         va_start(ap, fmt);
4193         verror(severity, fmt, ap);
4194         va_end(ap);
4195     }
4196 }
4197
4198 /*
4199  * Variant of error() for %else and friends. Those directives are
4200  * evaluated in the state of the previous branch, so error() could
4201  * swallow their diagnostics, e.g. in
4202  *   %if 0 ... %else trailing garbage ... %endif
4203  * Here a message is dropped only when the state is COND_NEVER.
4204  */
4205 static void error_precond(int severity, const char *fmt, ...)
4206 {
4207     va_list ap;
4208
4209     /* Keep quiet only when the branch is really dead */
4210     if (!istk || !istk->conds || istk->conds->state != COND_NEVER) {
4211         va_start(ap, fmt);
4212         verror(severity, fmt, ap);
4213         va_end(ap);
4214     }
4215 }
4216
4217 /*
4218  * Start preprocessing `file' for pass `apass': open the file, reset the
4219  * preprocessor's global state, record the file in the dependency list
4220  * if one was given, and define the pass-dependent __PASS__ macro.
4221  */
4222 static void
4223 pp_reset(char *file, int apass, efunc errfunc, evalfunc eval,
4224          ListGen * listgen, StrList **deplist)
4225 {
4226     Token *passtok;
4227
4228     _error = errfunc;
4229     cstk = NULL;
4230     istk = nasm_malloc(sizeof(Include));
4231     istk->next = NULL;
4232     istk->conds = NULL;
4233     istk->expansion = NULL;
4234     istk->mstk = NULL;
4235     istk->fp = fopen(file, "r");
4236     istk->fname = NULL;
4237     src_set_fname(nasm_strdup(file));
4238     src_set_linnum(0);
4239     istk->lineinc = 1;
4240     if (istk->fp == NULL)
4241         error(ERR_FATAL|ERR_NOFILE, "unable to open input file `%s'",
4242               file);
4243
4244     defining = NULL;
4245     nested_mac_count = 0;
4246     nested_rep_count = 0;
4247     init_macros();
4248     unique = 0;
4249     stdmacpos = tasm_compatible_mode ? nasm_stdmac : nasm_stdmac_after_tasm;
4250     any_extrastdmac = extrastdmac && *extrastdmac;
4251     do_predef = true;
4252     list = listgen;
4253     evaluate = eval;
4254
4255     /* 0 = dependencies, 1 = preparatory passes, 2 = final pass; callers
4256        pass 3 for preprocess-only, clamped here but kept in __PASS__ */
4257     if (apass > 2)
4258         pass = 2;
4259     else
4260         pass = apass;
4261
4262     dephead = deptail = deplist;
4263     if (deplist != NULL) {
4264         size_t len = strlen(file) + 1;
4265         StrList *dep = nasm_malloc(len + sizeof dep->next);
4266
4267         dep->next = NULL;
4268         memcpy(dep->str, file, len);
4269         *deptail = dep;
4270         deptail = &dep->next;
4271     }
4272
4273     /* __PASS__ varies between passes, so it is defined here */
4274     passtok = nasm_malloc(sizeof(*passtok));
4275     passtok->next = NULL;
4276     make_tok_num(passtok, apass);
4277     passtok->a.mac = NULL;
4278     define_smacro(NULL, "__PASS__", true, 0, passtok);
4279 }
4280
4281 static char *pp_getline(void)
4282 {
4283     char *line;
4284     Token *tline;
4285
4286     while (1) {
4287         /*
4288          * Fetch a tokenized line, either from the macro-expansion
4289          * buffer or from the input file.
4290          */
4291         tline = NULL;
4292         while (istk->expansion && istk->expansion->finishes) {
4293             Line *l = istk->expansion;
4294             if (!l->finishes->name && l->finishes->in_progress > 1) {
4295                 Line *ll;
4296
4297                 /*
4298                  * This is a macro-end marker for a macro with no
4299                  * name, which means it's not really a macro at all
4300                  * but a %rep block, and the `in_progress' field is
4301                  * more than 1, meaning that we still need to
4302                  * repeat. (1 means the natural last repetition; 0
4303                  * means termination by %exitrep.) We have
4304                  * therefore expanded up to the %endrep, and must
4305                  * push the whole block on to the expansion buffer
4306                  * again. We don't bother to remove the macro-end
4307                  * marker: we'd only have to generate another one
4308                  * if we did.
4309                  */
4310                 l->finishes->in_progress--;
4311                 for (l = l->finishes->expansion; l; l = l->next) {
4312                     Token *t, *tt, **tail;
4313
4314                     ll = nasm_malloc(sizeof(Line));
4315                     ll->next = istk->expansion;
4316                     ll->finishes = NULL;
4317                     ll->first = NULL;
4318                     tail = &ll->first;
4319
4320                     for (t = l->first; t; t = t->next) {
4321                         if (t->text || t->type == TOK_WHITESPACE) {
4322                             tt = *tail =
4323                                 new_Token(NULL, t->type, t->text, 0);
4324                             tail = &tt->next;
4325                         }
4326                     }
4327
4328                     istk->expansion = ll;
4329                 }
4330             } else {
4331                 /*
4332                  * Check whether a `%rep' was started and not ended
4333                  * within this macro expansion. This can happen and
4334                  * should be detected. It's a fatal error because
4335                  * I'm too confused to work out how to recover
4336                  * sensibly from it.
4337                  */
4338                 if (defining) {
4339                     if (defining->name)
4340                         error(ERR_PANIC,
4341                               "defining with name in expansion");
4342                     else if (istk->mstk->name)
4343                         error(ERR_FATAL,
4344                               "`%%rep' without `%%endrep' within"
4345                               " expansion of macro `%s'",
4346                               istk->mstk->name);
4347                 }
4348
4349                 /*
4350                  * FIXME:  investigate the relationship at this point between
4351                  * istk->mstk and l->finishes
4352                  */
4353                 {
4354                     MMacro *m = istk->mstk;
4355                     istk->mstk = m->next_active;
4356                     if (m->name) {
4357                         /*
4358                          * This was a real macro call, not a %rep, and
4359                          * therefore the parameter information needs to
4360                          * be freed.
4361                          */
4362                         nasm_free(m->params);
4363                         free_tlist(m->iline);
4364                         nasm_free(m->paramlen);
4365                         l->finishes->in_progress = false;
4366                     } else
4367                         free_mmacro(m);
4368                 }
4369                 istk->expansion = l->next;
4370                 nasm_free(l);
4371                 list->downlevel(LIST_MACRO);
4372             }
4373         }
4374         while (1) {             /* until we get a line we can use */
4375
4376             if (istk->expansion) {      /* from a macro expansion */
4377                 char *p;
4378                 Line *l = istk->expansion;
4379                 if (istk->mstk)
4380                     istk->mstk->lineno++;
4381                 tline = l->first;
4382                 istk->expansion = l->next;
4383                 nasm_free(l);
4384                 p = detoken(tline, false);
4385                 list->line(LIST_MACRO, p);
4386                 nasm_free(p);
4387                 break;
4388             }
4389             line = read_line();
4390             if (line) {         /* from the current input file */
4391                 line = prepreproc(line);
4392                 tline = tokenize(line);
4393                 nasm_free(line);
4394                 break;
4395             }
4396             /*
4397              * The current file has ended; work down the istk
4398              */
4399             {
4400                 Include *i = istk;
4401                 fclose(i->fp);
4402                 if (i->conds)
4403                     error(ERR_FATAL,
4404                           "expected `%%endif' before end of file");
4405                 /* only set line and file name if there's a next node */
4406                 if (i->next) {
4407                     src_set_linnum(i->lineno);
4408                     nasm_free(src_set_fname(i->fname));
4409                 }
4410                 istk = i->next;
4411                 list->downlevel(LIST_INCLUDE);
4412                 nasm_free(i);
4413                 if (!istk)
4414                     return NULL;
4415                 if (istk->expansion && istk->expansion->finishes)
4416                     break;
4417             }
4418         }
4419
4420         /*
4421          * We must expand MMacro parameters and MMacro-local labels
4422          * _before_ we plunge into directive processing, to cope
4423          * with things like `%define something %1' such as STRUC
4424          * uses. Unless we're _defining_ a MMacro, in which case
4425          * those tokens should be left alone to go into the
4426          * definition; and unless we're in a non-emitting
4427          * condition, in which case we don't want to meddle with
4428          * anything.
4429          */
4430         if (!defining && !(istk->conds && !emitting(istk->conds->state))
4431             && !(istk->mstk && !istk->mstk->in_progress))
4432             tline = expand_mmac_params(tline);
4433
4434         /*
4435          * Check the line to see if it's a preprocessor directive.
4436          */
4437         if (do_directive(tline) == DIRECTIVE_FOUND) {
4438             continue;
4439         } else if (defining) {
4440             /*
4441              * We're defining a multi-line macro. We emit nothing
4442              * at all, and just
4443              * shove the tokenized line on to the macro definition.
4444              */
4445             Line *l = nasm_malloc(sizeof(Line));
4446             l->next = defining->expansion;
4447             l->first = tline;
4448             l->finishes = NULL;
4449             defining->expansion = l;
4450             continue;
4451         } else if (istk->conds && !emitting(istk->conds->state)) {
4452             /*
4453              * We're in a non-emitting branch of a condition block.
4454              * Emit nothing at all, not even a blank line: when we
4455              * emerge from the condition we'll give a line-number
4456              * directive so we keep our place correctly.
4457              */
4458             free_tlist(tline);
4459             continue;
4460         } else if (istk->mstk && !istk->mstk->in_progress) {
4461             /*
4462              * We're in a %rep block which has been terminated, so
4463              * we're walking through to the %endrep without
4464              * emitting anything. Emit nothing at all, not even a
4465              * blank line: when we emerge from the %rep block we'll
4466              * give a line-number directive so we keep our place
4467              * correctly.
4468              */
4469             free_tlist(tline);
4470             continue;
4471         } else {
4472             tline = expand_smacro(tline);
4473             if (!expand_mmacro(tline)) {
4474                 /*
4475                  * De-tokenize the line again, and emit it.
4476                  */
4477                 line = detoken(tline, true);
4478                 free_tlist(tline);
4479                 break;
4480             } else {
4481                 continue;       /* expand_mmacro calls free_tlist */
4482             }
4483         }
4484     }
4485
4486     return line;
4487 }
4488
4489 static void pp_cleanup(int pass)
4490 {
4491     if (defining) {
4492         if(defining->name) {
4493             error(ERR_NONFATAL,
4494                   "end of file while still defining macro `%s'",
4495                   defining->name);
4496         } else {
4497             error(ERR_NONFATAL, "end of file while still in %%rep");
4498         }
4499
4500         free_mmacro(defining);
4501     }
4502     while (cstk)
4503         ctx_pop();
4504     free_macros();
4505     while (istk) {
4506         Include *i = istk;
4507         istk = istk->next;
4508         fclose(i->fp);
4509         nasm_free(i->fname);
4510         nasm_free(i);
4511     }
4512     while (cstk)
4513         ctx_pop();
4514     nasm_free(src_set_fname(NULL));
4515     if (pass == 0) {
4516         IncPath *i;
4517         free_llist(predef);
4518         delete_Blocks();
4519         while ((i = ipath)) {
4520             ipath = i->next;
4521             if (i->path)
4522                 nasm_free(i->path);
4523             nasm_free(i);
4524         }
4525     }
4526 }
4527
4528 void pp_include_path(char *path)
4529 {
4530     IncPath *i;
4531
4532     i = nasm_malloc(sizeof(IncPath));
4533     i->path = path ? nasm_strdup(path) : NULL;
4534     i->next = NULL;
4535
4536     if (ipath != NULL) {
4537         IncPath *j = ipath;
4538         while (j->next != NULL)
4539             j = j->next;
4540         j->next = i;
4541     } else {
4542         ipath = i;
4543     }
4544 }
4545
4546 void pp_pre_include(char *fname)
4547 {
4548     Token *inc, *space, *name;
4549     Line *l;
4550
4551     name = new_Token(NULL, TOK_INTERNAL_STRING, fname, 0);
4552     space = new_Token(name, TOK_WHITESPACE, NULL, 0);
4553     inc = new_Token(space, TOK_PREPROC_ID, "%include", 0);
4554
4555     l = nasm_malloc(sizeof(Line));
4556     l->next = predef;
4557     l->first = inc;
4558     l->finishes = NULL;
4559     predef = l;
4560 }
4561
4562 void pp_pre_define(char *definition)
4563 {
4564     Token *def, *space;
4565     Line *l;
4566     char *equals;
4567
4568     equals = strchr(definition, '=');
4569     space = new_Token(NULL, TOK_WHITESPACE, NULL, 0);
4570     def = new_Token(space, TOK_PREPROC_ID, "%define", 0);
4571     if (equals)
4572         *equals = ' ';
4573     space->next = tokenize(definition);
4574     if (equals)
4575         *equals = '=';
4576
4577     l = nasm_malloc(sizeof(Line));
4578     l->next = predef;
4579     l->first = def;
4580     l->finishes = NULL;
4581     predef = l;
4582 }
4583
4584 void pp_pre_undefine(char *definition)
4585 {
4586     Token *def, *space;
4587     Line *l;
4588
4589     space = new_Token(NULL, TOK_WHITESPACE, NULL, 0);
4590     def = new_Token(space, TOK_PREPROC_ID, "%undef", 0);
4591     space->next = tokenize(definition);
4592
4593     l = nasm_malloc(sizeof(Line));
4594     l->next = predef;
4595     l->first = def;
4596     l->finishes = NULL;
4597     predef = l;
4598 }
4599
4600 /*
4601  * Added by Keith Kanios:
4602  *
4603  * This function is used to assist with "runtime" preprocessor
4604  * directives. (e.g. pp_runtime("%define __BITS__ 64");)
4605  *
4606  * ERRORS ARE IGNORED HERE, SO MAKE COMPLETELY SURE THAT YOU
4607  * PASS A VALID STRING TO THIS FUNCTION!!!!!
4608  */
4609
4610 void pp_runtime(char *definition)
4611 {
4612     Token *def;
4613
4614     def = tokenize(definition);
4615     if(do_directive(def) == NO_DIRECTIVE_FOUND)
4616         free_tlist(def);
4617
4618 }
4619
4620 void pp_extra_stdmac(macros_t *macros)
4621 {
4622     extrastdmac = macros;
4623 }
4624
4625 static void make_tok_num(Token * tok, int64_t val)
4626 {
4627     char numbuf[20];
4628     snprintf(numbuf, sizeof(numbuf), "%"PRId64"", val);
4629     tok->text = nasm_strdup(numbuf);
4630     tok->type = TOK_NUMBER;
4631 }
4632
4633 Preproc nasmpp = {
4634     pp_reset,
4635     pp_getline,
4636     pp_cleanup
4637 };