Improve checking and documentation for %ifctx
[nasm.git] / preproc.c
blob39aa2abfacecaa60c9054e7219e72ee2720558bc
1 /* preproc.c macro preprocessor for the Netwide Assembler
3 * The Netwide Assembler is copyright (C) 1996 Simon Tatham and
4 * Julian Hall. All rights reserved. The software is
5 * redistributable under the license given in the file "LICENSE"
6 * distributed in the NASM archive.
8 * initial version 18/iii/97 by Simon Tatham
9 */
11 /* Typical flow of text through preproc
13 * pp_getline gets tokenized lines, either
15 * from a macro expansion
17 * or
18 * {
19 * read_line gets raw text from stdmacpos, or predef, or current input file
20 * tokenize converts to tokens
21 * }
23 * expand_mmac_params is used to expand %1 etc., unless a macro is being
24 * defined or a false conditional is being processed
25 * (%0, %1, %+1, %-1, %%foo)
27 * do_directive checks for directives
29 * expand_smacro is used to expand single line macros
31 * expand_mmacro is used to expand multi-line macros
33 * detoken is used to convert the line back to text
36 #include "compiler.h"
38 #include <stdio.h>
39 #include <stdarg.h>
40 #include <stdlib.h>
41 #include <stddef.h>
42 #include <string.h>
43 #include <ctype.h>
44 #include <limits.h>
45 #include <inttypes.h>
47 #include "nasm.h"
48 #include "nasmlib.h"
49 #include "preproc.h"
50 #include "hashtbl.h"
51 #include "quote.h"
52 #include "stdscan.h"
53 #include "tokens.h"
54 #include "tables.h"
/*
 * Short type names for the structures used throughout this file, so
 * that they can refer to one another before being fully defined.
 */
typedef struct SMacro   SMacro;
typedef struct MMacro   MMacro;
typedef struct Context  Context;
typedef struct Token    Token;
typedef struct Blocks   Blocks;
typedef struct Line     Line;
typedef struct Include  Include;
typedef struct Cond     Cond;
typedef struct IncPath  IncPath;
67 * Note on the storage of both SMacro and MMacros: the hash table
68 * indexes them case-insensitively, and we then have to go through a
69 * linked list of potential case aliases (and, for MMacros, parameter
70 * ranges); this is to preserve the matching semantics of the earlier
71 * code. If the number of case aliases for a specific macro is a
72 * performance issue, you may want to reconsider your coding style.
76 * Store the definition of a single-line macro.
78 struct SMacro {
79 SMacro *next;
80 char *name;
81 bool casesense;
82 bool in_progress;
83 unsigned int nparam;
84 Token *expansion;
88 * Store the definition of a multi-line macro. This is also used to
89 * store the interiors of `%rep...%endrep' blocks, which are
90 * effectively self-re-invoking multi-line macros which simply
91 * don't have a name or bother to appear in the hash tables. %rep
92 * blocks are signified by having a NULL `name' field.
94 * In a MMacro describing a `%rep' block, the `in_progress' field
95 * isn't merely boolean, but gives the number of repeats left to
96 * run.
98 * The `next' field is used for storing MMacros in hash tables; the
99 * `next_active' field is for stacking them on istk entries.
101 * When a MMacro is being expanded, `params', `iline', `nparam',
102 * `paramlen', `rotate' and `unique' are local to the invocation.
104 struct MMacro {
105 MMacro *next;
106 char *name;
107 int nparam_min, nparam_max;
108 bool casesense;
109 bool plus; /* is the last parameter greedy? */
110 bool nolist; /* is this macro listing-inhibited? */
111 int64_t in_progress;
112 Token *dlist; /* All defaults as one list */
113 Token **defaults; /* Parameter default pointers */
114 int ndefs; /* number of default parameters */
115 Line *expansion;
117 MMacro *next_active;
118 MMacro *rep_nest; /* used for nesting %rep */
119 Token **params; /* actual parameters */
120 Token *iline; /* invocation line */
121 unsigned int nparam, rotate;
122 int *paramlen;
123 uint64_t unique;
124 int lineno; /* Current line number on expansion */
128 * The context stack is composed of a linked list of these.
130 struct Context {
131 Context *next;
132 char *name;
133 struct hash_table localmac;
134 uint32_t number;
/*
 * Token types for the internal form into which input lines are
 * broken up. Tokens are typically stored in linked lists.
 *
 * `type' has a double meaning: TOK_SMAC_PARAM is not necessarily used
 * as-is, but denotes the number of the substituted parameter. So in
 * the definition
 *
 *     %define a(x,y) ( (x) & ~(y) )
 *
 * the token for `x' gets type TOK_SMAC_PARAM, and the token for `y'
 * gets TOK_SMAC_PARAM+1.
 *
 * TOK_INTERNAL_STRING is a dirty hack: a single string token that
 * needs no quotes around it. The pre-include mechanism uses it
 * instead of trying to pick a sensible quote for the filename it was
 * handed.
 */
enum pp_token_type {
    TOK_NONE = 0,
    TOK_WHITESPACE,
    TOK_COMMENT,
    TOK_ID,
    TOK_PREPROC_ID,
    TOK_STRING,
    TOK_NUMBER,
    TOK_FLOAT,
    TOK_SMAC_END,
    TOK_OTHER,
    TOK_INTERNAL_STRING,
    TOK_PREPROC_Q,
    TOK_PREPROC_QQ,
    TOK_SMAC_PARAM,             /* MUST BE LAST IN THE LIST!!! */
    TOK_MAX = INT_MAX           /* Keep compiler from reducing the range */
};
166 struct Token {
167 Token *next;
168 char *text;
169 union {
170 SMacro *mac; /* associated macro for TOK_SMAC_END */
171 size_t len; /* scratch length field */
172 } a; /* Auxiliary data */
173 enum pp_token_type type;
177 * Multi-line macro definitions are stored as a linked list of
178 * these, which is essentially a container to allow several linked
179 * lists of Tokens.
181 * Note that in this module, linked lists are treated as stacks
182 * wherever possible. For this reason, Lines are _pushed_ on to the
183 * `expansion' field in MMacro structures, so that the linked list,
184 * if walked, would give the macro lines in reverse order; this
185 * means that we can walk the list when expanding a macro, and thus
186 * push the lines on to the `expansion' field in _istk_ in reverse
187 * order (so that when popped back off they are in the right
188 * order). It may seem cockeyed, and it relies on my design having
189 * an even number of steps in, but it works...
191 * Some of these structures, rather than being actual lines, are
192 * markers delimiting the end of the expansion of a given macro.
193 * This is for use in the cycle-tracking and %rep-handling code.
194 * Such structures have `finishes' non-NULL, and `first' NULL. All
195 * others have `finishes' NULL, but `first' may still be NULL if
196 * the line is blank.
198 struct Line {
199 Line *next;
200 MMacro *finishes;
201 Token *first;
205 * To handle an arbitrary level of file inclusion, we maintain a
206 * stack (ie linked list) of these things.
208 struct Include {
209 Include *next;
210 FILE *fp;
211 Cond *conds;
212 Line *expansion;
213 char *fname;
214 int lineno, lineinc;
215 MMacro *mstk; /* stack of active macros/reps */
219 * Include search path. This is simply a list of strings which get
220 * prepended, in turn, to the name of an include file, in an
221 * attempt to find the file if it's not in the current directory.
223 struct IncPath {
224 IncPath *next;
225 char *path;
229 * Conditional assembly: we maintain a separate stack of these for
230 * each level of file inclusion. (The only reason we keep the
231 * stacks separate is to ensure that a stray `%endif' in a file
232 * included from within the true branch of a `%if' won't terminate
233 * it and cause confusion: instead, rightly, it'll cause an error.)
235 struct Cond {
236 Cond *next;
237 int state;
enum {
    /*
     * States used just after %if or %elif. IF_TRUE: the condition
     * evaluated true and we are emitting. IF_FALSE: we are not
     * emitting, but will start if a %else turns up. Every directive
     * is admissible here: %elif, %else and %endif (and %if).
     */
    COND_IF_TRUE,
    COND_IF_FALSE,
    /*
     * States used after a %else. ELSE_TRUE: emitting. ELSE_FALSE:
     * not emitting. Any %elif or %else in an ELSE_* state is an
     * error.
     */
    COND_ELSE_TRUE,
    COND_ELSE_FALSE,
    /*
     * Not emitting now, and nothing will be emitted before %endif.
     * Used (i) once our moment of emission has passed and %elifs
     * keep coming, and (ii) when the whole construct sits inside a
     * non-emitting branch of an enclosing conditional.
     */
    COND_NEVER
};
/* True when state `x' is one in which output is being emitted. */
#define emitting(x) ( (x) == COND_IF_TRUE || (x) == COND_ELSE_TRUE )
/*
 * Possible return values of do_directive.
 */
#define NO_DIRECTIVE_FOUND  0
#define DIRECTIVE_FOUND     1
/*
 * Condition codes. The prefix is c_ rather than C_ because C_ is
 * used in nasm.h for the "real" condition codes. At _this_ level CXZ
 * and ECXZ are treated as condition codes too, albeit non-invertible
 * ones, hence the separate enum.
 *
 * The three tables below are parallel: conditions[] and inverse_ccs[]
 * are both indexed by enum pp_conds.
 */
static const char * const conditions[] = {
    "a", "ae", "b", "be", "c", "cxz", "e", "ecxz",
    "g", "ge", "l", "le",
    "na", "nae", "nb", "nbe", "nc", "ne", "ng", "nge", "nl", "nle",
    "no", "np", "ns", "nz",
    "o", "p", "pe", "po", "rcxz", "s", "z"
};
enum pp_conds {
    c_A, c_AE, c_B, c_BE, c_C, c_CXZ, c_E, c_ECXZ,
    c_G, c_GE, c_L, c_LE,
    c_NA, c_NAE, c_NB, c_NBE, c_NC, c_NE, c_NG, c_NGE, c_NL, c_NLE,
    c_NO, c_NP, c_NS, c_NZ,
    c_O, c_P, c_PE, c_PO, c_RCXZ, c_S, c_Z,
    c_none = -1
};
/* Inverse of each condition; -1 marks a condition with no inverse. */
static const enum pp_conds inverse_ccs[] = {
    c_NA, c_NAE, c_NB, c_NBE, c_NC, -1, c_NE, -1,
    c_NG, c_NGE, c_NL, c_NLE,
    c_A, c_AE, c_B, c_BE, c_C, c_E, c_G, c_GE, c_L, c_LE,
    c_O, c_P, c_S, c_Z,
    c_NO, c_NP, c_PO, c_PE, -1, c_NS, c_NZ
};
297 * Directive names.
299 /* If this is a an IF, ELIF, ELSE or ENDIF keyword */
300 static int is_condition(enum preproc_token arg)
302 return PP_IS_COND(arg) || (arg == PP_ELSE) || (arg == PP_ENDIF);
/*
 * For TASM compatibility we must recognise TASM's conditional
 * compilation directives. The NASM pre-processor cannot do this on
 * its own, so they are looked up in the list below and the equivalent
 * NASM directive is then jammed into the input stream.
 *
 * The enum and the string table are parallel, and the strings are in
 * ascending order because check_tasm_directive() binary-searches them.
 */
enum {
    TM_ARG,
    TM_ELIF,
    TM_ELSE,
    TM_ENDIF,
    TM_IF,
    TM_IFDEF,
    TM_IFDIFI,
    TM_IFNDEF,
    TM_INCLUDE,
    TM_LOCAL
};

static const char * const tasm_directives[] = {
    "arg",
    "elif",
    "else",
    "endif",
    "if",
    "ifdef",
    "ifdifi",
    "ifndef",
    "include",
    "local"
};
321 static int StackSize = 4;
322 static char *StackPointer = "ebp";
323 static int ArgOffset = 8;
324 static int LocalOffset = 0;
326 static Context *cstk;
327 static Include *istk;
328 static IncPath *ipath = NULL;
330 static efunc _error; /* Pointer to client-provided error reporting function */
331 static evalfunc evaluate;
333 static int pass; /* HACK: pass 0 = generate dependencies only */
334 static StrList **dephead, **deptail; /* Dependency list */
336 static uint64_t unique; /* unique identifier numbers */
338 static Line *predef = NULL;
339 static bool do_predef;
341 static ListGen *list;
344 * The current set of multi-line macros we have defined.
346 static struct hash_table mmacros;
349 * The current set of single-line macros we have defined.
351 static struct hash_table smacros;
354 * The multi-line macro we are currently defining, or the %rep
355 * block we are currently reading, if any.
357 static MMacro *defining;
359 static uint64_t nested_mac_count;
360 static uint64_t nested_rep_count;
363 * The number of macro parameters to allocate space for at a time.
365 #define PARAM_DELTA 16
368 * The standard macro set: defined in macros.c in the array nasm_stdmac.
369 * This gives our position in the macro set, when we're processing it.
371 static macros_t *stdmacpos;
374 * The extra standard macros that come from the object format, if
375 * any.
377 static macros_t *extrastdmac = NULL;
378 static bool any_extrastdmac;
381 * Tokens are allocated in blocks to improve speed
383 #define TOKEN_BLOCKSIZE 4096
384 static Token *freeTokens = NULL;
385 struct Blocks {
386 Blocks *next;
387 void *chunk;
390 static Blocks blocks = { NULL, NULL };
393 * Forward declarations.
395 static Token *expand_mmac_params(Token * tline);
396 static Token *expand_smacro(Token * tline);
397 static Token *expand_id(Token * tline);
398 static Context *get_ctx(const char *name, bool all_contexts);
399 static void make_tok_num(Token * tok, int64_t val);
400 static void error(int severity, const char *fmt, ...);
401 static void *new_Block(size_t size);
402 static void delete_Blocks(void);
403 static Token *new_Token(Token * next, enum pp_token_type type,
404 const char *text, int txtlen);
405 static Token *delete_Token(Token * t);
/*
 * Macros for safe checking of token pointers, avoid *(NULL)
 *
 *  tok_type_(x,t)   true if x is non-NULL and has type t
 *  skip_white_(x)   if x is a whitespace token, advance x to x->next
 *  tok_is_(x,v)     true if x is a TOK_OTHER token whose text equals v
 *  tok_isnt_(x,v)   true if x is non-NULL and is not such a token
 *
 * skip_white_ is a statement, not an expression. It is wrapped in
 * do { } while (0) so that it behaves as exactly one statement: as a
 * bare `if' it would capture an `else' that follows it.
 * Note that skip_white_ evaluates its argument more than once.
 */
#define tok_type_(x,t)  ((x) && (x)->type == (t))
#define skip_white_(x)                              \
    do {                                            \
        if (tok_type_((x), TOK_WHITESPACE))         \
            (x) = (x)->next;                        \
    } while (0)
#define tok_is_(x,v)    (tok_type_((x), TOK_OTHER) && !strcmp((x)->text,(v)))
#define tok_isnt_(x,v)  ((x) && ((x)->type!=TOK_OTHER || strcmp((x)->text,(v))))
415 /* Handle TASM specific directives, which do not contain a % in
416 * front of them. We do it here because I could not find any other
417 * place to do it for the moment, and it is a hack (ideally it would
418 * be nice to be able to use the NASM pre-processor to do it).
420 static char *check_tasm_directive(char *line)
422 int32_t i, j, k, m, len;
423 char *p = line, *oldline, oldchar;
425 /* Skip whitespace */
426 while (nasm_isspace(*p) && *p != 0)
427 p++;
429 /* Binary search for the directive name */
430 i = -1;
431 j = elements(tasm_directives);
432 len = 0;
433 while (!nasm_isspace(p[len]) && p[len] != 0)
434 len++;
435 if (len) {
436 oldchar = p[len];
437 p[len] = 0;
438 while (j - i > 1) {
439 k = (j + i) / 2;
440 m = nasm_stricmp(p, tasm_directives[k]);
441 if (m == 0) {
442 /* We have found a directive, so jam a % in front of it
443 * so that NASM will then recognise it as one if it's own.
445 p[len] = oldchar;
446 len = strlen(p);
447 oldline = line;
448 line = nasm_malloc(len + 2);
449 line[0] = '%';
450 if (k == TM_IFDIFI) {
451 /* NASM does not recognise IFDIFI, so we convert it to
452 * %ifdef BOGUS. This is not used in NASM comaptible
453 * code, but does need to parse for the TASM macro
454 * package.
456 strcpy(line + 1, "ifdef BOGUS");
457 } else {
458 memcpy(line + 1, p, len + 1);
460 nasm_free(oldline);
461 return line;
462 } else if (m < 0) {
463 j = k;
464 } else
465 i = k;
467 p[len] = oldchar;
469 return line;
473 * The pre-preprocessing stage... This function translates line
474 * number indications as they emerge from GNU cpp (`# lineno "file"
475 * flags') into NASM preprocessor line number indications (`%line
476 * lineno file').
478 static char *prepreproc(char *line)
480 int lineno, fnlen;
481 char *fname, *oldline;
483 if (line[0] == '#' && line[1] == ' ') {
484 oldline = line;
485 fname = oldline + 2;
486 lineno = atoi(fname);
487 fname += strspn(fname, "0123456789 ");
488 if (*fname == '"')
489 fname++;
490 fnlen = strcspn(fname, "\"");
491 line = nasm_malloc(20 + fnlen);
492 snprintf(line, 20 + fnlen, "%%line %d %.*s", lineno, fnlen, fname);
493 nasm_free(oldline);
495 if (tasm_compatible_mode)
496 return check_tasm_directive(line);
497 return line;
501 * Free a linked list of tokens.
503 static void free_tlist(Token * list)
505 while (list) {
506 list = delete_Token(list);
511 * Free a linked list of lines.
513 static void free_llist(Line * list)
515 Line *l;
516 while (list) {
517 l = list;
518 list = list->next;
519 free_tlist(l->first);
520 nasm_free(l);
525 * Free an MMacro
527 static void free_mmacro(MMacro * m)
529 nasm_free(m->name);
530 free_tlist(m->dlist);
531 nasm_free(m->defaults);
532 free_llist(m->expansion);
533 nasm_free(m);
537 * Free all currently defined macros, and free the hash tables
539 static void free_smacro_table(struct hash_table *smt)
541 SMacro *s;
542 const char *key;
543 struct hash_tbl_node *it = NULL;
545 while ((s = hash_iterate(smt, &it, &key)) != NULL) {
546 nasm_free((void *)key);
547 while (s) {
548 SMacro *ns = s->next;
549 nasm_free(s->name);
550 free_tlist(s->expansion);
551 nasm_free(s);
552 s = ns;
555 hash_free(smt);
558 static void free_mmacro_table(struct hash_table *mmt)
560 MMacro *m;
561 const char *key;
562 struct hash_tbl_node *it = NULL;
564 it = NULL;
565 while ((m = hash_iterate(mmt, &it, &key)) != NULL) {
566 nasm_free((void *)key);
567 while (m) {
568 MMacro *nm = m->next;
569 free_mmacro(m);
570 m = nm;
573 hash_free(mmt);
576 static void free_macros(void)
578 free_smacro_table(&smacros);
579 free_mmacro_table(&mmacros);
583 * Initialize the hash tables
585 static void init_macros(void)
587 hash_init(&smacros, HASH_LARGE);
588 hash_init(&mmacros, HASH_LARGE);
592 * Pop the context stack.
594 static void ctx_pop(void)
596 Context *c = cstk;
598 cstk = cstk->next;
599 free_smacro_table(&c->localmac);
600 nasm_free(c->name);
601 nasm_free(c);
605 * Search for a key in the hash index; adding it if necessary
606 * (in which case we initialize the data pointer to NULL.)
608 static void **
609 hash_findi_add(struct hash_table *hash, const char *str)
611 struct hash_insert hi;
612 void **r;
613 char *strx;
615 r = hash_findi(hash, str, &hi);
616 if (r)
617 return r;
619 strx = nasm_strdup(str); /* Use a more efficient allocator here? */
620 return hash_add(&hi, strx, NULL);
/*
 * Like hash_findi, but hands back the data element itself instead of
 * a pointer to it, or NULL if the key is absent. It never adds an
 * element, which is why hash_findi's third argument is not needed.
 */
static void *
hash_findix(struct hash_table *hash, const char *str)
{
    void **slot = hash_findi(hash, str, NULL);

    if (slot == NULL)
        return NULL;
    return *slot;
}
/*
 * read_line(): fetch the next raw input line as a newly allocated,
 * NUL-terminated string.
 *
 * While stdmacpos is non-NULL the line comes from the standard macro
 * stream rather than from a file. Otherwise it is read from istk->fp
 * into a buffer that starts at BUF_DELTA bytes and grows by BUF_DELTA
 * as needed. NULL is returned only when nothing at all could be read
 * from the file.
 */
637 #define BUF_DELTA 512
639 * Read a line from the top file in istk, handling multiple CR/LFs
640 * at the end of the line read, and handling spurious ^Zs. Will
641 * return lines from the standard macro set if this has not already
642 * been done.
644 static char *read_line(void)
646 char *buffer, *p, *q;
647 int bufsize, continued_count;
649 if (stdmacpos) {
650 unsigned char c;
/* NOTE: this p and the q below shadow the function-level p and q */
651 const unsigned char *p = stdmacpos;
652 char *ret, *q;
653 size_t len = 0;
/* First pass: measure the decoded line. A byte >= 0x80 stands for
   pp_directives[c-0x80] and is followed by one space. */
654 while ((c = *p++)) {
655 if (c >= 0x80)
656 len += pp_directives_len[c-0x80]+1;
657 else
658 len++;
660 ret = nasm_malloc(len+1);
661 q = ret;
/* Second pass: decode into ret */
662 while ((c = *stdmacpos++)) {
663 if (c >= 0x80) {
664 memcpy(q, pp_directives[c-0x80], pp_directives_len[c-0x80]);
665 q += pp_directives_len[c-0x80];
666 *q++ = ' ';
667 } else {
668 *q++ = c;
/* p was left just past this line's terminating zero byte */
671 stdmacpos = p;
672 *q = '\0';
/* An empty entry ends the current macro set */
674 if (!*stdmacpos) {
675 /* This was the last of the standard macro chain... */
676 stdmacpos = NULL;
/* Continue with the extra macro set once, if one is pending */
677 if (any_extrastdmac) {
678 stdmacpos = extrastdmac;
679 any_extrastdmac = false;
680 } else if (do_predef) {
681 Line *pd, *l;
682 Token *head, **tail, *t;
685 * Nasty hack: here we push the contents of
686 * `predef' on to the top-level expansion stack,
687 * since this is the most convenient way to
688 * implement the pre-include and pre-define
689 * features.
691 for (pd = predef; pd; pd = pd->next) {
692 head = NULL;
693 tail = &head;
/* Copy the token list so that predef itself is left untouched */
694 for (t = pd->first; t; t = t->next) {
695 *tail = new_Token(NULL, t->type, t->text, 0);
696 tail = &(*tail)->next;
698 l = nasm_malloc(sizeof(Line));
699 l->next = istk->expansion;
700 l->first = head;
701 l->finishes = NULL;
702 istk->expansion = l;
704 do_predef = false;
707 return ret;
/* Not reading standard macros: read from the current input file */
710 bufsize = BUF_DELTA;
711 buffer = nasm_malloc(BUF_DELTA);
712 p = buffer;
713 continued_count = 0;
714 while (1) {
/* Append to whatever has been read so far; p is the write position */
715 q = fgets(p, bufsize - (p - buffer), istk->fp);
716 if (!q)
717 break;
718 p += strlen(p);
719 if (p > buffer && p[-1] == '\n') {
720 /* Convert backslash-CRLF line continuation sequences into
721 nothing at all (for DOS and Windows) */
722 if (((p - 2) > buffer) && (p[-3] == '\\') && (p[-2] == '\r')) {
723 p -= 3;
724 *p = 0;
725 continued_count++;
727 /* Also convert backslash-LF line continuation sequences into
728 nothing at all (for Unix) */
729 else if (((p - 1) > buffer) && (p[-2] == '\\')) {
730 p -= 2;
731 *p = 0;
732 continued_count++;
733 } else {
734 break;
/* Grow the buffer when fewer than 10 bytes remain free */
737 if (p - buffer > bufsize - 10) {
738 int32_t offset = p - buffer;
739 bufsize += BUF_DELTA;
740 buffer = nasm_realloc(buffer, bufsize);
741 p = buffer + offset; /* prevent stale-pointer problems */
/* fgets failed and nothing was accumulated: no line to return */
745 if (!q && p == buffer) {
746 nasm_free(buffer);
747 return NULL;
/* Advance the line number by one step, plus one per continuation */
750 src_set_linnum(src_get_linnum() + istk->lineinc +
751 (continued_count * istk->lineinc));
754 * Play safe: remove CRs as well as LFs, if any of either are
755 * present at the end of the line.
/* NOTE(review): for an empty line the loop below decrements p to one
   before buffer before the test fails */
757 while (--p >= buffer && (*p == '\n' || *p == '\r'))
758 *p = '\0';
761 * Handle spurious ^Z, which may be inserted into source files
762 * by some file transfer utilities.
/* The line is cut at the first ^Z (octal 032), if there is one */
764 buffer[strcspn(buffer, "\032")] = '\0';
/* Pass the line as read to the listing generator */
766 list->line(LIST_READ, buffer);
768 return buffer;
/*
 * tokenize(): split `line' into a linked list of Tokens and return
 * the head of the list (NULL for an empty line).
 *
 * Each pass of the main loop scans one token: `line' marks where the
 * token starts and p is advanced to just past its end. The token text
 * is copied by new_Token(). Tokens classified as TOK_COMMENT are not
 * added to the list. The input buffer is modified in place in the
 * %{...} case.
 */
772 * Tokenize a line of text. This is a very simple process since we
773 * don't need to parse the value out of e.g. numeric tokens: we
774 * simply split one string into many.
776 static Token *tokenize(char *line)
778 char *p = line;
779 enum pp_token_type type;
780 Token *list = NULL;
781 Token *t, **tail = &list;
783 while (*line) {
784 p = line;
785 if (*p == '%') {
786 p++;
/* %<digits>, %+<digits>, %-<digits>, or a lone %+ before a space or
   the end of the line */
787 if (nasm_isdigit(*p) ||
788 ((*p == '-' || *p == '+') && nasm_isdigit(p[1])) ||
789 ((*p == '+') && (nasm_isspace(p[1]) || !p[1]))) {
790 do {
791 p++;
793 while (nasm_isdigit(*p));
794 type = TOK_PREPROC_ID;
795 } else if (*p == '{') {
/* %{name}: move the name one place left over the '{' and terminate
   it, so that the token text reads %name */
796 p++;
797 while (*p && *p != '}') {
798 p[-1] = *p;
799 p++;
801 p[-1] = '\0';
802 if (*p)
803 p++;
804 type = TOK_PREPROC_ID;
805 } else if (*p == '?') {
806 type = TOK_PREPROC_Q; /* %? */
807 p++;
808 if (*p == '?') {
809 type = TOK_PREPROC_QQ; /* %?? */
810 p++;
/* %name, or %!name, %%name, %$name */
812 } else if (isidchar(*p) ||
813 ((*p == '!' || *p == '%' || *p == '$') &&
814 isidchar(p[1]))) {
815 do {
816 p++;
818 while (isidchar(*p));
819 type = TOK_PREPROC_ID;
820 } else {
/* A lone % or a %% pair becomes an operator token */
821 type = TOK_OTHER;
822 if (*p == '%')
823 p++;
825 } else if (isidstart(*p) || (*p == '$' && isidstart(p[1]))) {
826 type = TOK_ID;
827 p++;
828 while (*p && isidchar(*p))
829 p++;
830 } else if (*p == '\'' || *p == '"' || *p == '`') {
832 * A string token.
834 type = TOK_STRING;
835 p = nasm_skip_string(p);
/* If p stopped on a character, step past it; if it stopped on the
   terminating NUL, the string was never closed */
837 if (*p) {
838 p++;
839 } else {
840 error(ERR_WARNING, "unterminated string");
841 /* Handling unterminated strings by UNV */
842 /* type = -1; */
844 } else if (isnumstart(*p)) {
845 bool is_hex = false;
846 bool is_float = false;
847 bool has_e = false;
848 char c, *r;
851 * A numeric token.
/* A leading $ marks the number as hexadecimal */
854 if (*p == '$') {
855 p++;
856 is_hex = true;
859 for (;;) {
860 c = *p++;
862 if (!is_hex && (c == 'e' || c == 'E')) {
863 has_e = true;
864 if (*p == '+' || *p == '-') {
865 /* e can only be followed by +/- if it is either a
866 prefixed hex number or a floating-point number */
867 p++;
868 is_float = true;
870 } else if (c == 'H' || c == 'h' || c == 'X' || c == 'x') {
871 is_hex = true;
872 } else if (c == 'P' || c == 'p') {
873 is_float = true;
874 if (*p == '+' || *p == '-')
875 p++;
876 } else if (isnumchar(c) || c == '_')
877 ; /* just advance */
878 else if (c == '.') {
879 /* we need to deal with consequences of the legacy
880 parser, like "1.nolist" being two tokens
881 (TOK_NUMBER, TOK_ID) here; at least give it
882 a shot for now. In the future, we probably need
883 a flex-based scanner with proper pattern matching
884 to do it as well as it can be done. Nothing in
885 the world is going to help the person who wants
886 0x123.p16 interpreted as two tokens, though. */
887 r = p;
888 while (*r == '_')
889 r++;
891 if (nasm_isdigit(*r) || (is_hex && nasm_isxdigit(*r)) ||
892 (!is_hex && (*r == 'e' || *r == 'E')) ||
893 (*r == 'p' || *r == 'P')) {
894 p = r;
895 is_float = true;
896 } else
897 break; /* Terminate the token */
898 } else
899 break;
901 p--; /* Point to first character beyond number */
903 if (has_e && !is_hex) {
904 /* 1e13 is floating-point, but 1e13h is not */
905 is_float = true;
908 type = is_float ? TOK_FLOAT : TOK_NUMBER;
909 } else if (nasm_isspace(*p)) {
910 type = TOK_WHITESPACE;
911 p++;
912 while (*p && nasm_isspace(*p))
913 p++;
915 * Whitespace just before end-of-line is discarded by
916 * pretending it's a comment; whitespace just before a
917 * comment gets lumped into the comment.
919 if (!*p || *p == ';') {
920 type = TOK_COMMENT;
921 while (*p)
922 p++;
924 } else if (*p == ';') {
/* A comment runs to the end of the line */
925 type = TOK_COMMENT;
926 while (*p)
927 p++;
928 } else {
930 * Anything else is an operator of some kind. We check
931 * for all the double-character operators (>>, <<, //,
932 * %%, <=, >=, ==, !=, <>, &&, ||, ^^), but anything
933 * else is a single-character operator.
935 type = TOK_OTHER;
936 if ((p[0] == '>' && p[1] == '>') ||
937 (p[0] == '<' && p[1] == '<') ||
938 (p[0] == '/' && p[1] == '/') ||
939 (p[0] == '<' && p[1] == '=') ||
940 (p[0] == '>' && p[1] == '=') ||
941 (p[0] == '=' && p[1] == '=') ||
942 (p[0] == '!' && p[1] == '=') ||
943 (p[0] == '<' && p[1] == '>') ||
944 (p[0] == '&' && p[1] == '&') ||
945 (p[0] == '|' && p[1] == '|') ||
946 (p[0] == '^' && p[1] == '^')) {
947 p++;
949 p++;
952 /* Handling unterminated string by UNV */
953 /*if (type == -1)
955 *tail = t = new_Token(NULL, TOK_STRING, line, p-line+1);
956 t->text[p-line] = *line;
957 tail = &t->next;
959 else */
/* Comments are dropped; every other token is appended to the list */
960 if (type != TOK_COMMENT) {
961 *tail = t = new_Token(NULL, type, line, p - line);
962 tail = &t->next;
/* The next token starts where this one ended */
964 line = p;
966 return list;
970 * this function allocates a new managed block of memory and
971 * returns a pointer to the block. The managed blocks are
972 * deleted only all at once by the delete_Blocks function.
974 static void *new_Block(size_t size)
976 Blocks *b = &blocks;
978 /* first, get to the end of the linked list */
979 while (b->next)
980 b = b->next;
981 /* now allocate the requested chunk */
982 b->chunk = nasm_malloc(size);
984 /* now allocate a new block for the next request */
985 b->next = nasm_malloc(sizeof(Blocks));
986 /* and initialize the contents of the new block */
987 b->next->next = NULL;
988 b->next->chunk = NULL;
989 return b->chunk;
993 * this function deletes all managed blocks of memory
995 static void delete_Blocks(void)
997 Blocks *a, *b = &blocks;
1000 * keep in mind that the first block, pointed to by blocks
1001 * is a static and not dynamically allocated, so we don't
1002 * free it.
1004 while (b) {
1005 if (b->chunk)
1006 nasm_free(b->chunk);
1007 a = b;
1008 b = b->next;
1009 if (a != &blocks)
1010 nasm_free(a);
1015 * this function creates a new Token and passes a pointer to it
1016 * back to the caller. It sets the type and text elements, and
1017 * also the a.mac and next elements to NULL.
1019 static Token *new_Token(Token * next, enum pp_token_type type,
1020 const char *text, int txtlen)
1022 Token *t;
1023 int i;
1025 if (freeTokens == NULL) {
1026 freeTokens = (Token *) new_Block(TOKEN_BLOCKSIZE * sizeof(Token));
1027 for (i = 0; i < TOKEN_BLOCKSIZE - 1; i++)
1028 freeTokens[i].next = &freeTokens[i + 1];
1029 freeTokens[i].next = NULL;
1031 t = freeTokens;
1032 freeTokens = t->next;
1033 t->next = next;
1034 t->a.mac = NULL;
1035 t->type = type;
1036 if (type == TOK_WHITESPACE || text == NULL) {
1037 t->text = NULL;
1038 } else {
1039 if (txtlen == 0)
1040 txtlen = strlen(text);
1041 t->text = nasm_malloc(txtlen+1);
1042 memcpy(t->text, text, txtlen);
1043 t->text[txtlen] = '\0';
1045 return t;
1048 static Token *delete_Token(Token * t)
1050 Token *next = t->next;
1051 nasm_free(t->text);
1052 t->next = freeTokens;
1053 freeTokens = t;
1054 return next;
1058 * Convert a line of tokens back into text.
1059 * If expand_locals is not zero, identifiers of the form "%$*xxx"
1060 * will be transformed into ..@ctxnum.xxx
1062 static char *detoken(Token * tlist, bool expand_locals)
1064 Token *t;
1065 int len;
1066 char *line, *p;
1067 const char *q;
1069 len = 0;
1070 for (t = tlist; t; t = t->next) {
1071 if (t->type == TOK_PREPROC_ID && t->text[1] == '!') {
1072 char *p = getenv(t->text + 2);
1073 nasm_free(t->text);
1074 if (p)
1075 t->text = nasm_strdup(p);
1076 else
1077 t->text = NULL;
1079 /* Expand local macros here and not during preprocessing */
1080 if (expand_locals &&
1081 t->type == TOK_PREPROC_ID && t->text &&
1082 t->text[0] == '%' && t->text[1] == '$') {
1083 Context *ctx = get_ctx(t->text, false);
1084 if (ctx) {
1085 char buffer[40];
1086 char *p, *q = t->text + 2;
1088 q += strspn(q, "$");
1089 snprintf(buffer, sizeof(buffer), "..@%"PRIu32".", ctx->number);
1090 p = nasm_strcat(buffer, q);
1091 nasm_free(t->text);
1092 t->text = p;
1095 if (t->type == TOK_WHITESPACE) {
1096 len++;
1097 } else if (t->text) {
1098 len += strlen(t->text);
1101 p = line = nasm_malloc(len + 1);
1102 for (t = tlist; t; t = t->next) {
1103 if (t->type == TOK_WHITESPACE) {
1104 *p++ = ' ';
1105 } else if (t->text) {
1106 q = t->text;
1107 while (*q)
1108 *p++ = *q++;
1111 *p = '\0';
1112 return line;
1116 * A scanner, suitable for use by the expression evaluator, which
1117 * operates on a line of Tokens. Expects a pointer to a pointer to
1118 * the first token in the line to be passed in as its private_data
1119 * field.
1121 * FIX: This really needs to be unified with stdscan.
1123 static int ppscan(void *private_data, struct tokenval *tokval)
1125 Token **tlineptr = private_data;
1126 Token *tline;
1127 char ourcopy[MAX_KEYWORD+1], *p, *r, *s;
1129 do {
1130 tline = *tlineptr;
1131 *tlineptr = tline ? tline->next : NULL;
1133 while (tline && (tline->type == TOK_WHITESPACE ||
1134 tline->type == TOK_COMMENT));
1136 if (!tline)
1137 return tokval->t_type = TOKEN_EOS;
1139 tokval->t_charptr = tline->text;
1141 if (tline->text[0] == '$' && !tline->text[1])
1142 return tokval->t_type = TOKEN_HERE;
1143 if (tline->text[0] == '$' && tline->text[1] == '$' && !tline->text[2])
1144 return tokval->t_type = TOKEN_BASE;
1146 if (tline->type == TOK_ID) {
1147 p = tokval->t_charptr = tline->text;
1148 if (p[0] == '$') {
1149 tokval->t_charptr++;
1150 return tokval->t_type = TOKEN_ID;
1153 for (r = p, s = ourcopy; *r; r++) {
1154 if (r >= p+MAX_KEYWORD)
1155 return tokval->t_type = TOKEN_ID; /* Not a keyword */
1156 *s++ = nasm_tolower(*r);
1158 *s = '\0';
1159 /* right, so we have an identifier sitting in temp storage. now,
1160 * is it actually a register or instruction name, or what? */
1161 return nasm_token_hash(ourcopy, tokval);
1164 if (tline->type == TOK_NUMBER) {
1165 bool rn_error;
1166 tokval->t_integer = readnum(tline->text, &rn_error);
1167 tokval->t_charptr = tline->text;
1168 if (rn_error)
1169 return tokval->t_type = TOKEN_ERRNUM;
1170 else
1171 return tokval->t_type = TOKEN_NUM;
1174 if (tline->type == TOK_FLOAT) {
1175 return tokval->t_type = TOKEN_FLOAT;
1178 if (tline->type == TOK_STRING) {
1179 char bq, *ep;
1181 bq = tline->text[0];
1182 tokval->t_charptr = tline->text;
1183 tokval->t_inttwo = nasm_unquote(tline->text, &ep);
1185 if (ep[0] != bq || ep[1] != '\0')
1186 return tokval->t_type = TOKEN_ERRSTR;
1187 else
1188 return tokval->t_type = TOKEN_STR;
1191 if (tline->type == TOK_OTHER) {
1192 if (!strcmp(tline->text, "<<"))
1193 return tokval->t_type = TOKEN_SHL;
1194 if (!strcmp(tline->text, ">>"))
1195 return tokval->t_type = TOKEN_SHR;
1196 if (!strcmp(tline->text, "//"))
1197 return tokval->t_type = TOKEN_SDIV;
1198 if (!strcmp(tline->text, "%%"))
1199 return tokval->t_type = TOKEN_SMOD;
1200 if (!strcmp(tline->text, "=="))
1201 return tokval->t_type = TOKEN_EQ;
1202 if (!strcmp(tline->text, "<>"))
1203 return tokval->t_type = TOKEN_NE;
1204 if (!strcmp(tline->text, "!="))
1205 return tokval->t_type = TOKEN_NE;
1206 if (!strcmp(tline->text, "<="))
1207 return tokval->t_type = TOKEN_LE;
1208 if (!strcmp(tline->text, ">="))
1209 return tokval->t_type = TOKEN_GE;
1210 if (!strcmp(tline->text, "&&"))
1211 return tokval->t_type = TOKEN_DBL_AND;
1212 if (!strcmp(tline->text, "^^"))
1213 return tokval->t_type = TOKEN_DBL_XOR;
1214 if (!strcmp(tline->text, "||"))
1215 return tokval->t_type = TOKEN_DBL_OR;
1219 * We have no other options: just return the first character of
1220 * the token text.
1222 return tokval->t_type = tline->text[0];
/*
 * Compare the string `p' with the macro name `q'.  The comparison
 * is exact (strcmp) when `casesense' is true and case-insensitive
 * (nasm_stricmp) when it is false.  The value of the selected
 * comparison routine is passed straight back; callers treat a zero
 * result as a match.
 */
static int mstrcmp(const char *p, const char *q, bool casesense)
{
    if (casesense)
        return strcmp(p, q);

    return nasm_stricmp(p, q);
}
/*
 * Length-limited comparison of two buffers: the first `l' bytes of
 * `p' and `q' are compared with memcmp when `casesense' is true and
 * with nasm_memicmp when it is false.  The value of the selected
 * comparison routine is returned unchanged.
 */
static int mmemcmp(const char *p, const char *q, size_t l, bool casesense)
{
    if (casesense)
        return memcmp(p, q, l);

    return nasm_memicmp(p, q, l);
}
1246 * Return the Context structure associated with a %$ token. Return
1247 * NULL, having _already_ reported an error condition, if the
1248 * context stack isn't deep enough for the supplied number of $
1249 * signs.
1250 * If all_contexts == true, contexts that enclose current are
1251 * also scanned for such smacro, until it is found; if not -
1252 * only the context that directly results from the number of $'s
1253 * in variable's name.
1255 static Context *get_ctx(const char *name, bool all_contexts)
1257 Context *ctx;
1258 SMacro *m;
1259 int i;
1261 if (!name || name[0] != '%' || name[1] != '$')
1262 return NULL;
1264 if (!cstk) {
1265 error(ERR_NONFATAL, "`%s': context stack is empty", name);
1266 return NULL;
1269 for (i = strspn(name + 2, "$"), ctx = cstk; (i > 0) && ctx; i--) {
1270 ctx = ctx->next;
1271 /* i--; Lino - 02/25/02 */
1273 if (!ctx) {
1274 error(ERR_NONFATAL, "`%s': context stack is only"
1275 " %d level%s deep", name, i - 1, (i == 2 ? "" : "s"));
1276 return NULL;
1278 if (!all_contexts)
1279 return ctx;
1281 do {
1282 /* Search for this smacro in found context */
1283 m = hash_findix(&ctx->localmac, name);
1284 while (m) {
1285 if (!mstrcmp(m->name, name, m->casesense))
1286 return ctx;
1287 m = m->next;
1289 ctx = ctx->next;
1291 while (ctx);
1292 return NULL;
1296 * Check to see if a file is already in a string list
1298 static bool in_list(const StrList *list, const char *str)
1300 while (list) {
1301 if (!strcmp(list->str, str))
1302 return true;
1303 list = list->next;
1305 return false;
1309 * Open an include file. This routine must always return a valid
1310 * file pointer if it returns - it's responsible for throwing an
1311 * ERR_FATAL and bombing out completely if not. It should also try
1312 * the include path one by one until it finds the file or reaches
1313 * the end of the path.
1315 static FILE *inc_fopen(const char *file, StrList **dhead, StrList ***dtail,
1316 bool missing_ok)
1318 FILE *fp;
1319 char *prefix = "";
1320 IncPath *ip = ipath;
1321 int len = strlen(file);
1322 size_t prefix_len = 0;
1323 StrList *sl;
1325 while (1) {
1326 sl = nasm_malloc(prefix_len+len+1+sizeof sl->next);
1327 memcpy(sl->str, prefix, prefix_len);
1328 memcpy(sl->str+prefix_len, file, len+1);
1329 fp = fopen(sl->str, "r");
1330 if (fp && dhead && !in_list(*dhead, sl->str)) {
1331 sl->next = NULL;
1332 **dtail = sl;
1333 *dtail = &sl->next;
1334 } else {
1335 nasm_free(sl);
1337 if (fp)
1338 return fp;
1339 if (!ip) {
1340 if (!missing_ok)
1341 break;
1342 prefix = NULL;
1343 } else {
1344 prefix = ip->path;
1345 ip = ip->next;
1347 if (prefix) {
1348 prefix_len = strlen(prefix);
1349 } else {
1350 /* -MG given and file not found */
1351 if (dhead && !in_list(*dhead, file)) {
1352 sl = nasm_malloc(len+1+sizeof sl->next);
1353 sl->next = NULL;
1354 strcpy(sl->str, file);
1355 **dtail = sl;
1356 *dtail = &sl->next;
1358 return NULL;
1362 error(ERR_FATAL, "unable to open include file `%s'", file);
1363 return NULL; /* never reached - placate compilers */
1367 * Determine if we should warn on defining a single-line macro of
1368 * name `name', with `nparam' parameters. If nparam is 0 or -1, will
1369 * return true if _any_ single-line macro of that name is defined.
1370 * Otherwise, will return true if a single-line macro with either
1371 * `nparam' or no parameters is defined.
1373 * If a macro with precisely the right number of parameters is
1374 * defined, or nparam is -1, the address of the definition structure
1375 * will be returned in `defn'; otherwise NULL will be returned. If `defn'
1376 * is NULL, no action will be taken regarding its contents, and no
1377 * error will occur.
1379 * Note that this is also called with nparam zero to resolve
1380 * `ifdef'.
1382 * If you already know which context macro belongs to, you can pass
1383 * the context pointer as first parameter; if you won't but name begins
1384 * with %$ the context will be automatically computed. If all_contexts
1385 * is true, macro will be searched in outer contexts as well.
1387 static bool
1388 smacro_defined(Context * ctx, const char *name, int nparam, SMacro ** defn,
1389 bool nocase)
1391 struct hash_table *smtbl;
1392 SMacro *m;
1394 if (ctx) {
1395 smtbl = &ctx->localmac;
1396 } else if (name[0] == '%' && name[1] == '$') {
1397 if (cstk)
1398 ctx = get_ctx(name, false);
1399 if (!ctx)
1400 return false; /* got to return _something_ */
1401 smtbl = &ctx->localmac;
1402 } else {
1403 smtbl = &smacros;
1405 m = (SMacro *) hash_findix(smtbl, name);
1407 while (m) {
1408 if (!mstrcmp(m->name, name, m->casesense && nocase) &&
1409 (nparam <= 0 || m->nparam == 0 || nparam == (int) m->nparam)) {
1410 if (defn) {
1411 if (nparam == (int) m->nparam || nparam == -1)
1412 *defn = m;
1413 else
1414 *defn = NULL;
1416 return true;
1418 m = m->next;
1421 return false;
1425 * Count and mark off the parameters in a multi-line macro call.
1426 * This is called both from within the multi-line macro expansion
1427 * code, and also to mark off the default parameters when provided
1428 * in a %macro definition line.
1430 static void count_mmac_params(Token * t, int *nparam, Token *** params)
1432 int paramsize, brace;
1434 *nparam = paramsize = 0;
1435 *params = NULL;
1436 while (t) {
1437 if (*nparam >= paramsize) {
1438 paramsize += PARAM_DELTA;
1439 *params = nasm_realloc(*params, sizeof(**params) * paramsize);
1441 skip_white_(t);
1442 brace = false;
1443 if (tok_is_(t, "{"))
1444 brace = true;
1445 (*params)[(*nparam)++] = t;
1446 while (tok_isnt_(t, brace ? "}" : ","))
1447 t = t->next;
1448 if (t) { /* got a comma/brace */
1449 t = t->next;
1450 if (brace) {
1452 * Now we've found the closing brace, look further
1453 * for the comma.
1455 skip_white_(t);
1456 if (tok_isnt_(t, ",")) {
1457 error(ERR_NONFATAL,
1458 "braces do not enclose all of macro parameter");
1459 while (tok_isnt_(t, ","))
1460 t = t->next;
1462 if (t)
1463 t = t->next; /* eat the comma */
1470 * Determine whether one of the various `if' conditions is true or
1471 * not.
1473 * We must free the tline we get passed.
1475 static bool if_condition(Token * tline, enum preproc_token ct)
1477 enum pp_conditional i = PP_COND(ct);
1478 bool j;
1479 Token *t, *tt, **tptr, *origline;
1480 struct tokenval tokval;
1481 expr *evalresult;
1482 enum pp_token_type needtype;
1484 origline = tline;
1486 switch (i) {
1487 case PPC_IFCTX:
1488 j = false; /* have we matched yet? */
1489 while (true) {
1490 skip_white_(tline);
1491 if (!tline)
1492 break;
1493 if (tline->type != TOK_ID) {
1494 error(ERR_NONFATAL,
1495 "`%s' expects context identifiers", pp_directives[ct]);
1496 free_tlist(origline);
1497 return -1;
1499 if (cstk && cstk->name && !nasm_stricmp(tline->text, cstk->name))
1500 j = true;
1501 tline = tline->next;
1503 break;
1505 case PPC_IFDEF:
1506 j = false; /* have we matched yet? */
1507 while (tline) {
1508 skip_white_(tline);
1509 if (!tline || (tline->type != TOK_ID &&
1510 (tline->type != TOK_PREPROC_ID ||
1511 tline->text[1] != '$'))) {
1512 error(ERR_NONFATAL,
1513 "`%s' expects macro identifiers", pp_directives[ct]);
1514 goto fail;
1516 if (smacro_defined(NULL, tline->text, 0, NULL, true))
1517 j = true;
1518 tline = tline->next;
1520 break;
1522 case PPC_IFIDN:
1523 case PPC_IFIDNI:
1524 tline = expand_smacro(tline);
1525 t = tt = tline;
1526 while (tok_isnt_(tt, ","))
1527 tt = tt->next;
1528 if (!tt) {
1529 error(ERR_NONFATAL,
1530 "`%s' expects two comma-separated arguments",
1531 pp_directives[ct]);
1532 goto fail;
1534 tt = tt->next;
1535 j = true; /* assume equality unless proved not */
1536 while ((t->type != TOK_OTHER || strcmp(t->text, ",")) && tt) {
1537 if (tt->type == TOK_OTHER && !strcmp(tt->text, ",")) {
1538 error(ERR_NONFATAL, "`%s': more than one comma on line",
1539 pp_directives[ct]);
1540 goto fail;
1542 if (t->type == TOK_WHITESPACE) {
1543 t = t->next;
1544 continue;
1546 if (tt->type == TOK_WHITESPACE) {
1547 tt = tt->next;
1548 continue;
1550 if (tt->type != t->type) {
1551 j = false; /* found mismatching tokens */
1552 break;
1554 /* When comparing strings, need to unquote them first */
1555 if (t->type == TOK_STRING) {
1556 size_t l1 = nasm_unquote(t->text, NULL);
1557 size_t l2 = nasm_unquote(tt->text, NULL);
1559 if (l1 != l2) {
1560 j = false;
1561 break;
1563 if (mmemcmp(t->text, tt->text, l1, i == PPC_IFIDN)) {
1564 j = false;
1565 break;
1567 } else if (mstrcmp(tt->text, t->text, i == PPC_IFIDN) != 0) {
1568 j = false; /* found mismatching tokens */
1569 break;
1572 t = t->next;
1573 tt = tt->next;
1575 if ((t->type != TOK_OTHER || strcmp(t->text, ",")) || tt)
1576 j = false; /* trailing gunk on one end or other */
1577 break;
1579 case PPC_IFMACRO:
1581 bool found = false;
1582 MMacro searching, *mmac;
1584 tline = tline->next;
1585 skip_white_(tline);
1586 tline = expand_id(tline);
1587 if (!tok_type_(tline, TOK_ID)) {
1588 error(ERR_NONFATAL,
1589 "`%s' expects a macro name", pp_directives[ct]);
1590 goto fail;
1592 searching.name = nasm_strdup(tline->text);
1593 searching.casesense = true;
1594 searching.plus = false;
1595 searching.nolist = false;
1596 searching.in_progress = 0;
1597 searching.rep_nest = NULL;
1598 searching.nparam_min = 0;
1599 searching.nparam_max = INT_MAX;
1600 tline = expand_smacro(tline->next);
1601 skip_white_(tline);
1602 if (!tline) {
1603 } else if (!tok_type_(tline, TOK_NUMBER)) {
1604 error(ERR_NONFATAL,
1605 "`%s' expects a parameter count or nothing",
1606 pp_directives[ct]);
1607 } else {
1608 searching.nparam_min = searching.nparam_max =
1609 readnum(tline->text, &j);
1610 if (j)
1611 error(ERR_NONFATAL,
1612 "unable to parse parameter count `%s'",
1613 tline->text);
1615 if (tline && tok_is_(tline->next, "-")) {
1616 tline = tline->next->next;
1617 if (tok_is_(tline, "*"))
1618 searching.nparam_max = INT_MAX;
1619 else if (!tok_type_(tline, TOK_NUMBER))
1620 error(ERR_NONFATAL,
1621 "`%s' expects a parameter count after `-'",
1622 pp_directives[ct]);
1623 else {
1624 searching.nparam_max = readnum(tline->text, &j);
1625 if (j)
1626 error(ERR_NONFATAL,
1627 "unable to parse parameter count `%s'",
1628 tline->text);
1629 if (searching.nparam_min > searching.nparam_max)
1630 error(ERR_NONFATAL,
1631 "minimum parameter count exceeds maximum");
1634 if (tline && tok_is_(tline->next, "+")) {
1635 tline = tline->next;
1636 searching.plus = true;
1638 mmac = (MMacro *) hash_findix(&mmacros, searching.name);
1639 while (mmac) {
1640 if (!strcmp(mmac->name, searching.name) &&
1641 (mmac->nparam_min <= searching.nparam_max
1642 || searching.plus)
1643 && (searching.nparam_min <= mmac->nparam_max
1644 || mmac->plus)) {
1645 found = true;
1646 break;
1648 mmac = mmac->next;
1650 nasm_free(searching.name);
1651 j = found;
1652 break;
1655 case PPC_IFID:
1656 needtype = TOK_ID;
1657 goto iftype;
1658 case PPC_IFNUM:
1659 needtype = TOK_NUMBER;
1660 goto iftype;
1661 case PPC_IFSTR:
1662 needtype = TOK_STRING;
1663 goto iftype;
1665 iftype:
1666 t = tline = expand_smacro(tline);
1668 while (tok_type_(t, TOK_WHITESPACE) ||
1669 (needtype == TOK_NUMBER &&
1670 tok_type_(t, TOK_OTHER) &&
1671 (t->text[0] == '-' || t->text[0] == '+') &&
1672 !t->text[1]))
1673 t = t->next;
1675 j = tok_type_(t, needtype);
1676 break;
1678 case PPC_IFTOKEN:
1679 t = tline = expand_smacro(tline);
1680 while (tok_type_(t, TOK_WHITESPACE))
1681 t = t->next;
1683 j = false;
1684 if (t) {
1685 t = t->next; /* Skip the actual token */
1686 while (tok_type_(t, TOK_WHITESPACE))
1687 t = t->next;
1688 j = !t; /* Should be nothing left */
1690 break;
1692 case PPC_IFEMPTY:
1693 t = tline = expand_smacro(tline);
1694 while (tok_type_(t, TOK_WHITESPACE))
1695 t = t->next;
1697 j = !t; /* Should be empty */
1698 break;
1700 case PPC_IF:
1701 t = tline = expand_smacro(tline);
1702 tptr = &t;
1703 tokval.t_type = TOKEN_INVALID;
1704 evalresult = evaluate(ppscan, tptr, &tokval,
1705 NULL, pass | CRITICAL, error, NULL);
1706 if (!evalresult)
1707 return -1;
1708 if (tokval.t_type)
1709 error(ERR_WARNING,
1710 "trailing garbage after expression ignored");
1711 if (!is_simple(evalresult)) {
1712 error(ERR_NONFATAL,
1713 "non-constant value given to `%s'", pp_directives[ct]);
1714 goto fail;
1716 j = reloc_value(evalresult) != 0;
1717 break;
1719 default:
1720 error(ERR_FATAL,
1721 "preprocessor directive `%s' not yet implemented",
1722 pp_directives[ct]);
1723 goto fail;
1726 free_tlist(origline);
1727 return j ^ PP_NEGATIVE(ct);
1729 fail:
1730 free_tlist(origline);
1731 return -1;
1735 * Common code for defining an smacro
1737 static bool define_smacro(Context *ctx, char *mname, bool casesense,
1738 int nparam, Token *expansion)
1740 SMacro *smac, **smhead;
1741 struct hash_table *smtbl;
1743 if (smacro_defined(ctx, mname, nparam, &smac, casesense)) {
1744 if (!smac) {
1745 error(ERR_WARNING,
1746 "single-line macro `%s' defined both with and"
1747 " without parameters", mname);
1749 /* Some instances of the old code considered this a failure,
1750 some others didn't. What is the right thing to do here? */
1751 free_tlist(expansion);
1752 return false; /* Failure */
1753 } else {
1755 * We're redefining, so we have to take over an
1756 * existing SMacro structure. This means freeing
1757 * what was already in it.
1759 nasm_free(smac->name);
1760 free_tlist(smac->expansion);
1762 } else {
1763 smtbl = ctx ? &ctx->localmac : &smacros;
1764 smhead = (SMacro **) hash_findi_add(smtbl, mname);
1765 smac = nasm_malloc(sizeof(SMacro));
1766 smac->next = *smhead;
1767 *smhead = smac;
1769 smac->name = nasm_strdup(mname);
1770 smac->casesense = casesense;
1771 smac->nparam = nparam;
1772 smac->expansion = expansion;
1773 smac->in_progress = false;
1774 return true; /* Success */
1778 * Undefine an smacro
1780 static void undef_smacro(Context *ctx, const char *mname)
1782 SMacro **smhead, *s, **sp;
1783 struct hash_table *smtbl;
1785 smtbl = ctx ? &ctx->localmac : &smacros;
1786 smhead = (SMacro **)hash_findi(smtbl, mname, NULL);
1788 if (smhead) {
1790 * We now have a macro name... go hunt for it.
1792 sp = smhead;
1793 while ((s = *sp) != NULL) {
1794 if (!mstrcmp(s->name, mname, s->casesense)) {
1795 *sp = s->next;
1796 nasm_free(s->name);
1797 free_tlist(s->expansion);
1798 nasm_free(s);
1799 } else {
1800 sp = &s->next;
1807 * Parse a mmacro specification.
1809 static bool parse_mmacro_spec(Token *tline, MMacro *def, const char *directive)
1811 bool err;
1813 tline = tline->next;
1814 skip_white_(tline);
1815 tline = expand_id(tline);
1816 if (!tok_type_(tline, TOK_ID)) {
1817 error(ERR_NONFATAL, "`%s' expects a macro name", directive);
1818 return false;
1820 def->name = nasm_strdup(tline->text);
1821 def->plus = false;
1822 def->nolist = false;
1823 def->in_progress = 0;
1824 def->rep_nest = NULL;
1825 tline = expand_smacro(tline->next);
1826 skip_white_(tline);
1827 if (!tok_type_(tline, TOK_NUMBER)) {
1828 error(ERR_NONFATAL, "`%s' expects a parameter count", directive);
1829 def->nparam_min = def->nparam_max = 0;
1830 } else {
1831 def->nparam_min = def->nparam_max =
1832 readnum(tline->text, &err);
1833 if (err)
1834 error(ERR_NONFATAL,
1835 "unable to parse parameter count `%s'", tline->text);
1837 if (tline && tok_is_(tline->next, "-")) {
1838 tline = tline->next->next;
1839 if (tok_is_(tline, "*")) {
1840 def->nparam_max = INT_MAX;
1841 } else if (!tok_type_(tline, TOK_NUMBER)) {
1842 error(ERR_NONFATAL,
1843 "`%s' expects a parameter count after `-'", directive);
1844 } else {
1845 def->nparam_max = readnum(tline->text, &err);
1846 if (err) {
1847 error(ERR_NONFATAL, "unable to parse parameter count `%s'",
1848 tline->text);
1850 if (def->nparam_min > def->nparam_max) {
1851 error(ERR_NONFATAL, "minimum parameter count exceeds maximum");
1855 if (tline && tok_is_(tline->next, "+")) {
1856 tline = tline->next;
1857 def->plus = true;
1859 if (tline && tok_type_(tline->next, TOK_ID) &&
1860 !nasm_stricmp(tline->next->text, ".nolist")) {
1861 tline = tline->next;
1862 def->nolist = true;
1866 * Handle default parameters.
1868 if (tline && tline->next) {
1869 def->dlist = tline->next;
1870 tline->next = NULL;
1871 count_mmac_params(def->dlist, &def->ndefs, &def->defaults);
1872 } else {
1873 def->dlist = NULL;
1874 def->defaults = NULL;
1876 def->expansion = NULL;
1878 return true;
/*
 * Decode a size directive.
 *
 * `str' is looked up in size_names with bsii(), and the entry of
 * `sizes' one past the returned index is handed back, so sizes[0]
 * (zero) is the result for an index of -1 -- presumably what bsii()
 * yields when the name is not in the table; callers treat 0 as
 * "invalid size".  The name table is kept in sorted order.
 */
static int parse_size(const char *str) {
    static const char *size_names[] = {
        "byte", "dword", "oword", "qword", "tword", "word", "yword"
    };
    /* sizes[k + 1] belongs to size_names[k]; sizes[0] is the fallback */
    static const int sizes[] = {
        0,
        1, 4, 16, 8, 10, 2, 32
    };
    int idx;

    idx = bsii(str, size_names, elements(size_names));
    return sizes[idx + 1];
}
1895 * find and process preprocessor directive in passed line
1896 * Find out if a line contains a preprocessor directive, and deal
1897 * with it if so.
1899 * If a directive _is_ found, it is the responsibility of this routine
1900 * (and not the caller) to free_tlist() the line.
1902 * @param tline a pointer to the current tokenized line linked list
1903 * @return DIRECTIVE_FOUND or NO_DIRECTIVE_FOUND
1906 static int do_directive(Token * tline)
1908 enum preproc_token i;
1909 int j;
1910 bool err;
1911 int nparam;
1912 bool nolist;
1913 bool casesense;
1914 int k, m;
1915 int offset;
1916 char *p, *pp, *mname;
1917 Include *inc;
1918 Context *ctx;
1919 Cond *cond;
1920 MMacro *mmac, **mmhead;
1921 Token *t, *tt, *param_start, *macro_start, *last, **tptr, *origline;
1922 Line *l;
1923 struct tokenval tokval;
1924 expr *evalresult;
1925 MMacro *tmp_defining; /* Used when manipulating rep_nest */
1926 int64_t count;
1927 size_t len;
1929 origline = tline;
1931 skip_white_(tline);
1932 if (!tline || !tok_type_(tline, TOK_PREPROC_ID) ||
1933 (tline->text[1] == '%' || tline->text[1] == '$'
1934 || tline->text[1] == '!'))
1935 return NO_DIRECTIVE_FOUND;
1937 i = pp_token_hash(tline->text);
1940 * If we're in a non-emitting branch of a condition construct,
1941 * or walking to the end of an already terminated %rep block,
1942 * we should ignore all directives except for condition
1943 * directives.
1945 if (((istk->conds && !emitting(istk->conds->state)) ||
1946 (istk->mstk && !istk->mstk->in_progress)) && !is_condition(i)) {
1947 return NO_DIRECTIVE_FOUND;
1951 * If we're defining a macro or reading a %rep block, we should
1952 * ignore all directives except for %macro/%imacro (which nest),
1953 * %endm/%endmacro, and (only if we're in a %rep block) %endrep.
1954 * If we're in a %rep block, another %rep nests, so should be let through.
1956 if (defining && i != PP_MACRO && i != PP_IMACRO &&
1957 i != PP_ENDMACRO && i != PP_ENDM &&
1958 (defining->name || (i != PP_ENDREP && i != PP_REP))) {
1959 return NO_DIRECTIVE_FOUND;
1962 if (defining) {
1963 if (i == PP_MACRO || i == PP_IMACRO) {
1964 nested_mac_count++;
1965 return NO_DIRECTIVE_FOUND;
1966 } else if (nested_mac_count > 0) {
1967 if (i == PP_ENDMACRO) {
1968 nested_mac_count--;
1969 return NO_DIRECTIVE_FOUND;
1972 if (!defining->name) {
1973 if (i == PP_REP) {
1974 nested_rep_count++;
1975 return NO_DIRECTIVE_FOUND;
1976 } else if (nested_rep_count > 0) {
1977 if (i == PP_ENDREP) {
1978 nested_rep_count--;
1979 return NO_DIRECTIVE_FOUND;
1985 switch (i) {
1986 case PP_INVALID:
1987 error(ERR_NONFATAL, "unknown preprocessor directive `%s'",
1988 tline->text);
1989 return NO_DIRECTIVE_FOUND; /* didn't get it */
1991 case PP_STACKSIZE:
1992 /* Directive to tell NASM what the default stack size is. The
1993 * default is for a 16-bit stack, and this can be overriden with
1994 * %stacksize large.
1995 * the following form:
1997 * ARG arg1:WORD, arg2:DWORD, arg4:QWORD
1999 tline = tline->next;
2000 if (tline && tline->type == TOK_WHITESPACE)
2001 tline = tline->next;
2002 if (!tline || tline->type != TOK_ID) {
2003 error(ERR_NONFATAL, "`%%stacksize' missing size parameter");
2004 free_tlist(origline);
2005 return DIRECTIVE_FOUND;
2007 if (nasm_stricmp(tline->text, "flat") == 0) {
2008 /* All subsequent ARG directives are for a 32-bit stack */
2009 StackSize = 4;
2010 StackPointer = "ebp";
2011 ArgOffset = 8;
2012 LocalOffset = 0;
2013 } else if (nasm_stricmp(tline->text, "flat64") == 0) {
2014 /* All subsequent ARG directives are for a 64-bit stack */
2015 StackSize = 8;
2016 StackPointer = "rbp";
2017 ArgOffset = 8;
2018 LocalOffset = 0;
2019 } else if (nasm_stricmp(tline->text, "large") == 0) {
2020 /* All subsequent ARG directives are for a 16-bit stack,
2021 * far function call.
2023 StackSize = 2;
2024 StackPointer = "bp";
2025 ArgOffset = 4;
2026 LocalOffset = 0;
2027 } else if (nasm_stricmp(tline->text, "small") == 0) {
2028 /* All subsequent ARG directives are for a 16-bit stack,
2029 * far function call. We don't support near functions.
2031 StackSize = 2;
2032 StackPointer = "bp";
2033 ArgOffset = 6;
2034 LocalOffset = 0;
2035 } else {
2036 error(ERR_NONFATAL, "`%%stacksize' invalid size type");
2037 free_tlist(origline);
2038 return DIRECTIVE_FOUND;
2040 free_tlist(origline);
2041 return DIRECTIVE_FOUND;
2043 case PP_ARG:
2044 /* TASM like ARG directive to define arguments to functions, in
2045 * the following form:
2047 * ARG arg1:WORD, arg2:DWORD, arg4:QWORD
2049 offset = ArgOffset;
2050 do {
2051 char *arg, directive[256];
2052 int size = StackSize;
2054 /* Find the argument name */
2055 tline = tline->next;
2056 if (tline && tline->type == TOK_WHITESPACE)
2057 tline = tline->next;
2058 if (!tline || tline->type != TOK_ID) {
2059 error(ERR_NONFATAL, "`%%arg' missing argument parameter");
2060 free_tlist(origline);
2061 return DIRECTIVE_FOUND;
2063 arg = tline->text;
2065 /* Find the argument size type */
2066 tline = tline->next;
2067 if (!tline || tline->type != TOK_OTHER
2068 || tline->text[0] != ':') {
2069 error(ERR_NONFATAL,
2070 "Syntax error processing `%%arg' directive");
2071 free_tlist(origline);
2072 return DIRECTIVE_FOUND;
2074 tline = tline->next;
2075 if (!tline || tline->type != TOK_ID) {
2076 error(ERR_NONFATAL, "`%%arg' missing size type parameter");
2077 free_tlist(origline);
2078 return DIRECTIVE_FOUND;
2081 /* Allow macro expansion of type parameter */
2082 tt = tokenize(tline->text);
2083 tt = expand_smacro(tt);
2084 size = parse_size(tt->text);
2085 if (!size) {
2086 error(ERR_NONFATAL,
2087 "Invalid size type for `%%arg' missing directive");
2088 free_tlist(tt);
2089 free_tlist(origline);
2090 return DIRECTIVE_FOUND;
2092 free_tlist(tt);
2094 /* Round up to even stack slots */
2095 size = (size+StackSize-1) & ~(StackSize-1);
2097 /* Now define the macro for the argument */
2098 snprintf(directive, sizeof(directive), "%%define %s (%s+%d)",
2099 arg, StackPointer, offset);
2100 do_directive(tokenize(directive));
2101 offset += size;
2103 /* Move to the next argument in the list */
2104 tline = tline->next;
2105 if (tline && tline->type == TOK_WHITESPACE)
2106 tline = tline->next;
2107 } while (tline && tline->type == TOK_OTHER && tline->text[0] == ',');
2108 ArgOffset = offset;
2109 free_tlist(origline);
2110 return DIRECTIVE_FOUND;
2112 case PP_LOCAL:
2113 /* TASM like LOCAL directive to define local variables for a
2114 * function, in the following form:
2116 * LOCAL local1:WORD, local2:DWORD, local4:QWORD = LocalSize
2118 * The '= LocalSize' at the end is ignored by NASM, but is
2119 * required by TASM to define the local parameter size (and used
2120 * by the TASM macro package).
2122 offset = LocalOffset;
2123 do {
2124 char *local, directive[256];
2125 int size = StackSize;
2127 /* Find the argument name */
2128 tline = tline->next;
2129 if (tline && tline->type == TOK_WHITESPACE)
2130 tline = tline->next;
2131 if (!tline || tline->type != TOK_ID) {
2132 error(ERR_NONFATAL,
2133 "`%%local' missing argument parameter");
2134 free_tlist(origline);
2135 return DIRECTIVE_FOUND;
2137 local = tline->text;
2139 /* Find the argument size type */
2140 tline = tline->next;
2141 if (!tline || tline->type != TOK_OTHER
2142 || tline->text[0] != ':') {
2143 error(ERR_NONFATAL,
2144 "Syntax error processing `%%local' directive");
2145 free_tlist(origline);
2146 return DIRECTIVE_FOUND;
2148 tline = tline->next;
2149 if (!tline || tline->type != TOK_ID) {
2150 error(ERR_NONFATAL,
2151 "`%%local' missing size type parameter");
2152 free_tlist(origline);
2153 return DIRECTIVE_FOUND;
2156 /* Allow macro expansion of type parameter */
2157 tt = tokenize(tline->text);
2158 tt = expand_smacro(tt);
2159 size = parse_size(tt->text);
2160 if (!size) {
2161 error(ERR_NONFATAL,
2162 "Invalid size type for `%%local' missing directive");
2163 free_tlist(tt);
2164 free_tlist(origline);
2165 return DIRECTIVE_FOUND;
2167 free_tlist(tt);
2169 /* Round up to even stack slots */
2170 size = (size+StackSize-1) & ~(StackSize-1);
2172 offset += size; /* Negative offset, increment before */
2174 /* Now define the macro for the argument */
2175 snprintf(directive, sizeof(directive), "%%define %s (%s-%d)",
2176 local, StackPointer, offset);
2177 do_directive(tokenize(directive));
2179 /* Now define the assign to setup the enter_c macro correctly */
2180 snprintf(directive, sizeof(directive),
2181 "%%assign %%$localsize %%$localsize+%d", size);
2182 do_directive(tokenize(directive));
2184 /* Move to the next argument in the list */
2185 tline = tline->next;
2186 if (tline && tline->type == TOK_WHITESPACE)
2187 tline = tline->next;
2188 } while (tline && tline->type == TOK_OTHER && tline->text[0] == ',');
2189 LocalOffset = offset;
2190 free_tlist(origline);
2191 return DIRECTIVE_FOUND;
2193 case PP_CLEAR:
2194 if (tline->next)
2195 error(ERR_WARNING, "trailing garbage after `%%clear' ignored");
2196 free_macros();
2197 init_macros();
2198 free_tlist(origline);
2199 return DIRECTIVE_FOUND;
2201 case PP_DEPEND:
2202 t = tline->next = expand_smacro(tline->next);
2203 skip_white_(t);
2204 if (!t || (t->type != TOK_STRING &&
2205 t->type != TOK_INTERNAL_STRING)) {
2206 error(ERR_NONFATAL, "`%%depend' expects a file name");
2207 free_tlist(origline);
2208 return DIRECTIVE_FOUND; /* but we did _something_ */
2210 if (t->next)
2211 error(ERR_WARNING,
2212 "trailing garbage after `%%depend' ignored");
2213 p = t->text;
2214 if (t->type != TOK_INTERNAL_STRING)
2215 nasm_unquote(p, NULL);
2216 if (dephead && !in_list(*dephead, p)) {
2217 StrList *sl = nasm_malloc(strlen(p)+1+sizeof sl->next);
2218 sl->next = NULL;
2219 strcpy(sl->str, p);
2220 *deptail = sl;
2221 deptail = &sl->next;
2223 free_tlist(origline);
2224 return DIRECTIVE_FOUND;
2226 case PP_INCLUDE:
2227 t = tline->next = expand_smacro(tline->next);
2228 skip_white_(t);
2230 if (!t || (t->type != TOK_STRING &&
2231 t->type != TOK_INTERNAL_STRING)) {
2232 error(ERR_NONFATAL, "`%%include' expects a file name");
2233 free_tlist(origline);
2234 return DIRECTIVE_FOUND; /* but we did _something_ */
2236 if (t->next)
2237 error(ERR_WARNING,
2238 "trailing garbage after `%%include' ignored");
2239 p = t->text;
2240 if (t->type != TOK_INTERNAL_STRING)
2241 nasm_unquote(p, NULL);
2242 inc = nasm_malloc(sizeof(Include));
2243 inc->next = istk;
2244 inc->conds = NULL;
2245 inc->fp = inc_fopen(p, dephead, &deptail, pass == 0);
2246 if (!inc->fp) {
2247 /* -MG given but file not found */
2248 nasm_free(inc);
2249 } else {
2250 inc->fname = src_set_fname(nasm_strdup(p));
2251 inc->lineno = src_set_linnum(0);
2252 inc->lineinc = 1;
2253 inc->expansion = NULL;
2254 inc->mstk = NULL;
2255 istk = inc;
2256 list->uplevel(LIST_INCLUDE);
2258 free_tlist(origline);
2259 return DIRECTIVE_FOUND;
2261 case PP_USE:
2263 static macros_t *use_pkg;
2264 const char *pkg_macro;
2266 t = tline->next = expand_smacro(tline->next);
2267 skip_white_(t);
2269 if (!t || (t->type != TOK_STRING &&
2270 t->type != TOK_INTERNAL_STRING &&
2271 t->type != TOK_ID)) {
2272 error(ERR_NONFATAL, "`%%use' expects a package name");
2273 free_tlist(origline);
2274 return DIRECTIVE_FOUND; /* but we did _something_ */
2276 if (t->next)
2277 error(ERR_WARNING,
2278 "trailing garbage after `%%use' ignored");
2279 if (t->type == TOK_STRING)
2280 nasm_unquote(t->text, NULL);
2281 use_pkg = nasm_stdmac_find_package(t->text);
2282 if (!use_pkg)
2283 error(ERR_NONFATAL, "unknown `%%use' package: %s", t->text);
2284 /* The first string will be <%define>__USE_*__ */
2285 pkg_macro = (char *)use_pkg + 1;
2286 if (!smacro_defined(NULL, pkg_macro, 0, NULL, true)) {
2287 /* Not already included, go ahead and include it */
2288 stdmacpos = use_pkg;
2290 free_tlist(origline);
2291 return DIRECTIVE_FOUND;
2293 case PP_PUSH:
2294 tline = tline->next;
2295 skip_white_(tline);
2296 tline = expand_id(tline);
2297 if (tline) {
2298 if (!tok_type_(tline, TOK_ID)) {
2299 error(ERR_NONFATAL, "`%%push' expects a context identifier");
2300 free_tlist(origline);
2301 return DIRECTIVE_FOUND; /* but we did _something_ */
2303 if (tline->next)
2304 error(ERR_WARNING, "trailing garbage after `%%push' ignored");
2305 p = nasm_strdup(tline->text);
2306 } else {
2307 p = NULL; /* Anonymous context */
2309 ctx = nasm_malloc(sizeof(Context));
2310 ctx->next = cstk;
2311 hash_init(&ctx->localmac, HASH_SMALL);
2312 ctx->name = p;
2313 ctx->number = unique++;
2314 cstk = ctx;
2315 free_tlist(origline);
2316 return DIRECTIVE_FOUND;
2318 case PP_REPL:
2319 tline = tline->next;
2320 skip_white_(tline);
2321 tline = expand_id(tline);
2322 if (tline) {
2323 if (!tok_type_(tline, TOK_ID)) {
2324 error(ERR_NONFATAL, "`%%repl' expects a context identifier");
2325 free_tlist(origline);
2326 return DIRECTIVE_FOUND; /* but we did _something_ */
2328 if (tline->next)
2329 error(ERR_WARNING, "trailing garbage after `%%repl' ignored");
2330 p = nasm_strdup(tline->text);
2331 } else {
2332 p = NULL;
2334 if (!cstk)
2335 error(ERR_NONFATAL, "`%%repl': context stack is empty");
2336 else {
2337 nasm_free(cstk->name);
2338 cstk->name = p;
2340 free_tlist(origline);
2341 return DIRECTIVE_FOUND;
2343 case PP_POP:
2344 if (tline->next)
2345 error(ERR_WARNING, "trailing garbage after `%%pop' ignored");
2346 if (!cstk)
2347 error(ERR_NONFATAL, "`%%pop': context stack is already empty");
2348 else
2349 ctx_pop();
2350 free_tlist(origline);
2351 return DIRECTIVE_FOUND;
2353 case PP_ERROR:
2354 case PP_WARNING:
2356 int severity = (i == PP_ERROR)
2357 ? ERR_NONFATAL|ERR_NO_SEVERITY
2358 : ERR_WARNING|ERR_NO_SEVERITY;
2360 tline->next = expand_smacro(tline->next);
2361 tline = tline->next;
2362 skip_white_(tline);
2363 t = tline ? tline->next : NULL;
2364 skip_white_(t);
2365 if (tok_type_(tline, TOK_STRING) && !t) {
2366 /* The line contains only a quoted string */
2367 p = tline->text;
2368 nasm_unquote(p, NULL);
2369 error(severity, "%s: %s", pp_directives[i], p);
2370 } else {
2371 /* Not a quoted string, or more than a quoted string */
2372 p = detoken(tline, false);
2373 error(severity, "%s: %s", pp_directives[i], p);
2374 nasm_free(p);
2376 free_tlist(origline);
2377 return DIRECTIVE_FOUND;
2380 CASE_PP_IF:
2381 if (istk->conds && !emitting(istk->conds->state))
2382 j = COND_NEVER;
2383 else {
2384 j = if_condition(tline->next, i);
2385 tline->next = NULL; /* it got freed */
2386 j = j < 0 ? COND_NEVER : j ? COND_IF_TRUE : COND_IF_FALSE;
2388 cond = nasm_malloc(sizeof(Cond));
2389 cond->next = istk->conds;
2390 cond->state = j;
2391 istk->conds = cond;
2392 free_tlist(origline);
2393 return DIRECTIVE_FOUND;
2395 CASE_PP_ELIF:
2396 if (!istk->conds)
2397 error(ERR_FATAL, "`%s': no matching `%%if'", pp_directives[i]);
2398 if (emitting(istk->conds->state)
2399 || istk->conds->state == COND_NEVER)
2400 istk->conds->state = COND_NEVER;
2401 else {
2403 * IMPORTANT: In the case of %if, we will already have
2404 * called expand_mmac_params(); however, if we're
2405 * processing an %elif we must have been in a
2406 * non-emitting mode, which would have inhibited
2407 * the normal invocation of expand_mmac_params(). Therefore,
2408 * we have to do it explicitly here.
2410 j = if_condition(expand_mmac_params(tline->next), i);
2411 tline->next = NULL; /* it got freed */
2412 istk->conds->state =
2413 j < 0 ? COND_NEVER : j ? COND_IF_TRUE : COND_IF_FALSE;
2415 free_tlist(origline);
2416 return DIRECTIVE_FOUND;
2418 case PP_ELSE:
2419 if (tline->next)
2420 error(ERR_WARNING, "trailing garbage after `%%else' ignored");
2421 if (!istk->conds)
2422 error(ERR_FATAL, "`%%else': no matching `%%if'");
2423 if (emitting(istk->conds->state)
2424 || istk->conds->state == COND_NEVER)
2425 istk->conds->state = COND_ELSE_FALSE;
2426 else
2427 istk->conds->state = COND_ELSE_TRUE;
2428 free_tlist(origline);
2429 return DIRECTIVE_FOUND;
2431 case PP_ENDIF:
2432 if (tline->next)
2433 error(ERR_WARNING, "trailing garbage after `%%endif' ignored");
2434 if (!istk->conds)
2435 error(ERR_FATAL, "`%%endif': no matching `%%if'");
2436 cond = istk->conds;
2437 istk->conds = cond->next;
2438 nasm_free(cond);
2439 free_tlist(origline);
2440 return DIRECTIVE_FOUND;
2442 case PP_MACRO:
2443 case PP_IMACRO:
2444 if (defining) {
2445 error(ERR_FATAL,
2446 "`%%%smacro': already defining a macro",
2447 (i == PP_IMACRO ? "i" : ""));
2448 return DIRECTIVE_FOUND;
2450 defining = nasm_malloc(sizeof(MMacro));
2451 defining->casesense = (i == PP_MACRO);
2452 if (!parse_mmacro_spec(tline, defining, pp_directives[i])) {
2453 nasm_free(defining);
2454 defining = NULL;
2455 return DIRECTIVE_FOUND;
2458 mmac = (MMacro *) hash_findix(&mmacros, defining->name);
2459 while (mmac) {
2460 if (!strcmp(mmac->name, defining->name) &&
2461 (mmac->nparam_min <= defining->nparam_max
2462 || defining->plus)
2463 && (defining->nparam_min <= mmac->nparam_max
2464 || mmac->plus)) {
2465 error(ERR_WARNING,
2466 "redefining multi-line macro `%s'", defining->name);
2467 return DIRECTIVE_FOUND;
2469 mmac = mmac->next;
2471 free_tlist(origline);
2472 return DIRECTIVE_FOUND;
2474 case PP_ENDM:
2475 case PP_ENDMACRO:
2476 if (! (defining && defining->name)) {
2477 error(ERR_NONFATAL, "`%s': not defining a macro", tline->text);
2478 return DIRECTIVE_FOUND;
2480 mmhead = (MMacro **) hash_findi_add(&mmacros, defining->name);
2481 defining->next = *mmhead;
2482 *mmhead = defining;
2483 defining = NULL;
2484 free_tlist(origline);
2485 return DIRECTIVE_FOUND;
2487 case PP_UNMACRO:
2488 case PP_UNIMACRO:
2490 MMacro **mmac_p;
2491 MMacro spec;
2493 spec.casesense = (i == PP_UNMACRO);
2494 if (!parse_mmacro_spec(tline, &spec, pp_directives[i])) {
2495 return DIRECTIVE_FOUND;
2497 mmac_p = (MMacro **) hash_findi(&mmacros, spec.name, NULL);
2498 while (mmac_p && *mmac_p) {
2499 mmac = *mmac_p;
2500 if (mmac->casesense == spec.casesense &&
2501 !mstrcmp(mmac->name, spec.name, spec.casesense) &&
2502 mmac->nparam_min == spec.nparam_min &&
2503 mmac->nparam_max == spec.nparam_max &&
2504 mmac->plus == spec.plus) {
2505 *mmac_p = mmac->next;
2506 free_mmacro(mmac);
2507 } else {
2508 mmac_p = &mmac->next;
2511 free_tlist(origline);
2512 free_tlist(spec.dlist);
2513 return DIRECTIVE_FOUND;
2516 case PP_ROTATE:
2517 if (tline->next && tline->next->type == TOK_WHITESPACE)
2518 tline = tline->next;
2519 if (tline->next == NULL) {
2520 free_tlist(origline);
2521 error(ERR_NONFATAL, "`%%rotate' missing rotate count");
2522 return DIRECTIVE_FOUND;
2524 t = expand_smacro(tline->next);
2525 tline->next = NULL;
2526 free_tlist(origline);
2527 tline = t;
2528 tptr = &t;
2529 tokval.t_type = TOKEN_INVALID;
2530 evalresult =
2531 evaluate(ppscan, tptr, &tokval, NULL, pass, error, NULL);
2532 free_tlist(tline);
2533 if (!evalresult)
2534 return DIRECTIVE_FOUND;
2535 if (tokval.t_type)
2536 error(ERR_WARNING,
2537 "trailing garbage after expression ignored");
2538 if (!is_simple(evalresult)) {
2539 error(ERR_NONFATAL, "non-constant value given to `%%rotate'");
2540 return DIRECTIVE_FOUND;
2542 mmac = istk->mstk;
2543 while (mmac && !mmac->name) /* avoid mistaking %reps for macros */
2544 mmac = mmac->next_active;
2545 if (!mmac) {
2546 error(ERR_NONFATAL, "`%%rotate' invoked outside a macro call");
2547 } else if (mmac->nparam == 0) {
2548 error(ERR_NONFATAL,
2549 "`%%rotate' invoked within macro without parameters");
2550 } else {
2551 int rotate = mmac->rotate + reloc_value(evalresult);
2553 rotate %= (int)mmac->nparam;
2554 if (rotate < 0)
2555 rotate += mmac->nparam;
2557 mmac->rotate = rotate;
2559 return DIRECTIVE_FOUND;
2561 case PP_REP:
2562 nolist = false;
2563 do {
2564 tline = tline->next;
2565 } while (tok_type_(tline, TOK_WHITESPACE));
2567 if (tok_type_(tline, TOK_ID) &&
2568 nasm_stricmp(tline->text, ".nolist") == 0) {
2569 nolist = true;
2570 do {
2571 tline = tline->next;
2572 } while (tok_type_(tline, TOK_WHITESPACE));
2575 if (tline) {
2576 t = expand_smacro(tline);
2577 tptr = &t;
2578 tokval.t_type = TOKEN_INVALID;
2579 evalresult =
2580 evaluate(ppscan, tptr, &tokval, NULL, pass, error, NULL);
2581 if (!evalresult) {
2582 free_tlist(origline);
2583 return DIRECTIVE_FOUND;
2585 if (tokval.t_type)
2586 error(ERR_WARNING,
2587 "trailing garbage after expression ignored");
2588 if (!is_simple(evalresult)) {
2589 error(ERR_NONFATAL, "non-constant value given to `%%rep'");
2590 return DIRECTIVE_FOUND;
2592 count = reloc_value(evalresult) + 1;
2593 } else {
2594 error(ERR_NONFATAL, "`%%rep' expects a repeat count");
2595 count = 0;
2597 free_tlist(origline);
2599 tmp_defining = defining;
2600 defining = nasm_malloc(sizeof(MMacro));
2601 defining->name = NULL; /* flags this macro as a %rep block */
2602 defining->casesense = false;
2603 defining->plus = false;
2604 defining->nolist = nolist;
2605 defining->in_progress = count;
2606 defining->nparam_min = defining->nparam_max = 0;
2607 defining->defaults = NULL;
2608 defining->dlist = NULL;
2609 defining->expansion = NULL;
2610 defining->next_active = istk->mstk;
2611 defining->rep_nest = tmp_defining;
2612 return DIRECTIVE_FOUND;
2614 case PP_ENDREP:
2615 if (!defining || defining->name) {
2616 error(ERR_NONFATAL, "`%%endrep': no matching `%%rep'");
2617 return DIRECTIVE_FOUND;
2621 * Now we have a "macro" defined - although it has no name
2622 * and we won't be entering it in the hash tables - we must
2623 * push a macro-end marker for it on to istk->expansion.
2624 * After that, it will take care of propagating itself (a
2625 * macro-end marker line for a macro which is really a %rep
2626 * block will cause the macro to be re-expanded, complete
2627 * with another macro-end marker to ensure the process
2628 * continues) until the whole expansion is forcibly removed
2629 * from istk->expansion by a %exitrep.
2631 l = nasm_malloc(sizeof(Line));
2632 l->next = istk->expansion;
2633 l->finishes = defining;
2634 l->first = NULL;
2635 istk->expansion = l;
2637 istk->mstk = defining;
2639 list->uplevel(defining->nolist ? LIST_MACRO_NOLIST : LIST_MACRO);
2640 tmp_defining = defining;
2641 defining = defining->rep_nest;
2642 free_tlist(origline);
2643 return DIRECTIVE_FOUND;
2645 case PP_EXITREP:
2647 * We must search along istk->expansion until we hit a
2648 * macro-end marker for a macro with no name. Then we set
2649 * its `in_progress' flag to 0.
2651 for (l = istk->expansion; l; l = l->next)
2652 if (l->finishes && !l->finishes->name)
2653 return DIRECTIVE_FOUND;
2655 if (l)
2656 l->finishes->in_progress = 1;
2657 else
2658 error(ERR_NONFATAL, "`%%exitrep' not within `%%rep' block");
2659 free_tlist(origline);
2660 return DIRECTIVE_FOUND;
2662 case PP_XDEFINE:
2663 case PP_IXDEFINE:
2664 case PP_DEFINE:
2665 case PP_IDEFINE:
2666 casesense = (i == PP_DEFINE || i == PP_XDEFINE);
2668 tline = tline->next;
2669 skip_white_(tline);
2670 tline = expand_id(tline);
2671 if (!tline || (tline->type != TOK_ID &&
2672 (tline->type != TOK_PREPROC_ID ||
2673 tline->text[1] != '$'))) {
2674 error(ERR_NONFATAL, "`%s' expects a macro identifier",
2675 pp_directives[i]);
2676 free_tlist(origline);
2677 return DIRECTIVE_FOUND;
2680 ctx = get_ctx(tline->text, false);
2682 mname = tline->text;
2683 last = tline;
2684 param_start = tline = tline->next;
2685 nparam = 0;
2687 /* Expand the macro definition now for %xdefine and %ixdefine */
2688 if ((i == PP_XDEFINE) || (i == PP_IXDEFINE))
2689 tline = expand_smacro(tline);
2691 if (tok_is_(tline, "(")) {
2693 * This macro has parameters.
2696 tline = tline->next;
2697 while (1) {
2698 skip_white_(tline);
2699 if (!tline) {
2700 error(ERR_NONFATAL, "parameter identifier expected");
2701 free_tlist(origline);
2702 return DIRECTIVE_FOUND;
2704 if (tline->type != TOK_ID) {
2705 error(ERR_NONFATAL,
2706 "`%s': parameter identifier expected",
2707 tline->text);
2708 free_tlist(origline);
2709 return DIRECTIVE_FOUND;
2711 tline->type = TOK_SMAC_PARAM + nparam++;
2712 tline = tline->next;
2713 skip_white_(tline);
2714 if (tok_is_(tline, ",")) {
2715 tline = tline->next;
2716 continue;
2718 if (!tok_is_(tline, ")")) {
2719 error(ERR_NONFATAL,
2720 "`)' expected to terminate macro template");
2721 free_tlist(origline);
2722 return DIRECTIVE_FOUND;
2724 return DIRECTIVE_FOUND;
2726 last = tline;
2727 tline = tline->next;
2729 if (tok_type_(tline, TOK_WHITESPACE))
2730 last = tline, tline = tline->next;
2731 macro_start = NULL;
2732 last->next = NULL;
2733 t = tline;
2734 while (t) {
2735 if (t->type == TOK_ID) {
2736 for (tt = param_start; tt; tt = tt->next)
2737 if (tt->type >= TOK_SMAC_PARAM &&
2738 !strcmp(tt->text, t->text))
2739 t->type = tt->type;
2741 tt = t->next;
2742 t->next = macro_start;
2743 macro_start = t;
2744 t = tt;
2747 * Good. We now have a macro name, a parameter count, and a
2748 * token list (in reverse order) for an expansion. We ought
2749 * to be OK just to create an SMacro, store it, and let
2750 * free_tlist have the rest of the line (which we have
2751 * carefully re-terminated after chopping off the expansion
2752 * from the end).
2754 define_smacro(ctx, mname, casesense, nparam, macro_start);
2755 free_tlist(origline);
2756 return DIRECTIVE_FOUND;
2758 case PP_UNDEF:
2759 tline = tline->next;
2760 skip_white_(tline);
2761 tline = expand_id(tline);
2762 if (!tline || (tline->type != TOK_ID &&
2763 (tline->type != TOK_PREPROC_ID ||
2764 tline->text[1] != '$'))) {
2765 error(ERR_NONFATAL, "`%%undef' expects a macro identifier");
2766 free_tlist(origline);
2767 return DIRECTIVE_FOUND;
2769 if (tline->next) {
2770 error(ERR_WARNING,
2771 "trailing garbage after macro name ignored");
2774 /* Find the context that symbol belongs to */
2775 ctx = get_ctx(tline->text, false);
2776 undef_smacro(ctx, tline->text);
2777 free_tlist(origline);
2778 return DIRECTIVE_FOUND;
2780 case PP_DEFSTR:
2781 case PP_IDEFSTR:
2782 casesense = (i == PP_DEFSTR);
2784 tline = tline->next;
2785 skip_white_(tline);
2786 tline = expand_id(tline);
2787 if (!tline || (tline->type != TOK_ID &&
2788 (tline->type != TOK_PREPROC_ID ||
2789 tline->text[1] != '$'))) {
2790 error(ERR_NONFATAL, "`%s' expects a macro identifier",
2791 pp_directives[i]);
2792 free_tlist(origline);
2793 return DIRECTIVE_FOUND;
2796 ctx = get_ctx(tline->text, false);
2798 mname = tline->text;
2799 last = tline;
2800 tline = expand_smacro(tline->next);
2801 last->next = NULL;
2803 while (tok_type_(tline, TOK_WHITESPACE))
2804 tline = delete_Token(tline);
2806 p = detoken(tline, false);
2807 macro_start = nasm_malloc(sizeof(*macro_start));
2808 macro_start->next = NULL;
2809 macro_start->text = nasm_quote(p, strlen(p));
2810 macro_start->type = TOK_STRING;
2811 macro_start->a.mac = NULL;
2812 nasm_free(p);
2815 * We now have a macro name, an implicit parameter count of
2816 * zero, and a string token to use as an expansion. Create
2817 * and store an SMacro.
2819 define_smacro(ctx, mname, casesense, 0, macro_start);
2820 free_tlist(origline);
2821 return DIRECTIVE_FOUND;
2823 case PP_PATHSEARCH:
2825 FILE *fp;
2826 StrList *xsl = NULL;
2827 StrList **xst = &xsl;
2829 casesense = true;
2831 tline = tline->next;
2832 skip_white_(tline);
2833 tline = expand_id(tline);
2834 if (!tline || (tline->type != TOK_ID &&
2835 (tline->type != TOK_PREPROC_ID ||
2836 tline->text[1] != '$'))) {
2837 error(ERR_NONFATAL,
2838 "`%%pathsearch' expects a macro identifier as first parameter");
2839 free_tlist(origline);
2840 return DIRECTIVE_FOUND;
2842 ctx = get_ctx(tline->text, false);
2844 mname = tline->text;
2845 last = tline;
2846 tline = expand_smacro(tline->next);
2847 last->next = NULL;
2849 t = tline;
2850 while (tok_type_(t, TOK_WHITESPACE))
2851 t = t->next;
2853 if (!t || (t->type != TOK_STRING &&
2854 t->type != TOK_INTERNAL_STRING)) {
2855 error(ERR_NONFATAL, "`%%pathsearch' expects a file name");
2856 free_tlist(tline);
2857 free_tlist(origline);
2858 return DIRECTIVE_FOUND; /* but we did _something_ */
2860 if (t->next)
2861 error(ERR_WARNING,
2862 "trailing garbage after `%%pathsearch' ignored");
2863 p = t->text;
2864 if (t->type != TOK_INTERNAL_STRING)
2865 nasm_unquote(p, NULL);
2867 fp = inc_fopen(p, &xsl, &xst, true);
2868 if (fp) {
2869 p = xsl->str;
2870 fclose(fp); /* Don't actually care about the file */
2872 macro_start = nasm_malloc(sizeof(*macro_start));
2873 macro_start->next = NULL;
2874 macro_start->text = nasm_quote(p, strlen(p));
2875 macro_start->type = TOK_STRING;
2876 macro_start->a.mac = NULL;
2877 if (xsl)
2878 nasm_free(xsl);
2881 * We now have a macro name, an implicit parameter count of
2882 * zero, and a string token to use as an expansion. Create
2883 * and store an SMacro.
2885 define_smacro(ctx, mname, casesense, 0, macro_start);
2886 free_tlist(tline);
2887 free_tlist(origline);
2888 return DIRECTIVE_FOUND;
2891 case PP_STRLEN:
2892 casesense = true;
2894 tline = tline->next;
2895 skip_white_(tline);
2896 tline = expand_id(tline);
2897 if (!tline || (tline->type != TOK_ID &&
2898 (tline->type != TOK_PREPROC_ID ||
2899 tline->text[1] != '$'))) {
2900 error(ERR_NONFATAL,
2901 "`%%strlen' expects a macro identifier as first parameter");
2902 free_tlist(origline);
2903 return DIRECTIVE_FOUND;
2905 ctx = get_ctx(tline->text, false);
2907 mname = tline->text;
2908 last = tline;
2909 tline = expand_smacro(tline->next);
2910 last->next = NULL;
2912 t = tline;
2913 while (tok_type_(t, TOK_WHITESPACE))
2914 t = t->next;
2915 /* t should now point to the string */
2916 if (t->type != TOK_STRING) {
2917 error(ERR_NONFATAL,
2918 "`%%strlen` requires string as second parameter");
2919 free_tlist(tline);
2920 free_tlist(origline);
2921 return DIRECTIVE_FOUND;
2924 macro_start = nasm_malloc(sizeof(*macro_start));
2925 macro_start->next = NULL;
2926 make_tok_num(macro_start, nasm_unquote(t->text, NULL));
2927 macro_start->a.mac = NULL;
2930 * We now have a macro name, an implicit parameter count of
2931 * zero, and a numeric token to use as an expansion. Create
2932 * and store an SMacro.
2934 define_smacro(ctx, mname, casesense, 0, macro_start);
2935 free_tlist(tline);
2936 free_tlist(origline);
2937 return DIRECTIVE_FOUND;
2939 case PP_STRCAT:
2940 casesense = true;
2942 tline = tline->next;
2943 skip_white_(tline);
2944 tline = expand_id(tline);
2945 if (!tline || (tline->type != TOK_ID &&
2946 (tline->type != TOK_PREPROC_ID ||
2947 tline->text[1] != '$'))) {
2948 error(ERR_NONFATAL,
2949 "`%%strcat' expects a macro identifier as first parameter");
2950 free_tlist(origline);
2951 return DIRECTIVE_FOUND;
2953 ctx = get_ctx(tline->text, false);
2955 mname = tline->text;
2956 last = tline;
2957 tline = expand_smacro(tline->next);
2958 last->next = NULL;
2960 len = 0;
2961 for (t = tline; t; t = t->next) {
2962 switch (t->type) {
2963 case TOK_WHITESPACE:
2964 break;
2965 case TOK_STRING:
2966 len += t->a.len = nasm_unquote(t->text, NULL);
2967 break;
2968 case TOK_OTHER:
2969 if (!strcmp(t->text, ",")) /* permit comma separators */
2970 break;
2971 /* else fall through */
2972 default:
2973 error(ERR_NONFATAL,
2974 "non-string passed to `%%strcat' (%d)", t->type);
2975 free_tlist(tline);
2976 free_tlist(origline);
2977 return DIRECTIVE_FOUND;
2981 p = pp = nasm_malloc(len);
2982 t = tline;
2983 for (t = tline; t; t = t->next) {
2984 if (t->type == TOK_STRING) {
2985 memcpy(p, t->text, t->a.len);
2986 p += t->a.len;
2991 * We now have a macro name, an implicit parameter count of
2992 * zero, and a numeric token to use as an expansion. Create
2993 * and store an SMacro.
2995 macro_start = new_Token(NULL, TOK_STRING, NULL, 0);
2996 macro_start->text = nasm_quote(pp, len);
2997 nasm_free(pp);
2998 define_smacro(ctx, mname, casesense, 0, macro_start);
2999 free_tlist(tline);
3000 free_tlist(origline);
3001 return DIRECTIVE_FOUND;
3003 case PP_SUBSTR:
3005 int64_t a1, a2;
3006 size_t len;
3008 casesense = true;
3010 tline = tline->next;
3011 skip_white_(tline);
3012 tline = expand_id(tline);
3013 if (!tline || (tline->type != TOK_ID &&
3014 (tline->type != TOK_PREPROC_ID ||
3015 tline->text[1] != '$'))) {
3016 error(ERR_NONFATAL,
3017 "`%%substr' expects a macro identifier as first parameter");
3018 free_tlist(origline);
3019 return DIRECTIVE_FOUND;
3021 ctx = get_ctx(tline->text, false);
3023 mname = tline->text;
3024 last = tline;
3025 tline = expand_smacro(tline->next);
3026 last->next = NULL;
3028 t = tline->next;
3029 while (tok_type_(t, TOK_WHITESPACE))
3030 t = t->next;
3032 /* t should now point to the string */
3033 if (t->type != TOK_STRING) {
3034 error(ERR_NONFATAL,
3035 "`%%substr` requires string as second parameter");
3036 free_tlist(tline);
3037 free_tlist(origline);
3038 return DIRECTIVE_FOUND;
3041 tt = t->next;
3042 tptr = &tt;
3043 tokval.t_type = TOKEN_INVALID;
3044 evalresult = evaluate(ppscan, tptr, &tokval, NULL,
3045 pass, error, NULL);
3046 if (!evalresult) {
3047 free_tlist(tline);
3048 free_tlist(origline);
3049 return DIRECTIVE_FOUND;
3050 } else if (!is_simple(evalresult)) {
3051 error(ERR_NONFATAL, "non-constant value given to `%%substr`");
3052 free_tlist(tline);
3053 free_tlist(origline);
3054 return DIRECTIVE_FOUND;
3056 a1 = evalresult->value-1;
3058 while (tok_type_(tt, TOK_WHITESPACE))
3059 tt = tt->next;
3060 if (!tt) {
3061 a2 = 1; /* Backwards compatibility: one character */
3062 } else {
3063 tokval.t_type = TOKEN_INVALID;
3064 evalresult = evaluate(ppscan, tptr, &tokval, NULL,
3065 pass, error, NULL);
3066 if (!evalresult) {
3067 free_tlist(tline);
3068 free_tlist(origline);
3069 return DIRECTIVE_FOUND;
3070 } else if (!is_simple(evalresult)) {
3071 error(ERR_NONFATAL, "non-constant value given to `%%substr`");
3072 free_tlist(tline);
3073 free_tlist(origline);
3074 return DIRECTIVE_FOUND;
3076 a2 = evalresult->value;
3079 len = nasm_unquote(t->text, NULL);
3080 if (a2 < 0)
3081 a2 = a2+1+len-a1;
3082 if (a1+a2 > (int64_t)len)
3083 a2 = len-a1;
3085 macro_start = nasm_malloc(sizeof(*macro_start));
3086 macro_start->next = NULL;
3087 macro_start->text = nasm_quote((a1 < 0) ? "" : t->text+a1, a2);
3088 macro_start->type = TOK_STRING;
3089 macro_start->a.mac = NULL;
3092 * We now have a macro name, an implicit parameter count of
3093 * zero, and a numeric token to use as an expansion. Create
3094 * and store an SMacro.
3096 define_smacro(ctx, mname, casesense, 0, macro_start);
3097 free_tlist(tline);
3098 free_tlist(origline);
3099 return DIRECTIVE_FOUND;
3102 case PP_ASSIGN:
3103 case PP_IASSIGN:
3104 casesense = (i == PP_ASSIGN);
3106 tline = tline->next;
3107 skip_white_(tline);
3108 tline = expand_id(tline);
3109 if (!tline || (tline->type != TOK_ID &&
3110 (tline->type != TOK_PREPROC_ID ||
3111 tline->text[1] != '$'))) {
3112 error(ERR_NONFATAL,
3113 "`%%%sassign' expects a macro identifier",
3114 (i == PP_IASSIGN ? "i" : ""));
3115 free_tlist(origline);
3116 return DIRECTIVE_FOUND;
3118 ctx = get_ctx(tline->text, false);
3120 mname = tline->text;
3121 last = tline;
3122 tline = expand_smacro(tline->next);
3123 last->next = NULL;
3125 t = tline;
3126 tptr = &t;
3127 tokval.t_type = TOKEN_INVALID;
3128 evalresult =
3129 evaluate(ppscan, tptr, &tokval, NULL, pass, error, NULL);
3130 free_tlist(tline);
3131 if (!evalresult) {
3132 free_tlist(origline);
3133 return DIRECTIVE_FOUND;
3136 if (tokval.t_type)
3137 error(ERR_WARNING,
3138 "trailing garbage after expression ignored");
3140 if (!is_simple(evalresult)) {
3141 error(ERR_NONFATAL,
3142 "non-constant value given to `%%%sassign'",
3143 (i == PP_IASSIGN ? "i" : ""));
3144 free_tlist(origline);
3145 return DIRECTIVE_FOUND;
3148 macro_start = nasm_malloc(sizeof(*macro_start));
3149 macro_start->next = NULL;
3150 make_tok_num(macro_start, reloc_value(evalresult));
3151 macro_start->a.mac = NULL;
3154 * We now have a macro name, an implicit parameter count of
3155 * zero, and a numeric token to use as an expansion. Create
3156 * and store an SMacro.
3158 define_smacro(ctx, mname, casesense, 0, macro_start);
3159 free_tlist(origline);
3160 return DIRECTIVE_FOUND;
3162 case PP_LINE:
3164 * Syntax is `%line nnn[+mmm] [filename]'
3166 tline = tline->next;
3167 skip_white_(tline);
3168 if (!tok_type_(tline, TOK_NUMBER)) {
3169 error(ERR_NONFATAL, "`%%line' expects line number");
3170 free_tlist(origline);
3171 return DIRECTIVE_FOUND;
3173 k = readnum(tline->text, &err);
3174 m = 1;
3175 tline = tline->next;
3176 if (tok_is_(tline, "+")) {
3177 tline = tline->next;
3178 if (!tok_type_(tline, TOK_NUMBER)) {
3179 error(ERR_NONFATAL, "`%%line' expects line increment");
3180 free_tlist(origline);
3181 return DIRECTIVE_FOUND;
3183 m = readnum(tline->text, &err);
3184 tline = tline->next;
3186 skip_white_(tline);
3187 src_set_linnum(k);
3188 istk->lineinc = m;
3189 if (tline) {
3190 nasm_free(src_set_fname(detoken(tline, false)));
3192 free_tlist(origline);
3193 return DIRECTIVE_FOUND;
3195 default:
3196 error(ERR_FATAL,
3197 "preprocessor directive `%s' not yet implemented",
3198 pp_directives[i]);
3199 return DIRECTIVE_FOUND;
3204 * Ensure that a macro parameter contains a condition code and
3205 * nothing else. Return the condition code index if so, or -1
3206 * otherwise.
3208 static int find_cc(Token * t)
3210 Token *tt;
3211 int i, j, k, m;
3213 if (!t)
3214 return -1; /* Probably a %+ without a space */
3216 skip_white_(t);
3217 if (t->type != TOK_ID)
3218 return -1;
3219 tt = t->next;
3220 skip_white_(tt);
3221 if (tt && (tt->type != TOK_OTHER || strcmp(tt->text, ",")))
3222 return -1;
3224 i = -1;
3225 j = elements(conditions);
3226 while (j - i > 1) {
3227 k = (j + i) / 2;
3228 m = nasm_stricmp(t->text, conditions[k]);
3229 if (m == 0) {
3230 i = k;
3231 j = -2;
3232 break;
3233 } else if (m < 0) {
3234 j = k;
3235 } else
3236 i = k;
3238 if (j != -2)
3239 return -1;
3240 return i;
3244 * Expand MMacro-local things: parameter references (%0, %n, %+n,
3245 * %-n) and MMacro-local identifiers (%%foo).
3247 static Token *expand_mmac_params(Token * tline)
3249 Token *t, *tt, **tail, *thead;
3251 tail = &thead;
3252 thead = NULL;
3254 while (tline) {
3255 if (tline->type == TOK_PREPROC_ID &&
3256 (((tline->text[1] == '+' || tline->text[1] == '-')
3257 && tline->text[2]) || tline->text[1] == '%'
3258 || (tline->text[1] >= '0' && tline->text[1] <= '9'))) {
3259 char *text = NULL;
3260 int type = 0, cc; /* type = 0 to placate optimisers */
3261 char tmpbuf[30];
3262 unsigned int n;
3263 int i;
3264 MMacro *mac;
3266 t = tline;
3267 tline = tline->next;
3269 mac = istk->mstk;
3270 while (mac && !mac->name) /* avoid mistaking %reps for macros */
3271 mac = mac->next_active;
3272 if (!mac)
3273 error(ERR_NONFATAL, "`%s': not in a macro call", t->text);
3274 else
3275 switch (t->text[1]) {
3277 * We have to make a substitution of one of the
3278 * forms %1, %-1, %+1, %%foo, %0.
3280 case '0':
3281 type = TOK_NUMBER;
3282 snprintf(tmpbuf, sizeof(tmpbuf), "%d", mac->nparam);
3283 text = nasm_strdup(tmpbuf);
3284 break;
3285 case '%':
3286 type = TOK_ID;
3287 snprintf(tmpbuf, sizeof(tmpbuf), "..@%"PRIu64".",
3288 mac->unique);
3289 text = nasm_strcat(tmpbuf, t->text + 2);
3290 break;
3291 case '-':
3292 n = atoi(t->text + 2) - 1;
3293 if (n >= mac->nparam)
3294 tt = NULL;
3295 else {
3296 if (mac->nparam > 1)
3297 n = (n + mac->rotate) % mac->nparam;
3298 tt = mac->params[n];
3300 cc = find_cc(tt);
3301 if (cc == -1) {
3302 error(ERR_NONFATAL,
3303 "macro parameter %d is not a condition code",
3304 n + 1);
3305 text = NULL;
3306 } else {
3307 type = TOK_ID;
3308 if (inverse_ccs[cc] == -1) {
3309 error(ERR_NONFATAL,
3310 "condition code `%s' is not invertible",
3311 conditions[cc]);
3312 text = NULL;
3313 } else
3314 text =
3315 nasm_strdup(conditions[inverse_ccs[cc]]);
3317 break;
3318 case '+':
3319 n = atoi(t->text + 2) - 1;
3320 if (n >= mac->nparam)
3321 tt = NULL;
3322 else {
3323 if (mac->nparam > 1)
3324 n = (n + mac->rotate) % mac->nparam;
3325 tt = mac->params[n];
3327 cc = find_cc(tt);
3328 if (cc == -1) {
3329 error(ERR_NONFATAL,
3330 "macro parameter %d is not a condition code",
3331 n + 1);
3332 text = NULL;
3333 } else {
3334 type = TOK_ID;
3335 text = nasm_strdup(conditions[cc]);
3337 break;
3338 default:
3339 n = atoi(t->text + 1) - 1;
3340 if (n >= mac->nparam)
3341 tt = NULL;
3342 else {
3343 if (mac->nparam > 1)
3344 n = (n + mac->rotate) % mac->nparam;
3345 tt = mac->params[n];
3347 if (tt) {
3348 for (i = 0; i < mac->paramlen[n]; i++) {
3349 *tail = new_Token(NULL, tt->type, tt->text, 0);
3350 tail = &(*tail)->next;
3351 tt = tt->next;
3354 text = NULL; /* we've done it here */
3355 break;
3357 if (!text) {
3358 delete_Token(t);
3359 } else {
3360 *tail = t;
3361 tail = &t->next;
3362 t->type = type;
3363 nasm_free(t->text);
3364 t->text = text;
3365 t->a.mac = NULL;
3367 continue;
3368 } else {
3369 t = *tail = tline;
3370 tline = tline->next;
3371 t->a.mac = NULL;
3372 tail = &t->next;
3375 *tail = NULL;
3376 t = thead;
3377 for (; t && (tt = t->next) != NULL; t = t->next)
3378 switch (t->type) {
3379 case TOK_WHITESPACE:
3380 if (tt->type == TOK_WHITESPACE) {
3381 t->next = delete_Token(tt);
3383 break;
3384 case TOK_ID:
3385 if (tt->type == TOK_ID || tt->type == TOK_NUMBER) {
3386 char *tmp = nasm_strcat(t->text, tt->text);
3387 nasm_free(t->text);
3388 t->text = tmp;
3389 t->next = delete_Token(tt);
3391 break;
3392 case TOK_NUMBER:
3393 if (tt->type == TOK_NUMBER) {
3394 char *tmp = nasm_strcat(t->text, tt->text);
3395 nasm_free(t->text);
3396 t->text = tmp;
3397 t->next = delete_Token(tt);
3399 break;
3400 default:
3401 break;
3404 return thead;
3408 * Expand all single-line macro calls made in the given line.
3409 * Return the expanded version of the line. The original is deemed
3410 * to be destroyed in the process. (In reality we'll just move
3411 * Tokens from input to output a lot of the time, rather than
3412 * actually bothering to destroy and replicate.)
3414 #define DEADMAN_LIMIT (1 << 20)
3416 static Token *expand_smacro(Token * tline)
3418 Token *t, *tt, *mstart, **tail, *thead;
3419 struct hash_table *smtbl;
3420 SMacro *head = NULL, *m;
3421 Token **params;
3422 int *paramsize;
3423 unsigned int nparam, sparam;
3424 int brackets, rescan;
3425 Token *org_tline = tline;
3426 Context *ctx;
3427 char *mname;
3428 int deadman = DEADMAN_LIMIT;
3431 * Trick: we should avoid changing the start token pointer since it can
3432 * be contained in "next" field of other token. Because of this
3433 * we allocate a copy of first token and work with it; at the end of
3434 * routine we copy it back
3436 if (org_tline) {
3437 tline =
3438 new_Token(org_tline->next, org_tline->type, org_tline->text,
3440 tline->a.mac = org_tline->a.mac;
3441 nasm_free(org_tline->text);
3442 org_tline->text = NULL;
3445 again:
3446 tail = &thead;
3447 thead = NULL;
3449 while (tline) { /* main token loop */
3450 if (!--deadman) {
3451 error(ERR_NONFATAL, "interminable macro recursion");
3452 break;
3455 if ((mname = tline->text)) {
3456 /* if this token is a local macro, look in local context */
3457 ctx = NULL;
3458 smtbl = &smacros;
3459 if (tline->type == TOK_ID || tline->type == TOK_PREPROC_ID) {
3460 ctx = get_ctx(mname, true);
3461 if (ctx)
3462 smtbl = &ctx->localmac;
3464 head = (SMacro *) hash_findix(smtbl, mname);
3467 * We've hit an identifier. As in is_mmacro below, we first
3468 * check whether the identifier is a single-line macro at
3469 * all, then think about checking for parameters if
3470 * necessary.
3472 for (m = head; m; m = m->next)
3473 if (!mstrcmp(m->name, mname, m->casesense))
3474 break;
3475 if (m) {
3476 mstart = tline;
3477 params = NULL;
3478 paramsize = NULL;
3479 if (m->nparam == 0) {
3481 * Simple case: the macro is parameterless. Discard the
3482 * one token that the macro call took, and push the
3483 * expansion back on the to-do stack.
3485 if (!m->expansion) {
3486 if (!strcmp("__FILE__", m->name)) {
3487 int32_t num = 0;
3488 char *file;
3489 src_get(&num, &file);
3490 tline->text = nasm_quote(file, strlen(file));
3491 tline->type = TOK_STRING;
3492 nasm_free(file);
3493 continue;
3495 if (!strcmp("__LINE__", m->name)) {
3496 nasm_free(tline->text);
3497 make_tok_num(tline, src_get_linnum());
3498 continue;
3500 if (!strcmp("__BITS__", m->name)) {
3501 nasm_free(tline->text);
3502 make_tok_num(tline, globalbits);
3503 continue;
3505 tline = delete_Token(tline);
3506 continue;
3508 } else {
3510 * Complicated case: at least one macro with this name
3511 * exists and takes parameters. We must find the
3512 * parameters in the call, count them, find the SMacro
3513 * that corresponds to that form of the macro call, and
3514 * substitute for the parameters when we expand. What a
3515 * pain.
3517 /*tline = tline->next;
3518 skip_white_(tline); */
3519 do {
3520 t = tline->next;
3521 while (tok_type_(t, TOK_SMAC_END)) {
3522 t->a.mac->in_progress = false;
3523 t->text = NULL;
3524 t = tline->next = delete_Token(t);
3526 tline = t;
3527 } while (tok_type_(tline, TOK_WHITESPACE));
3528 if (!tok_is_(tline, "(")) {
3530 * This macro wasn't called with parameters: ignore
3531 * the call. (Behaviour borrowed from gnu cpp.)
3533 tline = mstart;
3534 m = NULL;
3535 } else {
3536 int paren = 0;
3537 int white = 0;
3538 brackets = 0;
3539 nparam = 0;
3540 sparam = PARAM_DELTA;
3541 params = nasm_malloc(sparam * sizeof(Token *));
3542 params[0] = tline->next;
3543 paramsize = nasm_malloc(sparam * sizeof(int));
3544 paramsize[0] = 0;
3545 while (true) { /* parameter loop */
3547 * For some unusual expansions
3548 * which concatenates function call
3550 t = tline->next;
3551 while (tok_type_(t, TOK_SMAC_END)) {
3552 t->a.mac->in_progress = false;
3553 t->text = NULL;
3554 t = tline->next = delete_Token(t);
3556 tline = t;
3558 if (!tline) {
3559 error(ERR_NONFATAL,
3560 "macro call expects terminating `)'");
3561 break;
3563 if (tline->type == TOK_WHITESPACE
3564 && brackets <= 0) {
3565 if (paramsize[nparam])
3566 white++;
3567 else
3568 params[nparam] = tline->next;
3569 continue; /* parameter loop */
3571 if (tline->type == TOK_OTHER
3572 && tline->text[1] == 0) {
3573 char ch = tline->text[0];
3574 if (ch == ',' && !paren && brackets <= 0) {
3575 if (++nparam >= sparam) {
3576 sparam += PARAM_DELTA;
3577 params = nasm_realloc(params,
3578 sparam *
3579 sizeof(Token
3580 *));
3581 paramsize =
3582 nasm_realloc(paramsize,
3583 sparam *
3584 sizeof(int));
3586 params[nparam] = tline->next;
3587 paramsize[nparam] = 0;
3588 white = 0;
3589 continue; /* parameter loop */
3591 if (ch == '{' &&
3592 (brackets > 0 || (brackets == 0 &&
3593 !paramsize[nparam])))
3595 if (!(brackets++)) {
3596 params[nparam] = tline->next;
3597 continue; /* parameter loop */
3600 if (ch == '}' && brackets > 0)
3601 if (--brackets == 0) {
3602 brackets = -1;
3603 continue; /* parameter loop */
3605 if (ch == '(' && !brackets)
3606 paren++;
3607 if (ch == ')' && brackets <= 0)
3608 if (--paren < 0)
3609 break;
3611 if (brackets < 0) {
3612 brackets = 0;
3613 error(ERR_NONFATAL, "braces do not "
3614 "enclose all of macro parameter");
3616 paramsize[nparam] += white + 1;
3617 white = 0;
3618 } /* parameter loop */
3619 nparam++;
3620 while (m && (m->nparam != nparam ||
3621 mstrcmp(m->name, mname,
3622 m->casesense)))
3623 m = m->next;
3624 if (!m)
3625 error(ERR_WARNING | ERR_WARN_MNP,
3626 "macro `%s' exists, "
3627 "but not taking %d parameters",
3628 mstart->text, nparam);
3631 if (m && m->in_progress)
3632 m = NULL;
3633 if (!m) { /* in progess or didn't find '(' or wrong nparam */
3635 * Design question: should we handle !tline, which
3636 * indicates missing ')' here, or expand those
3637 * macros anyway, which requires the (t) test a few
3638 * lines down?
3640 nasm_free(params);
3641 nasm_free(paramsize);
3642 tline = mstart;
3643 } else {
3645 * Expand the macro: we are placed on the last token of the
3646 * call, so that we can easily split the call from the
3647 * following tokens. We also start by pushing an SMAC_END
3648 * token for the cycle removal.
3650 t = tline;
3651 if (t) {
3652 tline = t->next;
3653 t->next = NULL;
3655 tt = new_Token(tline, TOK_SMAC_END, NULL, 0);
3656 tt->a.mac = m;
3657 m->in_progress = true;
3658 tline = tt;
3659 for (t = m->expansion; t; t = t->next) {
3660 if (t->type >= TOK_SMAC_PARAM) {
3661 Token *pcopy = tline, **ptail = &pcopy;
3662 Token *ttt, *pt;
3663 int i;
3665 ttt = params[t->type - TOK_SMAC_PARAM];
3666 for (i = paramsize[t->type - TOK_SMAC_PARAM];
3667 --i >= 0;) {
3668 pt = *ptail =
3669 new_Token(tline, ttt->type, ttt->text,
3671 ptail = &pt->next;
3672 ttt = ttt->next;
3674 tline = pcopy;
3675 } else if (t->type == TOK_PREPROC_Q) {
3676 tt = new_Token(tline, TOK_ID, mname, 0);
3677 tline = tt;
3678 } else if (t->type == TOK_PREPROC_QQ) {
3679 tt = new_Token(tline, TOK_ID, m->name, 0);
3680 tline = tt;
3681 } else {
3682 tt = new_Token(tline, t->type, t->text, 0);
3683 tline = tt;
3688 * Having done that, get rid of the macro call, and clean
3689 * up the parameters.
3691 nasm_free(params);
3692 nasm_free(paramsize);
3693 free_tlist(mstart);
3694 continue; /* main token loop */
3699 if (tline->type == TOK_SMAC_END) {
3700 tline->a.mac->in_progress = false;
3701 tline = delete_Token(tline);
3702 } else {
3703 t = *tail = tline;
3704 tline = tline->next;
3705 t->a.mac = NULL;
3706 t->next = NULL;
3707 tail = &t->next;
3712 * Now scan the entire line and look for successive TOK_IDs that resulted
3713 * after expansion (they can't be produced by tokenize()). The successive
3714 * TOK_IDs should be concatenated.
3715 * Also we look for %+ tokens and concatenate the tokens before and after
3716 * them (without white spaces in between).
3718 t = thead;
3719 rescan = 0;
3720 while (t) {
3721 while (t && t->type != TOK_ID && t->type != TOK_PREPROC_ID)
3722 t = t->next;
3723 if (!t || !t->next)
3724 break;
3725 if (t->next->type == TOK_ID ||
3726 t->next->type == TOK_PREPROC_ID ||
3727 t->next->type == TOK_NUMBER) {
3728 char *p = nasm_strcat(t->text, t->next->text);
3729 nasm_free(t->text);
3730 t->next = delete_Token(t->next);
3731 t->text = p;
3732 rescan = 1;
3733 } else if (t->next->type == TOK_WHITESPACE && t->next->next &&
3734 t->next->next->type == TOK_PREPROC_ID &&
3735 strcmp(t->next->next->text, "%+") == 0) {
3736 /* free the next whitespace, the %+ token and next whitespace */
3737 int i;
3738 for (i = 1; i <= 3; i++) {
3739 if (!t->next
3740 || (i != 2 && t->next->type != TOK_WHITESPACE))
3741 break;
3742 t->next = delete_Token(t->next);
3743 } /* endfor */
3744 } else
3745 t = t->next;
3747 /* If we concatenated something, re-scan the line for macros */
3748 if (rescan) {
3749 tline = thead;
3750 goto again;
3753 if (org_tline) {
3754 if (thead) {
3755 *org_tline = *thead;
3756 /* since we just gave text to org_line, don't free it */
3757 thead->text = NULL;
3758 delete_Token(thead);
3759 } else {
3760 /* the expression expanded to empty line;
3761 we can't return NULL for some reasons
3762 we just set the line to a single WHITESPACE token. */
3763 memset(org_tline, 0, sizeof(*org_tline));
3764 org_tline->text = NULL;
3765 org_tline->type = TOK_WHITESPACE;
3767 thead = org_tline;
3770 return thead;
3774 * Similar to expand_smacro but used exclusively with macro identifiers
3775 * right before they are fetched in. The reason is that there can be
3776 * identifiers consisting of several subparts. We consider that if there
3777 * are more than one element forming the name, user wants a expansion,
3778 * otherwise it will be left as-is. Example:
3780 * %define %$abc cde
3782 * the identifier %$abc will be left as-is so that the handler for %define
3783 * will suck it and define the corresponding value. Other case:
3785 * %define _%$abc cde
3787 * In this case user wants name to be expanded *before* %define starts
3788 * working, so we'll expand %$abc into something (if it has a value;
3789 * otherwise it will be left as-is) then concatenate all successive
3790 * PP_IDs into one.
3792 static Token *expand_id(Token * tline)
3794 Token *cur, *oldnext = NULL;
3796 if (!tline || !tline->next)
3797 return tline;
3799 cur = tline;
3800 while (cur->next &&
3801 (cur->next->type == TOK_ID ||
3802 cur->next->type == TOK_PREPROC_ID
3803 || cur->next->type == TOK_NUMBER))
3804 cur = cur->next;
3806 /* If identifier consists of just one token, don't expand */
3807 if (cur == tline)
3808 return tline;
3810 if (cur) {
3811 oldnext = cur->next; /* Detach the tail past identifier */
3812 cur->next = NULL; /* so that expand_smacro stops here */
3815 tline = expand_smacro(tline);
3817 if (cur) {
3818 /* expand_smacro possibly changhed tline; re-scan for EOL */
3819 cur = tline;
3820 while (cur && cur->next)
3821 cur = cur->next;
3822 if (cur)
3823 cur->next = oldnext;
3826 return tline;
3830 * Determine whether the given line constitutes a multi-line macro
3831 * call, and return the MMacro structure called if so. Doesn't have
3832 * to check for an initial label - that's taken care of in
3833 * expand_mmacro - but must check numbers of parameters. Guaranteed
3834 * to be called with tline->type == TOK_ID, so the putative macro
3835 * name is easy to find.
3837 static MMacro *is_mmacro(Token * tline, Token *** params_array)
3839 MMacro *head, *m;
3840 Token **params;
3841 int nparam;
3843 head = (MMacro *) hash_findix(&mmacros, tline->text);
3846 * Efficiency: first we see if any macro exists with the given
3847 * name. If not, we can return NULL immediately. _Then_ we
3848 * count the parameters, and then we look further along the
3849 * list if necessary to find the proper MMacro.
3851 for (m = head; m; m = m->next)
3852 if (!mstrcmp(m->name, tline->text, m->casesense))
3853 break;
3854 if (!m)
3855 return NULL;
3858 * OK, we have a potential macro. Count and demarcate the
3859 * parameters.
3861 count_mmac_params(tline->next, &nparam, &params);
3864 * So we know how many parameters we've got. Find the MMacro
3865 * structure that handles this number.
3867 while (m) {
3868 if (m->nparam_min <= nparam
3869 && (m->plus || nparam <= m->nparam_max)) {
3871 * This one is right. Just check if cycle removal
3872 * prohibits us using it before we actually celebrate...
3874 if (m->in_progress) {
3875 #if 0
3876 error(ERR_NONFATAL,
3877 "self-reference in multi-line macro `%s'", m->name);
3878 #endif
3879 nasm_free(params);
3880 return NULL;
3883 * It's right, and we can use it. Add its default
3884 * parameters to the end of our list if necessary.
3886 if (m->defaults && nparam < m->nparam_min + m->ndefs) {
3887 params =
3888 nasm_realloc(params,
3889 ((m->nparam_min + m->ndefs +
3890 1) * sizeof(*params)));
3891 while (nparam < m->nparam_min + m->ndefs) {
3892 params[nparam] = m->defaults[nparam - m->nparam_min];
3893 nparam++;
3897 * If we've gone over the maximum parameter count (and
3898 * we're in Plus mode), ignore parameters beyond
3899 * nparam_max.
3901 if (m->plus && nparam > m->nparam_max)
3902 nparam = m->nparam_max;
3904 * Then terminate the parameter list, and leave.
3906 if (!params) { /* need this special case */
3907 params = nasm_malloc(sizeof(*params));
3908 nparam = 0;
3910 params[nparam] = NULL;
3911 *params_array = params;
3912 return m;
3915 * This one wasn't right: look for the next one with the
3916 * same name.
3918 for (m = m->next; m; m = m->next)
3919 if (!mstrcmp(m->name, tline->text, m->casesense))
3920 break;
3924 * After all that, we didn't find one with the right number of
3925 * parameters. Issue a warning, and fail to expand the macro.
3927 error(ERR_WARNING | ERR_WARN_MNP,
3928 "macro `%s' exists, but not taking %d parameters",
3929 tline->text, nparam);
3930 nasm_free(params);
3931 return NULL;
3935 * Expand the multi-line macro call made by the given line, if
3936 * there is one to be expanded. If there is, push the expansion on
3937 * istk->expansion and return 1. Otherwise return 0.
3939 static int expand_mmacro(Token * tline)
3941 Token *startline = tline;
3942 Token *label = NULL;
3943 int dont_prepend = 0;
3944 Token **params, *t, *mtok, *tt;
3945 MMacro *m;
3946 Line *l, *ll;
3947 int i, nparam, *paramlen;
3948 const char *mname;
3950 t = tline;
3951 skip_white_(t);
3952 /* if (!tok_type_(t, TOK_ID)) Lino 02/25/02 */
3953 if (!tok_type_(t, TOK_ID) && !tok_type_(t, TOK_PREPROC_ID))
3954 return 0;
3955 mtok = t;
3956 m = is_mmacro(t, &params);
3957 if (m) {
3958 mname = t->text;
3959 } else {
3960 Token *last;
3962 * We have an id which isn't a macro call. We'll assume
3963 * it might be a label; we'll also check to see if a
3964 * colon follows it. Then, if there's another id after
3965 * that lot, we'll check it again for macro-hood.
3967 label = last = t;
3968 t = t->next;
3969 if (tok_type_(t, TOK_WHITESPACE))
3970 last = t, t = t->next;
3971 if (tok_is_(t, ":")) {
3972 dont_prepend = 1;
3973 last = t, t = t->next;
3974 if (tok_type_(t, TOK_WHITESPACE))
3975 last = t, t = t->next;
3977 if (!tok_type_(t, TOK_ID) || (m = is_mmacro(t, &params)) == NULL)
3978 return 0;
3979 last->next = NULL;
3980 mname = t->text;
3981 tline = t;
3985 * Fix up the parameters: this involves stripping leading and
3986 * trailing whitespace, then stripping braces if they are
3987 * present.
3989 for (nparam = 0; params[nparam]; nparam++) ;
3990 paramlen = nparam ? nasm_malloc(nparam * sizeof(*paramlen)) : NULL;
3992 for (i = 0; params[i]; i++) {
3993 int brace = false;
3994 int comma = (!m->plus || i < nparam - 1);
3996 t = params[i];
3997 skip_white_(t);
3998 if (tok_is_(t, "{"))
3999 t = t->next, brace = true, comma = false;
4000 params[i] = t;
4001 paramlen[i] = 0;
4002 while (t) {
4003 if (comma && t->type == TOK_OTHER && !strcmp(t->text, ","))
4004 break; /* ... because we have hit a comma */
4005 if (comma && t->type == TOK_WHITESPACE
4006 && tok_is_(t->next, ","))
4007 break; /* ... or a space then a comma */
4008 if (brace && t->type == TOK_OTHER && !strcmp(t->text, "}"))
4009 break; /* ... or a brace */
4010 t = t->next;
4011 paramlen[i]++;
4016 * OK, we have a MMacro structure together with a set of
4017 * parameters. We must now go through the expansion and push
4018 * copies of each Line on to istk->expansion. Substitution of
4019 * parameter tokens and macro-local tokens doesn't get done
4020 * until the single-line macro substitution process; this is
4021 * because delaying them allows us to change the semantics
4022 * later through %rotate.
4024 * First, push an end marker on to istk->expansion, mark this
4025 * macro as in progress, and set up its invocation-specific
4026 * variables.
4028 ll = nasm_malloc(sizeof(Line));
4029 ll->next = istk->expansion;
4030 ll->finishes = m;
4031 ll->first = NULL;
4032 istk->expansion = ll;
4034 m->in_progress = true;
4035 m->params = params;
4036 m->iline = tline;
4037 m->nparam = nparam;
4038 m->rotate = 0;
4039 m->paramlen = paramlen;
4040 m->unique = unique++;
4041 m->lineno = 0;
4043 m->next_active = istk->mstk;
4044 istk->mstk = m;
4046 for (l = m->expansion; l; l = l->next) {
4047 Token **tail;
4049 ll = nasm_malloc(sizeof(Line));
4050 ll->finishes = NULL;
4051 ll->next = istk->expansion;
4052 istk->expansion = ll;
4053 tail = &ll->first;
4055 for (t = l->first; t; t = t->next) {
4056 Token *x = t;
4057 switch (t->type) {
4058 case TOK_PREPROC_Q:
4059 tt = *tail = new_Token(NULL, TOK_ID, mname, 0);
4060 break;
4061 case TOK_PREPROC_QQ:
4062 tt = *tail = new_Token(NULL, TOK_ID, m->name, 0);
4063 break;
4064 case TOK_PREPROC_ID:
4065 if (t->text[1] == '0' && t->text[2] == '0') {
4066 dont_prepend = -1;
4067 x = label;
4068 if (!x)
4069 continue;
4071 /* fall through */
4072 default:
4073 tt = *tail = new_Token(NULL, x->type, x->text, 0);
4074 break;
4076 tail = &tt->next;
4078 *tail = NULL;
4082 * If we had a label, push it on as the first line of
4083 * the macro expansion.
4085 if (label) {
4086 if (dont_prepend < 0)
4087 free_tlist(startline);
4088 else {
4089 ll = nasm_malloc(sizeof(Line));
4090 ll->finishes = NULL;
4091 ll->next = istk->expansion;
4092 istk->expansion = ll;
4093 ll->first = startline;
4094 if (!dont_prepend) {
4095 while (label->next)
4096 label = label->next;
4097 label->next = tt = new_Token(NULL, TOK_OTHER, ":", 0);
4102 list->uplevel(m->nolist ? LIST_MACRO_NOLIST : LIST_MACRO);
4104 return 1;
4108 * Since preprocessor always operate only on the line that didn't
4109 * arrived yet, we should always use ERR_OFFBY1. Also since user
4110 * won't want to see same error twice (preprocessing is done once
4111 * per pass) we will want to show errors only during pass one.
4113 static void error(int severity, const char *fmt, ...)
4115 va_list arg;
4116 char buff[1024];
4118 /* If we're in a dead branch of IF or something like it, ignore the error */
4119 if (istk && istk->conds && !emitting(istk->conds->state))
4120 return;
4122 va_start(arg, fmt);
4123 vsnprintf(buff, sizeof(buff), fmt, arg);
4124 va_end(arg);
4126 if (istk && istk->mstk && istk->mstk->name)
4127 _error(severity | ERR_PASS1, "(%s:%d) %s", istk->mstk->name,
4128 istk->mstk->lineno, buff);
4129 else
4130 _error(severity | ERR_PASS1, "%s", buff);
4133 static void
4134 pp_reset(char *file, int apass, efunc errfunc, evalfunc eval,
4135 ListGen * listgen, StrList **deplist)
4137 _error = errfunc;
4138 cstk = NULL;
4139 istk = nasm_malloc(sizeof(Include));
4140 istk->next = NULL;
4141 istk->conds = NULL;
4142 istk->expansion = NULL;
4143 istk->mstk = NULL;
4144 istk->fp = fopen(file, "r");
4145 istk->fname = NULL;
4146 src_set_fname(nasm_strdup(file));
4147 src_set_linnum(0);
4148 istk->lineinc = 1;
4149 if (!istk->fp)
4150 error(ERR_FATAL | ERR_NOFILE, "unable to open input file `%s'",
4151 file);
4152 defining = NULL;
4153 nested_mac_count = 0;
4154 nested_rep_count = 0;
4155 init_macros();
4156 unique = 0;
4157 if (tasm_compatible_mode) {
4158 stdmacpos = nasm_stdmac;
4159 } else {
4160 stdmacpos = nasm_stdmac_after_tasm;
4162 any_extrastdmac = extrastdmac && *extrastdmac;
4163 do_predef = true;
4164 list = listgen;
4165 evaluate = eval;
4166 pass = apass;
4167 dephead = deptail = deplist;
4168 if (deplist) {
4169 StrList *sl = nasm_malloc(strlen(file)+1+sizeof sl->next);
4170 sl->next = NULL;
4171 strcpy(sl->str, file);
4172 *deptail = sl;
4173 deptail = &sl->next;
4177 static char *pp_getline(void)
4179 char *line;
4180 Token *tline;
4182 while (1) {
4184 * Fetch a tokenized line, either from the macro-expansion
4185 * buffer or from the input file.
4187 tline = NULL;
4188 while (istk->expansion && istk->expansion->finishes) {
4189 Line *l = istk->expansion;
4190 if (!l->finishes->name && l->finishes->in_progress > 1) {
4191 Line *ll;
4194 * This is a macro-end marker for a macro with no
4195 * name, which means it's not really a macro at all
4196 * but a %rep block, and the `in_progress' field is
4197 * more than 1, meaning that we still need to
4198 * repeat. (1 means the natural last repetition; 0
4199 * means termination by %exitrep.) We have
4200 * therefore expanded up to the %endrep, and must
4201 * push the whole block on to the expansion buffer
4202 * again. We don't bother to remove the macro-end
4203 * marker: we'd only have to generate another one
4204 * if we did.
4206 l->finishes->in_progress--;
4207 for (l = l->finishes->expansion; l; l = l->next) {
4208 Token *t, *tt, **tail;
4210 ll = nasm_malloc(sizeof(Line));
4211 ll->next = istk->expansion;
4212 ll->finishes = NULL;
4213 ll->first = NULL;
4214 tail = &ll->first;
4216 for (t = l->first; t; t = t->next) {
4217 if (t->text || t->type == TOK_WHITESPACE) {
4218 tt = *tail =
4219 new_Token(NULL, t->type, t->text, 0);
4220 tail = &tt->next;
4224 istk->expansion = ll;
4226 } else {
4228 * Check whether a `%rep' was started and not ended
4229 * within this macro expansion. This can happen and
4230 * should be detected. It's a fatal error because
4231 * I'm too confused to work out how to recover
4232 * sensibly from it.
4234 if (defining) {
4235 if (defining->name)
4236 error(ERR_PANIC,
4237 "defining with name in expansion");
4238 else if (istk->mstk->name)
4239 error(ERR_FATAL,
4240 "`%%rep' without `%%endrep' within"
4241 " expansion of macro `%s'",
4242 istk->mstk->name);
4246 * FIXME: investigate the relationship at this point between
4247 * istk->mstk and l->finishes
4250 MMacro *m = istk->mstk;
4251 istk->mstk = m->next_active;
4252 if (m->name) {
4254 * This was a real macro call, not a %rep, and
4255 * therefore the parameter information needs to
4256 * be freed.
4258 nasm_free(m->params);
4259 free_tlist(m->iline);
4260 nasm_free(m->paramlen);
4261 l->finishes->in_progress = false;
4262 } else
4263 free_mmacro(m);
4265 istk->expansion = l->next;
4266 nasm_free(l);
4267 list->downlevel(LIST_MACRO);
4270 while (1) { /* until we get a line we can use */
4272 if (istk->expansion) { /* from a macro expansion */
4273 char *p;
4274 Line *l = istk->expansion;
4275 if (istk->mstk)
4276 istk->mstk->lineno++;
4277 tline = l->first;
4278 istk->expansion = l->next;
4279 nasm_free(l);
4280 p = detoken(tline, false);
4281 list->line(LIST_MACRO, p);
4282 nasm_free(p);
4283 break;
4285 line = read_line();
4286 if (line) { /* from the current input file */
4287 line = prepreproc(line);
4288 tline = tokenize(line);
4289 nasm_free(line);
4290 break;
4293 * The current file has ended; work down the istk
4296 Include *i = istk;
4297 fclose(i->fp);
4298 if (i->conds)
4299 error(ERR_FATAL,
4300 "expected `%%endif' before end of file");
4301 /* only set line and file name if there's a next node */
4302 if (i->next) {
4303 src_set_linnum(i->lineno);
4304 nasm_free(src_set_fname(i->fname));
4306 istk = i->next;
4307 list->downlevel(LIST_INCLUDE);
4308 nasm_free(i);
4309 if (!istk)
4310 return NULL;
4315 * We must expand MMacro parameters and MMacro-local labels
4316 * _before_ we plunge into directive processing, to cope
4317 * with things like `%define something %1' such as STRUC
4318 * uses. Unless we're _defining_ a MMacro, in which case
4319 * those tokens should be left alone to go into the
4320 * definition; and unless we're in a non-emitting
4321 * condition, in which case we don't want to meddle with
4322 * anything.
4324 if (!defining && !(istk->conds && !emitting(istk->conds->state))
4325 && !(istk->mstk && !istk->mstk->in_progress))
4326 tline = expand_mmac_params(tline);
4329 * Check the line to see if it's a preprocessor directive.
4331 if (do_directive(tline) == DIRECTIVE_FOUND) {
4332 continue;
4333 } else if (defining) {
4335 * We're defining a multi-line macro. We emit nothing
4336 * at all, and just
4337 * shove the tokenized line on to the macro definition.
4339 Line *l = nasm_malloc(sizeof(Line));
4340 l->next = defining->expansion;
4341 l->first = tline;
4342 l->finishes = NULL;
4343 defining->expansion = l;
4344 continue;
4345 } else if (istk->conds && !emitting(istk->conds->state)) {
4347 * We're in a non-emitting branch of a condition block.
4348 * Emit nothing at all, not even a blank line: when we
4349 * emerge from the condition we'll give a line-number
4350 * directive so we keep our place correctly.
4352 free_tlist(tline);
4353 continue;
4354 } else if (istk->mstk && !istk->mstk->in_progress) {
4356 * We're in a %rep block which has been terminated, so
4357 * we're walking through to the %endrep without
4358 * emitting anything. Emit nothing at all, not even a
4359 * blank line: when we emerge from the %rep block we'll
4360 * give a line-number directive so we keep our place
4361 * correctly.
4363 free_tlist(tline);
4364 continue;
4365 } else {
4366 tline = expand_smacro(tline);
4367 if (!expand_mmacro(tline)) {
4369 * De-tokenize the line again, and emit it.
4371 line = detoken(tline, true);
4372 free_tlist(tline);
4373 break;
4374 } else {
4375 continue; /* expand_mmacro calls free_tlist */
4380 return line;
4383 static void pp_cleanup(int pass)
4385 if (defining) {
4386 if(defining->name) {
4387 error(ERR_NONFATAL,
4388 "end of file while still defining macro `%s'",
4389 defining->name);
4390 } else {
4391 error(ERR_NONFATAL, "end of file while still in %%rep");
4394 free_mmacro(defining);
4396 while (cstk)
4397 ctx_pop();
4398 free_macros();
4399 while (istk) {
4400 Include *i = istk;
4401 istk = istk->next;
4402 fclose(i->fp);
4403 nasm_free(i->fname);
4404 nasm_free(i);
4406 while (cstk)
4407 ctx_pop();
4408 nasm_free(src_set_fname(NULL));
4409 if (pass == 0) {
4410 IncPath *i;
4411 free_llist(predef);
4412 delete_Blocks();
4413 while ((i = ipath)) {
4414 ipath = i->next;
4415 if (i->path)
4416 nasm_free(i->path);
4417 nasm_free(i);
4422 void pp_include_path(char *path)
4424 IncPath *i;
4426 i = nasm_malloc(sizeof(IncPath));
4427 i->path = path ? nasm_strdup(path) : NULL;
4428 i->next = NULL;
4430 if (ipath != NULL) {
4431 IncPath *j = ipath;
4432 while (j->next != NULL)
4433 j = j->next;
4434 j->next = i;
4435 } else {
4436 ipath = i;
4440 void pp_pre_include(char *fname)
4442 Token *inc, *space, *name;
4443 Line *l;
4445 name = new_Token(NULL, TOK_INTERNAL_STRING, fname, 0);
4446 space = new_Token(name, TOK_WHITESPACE, NULL, 0);
4447 inc = new_Token(space, TOK_PREPROC_ID, "%include", 0);
4449 l = nasm_malloc(sizeof(Line));
4450 l->next = predef;
4451 l->first = inc;
4452 l->finishes = NULL;
4453 predef = l;
4456 void pp_pre_define(char *definition)
4458 Token *def, *space;
4459 Line *l;
4460 char *equals;
4462 equals = strchr(definition, '=');
4463 space = new_Token(NULL, TOK_WHITESPACE, NULL, 0);
4464 def = new_Token(space, TOK_PREPROC_ID, "%define", 0);
4465 if (equals)
4466 *equals = ' ';
4467 space->next = tokenize(definition);
4468 if (equals)
4469 *equals = '=';
4471 l = nasm_malloc(sizeof(Line));
4472 l->next = predef;
4473 l->first = def;
4474 l->finishes = NULL;
4475 predef = l;
4478 void pp_pre_undefine(char *definition)
4480 Token *def, *space;
4481 Line *l;
4483 space = new_Token(NULL, TOK_WHITESPACE, NULL, 0);
4484 def = new_Token(space, TOK_PREPROC_ID, "%undef", 0);
4485 space->next = tokenize(definition);
4487 l = nasm_malloc(sizeof(Line));
4488 l->next = predef;
4489 l->first = def;
4490 l->finishes = NULL;
4491 predef = l;
4495 * Added by Keith Kanios:
4497 * This function is used to assist with "runtime" preprocessor
4498 * directives. (e.g. pp_runtime("%define __BITS__ 64");)
4500 * ERRORS ARE IGNORED HERE, SO MAKE COMPLETELY SURE THAT YOU
4501 * PASS A VALID STRING TO THIS FUNCTION!!!!!
4504 void pp_runtime(char *definition)
4506 Token *def;
4508 def = tokenize(definition);
4509 if(do_directive(def) == NO_DIRECTIVE_FOUND)
4510 free_tlist(def);
4514 void pp_extra_stdmac(macros_t *macros)
4516 extrastdmac = macros;
4519 static void make_tok_num(Token * tok, int64_t val)
4521 char numbuf[20];
4522 snprintf(numbuf, sizeof(numbuf), "%"PRId64"", val);
4523 tok->text = nasm_strdup(numbuf);
4524 tok->type = TOK_NUMBER;
4527 Preproc nasmpp = {
4528 pp_reset,
4529 pp_getline,
4530 pp_cleanup