No C++ comments, please!
[nasm.git] / nasm.c
blob031f31a2213588fbcbe5742ed0fe282e2483213c
1 /* The Netwide Assembler main program module
3 * The Netwide Assembler is copyright (C) 1996 Simon Tatham and
4 * Julian Hall. All rights reserved. The software is
5 * redistributable under the licence given in the file "Licence"
6 * distributed in the NASM archive.
7 */
9 #include <stdio.h>
10 #include <stdarg.h>
11 #include <stdlib.h>
12 #include <string.h>
13 #include <ctype.h>
15 #include "nasm.h"
16 #include "nasmlib.h"
17 #include "insns.h"
18 #include "preproc.h"
19 #include "parser.h"
20 #include "eval.h"
21 #include "assemble.h"
22 #include "labels.h"
23 #include "outform.h"
24 #include "listing.h"
/*
 * One record per forward-referencing operand. assemble_file() appends
 * a record (source line number + operand index) during pass 1 and
 * reads the records back in order during pass 2.
 */
26 struct forwrefinfo { /* info held on forward refs. */
27 int lineno;
28 int operand;
/* Prototypes for routines that are used before their definitions. */
31 static int get_bits (char *value);
32 static unsigned long get_cpu (char *cpu_str);
33 static void parse_cmdline (int, char **);
34 static void assemble_file (char *);
35 static int getkw (char *buf, char **value);
36 static void register_output_formats(void);
37 static void report_error (int severity, const char *fmt, ...);
38 static void usage(void);
/* using_debug_info is set by the -g option; tasm_compatible_mode by -t. */
40 static int using_debug_info;
41 int tasm_compatible_mode = FALSE;
42 int pass0;
/* File names filled in from the command line (input, -o, -l). */
44 static char inname[FILENAME_MAX];
45 static char outname[FILENAME_MAX];
46 static char listname[FILENAME_MAX];
47 static int globallineno; /* for forward-reference tracking */
48 /* static int pass = 0; */
49 static struct ofmt *ofmt = NULL;
51 static FILE *error_file; /* Where to write error messages */
53 static FILE *ofile = NULL;
54 int optimizing = -1; /* number of optimization passes to take */
55 static int sb, cmd_sb = 16; /* by default */
56 static unsigned long cmd_cpu = IF_PLEVEL; /* highest level by default */
57 static unsigned long cpu = IF_PLEVEL; /* passed to insn_size & assemble.c */
58 int global_offset_changed; /* referenced in labels.c */
60 static loc_t location;
61 int in_abs_seg; /* Flag we are in ABSOLUTE seg */
63 static struct RAA *offsets;
64 static long abs_offset;
66 static struct SAA *forwrefs; /* keep track of forward references */
67 static struct forwrefinfo *forwref;
69 static Preproc *preproc;
/*
 * What main() does with the input file. main() defaults to op_normal;
 * the -e option selects op_preprocess and -M selects op_depend.
 */
70 enum op_type {
71 op_normal, /* Preprocess and assemble */
72 op_preprocess, /* Preprocess only */
73 op_depend /* Generate dependencies */
75 static enum op_type operating_mode;
/*
 * suppressed[] is indexed by warning number; a nonzero entry means the
 * warning is not printed. Entries are changed by the -w option and by
 * the [WARNING] directive.
 */
78 * Which of the suppressible warnings are suppressed. Entry zero
79 * doesn't do anything. Initial defaults are given here.
81 static char suppressed[1+ERR_WARN_MAX] = {
82 0, TRUE, TRUE, TRUE, FALSE, TRUE
86 * The option names for the suppressible warnings. As before, entry
87 * zero does nothing.
89 static const char *suppressed_names[1+ERR_WARN_MAX] = {
90 NULL, "macro-params", "macro-selfref", "orphan-labels", "number-overflow",
91 "gnu-elf-extensions"
95 * The explanations for the suppressible warnings. As before, entry
96 * zero does nothing.
98 static const char *suppressed_what[1+ERR_WARN_MAX] = {
99 NULL,
100 "macro calls with wrong no. of params",
101 "cyclic macro self-references",
102 "labels alone on lines without trailing `:'",
103 "numeric constants greater than 0xFFFFFFFF",
104 "using 8- or 16-bit relocation in ELF, a GNU extension"
/* The -a option makes `preproc' point at no_pp instead of nasmpp. */
108 * This is a null preprocessor which just copies lines from input
109 * to output. It's used when someone explicitly requests that NASM
110 * not preprocess their source file.
113 static void no_pp_reset (char *, int, efunc, evalfunc, ListGen *);
114 static char *no_pp_getline (void);
115 static void no_pp_cleanup (int);
116 static Preproc no_pp = {
117 no_pp_reset,
118 no_pp_getline,
119 no_pp_cleanup
/*
 * While in_abs_seg is set the current offset is abs_offset; otherwise
 * it is the entry for location.segment in the `offsets' array.
 */
123 * get/set current offset...
125 #define GET_CURR_OFFS (in_abs_seg?abs_offset:\
126 raa_read(offsets,location.segment))
127 #define SET_CURR_OFFS(x) (in_abs_seg?(void)(abs_offset=(x)):\
128 (void)(offsets=raa_write(offsets,location.segment,(x))))
/*
 * main() prints the usage text when want_usage is set and returns 1
 * when terminate_after_phase is set.
 */
130 static int want_usage;
131 static int terminate_after_phase;
132 int user_nolist = 0; /* fbk 9/2/00 */
/*
 * Emit `line' followed by a newline. The text goes to `outfile' when
 * one is given, and to standard output when `outfile' is NULL.
 */
static void nasm_fputs(const char *line, FILE *outfile)
{
    if (!outfile) {
        puts(line);             /* puts() supplies the newline itself */
        return;
    }

    fputs(line, outfile);
    fputc('\n', outfile);
}
/*
 * Program entry point.
 *
 * Initialises the global state, parses the command line and then runs
 * one of three modes selected by operating_mode: dependency output
 * (op_depend), preprocess only (op_preprocess) or a full assembly
 * (op_normal). Returns 1 when terminate_after_phase is set and 0
 * otherwise.
 */
143 int main(int argc, char **argv)
145 pass0 = 1;
146 want_usage = terminate_after_phase = FALSE;
148 nasm_set_malloc_error (report_error);
149 offsets = raa_init();
150 forwrefs = saa_init ((long)sizeof(struct forwrefinfo));
/* Defaults that the command line may override (-a, -e, -M, -s, -E). */
152 preproc = &nasmpp;
153 operating_mode = op_normal;
155 error_file = stderr;
157 seg_init();
159 register_output_formats();
161 parse_cmdline(argc, argv);
/* A command line error stops here, before any file is touched. */
163 if (terminate_after_phase)
165 if (want_usage)
166 usage();
167 return 1;
170 if (ofmt->stdmac)
171 pp_extra_stdmac (ofmt->stdmac);
172 parser_global_info (ofmt, &location);
173 eval_global_info (ofmt, lookup_label, &location);
175 /* define some macros dependent of command-line */
/* NOTE(review): sprintf into temp[64] relies on ofmt->shortname being short - confirm. */
177 char temp [64];
178 sprintf (temp, "__OUTPUT_FORMAT__=%s\n", ofmt->shortname);
179 pp_pre_define (temp);
182 switch ( operating_mode ) {
/*
 * Dependency mode: print "<output>: <input>" on stdout, then run the
 * preprocessor over the whole input, discarding every line it returns.
 */
183 case op_depend:
185 char *line;
186 preproc->reset (inname, 0, report_error, evaluate, &nasmlist);
187 if (outname[0] == '\0')
188 ofmt->filename (inname, outname, report_error);
189 ofile = NULL;
190 fprintf(stdout, "%s: %s", outname, inname);
191 while ( (line = preproc->getline()) )
192 nasm_free (line);
193 preproc->cleanup(0);
194 putc('\n', stdout);
196 break;
/*
 * Preprocess-only mode: write the preprocessed lines to outname, or to
 * stdout when no output name was given, adding %line directives.
 */
198 case op_preprocess:
200 char *line;
201 char *file_name = NULL;
202 long prior_linnum=0;
203 int lineinc=0;
205 if (*outname) {
206 ofile = fopen(outname, "w");
207 if (!ofile)
208 report_error (ERR_FATAL | ERR_NOFILE,
209 "unable to open output file `%s'", outname);
210 } else
211 ofile = NULL;
213 location.known = FALSE;
215 /* pass = 1; */
216 preproc->reset (inname, 2, report_error, evaluate, &nasmlist);
217 while ( (line = preproc->getline()) ) {
219 * We generate %line directives if needed for later programs
221 long linnum = prior_linnum += lineinc;
222 int altline = src_get(&linnum, &file_name);
223 if (altline) {
224 if (altline==1 && lineinc==1)
225 nasm_fputs("", ofile);
226 else {
227 lineinc = (altline != -1 || lineinc!=1);
228 fprintf(ofile ? ofile : stdout, "%%line %ld+%d %s\n",
229 linnum, lineinc, file_name);
231 prior_linnum = linnum;
233 nasm_fputs(line, ofile);
234 nasm_free (line);
236 nasm_free(file_name);
237 preproc->cleanup(0);
238 if (ofile)
239 fclose(ofile);
/* The output file is deleted again if an error was flagged. */
240 if (ofile && terminate_after_phase)
241 remove(outname);
243 break;
/* Normal mode: open the object file and assemble into it. */
245 case op_normal:
248 * We must call ofmt->filename _anyway_, even if the user
249 * has specified their own output file, because some
250 * formats (eg OBJ and COFF) use ofmt->filename to find out
251 * the name of the input file and then put that inside the
252 * file.
254 ofmt->filename (inname, outname, report_error);
256 ofile = fopen(outname, "wb");
257 if (!ofile) {
258 report_error (ERR_FATAL | ERR_NOFILE,
259 "unable to open output file `%s'", outname);
263 * We must call init_labels() before ofmt->init() since
264 * some object formats will want to define labels in their
265 * init routines. (eg OS/2 defines the FLAT group)
267 init_labels ();
269 ofmt->init (ofile, report_error, define_label, evaluate);
271 assemble_file (inname);
273 if (!terminate_after_phase) {
274 ofmt->cleanup (using_debug_info);
275 cleanup_labels ();
276 } else {
278 * We had an fclose on the output file here, but we
279 * actually do that in all the object file drivers as well,
280 * so we're leaving out the one here.
281 * fclose (ofile);
/* On failure both the object file and any listing file are removed. */
283 remove(outname);
284 if (listname[0])
285 remove(listname);
288 break;
291 if (want_usage)
292 usage();
/* Release the structures allocated at the top of main(). */
294 raa_free (offsets);
295 saa_free (forwrefs);
296 eval_cleanup ();
297 nasmlib_cleanup ();
299 if (terminate_after_phase)
300 return 1;
301 else
302 return 0;
307 * Get a parameter for a command line option.
308 * First arg must be in the form of e.g. -f...
310 static char *get_param (char *p, char *q, int *advance)
312 *advance = 0;
313 if (p[2]) /* the parameter's in the option */
315 p += 2;
316 while (isspace(*p))
317 p++;
318 return p;
320 if (q && q[0])
322 *advance = 1;
323 return q;
325 report_error (ERR_NONFATAL | ERR_NOFILE | ERR_USAGE,
326 "option `-%c' requires an argument",
327 p[1]);
328 return NULL;
/*
 * Table of the long (`--name') command line options. process_arg()
 * compares the text after `--' with each label and then switches on
 * the index of the matching entry, so the OPT_* values below equal the
 * positions of their entries. The entry with a NULL label ends the
 * table.
 */
331 struct textargs
333 const char *label;
334 int value;
337 #define OPT_PREFIX 0
338 #define OPT_POSTFIX 1
339 struct textargs textopts[] =
341 {"prefix",OPT_PREFIX},
342 {"postfix",OPT_POSTFIX},
343 {NULL,0}
/* Set to 1 by a bare `--'; from then on no argument is read as an option. */
347 int stopoptions = 0;
348 static int process_arg (char *p, char *q)
350 char *param;
351 int i, advance = 0;
353 if (!p || !p[0])
354 return 0;
356 if (p[0]=='-' && ! stopoptions)
358 switch (p[1]) {
359 case 's':
360 error_file = stdout;
361 break;
362 case 'o': /* these parameters take values */
363 case 'O':
364 case 'f':
365 case 'p':
366 case 'P':
367 case 'd':
368 case 'D':
369 case 'i':
370 case 'I':
371 case 'l':
372 case 'E':
373 case 'F':
374 if ( !(param = get_param (p, q, &advance)) )
375 break;
376 if (p[1]=='o') { /* output file */
377 strcpy (outname, param);
378 } else if (p[1]=='f') { /* output format */
379 ofmt = ofmt_find(param);
380 if (!ofmt) {
381 report_error (ERR_FATAL | ERR_NOFILE | ERR_USAGE,
382 "unrecognised output format `%s' - "
383 "use -hf for a list",
384 param);
386 else
387 ofmt->current_dfmt = ofmt->debug_formats[0];
388 } else if (p[1]=='O') { /* Optimization level */
389 int opt;
390 if (!isdigit(*param)) report_error(ERR_FATAL,
391 "command line optimization level must be 0..3 or <nn>");
392 opt = atoi(param);
393 if (opt<=0) optimizing = -1; /* 0.98 behaviour */
394 else if (opt==1) optimizing = 0; /* Two passes, 0.98.09 behavior */
395 else if (opt<=3) optimizing = opt*5; /* Multiple passes */
396 else optimizing = opt; /* Multiple passes */
397 } else if (p[1]=='P' || p[1]=='p') { /* pre-include */
398 pp_pre_include (param);
399 } else if (p[1]=='D' || p[1]=='d') { /* pre-define */
400 pp_pre_define (param);
401 } else if (p[1]=='U' || p[1]=='u') { /* un-define */
402 pp_pre_undefine (param);
403 } else if (p[1]=='I' || p[1]=='i') { /* include search path */
404 pp_include_path (param);
405 } else if (p[1]=='l') { /* listing file */
406 strcpy (listname, param);
407 } else if (p[1]=='E') { /* error messages file */
408 error_file = fopen(param, "w");
409 if ( !error_file ) {
410 error_file = stderr; /* Revert to default! */
411 report_error (ERR_FATAL | ERR_NOFILE | ERR_USAGE,
412 "cannot open file `%s' for error messages",
413 param);
415 } else if (p[1] == 'F') { /* specify debug format */
416 ofmt->current_dfmt = dfmt_find(ofmt, param);
417 if (!ofmt->current_dfmt) {
418 report_error (ERR_FATAL | ERR_NOFILE | ERR_USAGE,
419 "unrecognized debug format `%s' for"
420 " output format `%s'",
421 param, ofmt->shortname);
424 break;
425 case 'g':
426 using_debug_info = TRUE;
427 break;
428 case 'h':
429 printf("usage: nasm [-@ response file] [-o outfile] [-f format] "
430 "[-l listfile]\n"
431 " [options...] [--] filename\n"
432 " or nasm -r for version info (obsolete)\n"
433 " or nasm -v for version info (preferred)\n\n"
434 " -t Assemble in SciTech TASM compatible mode\n"
435 " -g Generate debug information in selected format.\n");
436 printf(" -e preprocess only (writes output to stdout by default)\n"
437 " -a don't preprocess (assemble only)\n"
438 " -M generate Makefile dependencies on stdout\n\n"
439 " -E<file> redirect error messages to file\n"
440 " -s redirect error messages to stdout\n\n"
441 " -F format select a debugging format\n\n"
442 " -I<path> adds a pathname to the include file path\n");
443 printf(" -O<digit> optimize branch offsets (-O0 disables, default)\n"
444 " -P<file> pre-includes a file\n"
445 " -D<macro>[=<value>] pre-defines a macro\n"
446 " -U<macro> undefines a macro\n"
447 " -w+foo enables warnings about foo; -w-foo disables them\n"
448 "where foo can be:\n");
449 for (i=1; i<=ERR_WARN_MAX; i++)
450 printf(" %-23s %s (default %s)\n",
451 suppressed_names[i], suppressed_what[i],
452 suppressed[i] ? "off" : "on");
453 printf ("\nresponse files should contain command line parameters"
454 ", one per line.\n");
455 if (p[2] == 'f') {
456 printf("\nvalid output formats for -f are"
457 " (`*' denotes default):\n");
458 ofmt_list(ofmt, stdout);
460 else {
461 printf ("\nFor a list of valid output formats, use -hf.\n");
462 printf ("For a list of debug formats, use -f <form> -y.\n");
464 exit (0); /* never need usage message here */
465 break;
466 case 'y':
467 printf("\nvalid debug formats for '%s' output format are"
468 " ('*' denotes default):\n",
469 ofmt->shortname);
470 dfmt_list(ofmt, stdout);
471 exit(0);
472 break;
473 case 't':
474 tasm_compatible_mode = TRUE;
475 break;
476 case 'r':
477 case 'v':
478 printf("NASM version %s compiled "
479 #ifdef DEBUG
480 "with -DDEBUG "
481 #endif
482 "on " __DATE__ "\n", NASM_VER);
483 exit (0); /* never need usage message here */
484 break;
485 case 'e': /* preprocess only */
486 operating_mode = op_preprocess;
487 break;
488 case 'a': /* assemble only - don't preprocess */
489 preproc = &no_pp;
490 break;
491 case 'w':
492 if (p[2] != '+' && p[2] != '-') {
493 report_error (ERR_NONFATAL | ERR_NOFILE | ERR_USAGE,
494 "invalid option to `-w'");
495 } else {
496 for (i=1; i<=ERR_WARN_MAX; i++)
497 if (!nasm_stricmp(p+3, suppressed_names[i]))
498 break;
499 if (i <= ERR_WARN_MAX)
500 suppressed[i] = (p[2] == '-');
501 else
502 report_error (ERR_NONFATAL | ERR_NOFILE | ERR_USAGE,
503 "invalid option to `-w'");
505 break;
506 case 'M':
507 operating_mode = op_depend;
508 break;
510 case '-':
512 int s;
514 if (p[2]==0) { /* -- => stop processing options */
515 stopoptions = 1;
516 break;
518 for(s=0; textopts[s].label; s++)
520 if(!nasm_stricmp(p+2, textopts[s].label))
522 break;
526 switch(s)
529 case OPT_PREFIX:
530 case OPT_POSTFIX:
532 if (!q)
534 report_error (ERR_NONFATAL | ERR_NOFILE | ERR_USAGE,
535 "option `--%s' requires an argument",
536 p+2);
537 break;
539 else
541 advance = 1, param = q;
544 if(s == OPT_PREFIX)
546 strncpy(lprefix,param,PREFIX_MAX-1);
547 lprefix[PREFIX_MAX-1]=0;
548 break;
550 if(s == OPT_POSTFIX)
552 strncpy(lpostfix,param,POSTFIX_MAX-1);
553 lpostfix[POSTFIX_MAX-1]=0;
554 break;
556 break;
558 default:
560 report_error (ERR_NONFATAL | ERR_NOFILE | ERR_USAGE,
561 "unrecognised option `--%s'",
562 p+2);
563 break;
566 break;
569 default:
570 if (!ofmt->setinfo(GI_SWITCH,&p))
571 report_error (ERR_NONFATAL | ERR_NOFILE | ERR_USAGE,
572 "unrecognised option `-%c'",
573 p[1]);
574 break;
577 else
579 if (*inname) {
580 report_error (ERR_NONFATAL | ERR_NOFILE | ERR_USAGE,
581 "more than one input file specified");
582 } else
583 strcpy(inname, p);
586 return advance;
#define ARG_BUF_DELTA 128

/*
 * Process a `-@' response file that holds one command line argument
 * per line.
 *
 * Each line is read in full (the line buffer grows as needed), has its
 * line ending and surrounding white space removed, and is then handed
 * to process_arg() as the argument following the previous line, so
 * that an option on one line can take its parameter from the next.
 * The final pending argument is processed once the end of the file is
 * reached. The caller keeps ownership of `rfile' and closes it.
 */
static void process_respfile (FILE *rfile)
{
    char *buffer, *p, *q, *prevarg;
    int bufsize, prevargsize;

    bufsize = prevargsize = ARG_BUF_DELTA;
    buffer = nasm_malloc(ARG_BUF_DELTA);
    prevarg = nasm_malloc(ARG_BUF_DELTA);
    prevarg[0] = '\0';

    while (1) {                 /* Loop to handle all lines in file */

        p = buffer;
        while (1) {             /* Loop to handle long lines */
            q = fgets(p, bufsize-(p-buffer), rfile);
            if (!q)
                break;
            p += strlen(p);
            if (p > buffer && p[-1] == '\n')
                break;
            if (p-buffer > bufsize-10) {
                int offset = p - buffer;

                bufsize += ARG_BUF_DELTA;
                buffer = nasm_realloc(buffer, bufsize);
                p = buffer + offset;
            }
        }

        if (!q && p == buffer) {
            /* End of file: flush the argument still waiting. */
            if (prevarg[0])
                process_arg (prevarg, NULL);
            nasm_free (buffer);
            nasm_free (prevarg);
            return;
        }

        /*
         * Play safe: remove CRs, LFs and any spurious ^Zs, if any of
         * them are present at the end of the line.
         */
        *(p = &buffer[strcspn(buffer, "\r\n\032")]) = '\0';

        while (p > buffer && isspace((unsigned char)p[-1]))
            *--p = '\0';

        p = buffer;
        while (isspace((unsigned char)*p))
            p++;

        /* If this line was consumed as the previous option's
         * parameter, nothing is left pending. */
        if (process_arg (prevarg, p))
            *p = '\0';

        /*
         * The line buffer may have grown by several deltas for one
         * long line, so keep enlarging prevarg until the line fits;
         * growing it only once would let the strcpy below overrun it.
         */
        if (strlen(p) > (size_t)(prevargsize-10)) {
            while (strlen(p) > (size_t)(prevargsize-10))
                prevargsize += ARG_BUF_DELTA;
            prevarg = nasm_realloc(prevarg, prevargsize);
        }
        strcpy (prevarg, p);
    }
}
/*
 * Process the arguments held in a single string instead of an argv
 * array; used for the environment variable and for response files.
 *
 * Arguments are separated by spaces, unless the string starts with a
 * character other than `-', in which case that character is dropped
 * and used as the separator. The string is modified in place: every
 * separator is overwritten with a terminator.
 */
static void process_args (char *args)
{
    char sep = ' ';
    char *cursor = args;
    char *pending = NULL;       /* argument seen but not yet processed */

    if (*cursor && *cursor != '-')
        sep = *cursor++;

    while (*cursor) {
        char *token = cursor;
        char *previous = pending;

        /* Find the end of this token, then blank out the separators. */
        while (*cursor && *cursor != sep)
            cursor++;
        while (*cursor == sep)
            *cursor++ = '\0';

        /* A nonzero result means `token' was used up as the parameter
         * of `previous', so it must not be processed again. */
        pending = process_arg (previous, token) ? NULL : token;
    }

    if (pending)
        process_arg (pending, NULL);
}
677 static void parse_cmdline(int argc, char **argv)
679 FILE *rfile;
680 char *envreal, *envcopy=NULL, *p, *arg;
682 *inname = *outname = *listname = '\0';
685 * First, process the NASMENV environment variable.
687 envreal = getenv("NASMENV");
688 arg = NULL;
689 if (envreal) {
690 envcopy = nasm_strdup(envreal);
691 process_args(envcopy);
692 nasm_free (envcopy);
696 * Now process the actual command line.
698 while (--argc)
700 int i;
701 argv++;
702 if (argv[0][0] == '@') {
703 /* We have a response file, so process this as a set of
704 * arguments like the environment variable. This allows us
705 * to have multiple arguments on a single line, which is
706 * different to the -@resp file processing below for regular
707 * NASM.
709 char *str = malloc(2048);
710 FILE *f = fopen(&argv[0][1],"r");
711 if (!str) {
712 printf("out of memory");
713 exit(-1);
715 if (f) {
716 while (fgets(str,2048,f)) {
717 process_args(str);
719 fclose(f);
721 free(str);
722 argc--;
723 argv++;
725 if (!stopoptions && argv[0][0] == '-' && argv[0][1] == '@') {
726 if ((p = get_param (argv[0], argc > 1 ? argv[1] : NULL, &i))) {
727 if ((rfile = fopen(p, "r"))) {
728 process_respfile (rfile);
729 fclose(rfile);
730 } else
731 report_error (ERR_NONFATAL | ERR_NOFILE | ERR_USAGE,
732 "unable to open response file `%s'", p);
734 } else
735 i = process_arg (argv[0], argc > 1 ? argv[1] : NULL);
736 argv += i, argc -= i;
739 if (!*inname)
740 report_error (ERR_NONFATAL | ERR_NOFILE | ERR_USAGE,
741 "no input file specified");
/*
 * Assemble the source file `fname' into the already opened output
 * format.
 *
 * The file is read through the preprocessor once per pass, for at most
 * pass_max passes. Within a pass every line is either a bracketed
 * directive, recognised by getkw() and handled in the switch below, or
 * is handed to parse_line(). Parsed instructions are only sized with
 * insn_size() while pass1 == 1 and are emitted with assemble() once
 * pass1 == 2. If errors have been flagged by the end of a pass with
 * pass1 == 1, the output file is removed and the program exits.
 */
745 static void assemble_file (char *fname)
747 char * value, * p, * q, * special, * line, debugid[80];
748 insn output_ins;
749 int i, rn_error, validid;
750 long seg, offs;
751 struct tokenval tokval;
752 expr * e;
753 int pass, pass_max;
754 int pass_cnt = 0; /* count actual passes */
756 if (cmd_sb == 32 && cmd_cpu < IF_386)
757 report_error(ERR_FATAL, "command line: "
758 "32-bit segment size requires a higher cpu");
760 pass_max = (optimizing>0 ? optimizing : 0) + 2; /* passes 1, optimizing, then 2 */
761 pass0 = !(optimizing>0); /* start at 1 if not optimizing */
762 for (pass = 1; pass <= pass_max && pass0 <= 2; pass++) {
763 int pass1, pass2;
764 ldfunc def_label;
766 pass1 = pass < pass_max ? 1 : 2; /* seq is 1, 1, 1,..., 1, 2 */
767 pass2 = pass > 1 ? 2 : 1; /* seq is 1, 2, 2,..., 2, 2 */
768 /* pass0 seq is 0, 0, 0,..., 1, 2 */
/* Labels are defined on the first pass and redefined on later ones. */
770 def_label = pass > 1 ? redefine_label : define_label;
773 sb = cmd_sb; /* set 'bits' to command line default */
774 cpu = cmd_cpu;
/* The listing file is only started once pass0 reaches 2. */
775 if (pass0 == 2) {
776 if (*listname)
777 nasmlist.init(listname, report_error);
779 in_abs_seg = FALSE;
780 global_offset_changed = FALSE; /* set by redefine_label */
781 location.segment = ofmt->section(NULL, pass2, &sb);
/* Later passes re-read the forward references and restart all offsets. */
782 if (pass > 1) {
783 saa_rewind (forwrefs);
784 forwref = saa_rstruct (forwrefs);
785 raa_free (offsets);
786 offsets = raa_init();
788 preproc->reset(fname, pass1, report_error, evaluate, &nasmlist);
789 globallineno = 0;
790 if (pass == 1) location.known = TRUE;
791 location.offset = offs = GET_CURR_OFFS;
793 while ( (line = preproc->getline()) )
795 globallineno++;
797 /* here we parse our directives; this is not handled by the 'real'
798 * parser. */
799 if ( (i = getkw (line, &value)) )
801 switch (i) {
802 case 1: /* [SEGMENT n] */
803 seg = ofmt->section (value, pass2, &sb);
804 if (seg == NO_SEG) {
805 report_error (pass1==1 ? ERR_NONFATAL : ERR_PANIC,
806 "segment name `%s' not recognised",
807 value);
808 } else {
809 in_abs_seg = FALSE;
810 location.segment = seg;
812 break;
813 case 2: /* [EXTERN label:special] */
814 if (*value == '$') value++; /* skip initial $ if present */
815 if (pass0 == 2) {
816 q = value;
817 while (*q && *q != ':')
818 q++;
819 if (*q == ':') {
820 *q++ = '\0';
821 ofmt->symdef(value, 0L, 0L, 3, q);
823 } else if (pass == 1) { /* pass == 1 */
824 q = value;
825 validid = TRUE;
826 if (!isidstart(*q))
827 validid = FALSE;
828 while (*q && *q != ':') {
829 if (!isidchar(*q))
830 validid = FALSE;
831 q++;
833 if (!validid) {
834 report_error (ERR_NONFATAL,
835 "identifier expected after EXTERN");
836 break;
838 if (*q == ':') {
839 *q++ = '\0';
840 special = q;
841 } else
842 special = NULL;
843 if (!is_extern(value)) { /* allow re-EXTERN to be ignored */
844 int temp = pass0;
845 pass0 = 1; /* fake pass 1 in labels.c */
846 declare_as_global (value, special, report_error);
847 define_label (value, seg_alloc(), 0L, NULL, FALSE, TRUE,
848 ofmt, report_error);
849 pass0 = temp;
851 } /* else pass0 == 1 */
852 break;
853 case 3: /* [BITS bits] */
854 sb = get_bits(value);
855 break;
856 case 4: /* [GLOBAL symbol:special] */
857 if (*value == '$') value++; /* skip initial $ if present */
858 if (pass0 == 2) { /* pass 2 */
859 q = value;
860 while (*q && *q != ':')
861 q++;
862 if (*q == ':') {
863 *q++ = '\0';
864 ofmt->symdef(value, 0L, 0L, 3, q);
866 } else if (pass2 == 1) { /* pass == 1 */
867 q = value;
868 validid = TRUE;
869 if (!isidstart(*q))
870 validid = FALSE;
871 while (*q && *q != ':') {
872 if (!isidchar(*q))
873 validid = FALSE;
874 q++;
876 if (!validid) {
877 report_error (ERR_NONFATAL,
878 "identifier expected after GLOBAL");
879 break;
881 if (*q == ':') {
882 *q++ = '\0';
883 special = q;
884 } else
885 special = NULL;
886 declare_as_global (value, special, report_error);
887 } /* pass == 1 */
888 break;
889 case 5: /* [COMMON symbol size:special] */
890 if (*value == '$') value++; /* skip initial $ if present */
891 if (pass0 == 1) {
892 p = value;
893 validid = TRUE;
894 if (!isidstart(*p))
895 validid = FALSE;
896 while (*p && !isspace(*p)) {
897 if (!isidchar(*p))
898 validid = FALSE;
899 p++;
901 if (!validid) {
902 report_error (ERR_NONFATAL,
903 "identifier expected after COMMON");
904 break;
906 if (*p) {
907 long size;
909 while (*p && isspace(*p))
910 *p++ = '\0';
911 q = p;
912 while (*q && *q != ':')
913 q++;
914 if (*q == ':') {
915 *q++ = '\0';
916 special = q;
917 } else
918 special = NULL;
919 size = readnum (p, &rn_error);
920 if (rn_error)
921 report_error (ERR_NONFATAL, "invalid size specified"
922 " in COMMON declaration");
923 else
924 define_common (value, seg_alloc(), size,
925 special, ofmt, report_error);
926 } else
927 report_error (ERR_NONFATAL, "no size specified in"
928 " COMMON declaration");
929 } else if (pass0 == 2) { /* pass == 2 */
930 q = value;
931 while (*q && *q != ':') {
932 if (isspace(*q))
933 *q = '\0';
934 q++;
936 if (*q == ':') {
937 *q++ = '\0';
938 ofmt->symdef(value, 0L, 0L, 3, q);
941 break;
942 case 6: /* [ABSOLUTE address] */
943 stdscan_reset();
944 stdscan_bufptr = value;
945 tokval.t_type = TOKEN_INVALID;
946 e = evaluate(stdscan, NULL, &tokval, NULL, pass2, report_error,
947 NULL);
948 if (e) {
949 if (!is_reloc(e))
950 report_error (pass0==1 ? ERR_NONFATAL : ERR_PANIC,
951 "cannot use non-relocatable expression as "
952 "ABSOLUTE address");
953 else {
954 /* abs_seg = reloc_seg(e); */
955 abs_offset = reloc_value(e);
957 } else
958 if (pass==1) abs_offset = 0x100;/* don't go near zero in case of / */
959 else report_error (ERR_PANIC, "invalid ABSOLUTE address "
960 "in pass two");
961 in_abs_seg = TRUE;
962 location.segment = NO_SEG;
963 break;
964 case 7: /* DEBUG */
/* NOTE(review): the copy into debugid[80] below has no length check - a long identifier overruns it. */
965 p = value;
966 q = debugid;
967 validid = TRUE;
968 if (!isidstart(*p))
969 validid = FALSE;
970 while (*p && !isspace(*p)) {
971 if (!isidchar(*p))
972 validid = FALSE;
973 *q++ = *p++;
975 *q++ = 0;
976 if (!validid) {
977 report_error (pass==1 ? ERR_NONFATAL : ERR_PANIC,
978 "identifier expected after DEBUG");
979 break;
981 while (*p && isspace(*p)) p++;
982 if (pass==pass_max) ofmt->current_dfmt->debug_directive (debugid, p);
983 break;
984 case 8: /* [WARNING {+|-}warn-name] */
985 if (pass1 == 1) {
986 while (*value && isspace(*value))
987 value++;
/* validid is reused here as the new `suppressed' value: TRUE for `-'. */
989 if (*value == '+' || *value == '-') {
990 validid = (*value == '-') ? TRUE : FALSE;
991 value++;
992 } else
993 validid = FALSE;
995 for (i=1; i<=ERR_WARN_MAX; i++)
996 if (!nasm_stricmp(value, suppressed_names[i]))
997 break;
998 if (i <= ERR_WARN_MAX)
999 suppressed[i] = validid;
1000 else
1001 report_error (ERR_NONFATAL, "invalid warning id in WARNING directive");
1003 break;
1004 case 9: /* cpu */
1005 cpu = get_cpu (value);
1006 break;
1007 case 10: /* fbk 9/2/00 */ /* [LIST {+|-}] */
1008 while (*value && isspace(*value))
1009 value++;
1011 if (*value == '+') {
1012 user_nolist = 0;
1014 else {
1015 if (*value == '-') {
1016 user_nolist = 1;
1018 else {
1019 report_error (ERR_NONFATAL, "invalid parameter to \"list\" directive");
1022 break;
/* Directives getkw() does not know are offered to the output format. */
1023 default:
1024 if (!ofmt->directive (line+1, value, pass2))
1025 report_error (pass1==1 ? ERR_NONFATAL : ERR_PANIC,
1026 "unrecognised directive [%s]",
1027 line+1);
1030 else /* it isn't a directive */
1032 parse_line (pass1, line, &output_ins,
1033 report_error, evaluate,
1034 def_label);
/* Non-optimizing pass 2: re-apply the forward-reference flags recorded in pass 1. */
1036 if (!(optimizing>0) && pass == 2) {
1037 if (forwref != NULL && globallineno == forwref->lineno) {
1038 output_ins.forw_ref = TRUE;
1039 do {
1040 output_ins.oprs[forwref->operand].opflags |= OPFLAG_FORWARD;
1041 forwref = saa_rstruct (forwrefs);
1042 } while (forwref != NULL && forwref->lineno == globallineno);
1043 } else
1044 output_ins.forw_ref = FALSE;
1048 if (!(optimizing>0) && output_ins.forw_ref)
/* Pass 1 records which operands of this line are forward references. */
1050 if (pass == 1) {
1051 for(i = 0; i < output_ins.operands; i++)
1053 if (output_ins.oprs[i].opflags & OPFLAG_FORWARD)
1055 struct forwrefinfo *fwinf =
1056 (struct forwrefinfo *)saa_wstruct(forwrefs);
1057 fwinf->lineno = globallineno;
1058 fwinf->operand = i;
1061 } else { /* pass == 2 */
1063 * Hack to prevent phase error in the code
1064 * rol ax,x
1065 * x equ 1
1067 * If the second operand is a forward reference,
1068 * the UNITY property of the number 1 in that
1069 * operand is cancelled. Otherwise the above
1070 * sequence will cause a phase error.
1072 * This hack means that the above code will
1073 * generate 286+ code.
1075 * The forward reference will mean that the
1076 * operand will not have the UNITY property on
1077 * the first pass, so the pass behaviours will
1078 * be consistent.
1081 if (output_ins.operands >= 2 &&
1082 (output_ins.oprs[1].opflags & OPFLAG_FORWARD))
1084 output_ins.oprs[1].type &= ~(ONENESS|BYTENESS);
1087 } /* pass == 2 */
1089 } /* forw_ref */
1092 if (output_ins.opcode == I_EQU) {
1093 if (pass1 == 1)
1096 * Special `..' EQUs get processed in pass two,
1097 * except `..@' macro-processor EQUs which are done
1098 * in the normal place.
1100 if (!output_ins.label)
1101 report_error (ERR_NONFATAL,
1102 "EQU not preceded by label");
1104 else if (output_ins.label[0] != '.' ||
1105 output_ins.label[1] != '.' ||
1106 output_ins.label[2] == '@')
1108 if (output_ins.operands == 1 &&
1109 (output_ins.oprs[0].type & IMMEDIATE) &&
1110 output_ins.oprs[0].wrt == NO_SEG)
1112 int isext = output_ins.oprs[0].opflags & OPFLAG_EXTERN;
1113 def_label (output_ins.label,
1114 output_ins.oprs[0].segment,
1115 output_ins.oprs[0].offset,
1116 NULL, FALSE, isext, ofmt, report_error);
1118 else if (output_ins.operands == 2 &&
1119 (output_ins.oprs[0].type & IMMEDIATE) &&
1120 (output_ins.oprs[0].type & COLON) &&
1121 output_ins.oprs[0].segment == NO_SEG &&
1122 output_ins.oprs[0].wrt == NO_SEG &&
1123 (output_ins.oprs[1].type & IMMEDIATE) &&
1124 output_ins.oprs[1].segment == NO_SEG &&
1125 output_ins.oprs[1].wrt == NO_SEG)
1127 def_label (output_ins.label,
1128 output_ins.oprs[0].offset | SEG_ABS,
1129 output_ins.oprs[1].offset,
1130 NULL, FALSE, FALSE, ofmt, report_error);
1132 else
1133 report_error(ERR_NONFATAL, "bad syntax for EQU");
1135 } else { /* pass == 2 */
1137 * Special `..' EQUs get processed here, except
1138 * `..@' macro processor EQUs which are done above.
1140 if (output_ins.label[0] == '.' &&
1141 output_ins.label[1] == '.' &&
1142 output_ins.label[2] != '@')
1144 if (output_ins.operands == 1 &&
1145 (output_ins.oprs[0].type & IMMEDIATE)) {
1146 define_label (output_ins.label,
1147 output_ins.oprs[0].segment,
1148 output_ins.oprs[0].offset,
1149 NULL, FALSE, FALSE, ofmt, report_error);
1151 else if (output_ins.operands == 2 &&
1152 (output_ins.oprs[0].type & IMMEDIATE) &&
1153 (output_ins.oprs[0].type & COLON) &&
1154 output_ins.oprs[0].segment == NO_SEG &&
1155 (output_ins.oprs[1].type & IMMEDIATE) &&
1156 output_ins.oprs[1].segment == NO_SEG)
1158 define_label (output_ins.label,
1159 output_ins.oprs[0].offset | SEG_ABS,
1160 output_ins.oprs[1].offset,
1161 NULL, FALSE, FALSE, ofmt, report_error);
1163 else
1164 report_error(ERR_NONFATAL, "bad syntax for EQU");
1166 } /* pass == 2 */
1167 } else { /* instruction isn't an EQU */
/* While pass1 == 1 the instruction is only measured, not emitted. */
1169 if (pass1 == 1) {
1171 long l = insn_size (location.segment, offs, sb, cpu,
1172 &output_ins, report_error);
1174 /* if (using_debug_info) && output_ins.opcode != -1)*/
1175 if (using_debug_info) /* fbk 03/25/01 */
1178 /* this is done here so we can do debug type info */
1179 long typeinfo = TYS_ELEMENTS(output_ins.operands);
1180 switch (output_ins.opcode) {
1181 case I_RESB:
1182 typeinfo = TYS_ELEMENTS(output_ins.oprs[0].offset) | TY_BYTE;
1183 break;
1184 case I_RESW:
1185 typeinfo = TYS_ELEMENTS(output_ins.oprs[0].offset) | TY_WORD;
1186 break;
1187 case I_RESD:
1188 typeinfo = TYS_ELEMENTS(output_ins.oprs[0].offset) | TY_DWORD;
1189 break;
1190 case I_RESQ:
1191 typeinfo = TYS_ELEMENTS(output_ins.oprs[0].offset) | TY_QWORD;
1192 break;
1193 case I_REST:
1194 typeinfo = TYS_ELEMENTS(output_ins.oprs[0].offset) | TY_TBYTE;
1195 break;
1196 case I_DB:
1197 typeinfo |= TY_BYTE;
1198 break;
1199 case I_DW:
1200 typeinfo |= TY_WORD;
1201 break;
1202 case I_DD:
1203 if (output_ins.eops_float)
1204 typeinfo |= TY_FLOAT;
1205 else
1206 typeinfo |= TY_DWORD;
1207 break;
1208 case I_DQ:
1209 typeinfo |= TY_QWORD;
1210 break;
1211 case I_DT:
1212 typeinfo |= TY_TBYTE;
1213 break;
1214 default:
1215 typeinfo = TY_LABEL;
1219 ofmt->current_dfmt->debug_typevalue(typeinfo);
1222 if (l != -1) {
1223 offs += l;
1224 SET_CURR_OFFS (offs);
1227 * else l == -1 => invalid instruction, which will be
1228 * flagged as an error on pass 2
1231 } else { /* pass == 2 */
1232 offs += assemble (location.segment, offs, sb, cpu,
1233 &output_ins, ofmt, report_error, &nasmlist);
1234 SET_CURR_OFFS (offs);
1237 } /* not an EQU */
1238 cleanup_insn (&output_ins);
1240 nasm_free (line);
1241 location.offset = offs = GET_CURR_OFFS;
1242 } /* end while (line = preproc->getline... */
1244 if (pass1==2 && global_offset_changed)
1245 report_error(ERR_NONFATAL, "phase error detected at end of assembly.");
1247 if (pass1 == 1) preproc->cleanup(1);
/* Errors flagged before the final pass: drop the output file and exit. */
1249 if (pass1==1 && terminate_after_phase) {
1250 fclose(ofile);
1251 remove(outname);
1252 if (want_usage)
1253 usage();
1254 exit (1);
1256 pass_cnt++;
/* Once a pass after the first leaves every offset unchanged, pass0 advances; at pass0 == 2 the loop jumps to the final pass. */
1257 if (pass>1 && !global_offset_changed) {
1258 pass0++;
1259 if (pass0==2) pass = pass_max - 1;
1260 } else if (!(optimizing>0)) pass0++;
1262 } /* for (pass=1; pass<=2; pass++) */
1264 preproc->cleanup(0);
1265 nasmlist.cleanup();
1266 #if 1
1267 if (optimizing>0 && using_debug_info) /* -On and -g switches */
1268 fprintf(stdout,
1269 "info:: assembly required 1+%d+1 passes\n", pass_cnt-2);
1270 #endif
1271 } /* exit from assemble_file (...) */
/*
 * Recognise a bracketed directive line of the form `[name value]'.
 *
 * buf   - the source line; it is modified in place (terminators are
 *         written after the name, over the `]' and after the `]').
 * value - receives a pointer to the text between the directive name
 *         and the closing `]' (an empty string if there is none).
 *
 * Returns 0 if the line is not a directive: it does not start with
 * `[' after optional blanks, has no `]', or has anything other than
 * white space between the `]' and the end of line or a `;'.
 * Otherwise returns the directive code:
 *   1 segment/section   2 extern    3 bits     4 global   5 common
 *   6 absolute          7 debug     8 warning  9 cpu     10 list
 * or -1 for a directive name that is not in this list. `*value' is
 * only set when the result is nonzero.
 */
static int getkw (char *buf, char **value)
{
    static const struct {
        const char *name;
        int code;
    } keywords[] = {
        { "segment",  1 },
        { "section",  1 },
        { "extern",   2 },
        { "bits",     3 },
        { "global",   4 },
        { "common",   5 },
        { "absolute", 6 },
        { "debug",    7 },
        { "warning",  8 },
        { "cpu",      9 },
        { "list",    10 }       /* fbk 9/2/00 */
    };
    char *p, *q;
    size_t k;

    /* allow leading spaces or tabs */
    while (*buf == ' ' || *buf == '\t')
        buf++;

    if (*buf != '[')
        return 0;

    /* Locate the closing bracket. */
    p = buf;
    while (*p && *p != ']')
        p++;
    if (!*p)
        return 0;

    q = p++;

    /* Only white space, optionally followed by a comment, may trail.
     * The cast keeps isspace() defined for negative char values. */
    while (*p && *p != ';') {
        if (!isspace((unsigned char)*p))
            return 0;
        p++;
    }
    q[1] = '\0';

    /* Split the directive name from its value. */
    p = buf + 1;
    while (*buf && *buf != ' ' && *buf != ']' && *buf != '\t')
        buf++;
    if (*buf == ']') {
        *buf = '\0';
        *value = buf;
    } else {
        *buf++ = '\0';
        while (isspace((unsigned char)*buf))
            buf++;              /* beppu - skip leading whitespace */
        *value = buf;
        while (*buf != ']')
            buf++;
        *buf++ = '\0';
    }

    for (k = 0; k < sizeof keywords / sizeof keywords[0]; k++)
        if (!nasm_stricmp(p, keywords[k].name))
            return keywords[k].code;

    return -1;
}
1341 static void report_error (int severity, const char *fmt, ...)
1343 va_list ap;
1346 * See if it's a suppressed warning.
1348 if ((severity & ERR_MASK) == ERR_WARNING &&
1349 (severity & ERR_WARN_MASK) != 0 &&
1350 suppressed[ (severity & ERR_WARN_MASK) >> ERR_WARN_SHR ])
1351 return; /* and bail out if so */
1354 * See if it's a pass-one only warning and we're not in pass one.
1356 if ((severity & ERR_PASS1) && pass0 == 2)
1357 return;
1359 if (severity & ERR_NOFILE)
1360 fputs ("nasm: ", error_file);
1361 else {
1362 char * currentfile = NULL;
1363 long lineno = 0;
1364 src_get (&lineno, &currentfile);
1365 fprintf (error_file, "%s:%ld: ", currentfile, lineno);
1366 nasm_free (currentfile);
1369 switch (severity & ERR_MASK) {
1370 case ERR_WARNING:
1371 fputs ("warning: ", error_file); break;
1372 case ERR_NONFATAL:
1373 fputs ("error: ", error_file); break;
1374 case ERR_FATAL:
1375 fputs ("fatal: ", error_file); break;
1376 case ERR_PANIC:
1377 fputs ("panic: ", error_file); break;
1378 case ERR_DEBUG:
1379 fputs("debug: ", error_file); break;
1382 va_start (ap, fmt);
1383 vfprintf (error_file, fmt, ap);
1384 fputc ('\n', error_file);
1386 if (severity & ERR_USAGE)
1387 want_usage = TRUE;
1389 switch (severity & ERR_MASK) {
1390 case ERR_WARNING: case ERR_DEBUG:
1391 /* no further action, by definition */
1392 break;
1393 case ERR_NONFATAL:
1394 /* terminate_after_phase = TRUE; *//**//* hack enables listing(!) on errors */
1395 terminate_after_phase = TRUE;
1396 break;
1397 case ERR_FATAL:
1398 if (ofile) {
1399 fclose(ofile);
1400 remove(outname);
1402 if (want_usage)
1403 usage();
1404 exit(1); /* instantly die */
1405 break; /* placate silly compilers */
1406 case ERR_PANIC:
1407 fflush(NULL);
1408 /* abort(); */ /* halt, catch fire, and dump core */
1409 exit(3);
1410 break;
1414 static void usage(void)
1416 fputs("type `nasm -h' for help\n", error_file);
1419 static void register_output_formats(void)
1421 ofmt = ofmt_register (report_error);
1424 #define BUF_DELTA 512
1426 static FILE *no_pp_fp;
1427 static efunc no_pp_err;
1428 static ListGen *no_pp_list;
1429 static long no_pp_lineinc;
1431 static void no_pp_reset (char *file, int pass, efunc error, evalfunc eval,
1432 ListGen *listgen)
1434 src_set_fname(nasm_strdup(file));
1435 src_set_linnum(0);
1436 no_pp_lineinc = 1;
1437 no_pp_err = error;
1438 no_pp_fp = fopen(file, "r");
1439 if (!no_pp_fp)
1440 no_pp_err (ERR_FATAL | ERR_NOFILE,
1441 "unable to open input file `%s'", file);
1442 no_pp_list = listgen;
1443 (void) pass; /* placate compilers */
1444 (void) eval; /* placate compilers */
1447 static char *no_pp_getline (void)
1449 char *buffer, *p, *q;
1450 int bufsize;
1452 bufsize = BUF_DELTA;
1453 buffer = nasm_malloc(BUF_DELTA);
1454 src_set_linnum(src_get_linnum() + no_pp_lineinc);
1456 while (1) { /* Loop to handle %line */
1458 p = buffer;
1459 while (1) { /* Loop to handle long lines */
1460 q = fgets(p, bufsize-(p-buffer), no_pp_fp);
1461 if (!q)
1462 break;
1463 p += strlen(p);
1464 if (p > buffer && p[-1] == '\n')
1465 break;
1466 if (p-buffer > bufsize-10) {
1467 int offset;
1468 offset = p - buffer;
1469 bufsize += BUF_DELTA;
1470 buffer = nasm_realloc(buffer, bufsize);
1471 p = buffer + offset;
1475 if (!q && p == buffer) {
1476 nasm_free (buffer);
1477 return NULL;
1481 * Play safe: remove CRs, LFs and any spurious ^Zs, if any of
1482 * them are present at the end of the line.
1484 buffer[strcspn(buffer, "\r\n\032")] = '\0';
1486 if (!strncmp(buffer, "%line", 5)) {
1487 long ln;
1488 int li;
1489 char *nm = nasm_malloc(strlen(buffer));
1490 if (sscanf(buffer+5, "%ld+%d %s", &ln, &li, nm) == 3) {
1491 nasm_free( src_set_fname(nm) );
1492 src_set_linnum(ln);
1493 no_pp_lineinc = li;
1494 continue;
1496 nasm_free(nm);
1498 break;
1501 no_pp_list->line (LIST_READ, buffer);
1503 return buffer;
1506 static void no_pp_cleanup (int pass)
1508 fclose(no_pp_fp);
1511 static unsigned long get_cpu (char *value)
1514 if (!strcmp(value, "8086")) return IF_8086;
1515 if (!strcmp(value, "186")) return IF_186;
1516 if (!strcmp(value, "286")) return IF_286;
1517 if (!strcmp(value, "386")) return IF_386;
1518 if (!strcmp(value, "486")) return IF_486;
1519 if (!strcmp(value, "586") ||
1520 !nasm_stricmp(value, "pentium") ) return IF_PENT;
1521 if (!strcmp(value, "686") ||
1522 !nasm_stricmp(value, "ppro") ||
1523 !nasm_stricmp(value, "p2") ) return IF_P6;
1524 if (!nasm_stricmp(value, "p3") ||
1525 !nasm_stricmp(value, "katmai") ) return IF_KATMAI;
1526 if (!nasm_stricmp(value, "p4") || /* is this right? -- jrc */
1527 !nasm_stricmp(value, "willamette") ) return IF_WILLAMETTE;
1529 report_error (pass0<2 ? ERR_NONFATAL : ERR_FATAL, "unknown 'cpu' type");
1531 return IF_PLEVEL; /* the maximum level */
1535 static int get_bits (char *value)
1537 int i;
1539 if ((i = atoi(value)) == 16) return i; /* set for a 16-bit segment */
1540 else if (i == 32) {
1541 if (cpu < IF_386) {
1542 report_error(ERR_NONFATAL,
1543 "cannot specify 32-bit segment on processor below a 386");
1544 i = 16;
1546 } else {
1547 report_error(pass0<2 ? ERR_NONFATAL : ERR_FATAL,
1548 "`%s' is not a valid segment size; must be 16 or 32",
1549 value);
1550 i = 16;
1552 return i;
1555 /* end of nasm.c */