NASM 0.98.18
[nasm/avx512.git] / nasm.c
blob5479a73969d317aef117685a18daa486f919ea22
1 /* The Netwide Assembler main program module
3 * The Netwide Assembler is copyright (C) 1996 Simon Tatham and
4 * Julian Hall. All rights reserved. The software is
5 * redistributable under the licence given in the file "Licence"
6 * distributed in the NASM archive.
7 */
9 #include <stdio.h>
10 #include <stdarg.h>
11 #include <stdlib.h>
12 #include <string.h>
13 #include <ctype.h>
15 #include "nasm.h"
16 #include "nasmlib.h"
17 #include "insns.h"
18 #include "preproc.h"
19 #include "parser.h"
20 #include "eval.h"
21 #include "assemble.h"
22 #include "labels.h"
23 #include "outform.h"
24 #include "listing.h"
/*
 * One record per forward reference noted during the first pass.
 */
struct forwrefinfo {
    int lineno;			/* global line number of the referencing line */
    int operand;		/* index of the operand that refers forward */
};
31 static int get_bits (char *value);
32 static unsigned long get_cpu (char *cpu_str);
33 static void report_error (int, char *, ...);
34 static void parse_cmdline (int, char **);
35 static void assemble_file (char *);
36 static int getkw (char *buf, char **value);
37 static void register_output_formats(void);
38 static void usage(void);
40 static int using_debug_info;
41 int tasm_compatible_mode = FALSE;
42 int pass0;
44 static char inname[FILENAME_MAX];
45 static char outname[FILENAME_MAX];
46 static char listname[FILENAME_MAX];
47 static int globallineno; /* for forward-reference tracking */
48 /* static int pass = 0; */
49 static struct ofmt *ofmt = NULL;
51 static FILE *error_file; /* Where to write error messages */
53 static FILE *ofile = NULL;
54 int optimizing = -1; /* number of optimization passes to take */
55 static int sb, cmd_sb = 16; /* by default */
56 static unsigned long cmd_cpu = IF_PLEVEL; /* highest level by default */
57 static unsigned long cpu = IF_PLEVEL; /* passed to insn_size & assemble.c */
58 int global_offset_changed; /* referenced in labels.c */
60 static loc_t location;
61 int in_abs_seg; /* Flag we are in ABSOLUTE seg */
62 static long abs_seg;
64 static struct RAA *offsets;
65 static long abs_offset;
67 static struct SAA *forwrefs; /* keep track of forward references */
68 static struct forwrefinfo *forwref;
70 static Preproc *preproc;
/* The overall job selected on the command line; dispatched on in main(). */
enum op_type {
    op_normal,			/* Preprocess and assemble */
    op_preprocess,		/* Preprocess only */
    op_depend			/* Generate dependencies */
};
static enum op_type operating_mode;
79 * Which of the suppressible warnings are suppressed. Entry zero
80 * doesn't do anything. Initial defaults are given here.
82 static char suppressed[1+ERR_WARN_MAX] = {
83 0, TRUE, TRUE, TRUE, FALSE
87 * The option names for the suppressible warnings. As before, entry
88 * zero does nothing.
90 static char *suppressed_names[1+ERR_WARN_MAX] = {
91 NULL, "macro-params", "macro-selfref", "orphan-labels", "number-overflow",
95 * The explanations for the suppressible warnings. As before, entry
96 * zero does nothing.
98 static char *suppressed_what[1+ERR_WARN_MAX] = {
99 NULL,
100 "macro calls with wrong no. of params",
101 "cyclic macro self-references",
102 "labels alone on lines without trailing `:'",
103 "numeric constants greater than 0xFFFFFFFF"
107 * This is a null preprocessor which just copies lines from input
108 * to output. It's used when someone explicitly requests that NASM
109 * not preprocess their source file.
112 static void no_pp_reset (char *, int, efunc, evalfunc, ListGen *);
113 static char *no_pp_getline (void);
114 static void no_pp_cleanup (int);
115 static Preproc no_pp = {
116 no_pp_reset,
117 no_pp_getline,
118 no_pp_cleanup
/*
 * get/set current offset...
 *
 * While in_abs_seg is set the offset lives in abs_offset; otherwise it
 * is kept per segment in the `offsets' RAA, keyed by location.segment.
 */
#define GET_CURR_OFFS \
    (in_abs_seg ? abs_offset : raa_read(offsets, location.segment))
#define SET_CURR_OFFS(x) \
    (in_abs_seg ? (void)(abs_offset = (x)) \
		: (void)(offsets = raa_write(offsets, location.segment, (x))))
129 static int want_usage;
130 static int terminate_after_phase;
131 int user_nolist = 0; /* fbk 9/2/00 */
/*
 * Write `line' followed by a newline to `ofile', or to standard output
 * when `ofile' is NULL.
 */
static void nasm_fputs(char *line, FILE *ofile)
{
    FILE *dest = ofile ? ofile : stdout;

    fputs(line, dest);
    fputc('\n', dest);
}
142 int main(int argc, char **argv)
144 pass0 = 1;
145 want_usage = terminate_after_phase = FALSE;
147 nasm_set_malloc_error (report_error);
148 offsets = raa_init();
149 forwrefs = saa_init ((long)sizeof(struct forwrefinfo));
151 preproc = &nasmpp;
152 operating_mode = op_normal;
154 error_file = stderr;
156 seg_init();
158 register_output_formats();
160 parse_cmdline(argc, argv);
162 if (terminate_after_phase)
164 if (want_usage)
165 usage();
166 return 1;
169 if (ofmt->stdmac)
170 pp_extra_stdmac (ofmt->stdmac);
171 parser_global_info (ofmt, &location);
172 eval_global_info (ofmt, lookup_label, &location);
174 /* define some macros dependent of command-line */
176 char temp [64];
177 sprintf (temp, "__OUTPUT_FORMAT__=%s\n", ofmt->shortname);
178 pp_pre_define (temp);
181 switch ( operating_mode ) {
182 case op_depend:
184 char *line;
185 preproc->reset (inname, 0, report_error, evaluate, &nasmlist);
186 if (outname[0] == '\0')
187 ofmt->filename (inname, outname, report_error);
188 ofile = NULL;
189 fprintf(stdout, "%s: %s", outname, inname);
190 while ( (line = preproc->getline()) )
191 nasm_free (line);
192 preproc->cleanup(0);
193 putc('\n', stdout);
195 break;
197 case op_preprocess:
199 char *line;
200 char *file_name = NULL;
201 long prior_linnum=0;
202 int lineinc=0;
204 if (*outname) {
205 ofile = fopen(outname, "w");
206 if (!ofile)
207 report_error (ERR_FATAL | ERR_NOFILE,
208 "unable to open output file `%s'", outname);
209 } else
210 ofile = NULL;
212 location.known = FALSE;
214 /* pass = 1; */
215 preproc->reset (inname, 2, report_error, evaluate, &nasmlist);
216 while ( (line = preproc->getline()) ) {
218 * We generate %line directives if needed for later programs
220 long linnum = prior_linnum += lineinc;
221 int altline = src_get(&linnum, &file_name);
222 if (altline) {
223 if (altline==1 && lineinc==1)
224 nasm_fputs("", ofile);
225 else {
226 lineinc = (altline != -1 || lineinc!=1);
227 fprintf(ofile ? ofile : stdout, "%%line %ld+%d %s\n",
228 linnum, lineinc, file_name);
230 prior_linnum = linnum;
232 nasm_fputs(line, ofile);
233 nasm_free (line);
235 nasm_free(file_name);
236 preproc->cleanup(0);
237 if (ofile)
238 fclose(ofile);
239 if (ofile && terminate_after_phase)
240 remove(outname);
242 break;
244 case op_normal:
247 * We must call ofmt->filename _anyway_, even if the user
248 * has specified their own output file, because some
249 * formats (eg OBJ and COFF) use ofmt->filename to find out
250 * the name of the input file and then put that inside the
251 * file.
253 ofmt->filename (inname, outname, report_error);
255 ofile = fopen(outname, "wb");
256 if (!ofile) {
257 report_error (ERR_FATAL | ERR_NOFILE,
258 "unable to open output file `%s'", outname);
262 * We must call init_labels() before ofmt->init() since
263 * some object formats will want to define labels in their
264 * init routines. (eg OS/2 defines the FLAT group)
266 init_labels ();
268 ofmt->init (ofile, report_error, define_label, evaluate);
270 assemble_file (inname);
272 if (!terminate_after_phase) {
273 ofmt->cleanup (using_debug_info);
274 cleanup_labels ();
275 } else {
277 * We had an fclose on the output file here, but we
278 * actually do that in all the object file drivers as well,
279 * so we're leaving out the one here.
280 * fclose (ofile);
282 remove(outname);
283 if (listname[0])
284 remove(listname);
287 break;
290 if (want_usage)
291 usage();
293 raa_free (offsets);
294 saa_free (forwrefs);
295 eval_cleanup ();
296 nasmlib_cleanup ();
298 if (terminate_after_phase)
299 return 1;
300 else
301 return 0;
306 * Get a parameter for a command line option.
307 * First arg must be in the form of e.g. -f...
309 static char *get_param (char *p, char *q, int *advance)
311 *advance = 0;
312 if (p[2]) /* the parameter's in the option */
314 p += 2;
315 while (isspace(*p))
316 p++;
317 return p;
319 if (q && q[0])
321 *advance = 1;
322 return q;
324 report_error (ERR_NONFATAL | ERR_NOFILE | ERR_USAGE,
325 "option `-%c' requires an argument",
326 p[1]);
327 return NULL;
/* One long ("--name") option: its spelling and the code it maps to. */
struct textargs
{
    char *label;
    int value;
};

#define OPT_PREFIX 0
#define OPT_POSTFIX 1

/* Table of long options, terminated by a NULL label. */
struct textargs textopts[] =
{
    { "prefix",  OPT_PREFIX  },
    { "postfix", OPT_POSTFIX },
    { NULL,      0           }
};

/* Set once a bare "--" has been seen; later words are not options. */
int stopoptions = 0;
347 static int process_arg (char *p, char *q)
349 char *param;
350 int i, advance = 0;
352 if (!p || !p[0])
353 return 0;
355 if (p[0]=='-' && ! stopoptions)
357 switch (p[1]) {
358 case 's':
359 error_file = stdout;
360 break;
361 case 'o': /* these parameters take values */
362 case 'O':
363 case 'f':
364 case 'p':
365 case 'P':
366 case 'd':
367 case 'D':
368 case 'i':
369 case 'I':
370 case 'l':
371 case 'E':
372 case 'F':
373 if ( !(param = get_param (p, q, &advance)) )
374 break;
375 if (p[1]=='o') { /* output file */
376 strcpy (outname, param);
377 } else if (p[1]=='f') { /* output format */
378 ofmt = ofmt_find(param);
379 if (!ofmt) {
380 report_error (ERR_FATAL | ERR_NOFILE | ERR_USAGE,
381 "unrecognised output format `%s' - "
382 "use -hf for a list",
383 param);
385 else
386 ofmt->current_dfmt = ofmt->debug_formats[0];
387 } else if (p[1]=='O') { /* Optimization level */
388 int opt;
389 if (!isdigit(*param)) report_error(ERR_FATAL,
390 "command line optimization level must be 0..3 or <nn>");
391 opt = atoi(param);
392 if (opt<=0) optimizing = -1; /* 0.98 behaviour */
393 else if (opt==1) optimizing = 0; /* Two passes, 0.98.09 behavior */
394 else if (opt<=3) optimizing = opt*5; /* Multiple passes */
395 else optimizing = opt; /* Multiple passes */
396 } else if (p[1]=='P' || p[1]=='p') { /* pre-include */
397 pp_pre_include (param);
398 } else if (p[1]=='D' || p[1]=='d') { /* pre-define */
399 pp_pre_define (param);
400 } else if (p[1]=='U' || p[1]=='u') { /* un-define */
401 pp_pre_undefine (param);
402 } else if (p[1]=='I' || p[1]=='i') { /* include search path */
403 pp_include_path (param);
404 } else if (p[1]=='l') { /* listing file */
405 strcpy (listname, param);
406 } else if (p[1]=='E') { /* error messages file */
407 error_file = fopen(param, "w");
408 if ( !error_file ) {
409 error_file = stderr; /* Revert to default! */
410 report_error (ERR_FATAL | ERR_NOFILE | ERR_USAGE,
411 "cannot open file `%s' for error messages",
412 param);
414 } else if (p[1] == 'F') { /* specify debug format */
415 ofmt->current_dfmt = dfmt_find(ofmt, param);
416 if (!ofmt->current_dfmt) {
417 report_error (ERR_FATAL | ERR_NOFILE | ERR_USAGE,
418 "unrecognized debug format `%s' for"
419 " output format `%s'",
420 param, ofmt->shortname);
423 break;
424 case 'g':
425 using_debug_info = TRUE;
426 break;
427 case 'h':
428 printf("usage: nasm [-@ response file] [-o outfile] [-f format] "
429 "[-l listfile]\n"
430 " [options...] [--] filename\n"
431 " or nasm -r for version info (obsolete)\n"
432 " or nasm -v for version info (preferred)\n\n"
433 " -t Assemble in SciTech TASM compatible mode\n"
434 " -g Generate debug information in selected format.\n");
435 printf(" -e preprocess only (writes output to stdout by default)\n"
436 " -a don't preprocess (assemble only)\n"
437 " -M generate Makefile dependencies on stdout\n\n"
438 " -E<file> redirect error messages to file\n"
439 " -s redirect error messages to stdout\n\n"
440 " -F format select a debugging format\n\n"
441 " -I<path> adds a pathname to the include file path\n");
442 printf(" -O<digit> optimize branch offsets (-O0 disables, default)\n"
443 " -P<file> pre-includes a file\n"
444 " -D<macro>[=<value>] pre-defines a macro\n"
445 " -U<macro> undefines a macro\n"
446 " -w+foo enables warnings about foo; -w-foo disables them\n"
447 "where foo can be:\n");
448 for (i=1; i<=ERR_WARN_MAX; i++)
449 printf(" %-16s%s (default %s)\n",
450 suppressed_names[i], suppressed_what[i],
451 suppressed[i] ? "off" : "on");
452 printf ("\nresponse files should contain command line parameters"
453 ", one per line.\n");
454 if (p[2] == 'f') {
455 printf("\nvalid output formats for -f are"
456 " (`*' denotes default):\n");
457 ofmt_list(ofmt, stdout);
459 else {
460 printf ("\nFor a list of valid output formats, use -hf.\n");
461 printf ("For a list of debug formats, use -f <form> -y.\n");
463 exit (0); /* never need usage message here */
464 break;
465 case 'y':
466 printf("\nvalid debug formats for '%s' output format are"
467 " ('*' denotes default):\n",
468 ofmt->shortname);
469 dfmt_list(ofmt, stdout);
470 exit(0);
471 break;
472 case 't':
473 tasm_compatible_mode = TRUE;
474 break;
475 case 'r':
476 case 'v':
477 printf("NASM version %s compiled "
478 #ifdef DEBUG
479 "with -DDEBUG "
480 #endif
481 "on " __DATE__ "\n", NASM_VER);
482 exit (0); /* never need usage message here */
483 break;
484 case 'e': /* preprocess only */
485 operating_mode = op_preprocess;
486 break;
487 case 'a': /* assemble only - don't preprocess */
488 preproc = &no_pp;
489 break;
490 case 'w':
491 if (p[2] != '+' && p[2] != '-') {
492 report_error (ERR_NONFATAL | ERR_NOFILE | ERR_USAGE,
493 "invalid option to `-w'");
494 } else {
495 for (i=1; i<=ERR_WARN_MAX; i++)
496 if (!nasm_stricmp(p+3, suppressed_names[i]))
497 break;
498 if (i <= ERR_WARN_MAX)
499 suppressed[i] = (p[2] == '-');
500 else
501 report_error (ERR_NONFATAL | ERR_NOFILE | ERR_USAGE,
502 "invalid option to `-w'");
504 break;
505 case 'M':
506 operating_mode = op_depend;
507 break;
509 case '-':
511 int s;
513 if (p[2]==0) { /* -- => stop processing options */
514 stopoptions = 1;
515 break;
517 for(s=0; textopts[s].label; s++)
519 if(!nasm_stricmp(p+2, textopts[s].label))
521 break;
525 switch(s)
528 case OPT_PREFIX:
529 case OPT_POSTFIX:
531 if (!q)
533 report_error (ERR_NONFATAL | ERR_NOFILE | ERR_USAGE,
534 "option `--%s' requires an argument",
535 p+2);
536 break;
538 else
540 advance = 1, param = q;
543 if(s == OPT_PREFIX)
545 strncpy(lprefix,param,PREFIX_MAX-1);
546 lprefix[PREFIX_MAX-1]=0;
547 break;
549 if(s == OPT_POSTFIX)
551 strncpy(lpostfix,param,POSTFIX_MAX-1);
552 lpostfix[POSTFIX_MAX-1]=0;
553 break;
555 break;
557 default:
559 report_error (ERR_NONFATAL | ERR_NOFILE | ERR_USAGE,
560 "unrecognised option `--%s'",
561 p+2);
562 break;
565 break;
568 default:
569 if (!ofmt->setinfo(GI_SWITCH,&p))
570 report_error (ERR_NONFATAL | ERR_NOFILE | ERR_USAGE,
571 "unrecognised option `-%c'",
572 p[1]);
573 break;
576 else
578 if (*inname) {
579 report_error (ERR_NONFATAL | ERR_NOFILE | ERR_USAGE,
580 "more than one input file specified");
581 } else
582 strcpy(inname, p);
585 return advance;
#define ARG_BUF_DELTA 128

/*
 * Process a "-@" response file, which holds one command-line word per
 * line. Each line is handed to process_arg() together with the line
 * after it, so that an option and its argument may sit on consecutive
 * lines. Both working buffers grow as needed and are freed on return.
 */
static void process_respfile (FILE *rfile)
{
    char *buffer, *p, *q, *prevarg;
    int bufsize, prevargsize;

    bufsize = prevargsize = ARG_BUF_DELTA;
    buffer = nasm_malloc(ARG_BUF_DELTA);
    prevarg = nasm_malloc(ARG_BUF_DELTA);
    prevarg[0] = '\0';

    while (1) {			/* Loop to handle all lines in file */

	p = buffer;
	while (1) {		/* Loop to handle long lines */
	    q = fgets(p, bufsize-(p-buffer), rfile);
	    if (!q)
		break;
	    p += strlen(p);
	    if (p > buffer && p[-1] == '\n')
		break;
	    if (p-buffer > bufsize-10) {
		int offset;
		offset = p - buffer;
		bufsize += ARG_BUF_DELTA;
		buffer = nasm_realloc(buffer, bufsize);
		p = buffer + offset;
	    }
	}

	if (!q && p == buffer) {
	    /* end of file: flush the last pending word */
	    if (prevarg[0])
		process_arg (prevarg, NULL);
	    nasm_free (buffer);
	    nasm_free (prevarg);
	    return;
	}

	/*
	 * Play safe: remove CRs, LFs and any spurious ^Zs, if any of
	 * them are present at the end of the line.
	 */
	*(p = &buffer[strcspn(buffer, "\r\n\032")]) = '\0';

	while (p > buffer && isspace((unsigned char)p[-1]))
	    *--p = '\0';

	p = buffer;
	while (isspace((unsigned char)*p))
	    p++;

	/* if this line was consumed as prevarg's argument, drop it */
	if (process_arg (prevarg, p))
	    *p = '\0';

	/*
	 * Grow prevarg until the whole line fits. A single fixed-size
	 * step is not enough when the line is much longer than the
	 * current buffer.
	 */
	{
	    size_t need = strlen(p) + 10;
	    if (need > (size_t)prevargsize) {
		while (need > (size_t)prevargsize)
		    prevargsize += ARG_BUF_DELTA;
		prevarg = nasm_realloc(prevarg, prevargsize);
	    }
	}
	strcpy (prevarg, p);
    }
}
/*
 * Split a single string into arguments and feed them to process_arg(),
 * instead of walking an argv array. Used for the NASM environment
 * variable and for "@file" response files.
 *
 * Words are separated by spaces, unless the string starts with a
 * character other than '-', in which case that character is the
 * separator. The string is modified in place.
 */
static void process_args (char *args)
{
    char delim = ' ';
    char *cursor = args;
    char *pending = NULL;	/* last word not yet used as an argument */

    if (*cursor != '\0' && *cursor != '-')
	delim = *cursor++;

    while (*cursor != '\0') {
	char *word = cursor;
	char *previous = pending;

	while (*cursor != '\0' && *cursor != delim)
	    cursor++;
	while (*cursor == delim)
	    *cursor++ = '\0';

	/* a nonzero result means `word' was consumed by `previous' */
	pending = process_arg (previous, word) ? NULL : word;
    }

    if (pending != NULL)
	process_arg (pending, NULL);
}
676 static void parse_cmdline(int argc, char **argv)
678 FILE *rfile;
679 char *envreal, *envcopy=NULL, *p, *arg;
681 *inname = *outname = *listname = '\0';
684 * First, process the NASM environment variable.
686 envreal = getenv("NASM");
687 arg = NULL;
688 if (envreal) {
689 envcopy = nasm_strdup(envreal);
690 process_args(envcopy);
691 nasm_free (envcopy);
695 * Now process the actual command line.
697 while (--argc)
699 int i;
700 argv++;
701 if (argv[0][0] == '@') {
702 /* We have a response file, so process this as a set of
703 * arguments like the environment variable. This allows us
704 * to have multiple arguments on a single line, which is
705 * different to the -@resp file processing below for regular
706 * NASM.
708 char *str = malloc(2048);
709 FILE *f = fopen(&argv[0][1],"r");
710 if (!str) {
711 printf("out of memory");
712 exit(-1);
714 if (f) {
715 while (fgets(str,2048,f)) {
716 process_args(str);
718 fclose(f);
720 free(str);
721 argc--;
722 argv++;
724 if (!stopoptions && argv[0][0] == '-' && argv[0][1] == '@') {
725 if ((p = get_param (argv[0], argc > 1 ? argv[1] : NULL, &i))) {
726 if ((rfile = fopen(p, "r"))) {
727 process_respfile (rfile);
728 fclose(rfile);
729 } else
730 report_error (ERR_NONFATAL | ERR_NOFILE | ERR_USAGE,
731 "unable to open response file `%s'", p);
733 } else
734 i = process_arg (argv[0], argc > 1 ? argv[1] : NULL);
735 argv += i, argc -= i;
738 if (!*inname)
739 report_error (ERR_NONFATAL | ERR_NOFILE | ERR_USAGE,
740 "no input file specified");
744 static void assemble_file (char *fname)
746 char * value, * p, * q, * special, * line, debugid[80];
747 insn output_ins;
748 int i, rn_error, validid;
749 long seg, offs;
750 struct tokenval tokval;
751 expr * e;
752 int pass, pass_max;
753 int pass_cnt = 0; /* count actual passes */
755 if (cmd_sb == 32 && cmd_cpu < IF_386)
756 report_error(ERR_FATAL, "command line: "
757 "32-bit segment size requires a higher cpu");
759 pass_max = (optimizing>0 ? optimizing : 0) + 2; /* passes 1, optimizing, then 2 */
760 pass0 = !(optimizing>0); /* start at 1 if not optimizing */
761 for (pass = 1; pass <= pass_max && pass0 <= 2; pass++) {
762 int pass1, pass2;
763 ldfunc def_label;
765 pass1 = pass < pass_max ? 1 : 2; /* seq is 1, 1, 1,..., 1, 2 */
766 pass2 = pass > 1 ? 2 : 1; /* seq is 1, 2, 2,..., 2, 2 */
767 /* pass0 seq is 0, 0, 0,..., 1, 2 */
769 def_label = pass > 1 ? redefine_label : define_label;
772 sb = cmd_sb; /* set 'bits' to command line default */
773 cpu = cmd_cpu;
774 if (pass0 == 2) {
775 if (*listname)
776 nasmlist.init(listname, report_error);
778 in_abs_seg = FALSE;
779 global_offset_changed = FALSE; /* set by redefine_label */
780 location.segment = ofmt->section(NULL, pass2, &sb);
781 if (pass > 1) {
782 saa_rewind (forwrefs);
783 forwref = saa_rstruct (forwrefs);
784 raa_free (offsets);
785 offsets = raa_init();
787 preproc->reset(fname, pass1, report_error, evaluate, &nasmlist);
788 globallineno = 0;
789 if (pass == 1) location.known = TRUE;
790 location.offset = offs = GET_CURR_OFFS;
792 while ( (line = preproc->getline()) )
794 globallineno++;
796 /* here we parse our directives; this is not handled by the 'real'
797 * parser. */
798 if ( (i = getkw (line, &value)) )
800 switch (i) {
801 case 1: /* [SEGMENT n] */
802 seg = ofmt->section (value, pass2, &sb);
803 if (seg == NO_SEG) {
804 report_error (pass1==1 ? ERR_NONFATAL : ERR_PANIC,
805 "segment name `%s' not recognised",
806 value);
807 } else {
808 in_abs_seg = FALSE;
809 location.segment = seg;
811 break;
812 case 2: /* [EXTERN label:special] */
813 if (*value == '$') value++; /* skip initial $ if present */
814 if (pass0 == 2) {
815 q = value;
816 while (*q && *q != ':')
817 q++;
818 if (*q == ':') {
819 *q++ = '\0';
820 ofmt->symdef(value, 0L, 0L, 3, q);
822 } else if (pass0 == 1) { /* pass == 1 */
823 q = value;
824 validid = TRUE;
825 if (!isidstart(*q))
826 validid = FALSE;
827 while (*q && *q != ':') {
828 if (!isidchar(*q))
829 validid = FALSE;
830 q++;
832 if (!validid) {
833 report_error (ERR_NONFATAL,
834 "identifier expected after EXTERN");
835 break;
837 if (*q == ':') {
838 *q++ = '\0';
839 special = q;
840 } else
841 special = NULL;
842 if (!is_extern(value)) { /* allow re-EXTERN to be ignored */
843 declare_as_global (value, special, report_error);
844 define_label (value, seg_alloc(), 0L, NULL, FALSE, TRUE,
845 ofmt, report_error);
847 } /* else pass0 == 1 */
848 break;
849 case 3: /* [BITS bits] */
850 sb = get_bits(value);
851 break;
852 case 4: /* [GLOBAL symbol:special] */
853 if (*value == '$') value++; /* skip initial $ if present */
854 if (pass0 == 2) { /* pass 2 */
855 q = value;
856 while (*q && *q != ':')
857 q++;
858 if (*q == ':') {
859 *q++ = '\0';
860 ofmt->symdef(value, 0L, 0L, 3, q);
862 } else if (pass2 == 1) { /* pass == 1 */
863 q = value;
864 validid = TRUE;
865 if (!isidstart(*q))
866 validid = FALSE;
867 while (*q && *q != ':') {
868 if (!isidchar(*q))
869 validid = FALSE;
870 q++;
872 if (!validid) {
873 report_error (ERR_NONFATAL,
874 "identifier expected after GLOBAL");
875 break;
877 if (*q == ':') {
878 *q++ = '\0';
879 special = q;
880 } else
881 special = NULL;
882 declare_as_global (value, special, report_error);
883 } /* pass == 1 */
884 break;
885 case 5: /* [COMMON symbol size:special] */
886 if (*value == '$') value++; /* skip initial $ if present */
887 if (pass0 == 1) {
888 p = value;
889 validid = TRUE;
890 if (!isidstart(*p))
891 validid = FALSE;
892 while (*p && !isspace(*p)) {
893 if (!isidchar(*p))
894 validid = FALSE;
895 p++;
897 if (!validid) {
898 report_error (ERR_NONFATAL,
899 "identifier expected after COMMON");
900 break;
902 if (*p) {
903 long size;
905 while (*p && isspace(*p))
906 *p++ = '\0';
907 q = p;
908 while (*q && *q != ':')
909 q++;
910 if (*q == ':') {
911 *q++ = '\0';
912 special = q;
913 } else
914 special = NULL;
915 size = readnum (p, &rn_error);
916 if (rn_error)
917 report_error (ERR_NONFATAL, "invalid size specified"
918 " in COMMON declaration");
919 else
920 define_common (value, seg_alloc(), size,
921 special, ofmt, report_error);
922 } else
923 report_error (ERR_NONFATAL, "no size specified in"
924 " COMMON declaration");
925 } else if (pass0 == 2) { /* pass == 2 */
926 q = value;
927 while (*q && *q != ':') {
928 if (isspace(*q))
929 *q = '\0';
930 q++;
932 if (*q == ':') {
933 *q++ = '\0';
934 ofmt->symdef(value, 0L, 0L, 3, q);
937 break;
938 case 6: /* [ABSOLUTE address] */
939 stdscan_reset();
940 stdscan_bufptr = value;
941 tokval.t_type = TOKEN_INVALID;
942 e = evaluate(stdscan, NULL, &tokval, NULL, pass2, report_error,
943 NULL);
944 if (e) {
945 if (!is_reloc(e))
946 report_error (pass0==1 ? ERR_NONFATAL : ERR_PANIC,
947 "cannot use non-relocatable expression as "
948 "ABSOLUTE address");
949 else {
950 abs_seg = reloc_seg(e);
951 abs_offset = reloc_value(e);
953 } else
954 if (pass==1) abs_offset = 0x100;/* don't go near zero in case of / */
955 else report_error (ERR_PANIC, "invalid ABSOLUTE address "
956 "in pass two");
957 in_abs_seg = TRUE;
958 location.segment = abs_seg;
959 break;
960 case 7: /* DEBUG */
961 p = value;
962 q = debugid;
963 validid = TRUE;
964 if (!isidstart(*p))
965 validid = FALSE;
966 while (*p && !isspace(*p)) {
967 if (!isidchar(*p))
968 validid = FALSE;
969 *q++ = *p++;
971 *q++ = 0;
972 if (!validid) {
973 report_error (pass==1 ? ERR_NONFATAL : ERR_PANIC,
974 "identifier expected after DEBUG");
975 break;
977 while (*p && isspace(*p)) p++;
978 if (pass==pass_max) ofmt->current_dfmt->debug_directive (debugid, p);
979 break;
980 case 8: /* [WARNING {+|-}warn-name] */
981 if (pass1 == 1) {
982 while (*value && isspace(*value))
983 value++;
985 if (*value == '+' || *value == '-') {
986 validid = (*value == '-') ? TRUE : FALSE;
987 value++;
988 } else
989 validid = FALSE;
991 for (i=1; i<=ERR_WARN_MAX; i++)
992 if (!nasm_stricmp(value, suppressed_names[i]))
993 break;
994 if (i <= ERR_WARN_MAX)
995 suppressed[i] = validid;
996 else
997 report_error (ERR_NONFATAL, "invalid warning id in WARNING directive");
999 break;
1000 case 9: /* cpu */
1001 cpu = get_cpu (value);
1002 break;
1003 case 10: /* fbk 9/2/00 */ /* [LIST {+|-}] */
1004 while (*value && isspace(*value))
1005 value++;
1007 if (*value == '+') {
1008 user_nolist = 0;
1010 else {
1011 if (*value == '-') {
1012 user_nolist = 1;
1014 else {
1015 report_error (ERR_NONFATAL, "invalid parameter to \"list\" directive");
1018 break;
1019 default:
1020 if (!ofmt->directive (line+1, value, pass2))
1021 report_error (pass1==1 ? ERR_NONFATAL : ERR_PANIC,
1022 "unrecognised directive [%s]",
1023 line+1);
1026 else /* it isn't a directive */
1028 parse_line (pass1, line, &output_ins,
1029 report_error, evaluate,
1030 def_label);
1032 if (!(optimizing>0) && pass == 2) {
1033 if (forwref != NULL && globallineno == forwref->lineno) {
1034 output_ins.forw_ref = TRUE;
1035 do {
1036 output_ins.oprs[forwref->operand].opflags |= OPFLAG_FORWARD;
1037 forwref = saa_rstruct (forwrefs);
1038 } while (forwref != NULL && forwref->lineno == globallineno);
1039 } else
1040 output_ins.forw_ref = FALSE;
1044 if (!(optimizing>0) && output_ins.forw_ref)
1046 if (pass == 1) {
1047 for(i = 0; i < output_ins.operands; i++)
1049 if (output_ins.oprs[i].opflags & OPFLAG_FORWARD)
1051 struct forwrefinfo *fwinf =
1052 (struct forwrefinfo *)saa_wstruct(forwrefs);
1053 fwinf->lineno = globallineno;
1054 fwinf->operand = i;
1057 } else { /* pass == 2 */
1059 * Hack to prevent phase error in the code
1060 * rol ax,x
1061 * x equ 1
1063 * If the second operand is a forward reference,
1064 * the UNITY property of the number 1 in that
1065 * operand is cancelled. Otherwise the above
1066 * sequence will cause a phase error.
1068 * This hack means that the above code will
1069 * generate 286+ code.
1071 * The forward reference will mean that the
1072 * operand will not have the UNITY property on
1073 * the first pass, so the pass behaviours will
1074 * be consistent.
1077 if (output_ins.operands >= 2 &&
1078 (output_ins.oprs[1].opflags & OPFLAG_FORWARD))
1080 output_ins.oprs[1].type &= ~(ONENESS|BYTENESS);
1083 } /* pass == 2 */
1085 } /* forw_ref */
1088 if (output_ins.opcode == I_EQU) {
1089 if (pass1 == 1)
1092 * Special `..' EQUs get processed in pass two,
1093 * except `..@' macro-processor EQUs which are done
1094 * in the normal place.
1096 if (!output_ins.label)
1097 report_error (ERR_NONFATAL,
1098 "EQU not preceded by label");
1100 else if (output_ins.label[0] != '.' ||
1101 output_ins.label[1] != '.' ||
1102 output_ins.label[2] == '@')
1104 if (output_ins.operands == 1 &&
1105 (output_ins.oprs[0].type & IMMEDIATE) &&
1106 output_ins.oprs[0].wrt == NO_SEG)
1108 int isext = output_ins.oprs[0].opflags & OPFLAG_EXTERN;
1109 def_label (output_ins.label,
1110 output_ins.oprs[0].segment,
1111 output_ins.oprs[0].offset,
1112 NULL, FALSE, isext, ofmt, report_error);
1114 else if (output_ins.operands == 2 &&
1115 (output_ins.oprs[0].type & IMMEDIATE) &&
1116 (output_ins.oprs[0].type & COLON) &&
1117 output_ins.oprs[0].segment == NO_SEG &&
1118 output_ins.oprs[0].wrt == NO_SEG &&
1119 (output_ins.oprs[1].type & IMMEDIATE) &&
1120 output_ins.oprs[1].segment == NO_SEG &&
1121 output_ins.oprs[1].wrt == NO_SEG)
1123 def_label (output_ins.label,
1124 output_ins.oprs[0].offset | SEG_ABS,
1125 output_ins.oprs[1].offset,
1126 NULL, FALSE, FALSE, ofmt, report_error);
1128 else
1129 report_error(ERR_NONFATAL, "bad syntax for EQU");
1131 } else { /* pass == 2 */
1133 * Special `..' EQUs get processed here, except
1134 * `..@' macro processor EQUs which are done above.
1136 if (output_ins.label[0] == '.' &&
1137 output_ins.label[1] == '.' &&
1138 output_ins.label[2] != '@')
1140 if (output_ins.operands == 1 &&
1141 (output_ins.oprs[0].type & IMMEDIATE)) {
1142 define_label (output_ins.label,
1143 output_ins.oprs[0].segment,
1144 output_ins.oprs[0].offset,
1145 NULL, FALSE, FALSE, ofmt, report_error);
1147 else if (output_ins.operands == 2 &&
1148 (output_ins.oprs[0].type & IMMEDIATE) &&
1149 (output_ins.oprs[0].type & COLON) &&
1150 output_ins.oprs[0].segment == NO_SEG &&
1151 (output_ins.oprs[1].type & IMMEDIATE) &&
1152 output_ins.oprs[1].segment == NO_SEG)
1154 define_label (output_ins.label,
1155 output_ins.oprs[0].offset | SEG_ABS,
1156 output_ins.oprs[1].offset,
1157 NULL, FALSE, FALSE, ofmt, report_error);
1159 else
1160 report_error(ERR_NONFATAL, "bad syntax for EQU");
1162 } /* pass == 2 */
1163 } else { /* instruction isn't an EQU */
1165 if (pass1 == 1) {
1167 long l = insn_size (location.segment, offs, sb, cpu,
1168 &output_ins, report_error);
1170 /* if (using_debug_info) && output_ins.opcode != -1)*/
1171 if (using_debug_info) /* fbk 03/25/01 */
1174 /* this is done here so we can do debug type info */
1175 long typeinfo = TYS_ELEMENTS(output_ins.operands);
1176 switch (output_ins.opcode) {
1177 case I_RESB:
1178 typeinfo = TYS_ELEMENTS(output_ins.oprs[0].offset) | TY_BYTE;
1179 break;
1180 case I_RESW:
1181 typeinfo = TYS_ELEMENTS(output_ins.oprs[0].offset) | TY_WORD;
1182 break;
1183 case I_RESD:
1184 typeinfo = TYS_ELEMENTS(output_ins.oprs[0].offset) | TY_DWORD;
1185 break;
1186 case I_RESQ:
1187 typeinfo = TYS_ELEMENTS(output_ins.oprs[0].offset) | TY_QWORD;
1188 break;
1189 case I_REST:
1190 typeinfo = TYS_ELEMENTS(output_ins.oprs[0].offset) | TY_TBYTE;
1191 break;
1192 case I_DB:
1193 typeinfo |= TY_BYTE;
1194 break;
1195 case I_DW:
1196 typeinfo |= TY_WORD;
1197 break;
1198 case I_DD:
1199 if (output_ins.eops_float)
1200 typeinfo |= TY_FLOAT;
1201 else
1202 typeinfo |= TY_DWORD;
1203 break;
1204 case I_DQ:
1205 typeinfo |= TY_QWORD;
1206 break;
1207 case I_DT:
1208 typeinfo |= TY_TBYTE;
1209 break;
1210 default:
1211 typeinfo = TY_LABEL;
1215 ofmt->current_dfmt->debug_typevalue(typeinfo);
1218 if (l != -1) {
1219 offs += l;
1220 SET_CURR_OFFS (offs);
1223 * else l == -1 => invalid instruction, which will be
1224 * flagged as an error on pass 2
1227 } else { /* pass == 2 */
1228 offs += assemble (location.segment, offs, sb, cpu,
1229 &output_ins, ofmt, report_error, &nasmlist);
1230 SET_CURR_OFFS (offs);
1233 } /* not an EQU */
1234 cleanup_insn (&output_ins);
1236 nasm_free (line);
1237 location.offset = offs = GET_CURR_OFFS;
1238 } /* end while (line = preproc->getline... */
1240 if (pass1==2 && global_offset_changed)
1241 report_error(ERR_NONFATAL, "phase error detected at end of assembly.");
1243 if (pass1 == 1) preproc->cleanup(1);
1245 if (pass1==1 && terminate_after_phase) {
1246 fclose(ofile);
1247 remove(outname);
1248 if (want_usage)
1249 usage();
1250 exit (1);
1252 pass_cnt++;
1253 if (pass>1 && !global_offset_changed) {
1254 pass0++;
1255 if (pass0==2) pass = pass_max - 1;
1256 } else if (!(optimizing>0)) pass0++;
1258 } /* for (pass=1; pass<=2; pass++) */
1260 preproc->cleanup(0);
1261 nasmlist.cleanup();
1262 #if 1
1263 if (optimizing>0 && using_debug_info) /* -On and -g switches */
1264 fprintf(stdout,
1265 "info:: assembly required 1+%d+1 passes\n", pass_cnt-2);
1266 #endif
1267 } /* exit from assemble_file (...) */
/*
 * Recognise a bracketed directive line of the form "[name value]".
 *
 * buf   - the source line; it is modified in place (NUL bytes are
 *         written after the name and over the closing bracket)
 * value - receives a pointer to the directive's argument text, which
 *         is an empty string when the directive has no argument
 *
 * Returns 0 if the line is not a directive at all, 1..10 for the
 * directives known here, and -1 for any other bracketed name.
 */
static int getkw (char *buf, char **value)
{
    char *p, *q;

    /* allow leading spaces or tabs */
    while (*buf==' ' || *buf=='\t')
	buf++;

    if (*buf!='[')
	return 0;

    p = buf;

    while (*p && *p != ']') p++;

    if (!*p)
	return 0;

    q = p++;

    /* only whitespace or a comment may follow the closing bracket */
    while (*p && *p != ';') {
	if (!isspace((unsigned char)*p))
	    return 0;
	p++;
    }
    q[1] = '\0';

    p = buf+1;
    while (*buf && *buf!=' ' && *buf!=']' && *buf!='\t')
	buf++;
    if (*buf==']') {
	*buf = '\0';
	*value = buf;
    } else {
	*buf++ = '\0';
	while (isspace((unsigned char)*buf)) buf++;	/* beppu - skip leading whitespace */
	*value = buf;
	/* the bracket found above is still in place, so this stops */
	while (*buf!=']') buf++;
	*buf++ = '\0';
    }
    if (!nasm_stricmp(p, "segment") || !nasm_stricmp(p, "section"))
	return 1;
    if (!nasm_stricmp(p, "extern"))
	return 2;
    if (!nasm_stricmp(p, "bits"))
	return 3;
    if (!nasm_stricmp(p, "global"))
	return 4;
    if (!nasm_stricmp(p, "common"))
	return 5;
    if (!nasm_stricmp(p, "absolute"))
	return 6;
    if (!nasm_stricmp(p, "debug"))
	return 7;
    if (!nasm_stricmp(p, "warning"))
	return 8;
    if (!nasm_stricmp(p, "cpu"))
	return 9;
    if (!nasm_stricmp(p, "list"))	/* fbk 9/2/00 */
	return 10;
    return -1;
}
1337 static void report_error (int severity, char *fmt, ...)
1339 va_list ap;
1342 * See if it's a suppressed warning.
1344 if ((severity & ERR_MASK) == ERR_WARNING &&
1345 (severity & ERR_WARN_MASK) != 0 &&
1346 suppressed[ (severity & ERR_WARN_MASK) >> ERR_WARN_SHR ])
1347 return; /* and bail out if so */
1350 * See if it's a pass-one only warning and we're not in pass one.
1352 if ((severity & ERR_PASS1) && pass0 == 2)
1353 return;
1355 if (severity & ERR_NOFILE)
1356 fputs ("nasm: ", error_file);
1357 else {
1358 char * currentfile = NULL;
1359 long lineno = 0;
1360 src_get (&lineno, &currentfile);
1361 fprintf (error_file, "%s:%ld: ", currentfile, lineno);
1362 nasm_free (currentfile);
1365 switch (severity & ERR_MASK) {
1366 case ERR_WARNING:
1367 fputs ("warning: ", error_file); break;
1368 case ERR_NONFATAL:
1369 fputs ("error: ", error_file); break;
1370 case ERR_FATAL:
1371 fputs ("fatal: ", error_file); break;
1372 case ERR_PANIC:
1373 fputs ("panic: ", error_file); break;
1374 case ERR_DEBUG:
1375 fputs("debug: ", error_file); break;
1378 va_start (ap, fmt);
1379 vfprintf (error_file, fmt, ap);
1380 fputc ('\n', error_file);
1382 if (severity & ERR_USAGE)
1383 want_usage = TRUE;
1385 switch (severity & ERR_MASK) {
1386 case ERR_WARNING: case ERR_DEBUG:
1387 /* no further action, by definition */
1388 break;
1389 case ERR_NONFATAL:
1390 /* terminate_after_phase = TRUE; *//**//* hack enables listing(!) on errors */
1391 terminate_after_phase = TRUE;
1392 break;
1393 case ERR_FATAL:
1394 if (ofile) {
1395 fclose(ofile);
1396 remove(outname);
1398 if (want_usage)
1399 usage();
1400 exit(1); /* instantly die */
1401 break; /* placate silly compilers */
1402 case ERR_PANIC:
1403 fflush(NULL);
1404 /* abort(); */ /* halt, catch fire, and dump core */
1405 exit(3);
1406 break;
1410 static void usage(void)
1412 fputs("type `nasm -h' for help\n", error_file);
1415 static void register_output_formats(void)
1417 ofmt = ofmt_register (report_error);
1420 #define BUF_DELTA 512
1422 static FILE *no_pp_fp;
1423 static efunc no_pp_err;
1424 static ListGen *no_pp_list;
1425 static long no_pp_lineinc;
1427 static void no_pp_reset (char *file, int pass, efunc error, evalfunc eval,
1428 ListGen *listgen)
1430 src_set_fname(nasm_strdup(file));
1431 src_set_linnum(0);
1432 no_pp_lineinc = 1;
1433 no_pp_err = error;
1434 no_pp_fp = fopen(file, "r");
1435 if (!no_pp_fp)
1436 no_pp_err (ERR_FATAL | ERR_NOFILE,
1437 "unable to open input file `%s'", file);
1438 no_pp_list = listgen;
1439 (void) pass; /* placate compilers */
1440 (void) eval; /* placate compilers */
1443 static char *no_pp_getline (void)
1445 char *buffer, *p, *q;
1446 int bufsize;
1448 bufsize = BUF_DELTA;
1449 buffer = nasm_malloc(BUF_DELTA);
1450 src_set_linnum(src_get_linnum() + no_pp_lineinc);
1452 while (1) { /* Loop to handle %line */
1454 p = buffer;
1455 while (1) { /* Loop to handle long lines */
1456 q = fgets(p, bufsize-(p-buffer), no_pp_fp);
1457 if (!q)
1458 break;
1459 p += strlen(p);
1460 if (p > buffer && p[-1] == '\n')
1461 break;
1462 if (p-buffer > bufsize-10) {
1463 int offset;
1464 offset = p - buffer;
1465 bufsize += BUF_DELTA;
1466 buffer = nasm_realloc(buffer, bufsize);
1467 p = buffer + offset;
1471 if (!q && p == buffer) {
1472 nasm_free (buffer);
1473 return NULL;
1477 * Play safe: remove CRs, LFs and any spurious ^Zs, if any of
1478 * them are present at the end of the line.
1480 buffer[strcspn(buffer, "\r\n\032")] = '\0';
1482 if (!strncmp(buffer, "%line", 5)) {
1483 long ln;
1484 int li;
1485 char *nm = nasm_malloc(strlen(buffer));
1486 if (sscanf(buffer+5, "%ld+%d %s", &ln, &li, nm) == 3) {
1487 nasm_free( src_set_fname(nm) );
1488 src_set_linnum(ln);
1489 no_pp_lineinc = li;
1490 continue;
1492 nasm_free(nm);
1494 break;
1497 no_pp_list->line (LIST_READ, buffer);
1499 return buffer;
1502 static void no_pp_cleanup (int pass)
1504 fclose(no_pp_fp);
1507 static unsigned long get_cpu (char *value)
1510 if (!strcmp(value, "8086")) return IF_8086;
1511 if (!strcmp(value, "186")) return IF_186;
1512 if (!strcmp(value, "286")) return IF_286;
1513 if (!strcmp(value, "386")) return IF_386;
1514 if (!strcmp(value, "486")) return IF_486;
1515 if (!strcmp(value, "586") ||
1516 !nasm_stricmp(value, "pentium") ) return IF_PENT;
1517 if (!strcmp(value, "686") ||
1518 !nasm_stricmp(value, "ppro") ||
1519 !nasm_stricmp(value, "p2") ) return IF_P6;
1520 if (!nasm_stricmp(value, "p3") ||
1521 !nasm_stricmp(value, "katmai") ) return IF_KATMAI;
1522 if (!nasm_stricmp(value, "p4") || /* is this right? -- jrc */
1523 !nasm_stricmp(value, "willamette") ) return IF_WILLAMETTE;
1525 report_error (pass0<2 ? ERR_NONFATAL : ERR_FATAL, "unknown 'cpu' type");
1527 return IF_PLEVEL; /* the maximum level */
1531 static int get_bits (char *value)
1533 int i;
1535 if ((i = atoi(value)) == 16) return i; /* set for a 16-bit segment */
1536 else if (i == 32) {
1537 if (cpu < IF_386) {
1538 report_error(ERR_NONFATAL,
1539 "cannot specify 32-bit segment on processor below a 386");
1540 i = 16;
1542 } else {
1543 report_error(pass0<2 ? ERR_NONFATAL : ERR_FATAL,
1544 "`%s' is not a valid segment size; must be 16 or 32",
1545 value);
1546 i = 16;
1548 return i;
1551 /* end of nasm.c */