NASM 2.09.01
[nasm/avx512.git] / preproc.c
blob70e550d0c1f51f927dce3c90fb777c4d1ff46857
1 /* ----------------------------------------------------------------------- *
3 * Copyright 1996-2010 The NASM Authors - All Rights Reserved
4 * See the file AUTHORS included with the NASM distribution for
5 * the specific copyright holders.
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following
9 * conditions are met:
11 * * Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * * Redistributions in binary form must reproduce the above
14 * copyright notice, this list of conditions and the following
15 * disclaimer in the documentation and/or other materials provided
16 * with the distribution.
18 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
19 * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
20 * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
21 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
22 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
23 * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
24 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
25 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
26 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
28 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
29 * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
30 * EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32 * ----------------------------------------------------------------------- */
35 * preproc.c macro preprocessor for the Netwide Assembler
38 /* Typical flow of text through preproc
40 * pp_getline gets tokenized lines, either
42 * from a macro expansion
44 * or
45 * {
46 * read_line gets raw text from stdmacpos, or predef, or current input file
47 * tokenize converts to tokens
48 * }
50 * expand_mmac_params is used to expand %1 etc., unless a macro is being
51 * defined or a false conditional is being processed
52 * (%0, %1, %+1, %-1, %%foo
54 * do_directive checks for directives
56 * expand_smacro is used to expand single line macros
58 * expand_mmacro is used to expand multi-line macros
60 * detoken is used to convert the line back to text
63 #include "compiler.h"
65 #include <stdio.h>
66 #include <stdarg.h>
67 #include <stdlib.h>
68 #include <stddef.h>
69 #include <string.h>
70 #include <ctype.h>
71 #include <limits.h>
72 #include <inttypes.h>
74 #include "nasm.h"
75 #include "nasmlib.h"
76 #include "preproc.h"
77 #include "hashtbl.h"
78 #include "quote.h"
79 #include "stdscan.h"
80 #include "eval.h"
81 #include "tokens.h"
82 #include "tables.h"
84 typedef struct SMacro SMacro;
85 typedef struct MMacro MMacro;
86 typedef struct MMacroInvocation MMacroInvocation;
87 typedef struct Context Context;
88 typedef struct Token Token;
89 typedef struct Blocks Blocks;
90 typedef struct Line Line;
91 typedef struct Include Include;
92 typedef struct Cond Cond;
93 typedef struct IncPath IncPath;
96 * Note on the storage of both SMacro and MMacros: the hash table
97 * indexes them case-insensitively, and we then have to go through a
98 * linked list of potential case aliases (and, for MMacros, parameter
99 * ranges); this is to preserve the matching semantics of the earlier
100 * code. If the number of case aliases for a specific macro is a
101 * performance issue, you may want to reconsider your coding style.
105 * Store the definition of a single-line macro.
107 struct SMacro {
108 SMacro *next;
109 char *name;
110 bool casesense;
111 bool in_progress;
112 unsigned int nparam;
113 Token *expansion;
117 * Store the definition of a multi-line macro. This is also used to
118 * store the interiors of `%rep...%endrep' blocks, which are
119 * effectively self-re-invoking multi-line macros which simply
120 * don't have a name or bother to appear in the hash tables. %rep
121 * blocks are signified by having a NULL `name' field.
123 * In a MMacro describing a `%rep' block, the `in_progress' field
124 * isn't merely boolean, but gives the number of repeats left to
125 * run.
127 * The `next' field is used for storing MMacros in hash tables; the
128 * `next_active' field is for stacking them on istk entries.
130 * When a MMacro is being expanded, `params', `iline', `nparam',
131 * `paramlen', `rotate' and `unique' are local to the invocation.
133 struct MMacro {
134 MMacro *next;
135 MMacroInvocation *prev; /* previous invocation */
136 char *name;
137 int nparam_min, nparam_max;
138 bool casesense;
139 bool plus; /* is the last parameter greedy? */
140 bool nolist; /* is this macro listing-inhibited? */
141 int64_t in_progress; /* is this macro currently being expanded? */
142 int32_t max_depth; /* maximum number of recursive expansions allowed */
143 Token *dlist; /* All defaults as one list */
144 Token **defaults; /* Parameter default pointers */
145 int ndefs; /* number of default parameters */
146 Line *expansion;
148 MMacro *next_active;
149 MMacro *rep_nest; /* used for nesting %rep */
150 Token **params; /* actual parameters */
151 Token *iline; /* invocation line */
152 unsigned int nparam, rotate;
153 int *paramlen;
154 uint64_t unique;
155 int lineno; /* Current line number on expansion */
156 uint64_t condcnt; /* number of if blocks... */
160 /* Store the definition of a multi-line macro, as defined in a
161 * previous recursive macro expansion.
163 struct MMacroInvocation {
164 MMacroInvocation *prev; /* previous invocation */
165 Token **params; /* actual parameters */
166 Token *iline; /* invocation line */
167 unsigned int nparam, rotate;
168 int *paramlen;
169 uint64_t unique;
170 uint64_t condcnt;
175 * The context stack is composed of a linked list of these.
177 struct Context {
178 Context *next;
179 char *name;
180 struct hash_table localmac;
181 uint32_t number;
185 * This is the internal form which we break input lines up into.
186 * Typically stored in linked lists.
188 * Note that `type' serves a double meaning: TOK_SMAC_PARAM is not
189 * necessarily used as-is, but is intended to denote the number of
190 * the substituted parameter. So in the definition
192 * %define a(x,y) ( (x) & ~(y) )
194 * the token representing `x' will have its type changed to
195 * TOK_SMAC_PARAM, but the one representing `y' will be
196 * TOK_SMAC_PARAM+1.
198 * TOK_INTERNAL_STRING is a dirty hack: it's a single string token
199 * which doesn't need quotes around it. Used in the pre-include
200 * mechanism as an alternative to trying to find a sensible type of
201 * quote to use on the filename we were passed.
203 enum pp_token_type {
204 TOK_NONE = 0, TOK_WHITESPACE, TOK_COMMENT, TOK_ID,
205 TOK_PREPROC_ID, TOK_STRING,
206 TOK_NUMBER, TOK_FLOAT, TOK_SMAC_END, TOK_OTHER,
207 TOK_INTERNAL_STRING,
208 TOK_PREPROC_Q, TOK_PREPROC_QQ,
209 TOK_PASTE, /* %+ */
210 TOK_INDIRECT, /* %[...] */
211 TOK_SMAC_PARAM, /* MUST BE LAST IN THE LIST!!! */
212 TOK_MAX = INT_MAX /* Keep compiler from reducing the range */
215 struct Token {
216 Token *next;
217 char *text;
218 union {
219 SMacro *mac; /* associated macro for TOK_SMAC_END */
220 size_t len; /* scratch length field */
221 } a; /* Auxiliary data */
222 enum pp_token_type type;
226 * Multi-line macro definitions are stored as a linked list of
227 * these, which is essentially a container to allow several linked
228 * lists of Tokens.
230 * Note that in this module, linked lists are treated as stacks
231 * wherever possible. For this reason, Lines are _pushed_ on to the
232 * `expansion' field in MMacro structures, so that the linked list,
233 * if walked, would give the macro lines in reverse order; this
234 * means that we can walk the list when expanding a macro, and thus
235 * push the lines on to the `expansion' field in _istk_ in reverse
236 * order (so that when popped back off they are in the right
237 * order). It may seem cockeyed, and it relies on my design having
238 * an even number of steps in, but it works...
240 * Some of these structures, rather than being actual lines, are
241 * markers delimiting the end of the expansion of a given macro.
242 * This is for use in the cycle-tracking and %rep-handling code.
243 * Such structures have `finishes' non-NULL, and `first' NULL. All
244 * others have `finishes' NULL, but `first' may still be NULL if
245 * the line is blank.
247 struct Line {
248 Line *next;
249 MMacro *finishes;
250 Token *first;
254 * To handle an arbitrary level of file inclusion, we maintain a
255 * stack (ie linked list) of these things.
257 struct Include {
258 Include *next;
259 FILE *fp;
260 Cond *conds;
261 Line *expansion;
262 char *fname;
263 int lineno, lineinc;
264 MMacro *mstk; /* stack of active macros/reps */
268 * Include search path. This is simply a list of strings which get
269 * prepended, in turn, to the name of an include file, in an
270 * attempt to find the file if it's not in the current directory.
272 struct IncPath {
273 IncPath *next;
274 char *path;
278 * Conditional assembly: we maintain a separate stack of these for
279 * each level of file inclusion. (The only reason we keep the
280 * stacks separate is to ensure that a stray `%endif' in a file
281 * included from within the true branch of a `%if' won't terminate
282 * it and cause confusion: instead, rightly, it'll cause an error.)
284 struct Cond {
285 Cond *next;
286 int state;
288 enum {
290 * These states are for use just after %if or %elif: IF_TRUE
291 * means the condition has evaluated to truth so we are
292 * currently emitting, whereas IF_FALSE means we are not
293 * currently emitting but will start doing so if a %else comes
294 * up. In these states, all directives are admissible: %elif,
295 * %else and %endif. (And of course %if.)
297 COND_IF_TRUE, COND_IF_FALSE,
299 * These states come up after a %else: ELSE_TRUE means we're
300 * emitting, and ELSE_FALSE means we're not. In ELSE_* states,
301 * any %elif or %else will cause an error.
303 COND_ELSE_TRUE, COND_ELSE_FALSE,
305 * These states mean that we're not emitting now, and also that
306 * nothing until %endif will be emitted at all. COND_DONE is
307 * used when we've had our moment of emission
308 * and have now started seeing %elifs. COND_NEVER is used when
309 * the condition construct in question is contained within a
310 * non-emitting branch of a larger condition construct,
311 * or if there is an error.
313 COND_DONE, COND_NEVER
315 #define emitting(x) ( (x) == COND_IF_TRUE || (x) == COND_ELSE_TRUE )
318 * These defines are used as the possible return values for do_directive
320 #define NO_DIRECTIVE_FOUND 0
321 #define DIRECTIVE_FOUND 1
324 * This define sets the upper limit for smacro and recursive mmacro
325 * expansions
327 #define DEADMAN_LIMIT (1 << 20)
329 /* max reps */
330 #define REP_LIMIT ((INT64_C(1) << 62))
333 * Condition codes. Note that we use c_ prefix not C_ because C_ is
334 * used in nasm.h for the "real" condition codes. At _this_ level,
335 * we treat CXZ and ECXZ as condition codes, albeit non-invertible
336 * ones, so we need a different enum...
338 static const char * const conditions[] = {
339 "a", "ae", "b", "be", "c", "cxz", "e", "ecxz", "g", "ge", "l", "le",
340 "na", "nae", "nb", "nbe", "nc", "ne", "ng", "nge", "nl", "nle", "no",
341 "np", "ns", "nz", "o", "p", "pe", "po", "rcxz", "s", "z"
343 enum pp_conds {
344 c_A, c_AE, c_B, c_BE, c_C, c_CXZ, c_E, c_ECXZ, c_G, c_GE, c_L, c_LE,
345 c_NA, c_NAE, c_NB, c_NBE, c_NC, c_NE, c_NG, c_NGE, c_NL, c_NLE, c_NO,
346 c_NP, c_NS, c_NZ, c_O, c_P, c_PE, c_PO, c_RCXZ, c_S, c_Z,
347 c_none = -1
349 static const enum pp_conds inverse_ccs[] = {
350 c_NA, c_NAE, c_NB, c_NBE, c_NC, -1, c_NE, -1, c_NG, c_NGE, c_NL, c_NLE,
351 c_A, c_AE, c_B, c_BE, c_C, c_E, c_G, c_GE, c_L, c_LE, c_O, c_P, c_S,
352 c_Z, c_NO, c_NP, c_PO, c_PE, -1, c_NS, c_NZ
356 * Directive names.
358 /* If this is a an IF, ELIF, ELSE or ENDIF keyword */
359 static int is_condition(enum preproc_token arg)
361 return PP_IS_COND(arg) || (arg == PP_ELSE) || (arg == PP_ENDIF);
364 /* For TASM compatibility we need to be able to recognise TASM compatible
365 * conditional compilation directives. Using the NASM pre-processor does
366 * not work, so we look for them specifically from the following list and
367 * then jam in the equivalent NASM directive into the input stream.
370 enum {
371 TM_ARG, TM_ELIF, TM_ELSE, TM_ENDIF, TM_IF, TM_IFDEF, TM_IFDIFI,
372 TM_IFNDEF, TM_INCLUDE, TM_LOCAL
375 static const char * const tasm_directives[] = {
376 "arg", "elif", "else", "endif", "if", "ifdef", "ifdifi",
377 "ifndef", "include", "local"
380 static int StackSize = 4;
381 static char *StackPointer = "ebp";
382 static int ArgOffset = 8;
383 static int LocalOffset = 0;
385 static Context *cstk;
386 static Include *istk;
387 static IncPath *ipath = NULL;
389 static int pass; /* HACK: pass 0 = generate dependencies only */
390 static StrList **dephead, **deptail; /* Dependency list */
392 static uint64_t unique; /* unique identifier numbers */
394 static Line *predef = NULL;
395 static bool do_predef;
397 static ListGen *list;
400 * The current set of multi-line macros we have defined.
402 static struct hash_table mmacros;
405 * The current set of single-line macros we have defined.
407 static struct hash_table smacros;
410 * The multi-line macro we are currently defining, or the %rep
411 * block we are currently reading, if any.
413 static MMacro *defining;
415 static uint64_t nested_mac_count;
416 static uint64_t nested_rep_count;
419 * The number of macro parameters to allocate space for at a time.
421 #define PARAM_DELTA 16
424 * The standard macro set: defined in macros.c in the array nasm_stdmac.
425 * This gives our position in the macro set, when we're processing it.
427 static macros_t *stdmacpos;
430 * The extra standard macros that come from the object format, if
431 * any.
433 static macros_t *extrastdmac = NULL;
434 static bool any_extrastdmac;
437 * Tokens are allocated in blocks to improve speed
439 #define TOKEN_BLOCKSIZE 4096
440 static Token *freeTokens = NULL;
441 struct Blocks {
442 Blocks *next;
443 void *chunk;
446 static Blocks blocks = { NULL, NULL };
449 * Forward declarations.
451 static Token *expand_mmac_params(Token * tline);
452 static Token *expand_smacro(Token * tline);
453 static Token *expand_id(Token * tline);
454 static Context *get_ctx(const char *name, const char **namep,
455 bool all_contexts);
456 static void make_tok_num(Token * tok, int64_t val);
457 static void error(int severity, const char *fmt, ...);
458 static void error_precond(int severity, const char *fmt, ...);
459 static void *new_Block(size_t size);
460 static void delete_Blocks(void);
461 static Token *new_Token(Token * next, enum pp_token_type type,
462 const char *text, int txtlen);
463 static Token *delete_Token(Token * t);
466 * Macros for safe checking of token pointers, avoid *(NULL)
468 #define tok_type_(x,t) ((x) && (x)->type == (t))
469 #define skip_white_(x) if (tok_type_((x), TOK_WHITESPACE)) (x)=(x)->next
470 #define tok_is_(x,v) (tok_type_((x), TOK_OTHER) && !strcmp((x)->text,(v)))
471 #define tok_isnt_(x,v) ((x) && ((x)->type!=TOK_OTHER || strcmp((x)->text,(v))))
474 * nasm_unquote with error if the string contains NUL characters.
475 * If the string contains NUL characters, issue an error and return
476 * the C len, i.e. truncate at the NUL.
478 static size_t nasm_unquote_cstr(char *qstr, enum preproc_token directive)
480 size_t len = nasm_unquote(qstr, NULL);
481 size_t clen = strlen(qstr);
483 if (len != clen)
484 error(ERR_NONFATAL, "NUL character in `%s' directive",
485 pp_directives[directive]);
487 return clen;
491 * Handle TASM specific directives, which do not contain a % in
492 * front of them. We do it here because I could not find any other
493 * place to do it for the moment, and it is a hack (ideally it would
494 * be nice to be able to use the NASM pre-processor to do it).
496 static char *check_tasm_directive(char *line)
498 int32_t i, j, k, m, len;
499 char *p, *q, *oldline, oldchar;
501 p = nasm_skip_spaces(line);
503 /* Binary search for the directive name */
504 i = -1;
505 j = ARRAY_SIZE(tasm_directives);
506 q = nasm_skip_word(p);
507 len = q - p;
508 if (len) {
509 oldchar = p[len];
510 p[len] = 0;
511 while (j - i > 1) {
512 k = (j + i) / 2;
513 m = nasm_stricmp(p, tasm_directives[k]);
514 if (m == 0) {
515 /* We have found a directive, so jam a % in front of it
516 * so that NASM will then recognise it as one if it's own.
518 p[len] = oldchar;
519 len = strlen(p);
520 oldline = line;
521 line = nasm_malloc(len + 2);
522 line[0] = '%';
523 if (k == TM_IFDIFI) {
525 * NASM does not recognise IFDIFI, so we convert
526 * it to %if 0. This is not used in NASM
527 * compatible code, but does need to parse for the
528 * TASM macro package.
530 strcpy(line + 1, "if 0");
531 } else {
532 memcpy(line + 1, p, len + 1);
534 nasm_free(oldline);
535 return line;
536 } else if (m < 0) {
537 j = k;
538 } else
539 i = k;
541 p[len] = oldchar;
543 return line;
547 * The pre-preprocessing stage... This function translates line
548 * number indications as they emerge from GNU cpp (`# lineno "file"
549 * flags') into NASM preprocessor line number indications (`%line
550 * lineno file').
552 static char *prepreproc(char *line)
554 int lineno, fnlen;
555 char *fname, *oldline;
557 if (line[0] == '#' && line[1] == ' ') {
558 oldline = line;
559 fname = oldline + 2;
560 lineno = atoi(fname);
561 fname += strspn(fname, "0123456789 ");
562 if (*fname == '"')
563 fname++;
564 fnlen = strcspn(fname, "\"");
565 line = nasm_malloc(20 + fnlen);
566 snprintf(line, 20 + fnlen, "%%line %d %.*s", lineno, fnlen, fname);
567 nasm_free(oldline);
569 if (tasm_compatible_mode)
570 return check_tasm_directive(line);
571 return line;
575 * Free a linked list of tokens.
577 static void free_tlist(Token * list)
579 while (list)
580 list = delete_Token(list);
584 * Free a linked list of lines.
586 static void free_llist(Line * list)
588 Line *l, *tmp;
589 list_for_each_safe(l, tmp, list) {
590 free_tlist(l->first);
591 nasm_free(l);
596 * Free an MMacro
598 static void free_mmacro(MMacro * m)
600 nasm_free(m->name);
601 free_tlist(m->dlist);
602 nasm_free(m->defaults);
603 free_llist(m->expansion);
604 nasm_free(m);
608 * Free all currently defined macros, and free the hash tables
610 static void free_smacro_table(struct hash_table *smt)
612 SMacro *s, *tmp;
613 const char *key;
614 struct hash_tbl_node *it = NULL;
616 while ((s = hash_iterate(smt, &it, &key)) != NULL) {
617 nasm_free((void *)key);
618 list_for_each_safe(s, tmp, s) {
619 nasm_free(s->name);
620 free_tlist(s->expansion);
621 nasm_free(s);
624 hash_free(smt);
627 static void free_mmacro_table(struct hash_table *mmt)
629 MMacro *m, *tmp;
630 const char *key;
631 struct hash_tbl_node *it = NULL;
633 it = NULL;
634 while ((m = hash_iterate(mmt, &it, &key)) != NULL) {
635 nasm_free((void *)key);
636 list_for_each_safe(m ,tmp, m)
637 free_mmacro(m);
639 hash_free(mmt);
642 static void free_macros(void)
644 free_smacro_table(&smacros);
645 free_mmacro_table(&mmacros);
649 * Initialize the hash tables
651 static void init_macros(void)
653 hash_init(&smacros, HASH_LARGE);
654 hash_init(&mmacros, HASH_LARGE);
658 * Pop the context stack.
660 static void ctx_pop(void)
662 Context *c = cstk;
664 cstk = cstk->next;
665 free_smacro_table(&c->localmac);
666 nasm_free(c->name);
667 nasm_free(c);
671 * Search for a key in the hash index; adding it if necessary
672 * (in which case we initialize the data pointer to NULL.)
674 static void **
675 hash_findi_add(struct hash_table *hash, const char *str)
677 struct hash_insert hi;
678 void **r;
679 char *strx;
681 r = hash_findi(hash, str, &hi);
682 if (r)
683 return r;
685 strx = nasm_strdup(str); /* Use a more efficient allocator here? */
686 return hash_add(&hi, strx, NULL);
/*
 * Lookup-only variant of hash_findi(): returns the stored data pointer
 * itself instead of the address of the slot, or NULL when the key is
 * absent.  Nothing is ever inserted, so no insertion cookie is passed.
 */
static void *
hash_findix(struct hash_table *hash, const char *str)
{
    void **slot = hash_findi(hash, str, NULL);

    if (!slot)
        return NULL;
    return *slot;
}
704 * read line from standart macros set,
705 * if there no more left -- return NULL
707 static char *line_from_stdmac(void)
709 unsigned char c;
710 const unsigned char *p = stdmacpos;
711 char *line, *q;
712 size_t len = 0;
714 if (!stdmacpos)
715 return NULL;
717 while ((c = *p++)) {
718 if (c >= 0x80)
719 len += pp_directives_len[c - 0x80] + 1;
720 else
721 len++;
724 line = nasm_malloc(len + 1);
725 q = line;
726 while ((c = *stdmacpos++)) {
727 if (c >= 0x80) {
728 memcpy(q, pp_directives[c - 0x80], pp_directives_len[c - 0x80]);
729 q += pp_directives_len[c - 0x80];
730 *q++ = ' ';
731 } else {
732 *q++ = c;
735 stdmacpos = p;
736 *q = '\0';
738 if (!*stdmacpos) {
739 /* This was the last of the standard macro chain... */
740 stdmacpos = NULL;
741 if (any_extrastdmac) {
742 stdmacpos = extrastdmac;
743 any_extrastdmac = false;
744 } else if (do_predef) {
745 Line *pd, *l;
746 Token *head, **tail, *t;
749 * Nasty hack: here we push the contents of
750 * `predef' on to the top-level expansion stack,
751 * since this is the most convenient way to
752 * implement the pre-include and pre-define
753 * features.
755 list_for_each(pd, predef) {
756 head = NULL;
757 tail = &head;
758 list_for_each(t, pd->first) {
759 *tail = new_Token(NULL, t->type, t->text, 0);
760 tail = &(*tail)->next;
763 l = nasm_malloc(sizeof(Line));
764 l->next = istk->expansion;
765 l->first = head;
766 l->finishes = NULL;
768 istk->expansion = l;
770 do_predef = false;
774 return line;
777 #define BUF_DELTA 512
779 * Read a line from the top file in istk, handling multiple CR/LFs
780 * at the end of the line read, and handling spurious ^Zs. Will
781 * return lines from the standard macro set if this has not already
782 * been done.
784 static char *read_line(void)
786 char *buffer, *p, *q;
787 int bufsize, continued_count;
790 * standart macros set (predefined) goes first
792 p = line_from_stdmac();
793 if (p)
794 return p;
797 * regular read from a file
799 bufsize = BUF_DELTA;
800 buffer = nasm_malloc(BUF_DELTA);
801 p = buffer;
802 continued_count = 0;
803 while (1) {
804 q = fgets(p, bufsize - (p - buffer), istk->fp);
805 if (!q)
806 break;
807 p += strlen(p);
808 if (p > buffer && p[-1] == '\n') {
810 * Convert backslash-CRLF line continuation sequences into
811 * nothing at all (for DOS and Windows)
813 if (((p - 2) > buffer) && (p[-3] == '\\') && (p[-2] == '\r')) {
814 p -= 3;
815 *p = 0;
816 continued_count++;
819 * Also convert backslash-LF line continuation sequences into
820 * nothing at all (for Unix)
822 else if (((p - 1) > buffer) && (p[-2] == '\\')) {
823 p -= 2;
824 *p = 0;
825 continued_count++;
826 } else {
827 break;
830 if (p - buffer > bufsize - 10) {
831 int32_t offset = p - buffer;
832 bufsize += BUF_DELTA;
833 buffer = nasm_realloc(buffer, bufsize);
834 p = buffer + offset; /* prevent stale-pointer problems */
838 if (!q && p == buffer) {
839 nasm_free(buffer);
840 return NULL;
843 src_set_linnum(src_get_linnum() + istk->lineinc +
844 (continued_count * istk->lineinc));
847 * Play safe: remove CRs as well as LFs, if any of either are
848 * present at the end of the line.
850 while (--p >= buffer && (*p == '\n' || *p == '\r'))
851 *p = '\0';
854 * Handle spurious ^Z, which may be inserted into source files
855 * by some file transfer utilities.
857 buffer[strcspn(buffer, "\032")] = '\0';
859 list->line(LIST_READ, buffer);
861 return buffer;
865 * Tokenize a line of text. This is a very simple process since we
866 * don't need to parse the value out of e.g. numeric tokens: we
867 * simply split one string into many.
869 static Token *tokenize(char *line)
871 char c, *p = line;
872 enum pp_token_type type;
873 Token *list = NULL;
874 Token *t, **tail = &list;
876 while (*line) {
877 p = line;
878 if (*p == '%') {
879 p++;
880 if (*p == '+' && !nasm_isdigit(p[1])) {
881 p++;
882 type = TOK_PASTE;
883 } else if (nasm_isdigit(*p) ||
884 ((*p == '-' || *p == '+') && nasm_isdigit(p[1]))) {
885 do {
886 p++;
888 while (nasm_isdigit(*p));
889 type = TOK_PREPROC_ID;
890 } else if (*p == '{') {
891 p++;
892 while (*p && *p != '}') {
893 p[-1] = *p;
894 p++;
896 p[-1] = '\0';
897 if (*p)
898 p++;
899 type = TOK_PREPROC_ID;
900 } else if (*p == '[') {
901 int lvl = 1;
902 line += 2; /* Skip the leading %[ */
903 p++;
904 while (lvl && (c = *p++)) {
905 switch (c) {
906 case ']':
907 lvl--;
908 break;
909 case '%':
910 if (*p == '[')
911 lvl++;
912 break;
913 case '\'':
914 case '\"':
915 case '`':
916 p = nasm_skip_string(p - 1) + 1;
917 break;
918 default:
919 break;
922 p--;
923 if (*p)
924 *p++ = '\0';
925 if (lvl)
926 error(ERR_NONFATAL, "unterminated %[ construct");
927 type = TOK_INDIRECT;
928 } else if (*p == '?') {
929 type = TOK_PREPROC_Q; /* %? */
930 p++;
931 if (*p == '?') {
932 type = TOK_PREPROC_QQ; /* %?? */
933 p++;
935 } else if (*p == '!') {
936 type = TOK_PREPROC_ID;
937 p++;
938 if (isidchar(*p)) {
939 do {
940 p++;
942 while (isidchar(*p));
943 } else if (*p == '\'' || *p == '\"' || *p == '`') {
944 p = nasm_skip_string(p);
945 if (*p)
946 p++;
947 else
948 error(ERR_NONFATAL|ERR_PASS1, "unterminated %! string");
949 } else {
950 /* %! without string or identifier */
951 type = TOK_OTHER; /* Legacy behavior... */
953 } else if (isidchar(*p) ||
954 ((*p == '!' || *p == '%' || *p == '$') &&
955 isidchar(p[1]))) {
956 do {
957 p++;
959 while (isidchar(*p));
960 type = TOK_PREPROC_ID;
961 } else {
962 type = TOK_OTHER;
963 if (*p == '%')
964 p++;
966 } else if (isidstart(*p) || (*p == '$' && isidstart(p[1]))) {
967 type = TOK_ID;
968 p++;
969 while (*p && isidchar(*p))
970 p++;
971 } else if (*p == '\'' || *p == '"' || *p == '`') {
973 * A string token.
975 type = TOK_STRING;
976 p = nasm_skip_string(p);
978 if (*p) {
979 p++;
980 } else {
981 error(ERR_WARNING|ERR_PASS1, "unterminated string");
982 /* Handling unterminated strings by UNV */
983 /* type = -1; */
985 } else if (p[0] == '$' && p[1] == '$') {
986 type = TOK_OTHER; /* TOKEN_BASE */
987 p += 2;
988 } else if (isnumstart(*p)) {
989 bool is_hex = false;
990 bool is_float = false;
991 bool has_e = false;
992 char c, *r;
995 * A numeric token.
998 if (*p == '$') {
999 p++;
1000 is_hex = true;
1003 for (;;) {
1004 c = *p++;
1006 if (!is_hex && (c == 'e' || c == 'E')) {
1007 has_e = true;
1008 if (*p == '+' || *p == '-') {
1010 * e can only be followed by +/- if it is either a
1011 * prefixed hex number or a floating-point number
1013 p++;
1014 is_float = true;
1016 } else if (c == 'H' || c == 'h' || c == 'X' || c == 'x') {
1017 is_hex = true;
1018 } else if (c == 'P' || c == 'p') {
1019 is_float = true;
1020 if (*p == '+' || *p == '-')
1021 p++;
1022 } else if (isnumchar(c) || c == '_')
1023 ; /* just advance */
1024 else if (c == '.') {
1026 * we need to deal with consequences of the legacy
1027 * parser, like "1.nolist" being two tokens
1028 * (TOK_NUMBER, TOK_ID) here; at least give it
1029 * a shot for now. In the future, we probably need
1030 * a flex-based scanner with proper pattern matching
1031 * to do it as well as it can be done. Nothing in
1032 * the world is going to help the person who wants
1033 * 0x123.p16 interpreted as two tokens, though.
1035 r = p;
1036 while (*r == '_')
1037 r++;
1039 if (nasm_isdigit(*r) || (is_hex && nasm_isxdigit(*r)) ||
1040 (!is_hex && (*r == 'e' || *r == 'E')) ||
1041 (*r == 'p' || *r == 'P')) {
1042 p = r;
1043 is_float = true;
1044 } else
1045 break; /* Terminate the token */
1046 } else
1047 break;
1049 p--; /* Point to first character beyond number */
1051 if (p == line+1 && *line == '$') {
1052 type = TOK_OTHER; /* TOKEN_HERE */
1053 } else {
1054 if (has_e && !is_hex) {
1055 /* 1e13 is floating-point, but 1e13h is not */
1056 is_float = true;
1059 type = is_float ? TOK_FLOAT : TOK_NUMBER;
1061 } else if (nasm_isspace(*p)) {
1062 type = TOK_WHITESPACE;
1063 p = nasm_skip_spaces(p);
1065 * Whitespace just before end-of-line is discarded by
1066 * pretending it's a comment; whitespace just before a
1067 * comment gets lumped into the comment.
1069 if (!*p || *p == ';') {
1070 type = TOK_COMMENT;
1071 while (*p)
1072 p++;
1074 } else if (*p == ';') {
1075 type = TOK_COMMENT;
1076 while (*p)
1077 p++;
1078 } else {
1080 * Anything else is an operator of some kind. We check
1081 * for all the double-character operators (>>, <<, //,
1082 * %%, <=, >=, ==, !=, <>, &&, ||, ^^), but anything
1083 * else is a single-character operator.
1085 type = TOK_OTHER;
1086 if ((p[0] == '>' && p[1] == '>') ||
1087 (p[0] == '<' && p[1] == '<') ||
1088 (p[0] == '/' && p[1] == '/') ||
1089 (p[0] == '<' && p[1] == '=') ||
1090 (p[0] == '>' && p[1] == '=') ||
1091 (p[0] == '=' && p[1] == '=') ||
1092 (p[0] == '!' && p[1] == '=') ||
1093 (p[0] == '<' && p[1] == '>') ||
1094 (p[0] == '&' && p[1] == '&') ||
1095 (p[0] == '|' && p[1] == '|') ||
1096 (p[0] == '^' && p[1] == '^')) {
1097 p++;
1099 p++;
1102 /* Handling unterminated string by UNV */
1103 /*if (type == -1)
1105 *tail = t = new_Token(NULL, TOK_STRING, line, p-line+1);
1106 t->text[p-line] = *line;
1107 tail = &t->next;
1109 else */
1110 if (type != TOK_COMMENT) {
1111 *tail = t = new_Token(NULL, type, line, p - line);
1112 tail = &t->next;
1114 line = p;
1116 return list;
1120 * this function allocates a new managed block of memory and
1121 * returns a pointer to the block. The managed blocks are
1122 * deleted only all at once by the delete_Blocks function.
1124 static void *new_Block(size_t size)
1126 Blocks *b = &blocks;
1128 /* first, get to the end of the linked list */
1129 while (b->next)
1130 b = b->next;
1131 /* now allocate the requested chunk */
1132 b->chunk = nasm_malloc(size);
1134 /* now allocate a new block for the next request */
1135 b->next = nasm_malloc(sizeof(Blocks));
1136 /* and initialize the contents of the new block */
1137 b->next->next = NULL;
1138 b->next->chunk = NULL;
1139 return b->chunk;
1143 * this function deletes all managed blocks of memory
1145 static void delete_Blocks(void)
1147 Blocks *a, *b = &blocks;
1150 * keep in mind that the first block, pointed to by blocks
1151 * is a static and not dynamically allocated, so we don't
1152 * free it.
1154 while (b) {
1155 if (b->chunk)
1156 nasm_free(b->chunk);
1157 a = b;
1158 b = b->next;
1159 if (a != &blocks)
1160 nasm_free(a);
1165 * this function creates a new Token and passes a pointer to it
1166 * back to the caller. It sets the type and text elements, and
1167 * also the a.mac and next elements to NULL.
1169 static Token *new_Token(Token * next, enum pp_token_type type,
1170 const char *text, int txtlen)
1172 Token *t;
1173 int i;
1175 if (!freeTokens) {
1176 freeTokens = (Token *) new_Block(TOKEN_BLOCKSIZE * sizeof(Token));
1177 for (i = 0; i < TOKEN_BLOCKSIZE - 1; i++)
1178 freeTokens[i].next = &freeTokens[i + 1];
1179 freeTokens[i].next = NULL;
1181 t = freeTokens;
1182 freeTokens = t->next;
1183 t->next = next;
1184 t->a.mac = NULL;
1185 t->type = type;
1186 if (type == TOK_WHITESPACE || !text) {
1187 t->text = NULL;
1188 } else {
1189 if (txtlen == 0)
1190 txtlen = strlen(text);
1191 t->text = nasm_malloc(txtlen+1);
1192 memcpy(t->text, text, txtlen);
1193 t->text[txtlen] = '\0';
1195 return t;
1198 static Token *delete_Token(Token * t)
1200 Token *next = t->next;
1201 nasm_free(t->text);
1202 t->next = freeTokens;
1203 freeTokens = t;
1204 return next;
1208 * Convert a line of tokens back into text.
1209 * If expand_locals is not zero, identifiers of the form "%$*xxx"
1210 * will be transformed into ..@ctxnum.xxx
1212 static char *detoken(Token * tlist, bool expand_locals)
1214 Token *t;
1215 char *line, *p;
1216 const char *q;
1217 int len = 0;
1219 list_for_each(t, tlist) {
1220 if (t->type == TOK_PREPROC_ID && t->text[1] == '!') {
1221 char *v;
1222 char *q = t->text;
1224 v = t->text + 2;
1225 if (*v == '\'' || *v == '\"' || *v == '`') {
1226 size_t len = nasm_unquote(v, NULL);
1227 size_t clen = strlen(v);
1229 if (len != clen) {
1230 error(ERR_NONFATAL | ERR_PASS1,
1231 "NUL character in %! string");
1232 v = NULL;
1236 if (v) {
1237 char *p = getenv(v);
1238 if (!p) {
1239 error(ERR_NONFATAL | ERR_PASS1,
1240 "nonexistent environment variable `%s'", v);
1241 p = "";
1243 t->text = nasm_strdup(p);
1245 nasm_free(q);
1248 /* Expand local macros here and not during preprocessing */
1249 if (expand_locals &&
1250 t->type == TOK_PREPROC_ID && t->text &&
1251 t->text[0] == '%' && t->text[1] == '$') {
1252 const char *q;
1253 char *p;
1254 Context *ctx = get_ctx(t->text, &q, false);
1255 if (ctx) {
1256 char buffer[40];
1257 snprintf(buffer, sizeof(buffer), "..@%"PRIu32".", ctx->number);
1258 p = nasm_strcat(buffer, q);
1259 nasm_free(t->text);
1260 t->text = p;
1263 if (t->type == TOK_WHITESPACE)
1264 len++;
1265 else if (t->text)
1266 len += strlen(t->text);
1269 p = line = nasm_malloc(len + 1);
1271 list_for_each(t, tlist) {
1272 if (t->type == TOK_WHITESPACE) {
1273 *p++ = ' ';
1274 } else if (t->text) {
1275 q = t->text;
1276 while (*q)
1277 *p++ = *q++;
1280 *p = '\0';
1282 return line;
1286 * A scanner, suitable for use by the expression evaluator, which
1287 * operates on a line of Tokens. Expects a pointer to a pointer to
1288 * the first token in the line to be passed in as its private_data
1289 * field.
1291 * FIX: This really needs to be unified with stdscan.
1293 static int ppscan(void *private_data, struct tokenval *tokval)
1295 Token **tlineptr = private_data;
1296 Token *tline;
1297 char ourcopy[MAX_KEYWORD+1], *p, *r, *s;
1299 do {
1300 tline = *tlineptr;
1301 *tlineptr = tline ? tline->next : NULL;
1302 } while (tline && (tline->type == TOK_WHITESPACE ||
1303 tline->type == TOK_COMMENT));
1305 if (!tline)
1306 return tokval->t_type = TOKEN_EOS;
1308 tokval->t_charptr = tline->text;
1310 if (tline->text[0] == '$' && !tline->text[1])
1311 return tokval->t_type = TOKEN_HERE;
1312 if (tline->text[0] == '$' && tline->text[1] == '$' && !tline->text[2])
1313 return tokval->t_type = TOKEN_BASE;
1315 if (tline->type == TOK_ID) {
1316 p = tokval->t_charptr = tline->text;
1317 if (p[0] == '$') {
1318 tokval->t_charptr++;
1319 return tokval->t_type = TOKEN_ID;
1322 for (r = p, s = ourcopy; *r; r++) {
1323 if (r >= p+MAX_KEYWORD)
1324 return tokval->t_type = TOKEN_ID; /* Not a keyword */
1325 *s++ = nasm_tolower(*r);
1327 *s = '\0';
1328 /* right, so we have an identifier sitting in temp storage. now,
1329 * is it actually a register or instruction name, or what? */
1330 return nasm_token_hash(ourcopy, tokval);
1333 if (tline->type == TOK_NUMBER) {
1334 bool rn_error;
1335 tokval->t_integer = readnum(tline->text, &rn_error);
1336 tokval->t_charptr = tline->text;
1337 if (rn_error)
1338 return tokval->t_type = TOKEN_ERRNUM;
1339 else
1340 return tokval->t_type = TOKEN_NUM;
1343 if (tline->type == TOK_FLOAT) {
1344 return tokval->t_type = TOKEN_FLOAT;
1347 if (tline->type == TOK_STRING) {
1348 char bq, *ep;
1350 bq = tline->text[0];
1351 tokval->t_charptr = tline->text;
1352 tokval->t_inttwo = nasm_unquote(tline->text, &ep);
1354 if (ep[0] != bq || ep[1] != '\0')
1355 return tokval->t_type = TOKEN_ERRSTR;
1356 else
1357 return tokval->t_type = TOKEN_STR;
1360 if (tline->type == TOK_OTHER) {
1361 if (!strcmp(tline->text, "<<"))
1362 return tokval->t_type = TOKEN_SHL;
1363 if (!strcmp(tline->text, ">>"))
1364 return tokval->t_type = TOKEN_SHR;
1365 if (!strcmp(tline->text, "//"))
1366 return tokval->t_type = TOKEN_SDIV;
1367 if (!strcmp(tline->text, "%%"))
1368 return tokval->t_type = TOKEN_SMOD;
1369 if (!strcmp(tline->text, "=="))
1370 return tokval->t_type = TOKEN_EQ;
1371 if (!strcmp(tline->text, "<>"))
1372 return tokval->t_type = TOKEN_NE;
1373 if (!strcmp(tline->text, "!="))
1374 return tokval->t_type = TOKEN_NE;
1375 if (!strcmp(tline->text, "<="))
1376 return tokval->t_type = TOKEN_LE;
1377 if (!strcmp(tline->text, ">="))
1378 return tokval->t_type = TOKEN_GE;
1379 if (!strcmp(tline->text, "&&"))
1380 return tokval->t_type = TOKEN_DBL_AND;
1381 if (!strcmp(tline->text, "^^"))
1382 return tokval->t_type = TOKEN_DBL_XOR;
1383 if (!strcmp(tline->text, "||"))
1384 return tokval->t_type = TOKEN_DBL_OR;
1388 * We have no other options: just return the first character of
1389 * the token text.
1391 return tokval->t_type = tline->text[0];
/*
 * Compare string `p' with macro name `q'.  The comparison is done
 * by strcmp() when `casesense' is set and by nasm_stricmp() when it
 * is not; the chosen routine's result is returned unchanged.
 */
static int mstrcmp(const char *p, const char *q, bool casesense)
{
    if (casesense)
        return strcmp(p, q);

    return nasm_stricmp(p, q);
}
/*
 * Compare the first `l' bytes of `p' and `q'.  The comparison is
 * done by memcmp() when `casesense' is set and by nasm_memicmp()
 * when it is not; the chosen routine's result is returned unchanged.
 */
static int mmemcmp(const char *p, const char *q, size_t l, bool casesense)
{
    if (casesense)
        return memcmp(p, q, l);

    return nasm_memicmp(p, q, l);
}
1415 * Return the Context structure associated with a %$ token. Return
1416 * NULL, having _already_ reported an error condition, if the
1417 * context stack isn't deep enough for the supplied number of $
1418 * signs.
1419 * If all_contexts == true, contexts that enclose current are
1420 * also scanned for such smacro, until it is found; if not -
1421 * only the context that directly results from the number of $'s
1422 * in variable's name.
1424 * If "namep" is non-NULL, set it to the pointer to the macro name
1425 * tail, i.e. the part beyond %$...
1427 static Context *get_ctx(const char *name, const char **namep,
1428 bool all_contexts)
1430 Context *ctx;
1431 SMacro *m;
1432 int i;
1434 if (namep)
1435 *namep = name;
1437 if (!name || name[0] != '%' || name[1] != '$')
1438 return NULL;
1440 if (!cstk) {
1441 error(ERR_NONFATAL, "`%s': context stack is empty", name);
1442 return NULL;
1445 name += 2;
1446 ctx = cstk;
1447 i = 0;
1448 while (ctx && *name == '$') {
1449 name++;
1450 i++;
1451 ctx = ctx->next;
1453 if (!ctx) {
1454 error(ERR_NONFATAL, "`%s': context stack is only"
1455 " %d level%s deep", name, i, (i == 1 ? "" : "s"));
1456 return NULL;
1459 if (namep)
1460 *namep = name;
1462 if (!all_contexts)
1463 return ctx;
1466 * NOTE: In 2.10 we will not need lookup in extarnal
1467 * contexts, so this is a gentle way to inform users
1468 * about their source code need to be updated
1471 /* first round -- check the current context */
1472 m = hash_findix(&ctx->localmac, name);
1473 while (m) {
1474 if (!mstrcmp(m->name, name, m->casesense))
1475 return ctx;
1476 m = m->next;
1479 /* second round - external contexts */
1480 while ((ctx = ctx->next)) {
1481 /* Search for this smacro in found context */
1482 m = hash_findix(&ctx->localmac, name);
1483 while (m) {
1484 if (!mstrcmp(m->name, name, m->casesense)) {
1485 /* NOTE: deprecated as of 2.10 */
1486 static int once = 0;
1487 if (!once) {
1488 error(ERR_WARNING, "context-local macro expansion"
1489 " fall-through (automatic searching of outer"
1490 " contexts) will be deprecated starting in"
1491 " NASM 2.10, please see the NASM Manual for"
1492 " more information");
1493 once = 1;
1495 error(ERR_WARNING, "`%s': context-local macro expansion fall-through", name);
1496 return ctx;
1498 m = m->next;
1502 return NULL;
1506 * Check to see if a file is already in a string list
1508 static bool in_list(const StrList *list, const char *str)
1510 while (list) {
1511 if (!strcmp(list->str, str))
1512 return true;
1513 list = list->next;
1515 return false;
1519 * Open an include file. This routine must always return a valid
1520 * file pointer if it returns - it's responsible for throwing an
1521 * ERR_FATAL and bombing out completely if not. It should also try
1522 * the include path one by one until it finds the file or reaches
1523 * the end of the path.
1525 static FILE *inc_fopen(const char *file, StrList **dhead, StrList ***dtail,
1526 bool missing_ok)
1528 FILE *fp;
1529 char *prefix = "";
1530 IncPath *ip = ipath;
1531 int len = strlen(file);
1532 size_t prefix_len = 0;
1533 StrList *sl;
1535 while (1) {
1536 sl = nasm_malloc(prefix_len+len+1+sizeof sl->next);
1537 memcpy(sl->str, prefix, prefix_len);
1538 memcpy(sl->str+prefix_len, file, len+1);
1539 fp = fopen(sl->str, "r");
1540 if (fp && dhead && !in_list(*dhead, sl->str)) {
1541 sl->next = NULL;
1542 **dtail = sl;
1543 *dtail = &sl->next;
1544 } else {
1545 nasm_free(sl);
1547 if (fp)
1548 return fp;
1549 if (!ip) {
1550 if (!missing_ok)
1551 break;
1552 prefix = NULL;
1553 } else {
1554 prefix = ip->path;
1555 ip = ip->next;
1557 if (prefix) {
1558 prefix_len = strlen(prefix);
1559 } else {
1560 /* -MG given and file not found */
1561 if (dhead && !in_list(*dhead, file)) {
1562 sl = nasm_malloc(len+1+sizeof sl->next);
1563 sl->next = NULL;
1564 strcpy(sl->str, file);
1565 **dtail = sl;
1566 *dtail = &sl->next;
1568 return NULL;
1572 error(ERR_FATAL, "unable to open include file `%s'", file);
1573 return NULL;
1577 * Determine if we should warn on defining a single-line macro of
1578 * name `name', with `nparam' parameters. If nparam is 0 or -1, will
1579 * return true if _any_ single-line macro of that name is defined.
1580 * Otherwise, will return true if a single-line macro with either
1581 * `nparam' or no parameters is defined.
1583 * If a macro with precisely the right number of parameters is
1584 * defined, or nparam is -1, the address of the definition structure
1585 * will be returned in `defn'; otherwise NULL will be returned. If `defn'
1586 * is NULL, no action will be taken regarding its contents, and no
1587 * error will occur.
1589 * Note that this is also called with nparam zero to resolve
1590 * `ifdef'.
1592 * If you already know which context macro belongs to, you can pass
1593 * the context pointer as first parameter; if you won't but name begins
1594 * with %$ the context will be automatically computed. If all_contexts
1595 * is true, macro will be searched in outer contexts as well.
1597 static bool
1598 smacro_defined(Context * ctx, const char *name, int nparam, SMacro ** defn,
1599 bool nocase)
1601 struct hash_table *smtbl;
1602 SMacro *m;
1604 if (ctx) {
1605 smtbl = &ctx->localmac;
1606 } else if (name[0] == '%' && name[1] == '$') {
1607 if (cstk)
1608 ctx = get_ctx(name, &name, false);
1609 if (!ctx)
1610 return false; /* got to return _something_ */
1611 smtbl = &ctx->localmac;
1612 } else {
1613 smtbl = &smacros;
1615 m = (SMacro *) hash_findix(smtbl, name);
1617 while (m) {
1618 if (!mstrcmp(m->name, name, m->casesense && nocase) &&
1619 (nparam <= 0 || m->nparam == 0 || nparam == (int) m->nparam)) {
1620 if (defn) {
1621 if (nparam == (int) m->nparam || nparam == -1)
1622 *defn = m;
1623 else
1624 *defn = NULL;
1626 return true;
1628 m = m->next;
1631 return false;
1635 * Count and mark off the parameters in a multi-line macro call.
1636 * This is called both from within the multi-line macro expansion
1637 * code, and also to mark off the default parameters when provided
1638 * in a %macro definition line.
1640 static void count_mmac_params(Token * t, int *nparam, Token *** params)
1642 int paramsize, brace;
1644 *nparam = paramsize = 0;
1645 *params = NULL;
1646 while (t) {
1647 /* +1: we need space for the final NULL */
1648 if (*nparam+1 >= paramsize) {
1649 paramsize += PARAM_DELTA;
1650 *params = nasm_realloc(*params, sizeof(**params) * paramsize);
1652 skip_white_(t);
1653 brace = false;
1654 if (tok_is_(t, "{"))
1655 brace = true;
1656 (*params)[(*nparam)++] = t;
1657 while (tok_isnt_(t, brace ? "}" : ","))
1658 t = t->next;
1659 if (t) { /* got a comma/brace */
1660 t = t->next;
1661 if (brace) {
1663 * Now we've found the closing brace, look further
1664 * for the comma.
1666 skip_white_(t);
1667 if (tok_isnt_(t, ",")) {
1668 error(ERR_NONFATAL,
1669 "braces do not enclose all of macro parameter");
1670 while (tok_isnt_(t, ","))
1671 t = t->next;
1673 if (t)
1674 t = t->next; /* eat the comma */
1681 * Determine whether one of the various `if' conditions is true or
1682 * not.
1684 * We must free the tline we get passed.
1686 static bool if_condition(Token * tline, enum preproc_token ct)
1688 enum pp_conditional i = PP_COND(ct);
1689 bool j;
1690 Token *t, *tt, **tptr, *origline;
1691 struct tokenval tokval;
1692 expr *evalresult;
1693 enum pp_token_type needtype;
1694 char *p;
1696 origline = tline;
1698 switch (i) {
1699 case PPC_IFCTX:
1700 j = false; /* have we matched yet? */
1701 while (true) {
1702 skip_white_(tline);
1703 if (!tline)
1704 break;
1705 if (tline->type != TOK_ID) {
1706 error(ERR_NONFATAL,
1707 "`%s' expects context identifiers", pp_directives[ct]);
1708 free_tlist(origline);
1709 return -1;
1711 if (cstk && cstk->name && !nasm_stricmp(tline->text, cstk->name))
1712 j = true;
1713 tline = tline->next;
1715 break;
1717 case PPC_IFDEF:
1718 j = false; /* have we matched yet? */
1719 while (tline) {
1720 skip_white_(tline);
1721 if (!tline || (tline->type != TOK_ID &&
1722 (tline->type != TOK_PREPROC_ID ||
1723 tline->text[1] != '$'))) {
1724 error(ERR_NONFATAL,
1725 "`%s' expects macro identifiers", pp_directives[ct]);
1726 goto fail;
1728 if (smacro_defined(NULL, tline->text, 0, NULL, true))
1729 j = true;
1730 tline = tline->next;
1732 break;
1734 case PPC_IFENV:
1735 tline = expand_smacro(tline);
1736 j = false; /* have we matched yet? */
1737 while (tline) {
1738 skip_white_(tline);
1739 if (!tline || (tline->type != TOK_ID &&
1740 tline->type != TOK_STRING &&
1741 (tline->type != TOK_PREPROC_ID ||
1742 tline->text[1] != '!'))) {
1743 error(ERR_NONFATAL,
1744 "`%s' expects environment variable names",
1745 pp_directives[ct]);
1746 goto fail;
1748 p = tline->text;
1749 if (tline->type == TOK_PREPROC_ID)
1750 p += 2; /* Skip leading %! */
1751 if (*p == '\'' || *p == '\"' || *p == '`')
1752 nasm_unquote_cstr(p, ct);
1753 if (getenv(p))
1754 j = true;
1755 tline = tline->next;
1757 break;
1759 case PPC_IFIDN:
1760 case PPC_IFIDNI:
1761 tline = expand_smacro(tline);
1762 t = tt = tline;
1763 while (tok_isnt_(tt, ","))
1764 tt = tt->next;
1765 if (!tt) {
1766 error(ERR_NONFATAL,
1767 "`%s' expects two comma-separated arguments",
1768 pp_directives[ct]);
1769 goto fail;
1771 tt = tt->next;
1772 j = true; /* assume equality unless proved not */
1773 while ((t->type != TOK_OTHER || strcmp(t->text, ",")) && tt) {
1774 if (tt->type == TOK_OTHER && !strcmp(tt->text, ",")) {
1775 error(ERR_NONFATAL, "`%s': more than one comma on line",
1776 pp_directives[ct]);
1777 goto fail;
1779 if (t->type == TOK_WHITESPACE) {
1780 t = t->next;
1781 continue;
1783 if (tt->type == TOK_WHITESPACE) {
1784 tt = tt->next;
1785 continue;
1787 if (tt->type != t->type) {
1788 j = false; /* found mismatching tokens */
1789 break;
1791 /* When comparing strings, need to unquote them first */
1792 if (t->type == TOK_STRING) {
1793 size_t l1 = nasm_unquote(t->text, NULL);
1794 size_t l2 = nasm_unquote(tt->text, NULL);
1796 if (l1 != l2) {
1797 j = false;
1798 break;
1800 if (mmemcmp(t->text, tt->text, l1, i == PPC_IFIDN)) {
1801 j = false;
1802 break;
1804 } else if (mstrcmp(tt->text, t->text, i == PPC_IFIDN) != 0) {
1805 j = false; /* found mismatching tokens */
1806 break;
1809 t = t->next;
1810 tt = tt->next;
1812 if ((t->type != TOK_OTHER || strcmp(t->text, ",")) || tt)
1813 j = false; /* trailing gunk on one end or other */
1814 break;
1816 case PPC_IFMACRO:
1818 bool found = false;
1819 MMacro searching, *mmac;
1821 skip_white_(tline);
1822 tline = expand_id(tline);
1823 if (!tok_type_(tline, TOK_ID)) {
1824 error(ERR_NONFATAL,
1825 "`%s' expects a macro name", pp_directives[ct]);
1826 goto fail;
1828 searching.name = nasm_strdup(tline->text);
1829 searching.casesense = true;
1830 searching.plus = false;
1831 searching.nolist = false;
1832 searching.in_progress = 0;
1833 searching.max_depth = 0;
1834 searching.rep_nest = NULL;
1835 searching.nparam_min = 0;
1836 searching.nparam_max = INT_MAX;
1837 tline = expand_smacro(tline->next);
1838 skip_white_(tline);
1839 if (!tline) {
1840 } else if (!tok_type_(tline, TOK_NUMBER)) {
1841 error(ERR_NONFATAL,
1842 "`%s' expects a parameter count or nothing",
1843 pp_directives[ct]);
1844 } else {
1845 searching.nparam_min = searching.nparam_max =
1846 readnum(tline->text, &j);
1847 if (j)
1848 error(ERR_NONFATAL,
1849 "unable to parse parameter count `%s'",
1850 tline->text);
1852 if (tline && tok_is_(tline->next, "-")) {
1853 tline = tline->next->next;
1854 if (tok_is_(tline, "*"))
1855 searching.nparam_max = INT_MAX;
1856 else if (!tok_type_(tline, TOK_NUMBER))
1857 error(ERR_NONFATAL,
1858 "`%s' expects a parameter count after `-'",
1859 pp_directives[ct]);
1860 else {
1861 searching.nparam_max = readnum(tline->text, &j);
1862 if (j)
1863 error(ERR_NONFATAL,
1864 "unable to parse parameter count `%s'",
1865 tline->text);
1866 if (searching.nparam_min > searching.nparam_max)
1867 error(ERR_NONFATAL,
1868 "minimum parameter count exceeds maximum");
1871 if (tline && tok_is_(tline->next, "+")) {
1872 tline = tline->next;
1873 searching.plus = true;
1875 mmac = (MMacro *) hash_findix(&mmacros, searching.name);
1876 while (mmac) {
1877 if (!strcmp(mmac->name, searching.name) &&
1878 (mmac->nparam_min <= searching.nparam_max
1879 || searching.plus)
1880 && (searching.nparam_min <= mmac->nparam_max
1881 || mmac->plus)) {
1882 found = true;
1883 break;
1885 mmac = mmac->next;
1887 if (tline && tline->next)
1888 error(ERR_WARNING|ERR_PASS1,
1889 "trailing garbage after %%ifmacro ignored");
1890 nasm_free(searching.name);
1891 j = found;
1892 break;
1895 case PPC_IFID:
1896 needtype = TOK_ID;
1897 goto iftype;
1898 case PPC_IFNUM:
1899 needtype = TOK_NUMBER;
1900 goto iftype;
1901 case PPC_IFSTR:
1902 needtype = TOK_STRING;
1903 goto iftype;
1905 iftype:
1906 t = tline = expand_smacro(tline);
1908 while (tok_type_(t, TOK_WHITESPACE) ||
1909 (needtype == TOK_NUMBER &&
1910 tok_type_(t, TOK_OTHER) &&
1911 (t->text[0] == '-' || t->text[0] == '+') &&
1912 !t->text[1]))
1913 t = t->next;
1915 j = tok_type_(t, needtype);
1916 break;
1918 case PPC_IFTOKEN:
1919 t = tline = expand_smacro(tline);
1920 while (tok_type_(t, TOK_WHITESPACE))
1921 t = t->next;
1923 j = false;
1924 if (t) {
1925 t = t->next; /* Skip the actual token */
1926 while (tok_type_(t, TOK_WHITESPACE))
1927 t = t->next;
1928 j = !t; /* Should be nothing left */
1930 break;
1932 case PPC_IFEMPTY:
1933 t = tline = expand_smacro(tline);
1934 while (tok_type_(t, TOK_WHITESPACE))
1935 t = t->next;
1937 j = !t; /* Should be empty */
1938 break;
1940 case PPC_IF:
1941 t = tline = expand_smacro(tline);
1942 tptr = &t;
1943 tokval.t_type = TOKEN_INVALID;
1944 evalresult = evaluate(ppscan, tptr, &tokval,
1945 NULL, pass | CRITICAL, error, NULL);
1946 if (!evalresult)
1947 return -1;
1948 if (tokval.t_type)
1949 error(ERR_WARNING|ERR_PASS1,
1950 "trailing garbage after expression ignored");
1951 if (!is_simple(evalresult)) {
1952 error(ERR_NONFATAL,
1953 "non-constant value given to `%s'", pp_directives[ct]);
1954 goto fail;
1956 j = reloc_value(evalresult) != 0;
1957 break;
1959 default:
1960 error(ERR_FATAL,
1961 "preprocessor directive `%s' not yet implemented",
1962 pp_directives[ct]);
1963 goto fail;
1966 free_tlist(origline);
1967 return j ^ PP_NEGATIVE(ct);
1969 fail:
1970 free_tlist(origline);
1971 return -1;
1975 * Common code for defining an smacro
1977 static bool define_smacro(Context *ctx, const char *mname, bool casesense,
1978 int nparam, Token *expansion)
1980 SMacro *smac, **smhead;
1981 struct hash_table *smtbl;
1983 if (smacro_defined(ctx, mname, nparam, &smac, casesense)) {
1984 if (!smac) {
1985 error(ERR_WARNING|ERR_PASS1,
1986 "single-line macro `%s' defined both with and"
1987 " without parameters", mname);
1989 * Some instances of the old code considered this a failure,
1990 * some others didn't. What is the right thing to do here?
1992 free_tlist(expansion);
1993 return false; /* Failure */
1994 } else {
1996 * We're redefining, so we have to take over an
1997 * existing SMacro structure. This means freeing
1998 * what was already in it.
2000 nasm_free(smac->name);
2001 free_tlist(smac->expansion);
2003 } else {
2004 smtbl = ctx ? &ctx->localmac : &smacros;
2005 smhead = (SMacro **) hash_findi_add(smtbl, mname);
2006 smac = nasm_malloc(sizeof(SMacro));
2007 smac->next = *smhead;
2008 *smhead = smac;
2010 smac->name = nasm_strdup(mname);
2011 smac->casesense = casesense;
2012 smac->nparam = nparam;
2013 smac->expansion = expansion;
2014 smac->in_progress = false;
2015 return true; /* Success */
2019 * Undefine an smacro
2021 static void undef_smacro(Context *ctx, const char *mname)
2023 SMacro **smhead, *s, **sp;
2024 struct hash_table *smtbl;
2026 smtbl = ctx ? &ctx->localmac : &smacros;
2027 smhead = (SMacro **)hash_findi(smtbl, mname, NULL);
2029 if (smhead) {
2031 * We now have a macro name... go hunt for it.
2033 sp = smhead;
2034 while ((s = *sp) != NULL) {
2035 if (!mstrcmp(s->name, mname, s->casesense)) {
2036 *sp = s->next;
2037 nasm_free(s->name);
2038 free_tlist(s->expansion);
2039 nasm_free(s);
2040 } else {
2041 sp = &s->next;
2048 * Parse a mmacro specification.
2050 static bool parse_mmacro_spec(Token *tline, MMacro *def, const char *directive)
2052 bool err;
2054 tline = tline->next;
2055 skip_white_(tline);
2056 tline = expand_id(tline);
2057 if (!tok_type_(tline, TOK_ID)) {
2058 error(ERR_NONFATAL, "`%s' expects a macro name", directive);
2059 return false;
2062 def->prev = NULL;
2063 def->name = nasm_strdup(tline->text);
2064 def->plus = false;
2065 def->nolist = false;
2066 def->in_progress = 0;
2067 def->rep_nest = NULL;
2068 def->nparam_min = 0;
2069 def->nparam_max = 0;
2071 tline = expand_smacro(tline->next);
2072 skip_white_(tline);
2073 if (!tok_type_(tline, TOK_NUMBER)) {
2074 error(ERR_NONFATAL, "`%s' expects a parameter count", directive);
2075 } else {
2076 def->nparam_min = def->nparam_max =
2077 readnum(tline->text, &err);
2078 if (err)
2079 error(ERR_NONFATAL,
2080 "unable to parse parameter count `%s'", tline->text);
2082 if (tline && tok_is_(tline->next, "-")) {
2083 tline = tline->next->next;
2084 if (tok_is_(tline, "*")) {
2085 def->nparam_max = INT_MAX;
2086 } else if (!tok_type_(tline, TOK_NUMBER)) {
2087 error(ERR_NONFATAL,
2088 "`%s' expects a parameter count after `-'", directive);
2089 } else {
2090 def->nparam_max = readnum(tline->text, &err);
2091 if (err) {
2092 error(ERR_NONFATAL, "unable to parse parameter count `%s'",
2093 tline->text);
2095 if (def->nparam_min > def->nparam_max) {
2096 error(ERR_NONFATAL, "minimum parameter count exceeds maximum");
2100 if (tline && tok_is_(tline->next, "+")) {
2101 tline = tline->next;
2102 def->plus = true;
2104 if (tline && tok_type_(tline->next, TOK_ID) &&
2105 !nasm_stricmp(tline->next->text, ".nolist")) {
2106 tline = tline->next;
2107 def->nolist = true;
2111 * Handle default parameters.
2113 if (tline && tline->next) {
2114 def->dlist = tline->next;
2115 tline->next = NULL;
2116 count_mmac_params(def->dlist, &def->ndefs, &def->defaults);
2117 } else {
2118 def->dlist = NULL;
2119 def->defaults = NULL;
2121 def->expansion = NULL;
2123 if (def->defaults && def->ndefs > def->nparam_max - def->nparam_min &&
2124 !def->plus)
2125 error(ERR_WARNING|ERR_PASS1|ERR_WARN_MDP,
2126 "too many default macro parameters");
2128 return true;
/*
 * Decode a size directive: map a size keyword (byte, word, dword,
 * qword, tword, oword, yword) to its size in bytes.
 *
 * size_names is kept in sorted order for the bsii() lookup, and
 * sizes[] is shifted by one entry relative to it, so the lookup
 * result plus one selects the size.  Presumably bsii() yields -1
 * for an unknown keyword, which selects the leading 0 -- callers
 * treat a zero result as "invalid size".
 */
static int parse_size(const char *str) {
    static const char *size_names[] =
        { "byte", "dword", "oword", "qword", "tword", "word", "yword" };
    static const int sizes[] =
        { 0, 1, 4, 16, 8, 10, 2, 32 };
    int idx;

    idx = bsii(str, size_names, ARRAY_SIZE(size_names));

    return sizes[idx + 1];
}
2145 * find and process preprocessor directive in passed line
2146 * Find out if a line contains a preprocessor directive, and deal
2147 * with it if so.
2149 * If a directive _is_ found, it is the responsibility of this routine
2150 * (and not the caller) to free_tlist() the line.
2152 * @param tline a pointer to the current tokenized line linked list
2153 * @return DIRECTIVE_FOUND or NO_DIRECTIVE_FOUND
2156 static int do_directive(Token * tline)
2158 enum preproc_token i;
2159 int j;
2160 bool err;
2161 int nparam;
2162 bool nolist;
2163 bool casesense;
2164 int k, m;
2165 int offset;
2166 char *p, *pp;
2167 const char *mname;
2168 Include *inc;
2169 Context *ctx;
2170 Cond *cond;
2171 MMacro *mmac, **mmhead;
2172 Token *t, *tt, *param_start, *macro_start, *last, **tptr, *origline;
2173 Line *l;
2174 struct tokenval tokval;
2175 expr *evalresult;
2176 MMacro *tmp_defining; /* Used when manipulating rep_nest */
2177 int64_t count;
2178 size_t len;
2179 int severity;
2181 origline = tline;
2183 skip_white_(tline);
2184 if (!tline || !tok_type_(tline, TOK_PREPROC_ID) ||
2185 (tline->text[1] == '%' || tline->text[1] == '$'
2186 || tline->text[1] == '!'))
2187 return NO_DIRECTIVE_FOUND;
2189 i = pp_token_hash(tline->text);
2192 * FIXME: We zap execution of PP_RMACRO, PP_IRMACRO, PP_EXITMACRO
2193 * since they are known to be buggy at moment, we need to fix them
2194 * in future release (2.09-2.10)
2196 if (i == PP_RMACRO || i == PP_RMACRO || i == PP_EXITMACRO) {
2197 error(ERR_NONFATAL, "unknown preprocessor directive `%s'",
2198 tline->text);
2199 return NO_DIRECTIVE_FOUND;
2203 * If we're in a non-emitting branch of a condition construct,
2204 * or walking to the end of an already terminated %rep block,
2205 * we should ignore all directives except for condition
2206 * directives.
2208 if (((istk->conds && !emitting(istk->conds->state)) ||
2209 (istk->mstk && !istk->mstk->in_progress)) && !is_condition(i)) {
2210 return NO_DIRECTIVE_FOUND;
2214 * If we're defining a macro or reading a %rep block, we should
2215 * ignore all directives except for %macro/%imacro (which nest),
2216 * %endm/%endmacro, and (only if we're in a %rep block) %endrep.
2217 * If we're in a %rep block, another %rep nests, so should be let through.
2219 if (defining && i != PP_MACRO && i != PP_IMACRO &&
2220 i != PP_RMACRO && i != PP_IRMACRO &&
2221 i != PP_ENDMACRO && i != PP_ENDM &&
2222 (defining->name || (i != PP_ENDREP && i != PP_REP))) {
2223 return NO_DIRECTIVE_FOUND;
2226 if (defining) {
2227 if (i == PP_MACRO || i == PP_IMACRO ||
2228 i == PP_RMACRO || i == PP_IRMACRO) {
2229 nested_mac_count++;
2230 return NO_DIRECTIVE_FOUND;
2231 } else if (nested_mac_count > 0) {
2232 if (i == PP_ENDMACRO) {
2233 nested_mac_count--;
2234 return NO_DIRECTIVE_FOUND;
2237 if (!defining->name) {
2238 if (i == PP_REP) {
2239 nested_rep_count++;
2240 return NO_DIRECTIVE_FOUND;
2241 } else if (nested_rep_count > 0) {
2242 if (i == PP_ENDREP) {
2243 nested_rep_count--;
2244 return NO_DIRECTIVE_FOUND;
2250 switch (i) {
2251 case PP_INVALID:
2252 error(ERR_NONFATAL, "unknown preprocessor directive `%s'",
2253 tline->text);
2254 return NO_DIRECTIVE_FOUND; /* didn't get it */
2256 case PP_STACKSIZE:
2257 /* Directive to tell NASM what the default stack size is. The
2258 * default is for a 16-bit stack, and this can be overriden with
2259 * %stacksize large.
2261 tline = tline->next;
2262 if (tline && tline->type == TOK_WHITESPACE)
2263 tline = tline->next;
2264 if (!tline || tline->type != TOK_ID) {
2265 error(ERR_NONFATAL, "`%%stacksize' missing size parameter");
2266 free_tlist(origline);
2267 return DIRECTIVE_FOUND;
2269 if (nasm_stricmp(tline->text, "flat") == 0) {
2270 /* All subsequent ARG directives are for a 32-bit stack */
2271 StackSize = 4;
2272 StackPointer = "ebp";
2273 ArgOffset = 8;
2274 LocalOffset = 0;
2275 } else if (nasm_stricmp(tline->text, "flat64") == 0) {
2276 /* All subsequent ARG directives are for a 64-bit stack */
2277 StackSize = 8;
2278 StackPointer = "rbp";
2279 ArgOffset = 16;
2280 LocalOffset = 0;
2281 } else if (nasm_stricmp(tline->text, "large") == 0) {
2282 /* All subsequent ARG directives are for a 16-bit stack,
2283 * far function call.
2285 StackSize = 2;
2286 StackPointer = "bp";
2287 ArgOffset = 4;
2288 LocalOffset = 0;
2289 } else if (nasm_stricmp(tline->text, "small") == 0) {
2290 /* All subsequent ARG directives are for a 16-bit stack,
2291 * far function call. We don't support near functions.
2293 StackSize = 2;
2294 StackPointer = "bp";
2295 ArgOffset = 6;
2296 LocalOffset = 0;
2297 } else {
2298 error(ERR_NONFATAL, "`%%stacksize' invalid size type");
2299 free_tlist(origline);
2300 return DIRECTIVE_FOUND;
2302 free_tlist(origline);
2303 return DIRECTIVE_FOUND;
2305 case PP_ARG:
2306 /* TASM like ARG directive to define arguments to functions, in
2307 * the following form:
2309 * ARG arg1:WORD, arg2:DWORD, arg4:QWORD
2311 offset = ArgOffset;
2312 do {
2313 char *arg, directive[256];
2314 int size = StackSize;
2316 /* Find the argument name */
2317 tline = tline->next;
2318 if (tline && tline->type == TOK_WHITESPACE)
2319 tline = tline->next;
2320 if (!tline || tline->type != TOK_ID) {
2321 error(ERR_NONFATAL, "`%%arg' missing argument parameter");
2322 free_tlist(origline);
2323 return DIRECTIVE_FOUND;
2325 arg = tline->text;
2327 /* Find the argument size type */
2328 tline = tline->next;
2329 if (!tline || tline->type != TOK_OTHER
2330 || tline->text[0] != ':') {
2331 error(ERR_NONFATAL,
2332 "Syntax error processing `%%arg' directive");
2333 free_tlist(origline);
2334 return DIRECTIVE_FOUND;
2336 tline = tline->next;
2337 if (!tline || tline->type != TOK_ID) {
2338 error(ERR_NONFATAL, "`%%arg' missing size type parameter");
2339 free_tlist(origline);
2340 return DIRECTIVE_FOUND;
2343 /* Allow macro expansion of type parameter */
2344 tt = tokenize(tline->text);
2345 tt = expand_smacro(tt);
2346 size = parse_size(tt->text);
2347 if (!size) {
2348 error(ERR_NONFATAL,
2349 "Invalid size type for `%%arg' missing directive");
2350 free_tlist(tt);
2351 free_tlist(origline);
2352 return DIRECTIVE_FOUND;
2354 free_tlist(tt);
2356 /* Round up to even stack slots */
2357 size = ALIGN(size, StackSize);
2359 /* Now define the macro for the argument */
2360 snprintf(directive, sizeof(directive), "%%define %s (%s+%d)",
2361 arg, StackPointer, offset);
2362 do_directive(tokenize(directive));
2363 offset += size;
2365 /* Move to the next argument in the list */
2366 tline = tline->next;
2367 if (tline && tline->type == TOK_WHITESPACE)
2368 tline = tline->next;
2369 } while (tline && tline->type == TOK_OTHER && tline->text[0] == ',');
2370 ArgOffset = offset;
2371 free_tlist(origline);
2372 return DIRECTIVE_FOUND;
2374 case PP_LOCAL:
2375 /* TASM like LOCAL directive to define local variables for a
2376 * function, in the following form:
2378 * LOCAL local1:WORD, local2:DWORD, local4:QWORD = LocalSize
2380 * The '= LocalSize' at the end is ignored by NASM, but is
2381 * required by TASM to define the local parameter size (and used
2382 * by the TASM macro package).
2384 offset = LocalOffset;
2385 do {
2386 char *local, directive[256];
2387 int size = StackSize;
2389 /* Find the argument name */
2390 tline = tline->next;
2391 if (tline && tline->type == TOK_WHITESPACE)
2392 tline = tline->next;
2393 if (!tline || tline->type != TOK_ID) {
2394 error(ERR_NONFATAL,
2395 "`%%local' missing argument parameter");
2396 free_tlist(origline);
2397 return DIRECTIVE_FOUND;
2399 local = tline->text;
2401 /* Find the argument size type */
2402 tline = tline->next;
2403 if (!tline || tline->type != TOK_OTHER
2404 || tline->text[0] != ':') {
2405 error(ERR_NONFATAL,
2406 "Syntax error processing `%%local' directive");
2407 free_tlist(origline);
2408 return DIRECTIVE_FOUND;
2410 tline = tline->next;
2411 if (!tline || tline->type != TOK_ID) {
2412 error(ERR_NONFATAL,
2413 "`%%local' missing size type parameter");
2414 free_tlist(origline);
2415 return DIRECTIVE_FOUND;
2418 /* Allow macro expansion of type parameter */
2419 tt = tokenize(tline->text);
2420 tt = expand_smacro(tt);
2421 size = parse_size(tt->text);
2422 if (!size) {
2423 error(ERR_NONFATAL,
2424 "Invalid size type for `%%local' missing directive");
2425 free_tlist(tt);
2426 free_tlist(origline);
2427 return DIRECTIVE_FOUND;
2429 free_tlist(tt);
2431 /* Round up to even stack slots */
2432 size = ALIGN(size, StackSize);
2434 offset += size; /* Negative offset, increment before */
2436 /* Now define the macro for the argument */
2437 snprintf(directive, sizeof(directive), "%%define %s (%s-%d)",
2438 local, StackPointer, offset);
2439 do_directive(tokenize(directive));
2441 /* Now define the assign to setup the enter_c macro correctly */
2442 snprintf(directive, sizeof(directive),
2443 "%%assign %%$localsize %%$localsize+%d", size);
2444 do_directive(tokenize(directive));
2446 /* Move to the next argument in the list */
2447 tline = tline->next;
2448 if (tline && tline->type == TOK_WHITESPACE)
2449 tline = tline->next;
2450 } while (tline && tline->type == TOK_OTHER && tline->text[0] == ',');
2451 LocalOffset = offset;
2452 free_tlist(origline);
2453 return DIRECTIVE_FOUND;
2455 case PP_CLEAR:
2456 if (tline->next)
2457 error(ERR_WARNING|ERR_PASS1,
2458 "trailing garbage after `%%clear' ignored");
2459 free_macros();
2460 init_macros();
2461 free_tlist(origline);
2462 return DIRECTIVE_FOUND;
2464 case PP_DEPEND:
2465 t = tline->next = expand_smacro(tline->next);
2466 skip_white_(t);
2467 if (!t || (t->type != TOK_STRING &&
2468 t->type != TOK_INTERNAL_STRING)) {
2469 error(ERR_NONFATAL, "`%%depend' expects a file name");
2470 free_tlist(origline);
2471 return DIRECTIVE_FOUND; /* but we did _something_ */
2473 if (t->next)
2474 error(ERR_WARNING|ERR_PASS1,
2475 "trailing garbage after `%%depend' ignored");
2476 p = t->text;
2477 if (t->type != TOK_INTERNAL_STRING)
2478 nasm_unquote_cstr(p, i);
2479 if (dephead && !in_list(*dephead, p)) {
2480 StrList *sl = nasm_malloc(strlen(p)+1+sizeof sl->next);
2481 sl->next = NULL;
2482 strcpy(sl->str, p);
2483 *deptail = sl;
2484 deptail = &sl->next;
2486 free_tlist(origline);
2487 return DIRECTIVE_FOUND;
2489 case PP_INCLUDE:
2490 t = tline->next = expand_smacro(tline->next);
2491 skip_white_(t);
2493 if (!t || (t->type != TOK_STRING &&
2494 t->type != TOK_INTERNAL_STRING)) {
2495 error(ERR_NONFATAL, "`%%include' expects a file name");
2496 free_tlist(origline);
2497 return DIRECTIVE_FOUND; /* but we did _something_ */
2499 if (t->next)
2500 error(ERR_WARNING|ERR_PASS1,
2501 "trailing garbage after `%%include' ignored");
2502 p = t->text;
2503 if (t->type != TOK_INTERNAL_STRING)
2504 nasm_unquote_cstr(p, i);
2505 inc = nasm_malloc(sizeof(Include));
2506 inc->next = istk;
2507 inc->conds = NULL;
2508 inc->fp = inc_fopen(p, dephead, &deptail, pass == 0);
2509 if (!inc->fp) {
2510 /* -MG given but file not found */
2511 nasm_free(inc);
2512 } else {
2513 inc->fname = src_set_fname(nasm_strdup(p));
2514 inc->lineno = src_set_linnum(0);
2515 inc->lineinc = 1;
2516 inc->expansion = NULL;
2517 inc->mstk = NULL;
2518 istk = inc;
2519 list->uplevel(LIST_INCLUDE);
2521 free_tlist(origline);
2522 return DIRECTIVE_FOUND;
2524 case PP_USE:
2526 static macros_t *use_pkg;
2527 const char *pkg_macro = NULL;
2529 tline = tline->next;
2530 skip_white_(tline);
2531 tline = expand_id(tline);
2533 if (!tline || (tline->type != TOK_STRING &&
2534 tline->type != TOK_INTERNAL_STRING &&
2535 tline->type != TOK_ID)) {
2536 error(ERR_NONFATAL, "`%%use' expects a package name");
2537 free_tlist(origline);
2538 return DIRECTIVE_FOUND; /* but we did _something_ */
2540 if (tline->next)
2541 error(ERR_WARNING|ERR_PASS1,
2542 "trailing garbage after `%%use' ignored");
2543 if (tline->type == TOK_STRING)
2544 nasm_unquote_cstr(tline->text, i);
2545 use_pkg = nasm_stdmac_find_package(tline->text);
2546 if (!use_pkg)
2547 error(ERR_NONFATAL, "unknown `%%use' package: %s", tline->text);
2548 else
2549 pkg_macro = (char *)use_pkg + 1; /* The first string will be <%define>__USE_*__ */
2550 if (use_pkg && ! smacro_defined(NULL, pkg_macro, 0, NULL, true)) {
2551 /* Not already included, go ahead and include it */
2552 stdmacpos = use_pkg;
2554 free_tlist(origline);
2555 return DIRECTIVE_FOUND;
2557 case PP_PUSH:
2558 case PP_REPL:
2559 case PP_POP:
2560 tline = tline->next;
2561 skip_white_(tline);
2562 tline = expand_id(tline);
2563 if (tline) {
2564 if (!tok_type_(tline, TOK_ID)) {
2565 error(ERR_NONFATAL, "`%s' expects a context identifier",
2566 pp_directives[i]);
2567 free_tlist(origline);
2568 return DIRECTIVE_FOUND; /* but we did _something_ */
2570 if (tline->next)
2571 error(ERR_WARNING|ERR_PASS1,
2572 "trailing garbage after `%s' ignored",
2573 pp_directives[i]);
2574 p = nasm_strdup(tline->text);
2575 } else {
2576 p = NULL; /* Anonymous */
2579 if (i == PP_PUSH) {
2580 ctx = nasm_malloc(sizeof(Context));
2581 ctx->next = cstk;
2582 hash_init(&ctx->localmac, HASH_SMALL);
2583 ctx->name = p;
2584 ctx->number = unique++;
2585 cstk = ctx;
2586 } else {
2587 /* %pop or %repl */
2588 if (!cstk) {
2589 error(ERR_NONFATAL, "`%s': context stack is empty",
2590 pp_directives[i]);
2591 } else if (i == PP_POP) {
2592 if (p && (!cstk->name || nasm_stricmp(p, cstk->name)))
2593 error(ERR_NONFATAL, "`%%pop' in wrong context: %s, "
2594 "expected %s",
2595 cstk->name ? cstk->name : "anonymous", p);
2596 else
2597 ctx_pop();
2598 } else {
2599 /* i == PP_REPL */
2600 nasm_free(cstk->name);
2601 cstk->name = p;
2602 p = NULL;
2604 nasm_free(p);
2606 free_tlist(origline);
2607 return DIRECTIVE_FOUND;
2608 case PP_FATAL:
2609 severity = ERR_FATAL;
2610 goto issue_error;
2611 case PP_ERROR:
2612 severity = ERR_NONFATAL;
2613 goto issue_error;
2614 case PP_WARNING:
2615 severity = ERR_WARNING|ERR_WARN_USER;
2616 goto issue_error;
2618 issue_error:
2620 /* Only error out if this is the final pass */
2621 if (pass != 2 && i != PP_FATAL)
2622 return DIRECTIVE_FOUND;
2624 tline->next = expand_smacro(tline->next);
2625 tline = tline->next;
2626 skip_white_(tline);
2627 t = tline ? tline->next : NULL;
2628 skip_white_(t);
2629 if (tok_type_(tline, TOK_STRING) && !t) {
2630 /* The line contains only a quoted string */
2631 p = tline->text;
2632 nasm_unquote(p, NULL); /* Ignore NUL character truncation */
2633 error(severity, "%s", p);
2634 } else {
2635 /* Not a quoted string, or more than a quoted string */
2636 p = detoken(tline, false);
2637 error(severity, "%s", p);
2638 nasm_free(p);
2640 free_tlist(origline);
2641 return DIRECTIVE_FOUND;
2644 CASE_PP_IF:
2645 if (istk->conds && !emitting(istk->conds->state))
2646 j = COND_NEVER;
2647 else {
2648 j = if_condition(tline->next, i);
2649 tline->next = NULL; /* it got freed */
2650 j = j < 0 ? COND_NEVER : j ? COND_IF_TRUE : COND_IF_FALSE;
2652 cond = nasm_malloc(sizeof(Cond));
2653 cond->next = istk->conds;
2654 cond->state = j;
2655 istk->conds = cond;
2656 if(istk->mstk)
2657 istk->mstk->condcnt ++;
2658 free_tlist(origline);
2659 return DIRECTIVE_FOUND;
2661 CASE_PP_ELIF:
2662 if (!istk->conds)
2663 error(ERR_FATAL, "`%s': no matching `%%if'", pp_directives[i]);
2664 switch(istk->conds->state) {
2665 case COND_IF_TRUE:
2666 istk->conds->state = COND_DONE;
2667 break;
2669 case COND_DONE:
2670 case COND_NEVER:
2671 break;
2673 case COND_ELSE_TRUE:
2674 case COND_ELSE_FALSE:
2675 error_precond(ERR_WARNING|ERR_PASS1,
2676 "`%%elif' after `%%else' ignored");
2677 istk->conds->state = COND_NEVER;
2678 break;
2680 case COND_IF_FALSE:
2682 * IMPORTANT: In the case of %if, we will already have
2683 * called expand_mmac_params(); however, if we're
2684 * processing an %elif we must have been in a
2685 * non-emitting mode, which would have inhibited
2686 * the normal invocation of expand_mmac_params().
2687 * Therefore, we have to do it explicitly here.
2689 j = if_condition(expand_mmac_params(tline->next), i);
2690 tline->next = NULL; /* it got freed */
2691 istk->conds->state =
2692 j < 0 ? COND_NEVER : j ? COND_IF_TRUE : COND_IF_FALSE;
2693 break;
2695 free_tlist(origline);
2696 return DIRECTIVE_FOUND;
2698 case PP_ELSE:
2699 if (tline->next)
2700 error_precond(ERR_WARNING|ERR_PASS1,
2701 "trailing garbage after `%%else' ignored");
2702 if (!istk->conds)
2703 error(ERR_FATAL, "`%%else': no matching `%%if'");
2704 switch(istk->conds->state) {
2705 case COND_IF_TRUE:
2706 case COND_DONE:
2707 istk->conds->state = COND_ELSE_FALSE;
2708 break;
2710 case COND_NEVER:
2711 break;
2713 case COND_IF_FALSE:
2714 istk->conds->state = COND_ELSE_TRUE;
2715 break;
2717 case COND_ELSE_TRUE:
2718 case COND_ELSE_FALSE:
2719 error_precond(ERR_WARNING|ERR_PASS1,
2720 "`%%else' after `%%else' ignored.");
2721 istk->conds->state = COND_NEVER;
2722 break;
2724 free_tlist(origline);
2725 return DIRECTIVE_FOUND;
2727 case PP_ENDIF:
2728 if (tline->next)
2729 error_precond(ERR_WARNING|ERR_PASS1,
2730 "trailing garbage after `%%endif' ignored");
2731 if (!istk->conds)
2732 error(ERR_FATAL, "`%%endif': no matching `%%if'");
2733 cond = istk->conds;
2734 istk->conds = cond->next;
2735 nasm_free(cond);
2736 if(istk->mstk)
2737 istk->mstk->condcnt --;
2738 free_tlist(origline);
2739 return DIRECTIVE_FOUND;
2741 case PP_RMACRO:
2742 case PP_IRMACRO:
2743 case PP_MACRO:
2744 case PP_IMACRO:
2745 if (defining) {
2746 error(ERR_FATAL, "`%s': already defining a macro",
2747 pp_directives[i]);
2748 return DIRECTIVE_FOUND;
2750 defining = nasm_malloc(sizeof(MMacro));
2751 defining->max_depth =
2752 (i == PP_RMACRO) || (i == PP_IRMACRO) ? DEADMAN_LIMIT : 0;
2753 defining->casesense = (i == PP_MACRO) || (i == PP_RMACRO);
2754 if (!parse_mmacro_spec(tline, defining, pp_directives[i])) {
2755 nasm_free(defining);
2756 defining = NULL;
2757 return DIRECTIVE_FOUND;
2760 mmac = (MMacro *) hash_findix(&mmacros, defining->name);
2761 while (mmac) {
2762 if (!strcmp(mmac->name, defining->name) &&
2763 (mmac->nparam_min <= defining->nparam_max
2764 || defining->plus)
2765 && (defining->nparam_min <= mmac->nparam_max
2766 || mmac->plus)) {
2767 error(ERR_WARNING|ERR_PASS1,
2768 "redefining multi-line macro `%s'", defining->name);
2769 return DIRECTIVE_FOUND;
2771 mmac = mmac->next;
2773 free_tlist(origline);
2774 return DIRECTIVE_FOUND;
2776 case PP_ENDM:
2777 case PP_ENDMACRO:
2778 if (! (defining && defining->name)) {
2779 error(ERR_NONFATAL, "`%s': not defining a macro", tline->text);
2780 return DIRECTIVE_FOUND;
2782 mmhead = (MMacro **) hash_findi_add(&mmacros, defining->name);
2783 defining->next = *mmhead;
2784 *mmhead = defining;
2785 defining = NULL;
2786 free_tlist(origline);
2787 return DIRECTIVE_FOUND;
2789 case PP_EXITMACRO:
2791 * We must search along istk->expansion until we hit a
2792 * macro-end marker for a macro with a name. Then we
2793 * bypass all lines between exitmacro and endmacro.
2795 list_for_each(l, istk->expansion)
2796 if (l->finishes && l->finishes->name)
2797 break;
2799 if (l) {
2801 * Remove all conditional entries relative to this
2802 * macro invocation. (safe to do in this context)
2804 for ( ; l->finishes->condcnt > 0; l->finishes->condcnt --) {
2805 cond = istk->conds;
2806 istk->conds = cond->next;
2807 nasm_free(cond);
2809 istk->expansion = l;
2810 } else {
2811 error(ERR_NONFATAL, "`%%exitmacro' not within `%%macro' block");
2813 free_tlist(origline);
2814 return DIRECTIVE_FOUND;
2816 case PP_UNMACRO:
2817 case PP_UNIMACRO:
2819 MMacro **mmac_p;
2820 MMacro spec;
2822 spec.casesense = (i == PP_UNMACRO);
2823 if (!parse_mmacro_spec(tline, &spec, pp_directives[i])) {
2824 return DIRECTIVE_FOUND;
2826 mmac_p = (MMacro **) hash_findi(&mmacros, spec.name, NULL);
2827 while (mmac_p && *mmac_p) {
2828 mmac = *mmac_p;
2829 if (mmac->casesense == spec.casesense &&
2830 !mstrcmp(mmac->name, spec.name, spec.casesense) &&
2831 mmac->nparam_min == spec.nparam_min &&
2832 mmac->nparam_max == spec.nparam_max &&
2833 mmac->plus == spec.plus) {
2834 *mmac_p = mmac->next;
2835 free_mmacro(mmac);
2836 } else {
2837 mmac_p = &mmac->next;
2840 free_tlist(origline);
2841 free_tlist(spec.dlist);
2842 return DIRECTIVE_FOUND;
2845 case PP_ROTATE:
2846 if (tline->next && tline->next->type == TOK_WHITESPACE)
2847 tline = tline->next;
2848 if (!tline->next) {
2849 free_tlist(origline);
2850 error(ERR_NONFATAL, "`%%rotate' missing rotate count");
2851 return DIRECTIVE_FOUND;
2853 t = expand_smacro(tline->next);
2854 tline->next = NULL;
2855 free_tlist(origline);
2856 tline = t;
2857 tptr = &t;
2858 tokval.t_type = TOKEN_INVALID;
2859 evalresult =
2860 evaluate(ppscan, tptr, &tokval, NULL, pass, error, NULL);
2861 free_tlist(tline);
2862 if (!evalresult)
2863 return DIRECTIVE_FOUND;
2864 if (tokval.t_type)
2865 error(ERR_WARNING|ERR_PASS1,
2866 "trailing garbage after expression ignored");
2867 if (!is_simple(evalresult)) {
2868 error(ERR_NONFATAL, "non-constant value given to `%%rotate'");
2869 return DIRECTIVE_FOUND;
2871 mmac = istk->mstk;
2872 while (mmac && !mmac->name) /* avoid mistaking %reps for macros */
2873 mmac = mmac->next_active;
2874 if (!mmac) {
2875 error(ERR_NONFATAL, "`%%rotate' invoked outside a macro call");
2876 } else if (mmac->nparam == 0) {
2877 error(ERR_NONFATAL,
2878 "`%%rotate' invoked within macro without parameters");
2879 } else {
2880 int rotate = mmac->rotate + reloc_value(evalresult);
2882 rotate %= (int)mmac->nparam;
2883 if (rotate < 0)
2884 rotate += mmac->nparam;
2886 mmac->rotate = rotate;
2888 return DIRECTIVE_FOUND;
2890 case PP_REP:
2891 nolist = false;
2892 do {
2893 tline = tline->next;
2894 } while (tok_type_(tline, TOK_WHITESPACE));
2896 if (tok_type_(tline, TOK_ID) &&
2897 nasm_stricmp(tline->text, ".nolist") == 0) {
2898 nolist = true;
2899 do {
2900 tline = tline->next;
2901 } while (tok_type_(tline, TOK_WHITESPACE));
2904 if (tline) {
2905 t = expand_smacro(tline);
2906 tptr = &t;
2907 tokval.t_type = TOKEN_INVALID;
2908 evalresult =
2909 evaluate(ppscan, tptr, &tokval, NULL, pass, error, NULL);
2910 if (!evalresult) {
2911 free_tlist(origline);
2912 return DIRECTIVE_FOUND;
2914 if (tokval.t_type)
2915 error(ERR_WARNING|ERR_PASS1,
2916 "trailing garbage after expression ignored");
2917 if (!is_simple(evalresult)) {
2918 error(ERR_NONFATAL, "non-constant value given to `%%rep'");
2919 return DIRECTIVE_FOUND;
2921 count = reloc_value(evalresult);
2922 if (count >= REP_LIMIT) {
2923 error(ERR_NONFATAL, "`%%rep' value exceeds limit");
2924 count = 0;
2925 } else
2926 count++;
2927 } else {
2928 error(ERR_NONFATAL, "`%%rep' expects a repeat count");
2929 count = 0;
2931 free_tlist(origline);
2933 tmp_defining = defining;
2934 defining = nasm_malloc(sizeof(MMacro));
2935 defining->prev = NULL;
2936 defining->name = NULL; /* flags this macro as a %rep block */
2937 defining->casesense = false;
2938 defining->plus = false;
2939 defining->nolist = nolist;
2940 defining->in_progress = count;
2941 defining->max_depth = 0;
2942 defining->nparam_min = defining->nparam_max = 0;
2943 defining->defaults = NULL;
2944 defining->dlist = NULL;
2945 defining->expansion = NULL;
2946 defining->next_active = istk->mstk;
2947 defining->rep_nest = tmp_defining;
2948 return DIRECTIVE_FOUND;
2950 case PP_ENDREP:
2951 if (!defining || defining->name) {
2952 error(ERR_NONFATAL, "`%%endrep': no matching `%%rep'");
2953 return DIRECTIVE_FOUND;
2957 * Now we have a "macro" defined - although it has no name
2958 * and we won't be entering it in the hash tables - we must
2959 * push a macro-end marker for it on to istk->expansion.
2960 * After that, it will take care of propagating itself (a
2961 * macro-end marker line for a macro which is really a %rep
2962 * block will cause the macro to be re-expanded, complete
2963 * with another macro-end marker to ensure the process
2964 * continues) until the whole expansion is forcibly removed
2965 * from istk->expansion by a %exitrep.
2967 l = nasm_malloc(sizeof(Line));
2968 l->next = istk->expansion;
2969 l->finishes = defining;
2970 l->first = NULL;
2971 istk->expansion = l;
2973 istk->mstk = defining;
2975 list->uplevel(defining->nolist ? LIST_MACRO_NOLIST : LIST_MACRO);
2976 tmp_defining = defining;
2977 defining = defining->rep_nest;
2978 free_tlist(origline);
2979 return DIRECTIVE_FOUND;
2981 case PP_EXITREP:
2983 * We must search along istk->expansion until we hit a
2984 * macro-end marker for a macro with no name. Then we set
2985 * its `in_progress' flag to 0.
2987 list_for_each(l, istk->expansion)
2988 if (l->finishes && !l->finishes->name)
2989 break;
2991 if (l)
2992 l->finishes->in_progress = 1;
2993 else
2994 error(ERR_NONFATAL, "`%%exitrep' not within `%%rep' block");
2995 free_tlist(origline);
2996 return DIRECTIVE_FOUND;
2998 case PP_XDEFINE:
2999 case PP_IXDEFINE:
3000 case PP_DEFINE:
3001 case PP_IDEFINE:
3002 casesense = (i == PP_DEFINE || i == PP_XDEFINE);
3004 tline = tline->next;
3005 skip_white_(tline);
3006 tline = expand_id(tline);
3007 if (!tline || (tline->type != TOK_ID &&
3008 (tline->type != TOK_PREPROC_ID ||
3009 tline->text[1] != '$'))) {
3010 error(ERR_NONFATAL, "`%s' expects a macro identifier",
3011 pp_directives[i]);
3012 free_tlist(origline);
3013 return DIRECTIVE_FOUND;
3016 ctx = get_ctx(tline->text, &mname, false);
3017 last = tline;
3018 param_start = tline = tline->next;
3019 nparam = 0;
3021 /* Expand the macro definition now for %xdefine and %ixdefine */
3022 if ((i == PP_XDEFINE) || (i == PP_IXDEFINE))
3023 tline = expand_smacro(tline);
3025 if (tok_is_(tline, "(")) {
3027 * This macro has parameters.
3030 tline = tline->next;
3031 while (1) {
3032 skip_white_(tline);
3033 if (!tline) {
3034 error(ERR_NONFATAL, "parameter identifier expected");
3035 free_tlist(origline);
3036 return DIRECTIVE_FOUND;
3038 if (tline->type != TOK_ID) {
3039 error(ERR_NONFATAL,
3040 "`%s': parameter identifier expected",
3041 tline->text);
3042 free_tlist(origline);
3043 return DIRECTIVE_FOUND;
3045 tline->type = TOK_SMAC_PARAM + nparam++;
3046 tline = tline->next;
3047 skip_white_(tline);
3048 if (tok_is_(tline, ",")) {
3049 tline = tline->next;
3050 } else {
3051 if (!tok_is_(tline, ")")) {
3052 error(ERR_NONFATAL,
3053 "`)' expected to terminate macro template");
3054 free_tlist(origline);
3055 return DIRECTIVE_FOUND;
3057 break;
3060 last = tline;
3061 tline = tline->next;
3063 if (tok_type_(tline, TOK_WHITESPACE))
3064 last = tline, tline = tline->next;
3065 macro_start = NULL;
3066 last->next = NULL;
3067 t = tline;
3068 while (t) {
3069 if (t->type == TOK_ID) {
3070 list_for_each(tt, param_start)
3071 if (tt->type >= TOK_SMAC_PARAM &&
3072 !strcmp(tt->text, t->text))
3073 t->type = tt->type;
3075 tt = t->next;
3076 t->next = macro_start;
3077 macro_start = t;
3078 t = tt;
3081 * Good. We now have a macro name, a parameter count, and a
3082 * token list (in reverse order) for an expansion. We ought
3083 * to be OK just to create an SMacro, store it, and let
3084 * free_tlist have the rest of the line (which we have
3085 * carefully re-terminated after chopping off the expansion
3086 * from the end).
3088 define_smacro(ctx, mname, casesense, nparam, macro_start);
3089 free_tlist(origline);
3090 return DIRECTIVE_FOUND;
3092 case PP_UNDEF:
3093 tline = tline->next;
3094 skip_white_(tline);
3095 tline = expand_id(tline);
3096 if (!tline || (tline->type != TOK_ID &&
3097 (tline->type != TOK_PREPROC_ID ||
3098 tline->text[1] != '$'))) {
3099 error(ERR_NONFATAL, "`%%undef' expects a macro identifier");
3100 free_tlist(origline);
3101 return DIRECTIVE_FOUND;
3103 if (tline->next) {
3104 error(ERR_WARNING|ERR_PASS1,
3105 "trailing garbage after macro name ignored");
3108 /* Find the context that symbol belongs to */
3109 ctx = get_ctx(tline->text, &mname, false);
3110 undef_smacro(ctx, mname);
3111 free_tlist(origline);
3112 return DIRECTIVE_FOUND;
3114 case PP_DEFSTR:
3115 case PP_IDEFSTR:
3116 casesense = (i == PP_DEFSTR);
3118 tline = tline->next;
3119 skip_white_(tline);
3120 tline = expand_id(tline);
3121 if (!tline || (tline->type != TOK_ID &&
3122 (tline->type != TOK_PREPROC_ID ||
3123 tline->text[1] != '$'))) {
3124 error(ERR_NONFATAL, "`%s' expects a macro identifier",
3125 pp_directives[i]);
3126 free_tlist(origline);
3127 return DIRECTIVE_FOUND;
3130 ctx = get_ctx(tline->text, &mname, false);
3131 last = tline;
3132 tline = expand_smacro(tline->next);
3133 last->next = NULL;
3135 while (tok_type_(tline, TOK_WHITESPACE))
3136 tline = delete_Token(tline);
3138 p = detoken(tline, false);
3139 macro_start = nasm_malloc(sizeof(*macro_start));
3140 macro_start->next = NULL;
3141 macro_start->text = nasm_quote(p, strlen(p));
3142 macro_start->type = TOK_STRING;
3143 macro_start->a.mac = NULL;
3144 nasm_free(p);
3147 * We now have a macro name, an implicit parameter count of
3148 * zero, and a string token to use as an expansion. Create
3149 * and store an SMacro.
3151 define_smacro(ctx, mname, casesense, 0, macro_start);
3152 free_tlist(origline);
3153 return DIRECTIVE_FOUND;
3155 case PP_DEFTOK:
3156 case PP_IDEFTOK:
3157 casesense = (i == PP_DEFTOK);
3159 tline = tline->next;
3160 skip_white_(tline);
3161 tline = expand_id(tline);
3162 if (!tline || (tline->type != TOK_ID &&
3163 (tline->type != TOK_PREPROC_ID ||
3164 tline->text[1] != '$'))) {
3165 error(ERR_NONFATAL,
3166 "`%s' expects a macro identifier as first parameter",
3167 pp_directives[i]);
3168 free_tlist(origline);
3169 return DIRECTIVE_FOUND;
3171 ctx = get_ctx(tline->text, &mname, false);
3172 last = tline;
3173 tline = expand_smacro(tline->next);
3174 last->next = NULL;
3176 t = tline;
3177 while (tok_type_(t, TOK_WHITESPACE))
3178 t = t->next;
3179 /* t should now point to the string */
3180 if (!tok_type_(t, TOK_STRING)) {
3181 error(ERR_NONFATAL,
3182 "`%s` requires string as second parameter",
3183 pp_directives[i]);
3184 free_tlist(tline);
3185 free_tlist(origline);
3186 return DIRECTIVE_FOUND;
3189 nasm_unquote_cstr(t->text, i);
3190 macro_start = tokenize(t->text);
3193 * We now have a macro name, an implicit parameter count of
3194 * zero, and a numeric token to use as an expansion. Create
3195 * and store an SMacro.
3197 define_smacro(ctx, mname, casesense, 0, macro_start);
3198 free_tlist(tline);
3199 free_tlist(origline);
3200 return DIRECTIVE_FOUND;
3202 case PP_PATHSEARCH:
3204 FILE *fp;
3205 StrList *xsl = NULL;
3206 StrList **xst = &xsl;
3208 casesense = true;
3210 tline = tline->next;
3211 skip_white_(tline);
3212 tline = expand_id(tline);
3213 if (!tline || (tline->type != TOK_ID &&
3214 (tline->type != TOK_PREPROC_ID ||
3215 tline->text[1] != '$'))) {
3216 error(ERR_NONFATAL,
3217 "`%%pathsearch' expects a macro identifier as first parameter");
3218 free_tlist(origline);
3219 return DIRECTIVE_FOUND;
3221 ctx = get_ctx(tline->text, &mname, false);
3222 last = tline;
3223 tline = expand_smacro(tline->next);
3224 last->next = NULL;
3226 t = tline;
3227 while (tok_type_(t, TOK_WHITESPACE))
3228 t = t->next;
3230 if (!t || (t->type != TOK_STRING &&
3231 t->type != TOK_INTERNAL_STRING)) {
3232 error(ERR_NONFATAL, "`%%pathsearch' expects a file name");
3233 free_tlist(tline);
3234 free_tlist(origline);
3235 return DIRECTIVE_FOUND; /* but we did _something_ */
3237 if (t->next)
3238 error(ERR_WARNING|ERR_PASS1,
3239 "trailing garbage after `%%pathsearch' ignored");
3240 p = t->text;
3241 if (t->type != TOK_INTERNAL_STRING)
3242 nasm_unquote(p, NULL);
3244 fp = inc_fopen(p, &xsl, &xst, true);
3245 if (fp) {
3246 p = xsl->str;
3247 fclose(fp); /* Don't actually care about the file */
3249 macro_start = nasm_malloc(sizeof(*macro_start));
3250 macro_start->next = NULL;
3251 macro_start->text = nasm_quote(p, strlen(p));
3252 macro_start->type = TOK_STRING;
3253 macro_start->a.mac = NULL;
3254 if (xsl)
3255 nasm_free(xsl);
3258 * We now have a macro name, an implicit parameter count of
3259 * zero, and a string token to use as an expansion. Create
3260 * and store an SMacro.
3262 define_smacro(ctx, mname, casesense, 0, macro_start);
3263 free_tlist(tline);
3264 free_tlist(origline);
3265 return DIRECTIVE_FOUND;
3268 case PP_STRLEN:
3269 casesense = true;
3271 tline = tline->next;
3272 skip_white_(tline);
3273 tline = expand_id(tline);
3274 if (!tline || (tline->type != TOK_ID &&
3275 (tline->type != TOK_PREPROC_ID ||
3276 tline->text[1] != '$'))) {
3277 error(ERR_NONFATAL,
3278 "`%%strlen' expects a macro identifier as first parameter");
3279 free_tlist(origline);
3280 return DIRECTIVE_FOUND;
3282 ctx = get_ctx(tline->text, &mname, false);
3283 last = tline;
3284 tline = expand_smacro(tline->next);
3285 last->next = NULL;
3287 t = tline;
3288 while (tok_type_(t, TOK_WHITESPACE))
3289 t = t->next;
3290 /* t should now point to the string */
3291 if (!tok_type_(t, TOK_STRING)) {
3292 error(ERR_NONFATAL,
3293 "`%%strlen` requires string as second parameter");
3294 free_tlist(tline);
3295 free_tlist(origline);
3296 return DIRECTIVE_FOUND;
3299 macro_start = nasm_malloc(sizeof(*macro_start));
3300 macro_start->next = NULL;
3301 make_tok_num(macro_start, nasm_unquote(t->text, NULL));
3302 macro_start->a.mac = NULL;
3305 * We now have a macro name, an implicit parameter count of
3306 * zero, and a numeric token to use as an expansion. Create
3307 * and store an SMacro.
3309 define_smacro(ctx, mname, casesense, 0, macro_start);
3310 free_tlist(tline);
3311 free_tlist(origline);
3312 return DIRECTIVE_FOUND;
3314 case PP_STRCAT:
3315 casesense = true;
3317 tline = tline->next;
3318 skip_white_(tline);
3319 tline = expand_id(tline);
3320 if (!tline || (tline->type != TOK_ID &&
3321 (tline->type != TOK_PREPROC_ID ||
3322 tline->text[1] != '$'))) {
3323 error(ERR_NONFATAL,
3324 "`%%strcat' expects a macro identifier as first parameter");
3325 free_tlist(origline);
3326 return DIRECTIVE_FOUND;
3328 ctx = get_ctx(tline->text, &mname, false);
3329 last = tline;
3330 tline = expand_smacro(tline->next);
3331 last->next = NULL;
3333 len = 0;
3334 list_for_each(t, tline) {
3335 switch (t->type) {
3336 case TOK_WHITESPACE:
3337 break;
3338 case TOK_STRING:
3339 len += t->a.len = nasm_unquote(t->text, NULL);
3340 break;
3341 case TOK_OTHER:
3342 if (!strcmp(t->text, ",")) /* permit comma separators */
3343 break;
3344 /* else fall through */
3345 default:
3346 error(ERR_NONFATAL,
3347 "non-string passed to `%%strcat' (%d)", t->type);
3348 free_tlist(tline);
3349 free_tlist(origline);
3350 return DIRECTIVE_FOUND;
3354 p = pp = nasm_malloc(len);
3355 list_for_each(t, tline) {
3356 if (t->type == TOK_STRING) {
3357 memcpy(p, t->text, t->a.len);
3358 p += t->a.len;
3363 * We now have a macro name, an implicit parameter count of
3364 * zero, and a numeric token to use as an expansion. Create
3365 * and store an SMacro.
3367 macro_start = new_Token(NULL, TOK_STRING, NULL, 0);
3368 macro_start->text = nasm_quote(pp, len);
3369 nasm_free(pp);
3370 define_smacro(ctx, mname, casesense, 0, macro_start);
3371 free_tlist(tline);
3372 free_tlist(origline);
3373 return DIRECTIVE_FOUND;
3375 case PP_SUBSTR:
3377 int64_t start, count;
3378 size_t len;
3380 casesense = true;
3382 tline = tline->next;
3383 skip_white_(tline);
3384 tline = expand_id(tline);
3385 if (!tline || (tline->type != TOK_ID &&
3386 (tline->type != TOK_PREPROC_ID ||
3387 tline->text[1] != '$'))) {
3388 error(ERR_NONFATAL,
3389 "`%%substr' expects a macro identifier as first parameter");
3390 free_tlist(origline);
3391 return DIRECTIVE_FOUND;
3393 ctx = get_ctx(tline->text, &mname, false);
3394 last = tline;
3395 tline = expand_smacro(tline->next);
3396 last->next = NULL;
3398 if (tline) /* skip expanded id */
3399 t = tline->next;
3400 while (tok_type_(t, TOK_WHITESPACE))
3401 t = t->next;
3403 /* t should now point to the string */
3404 if (!tok_type_(t, TOK_STRING)) {
3405 error(ERR_NONFATAL,
3406 "`%%substr` requires string as second parameter");
3407 free_tlist(tline);
3408 free_tlist(origline);
3409 return DIRECTIVE_FOUND;
3412 tt = t->next;
3413 tptr = &tt;
3414 tokval.t_type = TOKEN_INVALID;
3415 evalresult = evaluate(ppscan, tptr, &tokval, NULL,
3416 pass, error, NULL);
3417 if (!evalresult) {
3418 free_tlist(tline);
3419 free_tlist(origline);
3420 return DIRECTIVE_FOUND;
3421 } else if (!is_simple(evalresult)) {
3422 error(ERR_NONFATAL, "non-constant value given to `%%substr`");
3423 free_tlist(tline);
3424 free_tlist(origline);
3425 return DIRECTIVE_FOUND;
3427 start = evalresult->value - 1;
3429 while (tok_type_(tt, TOK_WHITESPACE))
3430 tt = tt->next;
3431 if (!tt) {
3432 count = 1; /* Backwards compatibility: one character */
3433 } else {
3434 tokval.t_type = TOKEN_INVALID;
3435 evalresult = evaluate(ppscan, tptr, &tokval, NULL,
3436 pass, error, NULL);
3437 if (!evalresult) {
3438 free_tlist(tline);
3439 free_tlist(origline);
3440 return DIRECTIVE_FOUND;
3441 } else if (!is_simple(evalresult)) {
3442 error(ERR_NONFATAL, "non-constant value given to `%%substr`");
3443 free_tlist(tline);
3444 free_tlist(origline);
3445 return DIRECTIVE_FOUND;
3447 count = evalresult->value;
3450 len = nasm_unquote(t->text, NULL);
3452 /* make start and count being in range */
3453 if (start < 0)
3454 start = 0;
3455 if (count < 0)
3456 count = len + count + 1 - start;
3457 if (start + count > (int64_t)len)
3458 count = len - start;
3459 if (!len || count < 0 || start >=(int64_t)len)
3460 start = -1, count = 0; /* empty string */
3462 macro_start = nasm_malloc(sizeof(*macro_start));
3463 macro_start->next = NULL;
3464 macro_start->text = nasm_quote((start < 0) ? "" : t->text + start, count);
3465 macro_start->type = TOK_STRING;
3466 macro_start->a.mac = NULL;
3469 * We now have a macro name, an implicit parameter count of
3470 * zero, and a numeric token to use as an expansion. Create
3471 * and store an SMacro.
3473 define_smacro(ctx, mname, casesense, 0, macro_start);
3474 free_tlist(tline);
3475 free_tlist(origline);
3476 return DIRECTIVE_FOUND;
3479 case PP_ASSIGN:
3480 case PP_IASSIGN:
3481 casesense = (i == PP_ASSIGN);
3483 tline = tline->next;
3484 skip_white_(tline);
3485 tline = expand_id(tline);
3486 if (!tline || (tline->type != TOK_ID &&
3487 (tline->type != TOK_PREPROC_ID ||
3488 tline->text[1] != '$'))) {
3489 error(ERR_NONFATAL,
3490 "`%%%sassign' expects a macro identifier",
3491 (i == PP_IASSIGN ? "i" : ""));
3492 free_tlist(origline);
3493 return DIRECTIVE_FOUND;
3495 ctx = get_ctx(tline->text, &mname, false);
3496 last = tline;
3497 tline = expand_smacro(tline->next);
3498 last->next = NULL;
3500 t = tline;
3501 tptr = &t;
3502 tokval.t_type = TOKEN_INVALID;
3503 evalresult =
3504 evaluate(ppscan, tptr, &tokval, NULL, pass, error, NULL);
3505 free_tlist(tline);
3506 if (!evalresult) {
3507 free_tlist(origline);
3508 return DIRECTIVE_FOUND;
3511 if (tokval.t_type)
3512 error(ERR_WARNING|ERR_PASS1,
3513 "trailing garbage after expression ignored");
3515 if (!is_simple(evalresult)) {
3516 error(ERR_NONFATAL,
3517 "non-constant value given to `%%%sassign'",
3518 (i == PP_IASSIGN ? "i" : ""));
3519 free_tlist(origline);
3520 return DIRECTIVE_FOUND;
3523 macro_start = nasm_malloc(sizeof(*macro_start));
3524 macro_start->next = NULL;
3525 make_tok_num(macro_start, reloc_value(evalresult));
3526 macro_start->a.mac = NULL;
3529 * We now have a macro name, an implicit parameter count of
3530 * zero, and a numeric token to use as an expansion. Create
3531 * and store an SMacro.
3533 define_smacro(ctx, mname, casesense, 0, macro_start);
3534 free_tlist(origline);
3535 return DIRECTIVE_FOUND;
3537 case PP_LINE:
3539 * Syntax is `%line nnn[+mmm] [filename]'
3541 tline = tline->next;
3542 skip_white_(tline);
3543 if (!tok_type_(tline, TOK_NUMBER)) {
3544 error(ERR_NONFATAL, "`%%line' expects line number");
3545 free_tlist(origline);
3546 return DIRECTIVE_FOUND;
3548 k = readnum(tline->text, &err);
3549 m = 1;
3550 tline = tline->next;
3551 if (tok_is_(tline, "+")) {
3552 tline = tline->next;
3553 if (!tok_type_(tline, TOK_NUMBER)) {
3554 error(ERR_NONFATAL, "`%%line' expects line increment");
3555 free_tlist(origline);
3556 return DIRECTIVE_FOUND;
3558 m = readnum(tline->text, &err);
3559 tline = tline->next;
3561 skip_white_(tline);
3562 src_set_linnum(k);
3563 istk->lineinc = m;
3564 if (tline) {
3565 nasm_free(src_set_fname(detoken(tline, false)));
3567 free_tlist(origline);
3568 return DIRECTIVE_FOUND;
3570 default:
3571 error(ERR_FATAL,
3572 "preprocessor directive `%s' not yet implemented",
3573 pp_directives[i]);
3574 return DIRECTIVE_FOUND;
3579 * Ensure that a macro parameter contains a condition code and
3580 * nothing else. Return the condition code index if so, or -1
3581 * otherwise.
3583 static int find_cc(Token * t)
3585 Token *tt;
3586 int i, j, k, m;
3588 if (!t)
3589 return -1; /* Probably a %+ without a space */
3591 skip_white_(t);
3592 if (t->type != TOK_ID)
3593 return -1;
3594 tt = t->next;
3595 skip_white_(tt);
3596 if (tt && (tt->type != TOK_OTHER || strcmp(tt->text, ",")))
3597 return -1;
3599 i = -1;
3600 j = ARRAY_SIZE(conditions);
3601 while (j - i > 1) {
3602 k = (j + i) / 2;
3603 m = nasm_stricmp(t->text, conditions[k]);
3604 if (m == 0) {
3605 i = k;
3606 j = -2;
3607 break;
3608 } else if (m < 0) {
3609 j = k;
3610 } else
3611 i = k;
3613 if (j != -2)
3614 return -1;
3615 return i;
/*
 * Walk the token list rooted at *head and join neighbouring tokens in
 * place. Returns true if at least one join (paste) was performed.
 *
 *   head                - address of the list head; updated through
 *                         `tail' when the first tokens are replaced.
 *   handle_paste_tokens - when true, TOK_PASTE (%+) tokens are consumed
 *                         and their neighbours concatenated; when false
 *                         they are treated like any other token.
 *
 * `tail' always points at the link that holds the current token `t';
 * `paste_head' remembers the link of the most recent token that may
 * serve as the left operand of a later %+.
 */
3618 static bool paste_tokens(Token **head, bool handle_paste_tokens)
3620 Token **tail, *t, *tt;
3621 Token **paste_head;
3622 bool did_paste = false;
3623 char *tmp;
3625 /* Now handle token pasting... */
3626 paste_head = NULL;
3627 tail = head;
/* The loop needs a current token and a successor; a lone last token is left alone. */
3628 while ((t = *tail) && (tt = t->next)) {
3629 switch (t->type) {
3630 case TOK_WHITESPACE:
3631 if (tt->type == TOK_WHITESPACE) {
3632 /* Zap adjacent whitespace tokens */
3633 t->next = delete_Token(tt);
3634 } else {
3635 /* Do not advance paste_head here */
3636 tail = &t->next;
3638 break;
3639 case TOK_ID:
3640 case TOK_NUMBER:
3641 case TOK_FLOAT:
/* NOTE: this inner `tmp' shadows the function-level `tmp' used by the TOK_PASTE case. */
3643 size_t len = 0;
3644 char *tmp, *p;
/* Measure the run of directly adjacent tokens that can be glued onto t. */
3646 while (tt && (tt->type == TOK_ID || tt->type == TOK_PREPROC_ID ||
3647 tt->type == TOK_NUMBER || tt->type == TOK_FLOAT ||
3648 tt->type == TOK_OTHER)) {
3649 len += strlen(tt->text);
3650 tt = tt->next;
3654 * Now tt points to the first token after
3655 * the potential paste area...
3657 if (tt != t->next) {
3658 /* We have at least two tokens... */
3659 len += strlen(t->text);
3660 p = tmp = nasm_malloc(len+1);
/* Concatenate the texts of t .. (tt - 1) into tmp, deleting each token as it is consumed. */
3662 while (t != tt) {
3663 strcpy(p, t->text);
3664 p = strchr(p, '\0');
3665 t = delete_Token(t);
/* Re-tokenize the joined text and splice the result in where the run started. */
3668 t = *tail = tokenize(tmp);
3669 nasm_free(tmp);
/* Advance to the last token produced by tokenize(), keeping tail on its link. */
3671 while (t->next) {
3672 tail = &t->next;
3673 t = t->next;
3675 t->next = tt; /* Attach the remaining token chain */
3677 did_paste = true;
3679 paste_head = tail;
3680 tail = &t->next;
3681 break;
3683 case TOK_PASTE: /* %+ */
3684 if (handle_paste_tokens) {
3685 /* Zap %+ and whitespace tokens to the right */
3686 while (t && (t->type == TOK_WHITESPACE ||
3687 t->type == TOK_PASTE))
3688 t = *tail = delete_Token(t);
3689 if (!paste_head || !t)
3690 break; /* Nothing to paste with */
/* Step back to the remembered left operand and drop whitespace between it and the right operand. */
3691 tail = paste_head;
3692 t = *tail;
3693 tt = t->next;
3694 while (tok_type_(tt, TOK_WHITESPACE))
3695 tt = t->next = delete_Token(tt);
3697 if (tt) {
/* Join the two operand texts, delete both tokens and re-tokenize the result in their place. */
3698 tmp = nasm_strcat(t->text, tt->text);
3699 delete_Token(t);
3700 tt = delete_Token(tt);
3701 t = *tail = tokenize(tmp);
3702 nasm_free(tmp);
3703 while (t->next) {
3704 tail = &t->next;
3705 t = t->next;
3707 t->next = tt; /* Attach the remaining token chain */
3708 did_paste = true;
3710 paste_head = tail;
3711 tail = &t->next;
3712 break;
3714 /* else fall through */
3715 default:
/* Any other token: advance, and remember it as a paste operand unless whitespace follows it. */
3716 tail = &t->next;
3717 if (!tok_type_(t->next, TOK_WHITESPACE))
3718 paste_head = tail;
3719 break;
3722 return did_paste;
3726 * expands to a list of tokens from %{x:y}
3728 static Token *expand_mmac_params_range(MMacro *mac, Token *tline, Token ***last)
3730 Token *t = tline, **tt, *tm, *head;
3731 char *pos;
3732 int fst, lst, j, i;
3734 pos = strchr(tline->text, ':');
3735 nasm_assert(pos);
3737 lst = atoi(pos + 1);
3738 fst = atoi(tline->text + 1);
3741 * only macros params are accounted so
3742 * if someone passes %0 -- we reject such
3743 * value(s)
3745 if (lst == 0 || fst == 0)
3746 goto err;
3748 /* the values should be sane */
3749 if ((fst > (int)mac->nparam || fst < (-(int)mac->nparam)) ||
3750 (lst > (int)mac->nparam || lst < (-(int)mac->nparam)))
3751 goto err;
3753 fst = fst < 0 ? fst + (int)mac->nparam + 1: fst;
3754 lst = lst < 0 ? lst + (int)mac->nparam + 1: lst;
3756 /* counted from zero */
3757 fst--, lst--;
3760 * it will be at least one token
3762 tm = mac->params[(fst + mac->rotate) % mac->nparam];
3763 t = new_Token(NULL, tm->type, tm->text, 0);
3764 head = t, tt = &t->next;
3765 if (fst < lst) {
3766 for (i = fst + 1; i <= lst; i++) {
3767 t = new_Token(NULL, TOK_OTHER, ",", 0);
3768 *tt = t, tt = &t->next;
3769 j = (i + mac->rotate) % mac->nparam;
3770 tm = mac->params[j];
3771 t = new_Token(NULL, tm->type, tm->text, 0);
3772 *tt = t, tt = &t->next;
3774 } else {
3775 for (i = fst - 1; i >= lst; i--) {
3776 t = new_Token(NULL, TOK_OTHER, ",", 0);
3777 *tt = t, tt = &t->next;
3778 j = (i + mac->rotate) % mac->nparam;
3779 tm = mac->params[j];
3780 t = new_Token(NULL, tm->type, tm->text, 0);
3781 *tt = t, tt = &t->next;
3785 *last = tt;
3786 return head;
3788 err:
3789 error(ERR_NONFATAL, "`%%{%s}': macro parameters out of range",
3790 &tline->text[1]);
3791 return tline;
3795 * Expand MMacro-local things: parameter references (%0, %n, %+n,
3796 * %-n) and MMacro-local identifiers (%%foo) as well as
3797 * macro indirection (%[...]) and range (%{..:..}).
/*
 * Rewrite the token list `tline', substituting multi-line-macro-local
 * references, and return the head of the resulting list. Tokens that
 * need no substitution are moved (not copied) to the output list.
 *
 * Handled forms, all arriving as TOK_PREPROC_ID unless noted:
 *   %0          -> number of parameters of the active macro
 *   %%name      -> "..@<unique>.name" identifier
 *   %+n / %-n   -> condition code of parameter n / its inverse
 *   %n          -> copy of the tokens of parameter n
 *   text with : -> parameter range, via expand_mmac_params_range()
 *   TOK_INDIRECT-> its text is tokenized and expanded recursively
 *
 * If anything was substituted, paste_tokens() is run over the result
 * with %+ handling disabled.
 */
3799 static Token *expand_mmac_params(Token * tline)
3801 Token *t, *tt, **tail, *thead;
3802 bool changed = false;
3803 char *pos;
3805 tail = &thead;
3806 thead = NULL;
3808 while (tline) {
/* A parameter reference: %+x / %-x with something after the sign, %<digit>..., or %%... */
3809 if (tline->type == TOK_PREPROC_ID &&
3810 (((tline->text[1] == '+' || tline->text[1] == '-') && tline->text[2]) ||
3811 (tline->text[1] >= '0' && tline->text[1] <= '9') ||
3812 tline->text[1] == '%')) {
3813 char *text = NULL;
3814 int type = 0, cc; /* type = 0 to placate optimisers */
3815 char tmpbuf[30];
3816 unsigned int n;
3817 int i;
3818 MMacro *mac;
/* Detach the reference token; `text' stays NULL unless t is to be reused with new contents. */
3820 t = tline;
3821 tline = tline->next;
3823 mac = istk->mstk;
3824 while (mac && !mac->name) /* avoid mistaking %reps for macros */
3825 mac = mac->next_active;
3826 if (!mac) {
3827 error(ERR_NONFATAL, "`%s': not in a macro call", t->text);
3828 } else {
/* A ':' anywhere in the token text selects the range form. */
3829 pos = strchr(t->text, ':');
3830 if (!pos) {
3831 switch (t->text[1]) {
3833 * We have to make a substitution of one of the
3834 * forms %1, %-1, %+1, %%foo, %0.
3836 case '0':
3837 type = TOK_NUMBER;
3838 snprintf(tmpbuf, sizeof(tmpbuf), "%d", mac->nparam);
3839 text = nasm_strdup(tmpbuf);
3840 break;
3841 case '%':
3842 type = TOK_ID;
3843 snprintf(tmpbuf, sizeof(tmpbuf), "..@%"PRIu64".",
3844 mac->unique);
3845 text = nasm_strcat(tmpbuf, t->text + 2);
3846 break;
3847 case '-':
/* n is unsigned: a parsed value of 0 wraps around and fails the range check below. */
3848 n = atoi(t->text + 2) - 1;
3849 if (n >= mac->nparam)
3850 tt = NULL;
3851 else {
3852 if (mac->nparam > 1)
3853 n = (n + mac->rotate) % mac->nparam;
3854 tt = mac->params[n];
3856 cc = find_cc(tt);
3857 if (cc == -1) {
/* NOTE(review): n is unsigned but printed with %d, and may already have been rotated, so the number shown need not be the one the user wrote - confirm. */
3858 error(ERR_NONFATAL,
3859 "macro parameter %d is not a condition code",
3860 n + 1);
3861 text = NULL;
3862 } else {
3863 type = TOK_ID;
3864 if (inverse_ccs[cc] == -1) {
3865 error(ERR_NONFATAL,
3866 "condition code `%s' is not invertible",
3867 conditions[cc]);
3868 text = NULL;
3869 } else
3870 text = nasm_strdup(conditions[inverse_ccs[cc]]);
3872 break;
3873 case '+':
3874 n = atoi(t->text + 2) - 1;
3875 if (n >= mac->nparam)
3876 tt = NULL;
3877 else {
3878 if (mac->nparam > 1)
3879 n = (n + mac->rotate) % mac->nparam;
3880 tt = mac->params[n];
3882 cc = find_cc(tt);
3883 if (cc == -1) {
3884 error(ERR_NONFATAL,
3885 "macro parameter %d is not a condition code",
3886 n + 1);
3887 text = NULL;
3888 } else {
3889 type = TOK_ID;
3890 text = nasm_strdup(conditions[cc]);
3892 break;
3893 default:
3894 n = atoi(t->text + 1) - 1;
3895 if (n >= mac->nparam)
3896 tt = NULL;
3897 else {
3898 if (mac->nparam > 1)
3899 n = (n + mac->rotate) % mac->nparam;
3900 tt = mac->params[n];
/* Copy exactly paramlen[n] tokens of the parameter onto the output list; an out-of-range n expands to nothing. */
3902 if (tt) {
3903 for (i = 0; i < mac->paramlen[n]; i++) {
3904 *tail = new_Token(NULL, tt->type, tt->text, 0);
3905 tail = &(*tail)->next;
3906 tt = tt->next;
3909 text = NULL; /* we've done it here */
3910 break;
3912 } else {
3914 * seems we have a parameters range here
3916 Token *head, **last;
3917 head = expand_mmac_params_range(mac, t, &last);
/* head == t signals failure; otherwise splice the new tokens in front of the rest of the line and rescan from them. */
3918 if (head != t) {
3919 *tail = head;
3920 *last = tline;
3921 tline = head;
3922 text = NULL;
/* No replacement text: drop the reference token. Otherwise reuse t with the new type and text. */
3926 if (!text) {
3927 delete_Token(t);
3928 } else {
3929 *tail = t;
3930 tail = &t->next;
3931 t->type = type;
3932 nasm_free(t->text);
3933 t->text = text;
3934 t->a.mac = NULL;
3936 changed = true;
3937 continue;
3938 } else if (tline->type == TOK_INDIRECT) {
/* Indirection: expand the token's own text as a line and append the result. */
3939 t = tline;
3940 tline = tline->next;
3941 tt = tokenize(t->text);
3942 tt = expand_mmac_params(tt);
3943 tt = expand_smacro(tt);
3944 *tail = tt;
3945 while (tt) {
3946 tt->a.mac = NULL; /* Necessary? */
3947 tail = &tt->next;
3948 tt = tt->next;
3950 delete_Token(t);
3951 changed = true;
3952 } else {
/* Ordinary token: move it to the output list unchanged. */
3953 t = *tail = tline;
3954 tline = tline->next;
3955 t->a.mac = NULL;
3956 tail = &t->next;
3959 *tail = NULL;
3961 if (changed)
3962 paste_tokens(&thead, false);
3964 return thead;
3968 * Expand all single-line macro calls made in the given line.
3969 * Return the expanded version of the line. The original is deemed
3970 * to be destroyed in the process. (In reality we'll just move
3971 * Tokens from input to output a lot of the time, rather than
3972 * actually bothering to destroy and replicate.)
/*
 * Expand single-line macros in `tline' and return the expanded list.
 *
 * When tline is non-NULL the returned pointer is tline itself: the
 * first token is copied on entry, the copy is worked on, and the final
 * head is copied back into the original token at the end. An empty
 * result is returned as a single TOK_WHITESPACE token.
 *
 * The main loop is bounded by a DEADMAN_LIMIT countdown; running out
 * reports "interminable macro recursion" and jumps to the exit path.
 * After each pass paste_tokens() is run with %+ handling enabled, and
 * if it joined anything following an expansion the line is rescanned.
 */
3975 static Token *expand_smacro(Token * tline)
3977 Token *t, *tt, *mstart, **tail, *thead;
3978 SMacro *head = NULL, *m;
3979 Token **params;
3980 int *paramsize;
3981 unsigned int nparam, sparam;
3982 int brackets;
3983 Token *org_tline = tline;
3984 Context *ctx;
3985 const char *mname;
3986 int deadman = DEADMAN_LIMIT;
3987 bool expanded;
3990 * Trick: we should avoid changing the start token pointer since it can
3991 * be contained in "next" field of other token. Because of this
3992 * we allocate a copy of first token and work with it; at the end of
3993 * routine we copy it back
3995 if (org_tline) {
3996 tline = new_Token(org_tline->next, org_tline->type,
3997 org_tline->text, 0);
3998 tline->a.mac = org_tline->a.mac;
3999 nasm_free(org_tline->text);
4000 org_tline->text = NULL;
4003 expanded = true; /* Always expand %+ at least once */
4005 again:
4006 thead = NULL;
4007 tail = &thead;
4009 while (tline) { /* main token loop */
4010 if (!--deadman) {
4011 error(ERR_NONFATAL, "interminable macro recursion");
4012 goto err;
4015 if ((mname = tline->text)) {
4016 /* if this token is a local macro, look in local context */
4017 if (tline->type == TOK_ID) {
4018 head = (SMacro *)hash_findix(&smacros, mname);
4019 } else if (tline->type == TOK_PREPROC_ID) {
/* get_ctx() may also adjust mname (it is passed by address). */
4020 ctx = get_ctx(mname, &mname, true);
4021 head = ctx ? (SMacro *)hash_findix(&ctx->localmac, mname) : NULL;
4022 } else
4023 head = NULL;
4026 * We've hit an identifier. As in is_mmacro below, we first
4027 * check whether the identifier is a single-line macro at
4028 * all, then think about checking for parameters if
4029 * necessary.
4031 list_for_each(m, head)
4032 if (!mstrcmp(m->name, mname, m->casesense))
4033 break;
4034 if (m) {
4035 mstart = tline;
4036 params = NULL;
4037 paramsize = NULL;
4038 if (m->nparam == 0) {
4040 * Simple case: the macro is parameterless. Discard the
4041 * one token that the macro call took, and push the
4042 * expansion back on the to-do stack.
/* A parameterless macro with no expansion list: the three names below are rewritten in place, anything else is simply deleted. */
4044 if (!m->expansion) {
4045 if (!strcmp("__FILE__", m->name)) {
4046 int32_t num = 0;
4047 char *file = NULL;
4048 src_get(&num, &file);
/* NOTE(review): tline->text is overwritten here without nasm_free(), unlike the __LINE__ and __BITS__ branches below - looks like a small leak; confirm. */
4049 tline->text = nasm_quote(file, strlen(file));
4050 tline->type = TOK_STRING;
4051 nasm_free(file);
4052 continue;
4054 if (!strcmp("__LINE__", m->name)) {
4055 nasm_free(tline->text);
4056 make_tok_num(tline, src_get_linnum());
4057 continue;
4059 if (!strcmp("__BITS__", m->name)) {
4060 nasm_free(tline->text);
4061 make_tok_num(tline, globalbits);
4062 continue;
4064 tline = delete_Token(tline);
4065 continue;
4067 } else {
4069 * Complicated case: at least one macro with this name
4070 * exists and takes parameters. We must find the
4071 * parameters in the call, count them, find the SMacro
4072 * that corresponds to that form of the macro call, and
4073 * substitute for the parameters when we expand. What a
4074 * pain.
4076 /*tline = tline->next;
4077 skip_white_(tline); */
/* Advance past whitespace to the token after the name, retiring any TOK_SMAC_END markers met on the way. */
4078 do {
4079 t = tline->next;
4080 while (tok_type_(t, TOK_SMAC_END)) {
4081 t->a.mac->in_progress = false;
4082 t->text = NULL;
4083 t = tline->next = delete_Token(t);
4085 tline = t;
4086 } while (tok_type_(tline, TOK_WHITESPACE));
4087 if (!tok_is_(tline, "(")) {
4089 * This macro wasn't called with parameters: ignore
4090 * the call. (Behaviour borrowed from gnu cpp.)
4092 tline = mstart;
4093 m = NULL;
4094 } else {
/*
 * Collect the arguments. params[i] points at the first token of
 * argument i and paramsize[i] counts its tokens; both arrays grow in
 * PARAM_DELTA steps. `paren' tracks nested parentheses, `brackets'
 * tracks { } grouping (-1 = a group has just closed), and `white'
 * holds whitespace seen inside an argument until a later token shows
 * that it was not trailing.
 */
4095 int paren = 0;
4096 int white = 0;
4097 brackets = 0;
4098 nparam = 0;
4099 sparam = PARAM_DELTA;
4100 params = nasm_malloc(sparam * sizeof(Token *));
4101 params[0] = tline->next;
4102 paramsize = nasm_malloc(sparam * sizeof(int));
4103 paramsize[0] = 0;
4104 while (true) { /* parameter loop */
4106 * For some unusual expansions
4107 * which concatenates function call
4109 t = tline->next;
4110 while (tok_type_(t, TOK_SMAC_END)) {
4111 t->a.mac->in_progress = false;
4112 t->text = NULL;
4113 t = tline->next = delete_Token(t);
4115 tline = t;
4117 if (!tline) {
4118 error(ERR_NONFATAL,
4119 "macro call expects terminating `)'");
4120 break;
4122 if (tline->type == TOK_WHITESPACE
4123 && brackets <= 0) {
/* Leading whitespace moves the argument start forward; later whitespace is only counted provisionally. */
4124 if (paramsize[nparam])
4125 white++;
4126 else
4127 params[nparam] = tline->next;
4128 continue; /* parameter loop */
4130 if (tline->type == TOK_OTHER
4131 && tline->text[1] == 0) {
4132 char ch = tline->text[0];
4133 if (ch == ',' && !paren && brackets <= 0) {
4134 if (++nparam >= sparam) {
4135 sparam += PARAM_DELTA;
4136 params = nasm_realloc(params,
4137 sparam * sizeof(Token *));
4138 paramsize = nasm_realloc(paramsize,
4139 sparam * sizeof(int));
4141 params[nparam] = tline->next;
4142 paramsize[nparam] = 0;
4143 white = 0;
4144 continue; /* parameter loop */
4146 if (ch == '{' &&
4147 (brackets > 0 || (brackets == 0 &&
4148 !paramsize[nparam])))
4150 if (!(brackets++)) {
4151 params[nparam] = tline->next;
4152 continue; /* parameter loop */
4155 if (ch == '}' && brackets > 0)
4156 if (--brackets == 0) {
4157 brackets = -1;
4158 continue; /* parameter loop */
4160 if (ch == '(' && !brackets)
4161 paren++;
4162 if (ch == ')' && brackets <= 0)
4163 if (--paren < 0)
4164 break;
/* A token following a closed { } group within the same argument is an error. */
4166 if (brackets < 0) {
4167 brackets = 0;
4168 error(ERR_NONFATAL, "braces do not "
4169 "enclose all of macro parameter");
4171 paramsize[nparam] += white + 1;
4172 white = 0;
4173 } /* parameter loop */
4174 nparam++;
/* Pick the definition with this name that takes exactly nparam arguments. */
4175 while (m && (m->nparam != nparam ||
4176 mstrcmp(m->name, mname,
4177 m->casesense)))
4178 m = m->next;
4179 if (!m)
4180 error(ERR_WARNING|ERR_PASS1|ERR_WARN_MNP,
4181 "macro `%s' exists, "
4182 "but not taking %d parameters",
4183 mstart->text, nparam);
4186 if (m && m->in_progress)
4187 m = NULL;
4188 if (!m) { /* in progress or didn't find '(' or wrong nparam */
4190 * Design question: should we handle !tline, which
4191 * indicates missing ')' here, or expand those
4192 * macros anyway, which requires the (t) test a few
4193 * lines down?
4195 nasm_free(params);
4196 nasm_free(paramsize);
4197 tline = mstart;
4198 } else {
4200 * Expand the macro: we are placed on the last token of the
4201 * call, so that we can easily split the call from the
4202 * following tokens. We also start by pushing an SMAC_END
4203 * token for the cycle removal.
4205 t = tline;
4206 if (t) {
4207 tline = t->next;
4208 t->next = NULL;
4210 tt = new_Token(tline, TOK_SMAC_END, NULL, 0);
4211 tt->a.mac = m;
4212 m->in_progress = true;
4213 tline = tt;
/* Each expansion token (or the copy of an argument) is inserted in front of tline, ahead of the TOK_SMAC_END marker. */
4214 list_for_each(t, m->expansion) {
4215 if (t->type >= TOK_SMAC_PARAM) {
4216 Token *pcopy = tline, **ptail = &pcopy;
4217 Token *ttt, *pt;
4218 int i;
4220 ttt = params[t->type - TOK_SMAC_PARAM];
4221 i = paramsize[t->type - TOK_SMAC_PARAM];
4222 while (--i >= 0) {
4223 pt = *ptail = new_Token(tline, ttt->type,
4224 ttt->text, 0);
4225 ptail = &pt->next;
4226 ttt = ttt->next;
4228 tline = pcopy;
4229 } else if (t->type == TOK_PREPROC_Q) {
/* TOK_PREPROC_Q yields the name as written at the call site, TOK_PREPROC_QQ the name stored in the definition. */
4230 tt = new_Token(tline, TOK_ID, mname, 0);
4231 tline = tt;
4232 } else if (t->type == TOK_PREPROC_QQ) {
4233 tt = new_Token(tline, TOK_ID, m->name, 0);
4234 tline = tt;
4235 } else {
4236 tt = new_Token(tline, t->type, t->text, 0);
4237 tline = tt;
4242 * Having done that, get rid of the macro call, and clean
4243 * up the parameters.
4245 nasm_free(params);
4246 nasm_free(paramsize);
4247 free_tlist(mstart);
4248 expanded = true;
4249 continue; /* main token loop */
/* Not expanded: an SMAC_END marker re-enables its macro and is dropped; any other token moves to the output list. */
4254 if (tline->type == TOK_SMAC_END) {
4255 tline->a.mac->in_progress = false;
4256 tline = delete_Token(tline);
4257 } else {
4258 t = *tail = tline;
4259 tline = tline->next;
4260 t->a.mac = NULL;
4261 t->next = NULL;
4262 tail = &t->next;
4267 * Now scan the entire line and look for successive TOK_IDs that resulted
4268 * after expansion (they can't be produced by tokenize()). The successive
4269 * TOK_IDs should be concatenated.
4270 * Also we look for %+ tokens and concatenate the tokens before and after
4271 * them (without white spaces in between).
4273 if (expanded && paste_tokens(&thead, true)) {
4275 * If we concatenated something, *and* we had previously expanded
4276 * an actual macro, scan the lines again for macros...
4278 tline = thead;
4279 expanded = false;
4280 goto again;
4283 err:
/* Copy the result head back into the caller's original first token so the caller's pointer stays valid. */
4284 if (org_tline) {
4285 if (thead) {
4286 *org_tline = *thead;
4287 /* since we just gave text to org_line, don't free it */
4288 thead->text = NULL;
4289 delete_Token(thead);
4290 } else {
4291 /* the expression expanded to empty line;
4292 we can't return NULL for some reasons
4293 we just set the line to a single WHITESPACE token. */
4294 memset(org_tline, 0, sizeof(*org_tline));
4295 org_tline->text = NULL;
4296 org_tline->type = TOK_WHITESPACE;
4298 thead = org_tline;
4301 return thead;
4305 * Similar to expand_smacro but used exclusively with macro identifiers
4306 * right before they are fetched in. The reason is that there can be
4307 * identifiers consisting of several subparts. We consider that if there
4308 * are more than one element forming the name, user wants a expansion,
4309 * otherwise it will be left as-is. Example:
4311 * %define %$abc cde
4313 * the identifier %$abc will be left as-is so that the handler for %define
4314 * will suck it and define the corresponding value. Other case:
4316 * %define _%$abc cde
4318 * In this case user wants name to be expanded *before* %define starts
4319 * working, so we'll expand %$abc into something (if it has a value;
4320 * otherwise it will be left as-is) then concatenate all successive
4321 * PP_IDs into one.
4323 static Token *expand_id(Token * tline)
4325 Token *cur, *oldnext = NULL;
4327 if (!tline || !tline->next)
4328 return tline;
4330 cur = tline;
4331 while (cur->next &&
4332 (cur->next->type == TOK_ID ||
4333 cur->next->type == TOK_PREPROC_ID
4334 || cur->next->type == TOK_NUMBER))
4335 cur = cur->next;
4337 /* If identifier consists of just one token, don't expand */
4338 if (cur == tline)
4339 return tline;
4341 if (cur) {
4342 oldnext = cur->next; /* Detach the tail past identifier */
4343 cur->next = NULL; /* so that expand_smacro stops here */
4346 tline = expand_smacro(tline);
4348 if (cur) {
4349 /* expand_smacro possibly changhed tline; re-scan for EOL */
4350 cur = tline;
4351 while (cur && cur->next)
4352 cur = cur->next;
4353 if (cur)
4354 cur->next = oldnext;
4357 return tline;
4361 * Determine whether the given line constitutes a multi-line macro
4362 * call, and return the MMacro structure called if so. Doesn't have
4363 * to check for an initial label - that's taken care of in
4364 * expand_mmacro - but must check numbers of parameters. Guaranteed
4365 * to be called with tline->type == TOK_ID, so the putative macro
4366 * name is easy to find.
4368 static MMacro *is_mmacro(Token * tline, Token *** params_array)
4370 MMacro *head, *m;
4371 Token **params;
4372 int nparam;
4374 head = (MMacro *) hash_findix(&mmacros, tline->text);
4377 * Efficiency: first we see if any macro exists with the given
4378 * name. If not, we can return NULL immediately. _Then_ we
4379 * count the parameters, and then we look further along the
4380 * list if necessary to find the proper MMacro.
4382 list_for_each(m, head)
4383 if (!mstrcmp(m->name, tline->text, m->casesense))
4384 break;
4385 if (!m)
4386 return NULL;
4389 * OK, we have a potential macro. Count and demarcate the
4390 * parameters.
4392 count_mmac_params(tline->next, &nparam, &params);
4395 * So we know how many parameters we've got. Find the MMacro
4396 * structure that handles this number.
4398 while (m) {
4399 if (m->nparam_min <= nparam
4400 && (m->plus || nparam <= m->nparam_max)) {
4402 * This one is right. Just check if cycle removal
4403 * prohibits us using it before we actually celebrate...
4405 if (m->in_progress > m->max_depth) {
4406 if (m->max_depth > 0) {
4407 error(ERR_WARNING,
4408 "reached maximum recursion depth of %i",
4409 m->max_depth);
4411 nasm_free(params);
4412 return NULL;
4415 * It's right, and we can use it. Add its default
4416 * parameters to the end of our list if necessary.
4418 if (m->defaults && nparam < m->nparam_min + m->ndefs) {
4419 params =
4420 nasm_realloc(params,
4421 ((m->nparam_min + m->ndefs +
4422 1) * sizeof(*params)));
4423 while (nparam < m->nparam_min + m->ndefs) {
4424 params[nparam] = m->defaults[nparam - m->nparam_min];
4425 nparam++;
4429 * If we've gone over the maximum parameter count (and
4430 * we're in Plus mode), ignore parameters beyond
4431 * nparam_max.
4433 if (m->plus && nparam > m->nparam_max)
4434 nparam = m->nparam_max;
4436 * Then terminate the parameter list, and leave.
4438 if (!params) { /* need this special case */
4439 params = nasm_malloc(sizeof(*params));
4440 nparam = 0;
4442 params[nparam] = NULL;
4443 *params_array = params;
4444 return m;
4447 * This one wasn't right: look for the next one with the
4448 * same name.
4450 list_for_each(m, m->next)
4451 if (!mstrcmp(m->name, tline->text, m->casesense))
4452 break;
4456 * After all that, we didn't find one with the right number of
4457 * parameters. Issue a warning, and fail to expand the macro.
4459 error(ERR_WARNING|ERR_PASS1|ERR_WARN_MNP,
4460 "macro `%s' exists, but not taking %d parameters",
4461 tline->text, nparam);
4462 nasm_free(params);
4463 return NULL;
4468 * Save MMacro invocation specific fields in
4469 * preparation for a recursive macro expansion
4471 static void push_mmacro(MMacro *m)
4473 MMacroInvocation *i;
4475 i = nasm_malloc(sizeof(MMacroInvocation));
4476 i->prev = m->prev;
4477 i->params = m->params;
4478 i->iline = m->iline;
4479 i->nparam = m->nparam;
4480 i->rotate = m->rotate;
4481 i->paramlen = m->paramlen;
4482 i->unique = m->unique;
4483 i->condcnt = m->condcnt;
4484 m->prev = i;
4489 * Restore MMacro invocation specific fields that were
4490 * saved during a previous recursive macro expansion
4492 static void pop_mmacro(MMacro *m)
4494 MMacroInvocation *i;
4496 if (m->prev) {
4497 i = m->prev;
4498 m->prev = i->prev;
4499 m->params = i->params;
4500 m->iline = i->iline;
4501 m->nparam = i->nparam;
4502 m->rotate = i->rotate;
4503 m->paramlen = i->paramlen;
4504 m->unique = i->unique;
4505 m->condcnt = i->condcnt;
4506 nasm_free(i);
4512 * Expand the multi-line macro call made by the given line, if
4513 * there is one to be expanded. If there is, push the expansion on
4514 * istk->expansion and return 1. Otherwise return 0.
/*
 * Try to treat `tline' as a multi-line macro call, optionally preceded
 * by a label (with or without a following ':').
 *
 * Returns 0 without expanding if the line does not start with an
 * identifier or no matching macro is found. Otherwise the macro's
 * lines are copied onto istk->expansion behind an end marker, the
 * macro becomes the head of istk->mstk, and 1 is returned.
 */
4516 static int expand_mmacro(Token * tline)
4518 Token *startline = tline;
4519 Token *label = NULL;
4520 int dont_prepend = 0;
4521 Token **params, *t, *mtok, *tt;
4522 MMacro *m;
4523 Line *l, *ll;
4524 int i, nparam, *paramlen;
4525 const char *mname;
4527 t = tline;
4528 skip_white_(t);
4529 /* if (!tok_type_(t, TOK_ID)) Lino 02/25/02 */
4530 if (!tok_type_(t, TOK_ID) && !tok_type_(t, TOK_PREPROC_ID))
4531 return 0;
4532 mtok = t;
4533 m = is_mmacro(t, &params);
4534 if (m) {
4535 mname = t->text;
4536 } else {
4537 Token *last;
4539 * We have an id which isn't a macro call. We'll assume
4540 * it might be a label; we'll also check to see if a
4541 * colon follows it. Then, if there's another id after
4542 * that lot, we'll check it again for macro-hood.
4544 label = last = t;
4545 t = t->next;
4546 if (tok_type_(t, TOK_WHITESPACE))
4547 last = t, t = t->next;
4548 if (tok_is_(t, ":")) {
/* The label already carries its colon, so none is appended later. */
4549 dont_prepend = 1;
4550 last = t, t = t->next;
4551 if (tok_type_(t, TOK_WHITESPACE))
4552 last = t, t = t->next;
4554 if (!tok_type_(t, TOK_ID) || !(m = is_mmacro(t, &params)))
4555 return 0;
/* Cut the label part (ending at `last') off from the macro call that starts at t. */
4556 last->next = NULL;
4557 mname = t->text;
4558 tline = t;
4562 * Fix up the parameters: this involves stripping leading and
4563 * trailing whitespace, then stripping braces if they are
4564 * present.
/* params[] is NULL-terminated; count it, then compute a token count for each parameter. */
4566 for (nparam = 0; params[nparam]; nparam++) ;
4567 paramlen = nparam ? nasm_malloc(nparam * sizeof(*paramlen)) : NULL;
4569 for (i = 0; params[i]; i++) {
4570 int brace = false;
/* A comma ends the parameter, except for the last parameter of a `plus' macro and for braced parameters. */
4571 int comma = (!m->plus || i < nparam - 1);
4573 t = params[i];
4574 skip_white_(t);
4575 if (tok_is_(t, "{"))
4576 t = t->next, brace = true, comma = false;
4577 params[i] = t;
4578 paramlen[i] = 0;
4579 while (t) {
4580 if (comma && t->type == TOK_OTHER && !strcmp(t->text, ","))
4581 break; /* ... because we have hit a comma */
4582 if (comma && t->type == TOK_WHITESPACE
4583 && tok_is_(t->next, ","))
4584 break; /* ... or a space then a comma */
4585 if (brace && t->type == TOK_OTHER && !strcmp(t->text, "}"))
4586 break; /* ... or a brace */
4587 t = t->next;
4588 paramlen[i]++;
4593 * OK, we have a MMacro structure together with a set of
4594 * parameters. We must now go through the expansion and push
4595 * copies of each Line on to istk->expansion. Substitution of
4596 * parameter tokens and macro-local tokens doesn't get done
4597 * until the single-line macro substitution process; this is
4598 * because delaying them allows us to change the semantics
4599 * later through %rotate.
4601 * First, push an end marker on to istk->expansion, mark this
4602 * macro as in progress, and set up its invocation-specific
4603 * variables.
4605 ll = nasm_malloc(sizeof(Line));
4606 ll->next = istk->expansion;
4607 ll->finishes = m;
4608 ll->first = NULL;
4609 istk->expansion = ll;
4612 * Save the previous MMacro expansion in the case of
4613 * macro recursion
4615 if (m->max_depth && m->in_progress)
4616 push_mmacro(m);
4618 m->in_progress ++;
4619 m->params = params;
4620 m->iline = tline;
4621 m->nparam = nparam;
4622 m->rotate = 0;
4623 m->paramlen = paramlen;
4624 m->unique = unique++;
4625 m->lineno = 0;
4626 m->condcnt = 0;
4628 m->next_active = istk->mstk;
4629 istk->mstk = m;
/* Copy every line of the macro body; each copy is pushed at the front of istk->expansion. */
4631 list_for_each(l, m->expansion) {
4632 Token **tail;
4634 ll = nasm_malloc(sizeof(Line));
4635 ll->finishes = NULL;
4636 ll->next = istk->expansion;
4637 istk->expansion = ll;
4638 tail = &ll->first;
4640 list_for_each(t, l->first) {
4641 Token *x = t;
4642 switch (t->type) {
4643 case TOK_PREPROC_Q:
4644 tt = *tail = new_Token(NULL, TOK_ID, mname, 0);
4645 break;
4646 case TOK_PREPROC_QQ:
4647 tt = *tail = new_Token(NULL, TOK_ID, m->name, 0);
4648 break;
4649 case TOK_PREPROC_ID:
/* %00 stands for the label of the call: substitute it, or emit nothing if there was no label, and remember not to emit the label line separately. */
4650 if (t->text[1] == '0' && t->text[2] == '0') {
4651 dont_prepend = -1;
4652 x = label;
4653 if (!x)
4654 continue;
4656 /* fall through */
4657 default:
4658 tt = *tail = new_Token(NULL, x->type, x->text, 0);
4659 break;
4661 tail = &tt->next;
4663 *tail = NULL;
4667 * If we had a label, push it on as the first line of
4668 * the macro expansion.
4670 if (label) {
/* dont_prepend < 0: the body used %00, so the label tokens are freed instead of being emitted as a line. */
4671 if (dont_prepend < 0)
4672 free_tlist(startline);
4673 else {
4674 ll = nasm_malloc(sizeof(Line));
4675 ll->finishes = NULL;
4676 ll->next = istk->expansion;
4677 istk->expansion = ll;
4678 ll->first = startline;
/* dont_prepend == 0: the label had no colon of its own, so one is appended. */
4679 if (!dont_prepend) {
4680 while (label->next)
4681 label = label->next;
4682 label->next = tt = new_Token(NULL, TOK_OTHER, ":", 0);
4687 list->uplevel(m->nolist ? LIST_MACRO_NOLIST : LIST_MACRO);
4689 return 1;
4692 /* The function that actually does the error reporting */
4693 static void verror(int severity, const char *fmt, va_list arg)
4695 char buff[1024];
4697 vsnprintf(buff, sizeof(buff), fmt, arg);
4699 if (istk && istk->mstk && istk->mstk->name)
4700 nasm_error(severity, "(%s:%d) %s", istk->mstk->name,
4701 istk->mstk->lineno, buff);
4702 else
4703 nasm_error(severity, "%s", buff);
4707 * Since preprocessor always operate only on the line that didn't
4708 * arrived yet, we should always use ERR_OFFBY1.
4710 static void error(int severity, const char *fmt, ...)
4712 va_list arg;
4714 /* If we're in a dead branch of IF or something like it, ignore the error */
4715 if (istk && istk->conds && !emitting(istk->conds->state))
4716 return;
4718 va_start(arg, fmt);
4719 verror(severity, fmt, arg);
4720 va_end(arg);
4724 * Because %else etc are evaluated in the state context
4725 * of the previous branch, errors might get lost with error():
4726 * %if 0 ... %else trailing garbage ... %endif
4727 * So %else etc should report errors with this function.
4729 static void error_precond(int severity, const char *fmt, ...)
4731 va_list arg;
4733 /* Only ignore the error if it's really in a dead branch */
4734 if (istk && istk->conds && istk->conds->state == COND_NEVER)
4735 return;
4737 va_start(arg, fmt);
4738 verror(severity, fmt, arg);
4739 va_end(arg);
4742 static void
4743 pp_reset(char *file, int apass, ListGen * listgen, StrList **deplist)
4745 Token *t;
4747 cstk = NULL;
4748 istk = nasm_malloc(sizeof(Include));
4749 istk->next = NULL;
4750 istk->conds = NULL;
4751 istk->expansion = NULL;
4752 istk->mstk = NULL;
4753 istk->fp = fopen(file, "r");
4754 istk->fname = NULL;
4755 src_set_fname(nasm_strdup(file));
4756 src_set_linnum(0);
4757 istk->lineinc = 1;
4758 if (!istk->fp)
4759 error(ERR_FATAL|ERR_NOFILE, "unable to open input file `%s'",
4760 file);
4761 defining = NULL;
4762 nested_mac_count = 0;
4763 nested_rep_count = 0;
4764 init_macros();
4765 unique = 0;
4766 if (tasm_compatible_mode) {
4767 stdmacpos = nasm_stdmac;
4768 } else {
4769 stdmacpos = nasm_stdmac_after_tasm;
4771 any_extrastdmac = extrastdmac && *extrastdmac;
4772 do_predef = true;
4773 list = listgen;
4776 * 0 for dependencies, 1 for preparatory passes, 2 for final pass.
4777 * The caller, however, will also pass in 3 for preprocess-only so
4778 * we can set __PASS__ accordingly.
4780 pass = apass > 2 ? 2 : apass;
4782 dephead = deptail = deplist;
4783 if (deplist) {
4784 StrList *sl = nasm_malloc(strlen(file)+1+sizeof sl->next);
4785 sl->next = NULL;
4786 strcpy(sl->str, file);
4787 *deptail = sl;
4788 deptail = &sl->next;
4792 * Define the __PASS__ macro. This is defined here unlike
4793 * all the other builtins, because it is special -- it varies between
4794 * passes.
4796 t = nasm_malloc(sizeof(*t));
4797 t->next = NULL;
4798 make_tok_num(t, apass);
4799 t->a.mac = NULL;
4800 define_smacro(NULL, "__PASS__", true, 0, t);
4803 static char *pp_getline(void)
4805 char *line;
4806 Token *tline;
4808 while (1) {
4810 * Fetch a tokenized line, either from the macro-expansion
4811 * buffer or from the input file.
4813 tline = NULL;
4814 while (istk->expansion && istk->expansion->finishes) {
4815 Line *l = istk->expansion;
4816 if (!l->finishes->name && l->finishes->in_progress > 1) {
4817 Line *ll;
4820 * This is a macro-end marker for a macro with no
4821 * name, which means it's not really a macro at all
4822 * but a %rep block, and the `in_progress' field is
4823 * more than 1, meaning that we still need to
4824 * repeat. (1 means the natural last repetition; 0
4825 * means termination by %exitrep.) We have
4826 * therefore expanded up to the %endrep, and must
4827 * push the whole block on to the expansion buffer
4828 * again. We don't bother to remove the macro-end
4829 * marker: we'd only have to generate another one
4830 * if we did.
4832 l->finishes->in_progress--;
4833 list_for_each(l, l->finishes->expansion) {
4834 Token *t, *tt, **tail;
4836 ll = nasm_malloc(sizeof(Line));
4837 ll->next = istk->expansion;
4838 ll->finishes = NULL;
4839 ll->first = NULL;
4840 tail = &ll->first;
4842 list_for_each(t, l->first) {
4843 if (t->text || t->type == TOK_WHITESPACE) {
4844 tt = *tail = new_Token(NULL, t->type, t->text, 0);
4845 tail = &tt->next;
4849 istk->expansion = ll;
4851 } else {
4853 * Check whether a `%rep' was started and not ended
4854 * within this macro expansion. This can happen and
4855 * should be detected. It's a fatal error because
4856 * I'm too confused to work out how to recover
4857 * sensibly from it.
4859 if (defining) {
4860 if (defining->name)
4861 error(ERR_PANIC,
4862 "defining with name in expansion");
4863 else if (istk->mstk->name)
4864 error(ERR_FATAL,
4865 "`%%rep' without `%%endrep' within"
4866 " expansion of macro `%s'",
4867 istk->mstk->name);
4871 * FIXME: investigate the relationship at this point between
4872 * istk->mstk and l->finishes
4875 MMacro *m = istk->mstk;
4876 istk->mstk = m->next_active;
4877 if (m->name) {
4879 * This was a real macro call, not a %rep, and
4880 * therefore the parameter information needs to
4881 * be freed.
4883 if (m->prev) {
4884 pop_mmacro(m);
4885 l->finishes->in_progress --;
4886 } else {
4887 nasm_free(m->params);
4888 free_tlist(m->iline);
4889 nasm_free(m->paramlen);
4890 l->finishes->in_progress = 0;
4892 } else
4893 free_mmacro(m);
4895 istk->expansion = l->next;
4896 nasm_free(l);
4897 list->downlevel(LIST_MACRO);
4900 while (1) { /* until we get a line we can use */
4902 if (istk->expansion) { /* from a macro expansion */
4903 char *p;
4904 Line *l = istk->expansion;
4905 if (istk->mstk)
4906 istk->mstk->lineno++;
4907 tline = l->first;
4908 istk->expansion = l->next;
4909 nasm_free(l);
4910 p = detoken(tline, false);
4911 list->line(LIST_MACRO, p);
4912 nasm_free(p);
4913 break;
4915 line = read_line();
4916 if (line) { /* from the current input file */
4917 line = prepreproc(line);
4918 tline = tokenize(line);
4919 nasm_free(line);
4920 break;
4923 * The current file has ended; work down the istk
4926 Include *i = istk;
4927 fclose(i->fp);
4928 if (i->conds)
4929 error(ERR_FATAL,
4930 "expected `%%endif' before end of file");
4931 /* only set line and file name if there's a next node */
4932 if (i->next) {
4933 src_set_linnum(i->lineno);
4934 nasm_free(src_set_fname(i->fname));
4936 istk = i->next;
4937 list->downlevel(LIST_INCLUDE);
4938 nasm_free(i);
4939 if (!istk)
4940 return NULL;
4941 if (istk->expansion && istk->expansion->finishes)
4942 break;
4947 * We must expand MMacro parameters and MMacro-local labels
4948 * _before_ we plunge into directive processing, to cope
4949 * with things like `%define something %1' such as STRUC
4950 * uses. Unless we're _defining_ a MMacro, in which case
4951 * those tokens should be left alone to go into the
4952 * definition; and unless we're in a non-emitting
4953 * condition, in which case we don't want to meddle with
4954 * anything.
4956 if (!defining && !(istk->conds && !emitting(istk->conds->state))
4957 && !(istk->mstk && !istk->mstk->in_progress)) {
4958 tline = expand_mmac_params(tline);
4962 * Check the line to see if it's a preprocessor directive.
4964 if (do_directive(tline) == DIRECTIVE_FOUND) {
4965 continue;
4966 } else if (defining) {
4968 * We're defining a multi-line macro. We emit nothing
4969 * at all, and just
4970 * shove the tokenized line on to the macro definition.
4972 Line *l = nasm_malloc(sizeof(Line));
4973 l->next = defining->expansion;
4974 l->first = tline;
4975 l->finishes = NULL;
4976 defining->expansion = l;
4977 continue;
4978 } else if (istk->conds && !emitting(istk->conds->state)) {
4980 * We're in a non-emitting branch of a condition block.
4981 * Emit nothing at all, not even a blank line: when we
4982 * emerge from the condition we'll give a line-number
4983 * directive so we keep our place correctly.
4985 free_tlist(tline);
4986 continue;
4987 } else if (istk->mstk && !istk->mstk->in_progress) {
4989 * We're in a %rep block which has been terminated, so
4990 * we're walking through to the %endrep without
4991 * emitting anything. Emit nothing at all, not even a
4992 * blank line: when we emerge from the %rep block we'll
4993 * give a line-number directive so we keep our place
4994 * correctly.
4996 free_tlist(tline);
4997 continue;
4998 } else {
4999 tline = expand_smacro(tline);
5000 if (!expand_mmacro(tline)) {
5002 * De-tokenize the line again, and emit it.
5004 line = detoken(tline, true);
5005 free_tlist(tline);
5006 break;
5007 } else {
5008 continue; /* expand_mmacro calls free_tlist */
5013 return line;
5016 static void pp_cleanup(int pass)
5018 if (defining) {
5019 if (defining->name) {
5020 error(ERR_NONFATAL,
5021 "end of file while still defining macro `%s'",
5022 defining->name);
5023 } else {
5024 error(ERR_NONFATAL, "end of file while still in %%rep");
5027 free_mmacro(defining);
5028 defining = NULL;
5030 while (cstk)
5031 ctx_pop();
5032 free_macros();
5033 while (istk) {
5034 Include *i = istk;
5035 istk = istk->next;
5036 fclose(i->fp);
5037 nasm_free(i->fname);
5038 nasm_free(i);
5040 while (cstk)
5041 ctx_pop();
5042 nasm_free(src_set_fname(NULL));
5043 if (pass == 0) {
5044 IncPath *i;
5045 free_llist(predef);
5046 delete_Blocks();
5047 while ((i = ipath)) {
5048 ipath = i->next;
5049 if (i->path)
5050 nasm_free(i->path);
5051 nasm_free(i);
5056 void pp_include_path(char *path)
5058 IncPath *i;
5060 i = nasm_malloc(sizeof(IncPath));
5061 i->path = path ? nasm_strdup(path) : NULL;
5062 i->next = NULL;
5064 if (ipath) {
5065 IncPath *j = ipath;
5066 while (j->next)
5067 j = j->next;
5068 j->next = i;
5069 } else {
5070 ipath = i;
5074 void pp_pre_include(char *fname)
5076 Token *inc, *space, *name;
5077 Line *l;
5079 name = new_Token(NULL, TOK_INTERNAL_STRING, fname, 0);
5080 space = new_Token(name, TOK_WHITESPACE, NULL, 0);
5081 inc = new_Token(space, TOK_PREPROC_ID, "%include", 0);
5083 l = nasm_malloc(sizeof(Line));
5084 l->next = predef;
5085 l->first = inc;
5086 l->finishes = NULL;
5087 predef = l;
5090 void pp_pre_define(char *definition)
5092 Token *def, *space;
5093 Line *l;
5094 char *equals;
5096 equals = strchr(definition, '=');
5097 space = new_Token(NULL, TOK_WHITESPACE, NULL, 0);
5098 def = new_Token(space, TOK_PREPROC_ID, "%define", 0);
5099 if (equals)
5100 *equals = ' ';
5101 space->next = tokenize(definition);
5102 if (equals)
5103 *equals = '=';
5105 l = nasm_malloc(sizeof(Line));
5106 l->next = predef;
5107 l->first = def;
5108 l->finishes = NULL;
5109 predef = l;
5112 void pp_pre_undefine(char *definition)
5114 Token *def, *space;
5115 Line *l;
5117 space = new_Token(NULL, TOK_WHITESPACE, NULL, 0);
5118 def = new_Token(space, TOK_PREPROC_ID, "%undef", 0);
5119 space->next = tokenize(definition);
5121 l = nasm_malloc(sizeof(Line));
5122 l->next = predef;
5123 l->first = def;
5124 l->finishes = NULL;
5125 predef = l;
5129 * Added by Keith Kanios:
5131 * This function is used to assist with "runtime" preprocessor
5132 * directives. (e.g. pp_runtime("%define __BITS__ 64");)
5134 * ERRORS ARE IGNORED HERE, SO MAKE COMPLETELY SURE THAT YOU
5135 * PASS A VALID STRING TO THIS FUNCTION!!!!!
5138 void pp_runtime(char *definition)
5140 Token *def;
5142 def = tokenize(definition);
5143 if (do_directive(def) == NO_DIRECTIVE_FOUND)
5144 free_tlist(def);
5148 void pp_extra_stdmac(macros_t *macros)
5150 extrastdmac = macros;
5153 static void make_tok_num(Token * tok, int64_t val)
5155 char numbuf[20];
5156 snprintf(numbuf, sizeof(numbuf), "%"PRId64"", val);
5157 tok->text = nasm_strdup(numbuf);
5158 tok->type = TOK_NUMBER;
5161 Preproc nasmpp = {
5162 pp_reset,
5163 pp_getline,
5164 pp_cleanup