Cache regex compilation for another autoconf speedup.
[m4/ericb.git] / src / macro.c
blobf9c5fe140bba0c2cbddf90d35d2d18e07e0df941
1 /* GNU m4 -- A simple macro processor
3 Copyright (C) 1989, 1990, 1991, 1992, 1993, 1994, 2006, 2007 Free
4 Software Foundation, Inc.
6 This file is part of GNU M4.
8 GNU M4 is free software: you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation, either version 3 of the License, or
11 (at your option) any later version.
13 GNU M4 is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with this program. If not, see <http://www.gnu.org/licenses/>.
/* This file contains the functions that perform the basic argument
   parsing and macro expansion.  */
25 #include "m4.h"
/* Forward declarations.  expand_token () calls expand_macro (), which
   in turn reaches expand_token () again through collect_arguments ()
   and expand_argument ().  */
static void expand_macro (symbol *);
static void expand_token (struct obstack *, token_type, token_data *, int);

/* Current recursion level in expand_macro ().  It is incremented on
   entry to expand_macro (), compared against nesting_limit there, and
   decremented again before expand_macro () returns.  */
int expansion_level = 0;

/* The number of the current call of expand_macro ().  It is
   incremented once per call; each call keeps its own copy and passes
   it to the trace functions.  */
static int macro_call_id = 0;

/* The shared stack of collected arguments for macro calls; as each
   argument is collected, it is finished and its location stored in
   argv_stack.  Normally, this stack can be used simultaneously by
   multiple macro calls; the exception is when an outer macro has
   generated some text, then calls a nested macro, in which case the
   nested macro must use a local stack to leave the unfinished text
   alone.  Too bad obstack.h does not provide an easy way to reopen a
   finished object for further growth, but in practice this does not
   hurt us too much.  */
static struct obstack argc_stack;

/* The shared stack of pointers to collected arguments for macro
   calls.  This object is never finished; we exploit the fact that
   obstack_blank is documented to take a negative size to reduce the
   size again.  */
static struct obstack argv_stack;
53 /*----------------------------------------------------------------------.
54 | This function read all input, and expands each token, one at a time. |
55 `----------------------------------------------------------------------*/
57 void
58 expand_input (void)
60 token_type t;
61 token_data td;
62 int line;
64 obstack_init (&argc_stack);
65 obstack_init (&argv_stack);
67 while ((t = next_token (&td, &line)) != TOKEN_EOF)
68 expand_token ((struct obstack *) NULL, t, &td, line);
70 obstack_free (&argc_stack, NULL);
71 obstack_free (&argv_stack, NULL);
75 /*------------------------------------------------------------------------.
76 | Expand one token, according to its type. Potential macro names |
77 | (TOKEN_WORD) are looked up in the symbol table, to see if they have a |
78 | macro definition. If they have, they are expanded as macros, otherwise |
79 | the text are just copied to the output. |
80 `------------------------------------------------------------------------*/
82 static void
83 expand_token (struct obstack *obs, token_type t, token_data *td, int line)
85 symbol *sym;
87 switch (t)
88 { /* TOKSW */
89 case TOKEN_EOF:
90 case TOKEN_MACDEF:
91 break;
93 case TOKEN_OPEN:
94 case TOKEN_COMMA:
95 case TOKEN_CLOSE:
96 case TOKEN_SIMPLE:
97 case TOKEN_STRING:
98 shipout_text (obs, TOKEN_DATA_TEXT (td), strlen (TOKEN_DATA_TEXT (td)),
99 line);
100 break;
102 case TOKEN_WORD:
103 sym = lookup_symbol (TOKEN_DATA_TEXT (td), SYMBOL_LOOKUP);
104 if (sym == NULL || SYMBOL_TYPE (sym) == TOKEN_VOID
105 || (SYMBOL_TYPE (sym) == TOKEN_FUNC
106 && SYMBOL_BLIND_NO_ARGS (sym)
107 && peek_token () != TOKEN_OPEN))
109 #ifdef ENABLE_CHANGEWORD
110 shipout_text (obs, TOKEN_DATA_ORIG_TEXT (td),
111 strlen (TOKEN_DATA_ORIG_TEXT (td)), line);
112 #else
113 shipout_text (obs, TOKEN_DATA_TEXT (td),
114 strlen (TOKEN_DATA_TEXT (td)), line);
115 #endif
117 else
118 expand_macro (sym);
119 break;
121 default:
122 M4ERROR ((warning_status, 0,
123 "INTERNAL ERROR: bad token type in expand_token ()"));
124 abort ();
129 /*-------------------------------------------------------------------------.
130 | This function parses one argument to a macro call. It expects the first |
131 | left parenthesis, or the separating comma to have been read by the |
132 | caller. It skips leading whitespace, and reads and expands tokens, |
133 | until it finds a comma or an right parenthesis at the same level of |
134 | parentheses. It returns a flag indicating whether the argument read are |
135 | the last for the active macro call. The argument are build on the |
136 | obstack OBS, indirectly through expand_token (). |
137 `-------------------------------------------------------------------------*/
139 static bool
140 expand_argument (struct obstack *obs, token_data *argp)
142 token_type t;
143 token_data td;
144 char *text;
145 int paren_level;
146 const char *file = current_file;
147 int line = current_line;
149 TOKEN_DATA_TYPE (argp) = TOKEN_VOID;
151 /* Skip leading white space. */
154 t = next_token (&td, NULL);
156 while (t == TOKEN_SIMPLE && isspace (to_uchar (*TOKEN_DATA_TEXT (&td))));
158 paren_level = 0;
160 while (1)
163 switch (t)
164 { /* TOKSW */
165 case TOKEN_COMMA:
166 case TOKEN_CLOSE:
167 if (paren_level == 0)
169 /* The argument MUST be finished, whether we want it or not. */
170 obstack_1grow (obs, '\0');
171 text = (char *) obstack_finish (obs);
173 if (TOKEN_DATA_TYPE (argp) == TOKEN_VOID)
175 TOKEN_DATA_TYPE (argp) = TOKEN_TEXT;
176 TOKEN_DATA_TEXT (argp) = text;
178 return t == TOKEN_COMMA;
180 /* fallthru */
181 case TOKEN_OPEN:
182 case TOKEN_SIMPLE:
183 text = TOKEN_DATA_TEXT (&td);
185 if (*text == '(')
186 paren_level++;
187 else if (*text == ')')
188 paren_level--;
189 expand_token (obs, t, &td, line);
190 break;
192 case TOKEN_EOF:
193 /* current_file changed to "" if we see TOKEN_EOF, use the
194 previous value we stored earlier. */
195 M4ERROR_AT_LINE ((EXIT_FAILURE, 0, file, line,
196 "ERROR: end of file in argument list"));
197 break;
199 case TOKEN_WORD:
200 case TOKEN_STRING:
201 expand_token (obs, t, &td, line);
202 break;
204 case TOKEN_MACDEF:
205 if (obstack_object_size (obs) == 0)
207 TOKEN_DATA_TYPE (argp) = TOKEN_FUNC;
208 TOKEN_DATA_FUNC (argp) = TOKEN_DATA_FUNC (&td);
210 break;
212 default:
213 M4ERROR ((warning_status, 0,
214 "INTERNAL ERROR: bad token type in expand_argument ()"));
215 abort ();
218 t = next_token (&td, NULL);
222 /*-------------------------------------------------------------------------.
223 | Collect all the arguments to a call of the macro SYM. The arguments are |
224 | stored on the obstack ARGUMENTS and a table of pointers to the arguments |
225 | on the obstack ARGPTR. |
226 `-------------------------------------------------------------------------*/
228 static void
229 collect_arguments (symbol *sym, struct obstack *argptr,
230 struct obstack *arguments)
232 token_data td;
233 token_data *tdp;
234 bool more_args;
235 bool groks_macro_args = SYMBOL_MACRO_ARGS (sym);
237 TOKEN_DATA_TYPE (&td) = TOKEN_TEXT;
238 TOKEN_DATA_TEXT (&td) = SYMBOL_NAME (sym);
239 tdp = (token_data *) obstack_copy (arguments, &td, sizeof td);
240 obstack_ptr_grow (argptr, tdp);
242 if (peek_token () == TOKEN_OPEN)
244 next_token (&td, NULL); /* gobble parenthesis */
247 more_args = expand_argument (arguments, &td);
249 if (!groks_macro_args && TOKEN_DATA_TYPE (&td) == TOKEN_FUNC)
251 TOKEN_DATA_TYPE (&td) = TOKEN_TEXT;
252 TOKEN_DATA_TEXT (&td) = (char *) "";
254 tdp = (token_data *) obstack_copy (arguments, &td, sizeof td);
255 obstack_ptr_grow (argptr, tdp);
257 while (more_args);
262 /*------------------------------------------------------------------------.
263 | The actual call of a macro is handled by call_macro (). call_macro () |
264 | is passed a symbol SYM, whose type is used to call either a builtin |
265 | function, or the user macro expansion function expand_user_macro () |
266 | (lives in builtin.c). There are ARGC arguments to the call, stored in |
267 | the ARGV table. The expansion is left on the obstack EXPANSION. Macro |
268 | tracing is also handled here. |
269 `------------------------------------------------------------------------*/
271 void
272 call_macro (symbol *sym, int argc, token_data **argv,
273 struct obstack *expansion)
275 switch (SYMBOL_TYPE (sym))
277 case TOKEN_FUNC:
278 (*SYMBOL_FUNC (sym)) (expansion, argc, argv);
279 break;
281 case TOKEN_TEXT:
282 expand_user_macro (expansion, sym, argc, argv);
283 break;
285 default:
286 M4ERROR ((warning_status, 0,
287 "INTERNAL ERROR: bad symbol type in call_macro ()"));
288 abort ();
292 /*-------------------------------------------------------------------------.
293 | The macro expansion is handled by expand_macro (). It parses the |
294 | arguments, using collect_arguments (), and builds a table of pointers to |
295 | the arguments. The arguments themselves are stored on a local obstack. |
296 | Expand_macro () uses call_macro () to do the call of the macro. |
298 | Expand_macro () is potentially recursive, since it calls expand_argument |
299 | (), which might call expand_token (), which might call expand_macro (). |
300 `-------------------------------------------------------------------------*/
302 static void
303 expand_macro (symbol *sym)
305 struct obstack arguments; /* Alternate obstack if argc_stack is busy. */
306 unsigned argv_base; /* Size of argv_stack on entry. */
307 bool use_argc_stack = true; /* Whether argc_stack is safe. */
308 token_data **argv;
309 int argc;
310 struct obstack *expansion;
311 const char *expanded;
312 bool traced;
313 int my_call_id;
315 /* Report errors at the location where the open parenthesis (if any)
316 was found, but after expansion, restore global state back to the
317 location of the close parenthesis. This is safe since we
318 guarantee that macro expansion does not alter the state of
319 current_file/current_line (dnl, include, and sinclude are special
320 cased in the input engine to ensure this fact). */
321 const char *loc_open_file = current_file;
322 int loc_open_line = current_line;
323 const char *loc_close_file;
324 int loc_close_line;
326 SYMBOL_PENDING_EXPANSIONS (sym)++;
327 expansion_level++;
328 if (nesting_limit > 0 && expansion_level > nesting_limit)
329 M4ERROR ((EXIT_FAILURE, 0,
330 "recursion limit of %d exceeded, use -L<N> to change it",
331 nesting_limit));
333 macro_call_id++;
334 my_call_id = macro_call_id;
336 traced = (debug_level & DEBUG_TRACE_ALL) || SYMBOL_TRACED (sym);
338 argv_base = obstack_object_size (&argv_stack);
339 if (obstack_object_size (&argc_stack) > 0)
341 /* We cannot use argc_stack if this is a nested invocation, and an
342 outer invocation has an unfinished argument being
343 collected. */
344 obstack_init (&arguments);
345 use_argc_stack = false;
348 if (traced && (debug_level & DEBUG_TRACE_CALL))
349 trace_prepre (SYMBOL_NAME (sym), my_call_id);
351 collect_arguments (sym, &argv_stack,
352 use_argc_stack ? &argc_stack : &arguments);
354 argc = ((obstack_object_size (&argv_stack) - argv_base)
355 / sizeof (token_data *));
356 argv = (token_data **) ((char *) obstack_base (&argv_stack) + argv_base);
358 loc_close_file = current_file;
359 loc_close_line = current_line;
360 current_file = loc_open_file;
361 current_line = loc_open_line;
363 if (traced)
364 trace_pre (SYMBOL_NAME (sym), my_call_id, argc, argv);
366 expansion = push_string_init ();
367 call_macro (sym, argc, argv, expansion);
368 expanded = push_string_finish ();
370 if (traced)
371 trace_post (SYMBOL_NAME (sym), my_call_id, argc, argv, expanded);
373 current_file = loc_close_file;
374 current_line = loc_close_line;
376 --expansion_level;
377 --SYMBOL_PENDING_EXPANSIONS (sym);
379 if (SYMBOL_DELETED (sym))
380 free_symbol (sym);
382 if (use_argc_stack)
383 obstack_free (&argc_stack, argv[0]);
384 else
385 obstack_free (&arguments, NULL);
386 obstack_blank (&argv_stack, -argc * sizeof (token_data *));