2 * Wrc preprocessor lexical analysis
4 * Copyright 1999-2000 Bertho A. Stultiens (BS)
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
21 * 24-Apr-2000 BS - Started from scratch to restructure everything
22 * and reintegrate the source into the wine-tree.
23 * 04-Jan-2000 BS - Added comments about the lexicographical
24 * grammar to give some insight in the complexity.
25 * 28-Dec-1999 BS - Eliminated backing-up of the flexer by running
26 * `flex -b' on the source. This results in some
27 * weirdo extra rules, but a much faster scanner.
28 * 23-Dec-1999 BS - Started this file
30 *-------------------------------------------------------------------------
31 * The preprocessor's lexical grammar (approximately):
33 * pp := {ws} # {ws} if {ws} {expr} {ws} \n
34 * | {ws} # {ws} ifdef {ws} {id} {ws} \n
35 * | {ws} # {ws} ifndef {ws} {id} {ws} \n
36 * | {ws} # {ws} elif {ws} {expr} {ws} \n
37 * | {ws} # {ws} else {ws} \n
38 * | {ws} # {ws} endif {ws} \n
39 * | {ws} # {ws} include {ws} < {anytext} > \n
40 * | {ws} # {ws} include {ws} " {anytext} " \n
41 * | {ws} # {ws} include_next {ws} < {anytext} > \n
42 * | {ws} # {ws} include_next {ws} " {anytext} " \n
43 * | {ws} # {ws} define {ws} {anytext} \n
44 * | {ws} # {ws} define( {arglist} ) {ws} {expansion} \n
45 * | {ws} # {ws} pragma {ws} {anytext} \n
46 * | {ws} # {ws} ident {ws} {anytext} \n
47 * | {ws} # {ws} error {ws} {anytext} \n
48 * | {ws} # {ws} warning {ws} {anytext} \n
49 * | {ws} # {ws} line {ws} " {anytext} " {number} \n
50 * | {ws} # {ws} {number} " {anytext} " {number} [ {number} [{number}] ] \n
55 * expr := {expr} [+-*%^/|&] {expr}
56 * | {expr} {logor|logand} {expr}
58 * | {expr} ? {expr} : {expr}
64 * id := [a-zA-Z_][a-zA-Z0-9_]*
66 * anytext := [^\n]* (see note)
71 * | {arglist} , {id} ...
76 * | {anytext} ## {anytext}
80 * Note: "anytext" is not always "[^\n]*". This is because the
81 * trailing context must be considered as well.
83 * The only certain assumption for the preprocessor to make is that
84 * directives start at the beginning of the line, followed by a '#'
85 * and end with a newline.
86 * Any directive may be suffixed with a line-continuation. Also
87 * classical comment / *...* / (note: no comments within comments,
88 * therefore spaces) is considered to be a line-continuation
89 * (according to gcc and egcs AFAIK, ANSI is a bit vague).
90 * Comments have not been added to the above grammar for simplicity
91 * reasons. However, it is allowed to enter comment anywhere within
92 * the directives as long as they do not interfere with the context.
93 * All comments are considered to be deletable whitespace (both
94 * classical form "/ *...* /" and C++ form "//...\n").
96 * All recursive scans, except for macro-expansion, are done by the
97 * parser, whereas the simple state transitions of non-recursive
98 * directives are done in the scanner. This results in the many
99 * exclusive start-conditions of the scanner.
101 * Macro expansions are slightly more difficult because they have to
102 * prescan the arguments. Parameter substitution is literal if the
103 * substitution is # or ## (either side). This enables new identifiers
104 * to be created (see 'info cpp' node Macro|Pitfalls|Prescan for more
107 * FIXME: Variable macro parameters are recognized, but not yet
108 * expanded. I have to reread the ANSI standard on the subject (yes,
111 * The following special defines are supported:
112 * __FILE__ -> "thissource.c"
114 * __DATE__ -> "May 1 2000"
115 * __TIME__ -> "23:59:59"
116 * These macros expand, as expected, into their ANSI defined values.
118 * The same include prevention is implemented as in gcc and egcs.
119 * This results in faster processing because we do not read the text
120 * at all. Some wine-sources attempt to include the same file 4 or 5
121 * times. This strategy also saves a lot of blank output-lines, which in
122 * its turn improves the real resource scanner/parser.
127 * Special flex options and exclusive scanner start-conditions
130 %option 8bit never-interactive
157 cident [a-zA-Z_][0-9a-zA-Z_]*
158 ul [uUlL]|[uUlL][lL]|[lL][uU]|[lL][lL][uU]|[uU][lL][lL]|[lL][uU][lL]
167 #include "wpp_private.h"
171 * Make sure that we are running an appropriate version of flex.
173 #if !defined(YY_FLEX_MAJOR_VERSION) || (1000 * YY_FLEX_MAJOR_VERSION + YY_FLEX_MINOR_VERSION < 2005)
174 #error Must use flex version 2.5.1 or higher (yy_scan_* routines are required).
177 #define YY_USE_PROTOS
179 #define YY_READ_BUF_SIZE 65536 /* So we read most of a file at once */
181 #define yy_current_state() YY_START
182 #define yy_pp_state(x) yy_pop_state(); yy_push_state(x) /* Replace the current start-state with x. Expands to TWO statements (do not use as an unbraced if/else body) and x is evaluated after the pop */
185 * Always update the current character position within a line
187 #define YY_USER_ACTION pp_status.char_number+=ppleng;
190 * Buffer management for includes and expansions
192 #define MAXBUFFERSTACK 128 /* Nesting more than 128 includes or macro expansion texts is insane */
194 typedef struct bufferstackentry {
195 YY_BUFFER_STATE bufferstate; /* Buffer to switch back to */
196 pp_entry_t *define; /* Points to expanding define or NULL if handling includes */
197 int line_number; /* Line that we were handling */
198 int char_number; /* The current position on that line */
199 const char *filename; /* Filename that we were handling */
200 int if_depth; /* How many #if:s deep to check matching #endif:s */
201 int ncontinuations; /* Remember the continuation state */
202 int should_pop; /* Set if we must pop the start-state on EOF */
203 /* Include management */
204 include_state_t incl;
205 char *include_filename;
207 } bufferstackentry_t;
209 #define ALLOCBLOCKSIZE (1 << 10) /* Allocate these chunks at a time for string-buffers */
212 * Macro expansion nesting
213 * We need the stack to handle expansions while scanning
214 * a macro's arguments. The TOS must always be the macro
215 * that receives the current expansion from the scanner.
217 #define MAXMACEXPSTACK 128 /* Nesting more than 128 macro expansions is insane */
219 typedef struct macexpstackentry {
220 pp_entry_t *ppp; /* This macro we are scanning */
221 char **args; /* With these arguments */
222 char **ppargs; /* Resulting in these preprocessed arguments */
223 int *nnls; /* Number of newlines per argument */
224 int nargs; /* And this many arguments scanned */
225 int parentheses; /* Nesting level of () */
226 int curargsize; /* Current scanning argument's size */
227 int curargalloc; /* Current scanning argument's block allocated */
228 char *curarg; /* Current scanning argument's content */
229 } macexpstackentry_t;
231 #define MACROPARENTHESES() (top_macro()->parentheses)
236 static void newline(int);
237 static int make_number(int radix, YYSTYPE *val, const char *str, int len);
238 static void put_buffer(const char *s, int len);
239 static int is_c_h_include(char *fname, int quoted);
240 /* Buffer management */
241 static void push_buffer(pp_entry_t *ppp, char *filename, char *incname, int pop);
242 static bufferstackentry_t *pop_buffer(void);
243 /* String functions */
244 static void new_string(void);
245 static void add_string(const char *str, int len);
246 static char *get_string(void);
247 static void put_string(void);
248 static int string_start(void);
249 /* Macro functions */
250 static void push_macro(pp_entry_t *ppp);
251 static macexpstackentry_t *top_macro(void);
252 static macexpstackentry_t *pop_macro(void);
253 static void free_macro(macexpstackentry_t *mep);
254 static void add_text_to_macro(const char *text, int len);
255 static void macro_add_arg(int last);
256 static void macro_add_expansion(void);
258 static void expand_special(pp_entry_t *ppp);
259 static void expand_define(pp_entry_t *ppp);
260 static void expand_macro(macexpstackentry_t *mep);
265 static int ncontinuations;
267 static int strbuf_idx = 0;
268 static int strbuf_alloc = 0;
269 static char *strbuffer = NULL;
270 static int str_startline;
272 static macexpstackentry_t *macexpstack[MAXMACEXPSTACK];
273 static int macexpstackidx = 0;
275 static bufferstackentry_t bufferstack[MAXBUFFERSTACK];
276 static int bufferstackidx = 0;
278 static int pass_data=1;
283 include_state_t pp_incl_state =
291 includelogicentry_t *pp_includelogiclist = NULL;
296 **************************************************************************
297 * The scanner starts here
298 **************************************************************************
303 * Catch line-continuations.
304 * Note: Gcc keeps the line-continuations in, for example, strings
305 * intact. However, I prefer to remove them all so that the next
306 * scanner will not need to reduce the continuation state.
308 * <*>\\\n newline(0);
312 * Detect the leading # of a preprocessor directive.
314 <INITIAL,pp_ignore>^{ws}*# pp_incl_state.seen_junk++; yy_push_state(pp_pp);
317 * Scan for the preprocessor directives
319 <pp_pp>{ws}*include{ws}* if(yy_top_state() != pp_ignore) {yy_pp_state(pp_inc); return tINCLUDE;} else {yy_pp_state(pp_eol);}
320 <pp_pp>{ws}*include_next{ws}* if(yy_top_state() != pp_ignore) {yy_pp_state(pp_inc); return tINCLUDE_NEXT;} else {yy_pp_state(pp_eol);}
321 <pp_pp>{ws}*define{ws}* yy_pp_state(yy_current_state() != pp_ignore ? pp_def : pp_eol);
322 <pp_pp>{ws}*error{ws}* yy_pp_state(pp_eol); if(yy_top_state() != pp_ignore) return tERROR;
323 <pp_pp>{ws}*warning{ws}* yy_pp_state(pp_eol); if(yy_top_state() != pp_ignore) return tWARNING;
324 <pp_pp>{ws}*pragma{ws}* yy_pp_state(pp_eol); if(yy_top_state() != pp_ignore) return tPRAGMA;
325 <pp_pp>{ws}*ident{ws}* yy_pp_state(pp_eol); if(yy_top_state() != pp_ignore) return tPPIDENT;
326 <pp_pp>{ws}*undef{ws}* if(yy_top_state() != pp_ignore) {yy_pp_state(pp_ifd); return tUNDEF;} else {yy_pp_state(pp_eol);}
327 <pp_pp>{ws}*ifdef{ws}* yy_pp_state(pp_ifd); return tIFDEF;
328 <pp_pp>{ws}*ifndef{ws}* pp_incl_state.seen_junk--; yy_pp_state(pp_ifd); return tIFNDEF;
329 <pp_pp>{ws}*if{ws}* yy_pp_state(pp_if); return tIF;
330 <pp_pp>{ws}*elif{ws}* yy_pp_state(pp_if); return tELIF;
331 <pp_pp>{ws}*else{ws}* yy_pp_state(pp_endif); return tELSE;
332 <pp_pp>{ws}*endif{ws}* yy_pp_state(pp_endif); return tENDIF;
333 <pp_pp>{ws}*line{ws}* if(yy_top_state() != pp_ignore) {yy_pp_state(pp_line); return tLINE;} else {yy_pp_state(pp_eol);}
334 <pp_pp>{ws}+ if(yy_top_state() != pp_ignore) {yy_pp_state(pp_line); return tGCCLINE;} else {yy_pp_state(pp_eol);}
335 <pp_pp>{ws}*[a-z]+ pperror("Invalid preprocessor token '%s'", pptext);
336 <pp_pp>\r?\n newline(1); yy_pop_state(); return tNL; /* This could be the null-token */
337 <pp_pp>\\\r?\n newline(0);
338 <pp_pp>\\\r? pperror("Preprocessor junk '%s'", pptext);
339 <pp_pp>. return *pptext;
342 * Handle #include and #line
344 <pp_line>[0-9]+ return make_number(10, &pplval, pptext, ppleng);
345 <pp_inc>\< new_string(); add_string(pptext, ppleng); yy_push_state(pp_iqs);
346 <pp_inc,pp_line>\" new_string(); add_string(pptext, ppleng); yy_push_state(pp_dqs);
347 <pp_inc,pp_line>{ws}+ ;
348 <pp_inc,pp_line>\n newline(1); yy_pop_state(); return tNL;
349 <pp_inc,pp_line>\\\r?\n newline(0);
350 <pp_inc,pp_line>(\\\r?)|(.) pperror(yy_current_state() == pp_inc ? "Trailing junk in #include" : "Trailing junk in #line");
353 * Ignore all input when a false clause is parsed
355 <pp_ignore>[^#/\\\n]+ ;
356 <pp_ignore>\n newline(1);
357 <pp_ignore>\\\r?\n newline(0);
358 <pp_ignore>(\\\r?)|(.) ;
361 * Handle #if and #elif.
362 * These require conditionals to be evaluated, but we do not
363 * want to jam the scanner normally when we see these tokens.
364 * Note: tIDENT is handled below.
367 <pp_if>0[0-7]*{ul}? return make_number(8, &pplval, pptext, ppleng);
368 <pp_if>0[0-7]*[8-9]+{ul}? pperror("Invalid octal digit");
369 <pp_if>[1-9][0-9]*{ul}? return make_number(10, &pplval, pptext, ppleng);
370 <pp_if>0[xX][0-9a-fA-F]+{ul}? return make_number(16, &pplval, pptext, ppleng);
371 <pp_if>0[xX] pperror("Invalid hex number");
372 <pp_if>defined yy_push_state(pp_defined); return tDEFINED;
373 <pp_if>"<<" return tLSHIFT;
374 <pp_if>">>" return tRSHIFT;
375 <pp_if>"&&" return tLOGAND;
376 <pp_if>"||" return tLOGOR;
377 <pp_if>"==" return tEQ;
378 <pp_if>"!=" return tNE;
379 <pp_if>"<=" return tLTE;
380 <pp_if>">=" return tGTE;
381 <pp_if>\n newline(1); yy_pop_state(); return tNL;
382 <pp_if>\\\r?\n newline(0);
383 <pp_if>\\\r? pperror("Junk in conditional expression");
385 <pp_if>\' new_string(); add_string(pptext, ppleng); yy_push_state(pp_sqs);
386 <pp_if>\" pperror("String constants not allowed in conditionals");
387 <pp_if>. return *pptext;
390 * Handle #ifdef, #ifndef and #undef
391 * to get only an untranslated/unexpanded identifier
393 <pp_ifd>{cident} pplval.cptr = pp_xstrdup(pptext); return tIDENT;
395 <pp_ifd>\n newline(1); yy_pop_state(); return tNL;
396 <pp_ifd>\\\r?\n newline(0);
397 <pp_ifd>(\\\r?)|(.) pperror("Identifier expected");
400 * Handle #else and #endif.
403 <pp_endif>\n newline(1); yy_pop_state(); return tNL;
404 <pp_endif>\\\r?\n newline(0);
405 <pp_endif>. pperror("Garbage after #else or #endif.");
408 * Handle the special 'defined' keyword.
409 * This is necessary to get the identifier prior to any
412 <pp_defined>{cident} yy_pop_state(); pplval.cptr = pp_xstrdup(pptext); return tIDENT;
414 <pp_defined>(\()|(\)) return *pptext;
415 <pp_defined>\\\r?\n newline(0);
416 <pp_defined>(\\.)|(\n)|(.) pperror("Identifier expected");
419 * Handle #error, #warning, #pragma and #ident.
420 * Pass everything literally to the parser, which
421 * will act appropriately.
422 * Comments are stripped from the literal text.
424 <pp_eol>[^/\\\n]+ if(yy_top_state() != pp_ignore) { pplval.cptr = pp_xstrdup(pptext); return tLITERAL; }
425 <pp_eol>\/[^/\\\n*]* if(yy_top_state() != pp_ignore) { pplval.cptr = pp_xstrdup(pptext); return tLITERAL; }
426 <pp_eol>(\\\r?)|(\/[^/*]) if(yy_top_state() != pp_ignore) { pplval.cptr = pp_xstrdup(pptext); return tLITERAL; }
427 <pp_eol>\n newline(1); yy_pop_state(); if(yy_current_state() != pp_ignore) { return tNL; }
428 <pp_eol>\\\r?\n newline(0);
431 * Handle left side of #define
433 <pp_def>{cident}\( pplval.cptr = pp_xstrdup(pptext); pplval.cptr[ppleng-1] = '\0'; yy_pp_state(pp_macro); return tMACRO;
434 <pp_def>{cident} pplval.cptr = pp_xstrdup(pptext); yy_pp_state(pp_define); return tDEFINE;
436 <pp_def>\\\r?\n newline(0);
437 <pp_def>(\\\r?)|(\n)|(.) pperror("Identifier expected"); /* Anything but an identifier after #define; report through the preprocessor's pperror, not libc perror (which appends strerror(errno)) */
440 * Scan the substitution of a define
442 <pp_define>[^'"/\\\n]+ pplval.cptr = pp_xstrdup(pptext); return tLITERAL;
443 <pp_define>(\\\r?)|(\/[^/*]) pplval.cptr = pp_xstrdup(pptext); return tLITERAL;
444 <pp_define>\\\r?\n{ws}+ newline(0); pplval.cptr = pp_xstrdup(" "); return tLITERAL;
445 <pp_define>\\\r?\n newline(0);
446 <pp_define>\n newline(1); yy_pop_state(); return tNL;
447 <pp_define>\' new_string(); add_string(pptext, ppleng); yy_push_state(pp_sqs);
448 <pp_define>\" new_string(); add_string(pptext, ppleng); yy_push_state(pp_dqs);
451 * Scan the definition macro arguments
453 <pp_macro>\){ws}* yy_pp_state(pp_mbody); return tMACROEND;
455 <pp_macro>{cident} pplval.cptr = pp_xstrdup(pptext); return tIDENT;
456 <pp_macro>, return ',';
457 <pp_macro>"..." return tELIPSIS;
458 <pp_macro>(\\\r?)|(\n)|(.)|(\.\.?) pperror("Argument identifier expected");
459 <pp_macro>\\\r?\n newline(0);
462 * Scan the substitution of a macro
464 <pp_mbody>[^a-zA-Z0-9'"#/\\\n]+ pplval.cptr = pp_xstrdup(pptext); return tLITERAL;
465 <pp_mbody>{cident} pplval.cptr = pp_xstrdup(pptext); return tIDENT;
466 <pp_mbody>\#\# return tCONCAT;
467 <pp_mbody>\# return tSTRINGIZE;
468 <pp_mbody>[0-9][^'"#/\\\n]* pplval.cptr = pp_xstrdup(pptext); return tLITERAL;
469 <pp_mbody>(\\\r?)|(\/[^/*'"#\\\n]*) pplval.cptr = pp_xstrdup(pptext); return tLITERAL;
470 <pp_mbody>\\\r?\n{ws}+ newline(0); pplval.cptr = pp_xstrdup(" "); return tLITERAL;
471 <pp_mbody>\\\r?\n newline(0);
472 <pp_mbody>\n newline(1); yy_pop_state(); return tNL;
473 <pp_mbody>\' new_string(); add_string(pptext, ppleng); yy_push_state(pp_sqs);
474 <pp_mbody>\" new_string(); add_string(pptext, ppleng); yy_push_state(pp_dqs);
477 * Macro expansion text scanning.
478 * This state is active just after the identifier is scanned
479 * that triggers an expansion. We *must* delete the leading
480 * whitespace before we can start scanning for arguments.
482 * If we do not see a '(' as next trailing token, then we have
483 * a false alarm. We just continue with a nose-bleed...
485 <pp_macign>{ws}*/\( yy_pp_state(pp_macscan);
487 if(yy_top_state() != pp_macscan)
490 <pp_macign>{ws}*\\\r?\n newline(0);
491 <pp_macign>{ws}+|{ws}*\\\r?|. {
492 macexpstackentry_t *mac = pop_macro();
494 put_buffer(mac->ppp->ident, strlen(mac->ppp->ident));
495 put_buffer(pptext, ppleng);
500 * Macro expansion argument text scanning.
501 * This state is active when a macro's arguments are being read for expansion.
504 if(++MACROPARENTHESES() > 1)
505 add_text_to_macro(pptext, ppleng);
508 if(--MACROPARENTHESES() == 0)
514 add_text_to_macro(pptext, ppleng);
517 if(MACROPARENTHESES() > 1)
518 add_text_to_macro(pptext, ppleng);
522 <pp_macscan>\" new_string(); add_string(pptext, ppleng); yy_push_state(pp_dqs);
523 <pp_macscan>\' new_string(); add_string(pptext, ppleng); yy_push_state(pp_sqs);
524 <pp_macscan>"/*" yy_push_state(pp_comment); add_text_to_macro(" ", 1);
525 <pp_macscan>\n pp_status.line_number++; pp_status.char_number = 1; add_text_to_macro(pptext, ppleng);
526 <pp_macscan>([^/(),\\\n"']+)|(\/[^/*(),\\\n'"]*)|(\\\r?)|(.) add_text_to_macro(pptext, ppleng);
527 <pp_macscan>\\\r?\n newline(0);
530 * Comment handling (almost all start-conditions)
532 <INITIAL,pp_pp,pp_ignore,pp_eol,pp_inc,pp_if,pp_ifd,pp_endif,pp_defined,pp_def,pp_define,pp_macro,pp_mbody,RCINCL>"/*" yy_push_state(pp_comment);
533 <pp_comment>[^*\n]*|"*"+[^*/\n]* ;
534 <pp_comment>\n newline(0);
535 <pp_comment>"*"+"/" yy_pop_state();
538 * Remove C++ style comment (almost all start-conditions)
540 <INITIAL,pp_pp,pp_ignore,pp_eol,pp_inc,pp_if,pp_ifd,pp_endif,pp_defined,pp_def,pp_define,pp_macro,pp_mbody,pp_macscan,RCINCL>"//"[^\n]* {
541 if(pptext[ppleng-1] == '\\')
542 ppwarning("C++ style comment ends with an escaped newline (escape ignored)");
546 * Single, double and <> quoted constants
548 <INITIAL,pp_macexp>\" pp_incl_state.seen_junk++; new_string(); add_string(pptext, ppleng); yy_push_state(pp_dqs);
549 <INITIAL,pp_macexp>\' pp_incl_state.seen_junk++; new_string(); add_string(pptext, ppleng); yy_push_state(pp_sqs);
550 <pp_dqs>[^"\\\n]+ add_string(pptext, ppleng);
552 add_string(pptext, ppleng);
554 switch(yy_current_state())
561 if (yy_current_state()==RCINCL) yy_pop_state();
562 pplval.cptr = get_string();
565 pplval.cptr = get_string();
566 if (is_c_h_include(pplval.cptr, 1)) pass_data=0;
573 <pp_sqs>[^'\\\n]+ add_string(pptext, ppleng);
575 add_string(pptext, ppleng);
577 switch(yy_current_state())
582 pplval.cptr = get_string();
588 <pp_iqs>[^\>\\\n]+ add_string(pptext, ppleng);
590 add_string(pptext, ppleng);
592 pplval.cptr = get_string();
597 * This is tricky; we need to remove the line-continuation
598 * from preprocessor strings, but OTOH retain them in all
599 * other strings. This is because the resource grammar is
600 * even more braindead than initially analysed and line-
601 * continuations in strings introduce, sigh, newlines in
602 * the output. There goes the concept of non-breaking, non-
603 * spacing whitespace.
605 switch(yy_top_state())
615 add_string(pptext, ppleng);
619 <pp_iqs,pp_dqs,pp_sqs>\\. add_string(pptext, ppleng);
620 <pp_iqs,pp_dqs,pp_sqs>\n {
622 add_string(pptext, ppleng);
623 ppwarning("Newline in string constant encounterd (started line %d)", string_start());
627 * Identifier scanning
629 <INITIAL,pp_if,pp_inc,pp_macexp>{cident} {
631 pp_incl_state.seen_junk++;
632 if(!(ppp = pplookup(pptext)))
634 if(yy_current_state() == pp_inc)
635 pperror("Expected include filename");
637 if(yy_current_state() == pp_if)
639 pplval.cptr = pp_xstrdup(pptext);
643 if((yy_current_state()==INITIAL) && (strcasecmp(pptext,"RCINCLUDE")==0)){
644 yy_push_state(RCINCL);
647 else put_buffer(pptext, ppleng);
650 else if(!ppp->expanding)
661 yy_push_state(pp_macign);
665 pp_internal_error(__FILE__, __LINE__, "Invalid define type %d\n", ppp->type);
671 * Everything else that needs to be passed and
672 * newline and continuation handling
674 <INITIAL,pp_macexp>[^a-zA-Z_#'"/\\\n \r\t\f\v]+|(\/|\\)[^a-zA-Z_/*'"\\\n \r\t\v\f]* pp_incl_state.seen_junk++; put_buffer(pptext, ppleng);
675 <INITIAL,pp_macexp>{ws}+ put_buffer(pptext, ppleng);
676 <INITIAL>\n newline(1);
677 <INITIAL>\\\r?\n newline(0);
678 <INITIAL>\\\r? pp_incl_state.seen_junk++; put_buffer(pptext, ppleng);
681 * Special catcher for macro argument expansion to prevent
682 * newlines from propagating to the output or admin.
684 <pp_macexp>(\n)|(.)|(\\\r?(\n|.)) put_buffer(pptext, ppleng);
686 <RCINCL>[A-Za-z0-9_\.\\/]+ {
687 pplval.cptr=pp_xstrdup(pptext);
689 return tRCINCLUDEPATH;
695 new_string(); add_string(pptext,ppleng);yy_push_state(pp_dqs);
699 * This is a 'catch-all' rule to discover errors in the scanner
700 * in an orderly manner.
702 <*>. pp_incl_state.seen_junk++; ppwarning("Unmatched text '%c' (0x%02x); please report\n", isprint(*pptext & 0xff) ? *pptext : ' ', *pptext);
705 YY_BUFFER_STATE b = YY_CURRENT_BUFFER;
706 bufferstackentry_t *bep = pop_buffer();
708 if((!bep && pp_get_if_depth()) || (bep && pp_get_if_depth() != bep->if_depth))
709 ppwarning("Unmatched #if/#endif at end of file");
713 if(YY_START != INITIAL)
714 pperror("Unexpected end of file during preprocessing");
717 else if(bep->should_pop == 2)
719 macexpstackentry_t *mac;
728 **************************************************************************
730 **************************************************************************
742 *-------------------------------------------------------------------------
743 * Output newlines or set them as continuations
745 * Input: -1 - Don't count this one, but update local position (see pp_dqs)
746 * 0 - Line-continuation seen and cache output
747 * 1 - Newline seen and flush output
748 *-------------------------------------------------------------------------
750 static void newline(int dowrite)
752 pp_status.line_number++;
753 pp_status.char_number = 1;
761 for(;ncontinuations; ncontinuations--)
768 *-------------------------------------------------------------------------
769 * Make a number out of an any-base and suffixed string
771 * Possible number extensions:
774 * - "LL" long long int
776 * - "UL" unsigned long int
777 * - "ULL" unsigned long long int
778 * - "LU" unsigned long int
779 * - "LLU" unsigned long long int
783 * The sizes of resulting 'int' and 'long' are compiler specific.
784 * I depend on sizeof(int) > 2 here (although a relatively safe
786 * Long longs are not yet implemented because this is very compiler
787 * specific and I don't want to think too much about the problems.
789 *-------------------------------------------------------------------------
791 static int make_number(int radix, YYSTYPE *val, const char *str, int len)
799 ext[2] = toupper(str[len-1]);
800 ext[1] = len > 1 ? toupper(str[len-2]) : ' ';
801 ext[0] = len > 2 ? toupper(str[len-3]) : ' ';
803 if(!strcmp(ext, "LUL"))
804 pperror("Invalid constant suffix");
805 else if(!strcmp(ext, "LLU") || !strcmp(ext, "ULL"))
810 else if(!strcmp(ext+1, "LU") || !strcmp(ext+1, "UL"))
815 else if(!strcmp(ext+1, "LL"))
819 else if(!strcmp(ext+2, "L"))
823 else if(!strcmp(ext+2, "U"))
829 pp_internal_error(__FILE__, __LINE__, "long long constants not implemented yet");
833 val->ulong = strtoul(str, NULL, radix);
836 else if(!is_u && is_l)
838 val->slong = strtol(str, NULL, radix);
841 else if(is_u && !is_l)
843 val->uint = (unsigned int)strtoul(str, NULL, radix);
847 /* Else it must be an int... */
848 val->sint = (int)strtol(str, NULL, radix);
854 *-------------------------------------------------------------------------
855 * Macro and define expansion support
857 * FIXME: Variable macro arguments.
858 *-------------------------------------------------------------------------
860 static void expand_special(pp_entry_t *ppp)
862 const char *dbgtext = "?";
863 static char *buf = NULL;
865 assert(ppp->type == def_special);
867 if(!strcmp(ppp->ident, "__LINE__"))
869 dbgtext = "def_special(__LINE__)";
870 buf = pp_xrealloc(buf, 32);
871 sprintf(buf, "%d", pp_status.line_number);
873 else if(!strcmp(ppp->ident, "__FILE__"))
875 dbgtext = "def_special(__FILE__)";
876 buf = pp_xrealloc(buf, strlen(pp_status.input) + 3);
877 sprintf(buf, "\"%s\"", pp_status.input);
880 pp_internal_error(__FILE__, __LINE__, "Special macro '%s' not found...\n", ppp->ident);
883 fprintf(stderr, "expand_special(%d): %s:%d: '%s' -> '%s'\n",
886 pp_status.line_number,
892 push_buffer(ppp, NULL, NULL, 0);
897 static void expand_define(pp_entry_t *ppp)
899 assert(ppp->type == def_define);
902 fprintf(stderr, "expand_define(%d): %s:%d: '%s' -> '%s'\n",
905 pp_status.line_number,
908 if(ppp->subst.text && ppp->subst.text[0])
910 push_buffer(ppp, NULL, NULL, 0);
911 yy_scan_string(ppp->subst.text);
915 static int curdef_idx = 0;
916 static int curdef_alloc = 0;
917 static char *curdef_text = NULL;
919 static void add_text(const char *str, int len)
923 if(curdef_idx >= curdef_alloc || curdef_alloc - curdef_idx < len)
925 curdef_alloc += (len + ALLOCBLOCKSIZE-1) & ~(ALLOCBLOCKSIZE-1);
926 curdef_text = pp_xrealloc(curdef_text, curdef_alloc * sizeof(curdef_text[0]));
927 if(curdef_alloc > 65536)
928 ppwarning("Reallocating macro-expansion buffer larger than 64kB");
930 memcpy(&curdef_text[curdef_idx], str, len);
934 static mtext_t *add_expand_text(mtext_t *mtp, macexpstackentry_t *mep, int *nnl)
948 fprintf(stderr, "add_expand_text: exp_text: '%s'\n", mtp->subst.text);
949 add_text(mtp->subst.text, strlen(mtp->subst.text));
954 fprintf(stderr, "add_expand_text: exp_stringize(%d): '%s'\n",
956 mep->args[mtp->subst.argidx]);
957 cptr = mep->args[mtp->subst.argidx];
961 if(*cptr == '"' || *cptr == '\\')
971 fprintf(stderr, "add_expand_text: exp_concat\n");
972 /* Remove trailing whitespace from current expansion text */
975 if(isspace(curdef_text[curdef_idx-1] & 0xff))
980 /* tag current position and recursively expand the next part */
982 mtp = add_expand_text(mtp->next, mep, nnl);
984 /* Now get rid of the leading space of the expansion */
985 cptr = &curdef_text[tag];
986 n = curdef_idx - tag;
989 if(isspace(*cptr & 0xff))
997 if(cptr != &curdef_text[tag])
999 memmove(&curdef_text[tag], cptr, n);
1000 curdef_idx -= (curdef_idx - tag) - n;
1005 if((mtp->next && mtp->next->type == exp_concat) || (mtp->prev && mtp->prev->type == exp_concat))
1006 exp = mep->args[mtp->subst.argidx];
1008 exp = mep->ppargs[mtp->subst.argidx];
1011 add_text(exp, strlen(exp));
1012 *nnl -= mep->nnls[mtp->subst.argidx];
1013 cptr = strchr(exp, '\n');
1017 cptr = strchr(cptr+1, '\n');
1019 mep->nnls[mtp->subst.argidx] = 0;
1022 fprintf(stderr, "add_expand_text: exp_subst(%d): '%s'\n", mtp->subst.argidx, exp);
1026 pp_internal_error(__FILE__, __LINE__, "Invalid expansion type (%d) in macro expansion\n", mtp->type);
1031 static void expand_macro(macexpstackentry_t *mep)
1037 pp_entry_t *ppp = mep->ppp;
1038 int nargs = mep->nargs;
1040 assert(ppp->type == def_macro);
1041 assert(ppp->expanding == 0);
1043 if((ppp->nargs >= 0 && nargs != ppp->nargs) || (ppp->nargs < 0 && nargs < -ppp->nargs))
1044 pperror("Too %s macro arguments (%d)", nargs < abs(ppp->nargs) ? "few" : "many", nargs);
1046 for(n = 0; n < nargs; n++)
1047 nnl += mep->nnls[n];
1050 fprintf(stderr, "expand_macro(%d): %s:%d: '%s'(%d,%d) -> ...\n",
1053 pp_status.line_number,
1060 for(mtp = ppp->subst.mtext; mtp; mtp = mtp->next)
1062 if(!(mtp = add_expand_text(mtp, mep, &nnl)))
1066 for(n = 0; n < nnl; n++)
1069 /* To make sure there is room and termination (see below) */
1072 /* Strip trailing whitespace from expansion */
1073 for(k = curdef_idx, cptr = &curdef_text[curdef_idx-1]; k > 0; k--, cptr--)
1075 if(!isspace(*cptr & 0xff))
1080 * We must add *one* whitespace to make sure that there
1081 * is a token-separation after the expansion.
1087 /* Strip leading whitespace from expansion */
1088 for(n = 0, cptr = curdef_text; n < k; n++, cptr++)
1090 if(!isspace(*cptr & 0xff))
1097 fprintf(stderr, "expand_text: '%s'\n", curdef_text + n);
1098 push_buffer(ppp, NULL, NULL, 0);
1099 /*yy_scan_bytes(curdef_text + n, k - n);*/
1100 yy_scan_string(curdef_text + n);
1105 *-------------------------------------------------------------------------
1106 * String collection routines
1107 *-------------------------------------------------------------------------
1109 static void new_string(void)
1113 ppwarning("new_string: strbuf_idx != 0");
1116 str_startline = pp_status.line_number;
1119 static void add_string(const char *str, int len)
1123 if(strbuf_idx >= strbuf_alloc || strbuf_alloc - strbuf_idx < len)
1125 strbuf_alloc += (len + ALLOCBLOCKSIZE-1) & ~(ALLOCBLOCKSIZE-1);
1126 strbuffer = pp_xrealloc(strbuffer, strbuf_alloc * sizeof(strbuffer[0]));
1127 if(strbuf_alloc > 65536)
1128 ppwarning("Reallocating string buffer larger than 64kB");
1130 memcpy(&strbuffer[strbuf_idx], str, len);
1134 static char *get_string(void)
1136 char *str = pp_xmalloc(strbuf_idx + 1);
1137 memcpy(str, strbuffer, strbuf_idx);
1138 str[strbuf_idx] = '\0';
1145 static void put_string(void)
1147 put_buffer(strbuffer, strbuf_idx);
1153 static int string_start(void)
1155 return str_startline;
1160 *-------------------------------------------------------------------------
1162 *-------------------------------------------------------------------------
1164 static void push_buffer(pp_entry_t *ppp, char *filename, char *incname, int pop)
1167 printf("push_buffer(%d): %p %p %p %d\n", bufferstackidx, ppp, filename, incname, pop);
1168 if(bufferstackidx >= MAXBUFFERSTACK)
1169 pp_internal_error(__FILE__, __LINE__, "Buffer stack overflow");
1171 memset(&bufferstack[bufferstackidx], 0, sizeof(bufferstack[0]));
1172 bufferstack[bufferstackidx].bufferstate = YY_CURRENT_BUFFER;
1173 bufferstack[bufferstackidx].define = ppp;
1174 bufferstack[bufferstackidx].line_number = pp_status.line_number;
1175 bufferstack[bufferstackidx].char_number = pp_status.char_number;
1176 bufferstack[bufferstackidx].if_depth = pp_get_if_depth();
1177 bufferstack[bufferstackidx].should_pop = pop;
1178 bufferstack[bufferstackidx].filename = pp_status.input;
1179 bufferstack[bufferstackidx].ncontinuations = ncontinuations;
1180 bufferstack[bufferstackidx].incl = pp_incl_state;
1181 bufferstack[bufferstackidx].include_filename = incname;
1182 bufferstack[bufferstackidx].pass_data = pass_data;
1188 /* These will track the pperror to the correct file and line */
1189 pp_status.line_number = 1;
1190 pp_status.char_number = 1;
1191 pp_status.input = filename;
1195 pp_internal_error(__FILE__, __LINE__, "Pushing buffer without knowing where to go to");
/*
 * pop_buffer - restore the scanner context held in a bufferstack entry.
 *
 * Puts back pp_status (line, character, input name), ncontinuations,
 * pp_incl_state and pass_data from the entry, switches flex to the saved
 * buffer and returns a pointer to the entry.  When the include state
 * qualifies, an include-logic entry for the finished file is added to
 * pp_includelogiclist.
 *
 * Raises an internal error when bufferstackidx is negative.
 */
1199 static bufferstackentry_t *pop_buffer(void)
1201 if(bufferstackidx < 0)
1202 pp_internal_error(__FILE__, __LINE__, "Bufferstack underflow?");
1204 if(bufferstackidx == 0)
/* The definition recorded in the entry, if any, is no longer expanding. */
1209 if(bufferstack[bufferstackidx].define)
1210 bufferstack[bufferstackidx].define->expanding = 0;
/* Put back the position bookkeeping that push_buffer saved. */
1213 pp_status.line_number = bufferstack[bufferstackidx].line_number;
1214 pp_status.char_number = bufferstack[bufferstackidx].char_number;
1215 pp_status.input = bufferstack[bufferstackidx].filename;
1216 ncontinuations = bufferstack[bufferstackidx].ncontinuations;
1217 if(!bufferstack[bufferstackidx].should_pop)
/* Write a # <line> <file> 2 marker for the restored input to ppout. */
1220 fprintf(ppout, "# %d \"%s\" 2\n", pp_status.line_number, pp_status.input);
1222 /* We have EOF, check the include logic */
1223 if(pp_incl_state.state == 2 && !pp_incl_state.seen_junk && pp_incl_state.ppp)
1225 pp_entry_t *ppp = pplookup(pp_incl_state.ppp);
/*
 * Build a new include-logic entry that takes over the include filename of
 * this stack entry and link it at the head of pp_includelogiclist.
 */
1228 includelogicentry_t *iep = pp_xmalloc(sizeof(includelogicentry_t));
1231 iep->filename = bufferstack[bufferstackidx].include_filename;
1233 iep->next = pp_includelogiclist;
1235 iep->next->prev = iep;
1236 pp_includelogiclist = iep;
1238 fprintf(stderr, "pop_buffer: %s:%d: includelogic added, include_ppp='%s', file='%s'\n", pp_status.input, pp_status.line_number, pp_incl_state.ppp, iep->filename);
/* Otherwise the include filename is not handed over and is released here. */
1240 else if(bufferstack[bufferstackidx].include_filename)
1241 free(bufferstack[bufferstackidx].include_filename);
/* Release the current include state string, then restore the saved include state and pass_data. */
1243 if(pp_incl_state.ppp)
1244 free(pp_incl_state.ppp);
1245 pp_incl_state = bufferstack[bufferstackidx].incl;
1246 pass_data = bufferstack[bufferstackidx].pass_data;
/* Trace output describing the entry that is being restored. */
1252 printf("pop_buffer(%d): %p %p (%d, %d, %d) %p %d\n",
1254 bufferstack[bufferstackidx].bufferstate,
1255 bufferstack[bufferstackidx].define,
1256 bufferstack[bufferstackidx].line_number,
1257 bufferstack[bufferstackidx].char_number,
1258 bufferstack[bufferstackidx].if_depth,
1259 bufferstack[bufferstackidx].filename,
1260 bufferstack[bufferstackidx].should_pop);
/* Hand the saved flex buffer back to the scanner. */
1262 pp_switch_to_buffer(bufferstack[bufferstackidx].bufferstate);
/*
 * Entries pushed with should_pop set end while the scanner is in the
 * pp_macexp start condition; the collected text is then stored through
 * macro_add_expansion.  NOTE(review): confirm that any other start
 * condition is what leads to the internal error below.
 */
1264 if(bufferstack[bufferstackidx].should_pop)
1266 if(yy_current_state() == pp_macexp)
1267 macro_add_expansion();
1269 pp_internal_error(__FILE__, __LINE__, "Pop buffer and state without macro expansion state");
1273 return &bufferstack[bufferstackidx];
1278 *-------------------------------------------------------------------------
1279 * Macro nesting support
1280 *-------------------------------------------------------------------------
/*
 * push_macro - create a macro expansion stack entry for ppp.
 *
 * A zero-filled entry is allocated into macexpstack[macexpstackidx] and its
 * ppp field is pointed at the given definition.
 *
 * NOTE(review): the store below relies on pperror not returning when
 * macexpstackidx has reached MAXMACEXPSTACK; confirm that pperror is fatal.
 */
1282 static void push_macro(pp_entry_t *ppp)
1284 if(macexpstackidx >= MAXMACEXPSTACK)
1285 pperror("Too many nested macros");
1287 macexpstack[macexpstackidx] = pp_xmalloc(sizeof(macexpstack[0][0]));
1288 memset( macexpstack[macexpstackidx], 0, sizeof(macexpstack[0][0]));
1289 macexpstack[macexpstackidx]->ppp = ppp;
1293 static macexpstackentry_t *top_macro(void)
1295 return macexpstackidx > 0 ? macexpstack[macexpstackidx-1] : NULL;
1298 static macexpstackentry_t *pop_macro(void)
1300 if(macexpstackidx <= 0)
1301 pp_internal_error(__FILE__, __LINE__, "Macro expansion stack underflow\n");
1302 return macexpstack[--macexpstackidx];
/*
 * free_macro - dispose of a macro expansion stack entry (going by the name).
 *
 *   mep - entry to dispose of; the loop below visits each of its
 *         mep->nargs argument slots
 */
1305 static void free_macro(macexpstackentry_t *mep)
1309 for(i = 0; i < mep->nargs; i++)
1320 static void add_text_to_macro(const char *text, int len)
1322 macexpstackentry_t *mep = top_macro();
1324 assert(mep->ppp->expanding == 0);
1326 if(mep->curargalloc - mep->curargsize <= len+1) /* +1 for '\0' */
1328 mep->curargalloc += (ALLOCBLOCKSIZE > len+1) ? ALLOCBLOCKSIZE : len+1;
1329 mep->curarg = pp_xrealloc(mep->curarg, mep->curargalloc * sizeof(mep->curarg[0]));
1331 memcpy(mep->curarg + mep->curargsize, text, len);
1332 mep->curargsize += len;
1333 mep->curarg[mep->curargsize] = '\0';
/*
 * macro_add_arg - close the argument being collected for the macro on top of
 * the expansion stack and append it to the argument list of that macro.
 *
 *   last - nonzero for the final argument: the rescan below is then done even
 *          for an empty argument, and push_buffer receives 2 instead of 1 as
 *          its pop value
 *
 * The macro on top of the stack must not be flagged as expanding.
 */
1336 static void macro_add_arg(int last)
1340 macexpstackentry_t *mep = top_macro();
1342 assert(mep->ppp->expanding == 0);
/* Make room for one more slot in each of the three per-argument arrays. */
1344 mep->args = pp_xrealloc(mep->args, (mep->nargs+1) * sizeof(mep->args[0]));
1345 mep->ppargs = pp_xrealloc(mep->ppargs, (mep->nargs+1) * sizeof(mep->ppargs[0]));
1346 mep->nnls = pp_xrealloc(mep->nnls, (mep->nargs+1) * sizeof(mep->nnls[0]));
/* Keep a private copy of the collected text; no text at all becomes the empty string. */
1347 mep->args[mep->nargs] = pp_xstrdup(mep->curarg ? mep->curarg : "");
/* Start one position before the copy so that the first strchr call begins at its first character. */
1348 cptr = mep->args[mep->nargs]-1;
/* Visit every newline character in the copy. */
1349 while((cptr = strchr(cptr+1, '\n')))
1353 mep->nnls[mep->nargs] = nnl;
/* The collection buffer starts out empty again for the next argument. */
1356 mep->curargalloc = mep->curargsize = 0;
1360 fprintf(stderr, "macro_add_arg: %s:%d: %d -> '%s'\n",
1362 pp_status.line_number,
1364 mep->args[mep->nargs-1]);
1366 /* Each macro argument must be expanded to cope with stringize */
1367 if(last || mep->args[mep->nargs-1][0])
/*
 * Rescan the raw argument text in the pp_macexp start condition; the current
 * buffer is saved first so that pop_buffer can return to it.
 */
1369 yy_push_state(pp_macexp);
1370 push_buffer(NULL, NULL, NULL, last ? 2 : 1);
1371 yy_scan_string(mep->args[mep->nargs-1]);
1372 /*mep->bufferstackidx = bufferstackidx; But not nested! */
/*
 * macro_add_expansion - store the text collected in curarg as the expanded
 * form of the most recently added argument of the macro on top of the
 * expansion stack.
 *
 * The macro on top of the stack must not be flagged as expanding.
 */
1376 static void macro_add_expansion(void)
1378 macexpstackentry_t *mep = top_macro();
1380 assert(mep->ppp->expanding == 0);
/* A copy of the collected text (or the empty string) goes into the ppargs slot of the last argument. */
1382 mep->ppargs[mep->nargs-1] = pp_xstrdup(mep->curarg ? mep->curarg : "");
/* The collection buffer counters start from zero again. */
1384 mep->curargalloc = mep->curargsize = 0;
1388 fprintf(stderr, "macro_add_expansion: %s:%d: %d -> '%s'\n",
1390 pp_status.line_number,
1392 mep->ppargs[mep->nargs-1]);
1397 *-------------------------------------------------------------------------
1399 *-------------------------------------------------------------------------
/*
 * put_buffer - emit len bytes starting at s.
 *
 * The bytes are either appended to the macro argument being collected
 * (add_text_to_macro) or written to ppout.
 * NOTE(review): confirm the condition that selects between the two sinks.
 */
1401 static void put_buffer(const char *s, int len)
1404 add_text_to_macro(s, len);
1407 fwrite(s, 1, len, ppout);
1413 *-------------------------------------------------------------------------
1414 * Include management
1415 *-------------------------------------------------------------------------
/*
 * is_c_h_include - tell whether a filename ends in a dot followed by c or h.
 *
 *   fname  - NUL-terminated filename to examine
 *   quoted - 1 when fname is still wrapped in its include delimiters (the
 *            closing one is then skipped and the minimum length grows by
 *            two), 0 when fname is the bare name
 *
 * Returns 1 when the name ends in .c or .h, compared without regard to case,
 * and 0 otherwise, including when the name is too short to carry such a
 * suffix.
 */
static int is_c_h_include(char *fname, int quoted)
{
	int sl = (int)strlen(fname);
	int ext;

	if (sl < 2 + 2 * quoted) return 0;

	/*
	 * toupper() is only defined for EOF and values representable as
	 * unsigned char, so a plain char must be converted before the call.
	 */
	ext = toupper((unsigned char)fname[sl - 1 - quoted]);
	if (ext != 'H' && ext != 'C') return 0;
	if (fname[sl - 2 - quoted] != '.') return 0;
	return 1;
}
/*
 * pp_do_include - switch the scanner over to an include file.
 *
 *   fname - include name still wrapped in its delimiters: the file is opened
 *           as fname+1 and the closing delimiter is put back afterwards
 *   type  - nonzero: the current input name is passed to pp_open_include as
 *           the including file; zero: NULL is passed instead and the marker
 *           written to ppout carries an extra 3 flag
 *
 * The current context is saved with push_buffer, the include state is reset,
 * flex is pointed at the opened file and a # 1 <path> 1 marker is written to
 * ppout.
 */
1426 void pp_do_include(char *fname, int type)
1430 includelogicentry_t *iep;
/* Look for an include-logic entry recorded under exactly this name. */
1432 for(iep = pp_includelogiclist; iep; iep = iep->next)
1434 if(!strcmp(iep->filename, fname))
1437 * We are done. The file was included before.
1438 * If the define was deleted, then this entry would have
1448 pperror("Empty include filename");
1450 /* Undo the effect of the quotation */
/* Open the file named after the leading delimiter; newpath receives the path that was opened. */
1453 if((ppin = pp_open_include(fname+1, type ? pp_status.input : NULL, &newpath, type)) == NULL)
1454 pperror("Unable to open include file %s", fname+1);
1456 fname[n-1] = *fname; /* Redo the quotes */
/* Save the current context; newpath becomes the input name and fname the include filename of the stack entry. */
1457 push_buffer(NULL, newpath, fname, 0);
/* The new file starts with a fresh include state. */
1458 pp_incl_state.seen_junk = 0;
1459 pp_incl_state.state = 0;
1460 pp_incl_state.ppp = NULL;
/* Paths ending in .c or .h switch pass_data off. */
1461 if (is_c_h_include(newpath, 0)) pass_data=0;
/* NOTE(review): pp_incl_state.ppp was set to NULL just above and is handed to a %s conversion here. */
1465 fprintf(stderr, "pp_do_include: %s:%d: include_state=%d, include_ppp='%s', include_ifdepth=%d ,pass_data=%d\n",
1466 pp_status.input, pp_status.line_number, pp_incl_state.state, pp_incl_state.ppp, pp_incl_state.ifdepth, pass_data);
/* Let flex read from the newly opened file. */
1467 pp_switch_to_buffer(pp_create_buffer(ppin, YY_BUF_SIZE));
/* Announce the new file on ppout. */
1469 fprintf(ppout, "# 1 \"%s\" 1%s\n", newpath, type ? "" : " 3");
1473 *-------------------------------------------------------------------------
1474 * Push/pop preprocessor ignore state when processing conditionals
1476 *-------------------------------------------------------------------------
1478 void pp_push_ignore_state(void)
1480 yy_push_state(pp_ignore);
1483 void pp_pop_ignore_state(void)