ppl.l 45.6 KB
Newer Older
1
/* -*-C-*-
2 3 4 5
 * Wrc preprocessor lexical analysis
 *
 * Copyright 1999-2000	Bertho A. Stultiens (BS)
 *
6 7 8 9 10 11 12 13 14 15 16 17
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
18
 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
19 20
 *
 * History:
21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47
 * 24-Apr-2000 BS	- Started from scratch to restructure everything
 *			  and reintegrate the source into the wine-tree.
 * 04-Jan-2000 BS	- Added comments about the lexicographical
 *			  grammar to give some insight in the complexity.
 * 28-Dec-1999 BS	- Eliminated backing-up of the flexer by running
 *			  `flex -b' on the source. This results in some
 *			  weirdo extra rules, but a much faster scanner.
 * 23-Dec-1999 BS	- Started this file
 *
 *-------------------------------------------------------------------------
 * The preprocessor's lexical grammar (approximately):
 *
 * pp		:= {ws} # {ws} if {ws} {expr} {ws} \n
 *		|  {ws} # {ws} ifdef {ws} {id} {ws} \n
 *		|  {ws} # {ws} ifndef {ws} {id} {ws} \n
 *		|  {ws} # {ws} elif {ws} {expr} {ws} \n
 *		|  {ws} # {ws} else {ws} \n
 *		|  {ws} # {ws} endif {ws} \n
 *		|  {ws} # {ws} include {ws} < {anytext} > \n
 *		|  {ws} # {ws} include {ws} " {anytext} " \n
 *		|  {ws} # {ws} define {ws} {anytext} \n
 *		|  {ws} # {ws} define( {arglist} ) {ws} {expansion} \n
 *		|  {ws} # {ws} pragma {ws} {anytext} \n
 *		|  {ws} # {ws} ident {ws} {anytext} \n
 *		|  {ws} # {ws} error {ws} {anytext} \n
 *		|  {ws} # {ws} warning {ws} {anytext} \n
 *		|  {ws} # {ws} line {ws} " {anytext} " {number} \n
48
 *		|  {ws} # {ws} {number} " {anytext} " {number} [ {number} [{number}] ] \n
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87
 *		|  {ws} # {ws} \n
 *
 * ws		:= [ \t\r\f\v]*
 *
 * expr		:= {expr} [+-*%^/|&] {expr}
 *		|  {expr} {logor|logand} {expr}
 *		|  [!~+-] {expr}
 *		|  {expr} ? {expr} : {expr}
 *
 * logor	:= ||
 *
 * logand	:= &&
 *
 * id		:= [a-zA-Z_][a-zA-Z0-9_]*
 *
 * anytext	:= [^\n]*	(see note)
 *
 * arglist	:=
 *		|  {id}
 *		|  {arglist} , {id}
 *		|  {arglist} , {id} ...
 *
 * expansion	:= {id}
 *		|  # {id}
 *		|  {anytext}
 *		|  {anytext} ## {anytext}
 *
 * number	:= [0-9]+
 *
 * Note: "anytext" is not always "[^\n]*". This is because the
 *	 trailing context must be considered as well.
 *
 * The only certain assumption for the preprocessor to make is that
 * directives start at the beginning of the line, followed by a '#'
 * and end with a newline.
 * Any directive may be suffixed with a line-continuation. Also
 * classical comment / *...* / (note: no comments within comments,
 * therefore spaces) is considered to be a line-continuation
 * (according to gcc and egcs AFAIK, ANSI is a bit vague).
Francois Gouget's avatar
Francois Gouget committed
88
 * Comments have not been added to the above grammar for simplicity
89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123
 * reasons. However, it is allowed to enter comment anywhere within
 * the directives as long as they do not interfere with the context.
 * All comments are considered to be deletable whitespace (both
 * classical form "/ *...* /" and C++ form "//...\n").
 *
 * All recursive scans, except for macro-expansion, are done by the
 * parser, whereas the simple state transitions of non-recursive
 * directives are done in the scanner. This results in the many
 * exclusive start-conditions of the scanner.
 *
 * Macro expansions are slightly more difficult because they have to
 * prescan the arguments. Parameter substitution is literal if the
 * substitution is # or ## (either side). This enables new identifiers
 * to be created (see 'info cpp' node Macro|Pitfalls|Prescan for more
 * information).
 *
 * FIXME: Variable macro parameters are recognized, but not yet
 * expanded. I have to reread the ANSI standard on the subject (yes,
 * ANSI defines it).
 *
 * The following special defines are supported:
 * __FILE__	-> "thissource.c"
 * __LINE__	-> 123
 * __DATE__	-> "May  1 2000"
 * __TIME__	-> "23:59:59"
 * These macros expand, as expected, into their ANSI defined values.
 *
 * The same include prevention is implemented as gcc and egcs does.
 * This results in faster processing because we do not read the text
 * at all. Some wine-sources attempt to include the same file 4 or 5
 * times. This strategy also saves a lot of blank output-lines, which in
 * its turn improves the real resource scanner/parser.
 *
 */

124 125 126 127 128
%top{
#include "config.h"
#include "wine/port.h"
}

129 130 131 132
/*
 * Special flex options and exclusive scanner start-conditions
 */
%option stack
133
%option 8bit never-interactive
134
%option noinput nounput
135
%option prefix="ppy_"
136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152

%x pp_pp
%x pp_eol
%x pp_inc
%x pp_dqs
%x pp_sqs
%x pp_iqs
%x pp_comment
%x pp_def
%x pp_define
%x pp_macro
%x pp_mbody
%x pp_macign
%x pp_macscan
%x pp_macexp
%x pp_if
%x pp_ifd
153
%x pp_endif
154 155 156
%x pp_line
%x pp_defined
%x pp_ignore
157
%x RCINCL
158 159 160 161 162 163 164 165 166 167 168

ws	[ \v\f\t\r]
cident	[a-zA-Z_][0-9a-zA-Z_]*
ul	[uUlL]|[uUlL][lL]|[lL][uU]|[lL][lL][uU]|[uU][lL][lL]|[lL][uU][lL]

%{
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <ctype.h>
#include <assert.h>
169 170 171 172 173 174 175 176 177 178
#include <errno.h>
#include <limits.h>

/*
 * Fallbacks for C libraries whose <limits.h> does not provide the
 * long long limits. The values assume a 64-bit long long.
 */
#ifndef LLONG_MAX
# define LLONG_MAX  ((long long)0x7fffffff << 32 | 0xffffffff)
# define LLONG_MIN  (-LLONG_MAX - 1)
#endif
#ifndef ULLONG_MAX
/* Build the value in an unsigned type: shifting 0xffffffff left by 32 in a
 * signed long long overflows, and the result would be a signed -1. */
# define ULLONG_MAX ((unsigned long long)0xffffffff << 32 | 0xffffffff)
#endif
179

180 181 182 183
#ifndef HAVE_UNISTD_H
#define YY_NO_UNISTD_H
#endif

Matteo Bruni's avatar
Matteo Bruni committed
184
#include "wine/wpp.h"
185
#include "wpp_private.h"
186
#include "ppy.tab.h"
187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202

/*
 * Make sure that we are running an appropriate version of flex.
 */
#if !defined(YY_FLEX_MAJOR_VERSION) || (1000 * YY_FLEX_MAJOR_VERSION + YY_FLEX_MINOR_VERSION < 2005)
#error Must use flex version 2.5.1 or higher (yy_scan_* routines are required).
#endif

#define YY_READ_BUF_SIZE	65536		/* So we read most of a file at once */

#define yy_current_state()	YY_START
#define yy_pp_state(x)		yy_pop_state(); yy_push_state(x)

/*
 * Always update the current character position within a line
 */
203
#define YY_USER_ACTION	pp_status.char_number+=ppy_leng;
204 205 206 207 208 209 210 211

/*
 * Buffer management for includes and expansions
 */
#define MAXBUFFERSTACK	128	/* Nesting more than 128 includes or macro expansion texts is insane */

typedef struct bufferstackentry {
	YY_BUFFER_STATE	bufferstate;	/* Buffer to switch back to */
Matteo Bruni's avatar
Matteo Bruni committed
212
	void		*filehandle;    /* Handle to be used with wpp_callbacks->read */
213 214 215
	pp_entry_t	*define;	/* Points to expanding define or NULL if handling includes */
	int		line_number;	/* Line that we were handling */
	int		char_number;	/* The current position on that line */
216
	char		*filename;	/* Filename that we were handling */
217 218 219 220
	int		if_depth;	/* How many #if:s deep to check matching #endif:s */
	int		ncontinuations;	/* Remember the continuation state */
	int		should_pop;	/* Set if we must pop the start-state on EOF */
	/* Include management */
221 222
        include_state_t incl;
	char 		*include_filename;
223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252
} bufferstackentry_t;

#define ALLOCBLOCKSIZE	(1 << 10)	/* Allocate these chunks at a time for string-buffers */

/*
 * Macro expansion nesting
 * We need the stack to handle expansions while scanning
 * a macro's arguments. The TOS must always be the macro
 * that receives the current expansion from the scanner.
 */
#define MAXMACEXPSTACK	128	/* Nesting more than 128 macro expansions is insane */

/*
 * One entry of the macro expansion stack: the macro being scanned plus
 * the bookkeeping for the arguments collected for it so far.
 */
typedef struct macexpstackentry {
	pp_entry_t	*ppp;		/* This macro we are scanning */
	char		**args;		/* With these arguments */
	char		**ppargs;	/* Resulting in these preprocessed arguments */
	int		*nnls;		/* Number of newlines per argument */
	int		nargs;		/* And this many arguments scanned */
	int		parentheses;	/* Nesting level of () */
	int		curargsize;	/* Current scanning argument's size */
	int		curargalloc;	/* Current scanning argument's block allocated */
	char		*curarg;	/* Current scanning argument's content */
} macexpstackentry_t;

#define MACROPARENTHESES()	(top_macro()->parentheses)

/*
 * Prototypes
 */
static void newline(int);
253 254
static int make_number(int radix, YYSTYPE *val, const char *str, int len);
static void put_buffer(const char *s, int len);
255 256 257 258 259
/* Buffer management */
static void push_buffer(pp_entry_t *ppp, char *filename, char *incname, int pop);
static bufferstackentry_t *pop_buffer(void);
/* String functions */
static void new_string(void);
260
static void add_string(const char *str, int len);
261 262 263 264 265 266 267 268
static char *get_string(void);
static void put_string(void);
static int string_start(void);
/* Macro functions */
static void push_macro(pp_entry_t *ppp);
static macexpstackentry_t *top_macro(void);
static macexpstackentry_t *pop_macro(void);
static void free_macro(macexpstackentry_t *mep);
269
static void add_text_to_macro(const char *text, int len);
270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295
static void macro_add_arg(int last);
static void macro_add_expansion(void);
/* Expansion */
static void expand_special(pp_entry_t *ppp);
static void expand_define(pp_entry_t *ppp);
static void expand_macro(macexpstackentry_t *mep);

/*
 * Local variables
 */
static int ncontinuations;

static int strbuf_idx = 0;
static int strbuf_alloc = 0;
static char *strbuffer = NULL;
static int str_startline;

static macexpstackentry_t *macexpstack[MAXMACEXPSTACK];
static int macexpstackidx = 0;

static bufferstackentry_t bufferstack[MAXBUFFERSTACK];
static int bufferstackidx = 0;

/*
 * Global variables
 */
296 297 298 299 300 301 302 303 304
include_state_t pp_incl_state =
{
    -1,    /* state */
    NULL,  /* ppp */
    0,     /* ifdepth */
    0      /* seen_junk */
};

includelogicentry_t *pp_includelogiclist = NULL;
305

Matteo Bruni's avatar
Matteo Bruni committed
306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331
#define YY_INPUT(buf,result,max_size)					     \
	{								     \
		result = wpp_callbacks->read(pp_status.file, buf, max_size); \
	}

#define BUFFERINITIALCAPACITY 256

/*
 * Format a message printf-style and pass the result to
 * wpp_callbacks->write.
 *
 * The text is formatted into a function-local static buffer that is
 * allocated on first use, grown on demand and kept for later calls.
 * If the buffer cannot be allocated or enlarged, the message is dropped
 * and nothing is written.
 */
void pp_writestring(const char *format, ...)
{
	va_list valist;
	int len;
	static char *buffer;
	static int buffercapacity;

	if(buffercapacity == 0)
	{
		buffer = pp_xmalloc(BUFFERINITIALCAPACITY);
		if(buffer == NULL)
			return;
		buffercapacity = BUFFERINITIALCAPACITY;
	}

	va_start(valist, format);
	len = vsnprintf(buffer, buffercapacity, format, valist);
	va_end(valist);

	/* vsnprintf returns the string length without the terminating NUL,
	 * so the output was truncated whenever len >= buffercapacity.
	 * glibc < 2.1 returns -1 on truncation instead. */
	while(len < 0 || len >= buffercapacity)
	{
		char *new_buffer;
		int new_capacity = buffercapacity;

		do
		{
			/* Give up rather than overflow the capacity */
			if(new_capacity > INT_MAX / 2)
				return;
			new_capacity *= 2;
		} while(len >= new_capacity);

		/* Only record the new capacity once the buffer really has it */
		new_buffer = pp_xrealloc(buffer, new_capacity);
		if(new_buffer == NULL)
			return;
		buffer = new_buffer;
		buffercapacity = new_capacity;

		va_start(valist, format);
		len = vsnprintf(buffer, buffercapacity, format, valist);
		va_end(valist);
	}

	wpp_callbacks->write(buffer, len);
}

358 359 360 361 362 363 364 365 366 367 368 369 370 371
%}

/*
 **************************************************************************
 * The scanner starts here
 **************************************************************************
 */

%%
	/*
	 * Catch line-continuations.
	 * Note: Gcc keeps the line-continuations in, for example, strings
	 * intact. However, I prefer to remove them all so that the next
	 * scanner will not need to reduce the continuation state.
372 373
	 *
	 * <*>\\\n		newline(0);
374 375 376 377 378
	 */

	/*
	 * Detect the leading # of a preprocessor directive.
	 */
379
<INITIAL,pp_ignore>^{ws}*#	pp_incl_state.seen_junk++; yy_push_state(pp_pp);
380 381 382 383 384 385 386 387 388 389 390 391

	/*
	 * Scan for the preprocessor directives
	 */
<pp_pp>{ws}*include{ws}*	if(yy_top_state() != pp_ignore) {yy_pp_state(pp_inc); return tINCLUDE;} else {yy_pp_state(pp_eol);}
<pp_pp>{ws}*define{ws}*		yy_pp_state(yy_current_state() != pp_ignore ? pp_def : pp_eol);
<pp_pp>{ws}*error{ws}*		yy_pp_state(pp_eol);	if(yy_top_state() != pp_ignore) return tERROR;
<pp_pp>{ws}*warning{ws}*	yy_pp_state(pp_eol);	if(yy_top_state() != pp_ignore) return tWARNING;
<pp_pp>{ws}*pragma{ws}*		yy_pp_state(pp_eol);	if(yy_top_state() != pp_ignore) return tPRAGMA;
<pp_pp>{ws}*ident{ws}*		yy_pp_state(pp_eol);	if(yy_top_state() != pp_ignore) return tPPIDENT;
<pp_pp>{ws}*undef{ws}*		if(yy_top_state() != pp_ignore) {yy_pp_state(pp_ifd); return tUNDEF;} else {yy_pp_state(pp_eol);}
<pp_pp>{ws}*ifdef{ws}*		yy_pp_state(pp_ifd);	return tIFDEF;
392
<pp_pp>{ws}*ifndef{ws}*		pp_incl_state.seen_junk--; yy_pp_state(pp_ifd);	return tIFNDEF;
393 394
<pp_pp>{ws}*if{ws}*		yy_pp_state(pp_if);	return tIF;
<pp_pp>{ws}*elif{ws}*		yy_pp_state(pp_if);	return tELIF;
395 396
<pp_pp>{ws}*else{ws}*		yy_pp_state(pp_endif);  return tELSE;
<pp_pp>{ws}*endif{ws}*		yy_pp_state(pp_endif);  return tENDIF;
397 398
<pp_pp>{ws}*line{ws}*		if(yy_top_state() != pp_ignore) {yy_pp_state(pp_line); return tLINE;} else {yy_pp_state(pp_eol);}
<pp_pp>{ws}+			if(yy_top_state() != pp_ignore) {yy_pp_state(pp_line); return tGCCLINE;} else {yy_pp_state(pp_eol);}
399
<pp_pp>{ws}*[a-z]+		ppy_error("Invalid preprocessor token '%s'", ppy_text);
400 401
<pp_pp>\r?\n			newline(1); yy_pop_state(); return tNL;	/* This could be the null-token */
<pp_pp>\\\r?\n			newline(0);
402 403
<pp_pp>\\\r?			ppy_error("Preprocessor junk '%s'", ppy_text);
<pp_pp>.			return *ppy_text;
404 405 406 407

	/*
	 * Handle #include and #line
	 */
408 409 410
<pp_line>[0-9]+			return make_number(10, &ppy_lval, ppy_text, ppy_leng);
<pp_inc>\<			new_string(); add_string(ppy_text, ppy_leng); yy_push_state(pp_iqs);
<pp_inc,pp_line>\"		new_string(); add_string(ppy_text, ppy_leng); yy_push_state(pp_dqs);
411 412
<pp_inc,pp_line>{ws}+		;
<pp_inc,pp_line>\n		newline(1); yy_pop_state(); return tNL;
413
<pp_inc,pp_line>\\\r?\n		newline(0);
414
<pp_inc,pp_line>(\\\r?)|(.)	ppy_error(yy_current_state() == pp_inc ? "Trailing junk in #include" : "Trailing junk in #line");
415 416 417 418 419 420

	/*
	 * Ignore all input when a false clause is parsed
	 */
<pp_ignore>[^#/\\\n]+		;
<pp_ignore>\n			newline(1);
421 422
<pp_ignore>\\\r?\n		newline(0);
<pp_ignore>(\\\r?)|(.)		;
423 424 425 426 427 428 429 430

	/*
	 * Handle #if and #elif.
	 * These require conditionals to be evaluated, but we do not
	 * want to jam the scanner normally when we see these tokens.
	 * Note: tIDENT is handled below.
	 */

431 432 433 434 435
<pp_if>0[0-7]*{ul}?		return make_number(8, &ppy_lval, ppy_text, ppy_leng);
<pp_if>0[0-7]*[8-9]+{ul}?	ppy_error("Invalid octal digit");
<pp_if>[1-9][0-9]*{ul}?		return make_number(10, &ppy_lval, ppy_text, ppy_leng);
<pp_if>0[xX][0-9a-fA-F]+{ul}?	return make_number(16, &ppy_lval, ppy_text, ppy_leng);
<pp_if>0[xX]			ppy_error("Invalid hex number");
436 437 438 439 440 441 442 443 444 445
<pp_if>defined			yy_push_state(pp_defined); return tDEFINED;
<pp_if>"<<"			return tLSHIFT;
<pp_if>">>"			return tRSHIFT;
<pp_if>"&&"			return tLOGAND;
<pp_if>"||"			return tLOGOR;
<pp_if>"=="			return tEQ;
<pp_if>"!="			return tNE;
<pp_if>"<="			return tLTE;
<pp_if>">="			return tGTE;
<pp_if>\n			newline(1); yy_pop_state(); return tNL;
446
<pp_if>\\\r?\n			newline(0);
447
<pp_if>\\\r?			ppy_error("Junk in conditional expression");
448
<pp_if>{ws}+			;
449 450 451
<pp_if>\'			new_string(); add_string(ppy_text, ppy_leng); yy_push_state(pp_sqs);
<pp_if>\"			ppy_error("String constants not allowed in conditionals");
<pp_if>.			return *ppy_text;
452 453 454 455 456

	/*
	 * Handle #ifdef, #ifndef and #undef
	 * to get only an untranslated/unexpanded identifier
	 */
457
<pp_ifd>{cident}	ppy_lval.cptr = pp_xstrdup(ppy_text); return tIDENT;
458 459
<pp_ifd>{ws}+		;
<pp_ifd>\n		newline(1); yy_pop_state(); return tNL;
460
<pp_ifd>\\\r?\n		newline(0);
461
<pp_ifd>(\\\r?)|(.)	ppy_error("Identifier expected");
462

463 464 465 466 467 468
	/*
	 * Handle #else and #endif.
	 */
<pp_endif>{ws}+		;
<pp_endif>\n		newline(1); yy_pop_state(); return tNL;
<pp_endif>\\\r?\n	newline(0);
469
<pp_endif>.		ppy_error("Garbage after #else or #endif.");
470

471 472 473 474 475
	/*
	 * Handle the special 'defined' keyword.
	 * This is necessary to get the identifier prior to any
	 * substitutions.
	 */
476
<pp_defined>{cident}		yy_pop_state(); ppy_lval.cptr = pp_xstrdup(ppy_text); return tIDENT;
477
<pp_defined>{ws}+		;
478
<pp_defined>(\()|(\))		return *ppy_text;
479
<pp_defined>\\\r?\n		newline(0);
480
<pp_defined>(\\.)|(\n)|(.)	ppy_error("Identifier expected");
481 482 483 484 485 486 487

	/*
	 * Handle #error, #warning, #pragma and #ident.
	 * Pass everything literally to the parser, which
	 * will act appropriately.
	 * Comments are stripped from the literal text.
	 */
488 489 490
<pp_eol>[^/\\\n]+		if(yy_top_state() != pp_ignore) { ppy_lval.cptr = pp_xstrdup(ppy_text); return tLITERAL; }
<pp_eol>\/[^/\\\n*]*		if(yy_top_state() != pp_ignore) { ppy_lval.cptr = pp_xstrdup(ppy_text); return tLITERAL; }
<pp_eol>(\\\r?)|(\/[^/*])	if(yy_top_state() != pp_ignore) { ppy_lval.cptr = pp_xstrdup(ppy_text); return tLITERAL; }
491
<pp_eol>\n			newline(1); yy_pop_state(); if(yy_current_state() != pp_ignore) { return tNL; }
492
<pp_eol>\\\r?\n			newline(0);
493 494 495 496

	/*
	 * Handle left side of #define
	 */
497
<pp_def>{cident}\(		ppy_lval.cptr = pp_xstrdup(ppy_text); if(ppy_lval.cptr) ppy_lval.cptr[ppy_leng-1] = '\0'; yy_pp_state(pp_macro);  return tMACRO;
498
<pp_def>{cident}		ppy_lval.cptr = pp_xstrdup(ppy_text); yy_pp_state(pp_define); return tDEFINE;
499
<pp_def>{ws}+			;
500 501
<pp_def>\\\r?\n			newline(0);
<pp_def>(\\\r?)|(\n)|(.)	ppy_error("Identifier expected");	/* ppy_error() as in the other states; perror() would append an unrelated errno text */
502 503 504 505

	/*
	 * Scan the substitution of a define
	 */
506 507 508
<pp_define>[^'"/\\\n]+		ppy_lval.cptr = pp_xstrdup(ppy_text); return tLITERAL;
<pp_define>(\\\r?)|(\/[^/*])	ppy_lval.cptr = pp_xstrdup(ppy_text); return tLITERAL;
<pp_define>\\\r?\n{ws}+		newline(0); ppy_lval.cptr = pp_xstrdup(" "); return tLITERAL;
509
<pp_define>\\\r?\n		newline(0);
510
<pp_define>\n			newline(1); yy_pop_state(); return tNL;
511 512
<pp_define>\'			new_string(); add_string(ppy_text, ppy_leng); yy_push_state(pp_sqs);
<pp_define>\"			new_string(); add_string(ppy_text, ppy_leng); yy_push_state(pp_dqs);
513 514 515 516 517 518

	/*
	 * Scan the definition macro arguments
	 */
<pp_macro>\){ws}*		yy_pp_state(pp_mbody); return tMACROEND;
<pp_macro>{ws}+			;
519
<pp_macro>{cident}		ppy_lval.cptr = pp_xstrdup(ppy_text); return tIDENT;
520 521
<pp_macro>,			return ',';
<pp_macro>"..."			return tELIPSIS;
522
<pp_macro>(\\\r?)|(\n)|(.)|(\.\.?)	ppy_error("Argument identifier expected");
523
<pp_macro>\\\r?\n		newline(0);
524 525 526 527

	/*
	 * Scan the substitution of a macro
	 */
528 529
<pp_mbody>[^a-zA-Z0-9'"#/\\\n]+	ppy_lval.cptr = pp_xstrdup(ppy_text); return tLITERAL;
<pp_mbody>{cident}		ppy_lval.cptr = pp_xstrdup(ppy_text); return tIDENT;
530 531
<pp_mbody>\#\#			return tCONCAT;
<pp_mbody>\#			return tSTRINGIZE;
532
<pp_mbody>[0-9][a-zA-Z0-9]*[^a-zA-Z0-9'"#/\\\n]*	ppy_lval.cptr = pp_xstrdup(ppy_text); return tLITERAL;
533 534
<pp_mbody>(\\\r?)|(\/[^/*'"#\\\n]*)	ppy_lval.cptr = pp_xstrdup(ppy_text); return tLITERAL;
<pp_mbody>\\\r?\n{ws}+		newline(0); ppy_lval.cptr = pp_xstrdup(" "); return tLITERAL;
535
<pp_mbody>\\\r?\n		newline(0);
536
<pp_mbody>\n			newline(1); yy_pop_state(); return tNL;
537 538
<pp_mbody>\'			new_string(); add_string(ppy_text, ppy_leng); yy_push_state(pp_sqs);
<pp_mbody>\"			new_string(); add_string(ppy_text, ppy_leng); yy_push_state(pp_dqs);
539 540 541 542 543 544 545 546 547 548 549 550 551 552 553

	/*
	 * Macro expansion text scanning.
	 * This state is active just after the identifier is scanned
	 * that triggers an expansion. We *must* delete the leading
	 * whitespace before we can start scanning for arguments.
	 *
	 * If we do not see a '(' as next trailing token, then we have
	 * a false alarm. We just continue with a nose-bleed...
	 */
<pp_macign>{ws}*/\(	yy_pp_state(pp_macscan);
<pp_macign>{ws}*\n	{
		if(yy_top_state() != pp_macscan)
			newline(0);
	}
554 555
<pp_macign>{ws}*\\\r?\n	newline(0);
<pp_macign>{ws}+|{ws}*\\\r?|.	{
556 557 558
		macexpstackentry_t *mac = pop_macro();
		yy_pop_state();
		put_buffer(mac->ppp->ident, strlen(mac->ppp->ident));
559
		put_buffer(ppy_text, ppy_leng);
560 561 562 563 564 565 566 567 568
		free_macro(mac);
	}

	/*
	 * Macro expansion argument text scanning.
	 * This state is active when a macro's arguments are being read for expansion.
	 */
<pp_macscan>\(	{
		if(++MACROPARENTHESES() > 1)
569
			add_text_to_macro(ppy_text, ppy_leng);
570 571 572 573 574 575 576 577
	}
<pp_macscan>\)	{
		if(--MACROPARENTHESES() == 0)
		{
			yy_pop_state();
			macro_add_arg(1);
		}
		else
578
			add_text_to_macro(ppy_text, ppy_leng);
579 580 581
	}
<pp_macscan>,		{
		if(MACROPARENTHESES() > 1)
582
			add_text_to_macro(ppy_text, ppy_leng);
583 584 585
		else
			macro_add_arg(0);
	}
586 587
<pp_macscan>\"		new_string(); add_string(ppy_text, ppy_leng); yy_push_state(pp_dqs);
<pp_macscan>\'		new_string(); add_string(ppy_text, ppy_leng); yy_push_state(pp_sqs);
588
<pp_macscan>"/*"	yy_push_state(pp_comment); add_text_to_macro(" ", 1);
589 590
<pp_macscan>\n		pp_status.line_number++; pp_status.char_number = 1; add_text_to_macro(ppy_text, ppy_leng);
<pp_macscan>([^/(),\\\n"']+)|(\/[^/*(),\\\n'"]*)|(\\\r?)|(.)	add_text_to_macro(ppy_text, ppy_leng);
591
<pp_macscan>\\\r?\n	newline(0);
592 593 594 595

	/*
	 * Comment handling (almost all start-conditions)
	 */
596
<INITIAL,pp_pp,pp_ignore,pp_eol,pp_inc,pp_if,pp_ifd,pp_endif,pp_defined,pp_def,pp_define,pp_macro,pp_mbody,RCINCL>"/*" yy_push_state(pp_comment);
597 598 599 600 601 602 603
<pp_comment>[^*\n]*|"*"+[^*/\n]*	;
<pp_comment>\n				newline(0);
<pp_comment>"*"+"/"			yy_pop_state();

	/*
	 * Remove C++ style comment (almost all start-conditions)
	 */
604
<INITIAL,pp_pp,pp_ignore,pp_eol,pp_inc,pp_if,pp_ifd,pp_endif,pp_defined,pp_def,pp_define,pp_macro,pp_mbody,pp_macscan,RCINCL>"//"[^\n]*	{
605 606
		if(ppy_text[ppy_leng-1] == '\\')
			ppy_warning("C++ style comment ends with an escaped newline (escape ignored)");
607 608 609 610 611
	}

	/*
	 * Single, double and <> quoted constants
	 */
612 613 614
<INITIAL,pp_macexp>\"		pp_incl_state.seen_junk++; new_string(); add_string(ppy_text, ppy_leng); yy_push_state(pp_dqs);
<INITIAL,pp_macexp>\'		pp_incl_state.seen_junk++; new_string(); add_string(ppy_text, ppy_leng); yy_push_state(pp_sqs);
<pp_dqs>[^"\\\n]+		add_string(ppy_text, ppy_leng);
615
<pp_dqs>\"			{
616
		add_string(ppy_text, ppy_leng);
617 618 619 620 621 622 623
		yy_pop_state();
		switch(yy_current_state())
		{
		case pp_pp:
		case pp_define:
		case pp_mbody:
		case pp_inc:
624 625
		case RCINCL:
			if (yy_current_state()==RCINCL) yy_pop_state();
626
			ppy_lval.cptr = get_string();
627
			return tDQSTRING;
628
		case pp_line:
629
			ppy_lval.cptr = get_string();
630
			return tDQSTRING;
631 632 633 634
		default:
			put_string();
		}
	}
635
<pp_sqs>[^'\\\n]+		add_string(ppy_text, ppy_leng);
636
<pp_sqs>\'			{
637
		add_string(ppy_text, ppy_leng);
638 639 640 641 642 643
		yy_pop_state();
		switch(yy_current_state())
		{
		case pp_if:
		case pp_define:
		case pp_mbody:
644
			ppy_lval.cptr = get_string();
645 646 647 648 649
			return tSQSTRING;
		default:
			put_string();
		}
	}
650
<pp_iqs>[^\>\\\n]+		add_string(ppy_text, ppy_leng);
651
<pp_iqs>\>			{
652
		add_string(ppy_text, ppy_leng);
653
		yy_pop_state();
654
		ppy_lval.cptr = get_string();
655 656
		return tIQSTRING;
	}
657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676
<pp_dqs>\\\r?\n		{
		/*
		 * This is tricky; we need to remove the line-continuation
		 * from preprocessor strings, but OTOH retain them in all
		 * other strings. This is because the resource grammar is
		 * even more braindead than initially analysed and line-
		 * continuations in strings introduce, sigh, newlines in
		 * the output. There goes the concept of non-breaking, non-
		 * spacing whitespace.
		 */
		switch(yy_top_state())
		{
		case pp_pp:
		case pp_define:
		case pp_mbody:
		case pp_inc:
		case pp_line:
			newline(0);
			break;
		default:
677
			add_string(ppy_text, ppy_leng);
678 679 680
			newline(-1);
		}
	}
681
<pp_iqs,pp_dqs,pp_sqs>\\.	add_string(ppy_text, ppy_leng);
682 683
<pp_iqs,pp_dqs,pp_sqs>\n	{
		newline(1);
684
		add_string(ppy_text, ppy_leng);
685
		ppy_warning("Newline in string constant encountered (started line %d)", string_start());
686 687 688 689 690 691 692
	}

	/*
	 * Identifier scanning
	 */
<INITIAL,pp_if,pp_inc,pp_macexp>{cident}	{
		pp_entry_t *ppp;
693
		pp_incl_state.seen_junk++;
694
		if(!(ppp = pplookup(ppy_text)))
695 696
		{
			if(yy_current_state() == pp_inc)
697
				ppy_error("Expected include filename");
698

699
			else if(yy_current_state() == pp_if)
700
			{
701
				ppy_lval.cptr = pp_xstrdup(ppy_text);
702 703
				return tIDENT;
			}
704
			else {
705
				if((yy_current_state()==INITIAL) && (strcasecmp(ppy_text,"RCINCLUDE")==0)){
706 707 708
					yy_push_state(RCINCL);
					return tRCINCLUDE;
				}
709
				else put_buffer(ppy_text, ppy_leng);
710
			}
711 712 713 714 715 716 717 718 719 720 721 722 723 724 725 726
		}
		else if(!ppp->expanding)
		{
			switch(ppp->type)
			{
			case def_special:
				expand_special(ppp);
				break;
			case def_define:
				expand_define(ppp);
				break;
			case def_macro:
				yy_push_state(pp_macign);
				push_macro(ppp);
				break;
			default:
727
				pp_internal_error(__FILE__, __LINE__, "Invalid define type %d\n", ppp->type);
728 729
			}
		}
730
		else put_buffer(ppy_text, ppy_leng);
731 732 733 734 735 736
	}

	/*
	 * Everything else that needs to be passed and
	 * newline and continuation handling
	 */
737 738
<INITIAL,pp_macexp>[^a-zA-Z_#'"/\\\n \r\t\f\v]+|(\/|\\)[^a-zA-Z_/*'"\\\n \r\t\v\f]*	pp_incl_state.seen_junk++; put_buffer(ppy_text, ppy_leng);
<INITIAL,pp_macexp>{ws}+	put_buffer(ppy_text, ppy_leng);
739
<INITIAL>\n			newline(1);
740
<INITIAL>\\\r?\n		newline(0);
741
<INITIAL>\\\r?			pp_incl_state.seen_junk++; put_buffer(ppy_text, ppy_leng);
742 743 744 745 746

	/*
	 * Special catcher for macro argument expansion to prevent
	 * newlines to propagate to the output or admin.
	 */
747
<pp_macexp>(\n)|(.)|(\\\r?(\n|.))	put_buffer(ppy_text, ppy_leng);
748

749
<RCINCL>[A-Za-z0-9_\.\\/]+ {
750
		ppy_lval.cptr=pp_xstrdup(ppy_text);
751 752 753 754 755 756 757
        	yy_pop_state();
		return tRCINCLUDEPATH;
	}

<RCINCL>{ws}+ ;

<RCINCL>\"		{
758
		new_string(); add_string(ppy_text,ppy_leng);yy_push_state(pp_dqs);
759 760
	}

761 762 763 764
	/*
	 * This is a 'catch-all' rule to discover errors in the scanner
	 * in an orderly manner.
	 */
765
<*>.		pp_incl_state.seen_junk++; ppy_warning("Unmatched text '%c' (0x%02x); please report\n", isprint(*ppy_text & 0xff) ? *ppy_text : ' ', *ppy_text & 0xff);	/* masked so bytes >= 0x80 are not sign-extended */
766 767 768 769 770

<<EOF>>	{
		/*
		 * End of the current input buffer: pop the saved context and
		 * either terminate the scanner (nothing was saved) or carry on,
		 * popping and expanding a macro first when the entry asks for it.
		 */
		YY_BUFFER_STATE b = YY_CURRENT_BUFFER;
		bufferstackentry_t *bep = pop_buffer();

		/* The #if depth must be back at the level saved for this buffer,
		 * or at zero when no context was saved */
		if((!bep && pp_get_if_depth()) || (bep && pp_get_if_depth() != bep->if_depth))
			ppy_warning("Unmatched #if/#endif at end of file");

		if(!bep)
		{
			/* Input ended while a non-INITIAL start-condition was active */
			if(YY_START != INITIAL)
			{
				ppy_error("Unexpected end of file during preprocessing");
				BEGIN(INITIAL);
			}
			yyterminate();
		}
		else if(bep->should_pop == 2)
		{
			macexpstackentry_t *mac;
			mac = pop_macro();
			expand_macro(mac);
		}
		ppy__delete_buffer(b);
	}

%%
/*
 **************************************************************************
 * Support functions
 **************************************************************************
 */

799 800
#ifndef ppy_wrap
/*
 * End-of-input hook of the generated scanner. Always returns 1, which
 * (per the flex yywrap() contract) means that no further input follows.
 */
int ppy_wrap(void)
{
	return 1;
}
#endif


/*
 *-------------------------------------------------------------------------
 * Output newlines or set them as continuations
810 811 812 813
 *
 * Input: -1 - Don't count this one, but update local position (see pp_dqs)
 *	   0 - Line-continuation seen and cache output
 *	   1 - Newline seen and flush output
814 815 816 817
 *-------------------------------------------------------------------------
 */
static void newline(int dowrite)
{
	/* The position bookkeeping is updated for every kind of newline */
	pp_status.line_number++;
	pp_status.char_number = 1;

	/* -1: the caller only wanted the position update */
	if(dowrite == -1)
		return;

	/* Count this newline; a real newline (dowrite != 0) writes it out
	 * together with all continuations counted before it. */
	ncontinuations++;
	if(dowrite)
	{
		for(;ncontinuations; ncontinuations--)
			put_buffer("\n", 1);
	}
}


/*
 *-------------------------------------------------------------------------
 * Make a number out of an any-base and suffixed string
 *
 * Possible number extensions:
 * - ""		int
 * - "L"	long int
 * - "LL"	long long int
 * - "U"	unsigned int
 * - "UL"	unsigned long int
 * - "ULL"	unsigned long long int
 * - "LU"	unsigned long int
 * - "LLU"	unsigned long long int
 * - "LUL"	invalid
 *
 * FIXME:
 * The sizes of resulting 'int' and 'long' are compiler specific.
 * I depend on sizeof(int) > 2 here (although a relatively safe
 * assumption).
 * Long long constants are only handled when HAVE_LONG_LONG is defined;
 * without it they are reported as an internal error.
 *
 *-------------------------------------------------------------------------
 */
857
/*
 * Convert the scanned constant str (len characters, including an optional
 * U/L/LL suffix in any case) to a number in the given radix.
 *
 * The value is stored in the member of *val that matches the suffix and
 * the corresponding token (tSINT, tUINT, tSLONG, tULONG, tSLONGLONG or
 * tULONGLONG) is returned. Out-of-range constants are reported through
 * ppy_error(). The invalid suffix "LUL" is reported and yields 0.
 */
static int make_number(int radix, YYSTYPE *val, const char *str, int len)
{
	int is_l  = 0;
	int is_ll = 0;
	int is_u  = 0;
	char ext[4];
	long l;

	/* Take the last three characters, upper-cased and right-aligned, so
	 * the suffix can be matched with plain string compares. The casts are
	 * needed because <ctype.h> functions require unsigned char values. */
	ext[3] = '\0';
	ext[2] = toupper((unsigned char)str[len-1]);
	ext[1] = len > 1 ? toupper((unsigned char)str[len-2]) : ' ';
	ext[0] = len > 2 ? toupper((unsigned char)str[len-3]) : ' ';

	/* Longest suffixes first, so that e.g. "ULL" is not taken for "LL" */
	if(!strcmp(ext, "LUL"))
	{
		ppy_error("Invalid constant suffix");
		return 0;
	}
	else if(!strcmp(ext, "LLU") || !strcmp(ext, "ULL"))
	{
		is_ll++;
		is_u++;
	}
	else if(!strcmp(ext+1, "LU") || !strcmp(ext+1, "UL"))
	{
		is_l++;
		is_u++;
	}
	else if(!strcmp(ext+1, "LL"))
	{
		is_ll++;
	}
	else if(!strcmp(ext+2, "L"))
	{
		is_l++;
	}
	else if(!strcmp(ext+2, "U"))
	{
		is_u++;
	}

	if(is_ll)
	{
/* Assume as in the declaration of wrc_ull_t and wrc_sll_t */
#ifdef HAVE_LONG_LONG
		if (is_u)
		{
			errno = 0;
			val->ull = strtoull(str, NULL, radix);
			if (val->ull == ULLONG_MAX && errno == ERANGE)
				ppy_error("integer constant %s is too large\n", str);
			return tULONGLONG;
		}
		else
		{
			errno = 0;
			val->sll = strtoll(str, NULL, radix);
			if ((val->sll == LLONG_MIN || val->sll == LLONG_MAX) && errno == ERANGE)
				ppy_error("integer constant %s is too large\n", str);
			return tSLONGLONG;
		}
#else
		pp_internal_error(__FILE__, __LINE__, "long long constants not supported on this platform");
#endif
	}
	else if(is_u && is_l)
	{
		errno = 0;
		val->ulong = strtoul(str, NULL, radix);
		if (val->ulong == ULONG_MAX && errno == ERANGE)
			ppy_error("integer constant %s is too large\n", str);
		return tULONG;
	}
	else if(!is_u && is_l)
	{
		errno = 0;
		val->slong = strtol(str, NULL, radix);
		if ((val->slong == LONG_MIN || val->slong == LONG_MAX) && errno == ERANGE)
			ppy_error("integer constant %s is too large\n", str);
		return tSLONG;
	}
	else if(is_u && !is_l)
	{
		/* Parse as unsigned long, then check that it fits an unsigned int */
		unsigned long ul;
		errno = 0;
		ul = strtoul(str, NULL, radix);
		if ((ul == ULONG_MAX && errno == ERANGE) || (ul > UINT_MAX))
			ppy_error("integer constant %s is too large\n", str);
		val->uint = (unsigned int)ul;
		return tUINT;
	}

	/* Else it must be an int... */
	errno = 0;
	l = strtol(str, NULL, radix);
	if (((l == LONG_MIN || l == LONG_MAX) && errno == ERANGE) ||
		(l > INT_MAX) || (l < INT_MIN))
		ppy_error("integer constant %s is too large\n", str);
	val->sint = (int)l;
	return tSINT;
}


/*
 *-------------------------------------------------------------------------
 * Macro and define expansion support
 *
 * FIXME: Variable macro arguments.
 *-------------------------------------------------------------------------
 */
/*
 * Expand one of the built-in macros (__LINE__ or __FILE__).
 *
 * The replacement text is formatted into a function-static buffer that is
 * resized on every call; a non-empty result is pushed as a new scan buffer.
 * If the buffer cannot be resized the function returns without expanding.
 */
static void expand_special(pp_entry_t *ppp)
{
	static char *buf = NULL;
	char *grown;

	assert(ppp->type == def_special);

	if(strcmp(ppp->ident, "__LINE__") == 0)
	{
		/* 32 bytes is ample for a decimal int */
		grown = pp_xrealloc(buf, 32);
		if(grown == NULL)
			return;
		buf = grown;
		sprintf(buf, "%d", pp_status.line_number);
	}
	else if(strcmp(ppp->ident, "__FILE__") == 0)
	{
		/* name + two quotes + terminating NUL */
		grown = pp_xrealloc(buf, strlen(pp_status.input) + 3);
		if(grown == NULL)
			return;
		buf = grown;
		sprintf(buf, "\"%s\"", pp_status.input);
	}
	else
	{
		pp_internal_error(__FILE__, __LINE__, "Special macro '%s' not found...\n", ppp->ident);
	}

	if(pp_flex_debug)
	{
		fprintf(stderr, "expand_special(%d): %s:%d: '%s' -> '%s'\n",
			macexpstackidx,
			pp_status.input,
			pp_status.line_number,
			ppp->ident,
			buf ? buf : "");
	}

	/* Nothing to scan when there is no (or only empty) replacement text */
	if(buf == NULL || buf[0] == '\0')
		return;

	push_buffer(ppp, NULL, NULL, 0);
	yy_scan_string(buf);
}

/*
 * Expand an object-like macro (a plain #define without arguments).
 *
 * A non-empty substitution text is pushed as a new scan buffer; an empty or
 * missing text expands to nothing.
 */
static void expand_define(pp_entry_t *ppp)
{
	assert(ppp->type == def_define);

	if(pp_flex_debug)
		fprintf(stderr, "expand_define(%d): %s:%d: '%s' -> '%s'\n",
			macexpstackidx,
			pp_status.input,
			pp_status.line_number,
			ppp->ident,
			/* subst.text may be NULL (see the test below); never
			 * hand a null pointer to %s */
			ppp->subst.text ? ppp->subst.text : "");
	if(ppp->subst.text && ppp->subst.text[0])
	{
		push_buffer(ppp, NULL, NULL, 0);
		yy_scan_string(ppp->subst.text);
	}
}

static int curdef_idx = 0;
static int curdef_alloc = 0;
static char *curdef_text = NULL;

1030
static void add_text(const char *str, int len)
1031
{
1032 1033 1034
	int new_alloc;
	char *new_text;

1035 1036 1037 1038
	if(len == 0)
		return;
	if(curdef_idx >= curdef_alloc || curdef_alloc - curdef_idx < len)
	{
1039 1040 1041 1042 1043 1044
		new_alloc = curdef_alloc + ((len + ALLOCBLOCKSIZE-1) & ~(ALLOCBLOCKSIZE-1));
		new_text = pp_xrealloc(curdef_text, new_alloc * sizeof(curdef_text[0]));
		if(!new_text)
			return;
		curdef_text = new_text;
		curdef_alloc = new_alloc;
1045
		if(curdef_alloc > 65536)
1046
			ppy_warning("Reallocating macro-expansion buffer larger than 64kB");
1047 1048 1049 1050 1051 1052 1053 1054 1055 1056 1057 1058 1059 1060 1061 1062 1063 1064
	}
	memcpy(&curdef_text[curdef_idx], str, len);
	curdef_idx += len;
}

/*
 * Append the expansion of one macro-body element to the expansion buffer.
 *
 * mtp - body element to expand; NULL is accepted and returned as is
 * mep - macro invocation providing the raw (args) and pre-expanded
 *       (ppargs) argument texts
 * nnl - running count of newlines that still have to be emitted; reduced
 *       by the newlines carried by an argument when it is substituted
 *
 * Returns the last element that was consumed. For exp_concat this is the
 * element following the operator (or NULL if there is none), so the caller
 * must continue from the returned element rather than from mtp.
 */
static mtext_t *add_expand_text(mtext_t *mtp, macexpstackentry_t *mep, int *nnl)
{
	char *cptr;
	char *exp;
	int tag;
	int n;

	if(mtp == NULL)
		return NULL;

	switch(mtp->type)
	{
	case exp_text:
		if(pp_flex_debug)
			fprintf(stderr, "add_expand_text: exp_text: '%s'\n", mtp->subst.text);
		add_text(mtp->subst.text, strlen(mtp->subst.text));
		break;

	case exp_stringize:
		if(pp_flex_debug)
			fprintf(stderr, "add_expand_text: exp_stringize(%d): '%s'\n",
				mtp->subst.argidx,
				mep->args[mtp->subst.argidx]);
		/* Quote the raw argument, escaping embedded quotes and backslashes */
		cptr = mep->args[mtp->subst.argidx];
		add_text("\"", 1);
		while(*cptr)
		{
			if(*cptr == '"' || *cptr == '\\')
				add_text("\\", 1);
			add_text(cptr, 1);
			cptr++;
		}
		add_text("\"", 1);
		break;

	case exp_concat:
		if(pp_flex_debug)
			fprintf(stderr, "add_expand_text: exp_concat\n");
		/* Remove trailing whitespace from current expansion text */
		while(curdef_idx)
		{
			if(isspace(curdef_text[curdef_idx-1] & 0xff))
				curdef_idx--;
			else
				break;
		}
		/* tag current position and recursively expand the next part */
		tag = curdef_idx;
		mtp = add_expand_text(mtp->next, mep, nnl);

		/* Now get rid of the leading space of the expansion */
		cptr = &curdef_text[tag];
		n = curdef_idx - tag;
		while(n)
		{
			if(isspace(*cptr & 0xff))
			{
				cptr++;
				n--;
			}
			else
				break;
		}
		if(cptr != &curdef_text[tag])
		{
			/* Close the gap left by the skipped whitespace */
			memmove(&curdef_text[tag], cptr, n);
			curdef_idx = tag + n;
		}
		break;

	case exp_subst:
		/* Operands of a concatenation use the raw argument text,
		 * everything else uses the pre-expanded text */
		if((mtp->next && mtp->next->type == exp_concat) || (mtp->prev && mtp->prev->type == exp_concat))
			exp = mep->args[mtp->subst.argidx];
		else
			exp = mep->ppargs[mtp->subst.argidx];
		if(exp)
		{
			add_text(exp, strlen(exp));
			*nnl -= mep->nnls[mtp->subst.argidx];
			/* The newlines of this argument have now been emitted
			 * once; blank them so that a later substitution of the
			 * same argument does not emit them again */
			cptr = strchr(exp, '\n');
			while(cptr)
			{
				*cptr = ' ';
				cptr = strchr(cptr+1, '\n');
			}
			mep->nnls[mtp->subst.argidx] = 0;
		}
		if(pp_flex_debug)
			/* exp may be NULL here; never hand a null pointer to %s */
			fprintf(stderr, "add_expand_text: exp_subst(%d): '%s'\n", mtp->subst.argidx, exp ? exp : "");
		break;

	default:
		pp_internal_error(__FILE__, __LINE__, "Invalid expansion type (%d) in macro expansion\n", mtp->type);
	}
	return mtp;
}

/*
 * Expand a function-like macro invocation.
 *
 * mep describes the invocation: the macro definition (mep->ppp) and the
 * collected arguments. The macro body is expanded into the shared
 * expansion buffer, followed by the newlines consumed by the arguments
 * that were not emitted during substitution and by a single blank. The
 * result, minus leading whitespace, is pushed as a new scan buffer.
 *
 * An argument-count mismatch is reported through ppy_error() and nothing
 * is expanded.
 */
static void expand_macro(macexpstackentry_t *mep)
{
	mtext_t *mtp;
	int n, k;
	int tail;
	char *cptr;
	int nnl = 0;
	pp_entry_t *ppp = mep->ppp;
	int nargs = mep->nargs;

	assert(ppp->type == def_macro);
	assert(ppp->expanding == 0);

	/* A negative ppp->nargs is treated as a minimum count of -nargs */
	if((ppp->nargs >= 0 && nargs != ppp->nargs) || (ppp->nargs < 0 && nargs < -ppp->nargs))
	{
		ppy_error("Too %s macro arguments (%d)", nargs < abs(ppp->nargs) ? "few" : "many", nargs);
		return;
	}

	for(n = 0; n < nargs; n++)
		nnl += mep->nnls[n];

	if(pp_flex_debug)
		fprintf(stderr, "expand_macro(%d): %s:%d: '%s'(%d,%d) -> ...\n",
			macexpstackidx,
			pp_status.input,
			pp_status.line_number,
			ppp->ident,
			mep->nargs,
			nnl);

	curdef_idx = 0;

	for(mtp = ppp->subst.mtext; mtp; mtp = mtp->next)
	{
		/* add_expand_text() may consume more than one element */
		if(!(mtp = add_expand_text(mtp, mep, &nnl)))
			break;
	}

	/* Emit the argument newlines that were not output by a substitution */
	for(n = 0; n < nnl; n++)
		add_text("\n", 1);

	/*
	 * Append *one* whitespace, so that there is a token-separation after
	 * the expansion, plus the terminating NUL.
	 *
	 * This function used to follow the append with a "strip trailing
	 * whitespace" loop and then store ' ' and '\0' again. That loop
	 * started on the NUL appended here and therefore never removed
	 * anything, while the two stores landed one and two bytes past the
	 * appended text -- outside the allocation whenever the buffer was
	 * exactly full. The text handed to the scanner is unchanged by
	 * dropping both; in particular the newlines added above are kept.
	 */
	tail = curdef_idx;
	add_text(" \0", 2);
	if(curdef_idx != tail + 2)
		return;		/* add_text() could not grow the buffer */
	k = curdef_idx;

	/* Strip leading whitespace from expansion (stops at the NUL at the latest) */
	for(n = 0, cptr = curdef_text; n < k; n++, cptr++)
	{
		if(!isspace(*cptr & 0xff))
			break;
	}

	if(k - n > 0)
	{
		if(pp_flex_debug)
			fprintf(stderr, "expand_text: '%s'\n", curdef_text + n);
		push_buffer(ppp, NULL, NULL, 0);
		/*yy_scan_bytes(curdef_text + n, k - n);*/
		yy_scan_string(curdef_text + n);
	}
}

/*
 *-------------------------------------------------------------------------
 * String collection routines
 *-------------------------------------------------------------------------
 */
static void new_string(void)
{
#ifdef DEBUG
	if(strbuf_idx)
1234
		ppy_warning("new_string: strbuf_idx != 0");
1235 1236
#endif
	strbuf_idx = 0;
1237
	str_startline = pp_status.line_number;
1238 1239
}

1240
static void add_string(const char *str, int len)
1241
{
1242 1243 1244
	int new_alloc;
	char *new_buffer;

1245 1246 1247 1248
	if(len == 0)
		return;
	if(strbuf_idx >= strbuf_alloc || strbuf_alloc - strbuf_idx < len)
	{
1249 1250 1251 1252 1253 1254
		new_alloc = strbuf_alloc + ((len + ALLOCBLOCKSIZE-1) & ~(ALLOCBLOCKSIZE-1));
		new_buffer = pp_xrealloc(strbuffer, new_alloc * sizeof(strbuffer[0]));
		if(!new_buffer)
			return;
		strbuffer = new_buffer;
		strbuf_alloc = new_alloc;
1255
		if(strbuf_alloc > 65536)
1256
			ppy_warning("Reallocating string buffer larger than 64kB");
1257 1258 1259 1260 1261 1262 1263
	}
	memcpy(&strbuffer[strbuf_idx], str, len);
	strbuf_idx += len;
}

static char *get_string(void)
{
1264
	char *str = pp_xmalloc(strbuf_idx + 1);
1265 1266
	if(!str)
		return NULL;
1267 1268 1269 1270 1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294 1295
	memcpy(str, strbuffer, strbuf_idx);
	str[strbuf_idx] = '\0';
#ifdef DEBUG
	strbuf_idx = 0;
#endif
	return str;
}

/*
 * Send the collected string to put_buffer().
 */
static void put_string(void)
{
	put_buffer(strbuffer, strbuf_idx);
#ifdef DEBUG
	/* Mark the buffer as consumed so new_string() does not warn */
	strbuf_idx = 0;
#endif
}

/*
 * Return the line number recorded by the most recent new_string() call.
 */
static int string_start(void)
{
	return str_startline;
}


/*
 *-------------------------------------------------------------------------
 * Buffer management
 *-------------------------------------------------------------------------
 */
/*
 * Save the current scanner context on the buffer stack.
 *
 * ppp      - macro/define being expanded, or NULL; when set it is marked
 *            as expanding
 * filename - path of a newly included file, or NULL; when set (and ppp is
 *            NULL) the position tracking is reset to the start of that file
 * incname  - include name as written in the source, stored with the entry
 * pop      - stored as the entry's should_pop flag
 *
 * At least one of ppp, filename and pop has to be set; anything else is
 * an internal error.
 */
static void push_buffer(pp_entry_t *ppp, char *filename, char *incname, int pop)
{
	bufferstackentry_t *slot;

	if(ppy_debug)
		printf("push_buffer(%d): %p %p %p %d\n", bufferstackidx, ppp, filename, incname, pop);
	if(bufferstackidx >= MAXBUFFERSTACK)
		pp_internal_error(__FILE__, __LINE__, "Buffer stack overflow");

	slot = &bufferstack[bufferstackidx];
	memset(slot, 0, sizeof(*slot));

	/* Snapshot of everything pop_buffer() has to restore */
	slot->bufferstate	= YY_CURRENT_BUFFER;
	slot->filehandle	= pp_status.file;
	slot->define		= ppp;
	slot->line_number	= pp_status.line_number;
	slot->char_number	= pp_status.char_number;
	slot->if_depth		= pp_get_if_depth();
	slot->should_pop	= pop;
	slot->filename		= pp_status.input;
	slot->ncontinuations	= ncontinuations;
	slot->incl		= pp_incl_state;
	slot->include_filename	= incname;

	if(ppp)
	{
		ppp->expanding = 1;
	}
	else if(filename)
	{
		/* These will track the ppy_error to the correct file and line */
		pp_status.line_number = 1;
		pp_status.char_number = 1;
		pp_status.input  = filename;
		ncontinuations = 0;
	}
	else if(!pop)
	{
		pp_internal_error(__FILE__, __LINE__, "Pushing buffer without knowing where to go to");
	}

	bufferstackidx++;
}

static bufferstackentry_t *pop_buffer(void)
{
	if(bufferstackidx < 0)
1332
		pp_internal_error(__FILE__, __LINE__, "Bufferstack underflow?");
1333 1334 1335 1336 1337 1338 1339 1340 1341 1342

	if(bufferstackidx == 0)
		return NULL;

	bufferstackidx--;

	if(bufferstack[bufferstackidx].define)
		bufferstack[bufferstackidx].define->expanding = 0;
	else
	{
1343 1344
		includelogicentry_t *iep = NULL;

1345 1346
		if(!bufferstack[bufferstackidx].should_pop)
		{
Matteo Bruni's avatar
Matteo Bruni committed
1347 1348
			wpp_callbacks->close(pp_status.file);
			pp_writestring("# %d \"%s\" 2\n", bufferstack[bufferstackidx].line_number, bufferstack[bufferstackidx].filename);
1349 1350

			/* We have EOF, check the include logic */
1351
			if(pp_incl_state.state == 2 && !pp_incl_state.seen_junk && pp_incl_state.ppp)
1352
			{
1353
				pp_entry_t *ppp = pplookup(pp_incl_state.ppp);
1354 1355
				if(ppp)
				{
1356
					iep = pp_xmalloc(sizeof(includelogicentry_t));
1357 1358 1359 1360 1361 1362 1363 1364 1365 1366 1367 1368 1369 1370
					if (iep)
					{
						iep->ppp = ppp;
						ppp->iep = iep;
						iep->filename = bufferstack[bufferstackidx].include_filename;
						iep->prev = NULL;
						iep->next = pp_includelogiclist;
						if(iep->next)
							iep->next->prev = iep;
						pp_includelogiclist = iep;
						if(pp_status.debug)
							fprintf(stderr, "pop_buffer: %s:%d: includelogic added, include_ppp='%s', file='%s'\n",
                                                                bufferstack[bufferstackidx].filename, bufferstack[bufferstackidx].line_number, pp_incl_state.ppp, iep->filename);
					}
1371 1372
				}
			}
1373
			free(pp_incl_state.ppp);
1374
			pp_incl_state	= bufferstack[bufferstackidx].incl;
1375

1376
		}
1377 1378 1379 1380 1381
		if (bufferstack[bufferstackidx].include_filename)
		{
			free(pp_status.input);
			pp_status.input = bufferstack[bufferstackidx].filename;
		}
1382 1383 1384
		pp_status.line_number = bufferstack[bufferstackidx].line_number;
		pp_status.char_number = bufferstack[bufferstackidx].char_number;
		ncontinuations = bufferstack[bufferstackidx].ncontinuations;
1385 1386
		if (!iep)
			free(bufferstack[bufferstackidx].include_filename);
1387 1388
	}

1389
	if(ppy_debug)
1390 1391 1392 1393 1394 1395 1396 1397 1398 1399
		printf("pop_buffer(%d): %p %p (%d, %d, %d) %p %d\n",
			bufferstackidx,
			bufferstack[bufferstackidx].bufferstate,
			bufferstack[bufferstackidx].define,
			bufferstack[bufferstackidx].line_number,
			bufferstack[bufferstackidx].char_number,
			bufferstack[bufferstackidx].if_depth,
			bufferstack[bufferstackidx].filename,
			bufferstack[bufferstackidx].should_pop);

Matteo Bruni's avatar
Matteo Bruni committed
1400 1401
	pp_status.file = bufferstack[bufferstackidx].filehandle;
	ppy__switch_to_buffer(bufferstack[bufferstackidx].bufferstate);
1402 1403 1404 1405 1406 1407

	if(bufferstack[bufferstackidx].should_pop)
	{
		if(yy_current_state() == pp_macexp)
			macro_add_expansion();
		else
1408
			pp_internal_error(__FILE__, __LINE__, "Pop buffer and state without macro expansion state");
1409 1410 1411 1412 1413 1414 1415 1416 1417 1418 1419 1420 1421 1422 1423
		yy_pop_state();
	}

	return &bufferstack[bufferstackidx];
}


/*
 *-------------------------------------------------------------------------
 * Macro nesting support
 *-------------------------------------------------------------------------
 */
/*
 * Push a new, zero-initialised expansion entry for macro ppp on the macro
 * expansion stack. Reports an error if the stack is full; does nothing
 * more if the entry cannot be allocated.
 */
static void push_macro(pp_entry_t *ppp)
{
	macexpstackentry_t *entry;

	if(macexpstackidx >= MAXMACEXPSTACK)
	{
		ppy_error("Too many nested macros");
		return;
	}

	entry = pp_xmalloc(sizeof(*entry));
	macexpstack[macexpstackidx] = entry;
	if(entry == NULL)
		return;

	memset(entry, 0, sizeof(*entry));
	entry->ppp = ppp;
	macexpstackidx++;
}

/*
 * Return the innermost macro expansion entry, or NULL if no macro is
 * being collected.
 */
static macexpstackentry_t *top_macro(void)
{
	if(macexpstackidx > 0)
		return macexpstack[macexpstackidx-1];
	return NULL;
}

static macexpstackentry_t *pop_macro(void)
{
	if(macexpstackidx <= 0)
1445
		pp_internal_error(__FILE__, __LINE__, "Macro expansion stack underflow\n");
1446 1447 1448 1449 1450 1451 1452 1453 1454
	return macexpstack[--macexpstackidx];
}

/*
 * Release a macro expansion entry and the argument storage it owns.
 */
static void free_macro(macexpstackentry_t *mep)
{
	int i;

	for(i = 0; i < mep->nargs; i++)
		free(mep->args[i]);
	free(mep->args);
	/*
	 * The ppargs array is allocated next to args and nnls in
	 * macro_add_arg() and was never released.
	 * NOTE(review): the strings stored in ppargs[] are left alone here
	 * because it is not evident that every slot has been assigned by
	 * macro_add_expansion(); confirm before freeing them as well.
	 */
	free(mep->ppargs);
	free(mep->nnls);
	free(mep->curarg);
	free(mep);
}

1461
static void add_text_to_macro(const char *text, int len)
1462 1463 1464 1465 1466
{
	macexpstackentry_t *mep = top_macro();

	assert(mep->ppp->expanding == 0);

1467
	if(mep->curargalloc - mep->curargsize <= len+1)	/* +1 for '\0' */
1468
	{
1469
		char *new_curarg;
1470
		int new_alloc =	mep->curargalloc + ((ALLOCBLOCKSIZE > len+1) ? ALLOCBLOCKSIZE : len+1);
1471 1472 1473 1474 1475
		new_curarg = pp_xrealloc(mep->curarg, new_alloc * sizeof(mep->curarg[0]));
		if(!new_curarg)
			return;
		mep->curarg = new_curarg;
		mep->curargalloc = new_alloc;
1476
	}
1477
	memcpy(mep->curarg + mep->curargsize, text, len);
1478
	mep->curargsize += len;
1479
	mep->curarg[mep->curargsize] = '\0';
1480 1481 1482 1483 1484 1485
}

static void macro_add_arg(int last)
{
	int nnl = 0;
	char *cptr;
1486 1487
	char **new_args, **new_ppargs;
	int *new_nnls;
1488 1489 1490 1491
	macexpstackentry_t *mep = top_macro();

	assert(mep->ppp->expanding == 0);

1492 1493 1494 1495 1496 1497 1498 1499 1500 1501 1502 1503 1504 1505 1506
	new_args = pp_xrealloc(mep->args, (mep->nargs+1) * sizeof(mep->args[0]));
	if(!new_args)
		return;
	mep->args = new_args;

	new_ppargs = pp_xrealloc(mep->ppargs, (mep->nargs+1) * sizeof(mep->ppargs[0]));
	if(!new_ppargs)
		return;
	mep->ppargs = new_ppargs;

	new_nnls = pp_xrealloc(mep->nnls, (mep->nargs+1) * sizeof(mep->nnls[0]));
	if(!new_nnls)
		return;
	mep->nnls = new_nnls;

1507
	mep->args[mep->nargs] = pp_xstrdup(mep->curarg ? mep->curarg : "");
1508 1509
	if(!mep->args[mep->nargs])
		return;
1510 1511 1512 1513 1514 1515 1516 1517 1518 1519 1520
	cptr = mep->args[mep->nargs]-1;
	while((cptr = strchr(cptr+1, '\n')))
	{
		nnl++;
	}
	mep->nnls[mep->nargs] = nnl;
	mep->nargs++;
	free(mep->curarg);
	mep->curargalloc = mep->curargsize = 0;
	mep->curarg = NULL;

1521
	if(pp_flex_debug)
1522
		fprintf(stderr, "macro_add_arg: %s:%d: %d -> '%s'\n",
1523 1524
			pp_status.input,
			pp_status.line_number,
1525 1526 1527 1528 1529 1530 1531 1532 1533 1534 1535 1536 1537 1538 1539 1540 1541 1542 1543
			mep->nargs-1,
			mep->args[mep->nargs-1]);

	/* Each macro argument must be expanded to cope with stingize */
	if(last || mep->args[mep->nargs-1][0])
	{
		yy_push_state(pp_macexp);
		push_buffer(NULL, NULL, NULL, last ? 2 : 1);
		yy_scan_string(mep->args[mep->nargs-1]);
		/*mep->bufferstackidx = bufferstackidx;	 But not nested! */
	}
}

static void macro_add_expansion(void)
{
	macexpstackentry_t *mep = top_macro();

	assert(mep->ppp->expanding == 0);

1544
	mep->ppargs[mep->nargs-1] = pp_xstrdup(mep->curarg ? mep->curarg : "");
1545 1546 1547 1548
	free(mep->curarg);
	mep->curargalloc = mep->curargsize = 0;
	mep->curarg = NULL;

1549
	if(pp_flex_debug)
1550
		fprintf(stderr, "macro_add_expansion: %s:%d: %d -> '%s'\n",
1551 1552
			pp_status.input,
			pp_status.line_number,
1553
			mep->nargs-1,
1554
			mep->ppargs[mep->nargs-1] ? mep->ppargs[mep->nargs-1] : "");
1555 1556 1557 1558 1559 1560 1561 1562
}


/*
 *-------------------------------------------------------------------------
 * Output management
 *-------------------------------------------------------------------------
 */
1563
static void put_buffer(const char *s, int len)
1564 1565 1566
{
	if(top_macro())
		add_text_to_macro(s, len);
1567
	else
Matteo Bruni's avatar
Matteo Bruni committed
1568
		wpp_callbacks->write(s, len);
1569 1570 1571 1572 1573 1574 1575 1576
}


/*
 *-------------------------------------------------------------------------
 * Include management
 *-------------------------------------------------------------------------
 */
1577
void pp_do_include(char *fname, int type)
1578 1579 1580 1581
{
	char *newpath;
	int n;
	includelogicentry_t *iep;
Matteo Bruni's avatar
Matteo Bruni committed
1582
	void *fp;
1583

1584 1585 1586
	if(!fname)
		return;

1587
	for(iep = pp_includelogiclist; iep; iep = iep->next)
1588 1589 1590 1591 1592 1593 1594 1595
	{
		if(!strcmp(iep->filename, fname))
		{
			/*
			 * We are done. The file was included before.
			 * If the define was deleted, then this entry would have
			 * been deleted too.
			 */
1596
			free(fname);
1597 1598 1599 1600 1601 1602 1603
			return;
		}
	}

	n = strlen(fname);

	if(n <= 2)
1604
	{
1605
		ppy_error("Empty include filename");
1606
		free(fname);
1607 1608
		return;
	}
1609 1610 1611 1612

	/* Undo the effect of the quotation */
	fname[n-1] = '\0';

1613
	if((fp = pp_open_include(fname+1, type, pp_status.input, &newpath)) == NULL)
1614
	{
1615
		ppy_error("Unable to open include file %s", fname+1);
1616
		free(fname);
1617 1618
		return;
	}
1619 1620 1621

	fname[n-1] = *fname;	/* Redo the quotes */
	push_buffer(NULL, newpath, fname, 0);
1622 1623 1624
	pp_incl_state.seen_junk = 0;
	pp_incl_state.state = 0;
	pp_incl_state.ppp = NULL;
1625

1626
	if(pp_status.debug)
1627 1628
		fprintf(stderr, "pp_do_include: %s:%d: include_state=%d, include_ppp='%s', include_ifdepth=%d\n",
                        pp_status.input, pp_status.line_number, pp_incl_state.state, pp_incl_state.ppp, pp_incl_state.ifdepth);
Matteo Bruni's avatar
Matteo Bruni committed
1629 1630
	pp_status.file = fp;
	ppy__switch_to_buffer(ppy__create_buffer(NULL, YY_BUF_SIZE));
1631

Matteo Bruni's avatar
Matteo Bruni committed
1632
	pp_writestring("# 1 \"%s\" 1%s\n", newpath, type ? "" : " 3");
1633 1634 1635 1636 1637 1638 1639 1640
}

/*
 *-------------------------------------------------------------------------
 * Push/pop preprocessor ignore state when processing conditionals
 * which are false.
 *-------------------------------------------------------------------------
 */
1641
void pp_push_ignore_state(void)
1642 1643 1644 1645
{
	yy_push_state(pp_ignore);
}

1646
/* Return to the start condition that was active before the last push. */
void pp_pop_ignore_state(void)
{
	yy_pop_state();
}