1 files changed, 1921 insertions, 0 deletions
diff --git a/libexec/auxcpp/macro.c b/libexec/auxcpp/macro.c
new file mode 100644
index 00000000000..5b9540c67c2
--- /dev/null
+++ b/libexec/auxcpp/macro.c
@@ -0,0 +1,1921 @@
+/*
+ * (c) Thomas Pornin 1999 - 2002
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ *    notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ *    notice, this list of conditions and the following disclaimer in the
+ *    documentation and/or other materials provided with the distribution.
+ * 4. The name of the authors may not be used to endorse or promote
+ *    products derived from this software without specific prior written
+ *    permission.
+ *
+ * THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR
+ * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
+ * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
+ * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE
+ * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+ * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT
+ * OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+ * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+ * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+ * OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
+ * EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ *
+ */
+
+#include "tune.h"
+#include <stdio.h>
+#include <string.h>
+#include <stddef.h>
+#include <limits.h>
+#include "ucppi.h"
+#include "mem.h"
+#include "nhash.h"
+
+/*
+ * we store macros in a hash table, and retrieve them using their name
+ * as identifier.
+ *
+ * "macros" is that table: the functions of this file insert entries
+ * with HTT_put() and look names up with HTT_get().
+ * "macros_init_done" starts at 0. NOTE(review): presumably it records
+ * whether "macros" has been initialized; it is not used in this part
+ * of the file -- confirm against the initialization code.
+ */
+static HTT macros;
+static int macros_init_done = 0;
+
+/*
+ * Release a macro and everything it owns: each argument name, the
+ * argument array, the replacement list (a compressed byte string in
+ * LOW_MEM mode, a token array otherwise) and the structure itself.
+ * The parameter is a void pointer that is used as a struct macro *.
+ */
+static void del_macro(void *m)
+{
+	struct macro *mac = m;
+	size_t k;
+
+	/* nothing is released here when narg is negative or zero */
+	for (k = 0; (int)k < mac->narg; k ++) {
+		freemem(mac->arg[k]);
+	}
+	if (mac->narg > 0) {
+		freemem(mac->arg);
+	}
+#ifdef LOW_MEM
+	if (mac->cval.length) {
+		freemem(mac->cval.t);
+	}
+#else
+	if (mac->val.nt) {
+		for (k = 0; k < mac->val.nt; k ++) {
+			/* tokens matched by S_TOKEN() carry an allocated name */
+			if (S_TOKEN(mac->val.t[k].type)) {
+				freemem(mac->val.t[k].name);
+			}
+		}
+		freemem(mac->val.t);
+	}
+#endif
+	freemem(mac);
+}
+
+/*
+ * Allocate a macro structure and put it in its initial state: no
+ * argument list (narg is -1), nesting count 0, empty replacement list
+ * and no variable argument part. The argument array pointer is not
+ * set here.
+ */
+static inline struct macro *new_macro(void)
+{
+	struct macro *fresh = getmem(sizeof(struct macro));
+
+	fresh->vaarg = 0;
+	fresh->nest = 0;
+	fresh->narg = -1;
+#ifdef LOW_MEM
+	fresh->cval.length = 0;
+#else
+	fresh->val.art = 0;
+	fresh->val.nt = 0;
+#endif
+	return fresh;
+}
+
+/*
+ * for special macros, and the "defined" operator
+ *
+ * MAC_NONE means "not special" and MAC_DEFINED stands for the
+ * "defined" operator. Every value from MAC_SPECIAL (that is, MAC_LINE)
+ * upwards denotes a macro that substitute_macro() handles itself
+ * instead of using a stored replacement list; this range includes
+ * MAC_PRAGMA.
+ */
+enum {
+	MAC_NONE, MAC_DEFINED,
+	MAC_LINE, MAC_FILE, MAC_DATE, MAC_TIME, MAC_STDC, MAC_PRAGMA
+};
+#define MAC_SPECIAL	MAC_LINE
+
+/*
+ * Classify a name:
+ *   MAC_DEFINED   for "defined"
+ *   MAC_PRAGMA    for "_Pragma"
+ *   MAC_LINE, MAC_FILE, MAC_DATE, MAC_TIME or MAC_STDC
+ *                 for __LINE__, __FILE__, __DATE__, __TIME__ and
+ *                 __STDC__, unless no_special_macros is set
+ *   MAC_NONE (0)  for everything else
+ */
+static inline int check_special_macro(char *name)
+{
+	static const struct {
+		const char *id;
+		int code;
+	} dunder[] = {
+		{ "__LINE__", MAC_LINE },
+		{ "__FILE__", MAC_FILE },
+		{ "__DATE__", MAC_DATE },
+		{ "__TIME__", MAC_TIME },
+		{ "__STDC__", MAC_STDC }
+	};
+	size_t k;
+
+	if (strcmp(name, "defined") == 0) return MAC_DEFINED;
+	/* the first two characters rule out most names cheaply */
+	if (name[0] != '_') return MAC_NONE;
+	if (name[1] == 'P')
+		return strcmp(name, "_Pragma") == 0 ? MAC_PRAGMA : MAC_NONE;
+	if (name[1] != '_' || no_special_macros) return MAC_NONE;
+	for (k = 0; k < sizeof dunder / sizeof dunder[0]; k ++)
+		if (strcmp(name, dunder[k].id) == 0) return dunder[k].code;
+	return MAC_NONE;
+}
+
+int c99_compliant = 1;	/* if set, __STDC_VERSION__ gets defined */
+int c99_hosted = 1;	/* if set, __STDC_HOSTED__ gets defined */
+
+/*
+ * Store into the macro table an object-like macro called "name" whose
+ * replacement list is the single NUMBER token spelled "value".
+ */
+static void add_special_number_macro(char *name, char *value)
+{
+	struct macro *m = new_macro();
+#ifdef LOW_MEM
+	size_t vlen = strlen(value) + 1;	/* with the final 0 */
+
+	/* one type byte, then the zero-terminated spelling */
+	m->cval.t = getmem(vlen + 1);
+	m->cval.t[0] = NUMBER;
+	mmv(m->cval.t + 1, value, vlen);
+	m->cval.length = vlen + 1;
+#else
+	struct token t;
+
+	t.type = NUMBER;
+	t.line = 0;
+	t.name = sdup(value);
+	aol(m->val.t, m->val.nt, t, TOKEN_LIST_MEMG);
+#endif
+	HTT_put(&macros, m, name);
+}
+
+/*
+ * add the special macros to the macro table: the five __XXX__ names
+ * get an empty entry, _Pragma gets one argument (named "foo"), and
+ * __STDC_VERSION__ / __STDC_HOSTED__ are added as ordinary numeric
+ * macros when c99_compliant / c99_hosted are set.
+ */
+static void add_special_macros(void)
+{
+	static char *const plain[] = {
+		"__LINE__", "__FILE__", "__DATE__", "__TIME__", "__STDC__"
+	};
+	struct macro *pragma;
+	size_t k;
+
+	for (k = 0; k < sizeof plain / sizeof plain[0]; k ++)
+		HTT_put(&macros, new_macro(), plain[k]);
+
+	pragma = new_macro();
+	pragma->narg = 1;
+	pragma->arg = getmem(sizeof(char *));
+	pragma->arg[0] = sdup("foo");
+	HTT_put(&macros, pragma, "_Pragma");
+
+	if (c99_compliant)
+		add_special_number_macro("__STDC_VERSION__", "199901L");
+	if (c99_hosted)
+		add_special_number_macro("__STDC_HOSTED__", "1");
+}
+
+#ifdef LOW_MEM
+/*
+ * We store macro arguments as a single-byte token MACROARG, followed
+ * by the argument number as a one or two-byte value. If the argument
+ * number is between 0 and 127 (inclusive), it is stored as such in
+ * a single byte. Otherwise, it is supposed to be a 15-bit number, with
+ * the 7 upper bits stored in the first byte (with the high bit set to 1)
+ * and the 8 lower bits in the second byte.
+ */
+#endif
+
+/*
+ * Write a macro to emit_output as a "#define" line: the name, the
+ * parameter list if there is one (with "..." for a variable argument
+ * part), then the replacement list in which each argument reference is
+ * spelled with the parameter name (or __VA_ARGS__). Special macros are
+ * only mentioned inside a comment. The parameter is a void pointer
+ * that is used as a struct macro *.
+ */
+static void print_macro(void *vm)
+{
+	struct macro *mac = vm;
+	char *id = HASH_ITEM_NAME(mac);
+	size_t k;
+
+	if (check_special_macro(id) != MAC_NONE) {
+		fprintf(emit_output, "/* #define %s */ /* special */\n", id);
+		return;
+	}
+	fprintf(emit_output, "#define %s", id);
+	if (mac->narg >= 0) {
+		size_t count = (size_t)(mac->narg);
+
+		fprintf(emit_output, "(");
+		for (k = 0; k < count; k ++) {
+			if (k) fprintf(emit_output, ", %s", mac->arg[k]);
+			else fprintf(emit_output, "%s", mac->arg[k]);
+		}
+		if (mac->vaarg) {
+			if (mac->narg) fputs(", ...", emit_output);
+			else fputs("...", emit_output);
+		}
+		fprintf(emit_output, ")");
+	}
+#ifdef LOW_MEM
+	if (mac->cval.length == 0) {
+		fputc('\n', emit_output);
+		return;
+	}
+	fputc(' ', emit_output);
+	k = 0;
+	while (k < mac->cval.length) {
+		int kind = mac->cval.t[k ++];
+
+		if (kind == MACROARG) {
+			/* one or two bytes of argument number follow */
+			unsigned anum = mac->cval.t[k ++];
+
+			if (anum >= 128) {
+				anum = (anum & 127U) << 8;
+				anum |= mac->cval.t[k ++];
+			}
+			if (anum == (unsigned)mac->narg)
+				fputs("__VA_ARGS__", emit_output);
+			else
+				fputs(mac->arg[anum], emit_output);
+		} else if (S_TOKEN(kind)) {
+			/* the zero-terminated spelling follows the type */
+			char *text = (char *)(mac->cval.t + k);
+
+			fputs(text, emit_output);
+			k += 1 + strlen(text);
+		} else {
+			fputs(operators_name[kind], emit_output);
+		}
+	}
+#else
+	if (mac->val.nt == 0) {
+		fputc('\n', emit_output);
+		return;
+	}
+	fputc(' ', emit_output);
+	for (k = 0; k < mac->val.nt; k ++) {
+		struct token *tok = mac->val.t + k;
+
+		if (tok->type != MACROARG) {
+			fputs(token_name(tok), emit_output);
+		} else if (tok->line == mac->narg) {
+			/* the line field of a MACROARG is the argument number */
+			fputs("__VA_ARGS__", emit_output);
+		} else {
+			fputs(mac->arg[(size_t)(tok->line)], emit_output);
+		}
+	}
+#endif
+	fputc('\n', emit_output);
+}
+
+/*
+ * Send a token to the output. With the LEXER flag set, a copy of the
+ * token (with its own copy of the name, if it has one) is appended to
+ * the output fifo of ls. Otherwise the spelling of the token is written
+ * with put_char(), preceded, if KEEP_OUTPUT is set, by as many newlines
+ * as needed to bring the output line up to the current line.
+ *
+ * If uz_line is not zero and the token line is negative, the token
+ * line is first set to uz_line.
+ */
+void print_token(struct lexer_state *ls, struct token *t, long uz_line)
+{
+	char *text;
+
+	if (uz_line && t->line < 0) t->line = uz_line;
+	if (ls->flags & LEXER) {
+		struct token copy = *t;
+
+		if (S_TOKEN(t->type)) {
+			copy.name = sdup(copy.name);
+			throw_away(ls->gf, copy.name);
+		}
+		aol(ls->output_fifo->t, ls->output_fifo->nt, copy,
+			TOKEN_LIST_MEMG);
+		return;
+	}
+	if (ls->flags & KEEP_OUTPUT) {
+		while (ls->oline < ls->line) put_char(ls, '\n');
+	}
+	if (S_TOKEN(t->type)) text = t->name;
+	else text = operators_name[t->type];
+	while (*text) {
+		put_char(ls, *text);
+		text ++;
+	}
+}
+
+/*
+ * Send a token to the output at a given line (this is for text output
+ * and unreplaced macros due to lack of arguments). With the LEXER flag
+ * set this is plain print_token(); otherwise the newline padding done
+ * for KEEP_OUTPUT goes up to nail_line instead of the current line.
+ */
+static void print_token_nailed(struct lexer_state *ls, struct token *t,
+	long nail_line)
+{
+	char *text;
+
+	if (ls->flags & LEXER) {
+		print_token(ls, t, 0);
+		return;
+	}
+	if (ls->flags & KEEP_OUTPUT) {
+		while (ls->oline < nail_line) put_char(ls, '\n');
+	}
+	if (S_TOKEN(t->type)) text = t->name;
+	else text = operators_name[t->type];
+	while (*text) {
+		put_char(ls, *text);
+		text ++;
+	}
+}
+
+/*
+ * send a reduced whitespace token to the output
+ *
+ * The token has type OPT_NONE and carries the current line of ls; its
+ * name field is left unset. The argument "ls" is evaluated more than
+ * once.
+ */
+#define print_space(ls)	do { \
+		struct token lt; \
+		lt.type = OPT_NONE; \
+		lt.line = (ls)->line; \
+		print_token((ls), &lt, 0); \
+	} while (0)
+
+/*
+ * We found a #define directive; parse the end of the line, perform
+ * sanity checks, store the new macro into the "macros" hash table.
+ *
+ * In case of a redefinition of a macro: we enforce the rule that a
+ * macro should be redefined identically, including the spelling of
+ * parameters. We emit an error on offending code; dura lex, sed lex.
+ * After all, it is easy to avoid such problems, with a #undef directive.
+ * "Identically" covers the kind of the macro (object-like or
+ * function-like), the number and names of the parameters, the presence
+ * of '...' and the replacement list.
+ *
+ * During a redefinition no new macro is built ("m" stays null): the
+ * incoming tokens are only compared with the stored macro "n".
+ *
+ * Returns 0 if the macro was stored or was an identical redefinition,
+ * and 1 if an error was reported.
+ */
+int handle_define(struct lexer_state *ls)
+{
+	struct macro *m = 0, *n;
+#ifdef LOW_MEM
+	struct token_fifo mv;
+#endif
+	int ltwws = 1, redef = 0;
+	char *mname = 0;
+	int narg;
+	size_t nt;
+	long l = ls->line;
+
+#ifdef LOW_MEM
+	mv.art = mv.nt = 0;
+#endif
+	/* find the next non-white token on the line, this should be
+	   the macro name */
+	while (!next_token(ls) && ls->ctok->type != NEWLINE) {
+		if (ttMWS(ls->ctok->type)) continue;
+		if (ls->ctok->type == NAME) mname = sdup(ls->ctok->name);
+		break;
+	}
+	if (mname == 0) {
+		error(l, "missing macro name");
+		return 1;
+	}
+	if (check_special_macro(mname)) {
+		error(l, "trying to redefine the special macro %s", mname);
+		goto warp_error;
+	}
+	/*
+	 * If a macro with this name was already defined: the K&R
+	 * states that the new macro should be identical to the old one
+	 * (with some arcane rule of equivalence of whitespace); otherwise,
+	 * redefining the macro is an error. Most preprocessors would
+	 * only emit a warning (or nothing at all) on an unidentical
+	 * redefinition.
+	 *
+	 * Since it is easy to avoid this error (with a #undef directive),
+	 * we choose to enforce the rule and emit an error.
+	 */
+	if ((n = HTT_get(&macros, mname)) != 0) {
+		/* redefinition of a macro: we must check that we define
+		   it identical */
+		redef = 1;
+#ifdef LOW_MEM
+		/* rp is the read position in the stored compressed list */
+		n->cval.rp = 0;
+#endif
+		freemem(mname);
+		mname = 0;
+	}
+	if (!redef) {
+		m = new_macro();
+		m->narg = -1;
+#ifdef LOW_MEM
+#define mval	mv
+#else
+#define mval	(m->val)
+#endif
+	}
+	if (next_token(ls)) {
+		/*
+		 * No more input after the name: this is an object-like
+		 * macro with an empty replacement list. For a redefinition
+		 * there is no new macro to finish ("m" is null), so we go
+		 * straight to the comparison with the stored macro.
+		 */
+		if (!redef) goto define_end;
+		if (n->narg >= 0) goto redef_error_2;
+		nt = 0;
+		goto redef_end;
+	}
+	/*
+	 * Check if the token immediately following the macro name is
+	 * a left parenthesis; if so, then this is a macro with arguments.
+	 * Collect their names and try to match the next parenthesis.
+	 */
+	if (ls->ctok->type == LPAR) {
+		int i, j;
+		int need_comma = 0, saw_mdots = 0;
+
+		narg = 0;
+		while (!next_token(ls)) {
+			if (ls->ctok->type == NEWLINE) {
+				error(l, "truncated macro definition");
+				goto define_error;
+			}
+			if (ls->ctok->type == COMMA) {
+				if (saw_mdots) {
+					error(l, "'...' must end the macro "
+						"argument list");
+					goto warp_error;
+				}
+				if (!need_comma) {
+					error(l, "void macro argument");
+					goto warp_error;
+				}
+				need_comma = 0;
+				continue;
+			} else if (ls->ctok->type == NAME) {
+				if (saw_mdots) {
+					error(l, "'...' must end the macro "
+						"argument list");
+					goto warp_error;
+				}
+				if (need_comma) {
+					error(l, "missing comma in "
+						"macro argument list");
+					goto warp_error;
+				}
+				if (!redef) {
+					aol(m->arg, narg,
+						sdup(ls->ctok->name), 8);
+					/* we must keep track of m->narg
+					   so that cleanup in case of
+					   error works. */
+					m->narg = narg;
+					if (narg == 128
+						&& (ls->flags & WARN_STANDARD))
+						warning(l, "more arguments to "
+							"macro than the ISO "
+							"limit (127)");
+#ifdef LOW_MEM
+					if (narg == 32767) {
+						error(l, "too many arguments "
+							"in macro definition "
+							"(max 32766)");
+						goto warp_error;
+					}
+#endif
+				} else {
+					/* this is a redefinition of the
+					   macro; check equality between
+					   old and new definitions */
+					if (narg >= n->narg) goto redef_error;
+					if (strcmp(ls->ctok->name,
+						n->arg[narg ++]))
+						goto redef_error;
+				}
+				need_comma = 1;
+				continue;
+			} else if ((ls->flags & MACRO_VAARG)
+				&& ls->ctok->type == MDOTS) {
+				if (need_comma) {
+					error(l, "missing comma before '...'");
+					goto warp_error;
+				}
+				if (redef && !n->vaarg) goto redef_error;
+				if (!redef) m->vaarg = 1;
+				saw_mdots = 1;
+				need_comma = 1;
+				continue;
+			} else if (ls->ctok->type == RPAR) {
+				if (narg > 0 && !need_comma) {
+					error(l, "void macro argument");
+					goto warp_error;
+				}
+				if (redef && n->vaarg && !saw_mdots)
+					goto redef_error;
+				/* the old macro must have exactly as many
+				   parameters (this also rejects an old
+				   object-like macro, whose narg is -1) */
+				if (redef && narg != n->narg)
+					goto redef_error;
+				break;
+			} else if (ttMWS(ls->ctok->type)) {
+				continue;
+			}
+			error(l, "invalid macro argument");
+			goto warp_error;
+		}
+		if (!redef) {
+			for (i = 1; i < narg; i ++) for (j = 0; j < i; j ++)
+				if (!strcmp(m->arg[i], m->arg[j])) {
+					error(l, "duplicate macro "
+						"argument");
+					goto warp_error;
+				}
+		}
+		if (!redef) m->narg = narg;
+	} else {
+		/* the new macro is object-like, so the old one must be
+		   object-like too; checked before READ_AGAIN is set so
+		   that the error path consumes the line as usual */
+		if (redef && n->narg >= 0) goto redef_error;
+		if (!ttWHI(ls->ctok->type) && (ls->flags & WARN_STANDARD))
+			warning(ls->line, "identifier not followed by "
+				"whitespace in #define");
+		/* the token belongs to the replacement list: have it
+		   delivered again by the next call to next_token() */
+		ls->flags |= READ_AGAIN;
+		narg = 0;
+	}
+	if (redef) nt = 0;
+
+	/* now, we have the arguments. Let's get the macro contents. */
+	while (!next_token(ls) && ls->ctok->type != NEWLINE) {
+		struct token t;
+
+		t.type = ls->ctok->type;
+		/* ltwws: "last token was whitespace"; leading and repeated
+		   whitespace is dropped */
+		if (ltwws && ttMWS(t.type)) continue;
+		t.line = 0;
+		if (t.type == NAME) {
+			int i;
+
+			if ((ls->flags & MACRO_VAARG)
+				&& !strcmp(ls->ctok->name, "__VA_ARGS__")) {
+				if (redef) {
+					if (!n->vaarg) goto redef_error;
+				} else if (!m->vaarg) {
+					error(l, "'__VA_ARGS__' is forbidden "
+						"in macros with a fixed "
+						"number of arguments");
+					goto warp_error;
+				}
+				/* __VA_ARGS__ is the argument numbered
+				   just after the named ones */
+				t.type = MACROARG;
+				t.line = redef ? n->narg : m->narg;
+			}
+			for (i = 0; i < narg; i ++)
+				if (!strcmp(redef ? n->arg[i] : m->arg[i],
+					ls->ctok->name)) {
+					t.type = MACROARG;
+					/* this is a hack: we store the
+					   argument number in the line field */
+					t.line = i;
+					break;
+				}
+		}
+		if (!redef && S_TOKEN(t.type)) t.name = sdup(ls->ctok->name);
+		if (ttMWS(t.type)) {
+			if (ltwws) continue;
+#ifdef SEMPER_FIDELIS
+			t.type = OPT_NONE;
+#else
+			t.type = NONE;
+#endif
+			ltwws = 1;
+		} else ltwws = 0;
+		if (!redef) {
+			/* we ensure that each macro token has a correct
+			   line number */
+			if (t.type != MACROARG) t.line = 1;
+			aol(mval.t, mval.nt, t, TOKEN_LIST_MEMG);
+		} else {
+#ifdef LOW_MEM
+			int tt;
+
+			if (n->cval.rp >= n->cval.length) {
+				/* the stored list is exhausted: only a
+				   trailing whitespace token is acceptable */
+#ifdef SEMPER_FIDELIS
+				if (t.type != OPT_NONE) goto redef_error;
+#else
+				if (t.type != NONE) goto redef_error;
+#endif
+			} else if (t.type != n->cval.t[n->cval.rp]) {
+				goto redef_error;
+			} else if (t.type == MACROARG) {
+				unsigned anum = n->cval.t[n->cval.rp + 1];
+
+				/* the stored macro is "n"; "m" is null
+				   during a redefinition */
+				if (anum >= 128U) anum = ((anum & 127U) << 8)
+					| n->cval.t[n->cval.rp + 2];
+				if (anum != (unsigned)t.line) goto redef_error;
+			} else if (S_TOKEN(t.type) && strcmp(ls->ctok->name,
+				   (char *)(n->cval.t + n->cval.rp + 1))) {
+				goto redef_error;
+			}
+			/* step over the stored token that was just matched;
+			   there is none when the stored list is exhausted,
+			   and reading there would leave the buffer */
+			if (n->cval.rp < n->cval.length) {
+				tt = n->cval.t[n->cval.rp ++];
+				if (S_TOKEN(tt)) n->cval.rp += 1
+					+ strlen((char *)(n->cval.t
+						+ n->cval.rp));
+				else if (tt == MACROARG) {
+					/* the first number byte tells
+					   whether a second one follows */
+					if (n->cval.t[n->cval.rp ++] >= 128)
+						n->cval.rp ++;
+				}
+			}
+#else
+			if (nt >= n->val.nt) {
+#ifdef SEMPER_FIDELIS
+				if (t.type != OPT_NONE) goto redef_error;
+#else
+				if (t.type != NONE) goto redef_error;
+#endif
+			} else if (t.type != n->val.t[nt].type
+				|| (t.type == MACROARG
+				    && t.line != n->val.t[nt].line)
+				|| (S_TOKEN(t.type) && strcmp(ls->ctok->name,
+				   n->val.t[nt].name))) {
+				goto redef_error;
+			}
+#endif
+			nt ++;
+		}
+	}
+
+redef_end:
+	if (redef) {
+		/* the new list must not be shorter than the stored one */
+#ifdef LOW_MEM
+		if (n->cval.rp < n->cval.length) goto redef_error_2;
+#else
+		if (nt < n->val.nt) goto redef_error_2;
+#endif
+		return 0;
+	}
+
+	/* now we have the complete macro; perform some checks about
+	   the operators # and ##, and, if everything is ok,
+	   store the macro into the hash table */
+define_end:
+	/* a trailing whitespace token is not part of the macro */
+#ifdef SEMPER_FIDELIS
+	if (mval.nt && mval.t[mval.nt - 1].type == OPT_NONE) {
+#else
+	if (mval.nt && mval.t[mval.nt - 1].type == NONE) {
+#endif
+		mval.nt --;
+		if (mval.nt == 0) freemem(mval.t);
+	}
+	if (mval.nt != 0) {
+		size_t i;
+
+		/* some checks about the macro */
+		if (mval.t[0].type == DSHARP
+			|| mval.t[0].type == DIG_DSHARP
+			|| mval.t[mval.nt - 1].type == DSHARP
+			|| mval.t[mval.nt - 1].type == DIG_DSHARP) {
+			error(l, "operator '##' may neither begin "
+				"nor end a macro");
+			goto define_error;
+		}
+		/* in a function-like macro, '#' must be followed (possibly
+		   after one whitespace token) by a macro argument */
+		if (m->narg >= 0) for (i = 0; i < mval.nt; i ++)
+			if ((mval.t[i].type == SHARP
+				|| mval.t[i].type == DIG_SHARP) &&
+				(i == (mval.nt - 1)
+				|| (ttMWS(mval.t[i + 1].type) &&
+				    (i == mval.nt - 2
+				     || mval.t[i + 2].type != MACROARG))
+				|| (!ttMWS(mval.t[i + 1].type)
+				     && mval.t[i + 1].type != MACROARG))) {
+				error(l, "operator '#' not followed "
+					"by a macro argument");
+				goto define_error;
+			}
+	}
+#ifdef LOW_MEM
+	{
+		size_t i, l;
+
+		/* first pass: size of the compressed list */
+		for (i = 0, l = 0; i < mval.nt; i ++) {
+			l ++;
+			if (S_TOKEN(mval.t[i].type))
+				l += 1 + strlen(mval.t[i].name);
+			else if (mval.t[i].type == MACROARG) {
+				l ++;
+				if (mval.t[i].line >= 128) l ++;
+			}
+		}
+		m->cval.length = l;
+		if (l) m->cval.t = getmem(l);
+		/* second pass: type byte, then either the spelling with
+		   its final 0 or the argument number on one or two bytes */
+		for (i = 0, l = 0; i < mval.nt; i ++) {
+			m->cval.t[l ++] = mval.t[i].type;
+			if (S_TOKEN(mval.t[i].type)) {
+				size_t x = 1 + strlen(mval.t[i].name);
+
+				mmv(m->cval.t + l, mval.t[i].name, x);
+				l += x;
+				freemem(mval.t[i].name);
+			}
+			else if (mval.t[i].type == MACROARG) {
+				unsigned anum = mval.t[i].line;
+
+				if (anum >= 128) {
+					m->cval.t[l ++] = 128 | (anum >> 8);
+					m->cval.t[l ++] = anum & 0xFF;
+				} else {
+					m->cval.t[l ++] = anum;
+				}
+			}
+		}
+		if (mval.nt) freemem(mval.t);
+	}
+#endif
+	HTT_put(&macros, m, mname);
+	freemem(mname);
+	if (emit_defines) print_macro(m);
+	return 0;
+
+redef_error:
+	/* skip the rest of the line, then report */
+	while (ls->ctok->type != NEWLINE && !next_token(ls));
+redef_error_2:
+	error(l, "macro '%s' redefined unidentically", HASH_ITEM_NAME(n));
+	return 1;
+warp_error:
+	/* the error was already reported: skip the rest of the line */
+	while (ls->ctok->type != NEWLINE && !next_token(ls));
+define_error:
+	if (m) del_macro(m);
+	if (mname) freemem(mname);
+#ifdef LOW_MEM
+	if (mv.nt) {
+		size_t i;
+
+		for (i = 0; i < mv.nt; i ++)
+			if (S_TOKEN(mv.t[i].type)) freemem(mv.t[i].name);
+		freemem(mv.t);
+	}
+#endif
+	return 1;
+#undef mval
+}
+
+/*
+ * Get the arguments for a macro. This code is tricky because there can
+ * be multiple sources for these arguments, if we are in the middle of
+ * a macro replacement; arguments are macro-replaced before inclusion
+ * into the macro replacement.
+ *
+ * Tokens are taken from tfi as long as it has some (tfi may be null);
+ * after that, they are taken from ls with next_token(), but only if
+ * tfi is null or penury is non-zero.
+ *
+ * atl must point to narg token lists (one more if vaarg is set); they
+ * are reset here and each one receives the tokens of one argument.
+ * atl is not accessed when both narg and vaarg are zero.
+ * *wr is set to 1 if whitespace was skipped while looking for the
+ * opening parenthesis, to 0 otherwise.
+ *
+ * return value:
+ * 0	arguments collected
+ * 1	no argument (last token read from next_token())
+ * 2    no argument (last token read from tfi)
+ * 3    no argument (nothing read)
+ * 4	error
+ *
+ * Void arguments are allowed in C99.
+ */
+static int collect_arguments(struct lexer_state *ls, struct token_fifo *tfi,
+	int penury, struct token_fifo *atl, int narg, int vaarg, int *wr)
+{
+	int ltwws = 1, npar = 0, i;
+	struct token *ct = 0;
+	int read_from_fifo = 0;
+	long begin_line = ls->line;
+
+/* fetch the next token into ct; evaluates to non-zero if there is none */
+#define unravel(ls)	(read_from_fifo = 0, !((tfi && tfi->art < tfi->nt \
+	&& (read_from_fifo = 1) != 0 && (ct = tfi->t + (tfi->art ++))) \
+	|| ((!tfi || penury) && !next_token(ls) && (ct = (ls)->ctok))))
+
+	/*
+	 * collect_arguments() is assumed to setup correctly atl
+	 * (this is not elegant, but it works)
+	 */
+	for (i = 0; i < narg; i ++) atl[i].art = atl[i].nt = 0;
+	if (vaarg) atl[narg].art = atl[narg].nt = 0;
+	*wr = 0;
+	/* look for the opening parenthesis, skipping whitespace */
+	while (!unravel(ls)) {
+		if (!read_from_fifo && ct->type == NEWLINE) ls->ltwnl = 1;
+		if (ttWHI(ct->type)) {
+			*wr = 1;
+			continue;
+		}
+		if (ct->type == LPAR) {
+			npar = 1;
+		}
+		break;
+	}
+	if (!npar) {
+		if (ct == ls->ctok) return 1;
+		if (read_from_fifo) return 2;
+		return 3;
+	}
+	if (!read_from_fifo && ct == ls->ctok) ls->ltwnl = 0;
+	i = 0;
+	if ((narg + vaarg) == 0) {
+		/* no parameter at all: only whitespace may come before
+		   the closing parenthesis */
+		while(!unravel(ls)) {
+			if (ttWHI(ct->type)) continue;
+			if (ct->type == RPAR) goto harvested;
+			npar = 1;
+			goto too_many_args;
+		}
+		/*
+		 * No more tokens. We must not fall into the general
+		 * loop below: it stores tokens into atl[0], and there
+		 * is no such list for a macro without parameters.
+		 */
+		error(begin_line, "unfinished macro call");
+		return 4;
+	}
+	while (!unravel(ls)) {
+		struct token t;
+
+		if (ct->type == LPAR) npar ++;
+		else if (ct->type == RPAR && (-- npar) == 0) {
+			/* end of the call: drop a trailing whitespace
+			   token from the last argument */
+			if (atl[i].nt != 0
+				&& ttMWS(atl[i].t[atl[i].nt - 1].type))
+					atl[i].nt --;
+			i ++;
+			/*
+			 * C99 standard states that at least one argument
+			 * should be present for the ... part; to relax
+			 * this behaviour, change 'narg + vaarg' to 'narg'.
+			 */
+			if (i < (narg + vaarg)) {
+				error(begin_line, "not enough arguments "
+					"to macro");
+				return 4;
+			}
+			if (i > narg) {
+				if (!(ls->flags & MACRO_VAARG) || !vaarg)
+					goto too_many_args;
+			}
+			goto harvested;
+		} else if (ct->type == COMMA && npar <= 1 && i < narg) {
+			/* a top-level comma ends the current named
+			   argument; commas in the '...' part are kept */
+			if (atl[i].nt != 0
+				&& ttMWS(atl[i].t[atl[i].nt - 1].type))
+					atl[i].nt --;
+			if (++ i == narg) {
+				if (!(ls->flags & MACRO_VAARG) || !vaarg)
+					goto too_many_args;
+			}
+			if (i > 30000) goto too_many_args;
+			ltwws = 1;
+			continue;
+		} else if (ltwws && ttWHI(ct->type)) continue;
+
+		t.type = ct->type;
+		if (!read_from_fifo) t.line = ls->line; else t.line = ct->line;
+		/*
+		 * Stringification applies only to macro arguments;
+		 * so we handle here OPT_NONE.
+		 * OPT_NONE is kept, but does not count as whitespace,
+		 * and merges with other whitespace to give a fully
+		 * qualified NONE token. Two OPT_NONE tokens merge.
+		 * Initial and final OPT_NONE are discarded (initial
+		 * is already done, as OPT_NONE is matched by ttWHI).
+		 */
+		if (ttWHI(t.type)) {
+			if (t.type != OPT_NONE) {
+				t.type = NONE;
+#ifdef SEMPER_FIDELIS
+				t.name = sdup(" ");
+				throw_away(ls->gf, t.name);
+#endif
+				ltwws = 1;
+			}
+			if (atl[i].nt > 0
+				&& atl[i].t[atl[i].nt - 1].type == OPT_NONE)
+					atl[i].nt --;
+		} else {
+			ltwws = 0;
+			if (S_TOKEN(t.type)) {
+				t.name = ct->name;
+				/* a token coming from the lexer gets its
+				   own copy of the name */
+				if (ct == (ls)->ctok) {
+					t.name = sdup(t.name);
+					throw_away(ls->gf, t.name);
+				}
+			}
+		}
+		aol(atl[i].t, atl[i].nt, t, TOKEN_LIST_MEMG);
+	}
+	error(begin_line, "unfinished macro call");
+	return 4;
+too_many_args:
+	error(begin_line, "too many arguments to macro");
+	/* skip up to the parenthesis that closes the call */
+	while (npar && !unravel(ls)) {
+		if (ct->type == LPAR) npar ++;
+		else if (ct->type == RPAR) npar --;
+	}
+	return 4;
+harvested:
+	if (i > 127 && (ls->flags & WARN_STANDARD))
+		warning(begin_line, "macro call with %d arguments (ISO "
+			"specifies 127 max)", i);
+	return 0;
+#undef unravel
+}
+
+/*
+ * concat_token() is called when the ## operator is used. The names of
+ * the two tokens are glued together and the result is handed, as an
+ * input string, to the struct lexer_state dsharp_lexer, from which one
+ * token is read.
+ *
+ * Law enforcement: if the whole string does not produce a valid
+ * single token, an error (non-zero result) is returned; the result is
+ * zero otherwise.
+ */
+struct lexer_state dsharp_lexer;
+
+static inline int concat_token(struct token *t1, struct token *t2)
+{
+	char *left = token_name(t1), *right = token_name(t2);
+	size_t llen = strlen(left), rlen = strlen(right);
+	size_t total = llen + rlen;
+	unsigned char *glued = getmem(total + 1);
+	int status;
+
+	mmv(glued, left, llen);
+	mmv(glued + llen, right, rlen);
+	glued[total] = 0;
+
+	/* make dsharp_lexer read from the glued string */
+	dsharp_lexer.input = 0;
+	dsharp_lexer.input_string = glued;
+	dsharp_lexer.pbuf = 0;
+	dsharp_lexer.ebuf = total;
+	dsharp_lexer.discard = 1;
+	dsharp_lexer.flags = DEFAULT_LEXER_FLAGS;
+	dsharp_lexer.pending_token = 0;
+
+	status = next_token(&dsharp_lexer);
+	freemem(glued);
+
+	if (status == 1) return 1;
+	/* part of the string was left unread */
+	if (dsharp_lexer.pbuf < total) return 1;
+	if (dsharp_lexer.pending_token) return 1;
+	return dsharp_lexer.pbuf == total && !dsharp_lexer.discard;
+}
+
+#ifdef PRAGMA_TOKENIZE
+/*
+ * tokenize_string() takes a string as input, and split it into tokens,
+ * reassembling the tokens into a single compressed string generated by
+ * compress_token_list(); this function is used for _Pragma processing.
+ *
+ * Whitespace tokens are dropped. The lexer flags are those of ls, plus
+ * LEXER. If the string was not read up to its end, everything that was
+ * collected is released and a null pointer is returned.
+ */
+struct lexer_state tokenize_lexer;
+
+static char *tokenize_string(struct lexer_state *ls, char *buf)
+{
+	struct token_fifo list;
+	size_t len = strlen(buf);
+	size_t k;
+
+	tokenize_lexer.input = 0;
+	tokenize_lexer.input_string = (unsigned char *)buf;
+	tokenize_lexer.pbuf = 0;
+	tokenize_lexer.ebuf = len;
+	tokenize_lexer.discard = 1;
+	tokenize_lexer.flags = ls->flags | LEXER;
+	tokenize_lexer.pending_token = 0;
+	list.art = list.nt = 0;
+
+	while (!next_token(&tokenize_lexer)) {
+		struct token *cur = tokenize_lexer.ctok;
+		struct token copy;
+
+		if (ttWHI(cur->type)) continue;
+		copy = *cur;
+		if (S_TOKEN(copy.type)) copy.name = sdup(copy.name);
+		aol(list.t, list.nt, copy, TOKEN_LIST_MEMG);
+	}
+	if (tokenize_lexer.pbuf >= len)
+		return (char *)((compress_token_list(&list)).t);
+
+	/* the lexer stopped early: release the collected tokens */
+	if (list.nt) {
+		for (k = 0; k < list.nt; k ++)
+			if (S_TOKEN(list.t[k].type))
+				freemem(list.t[k].name);
+		freemem(list.t);
+	}
+	return 0;
+}
+#endif
+
+/*
+ * stringify_string() has a self-explanatory name. It is called when
+ * the # operator is used in a macro and a string constant must be
+ * stringified.
+ *
+ * The result is a newly allocated string: the input between double
+ * quotes, with a backslash inserted before each '"' and before each
+ * '\' found inside a string literal or a character constant. The
+ * caller must release it.
+ *
+ * The work is done in two passes over x: the first one only computes
+ * the size of the result, the second one writes it. The scanner state
+ * is reset at the start of each pass, so that both passes take the
+ * same decisions and the second one never writes more than what the
+ * first one counted.
+ */
+static inline char *stringify_string(char *x)
+{
+	size_t l;
+	int pass;
+	char *y, *d = 0;
+
+	for (pass = 0; pass < 2; pass ++) {
+		/* the delimiter of the literal we are in, 0 outside */
+		int delim = 0;
+		/* set when the previous character was a backslash that
+		   escapes the current one */
+		int escaped = 0;
+
+		if (pass) d[0] = '"';
+		for (l = 1, y = x; *y; y ++, l ++) {
+			int must_quote = 0;
+
+			if (delim) {
+				if (*y == '"' || *y == '\\') must_quote = 1;
+				if (escaped) {
+					/* an escaped character never ends
+					   the literal nor escapes the
+					   next one */
+					escaped = 0;
+				} else if (*y == '\\') {
+					escaped = 1;
+				} else if (*y == delim) {
+					delim = 0;
+				}
+			} else if (*y == '"') {
+				delim = '"';
+				must_quote = 1;
+			} else if (*y == '\'') {
+				delim = '\'';
+			}
+			if (must_quote) {
+				if (pass) d[l] = '\\';
+				l ++;
+			}
+			if (pass) d[l] = *y;
+		}
+		if (!pass) {
+			/* l counts the opening quote and the contents;
+			   add the closing quote and the final 0 */
+			d = getmem(l + 2);
+		} else {
+			d[l] = '"';
+			d[l + 1] = 0;
+		}
+	}
+	return d;
+}
+
+/*
+ * stringify() produces a constant string, result of the # operator
+ * on a list of tokens: the names of the tokens are concatenated
+ * (tokens whose type is OPT_NONE, or CPPERR and above, are skipped)
+ * and the result goes through stringify_string(). An empty
+ * concatenation yields the empty string literal. The returned string
+ * is newly allocated.
+ */
+static char *stringify(struct token_fifo *tf)
+{
+	size_t total = 0, k;
+	char *raw, *cursor, *quoted;
+
+	for (k = 0; k < tf->nt; k ++) {
+		struct token *tok = tf->t + k;
+
+		if (tok->type >= CPPERR || tok->type == OPT_NONE) continue;
+		total += strlen(token_name(tok));
+	}
+	if (total == 0) return sdup("\"\"");
+
+	raw = getmem(total + 1);
+	cursor = raw;
+	for (k = 0; k < tf->nt; k ++) {
+		struct token *tok = tf->t + k;
+
+		if (tok->type >= CPPERR || tok->type == OPT_NONE) continue;
+		/* strcpy() also writes the final 0, which the next copy
+		   overwrites */
+		strcpy(cursor, token_name(tok));
+		cursor += strlen(cursor);
+	}
+	quoted = stringify_string(raw);
+	freemem(raw);
+	return quoted;
+}
+
+/*
+ * Two strings evaluated at initialization time, to handle the __TIME__
+ * and __DATE__ special macros.
+ *
+ * C99 specifies that these macros should remain constant throughout
+ * the whole preprocessing.
+ *
+ * substitute_macro() uses these buffers, unchanged, as the name of the
+ * STRING token it emits for __TIME__ and __DATE__. NOTE(review): they
+ * presumably hold the text with its enclosing double quotes; the code
+ * that fills them is not in this part of the file -- confirm.
+ */
+char compile_time[12], compile_date[24];
+
+/*
+ * substitute_macro() performs the macro substitution. It is called when
+ * an identifier recognized as a macro name has been found; this function
+ * tries to collect the arguments (if needed), applies # and ## operators
+ * and perform recursive and nested macro expansions.
+ *
+ * In the substitution of a macro, we remove all newlines that were in the
+ * arguments. This might confuse error reporting (which could report
+ * erroneous line numbers) or have worse effect is the preprocessor is
+ * used for another language pickier than C. Since the interface between
+ * the preprocessor and the compiler is not fully specified, I believe
+ * that this is no violation of the standard. Comments welcome.
+ *
+ * We take tokens from tfi. If tfi has no more tokens to give: we may
+ * take some tokens from ls to complete a call (fetch arguments) if
+ * and only if penury is non zero.
+ */
+int substitute_macro(struct lexer_state *ls, struct macro *m,
+	struct token_fifo *tfi, int penury, int reject_nested, long l)
+{
+	char *mname = HASH_ITEM_NAME(m);
+	struct token_fifo *atl, etl;
+	struct token t, *ct;
+	int i, save_nest = m->nest;
+	size_t save_art, save_tfi, etl_limit;
+	int ltwds, ntwds, ltwws;
+	int pragma_op = 0;
+
+	/*
+	 * Reject the replacement, if we are already inside the macro.
+	 */
+	if (m->nest > reject_nested) {
+		t.type = NAME;
+		t.line = ls->line;
+		t.name = mname;
+		print_token(ls, &t, 0);
+		return 0;
+	}
+
+	/*
+	 * put a separation from preceeding tokens
+	 */
+	print_space(ls);
+
+	/*
+	 * Check if the macro is a special one.
+	 */
+	if ((i = check_special_macro(mname)) >= MAC_SPECIAL) {
+		/* we have a special macro */
+		switch (i) {
+			char buf[30], *bbuf, *cfn;
+
+		case MAC_LINE:
+			t.type = NUMBER;
+			t.line = l;
+			sprintf(buf, "%ld", l);
+			t.name = buf;
+			print_space(ls);
+			print_token(ls, &t, 0);
+			break;
+		case MAC_FILE:
+			t.type = STRING;
+			t.line = l;
+			cfn = current_long_filename ?
+				current_long_filename : current_filename;
+			bbuf = getmem(2 * strlen(cfn) + 3);
+			{
+				char *c, *d;
+				int lcwb = 0;
+
+				bbuf[0] = '"';
+				for (c = cfn, d = bbuf + 1; *c; c ++) {
+					if (*c == '\\') {
+						if (lcwb) continue;
+						*(d ++) = '\\';
+						lcwb = 1;
+					} else lcwb = 0;
+					*(d ++) = *c;
+				}
+				*(d ++) = '"';
+				*(d ++) = 0;
+			}
+			t.name = bbuf;
+			print_space(ls);
+			print_token(ls, &t, 0);
+			freemem(bbuf);
+			break;
+		case MAC_DATE:
+			t.type = STRING;
+			t.line = l;
+			t.name = compile_date;
+			print_space(ls);
+			print_token(ls, &t, 0);
+			break;
+		case MAC_TIME:
+			t.type = STRING;
+			t.line = l;
+			t.name = compile_time;
+			print_space(ls);
+			print_token(ls, &t, 0);
+			break;
+		case MAC_STDC:
+			t.type = NUMBER;
+			t.line = l;
+			t.name = "1";
+			print_space(ls);
+			print_token(ls, &t, 0);
+			break;
+		case MAC_PRAGMA:
+			if (reject_nested > 0) {
+				/* do not replace _Pragma() unless toplevel */
+				t.type = NAME;
+				t.line = ls->line;
+				t.name = mname;
+				print_token(ls, &t, 0);
+				return 0;
+			}
+			pragma_op = 1;
+			goto collect_args;
+#ifdef AUDIT
+		default:
+			ouch("unbekanntes fliegendes macro");
+#endif
+		}
+		return 0;
+	}
+
+	/*
+	 * If the macro has arguments, collect them.
+	 */
+collect_args:
+	if (m->narg >= 0) {
+		unsigned long save_flags = ls->flags;
+		int wr = 0;
+
+		ls->flags |= LEXER;
+		if (m->narg > 0 || m->vaarg)
+			atl = getmem((m->narg + m->vaarg)
+				* sizeof(struct token_fifo));
+		switch (collect_arguments(ls, tfi, penury, atl,
+			m->narg, m->vaarg, &wr)) {
+		case 1:
+			/* the macro expected arguments, but we did not
+			   find any; the last read token should be read
+			   again. */
+			ls->flags = save_flags | READ_AGAIN;
+			goto no_argument_next;
+		case 2:
+			tfi->art --;
+			/* fall through */
+		case 3:
+			ls->flags = save_flags;
+		no_argument_next:
+			t.type = NAME;
+			t.line = l;
+			t.name = mname;
+			print_token_nailed(ls, &t, l);
+			if (wr) {
+				t.type = NONE;
+				t.line = l;
+#ifdef SEMPER_FIDELIS
+				t.name = " ";
+#endif
+				print_token(ls, &t, 0);
+				goto exit_macro_2;
+			}
+			goto exit_macro_1;
+		case 4:
+			ls->flags = save_flags;
+			goto exit_error_1;
+		}
+		ls->flags = save_flags;
+	}
+
+	/*
+	 * If the macro is _Pragma, and we got here, then we have
+	 * exactly one argument. We check it, unstringize it, and
+	 * emit a PRAGMA token.
+	 */
+	if (pragma_op) {
+		char *pn;
+
+		if (atl[0].nt != 1 || atl[0].t[0].type != STRING) {
+			error(ls->line, "invalid argument to _Pragma");
+			if (atl[0].nt) freemem(atl[0].t);
+			freemem(atl);
+			goto exit_error;
+		}
+		pn = atl[0].t[0].name;
+		if ((pn[0] == '"' && pn[1] == '"') || (pn[0] == 'L'
+			&& pn[1] == '"' && pn[2] == '"')) {
+			/* void pragma -- just ignore it */
+			freemem(atl[0].t);
+			freemem(atl);
+			return 0;
+		}
+		if (ls->flags & TEXT_OUTPUT) {
+#ifdef PRAGMA_DUMP
+	/*
+	 * This code works because we actually evaluate arguments in a
+	 * lazy way: we scan a macro argument only if it appears in the
+	 * output, and exactly as many times as it appears. Therefore,
+	 * _Pragma() will get evaluated just like they should.
+	 */
+			char *c = atl[0].t[0].name, *d;
+
+			for (d = "\n#pragma "; *d; d ++) put_char(ls, *d);
+			d = (*c == 'L') ? c + 2 : c + 1;
+			for (; *d != '"'; d ++) {
+				if (*d == '\\' && (*(d + 1) == '\\'
+					|| *(d + 1) == '"')) {
+					d ++;
+				}
+				put_char(ls, *d);
+			}
+			put_char(ls, '\n');
+			ls->oline = ls->line;
+			enter_file(ls, ls->flags);
+#else
+			if (ls->flags & WARN_PRAGMA)
+				warning(ls->line,
+					"_Pragma() ignored and not dumped");
+#endif
+		} else if (ls->flags & HANDLE_PRAGMA) {
+			char *c = atl[0].t[0].name, *d, *buf;
+			struct token t;
+
+			/* a wide string is a string */
+			if (*c == 'L') c ++;
+			c ++;
+			for (buf = d = getmem(strlen(c)); *c != '"'; c ++) {
+				if (*c == '\\' && (*(c + 1) == '\\'
+					|| *(c + 1) == '"')) {
+					*(d ++) = *(++ c);
+				} else *(d ++) = *c;
+			}
+			*d = 0;
+			t.type = PRAGMA;
+			t.line = ls->line;
+#ifdef PRAGMA_TOKENIZE
+			t.name = tokenize_string(ls, buf);
+			freemem(buf);
+			buf = t.name;
+			if (!buf) {
+				freemem(atl[0].t);
+				freemem(atl);
+				goto exit_error;
+			}
+#else
+			t.name = buf;
+#endif
+			aol(ls->toplevel_of->t, ls->toplevel_of->nt,
+				t, TOKEN_LIST_MEMG);
+			throw_away(ls->gf, buf);
+		}
+		freemem(atl[0].t);
+		freemem(atl);
+		return 0;
+	}
+
+	/*
+	 * Now we expand and replace the arguments in the macro; we
+	 * also handle '#' and '##'. If we find an argument, that has
+	 * to be replaced, we expand it in its own token list, then paste
+	 * it. Tricky point: when we paste an argument, we must scan
+	 * again the resulting list for further replacements. This
+	 * implies problems with regards to nesting self-referencing
+	 * macros.
+	 *
+	 * We do then YAUH (yet another ugly hack): if a macro is replaced,
+	 * and nested replacement exhibit the same macro, we mark it with
+	 * a negative line number. All produced negative line numbers
+	 * must be cleaned in the end.
+	 */
+
+#define ZAP_LINE(t)	do { \
+		if ((t).type == NAME) { \
+			struct macro *zlm = HTT_get(&macros, (t).name); \
+			if (zlm && zlm->nest > reject_nested) \
+				(t).line = -1 - (t).line; \
+		} \
+	} while (0)
+
+#ifdef LOW_MEM
+	save_art = m->cval.rp;
+	m->cval.rp = 0;
+#else
+	save_art = m->val.art;
+	m->val.art = 0;
+#endif
+	etl.art = etl.nt = 0;
+	m->nest = reject_nested + 1;
+	ltwds = ntwds = 0;
+#ifdef LOW_MEM
+	while (m->cval.rp < m->cval.length) {
+#else
+	while (m->val.art < m->val.nt) {
+#endif
+		size_t next, z;
+#ifdef LOW_MEM
+		struct token uu;
+
+		ct = &uu;
+		ct->line = 1;
+		t.type = ct->type = m->cval.t[m->cval.rp ++];
+		if (ct->type == MACROARG) {
+			unsigned anum = m->cval.t[m->cval.rp ++];
+
+			if (anum >= 128U) anum = ((anum & 127U) << 8)
+				| (unsigned)m->cval.t[m->cval.rp ++];
+			ct->line = anum;
+		} else if (S_TOKEN(ct->type)) {
+			t.name = ct->name = (char *)(m->cval.t + m->cval.rp);
+			m->cval.rp += 1 + strlen(ct->name);
+		}
+#ifdef SEMPER_FIDELIS
+		else if (ct->type == OPT_NONE) {
+			t.type = ct->type = NONE;
+			t.name = ct->name = " ";
+		}
+#endif
+		t.line = ls->line;
+		next = m->cval.rp;
+		if ((next < m->cval.length && (m->cval.t[z = next] == DSHARP
+			|| m->cval.t[z = next] == DIG_DSHARP))
+			|| ((next + 1) < m->cval.length
+			   && ttWHI(m->cval.t[next])
+			   && (m->cval.t[z = next + 1] == DSHARP
+			    || m->cval.t[z = next + 1] == DIG_DSHARP))) {
+			ntwds = 1;
+			m->cval.rp = z;
+		} else ntwds = 0;
+#else
+		ct = m->val.t + (m->val.art ++);
+		next = m->val.art;
+		t.type = ct->type;
+		t.line = ls->line;
+#ifdef SEMPER_FIDELIS
+		if (t.type == OPT_NONE) {
+			t.type = NONE;
+			t.name = " ";
+		} else
+#endif
+		t.name = ct->name;
+		if ((next < m->val.nt && (m->val.t[z = next].type == DSHARP
+			|| m->val.t[z = next].type == DIG_DSHARP))
+			|| ((next + 1) < m->val.nt
+			   && ttWHI(m->val.t[next].type)
+			   && (m->val.t[z = next + 1].type == DSHARP
+			    || m->val.t[z = next + 1].type == DIG_DSHARP))) {
+			ntwds = 1;
+			m->val.art = z;
+		} else ntwds = 0;
+#endif
+		if (ct->type == MACROARG) {
+#ifdef DSHARP_TOKEN_MERGE
+			int need_opt_space = 1;
+#endif
+			z = ct->line;	/* the argument number is there */
+			if (ltwds && atl[z].nt != 0 && etl.nt) {
+				if (concat_token(etl.t + (-- etl.nt),
+					atl[z].t)) {
+					warning(ls->line, "operator '##' "
+						"produced the invalid token "
+						"'%s%s'",
+						token_name(etl.t + etl.nt),
+						token_name(atl[z].t));
+#if 0
+/* obsolete */
+#ifdef LOW_MEM
+					m->cval.rp = save_art;
+#else
+					m->val.art = save_art;
+#endif
+					etl.nt ++;
+					goto exit_error_2;
+#endif
+					etl.nt ++;
+					atl[z].art = 0;
+#ifdef DSHARP_TOKEN_MERGE
+					need_opt_space = 0;
+#endif
+				} else {
+					if (etl.nt == 0) freemem(etl.t);
+					else if (!ttWHI(etl.t[etl.nt - 1]
+						.type)) {
+						t.type = OPT_NONE;
+						t.line = ls->line;
+						aol(etl.t, etl.nt, t,
+							TOKEN_LIST_MEMG);
+					}
+					t.type = dsharp_lexer.ctok->type;
+					t.line = ls->line;
+					if (S_TOKEN(t.type)) {
+						t.name = sdup(dsharp_lexer
+							.ctok->name);
+						throw_away(ls->gf, t.name);
+					}
+					ZAP_LINE(t);
+					aol(etl.t, etl.nt, t, TOKEN_LIST_MEMG);
+					atl[z].art = 1;
+				}
+			} else atl[z].art = 0;
+			if (
+#ifdef DSHARP_TOKEN_MERGE
+				need_opt_space &&
+#endif
+				atl[z].art < atl[z].nt && (!etl.nt
+					|| !ttWHI(etl.t[etl.nt - 1].type))) {
+				t.type = OPT_NONE;
+				t.line = ls->line;
+				aol(etl.t, etl.nt, t, TOKEN_LIST_MEMG);
+			}
+			if (ltwds || ntwds) {
+				while (atl[z].art < atl[z].nt) {
+					t = atl[z].t[atl[z].art ++];
+					t.line = ls->line;
+					ZAP_LINE(t);
+					aol(etl.t, etl.nt, t, TOKEN_LIST_MEMG);
+				}
+			} else {
+				struct token_fifo *save_tf;
+				unsigned long save_flags;
+				int ret = 0;
+
+				atl[z].art = 0;
+				save_tf = ls->output_fifo;
+				ls->output_fifo = &etl;
+				save_flags = ls->flags;
+				ls->flags |= LEXER;
+				while (atl[z].art < atl[z].nt) {
+					struct macro *nm;
+					struct token *cct;
+
+					cct = atl[z].t + (atl[z].art ++);
+					if (cct->type == NAME
+						&& cct->line >= 0
+						&& (nm = HTT_get(&macros,
+						    cct->name))
+						&& nm->nest <=
+						    (reject_nested + 1)) {
+						ret |= substitute_macro(ls,
+							nm, atl + z, 0,
+							reject_nested + 1, l);
+						continue;
+					}
+					t = *cct;
+					ZAP_LINE(t);
+					aol(etl.t, etl.nt, t, TOKEN_LIST_MEMG);
+				}
+				ls->output_fifo = save_tf;
+				ls->flags = save_flags;
+				if (ret) {
+#ifdef LOW_MEM
+					m->cval.rp = save_art;
+#else
+					m->val.art = save_art;
+#endif
+					goto exit_error_2;
+				}
+			}
+			if (!ntwds && (!etl.nt
+				|| !ttWHI(etl.t[etl.nt - 1].type))) {
+				t.type = OPT_NONE;
+				t.line = ls->line;
+				aol(etl.t, etl.nt, t, TOKEN_LIST_MEMG);
+			}
+			ltwds = 0;
+			continue;
+		}
+		/*
+		 * This code is definitely cursed.
+		 *
+		 * For the extremely brave reader who tries to understand
+		 * what is happening: ltwds is a flag meaning "last token
+		 * was double-sharp" and ntwds means "next token will be
+		 * double-sharp". The tokens are from the macro definition,
+		 * and scanned from left to right. Arguments that are
+		 * not implied into a #/## construction are macro-expanded
+		 * seperately, then included into the token stream.
+		 */
+		if (ct->type == DSHARP || ct->type == DIG_DSHARP) {
+			if (ltwds) {
+				error(ls->line, "quad sharp");
+#ifdef LOW_MEM
+				m->cval.rp = save_art;
+#else
+				m->val.art = save_art;
+#endif
+				goto exit_error_2;
+			}
+#ifdef LOW_MEM
+			if (m->cval.rp < m->cval.length
+				&& ttMWS(m->cval.t[m->cval.rp]))
+					m->cval.rp ++;
+#else
+			if (m->val.art < m->val.nt
+				&& ttMWS(m->val.t[m->val.art].type))
+					m->val.art ++;
+#endif
+			ltwds = 1;
+			continue;
+		} else if (ltwds && etl.nt != 0) {
+			if (concat_token(etl.t + (-- etl.nt), ct)) {
+				warning(ls->line, "operator '##' produced "
+					"the invalid token '%s%s'",
+					token_name(etl.t + etl.nt),
+					token_name(ct));
+#if 0
+/* obsolete */
+#ifdef LOW_MEM
+				m->cval.rp = save_art;
+#else
+				m->val.art = save_art;
+#endif
+				etl.nt ++;
+				goto exit_error_2;
+#endif
+				etl.nt ++;
+			} else {
+				if (etl.nt == 0) freemem(etl.t);
+				t.type = dsharp_lexer.ctok->type;
+				t.line = ls->line;
+				if (S_TOKEN(t.type)) {
+					t.name = sdup(dsharp_lexer.ctok->name);
+					throw_away(ls->gf, t.name);
+				}
+				ct = &t;
+			}
+		}
+		ltwds = 0;
+#ifdef LOW_MEM
+		if ((ct->type == SHARP || ct->type == DIG_SHARP)
+			&& next < m->cval.length
+			&& (m->cval.t[next] == MACROARG
+			|| (ttMWS(m->cval.t[next])
+			&& (next + 1) < m->cval.length
+			&& m->cval.t[next + 1] == MACROARG))) {
+
+			unsigned anum;
+#else
+		if ((ct->type == SHARP || ct->type == DIG_SHARP)
+			&& next < m->val.nt
+			&& (m->val.t[next].type == MACROARG
+			|| (ttMWS(m->val.t[next].type)
+			&& (next + 1) < m->val.nt
+			&& m->val.t[next + 1].type == MACROARG))) {
+#endif
+			/*
+			 * We have a # operator followed by (an optional
+			 * whitespace and) a macro argument; this means
+			 * stringification. So be it.
+			 */
+#ifdef LOW_MEM
+			if (ttMWS(m->cval.t[next])) m->cval.rp ++;
+#else
+			if (ttMWS(m->val.t[next].type)) m->val.art ++;
+#endif
+			t.type = STRING;
+#ifdef LOW_MEM
+			anum = m->cval.t[++ m->cval.rp];
+			if (anum >= 128U) anum = ((anum & 127U) << 8)
+				| (unsigned)m->cval.t[++ m->cval.rp];
+			t.name = stringify(atl + anum);
+			m->cval.rp ++;
+#else
+			t.name = stringify(atl +
+				(size_t)(m->val.t[m->val.art ++].line));
+#endif
+			throw_away(ls->gf, t.name);
+			ct = &t;
+			/*
+			 * There is no need for extra spaces here.
+			 */
+		}
+		t = *ct;
+		ZAP_LINE(t);
+		aol(etl.t, etl.nt, t, TOKEN_LIST_MEMG);
+	}
+#ifdef LOW_MEM
+	m->cval.rp = save_art;
+#else
+	m->val.art = save_art;
+#endif
+
+	/*
+	 * Now etl contains the expanded macro, to be parsed again for
+	 * further expansions -- much easier, since '#' and '##' have
+	 * already been handled.
+	 * However, we might need some input from tfi. So, we paste
+	 * the contents of tfi after etl, and we put back what was
+	 * not used.
+	 *
+	 * Some adjacent spaces are merged; only unique NONE, or sequences
+	 * OPT_NONE NONE are emitted.
+	 */
+	etl_limit = etl.nt;
+	if (tfi) {
+		save_tfi = tfi->art;
+		while (tfi->art < tfi->nt) aol(etl.t, etl.nt,
+			tfi->t[tfi->art ++], TOKEN_LIST_MEMG);
+	}
+	ltwws = 0;
+	while (etl.art < etl_limit) {
+		struct macro *nm;
+
+		ct = etl.t + (etl.art ++);
+		if (ct->type == NAME && ct->line >= 0
+			&& (nm = HTT_get(&macros, ct->name))) {
+			if (substitute_macro(ls, nm, &etl,
+				penury, reject_nested, l)) {
+				m->nest = save_nest;
+				goto exit_error_2;
+			}
+			ltwws = 0;
+			continue;
+		}
+		if (ttMWS(ct->type)) {
+			if (ltwws == 1) {
+				if (ct->type == OPT_NONE) continue;
+				ltwws = 2;
+			} else if (ltwws == 2) continue;
+			else if (ct->type == OPT_NONE) ltwws = 1;
+			else ltwws = 2;
+		} else ltwws = 0;
+		if (ct->line >= 0) ct->line = l;
+		print_token(ls, ct, reject_nested ? 0 : l);
+	}
+	if (etl.nt) freemem(etl.t);
+	if (tfi) {
+		tfi->art = save_tfi + (etl.art - etl_limit);
+	}
+
+exit_macro_1:
+	print_space(ls);
+exit_macro_2:
+	for (i = 0; i < (m->narg + m->vaarg); i ++)
+		if (atl[i].nt) freemem(atl[i].t);
+	if (m->narg > 0 || m->vaarg) freemem(atl);
+	m->nest = save_nest;
+	return 0;
+
+exit_error_2:
+	if (etl.nt) freemem(etl.t);
+exit_error_1:
+	for (i = 0; i < (m->narg + m->vaarg); i ++)
+		if (atl[i].nt) freemem(atl[i].t);
+	if (m->narg > 0 || m->vaarg) freemem(atl);
+	m->nest = save_nest;
+exit_error:
+	return 1;
+}
+
+/*
+ * print_defines() prints the already defined macros: it hands
+ * print_macro() to HTT_scan() over the macro table (presumably
+ * print_macro() is then invoked for each stored macro -- confirm
+ * against the hash table implementation).
+ */
+void print_defines(void)
+{
+	HTT_scan(&macros, print_macro);
+}
+
+/*
+ * define_macro() defines a new macro, whose definition is given in
+ * the command-line syntax: macro=def
+ * The '=def' part is optional; when it is absent, the macro receives
+ * the single NUMBER token "1" as replacement.
+ *
+ * With a definition, the first '=' is turned into a space, the
+ * terminating NUL into a newline, and the resulting text is handed to
+ * handle_define() through a temporary lexer state that inherits the
+ * flags of "ls" (plus LEXER).
+ *
+ * Without a definition, an already existing macro of that name is
+ * accepted only if its value is exactly the token "1".
+ *
+ * It returns non-zero on error.
+ */
+int define_macro(struct lexer_state *ls, char *def)
+{
+	char *text = sdup(def);
+	char *eq = strchr(text, '=');
+	int status = 0;
+
+	if (eq == text) {
+		/* "=def": there is nothing in front of the '=' */
+		error(-1, "void macro name");
+		status = 1;
+	} else if (eq) {
+		struct lexer_state lls;
+		size_t len = strlen(text) + 1;
+
+		*eq = ' ';
+		/* the terminating NUL is replaced by the end of line;
+		   the length stored in ebuf below covers it */
+		text[len - 1] = '\n';
+		init_buf_lexer_state(&lls, 0);
+		lls.flags = ls->flags | LEXER;
+		lls.input = 0;
+		lls.input_string = (unsigned char *)text;
+		lls.pbuf = 0;
+		lls.ebuf = len;
+		lls.line = -1;
+		status = handle_define(&lls);
+		free_lexer_state(&lls);
+	} else if (*text == 0) {
+		error(-1, "void macro name");
+		status = 1;
+	} else {
+		struct macro *m = HTT_get(&macros, text);
+		int clash = 0;
+
+		/* an existing definition is tolerated only when it is
+		   already the lone NUMBER token "1" */
+		if (m) {
+#ifdef LOW_MEM
+			clash = (m->cval.length != 3
+				|| m->cval.t[0] != NUMBER
+				|| strcmp((char *)(m->cval.t + 1), "1"));
+#else
+			clash = (m->val.nt != 1
+				|| m->val.t[0].type != NUMBER
+				|| strcmp(m->val.t[0].name, "1"));
+#endif
+		}
+		if (clash) {
+			error(-1, "macro %s already defined", text);
+			status = 1;
+		} else {
+#ifndef LOW_MEM
+			struct token one;
+#endif
+
+			m = new_macro();
+#ifdef LOW_MEM
+			/* compressed form: type byte, then the name "1" */
+			m->cval.length = 3;
+			m->cval.t = getmem(3);
+			m->cval.t[0] = NUMBER;
+			m->cval.t[1] = '1';
+			m->cval.t[2] = 0;
+#else
+			one.type = NUMBER;
+			one.name = sdup("1");
+			aol(m->val.t, m->val.nt, one, TOKEN_LIST_MEMG);
+#endif
+			HTT_put(&macros, m, text);
+		}
+	}
+	freemem(text);
+	return status;
+}
+
+/*
+ * undef_macro() undefines the macro whose name is given as "def";
+ * it is not an error to try to undef a macro that does not exist.
+ *
+ * It returns non-zero on error (undefinition of a special macro,
+ * void macro name). The "ls" argument is not used here.
+ */
+int undef_macro(struct lexer_state *ls, char *def)
+{
+	if (*def == 0) {
+		error(-1, "void macro name");
+		return 1;
+	}
+	/* unknown macro: nothing to do, and not an error */
+	if (!HTT_get(&macros, def)) return 0;
+	if (check_special_macro(def)) {
+		error(-1, "trying to undef special macro %s", def);
+		return 1;
+	}
+	HTT_del(&macros, def);
+	return 0;
+}
+
+/*
+ * We saw a #ifdef directive. Parse the line.
+ * return value: 1 if the macro is defined, 0 if it is not, -1 on error
+ *
+ * Leading whitespace is skipped; the first other token must be a name.
+ * The remainder of the line is always consumed, and a single warning
+ * is issued for trailing non-whitespace tokens if WARN_STANDARD is set.
+ */
+int handle_ifdef(struct lexer_state *ls)
+{
+	while (!next_token(ls)) {
+		int warn_once = 1;
+		int result;
+
+		if (ls->ctok->type == NEWLINE) break;
+		if (ttMWS(ls->ctok->type)) continue;
+
+		if (ls->ctok->type == NAME) {
+			result = HTT_get(&macros, ls->ctok->name) ? 1 : 0;
+		} else {
+			error(ls->line, "illegal macro name for #ifdef");
+			result = -1;
+		}
+
+		/* eat the rest of the directive line */
+		while (!next_token(ls) && ls->ctok->type != NEWLINE) {
+			if (!warn_once) continue;
+			if (ttWHI(ls->ctok->type)) continue;
+			if (!(ls->flags & WARN_STANDARD)) continue;
+			warning(ls->line, "trailing garbage in #ifdef");
+			warn_once = 0;
+		}
+		return result;
+	}
+	/* end of line (or of input) reached before any name */
+	error(ls->line, "unfinished #ifdef");
+	return -1;
+}
+
+/*
+ * for #undef
+ * return value: 1 on error, 0 on success. Undefining a macro that was
+ * already not defined is not an error.
+ *
+ * Errors are: a first token that is not a name, an attempt to undefine
+ * a special macro, or a line that ends before any name. On the first
+ * two, the rest of the line is skipped without further diagnostics.
+ * If emit_defines is set, a successful removal is also echoed as a
+ * "#undef" line on emit_output.
+ */
+int handle_undef(struct lexer_state *ls)
+{
+	while (!next_token(ls)) {
+		int failed = 0;
+		int warn_once = 1;
+
+		if (ls->ctok->type == NEWLINE) break;
+		if (ttMWS(ls->ctok->type)) continue;
+
+		if (ls->ctok->type != NAME) {
+			error(ls->line, "illegal macro name for #undef");
+			failed = 1;
+		} else if (HTT_get(&macros, ls->ctok->name) != 0) {
+			if (check_special_macro(ls->ctok->name)) {
+				error(ls->line,
+					"trying to undef special macro %s",
+					ls->ctok->name);
+				failed = 1;
+			} else {
+				if (emit_defines) {
+					fprintf(emit_output, "#undef %s\n",
+						ls->ctok->name);
+				}
+				HTT_del(&macros, ls->ctok->name);
+			}
+		}
+
+		if (failed) {
+			/* silently drop whatever remains on the line */
+			while (!next_token(ls) && ls->ctok->type != NEWLINE);
+			return 1;
+		}
+
+		while (!next_token(ls) && ls->ctok->type != NEWLINE) {
+			if (!warn_once) continue;
+			if (ttWHI(ls->ctok->type)) continue;
+			if (!(ls->flags & WARN_STANDARD)) continue;
+			warning(ls->line, "trailing garbage in #undef");
+			warn_once = 0;
+		}
+		return 0;
+	}
+	error(ls->line, "unfinished #undef");
+	return 1;
+}
+
+/*
+ * for #ifndef
+ * return value: 0 if the macro is defined, 1 if it is not, -1 on error.
+ *
+ * Leading whitespace is skipped; the first other token must be a name.
+ * The remainder of the line is consumed, with a single warning for
+ * trailing non-whitespace tokens if WARN_STANDARD is set.
+ *
+ * When protect_detect.state is 1, a copy of the tested name is stored
+ * in protect_detect.macro and the state moves to 2 (presumably part of
+ * the include guard detection -- confirm against the users of
+ * protect_detect).
+ */
+int handle_ifndef(struct lexer_state *ls)
+{
+	while (!next_token(ls)) {
+		int tgd = 1;
+
+		if (ls->ctok->type == NEWLINE) break;
+		if (ttMWS(ls->ctok->type)) continue;
+		if (ls->ctok->type == NAME) {
+			int x = (HTT_get(&macros, ls->ctok->name) == 0);
+
+			/*
+			 * The name must be copied now: the loop below
+			 * advances the lexer, after which ls->ctok does
+			 * not designate the macro name token anymore.
+			 */
+			if (protect_detect.state == 1) {
+				protect_detect.state = 2;
+				protect_detect.macro = sdup(ls->ctok->name);
+			}
+			while (!next_token(ls) && ls->ctok->type != NEWLINE)
+				if (tgd && !ttWHI(ls->ctok->type)
+					&& (ls->flags & WARN_STANDARD)) {
+					warning(ls->line, "trailing garbage "
+						"in #ifndef");
+					tgd = 0;
+				}
+			return x;
+		}
+		error(ls->line, "illegal macro name for #ifndef");
+		while (!next_token(ls) && ls->ctok->type != NEWLINE)
+			if (tgd && !ttWHI(ls->ctok->type)
+				&& (ls->flags & WARN_STANDARD)) {
+				warning(ls->line, "trailing garbage in "
+					"#ifndef");
+				tgd = 0;
+			}
+		return -1;
+	}
+	/* end of line (or of input) reached before any name */
+	error(ls->line, "unfinished #ifndef");
+	return -1;
+}
+
+/*
+ * erase the macro table; this does nothing if the table is not
+ * currently initialized.
+ */
+void wipe_macros(void)
+{
+	if (!macros_init_done) return;
+	HTT_kill(&macros);
+	macros_init_done = 0;
+}
+
+/*
+ * initialize the macro table: a previously initialized table is wiped
+ * first, then a new one is set up with del_macro() as second argument
+ * to HTT_init(). The special macros are added unless
+ * no_special_macros is set.
+ */
+void init_macros(void)
+{
+	wipe_macros();
+	HTT_init(&macros, del_macro);
+	macros_init_done = 1;
+	if (no_special_macros) return;
+	add_special_macros();
+}
+
+/*
+ * find a macro from its name: the result is whatever HTT_get() yields
+ * for that name in the macro table (the callers in this file treat a
+ * null result as "not defined").
+ */
+struct macro *get_macro(char *name)
+{
+	struct macro *found = HTT_get(&macros, name);
+
+	return found;
+}