# This is a shell archive. Save it in a file, remove anything before # this line, and then unpack it by entering "sh file". Note, it may # create directories; files and directories will be owned by you and # have default permissions. # # This archive contains: # # cpp5.c # cpp6.c # echo x - cpp5.c sed 's/^X//' >cpp5.c << 'END-of-cpp5.c' X/* X * C P P 5 . C X * E x p r e s s i o n E v a l u a t i o n X * X * Edit History X * 31-Aug-84 MM USENET net.sources release X * 04-Oct-84 MM __LINE__ and __FILE__ must call ungetstring() X * so they work correctly with token concatenation. X * Added string formal recognition. X * 25-Oct-84 MM "Short-circuit" evaluate #if's so that we X * don't print unnecessary error messages for X * #if !defined(FOO) && FOO != 0 && 10 / FOO ... X * 31-Oct-84 ado/MM Added token concatenation X * 6-Nov-84 MM Split from #define stuff, added sizeof stuff X * 19-Nov-84 ado #if error returns TRUE for (sigh) compatibility X */ X X#include X#include X#include "cppdef.h" X#include "cpp.h" X X/* X * Evaluate an #if expression. X */ X Xstatic char *opname[] = { /* For debug and error messages */ X"end of expression", "val", "id", X "+", "-", "*", "/", "%", X "<<", ">>", "&", "|", "^", X "==", "!=", "<", "<=", ">=", ">", X "&&", "||", "?", ":", ",", X "unary +", "unary -", "~", "!", "(", ")", "(none)", X}; X X/* X * opdope[] has the operator precedence: X * Bits X * 7 Unused (so the value is always positive) X * 6-2 Precedence (000x .. 017x) X * 1-0 Binary op. flags: X * 01 The binop flag should be set/cleared when this op is seen. X * 10 The new value of the binop flag. X * Note: Expected, New binop X * constant 0 1 Binop, end, or ) should follow constants X * End of line 1 0 End may not be preceeded by an operator X * binary 1 0 Binary op follows a value, value follows. X * unary 0 0 Unary op doesn't follow a value, value follows X * ( 0 0 Doesn't follow value, value or unop follows X * ) 1 1 Follows value. Op follows. X */ X Xstatic char opdope[OP_MAX] = { X 0001, /* End of expression */ X 0002, /* Digit */ X 0000, /* Letter (identifier) */ X 0141, 0141, 0151, 0151, 0151, /* ADD, SUB, MUL, DIV, MOD */ X 0131, 0131, 0101, 0071, 0071, /* ASL, ASR, AND, OR, XOR */ X 0111, 0111, 0121, 0121, 0121, 0121, /* EQ, NE, LT, LE, GE, GT */ X 0061, 0051, 0041, 0041, 0031, /* ANA, ORO, QUE, COL, CMA */ X/* X * Unary op's follow X */ X 0160, 0160, 0160, 0160, /* NEG, PLU, COM, NOT */ X 0170, 0013, 0023, /* LPA, RPA, END */ X}; X/* X * OP_QUE and OP_RPA have alternate precedences: X */ X#define OP_RPA_PREC 0013 X#define OP_QUE_PREC 0034 X X/* X * S_ANDOR and S_QUEST signal "short-circuit" boolean evaluation, so that X * #if FOO != 0 && 10 / FOO ... X * doesn't generate an error message. They are stored in optab.skip. X */ X#define S_ANDOR 2 X#define S_QUEST 1 X Xtypedef struct optab { X char op; /* Operator */ X char prec; /* Its precedence */ X char skip; /* Short-circuit: TRUE to skip */ X} OPTAB; Xstatic int evalue; /* Current value from evallex() */ X X#ifdef nomacargs XFILE_LOCAL int Xisbinary(op) Xregister int op; X{ X return (op >= FIRST_BINOP && op <= LAST_BINOP); X} X XFILE_LOCAL int Xisunary(op) Xregister int op; X{ X return (op >= FIRST_UNOP && op <= LAST_UNOP); X} X#else X#define isbinary(op) (op >= FIRST_BINOP && op <= LAST_BINOP) X#define isunary(op) (op >= FIRST_UNOP && op <= LAST_UNOP) X#endif X X/* X * The following definitions are used to specify basic variable sizes. X */ X X#ifndef S_CHAR X#define S_CHAR (sizeof (char)) X#endif X#ifndef S_SINT X#define S_SINT (sizeof (short int)) X#endif X#ifndef S_INT X#define S_INT (sizeof (int)) X#endif X#ifndef S_LINT X#define S_LINT (sizeof (long int)) X#endif X#ifndef S_FLOAT X#define S_FLOAT (sizeof (float)) X#endif X#ifndef S_DOUBLE X#define S_DOUBLE (sizeof (double)) X#endif X#ifndef S_PCHAR X#define S_PCHAR (sizeof (char *)) X#endif X#ifndef S_PSINT X#define S_PSINT (sizeof (short int *)) X#endif X#ifndef S_PINT X#define S_PINT (sizeof (int *)) X#endif X#ifndef S_PLINT X#define S_PLINT (sizeof (long int *)) X#endif X#ifndef S_PFLOAT X#define S_PFLOAT (sizeof (float *)) X#endif X#ifndef S_PDOUBLE X#define S_PDOUBLE (sizeof (double *)) X#endif X#ifndef S_PFPTR X#define S_PFPTR (sizeof (int (*)())) X#endif X Xtypedef struct types { X short type; /* This is the bit if */ X char *name; /* this is the token word */ X} TYPES; X Xstatic TYPES basic_types[] = { X { T_CHAR, "char", }, X { T_INT, "int", }, X { T_FLOAT, "float", }, X { T_DOUBLE, "double", }, X { T_SHORT, "short", }, X { T_LONG, "long", }, X { T_SIGNED, "signed", }, X { T_UNSIGNED, "unsigned", }, X { 0, NULL, }, /* Signal end */ X}; X X/* X * Test_table[] is used to test for illegal combinations. X */ Xstatic short test_table[] = { X T_FLOAT | T_DOUBLE | T_LONG | T_SHORT, X T_FLOAT | T_DOUBLE | T_CHAR | T_INT, X T_FLOAT | T_DOUBLE | T_SIGNED | T_UNSIGNED, X T_LONG | T_SHORT | T_CHAR, X 0 /* end marker */ X}; X X/* X * The order of this table is important -- it is also referenced by X * the command line processor to allow run-time overriding of the X * built-in size values. The order must not be changed: X * char, short, int, long, float, double (func pointer) X */ XSIZES size_table[] = { X { T_CHAR, S_CHAR, S_PCHAR }, /* char */ X { T_SHORT, S_SINT, S_PSINT }, /* short int */ X { T_INT, S_INT, S_PINT }, /* int */ X { T_LONG, S_LINT, S_PLINT }, /* long */ X { T_FLOAT, S_FLOAT, S_PFLOAT }, /* float */ X { T_DOUBLE, S_DOUBLE, S_PDOUBLE }, /* double */ X { T_FPTR, 0, S_PFPTR }, /* int (*()) */ X { 0, 0, 0 }, /* End of table */ X}; X Xint Xeval() X/* X * Evaluate an expression. Straight-forward operator precedence. X * This is called from control() on encountering an #if statement. X * It calls the following routines: X * evallex Lexical analyser -- returns the type and value of X * the next input token. X * evaleval Evaluate the current operator, given the values on X * the value stack. Returns a pointer to the (new) X * value stack. X * For compatiblity with older cpp's, this return returns 1 (TRUE) X * if a syntax error is detected. X */ X{ X register int op; /* Current operator */ X register int *valp; /* -> value vector */ X register OPTAB *opp; /* Operator stack */ X int prec; /* Op precedence */ X int binop; /* Set if binary op. needed */ X int op1; /* Operand from stack */ X int skip; /* For short-circuit testing */ X int value[NEXP]; /* Value stack */ X OPTAB opstack[NEXP]; /* Operand stack */ X extern int *evaleval(); /* Does actual evaluation */ X X valp = value; X opp = opstack; X opp->op = OP_END; /* Mark bottom of stack */ X opp->prec = opdope[OP_END]; /* And its precedence */ X opp->skip = 0; /* Not skipping now */ X binop = 0; Xagain: ; X#ifdef DEBUG_EVAL X printf("In #if at again: skip = %d, binop = %d, line is: %s", X opp->skip, binop, infile->bptr); X#endif X if ((op = evallex(opp->skip)) == OP_SUB && binop == 0) X op = OP_NEG; /* Unary minus */ X else if (op == OP_ADD && binop == 0) X op = OP_PLU; /* Unary plus */ X else if (op == OP_FAIL) X return (1); /* Error in evallex */ X#ifdef DEBUG_EVAL X printf("op = %s, opdope = %03o, binop = %d, skip = %d\n", X opname[op], opdope[op], binop, opp->skip); X#endif X if (op == DIG) { /* Value? */ X if (binop != 0) { X cerror("misplaced constant in #if", NULLST); X return (1); X } X else if (valp >= &value[NEXP-1]) { X cerror("#if value stack overflow", NULLST); X return (1); X } X else { X#ifdef DEBUG_EVAL X printf("pushing %d onto value stack[%d]\n", X evalue, valp - value); X#endif X *valp++ = evalue; X binop = 1; X } X goto again; X } X else if (op > OP_END) { X cerror("Illegal #if line", NULLST); X return (1); X } X prec = opdope[op]; X if (binop != (prec & 1)) { X cerror("Operator %s in incorrect context", opname[op]); X return (1); X } X binop = (prec & 2) >> 1; X for (;;) { X#ifdef DEBUG_EVAL X printf("op %s, prec %d., stacked op %s, prec %d, skip %d\n", X opname[op], prec, opname[opp->op], opp->prec, opp->skip); X#endif X if (prec > opp->prec) { X if (op == OP_LPA) X prec = OP_RPA_PREC; X else if (op == OP_QUE) X prec = OP_QUE_PREC; X op1 = opp->skip; /* Save skip for test */ X /* X * Push operator onto op. stack. X */ X opp++; X if (opp >= &opstack[NEXP]) { X cerror("expression stack overflow at op \"%s\"", X opname[op]); X return (1); X } X opp->op = op; X opp->prec = prec; X skip = (valp[-1] != 0); /* Short-circuit tester */ X /* X * Do the short-circuit stuff here. Short-circuiting X * stops automagically when operators are evaluated. X */ X if ((op == OP_ANA && !skip) X || (op == OP_ORO && skip)) X opp->skip = S_ANDOR; /* And/or skip starts */ X else if (op == OP_QUE) /* Start of ?: operator */ X opp->skip = (op1 & S_ANDOR) | ((!skip) ? S_QUEST : 0); X else if (op == OP_COL) { /* : inverts S_QUEST */ X opp->skip = (op1 & S_ANDOR) X | (((op1 & S_QUEST) != 0) ? 0 : S_QUEST); X } X else { /* Other ops leave */ X opp->skip = op1; /* skipping unchanged. */ X } X#ifdef DEBUG_EVAL X printf("stacking %s, valp[-1] == %d at %s", X opname[op], valp[-1], infile->bptr); X dumpstack(opstack, opp, value, valp); X#endif X goto again; X } X /* X * Pop operator from op. stack and evaluate it. X * End of stack and '(' are specials. X */ X skip = opp->skip; /* Remember skip value */ X switch ((op1 = opp->op)) { /* Look at stacked op */ X case OP_END: /* Stack end marker */ X if (op == OP_EOE) X return (valp[-1]); /* Finished ok. */ X goto again; /* Read another op. */ X X case OP_LPA: /* ( on stack */ X if (op != OP_RPA) { /* Matches ) on input */ X cerror("unbalanced paren's, op is \"%s\"", opname[op]); X return (1); X } X opp--; /* Unstack it */ X /* goto again; -- Fall through */ X X case OP_QUE: X goto again; /* Evaluate true expr. */ X X case OP_COL: /* : on stack. */ X opp--; /* Unstack : */ X if (opp->op != OP_QUE) { /* Matches ? on stack? */ X cerror("Misplaced '?' or ':', previous operator is %s", X opname[opp->op]); X return (1); X } X /* X * Evaluate op1. X */ X default: /* Others: */ X opp--; /* Unstack the operator */ X#ifdef DEBUG_EVAL X printf("Stack before evaluation of %s\n", opname[op1]); X dumpstack(opstack, opp, value, valp); X#endif X valp = evaleval(valp, op1, skip); X#ifdef DEBUG_EVAL X printf("Stack after evaluation\n"); X dumpstack(opstack, opp, value, valp); X#endif X } /* op1 switch end */ X } /* Stack unwind loop */ X} X XFILE_LOCAL int Xevallex(skip) Xint skip; /* TRUE if short-circuit evaluation */ X/* X * Return next eval operator or value. Called from eval(). It X * calls a special-purpose routines for 'char' strings and X * numeric values: X * evalchar called to evaluate 'x' X * evalnum called to evaluate numbers. X */ X{ X register int c, c1, t; X Xagain: do { /* Collect the token */ X c = skipws(); X if ((c = macroid(c)) == EOF_CHAR || c == '\n') { X unget(); X return (OP_EOE); /* End of expression */ X } X } while ((t = type[c]) == LET && catenate()); X if (t == INV) { /* Total nonsense */ X if (!skip) { X if (isascii(c) && isprint(c)) X cierror("illegal character '%c' in #if", c); X else X cierror("illegal character (%d decimal) in #if", c); X } X return (OP_FAIL); X } X else if (t == QUO) { /* ' or " */ X if (c == '\'') { /* Character constant */ X evalue = evalchar(skip); /* Somewhat messy */ X#ifdef DEBUG_EVAL X printf("evalchar returns %d.\n", evalue); X#endif X return (DIG); /* Return a value */ X } X cerror("Can't use a string in an #if", NULLST); X return (OP_FAIL); X } X else if (t == LET) { /* ID must be a macro */ X if (streq(token, "defined")) { /* Or defined name */ X c1 = c = skipws(); X if (c == '(') /* Allow defined(name) */ X c = skipws(); X if (type[c] == LET) { X evalue = (lookid(c) != NULL); X if (c1 != '(' /* Need to balance */ X || skipws() == ')') /* Did we balance? */ X return (DIG); /* Parsed ok */ X } X cerror("Bad #if ... defined() syntax", NULLST); X return (OP_FAIL); X } X else if (streq(token, "sizeof")) /* New sizeof hackery */ X return (dosizeof()); /* Gets own routine */ X /* X * The Draft ANSI C Standard says that an undefined symbol X * in an #if has the value zero. We are a bit pickier, X * warning except where the programmer was careful to write X * #if defined(foo) ? foo : 0 X */ X#ifdef VERBOSE X if (!skip) X cwarn("undefined symbol \"%s\" in #if, 0 used", token); X#endif X evalue = 0; X return (DIG); X } X else if (t == DIG) { /* Numbers are harder */ X evalue = evalnum(c); X#ifdef DEBUG_EVAL X printf("evalnum returns %d.\n", evalue); X#endif X } X else if (strchr("!=<>&|\\", c) != NULL) { X /* X * Process a possible multi-byte lexeme. X */ X c1 = cget(); /* Peek at next char */ X switch (c) { X case '!': X if (c1 == '=') X return (OP_NE); X break; X X case '=': X if (c1 != '=') { /* Can't say a=b in #if */ X unget(); X cerror("= not allowed in #if", NULLST); X return (OP_FAIL); X } X return (OP_EQ); X X case '>': X case '<': X if (c1 == c) X return ((c == '<') ? OP_ASL : OP_ASR); X else if (c1 == '=') X return ((c == '<') ? OP_LE : OP_GE); X break; X X case '|': X case '&': X if (c1 == c) X return ((c == '|') ? OP_ORO : OP_ANA); X break; X X case '\\': X if (c1 == '\n') /* Multi-line if */ X goto again; X cerror("Unexpected \\ in #if", NULLST); X return (OP_FAIL); X } X unget(); X } X return (t); X} X XFILE_LOCAL int Xdosizeof() X/* X * Process the sizeof (basic type) operation in an #if string. X * Sets evalue to the size and returns X * DIG success X * OP_FAIL bad parse or something. X */ X{ X register int c; X register TYPES *tp; X register SIZES *sizp; X register short *testp; X short typecode; X X if ((c = skipws()) != '(') X goto nogood; X /* X * Scan off the tokens. X */ X typecode = 0; X while ((c = skipws())) { X if ((c = macroid(c)) == EOF_CHAR || c == '\n') X goto nogood; /* End of line is a bug */ X else if (c == '(') { /* thing (*)() func ptr */ X if (skipws() == '*' X && skipws() == ')') { /* We found (*) */ X if (skipws() != '(') /* Let () be optional */ X unget(); X else if (skipws() != ')') X goto nogood; X typecode |= T_FPTR; /* Function pointer */ X } X else { /* Junk is a bug */ X goto nogood; X } X } X else if (type[c] != LET) /* Exit if not a type */ X break; X else if (!catenate()) { /* Maybe combine tokens */ X /* X * Look for this unexpandable token in basic_types. X * The code accepts "int long" as well as "long int" X * which is a minor bug as bugs go (and one shared with X * a lot of C compilers). X */ X for (tp = basic_types; tp->name != NULLST; tp++) { X if (streq(token, tp->name)) X break; X } X if (tp->name == NULLST) { X cerror("#if sizeof, unknown type \"%s\"", token); X return (OP_FAIL); X } X typecode |= tp->type; /* Or in the type bit */ X } X } X /* X * We are at the end of the type scan. Chew off '*' if necessary. X */ X if (c == '*') { X typecode |= T_PTR; X c = skipws(); X } X if (c == ')') { /* Last syntax check */ X for (testp = test_table; *testp != 0; testp++) { X if (!bittest(typecode & *testp)) { X cerror("#if ... sizeof: illegal type combination", NULLST); X return (OP_FAIL); X } X } X /* X * We assume that all function pointers are the same size: X * sizeof (int (*)()) == sizeof (float (*)()) X * We assume that signed and unsigned don't change the size: X * sizeof (signed int) == (sizeof unsigned int) X */ X if ((typecode & T_FPTR) != 0) /* Function pointer */ X typecode = T_FPTR | T_PTR; X else { /* Var or var * datum */ X typecode &= ~(T_SIGNED | T_UNSIGNED); X if ((typecode & (T_SHORT | T_LONG)) != 0) X typecode &= ~T_INT; X } X if ((typecode & ~T_PTR) == 0) { X cerror("#if sizeof() error, no type specified", NULLST); X return (OP_FAIL); X } X /* X * Exactly one bit (and possibly T_PTR) may be set. X */ X for (sizp = size_table; sizp->bits != 0; sizp++) { X if ((typecode & ~T_PTR) == sizp->bits) { X evalue = ((typecode & T_PTR) != 0) X ? sizp->psize : sizp->size; X return (DIG); X } X } /* We shouldn't fail */ X cierror("#if ... sizeof: bug, unknown type code 0x%x", typecode); X return (OP_FAIL); X } X Xnogood: unget(); X cerror("#if ... sizeof() syntax error", NULLST); X return (OP_FAIL); X} X XFILE_LOCAL int Xbittest(value) X/* X * TRUE if value is zero or exactly one bit is set in value. X */ X{ X#if (4096 & ~(-4096)) == 0 X return ((value & ~(-value)) == 0); X#else X /* X * Do it the hard way (for non 2's complement machines) X */ X return (value == 0 || value ^ (value - 1) == (value * 2 - 1)); X#endif X} X XFILE_LOCAL int Xevalnum(c) Xregister int c; X/* X * Expand number for #if lexical analysis. Note: evalnum recognizes X * the unsigned suffix, but only returns a signed int value. X */ X{ X register int value; X register int base; X register int c1; X X if (c != '0') X base = 10; X else if ((c = cget()) == 'x' || c == 'X') { X base = 16; X c = cget(); X } X else base = 8; X value = 0; X for (;;) { X c1 = c; X if (isascii(c) && isupper(c1)) X c1 = tolower(c1); X if (c1 >= 'a') X c1 -= ('a' - 10); X else c1 -= '0'; X if (c1 < 0 || c1 >= base) X break; X value *= base; X value += c1; X c = cget(); X } X if (c == 'u' || c == 'U') /* Unsigned nonsense */ X c = cget(); X unget(); X return (value); X} X XFILE_LOCAL int Xevalchar(skip) Xint skip; /* TRUE if short-circuit evaluation */ X/* X * Get a character constant X */ X{ X register int c; X register int value; X register int count; X X instring = TRUE; X if ((c = cget()) == '\\') { X switch ((c = cget())) { X case 'a': /* New in Standard */ X#if ('a' == '\a' || '\a' == ALERT) X value = ALERT; /* Use predefined value */ X#else X value = '\a'; /* Use compiler's value */ X#endif X break; X X case 'b': X value = '\b'; X break; X X case 'f': X value = '\f'; X break; X X case 'n': X value = '\n'; X break; X X case 'r': X value = '\r'; X break; X X case 't': X value = '\t'; X break; X X case 'v': /* New in Standard */ X#if ('v' == '\v' || '\v' == VT) X value = VT; /* Use predefined value */ X#else X value = '\v'; /* Use compiler's value */ X#endif X break; X X case 'x': /* '\xFF' */ X count = 3; X value = 0; X while ((((c = get()) >= '0' && c <= '9') X || (c >= 'a' && c <= 'f') X || (c >= 'A' && c <= 'F')) X && (--count >= 0)) { X value *= 16; X value += (c <= '9') ? (c - '0') : ((c & 0xF) + 9); X } X unget(); X break; X X default: X if (c >= '0' && c <= '7') { X count = 3; X value = 0; X while (c >= '0' && c <= '7' && --count >= 0) { X value *= 8; X value += (c - '0'); X c = get(); X } X unget(); X } X else value = c; X break; X } X } X else if (c == '\'') X value = 0; X else value = c; X /* X * We warn on multi-byte constants and try to hack X * (big|little)endian machines. X */ X#if BIG_ENDIAN X count = 0; X#endif X while ((c = get()) != '\'' && c != EOF_CHAR && c != '\n') { X if (!skip) X ciwarn("multi-byte constant '%c' isn't portable", c); X#if BIG_ENDIAN X count += BITS_CHAR; X value += (c << count); X#else X value <<= BITS_CHAR; X value += c; X#endif X } X instring = FALSE; X return (value); X} X XFILE_LOCAL int * Xevaleval(valp, op, skip) Xregister int *valp; Xint op; Xint skip; /* TRUE if short-circuit evaluation */ X/* X * Apply the argument operator to the data on the value stack. X * One or two values are popped from the value stack and the result X * is pushed onto the value stack. X * X * OP_COL is a special case. X * X * evaleval() returns the new pointer to the top of the value stack. X */ X{ X register int v1, v2; X X if (isbinary(op)) X v2 = *--valp; X v1 = *--valp; X#ifdef DEBUG_EVAL X printf("%s op %s", (isbinary(op)) ? "binary" : "unary", X opname[op]); X if (isbinary(op)) X printf(", v2 = %d.", v2); X printf(", v1 = %d.\n", v1); X#endif X switch (op) { X case OP_EOE: X break; X X case OP_ADD: X v1 += v2; X break; X X case OP_SUB: X v1 -= v2; X break; X X case OP_MUL: X v1 *= v2; X break; X X case OP_DIV: X case OP_MOD: X if (v2 == 0) { X if (!skip) { X cwarn("%s by zero in #if, zero result assumed", X (op == OP_DIV) ? "divide" : "mod"); X } X v1 = 0; X } X else if (op == OP_DIV) X v1 /= v2; X else X v1 %= v2; X break; X X case OP_ASL: X v1 <<= v2; X break; X X case OP_ASR: X v1 >>= v2; X break; X X case OP_AND: X v1 &= v2; X break; X X case OP_OR: X v1 |= v2; X break; X X case OP_XOR: X v1 ^= v2; X break; X X case OP_EQ: X v1 = (v1 == v2); X break; X X case OP_NE: X v1 = (v1 != v2); X break; X X case OP_LT: X v1 = (v1 < v2); X break; X X case OP_LE: X v1 = (v1 <= v2); X break; X X case OP_GE: X v1 = (v1 >= v2); X break; X X case OP_GT: X v1 = (v1 > v2); X break; X X case OP_ANA: X v1 = (v1 && v2); X break; X X case OP_ORO: X v1 = (v1 || v2); X break; X X case OP_COL: X /* X * v1 has the "true" value, v2 the "false" value. X * The top of the value stack has the test. X */ X v1 = (*--valp) ? v1 : v2; X break; X X case OP_NEG: X v1 = (-v1); X break; X X case OP_PLU: X break; X X case OP_COM: X v1 = ~v1; X break; X X case OP_NOT: X v1 = !v1; X break; X X default: X cierror("#if bug, operand = %d.", op); X v1 = 0; X } X *valp++ = v1; X return (valp); X} X X#ifdef DEBUG_EVAL Xdumpstack(opstack, opp, value, valp) XOPTAB opstack[NEXP]; /* Operand stack */ Xregister OPTAB *opp; /* Operator stack */ Xint value[NEXP]; /* Value stack */ Xregister int *valp; /* -> value vector */ X{ X printf("index op prec skip name -- op stack at %s", infile->bptr); X while (opp > opstack) { X printf(" [%2d] %2d %03o %d %s\n", opp - opstack, X opp->op, opp->prec, opp->skip, opname[opp->op]); X opp--; X } X while (--valp >= value) { X printf("value[%d] = %d\n", (valp - value), *valp); X } X} X#endif X END-of-cpp5.c echo x - cpp6.c sed 's/^X//' >cpp6.c << 'END-of-cpp6.c' X/* X * C P P 6 . C X * S u p p o r t R o u t i n e s X * X * Edit History X * 25-May-84 MM Added 8-bit support to type table. X * 30-May-84 ARF sharp() should output filename in quotes X * 02-Aug-84 MM Newline and #line hacking. sharp() now in cpp1.c X * 31-Aug-84 MM USENET net.sources release X * 11-Sep-84 ado/MM Keepcomments, also line number pathological X * 12-Sep-84 ado/MM bug if comment changes to space and we unget later. X * 03-Oct-84 gkr/MM Fixed scannumber bug for '.e' (as in struct.element). X * 04-Oct-84 MM Added ungetstring() for token concatenation X * 08-Oct-84 MM Yet another attack on number scanning X * 31-Oct-84 ado Parameterized $ in identifiers X * 2-Nov-84 MM Token concatenation is messier than I thought X * 6-Dec-84 MM \ is everywhere invisible. X */ X X#include X#include X#include "cppdef.h" X#include "cpp.h" X X/* X * skipnl() skips over input text to the end of the line. X * skipws() skips over "whitespace" (spaces or tabs), but X * not skip over the end of the line. It skips over X * TOK_SEP, however (though that shouldn't happen). X * scanid() reads the next token (C identifier) into token[]. X * The caller has already read the first character of X * the identifier. Unlike macroid(), the token is X * never expanded. X * macroid() reads the next token (C identifier) into token[]. X * If it is a #defined macro, it is expanded, and X * macroid() returns TRUE, otherwise, FALSE. X * catenate() Does the dirty work of token concatenation, TRUE if it did. X * scanstring() Reads a string from the input stream, calling X * a user-supplied function for each character. X * This function may be output() to write the X * string to the output file, or save() to save X * the string in the work buffer. X * scannumber() Reads a C numeric constant from the input stream, X * calling the user-supplied function for each X * character. (output() or save() as noted above.) X * save() Save one character in the work[] buffer. X * savestring() Saves a string in malloc() memory. X * getfile() Initialize a new FILEINFO structure, called when X * #include opens a new file, or a macro is to be X * expanded. X * getmem() Get a specified number of bytes from malloc memory. X * output() Write one character to stdout (calling putchar) -- X * implemented as a function so its address may be X * passed to scanstring() and scannumber(). X * lookid() Scans the next token (identifier) from the input X * stream. Looks for it in the #defined symbol table. X * Returns a pointer to the definition, if found, or NULL X * if not present. The identifier is stored in token[]. X * defnedel() Define enter/delete subroutine. Updates the X * symbol table. X * get() Read the next byte from the current input stream, X * handling end of (macro/file) input and embedded X * comments appropriately. Note that the global X * instring is -- essentially -- a parameter to get(). X * cget() Like get(), but skip over TOK_SEP. X * unget() Push last gotten character back on the input stream. X * cerror(), cwarn(), cfatal(), cierror(), ciwarn() X * These routines format an print messages to the user. X * cerror & cwarn take a format and a single string argument. X * cierror & ciwarn take a format and a single int (char) argument. X * cfatal takes a format and a single string argument. X */ X X/* X * This table must be rewritten for a non-Ascii machine. X * X * Note that several "non-visible" characters have special meaning: X * Hex 1D DEF_MAGIC -- a flag to prevent #define recursion. X * Hex 1E TOK_SEP -- a delimiter for token concatenation X * Hex 1F COM_SEP -- a zero-width whitespace for comment concatenation X */ X#if TOK_SEP != 0x1E || COM_SEP != 0x1F || DEF_MAGIC != 0x1D X << error type table isn't correct >> X#endif X X#if OK_DOLLAR X#define DOL LET X#else X#define DOL 000 X#endif X Xchar type[256] = { /* Character type codes Hex */ X END, 000, 000, 000, 000, 000, 000, 000, /* 00 */ X 000, SPA, 000, 000, 000, 000, 000, 000, /* 08 */ X 000, 000, 000, 000, 000, 000, 000, 000, /* 10 */ X 000, 000, 000, 000, 000, LET, 000, SPA, /* 18 */ X SPA,OP_NOT, QUO, 000, DOL,OP_MOD,OP_AND, QUO, /* 20 !"#$%&' */ XOP_LPA,OP_RPA,OP_MUL,OP_ADD, 000,OP_SUB, DOT,OP_DIV, /* 28 ()*+,-./ */ X DIG, DIG, DIG, DIG, DIG, DIG, DIG, DIG, /* 30 01234567 */ X DIG, DIG,OP_COL, 000, OP_LT, OP_EQ, OP_GT,OP_QUE, /* 38 89:;<=>? */ X 000, LET, LET, LET, LET, LET, LET, LET, /* 40 @ABCDEFG */ X LET, LET, LET, LET, LET, LET, LET, LET, /* 48 HIJKLMNO */ X LET, LET, LET, LET, LET, LET, LET, LET, /* 50 PQRSTUVW */ X LET, LET, LET, 000, BSH, 000,OP_XOR, LET, /* 58 XYZ[\]^_ */ X 000, LET, LET, LET, LET, LET, LET, LET, /* 60 `abcdefg */ X LET, LET, LET, LET, LET, LET, LET, LET, /* 68 hijklmno */ X LET, LET, LET, LET, LET, LET, LET, LET, /* 70 pqrstuvw */ X LET, LET, LET, 000, OP_OR, 000,OP_NOT, 000, /* 78 xyz{|}~ */ X 000, 000, 000, 000, 000, 000, 000, 000, /* 80 .. FF */ X 000, 000, 000, 000, 000, 000, 000, 000, /* 80 .. FF */ X 000, 000, 000, 000, 000, 000, 000, 000, /* 80 .. FF */ X 000, 000, 000, 000, 000, 000, 000, 000, /* 80 .. FF */ X 000, 000, 000, 000, 000, 000, 000, 000, /* 80 .. FF */ X 000, 000, 000, 000, 000, 000, 000, 000, /* 80 .. FF */ X 000, 000, 000, 000, 000, 000, 000, 000, /* 80 .. FF */ X 000, 000, 000, 000, 000, 000, 000, 000, /* 80 .. FF */ X}; X Xskipnl() X/* X * Skip to the end of the current input line. X */ X{ X register int c; X X do { /* Skip to newline */ X c = get(); X } while (c != '\n' && c != EOF_CHAR); X} X Xint Xskipws() X/* X * Skip over whitespace X */ X{ X register int c; X X do { /* Skip whitespace */ X c = get(); X#if COMMENT_INVISIBLE X } while (type[c] == SPA || c == COM_SEP); X#else X } while (type[c] == SPA); X#endif X return (c); X} X Xscanid(c) Xregister int c; /* First char of id */ X/* X * Get the next token (an id) into the token buffer. X * Note: this code is duplicated in lookid(). X * Change one, change both. X */ X{ X register char *bp; X X if (c == DEF_MAGIC) /* Eat the magic token */ X c = get(); /* undefiner. */ X bp = token; X do { X if (bp < &token[IDMAX]) /* token dim is IDMAX+1 */ X *bp++ = c; X c = get(); X } while (type[c] == LET || type[c] == DIG); X unget(); X *bp = EOS; X} X Xint Xmacroid(c) Xregister int c; X/* X * If c is a letter, scan the id. if it's #defined, expand it and scan X * the next character and try again. X * X * Else, return the character. If type[c] is a LET, the token is in token. X */ X{ X register DEFBUF *dp; X X if (infile != NULL && infile->fp != NULL) X recursion = 0; X while (type[c] == LET && (dp = lookid(c)) != NULL) { X expand(dp); X c = get(); X } X return (c); X} X Xint Xcatenate() X/* X * A token was just read (via macroid). X * If the next character is TOK_SEP, concatenate the next token X * return TRUE -- which should recall macroid after refreshing X * macroid's argument. If it is not TOK_SEP, unget() the character X * and return FALSE. X */ X{ X register int c; X register char *token1; X X#if OK_CONCAT X if (get() != TOK_SEP) { /* Token concatenation */ X unget(); X return (FALSE); X } X else { X token1 = savestring(token); /* Save first token */ X c = macroid(get()); /* Scan next token */ X switch(type[c]) { /* What was it? */ X case LET: /* An identifier, ... */ X if (strlen(token1) + strlen(token) >= NWORK) X cfatal("work buffer overflow doing %s #", token1); X sprintf(work, "%s%s", token1, token); X break; X X case DIG: /* A digit string */ X strcpy(work, token1); X workp = work + strlen(work); X do { X save(c); X } while ((c = get()) != TOK_SEP); X /* X * The trailing TOK_SEP is no longer needed. X */ X save(EOS); X break; X X default: /* An error, ... */ X if (isprint(c)) X cierror("Strange character '%c' after #", c); X else X cierror("Strange character (%d.) after #", c); X strcpy(work, token1); X unget(); X break; X } X /* X * work has the concatenated token and token1 has X * the first token (no longer needed). Unget the X * new (concatenated) token after freeing token1. X * Finally, setup to read the new token. X */ X free(token1); /* Free up memory */ X ungetstring(work); /* Unget the new thing, */ X return (TRUE); X } X#else X return (FALSE); /* Not supported */ X#endif X} X Xint Xscanstring(delim, outfun) Xregister int delim; /* ' or " */ Xint (*outfun)(); /* Output function */ X/* X * Scan off a string. Warning if terminated by newline or EOF. X * outfun() outputs the character -- to a buffer if in a macro. X * TRUE if ok, FALSE if error. X */ X{ X register int c; X X instring = TRUE; /* Don't strip comments */ X (*outfun)(delim); X while ((c = get()) != delim X && c != '\n' X && c != EOF_CHAR) { X (*outfun)(c); X if (c == '\\') X (*outfun)(get()); X } X instring = FALSE; X if (c == delim) { X (*outfun)(c); X return (TRUE); X } X else { X cerror("Unterminated string", NULLST); X unget(); X return (FALSE); X } X} X Xscannumber(c, outfun) Xregister int c; /* First char of number */ Xregister int (*outfun)(); /* Output/store func */ X/* X * Process a number. We know that c is from 0 to 9 or dot. X * Algorithm from Dave Conroy's Decus C. X */ X{ X register int radix; /* 8, 10, or 16 */ X int expseen; /* 'e' seen in floater */ X int signseen; /* '+' or '-' seen */ X int octal89; /* For bad octal test */ X int dotflag; /* TRUE if '.' was seen */ X X expseen = FALSE; /* No exponent seen yet */ X signseen = TRUE; /* No +/- allowed yet */ X octal89 = FALSE; /* No bad octal yet */ X radix = 10; /* Assume decimal */ X if ((dotflag = (c == '.')) != FALSE) { /* . something? */ X (*outfun)('.'); /* Always out the dot */ X if (type[(c = get())] != DIG) { /* If not a float numb, */ X unget(); /* Rescan strange char */ X return; /* All done for now */ X } X } /* End of float test */ X else if (c == '0') { /* Octal or hex? */ X (*outfun)(c); /* Stuff initial zero */ X radix = 8; /* Assume it's octal */ X c = get(); /* Look for an 'x' */ X if (c == 'x' || c == 'X') { /* Did we get one? */ X radix = 16; /* Remember new radix */ X (*outfun)(c); /* Stuff the 'x' */ X c = get(); /* Get next character */ X } X } X for (;;) { /* Process curr. char. */ X /* X * Note that this algorithm accepts "012e4" and "03.4" X * as legitimate floating-point numbers. X */ X if (radix != 16 && (c == 'e' || c == 'E')) { X if (expseen) /* Already saw 'E'? */ X break; /* Exit loop, bad nbr. */ X expseen = TRUE; /* Set exponent seen */ X signseen = FALSE; /* We can read '+' now */ X radix = 10; /* Decimal exponent */ X } X else if (radix != 16 && c == '.') { X if (dotflag) /* Saw dot already? */ X break; /* Exit loop, two dots */ X dotflag = TRUE; /* Remember the dot */ X radix = 10; /* Decimal fraction */ X } X else if (c == '+' || c == '-') { /* 1.0e+10 */ X if (signseen) /* Sign in wrong place? */ X break; /* Exit loop, not nbr. */ X /* signseen = TRUE; */ /* Remember we saw it */ X } X else { /* Check the digit */ X switch (c) { X case '8': case '9': /* Sometimes wrong */ X octal89 = TRUE; /* Do check later */ X case '0': case '1': case '2': case '3': X case '4': case '5': case '6': case '7': X break; /* Always ok */ X X case 'a': case 'b': case 'c': case 'd': case 'e': case 'f': X case 'A': case 'B': case 'C': case 'D': case 'E': case 'F': X if (radix == 16) /* Alpha's are ok only */ X break; /* if reading hex. */ X default: /* At number end */ X goto done; /* Break from for loop */ X } /* End of switch */ X } /* End general case */ X (*outfun)(c); /* Accept the character */ X signseen = TRUE; /* Don't read sign now */ X c = get(); /* Read another char */ X } /* End of scan loop */ X /* X * When we break out of the scan loop, c contains the first X * character (maybe) not in the number. If the number is an X * integer, allow a trailing 'L' for long and/or a trailing 'U' X * for unsigned. If not those, push the trailing character back X * on the input stream. Floating point numbers accept a trailing X * 'L' for "long double". X */ Xdone: if (dotflag || expseen) { /* Floating point? */ X if (c == 'l' || c == 'L') { X (*outfun)(c); X c = get(); /* Ungotten later */ X } X } X else { /* Else it's an integer */ X /* X * We know that dotflag and expseen are both zero, now: X * dotflag signals "saw 'L'", and X * expseen signals "saw 'U'". X */ X for (;;) { X switch (c) { X case 'l': X case 'L': X if (dotflag) X goto nomore; X dotflag = TRUE; X break; X X case 'u': X case 'U': X if (expseen) X goto nomore; X expseen = TRUE; X break; X X default: X goto nomore; X } X (*outfun)(c); /* Got 'L' or 'U'. */ X c = get(); /* Look at next, too. */ X } X } Xnomore: unget(); /* Not part of a number */ X if (octal89 && radix == 8) X cwarn("Illegal digit in octal number", NULLST); X} X Xsave(c) Xregister int c; X{ X if (workp >= &work[NWORK]) X cfatal("Work buffer overflow", NULLST); X else *workp++ = c; X} X Xchar * Xsavestring(text) Xchar *text; X/* X * Store a string into free memory. X */ X{ X register char *result; X X result = getmem(strlen(text) + 1); X strcpy(result, text); X return (result); X} X XFILEINFO * Xgetfile(bufsize, name) Xint bufsize; /* Line or define buffer size */ Xchar *name; /* File or macro name string */ X/* X * Common FILEINFO buffer initialization for a new file or macro. X */ X{ X register FILEINFO *file; X register int size; X X size = strlen(name); /* File/macro name */ X file = (FILEINFO *) getmem(sizeof (FILEINFO) + bufsize + size); X file->parent = infile; /* Chain files together */ X file->fp = NULL; /* No file yet */ X file->filename = savestring(name); /* Save file/macro name */ X file->progname = NULL; /* No #line seen yet */ X file->unrecur = 0; /* No macro fixup */ X file->bptr = file->buffer; /* Initialize line ptr */ X file->buffer[0] = EOS; /* Force first read */ X file->line = 0; /* (Not used just yet) */ X if (infile != NULL) /* If #include file */ X infile->line = line; /* Save current line */ X infile = file; /* New current file */ X line = 1; /* Note first line */ X return (file); /* All done. */ X} X Xchar * Xgetmem(size) Xint size; X/* X * Get a block of free memory. X */ X{ X register char *result; X extern char *malloc(); X X if ((result = malloc((unsigned) size)) == NULL) X cfatal("Out of memory", NULLST); X return (result); X} X X/* X * C P P S y m b o l T a b l e s X */ X X/* X * SBSIZE defines the number of hash-table slots for the symbol table. X * It must be a power of 2. X */ X#ifndef SBSIZE X#define SBSIZE 64 X#endif X#define SBMASK (SBSIZE - 1) X#if (SBSIZE ^ SBMASK) != ((SBSIZE * 2) - 1) X << error, SBSIZE must be a power of 2 >> X#endif X Xstatic DEFBUF *symtab[SBSIZE]; /* Symbol table queue headers */ X XDEFBUF * Xlookid(c) Xint c; /* First character of token */ X/* X * Look for the next token in the symbol table. Returns token in "token". X * If found, returns the table pointer; Else returns NULL. X */ X{ X register int nhash; X register DEFBUF *dp; X register char *np; X int temp; X int isrecurse; /* For #define foo foo */ X X np = token; X nhash = 0; X if ((isrecurse = (c == DEF_MAGIC))) /* If recursive macro */ X c = get(); /* hack, skip DEF_MAGIC */ X do { X if (np < &token[IDMAX]) { /* token dim is IDMAX+1 */ X *np++ = c; /* Store token byte */ X nhash += c; /* Update hash value */ X } X c = get(); /* And get another byte */ X } while (type[c] == LET || type[c] == DIG); X unget(); /* Rescan terminator */ X *np = EOS; /* Terminate token */ X if (isrecurse) /* Recursive definition */ X return (NULL); /* undefined just now */ X nhash += (np - token); /* Fix hash value */ X dp = symtab[nhash & SBMASK]; /* Starting bucket */ X while (dp != (DEFBUF *) NULL) { /* Search symbol table */ X if (dp->hash == nhash /* Fast precheck */ X && (temp = strcmp(dp->name, token)) >= 0) X break; X dp = dp->link; /* Nope, try next one */ X } X return ((temp == 0) ? dp : NULL); X} X XDEFBUF * Xdefendel(name, delete) Xchar *name; Xint delete; /* TRUE to delete a symbol */ X/* X * Enter this name in the lookup table (delete = FALSE) X * or delete this name (delete = TRUE). X * Returns a pointer to the define block (delete = FALSE) X * Returns NULL if the symbol wasn't defined (delete = TRUE). X */ X{ X register DEFBUF *dp; X register DEFBUF **prevp; X register char *np; X int nhash; X int temp; X int size; X X for (nhash = 0, np = name; *np != EOS;) X nhash += *np++; X size = (np - name); X nhash += size; X prevp = &symtab[nhash & SBMASK]; X while ((dp = *prevp) != (DEFBUF *) NULL) { X if (dp->hash == nhash X && (temp = strcmp(dp->name, name)) >= 0) { X if (temp > 0) X dp = NULL; /* Not found */ X else { X *prevp = dp->link; /* Found, unlink and */ X if (dp->repl != NULL) /* Free the replacement */ X free(dp->repl); /* if any, and then */ X free((char *) dp); /* Free the symbol */ X } X break; X } X prevp = &dp->link; X } X if (!delete) { X dp = (DEFBUF *) getmem(sizeof (DEFBUF) + size); X dp->link = *prevp; X *prevp = dp; X dp->hash = nhash; X dp->repl = NULL; X dp->nargs = 0; X strcpy(dp->name, name); X } X return (dp); X} X X#if DEBUG X Xdumpdef(why) Xchar *why; X{ X register DEFBUF *dp; X register DEFBUF **syp; X X printf("CPP symbol table dump %s\n", why); X for (syp = symtab; syp < &symtab[SBSIZE]; syp++) { X if ((dp = *syp) != (DEFBUF *) NULL) { X printf("symtab[%d]\n", (syp - symtab)); X do { X dumpadef((char *) NULL, dp); X } while ((dp = dp->link) != (DEFBUF *) NULL); X } X } X} X Xdumpadef(why, dp) Xchar *why; /* Notation */ Xregister DEFBUF *dp; X{ X register char *cp; X register int c; X X printf(" \"%s\" [%d]", dp->name, dp->nargs); X if (why != NULL) X printf(" (%s)", why); X if (dp->repl != NULL) { X printf(" => "); X for (cp = dp->repl; (c = *cp++ & 0xFF) != EOS;) { X if (c >= MAC_PARM && c <= (MAC_PARM + PAR_MAC)) X printf("<%d>", c - MAC_PARM); X else if (isprint(c) || c == '\n' || c == '\t') X putchar(c); X else if (c < ' ') X printf("<^%c>", c + '@'); X else X printf("<\\0%o>", c); X } X } X else { X printf(", no replacement."); X } X putchar('\n'); X} X#endif X X/* X * G E T X */ X Xint Xget() X/* X * Return the next character from a macro or the current file. X * Handle end of file from #include files. X */ X{ X register int c; X register FILEINFO *file; X register int popped; /* Recursion fixup */ X X popped = 0; Xget_from_file: X if ((file = infile) == NULL) X return (EOF_CHAR); Xnewline: X#if 0 X printf("get(%s), recursion %d, line %d, bptr = %d, buffer \"%s\"\n", X file->filename, recursion, line, X file->bptr - file->buffer, file->buffer); X#endif X /* X * Read a character from the current input line or macro. X * At EOS, either finish the current macro (freeing temp. X * storage) or read another line from the current input file. X * At EOF, exit the current file (#include) or, at EOF from X * the cpp input file, return EOF_CHAR to finish processing. X */ X if ((c = *file->bptr++ & 0xFF) == EOS) { X /* X * Nothing in current line or macro. Get next line (if X * input from a file), or do end of file/macro processing. X * In the latter case, jump back to restart from the top. X */ X if (file->fp == NULL) { /* NULL if macro */ X popped++; X recursion -= file->unrecur; X if (recursion < 0) X recursion = 0; X infile = file->parent; /* Unwind file chain */ X } X else { /* Else get from a file */ X if ((file->bptr = fgets(file->buffer, NBUFF, file->fp)) X != NULL) { X#if DEBUG X if (debug > 1) { /* Dump it to stdout */ X printf("\n#line %d (%s), %s", X line, file->filename, file->buffer); X } X#endif X goto newline; /* process the line */ X } X else { X fclose(file->fp); /* Close finished file */ X if ((infile = file->parent) != NULL) { X /* X * There is an "ungotten" newline in the current X * infile buffer (set there by doinclude() in X * cpp1.c). Thus, we know that the mainline code X * is skipping over blank lines and will do a X * #line at its convenience. X */ X wrongline = TRUE; /* Need a #line now */ X } X } X } X /* X * Free up space used by the (finished) file or macro and X * restart input from the parent file/macro, if any. X */ X free(file->filename); /* Free name and */ X if (file->progname != NULL) /* if a #line was seen, */ X free(file->progname); /* free it, too. */ X free((char *) file); /* Free file space */ X if (infile == NULL) /* If at end of file */ X return (EOF_CHAR); /* Return end of file */ X line = infile->line; /* Reset line number */ X goto get_from_file; /* Get from the top. */ X } X /* X * Common processing for the new character. X */ X if (c == DEF_MAGIC && file->fp != NULL) /* Don't allow delete */ X goto newline; /* from a file */ X if (file->parent != NULL) { /* Macro or #include */ X if (popped != 0) X file->parent->unrecur += popped; X else { X recursion -= file->parent->unrecur; X if (recursion < 0) X recursion = 0; X file->parent->unrecur = 0; X } X } X if (c == '\n') /* Maintain current */ X ++line; /* line counter */ X if (instring) /* Strings just return */ X return (c); /* the character. */ X else if (c == '/') { /* Comment? */ X instring = TRUE; /* So get() won't loop */ X if ((c = get()) != '*') { /* Next byte '*'? */ X instring = FALSE; /* Nope, no comment */ X unget(); /* Push the char. back */ X return ('/'); /* Return the slash */ X } X if (keepcomments) { /* If writing comments */ X putchar('/'); /* Write out the */ X putchar('*'); /* initializer */ X } X for (;;) { /* Eat a comment */ X c = get(); Xtest: if (keepcomments && c != EOF_CHAR) X cput(c); X switch (c) { X case EOF_CHAR: X cerror("EOF in comment", NULLST); X return (EOF_CHAR); X X case '/': X if ((c = get()) != '*') /* Don't let comments */ X goto test; /* Nest. */ X#ifdef VERBOSE X cwarn("Nested comments", NULLST); X#endif X /* Fall into * stuff */ X case '*': X if ((c = get()) != '/') /* If comment doesn't */ X goto test; /* end, look at next */ X instring = FALSE; /* End of comment, */ X if (keepcomments) { /* Put out the comment */ X cput(c); /* terminator, too */ X } X /* X * A comment is syntactically "whitespace" -- X * however, there are certain strange sequences X * such as X * #define foo(x) (something) X * foo|* comment *|(123) X * these are '/' ^ ^ X * where just returning space (or COM_SEP) will cause X * problems. This can be "fixed" by overwriting the X * '/' in the input line buffer with ' ' (or COM_SEP) X * but that may mess up an error message. X * So, we peek ahead -- if the next character is X * "whitespace" we just get another character, if not, X * we modify the buffer. All in the name of purity. X */ X if (*file->bptr == '\n' X || type[*file->bptr & 0xFF] == SPA) X goto newline; X#if COMMENT_INVISIBLE X /* X * Return magic (old-fashioned) syntactic space. X */ X return ((file->bptr[-1] = COM_SEP)); X#else X return ((file->bptr[-1] = ' ')); X#endif X X case '\n': /* we'll need a #line */ X if (!keepcomments) X wrongline = TRUE; /* later... */ X default: /* Anything else is */ X break; /* Just a character */ X } /* End switch */ X } /* End comment loop */ X } /* End if in comment */ X else if (!inmacro && c == '\\') { /* If backslash, peek */ X if ((c = get()) == '\n') { /* for a . If so, */ X wrongline = TRUE; X goto newline; X } X else { /* Backslash anything */ X unget(); /* Get it later */ X return ('\\'); /* Return the backslash */ X } X } X else if (c == '\f' || c == VT) /* Form Feed, Vertical */ X c = ' '; /* Tab are whitespace */ X return (c); /* Just return the char */ X} X Xunget() X/* X * Backup the pointer to reread the last character. Fatal error X * (code bug) if we backup too far. unget() may be called, X * without problems, at end of file. Only one character may X * be ungotten. If you need to unget more, call ungetstring(). X */ X{ X register FILEINFO *file; X X if ((file = infile) == NULL) X return; /* Unget after EOF */ X if (--file->bptr < file->buffer) X cfatal("Too much pushback", NULLST); X if (*file->bptr == '\n') /* Ungetting a newline? */ X --line; /* Unget the line number, too */ X} X Xungetstring(text) Xchar *text; X/* X * Push a string back on the input stream. This is done by treating X * the text as if it were a macro. X */ X{ X register FILEINFO *file; X extern FILEINFO *getfile(); X X file = getfile(strlen(text) + 1, ""); X strcpy(file->buffer, text); X} X Xint Xcget() X/* X * Get one character, absorb "funny space" after comments or X * token concatenation X */ X{ X register int c; X X do { X c = get(); X#if COMMENT_INVISIBLE X } while (c == TOK_SEP || c == COM_SEP); X#else X } while (c == TOK_SEP); X#endif X return (c); X} X X/* X * Error messages and other hacks. The first byte of severity X * is 'S' for string arguments and 'I' for int arguments. This X * is needed for portability with machines that have int's that X * are shorter than char *'s. X */ X Xstatic Xdomsg(severity, format, arg) Xchar *severity; /* "Error", "Warning", "Fatal" */ Xchar *format; /* Format for the error message */ Xchar *arg; /* Something for the message */ X/* X * Print filenames, macro names, and line numbers for error messages. X */ X{ X register char *tp; X register FILEINFO *file; X X fprintf(stderr, "%sline %d, %s: ", MSG_PREFIX, line, &severity[1]); X if (*severity == 'S') X fprintf(stderr, format, arg); X else X fprintf(stderr, format, (int) arg); X putc('\n', stderr); X if ((file = infile) == NULL) X return; /* At end of file */ X if (file->fp != NULL) { X tp = file->buffer; /* Print current file */ X fprintf(stderr, "%s", tp); /* name, making sure */ X if (tp[strlen(tp) - 1] != '\n') /* there's a newline */ X putc('\n', stderr); X } X while ((file = file->parent) != NULL) { /* Print #includes, too */ X if (file->fp == NULL) X fprintf(stderr, "from macro %s\n", file->filename); X else { X tp = file->buffer; X fprintf(stderr, "from file %s, line %d:\n%s", X (file->progname != NULL) X ? file->progname : file->filename, X file->line, tp); X if (tp[strlen(tp) - 1] != '\n') X putc('\n', stderr); X } X } X} X Xcerror(format, sarg) Xchar *format; Xchar *sarg; /* Single string argument */ X/* X * Print a normal error message, string argument. X */ X{ X domsg("SError", format, sarg); X errors++; X} X Xcierror(format, narg) Xchar *format; Xint narg; /* Single numeric argument */ X/* X * Print a normal error message, numeric argument. X */ X{ X domsg("IError", format, (char *) narg); X errors++; X} X Xcfatal(format, sarg) Xchar *format; Xchar *sarg; /* Single string argument */ X/* X * A real disaster X */ X{ X domsg("SFatal error", format, sarg); X exit(IO_ERROR); X} X Xcwarn(format, sarg) Xchar *format; Xchar *sarg; /* Single string argument */ X/* X * A non-fatal error, string argument. X */ X{ X domsg("SWarning", format, sarg); X} X Xciwarn(format, narg) Xchar *format; Xint narg; /* Single numeric argument */ X/* X * A non-fatal error, numeric argument. X */ X{ X domsg("IWarning", format, (char *) narg); X} X X X END-of-cpp6.c exit