7a77d77eff
...so the following strcpy does not cause a false abort under _FORTIFY_SOURCE=2 Change-Id: I395136f11020064766db76f87ed8f5b01c083c3a Reviewed-on: https://gerrit.libreoffice.org/18681 Tested-by: Jenkins <ci@libreoffice.org> Reviewed-by: Stephan Bergmann <sbergman@redhat.com>
1135 lines
37 KiB
C
1135 lines
37 KiB
C
/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
|
|
/*
|
|
* This file is part of the LibreOffice project.
|
|
*
|
|
* This Source Code Form is subject to the terms of the Mozilla Public
|
|
* License, v. 2.0. If a copy of the MPL was not distributed with this
|
|
* file, You can obtain one at http://mozilla.org/MPL/2.0/.
|
|
*
|
|
* This file incorporates work covered by the following license notice:
|
|
*
|
|
* Licensed to the Apache Software Foundation (ASF) under one or more
|
|
* contributor license agreements. See the NOTICE file distributed
|
|
* with this work for additional information regarding copyright
|
|
* ownership. The ASF licenses this file to you under the Apache
|
|
* License, Version 2.0 (the "License"); you may not use this file
|
|
* except in compliance with the License. You may obtain a copy of
|
|
* the License at http://www.apache.org/licenses/LICENSE-2.0 .
|
|
*/
|
|
|
|
#include <sal/types.h>
|
|
#include <stdio.h>
|
|
#include <ctype.h>
|
|
#include <string.h>
|
|
#include "cppdef.h"
|
|
#include "cpp.h"
|
|
|
|
/*ER evaluate macros to pDefOut */
|
|
|
|
/*
|
|
* skipnl() skips over input text to the end of the line.
|
|
* skipws() skips over "whitespace" (spaces or tabs), but
|
|
* not skip over the end of the line. It skips over
|
|
* TOK_SEP, however (though that shouldn't happen).
|
|
* scanid() reads the next token (C identifier) into token[].
|
|
* The caller has already read the first character of
|
|
* the identifier. Unlike macroid(), the token is
|
|
* never expanded.
|
|
* macroid() reads the next token (C identifier) into token[].
|
|
* If it is a #defined macro, it is expanded, and
|
|
* macroid() returns TRUE, otherwise, FALSE.
|
|
* catenate() Does the dirty work of token concatenation, TRUE if it did.
|
|
* scanstring() Reads a string from the input stream, calling
|
|
* a user-supplied function for each character.
|
|
* This function may be output() to write the
|
|
* string to the output file, or save() to save
|
|
* the string in the work buffer.
|
|
* scannumber() Reads a C numeric constant from the input stream,
|
|
* calling the user-supplied function for each
|
|
* character. (output() or save() as noted above.)
|
|
* save() Save one character in the work[] buffer.
|
|
* savestring() Saves a string in malloc() memory.
|
|
* getfile() Initialize a new FILEINFO structure, called when
|
|
* #include opens a new file, or a macro is to be
|
|
* expanded.
|
|
* getmem() Get a specified number of bytes from malloc memory.
|
|
* output() Write one character to stdout (calling PUTCHAR) --
|
|
* implemented as a function so its address may be
|
|
* passed to scanstring() and scannumber().
|
|
* lookid() Scans the next token (identifier) from the input
|
|
* stream. Looks for it in the #defined symbol table.
|
|
* Returns a pointer to the definition, if found, or NULL
|
|
* if not present. The identifier is stored in token[].
|
|
* defnedel() Define enter/delete subroutine. Updates the
|
|
* symbol table.
|
|
* get() Read the next byte from the current input stream,
|
|
* handling end of (macro/file) input and embedded
|
|
* comments appropriately. Note that the global
|
|
* instring is -- essentially -- a parameter to get().
|
|
* cget() Like get(), but skip over TOK_SEP.
|
|
* unget() Push last gotten character back on the input stream.
|
|
* cerror(), cwarn(), cfatal(), cierror(), ciwarn()
|
|
* These routines format an print messages to the user.
|
|
* cerror & cwarn take a format and a single string argument.
|
|
* cierror & ciwarn take a format and a single int (char) argument.
|
|
* cfatal takes a format and a single string argument.
|
|
*/
|
|
|
|
/*
|
|
* This table must be rewritten for a non-Ascii machine.
|
|
*
|
|
* Note that several "non-visible" characters have special meaning:
|
|
* Hex 1D DEF_MAGIC -- a flag to prevent #define recursion.
|
|
* Hex 1E TOK_SEP -- a delimiter for token concatenation
|
|
* Hex 1F COM_SEP -- a zero-width whitespace for comment concatenation
|
|
*/
|
|
#if TOK_SEP != 0x1E || COM_SEP != 0x1F || DEF_MAGIC != 0x1D
|
|
<< error type table is not correct >>
|
|
#endif
|
|
|
|
#define DOL LET
|
|
|
|
|
|
char type[256] = { /* Character type codes Hex */
|
|
END, 000, 000, 000, 000, 000, 000, 000, /* 00 */
|
|
000, SPA, 000, 000, 000, 000, 000, 000, /* 08 */
|
|
000, 000, 000, 000, 000, 000, 000, 000, /* 10 */
|
|
000, 000, 000, 000, 000, LET, 000, SPA, /* 18 */
|
|
SPA,OP_NOT, QUO, 000, DOL,OP_MOD,OP_AND, QUO, /* 20 !"#$%&' */
|
|
OP_LPA,OP_RPA,OP_MUL,OP_ADD, 000,OP_SUB, DOT,OP_DIV, /* 28 ()*+,-./ */
|
|
DIG, DIG, DIG, DIG, DIG, DIG, DIG, DIG, /* 30 01234567 */
|
|
DIG, DIG,OP_COL, 000, OP_LT, OP_EQ, OP_GT,OP_QUE, /* 38 89:;<=>? */
|
|
000, LET, LET, LET, LET, LET, LET, LET, /* 40 @ABCDEFG */
|
|
LET, LET, LET, LET, LET, LET, LET, LET, /* 48 HIJKLMNO */
|
|
LET, LET, LET, LET, LET, LET, LET, LET, /* 50 PQRSTUVW */
|
|
LET, LET, LET, 000, BSH, 000,OP_XOR, LET, /* 58 XYZ[\]^_ */
|
|
000, LET, LET, LET, LET, LET, LET, LET, /* 60 `abcdefg */
|
|
LET, LET, LET, LET, LET, LET, LET, LET, /* 68 hijklmno */
|
|
LET, LET, LET, LET, LET, LET, LET, LET, /* 70 pqrstuvw */
|
|
LET, LET, LET, 000, OP_OR, 000,OP_NOT, 000, /* 78 xyz{|}~ */
|
|
000, 000, 000, 000, 000, 000, 000, 000, /* 80 .. FF */
|
|
000, 000, 000, 000, 000, 000, 000, 000, /* 80 .. FF */
|
|
000, 000, 000, 000, 000, 000, 000, 000, /* 80 .. FF */
|
|
000, 000, 000, 000, 000, 000, 000, 000, /* 80 .. FF */
|
|
000, 000, 000, 000, 000, 000, 000, 000, /* 80 .. FF */
|
|
000, 000, 000, 000, 000, 000, 000, 000, /* 80 .. FF */
|
|
000, 000, 000, 000, 000, 000, 000, 000, /* 80 .. FF */
|
|
000, 000, 000, 000, 000, 000, 000, 000, /* 80 .. FF */
|
|
};
|
|
|
|
|
|
/*
|
|
* C P P S y m b o l T a b l e s
|
|
*/
|
|
|
|
/*
|
|
* SBSIZE defines the number of hash-table slots for the symbol table.
|
|
* It must be a power of 2.
|
|
*/
|
|
#ifndef SBSIZE
|
|
#define SBSIZE 64
|
|
#endif
|
|
#define SBMASK (SBSIZE - 1)
|
|
#if (SBSIZE ^ SBMASK) != ((SBSIZE * 2) - 1)
|
|
<< error, SBSIZE must be a power of 2 >>
|
|
#endif
|
|
|
|
|
|
static DEFBUF *symtab[SBSIZE]; /* Symbol table queue headers */
|
|
|
|
void InitCpp6()
|
|
{
|
|
int i;
|
|
for( i = 0; i < SBSIZE; i++ )
|
|
symtab[ i ] = NULL;
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
* Skip to the end of the current input line.
|
|
*/
|
|
void skipnl()
|
|
{
|
|
int c;
|
|
|
|
do
|
|
{ /* Skip to newline */
|
|
c = get();
|
|
}
|
|
while (c != '\n' && c != EOF_CHAR);
|
|
}
|
|
|
|
/*
|
|
* Skip over whitespace
|
|
*/
|
|
int skipws()
|
|
{
|
|
int c;
|
|
|
|
do { /* Skip whitespace */
|
|
c = get();
|
|
} while (type[c] == SPA);
|
|
return c;
|
|
}
|
|
|
|
/*
|
|
* Get the next token (an id) into the token buffer.
|
|
* Note: this code is duplicated in lookid().
|
|
* Change one, change both.
|
|
*/
|
|
void scanid(int c)
|
|
{
|
|
char* bp;
|
|
|
|
if (c == DEF_MAGIC) /* Eat the magic token */
|
|
c = get(); /* undefiner. */
|
|
bp = token;
|
|
do
|
|
{
|
|
if (bp < &token[IDMAX]) /* token dim is IDMAX+1 */
|
|
*bp++ = (char)c;
|
|
c = get();
|
|
}
|
|
while (type[c] == LET || type[c] == DIG);
|
|
unget();
|
|
*bp = EOS;
|
|
}
|
|
|
|
/*
|
|
* If c is a letter, scan the id. if it's #defined, expand it and scan
|
|
* the next character and try again.
|
|
*
|
|
* Else, return the character. If type[c] is a LET, the token is in token.
|
|
*/
|
|
int macroid(int c)
|
|
{
|
|
DEFBUF* dp;
|
|
|
|
if (infile != NULL && infile->fp != NULL)
|
|
recursion = 0;
|
|
while (type[c] == LET && (dp = lookid(c)) != NULL)
|
|
{
|
|
expand(dp);
|
|
c = get();
|
|
}
|
|
return c;
|
|
}
|
|
|
|
/*
|
|
* A token was just read (via macroid).
|
|
* If the next character is TOK_SEP, concatenate the next token
|
|
* return TRUE -- which should recall macroid after refreshing
|
|
* macroid's argument. If it is not TOK_SEP, unget() the character
|
|
* and return FALSE.
|
|
*/
|
|
int catenate()
|
|
{
|
|
int c;
|
|
char* token1;
|
|
|
|
if (get() != TOK_SEP) /* Token concatenation */
|
|
{
|
|
unget();
|
|
return FALSE;
|
|
}
|
|
else
|
|
{
|
|
token1 = savestring(token); /* Save first token */
|
|
c = macroid(get()); /* Scan next token */
|
|
switch(type[c]) /* What was it? */
|
|
{
|
|
case LET: /* An identifier, ... */
|
|
if (strlen(token1) + strlen(token) >= NWORK)
|
|
cfatal("work buffer overflow doing %s #", token1);
|
|
sprintf(work, "%s%s", token1, token);
|
|
break;
|
|
|
|
case DIG: /* A digit string */
|
|
strcpy(work, token1);
|
|
workp = work + strlen(work);
|
|
do
|
|
{
|
|
save(c);
|
|
}
|
|
while ((c = get()) != TOK_SEP);
|
|
/*
|
|
* The trailing TOK_SEP is no longer needed.
|
|
*/
|
|
save(EOS);
|
|
break;
|
|
|
|
default: /* An error, ... */
|
|
if (isprint(c))
|
|
cierror("Strange character '%c' after #", c);
|
|
else
|
|
cierror("Strange character (%d.) after #", c);
|
|
strcpy(work, token1);
|
|
unget();
|
|
break;
|
|
}
|
|
/*
|
|
* work has the concatenated token and token1 has
|
|
* the first token (no longer needed). Unget the
|
|
* new (concatenated) token after freeing token1.
|
|
* Finally, setup to read the new token.
|
|
*/
|
|
free(token1); /* Free up memory */
|
|
ungetstring(work); /* Unget the new thing, */
|
|
return TRUE;
|
|
}
|
|
}
|
|
|
|
/*
|
|
* Scan off a string. Warning if terminated by newline or EOF.
|
|
* outfun() outputs the character -- to a buffer if in a macro.
|
|
* TRUE if ok, FALSE if error.
|
|
*/
|
|
int scanstring(int delim,
|
|
#ifndef _NO_PROTO
|
|
void (*outfun)( int ) /* BP */ /* Output function */
|
|
#else
|
|
void (*outfun)() /* BP */
|
|
#endif
|
|
)
|
|
{
|
|
int c;
|
|
|
|
instring = TRUE; /* Don't strip comments */
|
|
(*outfun)(delim);
|
|
while ((c = get()) != delim &&
|
|
c != '\n' &&
|
|
c != EOF_CHAR)
|
|
{
|
|
if (c != DEF_MAGIC)
|
|
(*outfun)(c);
|
|
if (c == '\\')
|
|
(*outfun)(get());
|
|
}
|
|
instring = FALSE;
|
|
if (c == delim)
|
|
{
|
|
(*outfun)(c);
|
|
return TRUE;
|
|
}
|
|
else
|
|
{
|
|
cerror("Unterminated string", NULLST);
|
|
unget();
|
|
return FALSE;
|
|
}
|
|
}
|
|
|
|
/*
|
|
* Process a number. We know that c is from 0 to 9 or dot.
|
|
* Algorithm from Dave Conroy's Decus C.
|
|
*/
|
|
void scannumber(int c,
|
|
#ifndef _NO_PROTO
|
|
void (*outfun)( int ) /* BP */ /* Output/store func */
|
|
#else
|
|
void (*outfun)() /* BP */
|
|
#endif
|
|
)
|
|
{
|
|
int radix; /* 8, 10, or 16 */
|
|
int expseen; /* 'e' seen in floater */
|
|
int signseen; /* '+' or '-' seen */
|
|
int octal89; /* For bad octal test */
|
|
int dotflag; /* TRUE if '.' was seen */
|
|
|
|
expseen = FALSE; /* No exponent seen yet */
|
|
signseen = TRUE; /* No +/- allowed yet */
|
|
octal89 = FALSE; /* No bad octal yet */
|
|
radix = 10; /* Assume decimal */
|
|
if ((dotflag = (c == '.')) != FALSE) /* . something? */
|
|
{
|
|
(*outfun)('.'); /* Always out the dot */
|
|
if (type[(c = get())] != DIG) /* If not a float numb, */
|
|
{
|
|
unget(); /* Rescan strange char */
|
|
return; /* All done for now */
|
|
}
|
|
} /* End of float test */
|
|
else if (c == '0') /* Octal or hex? */
|
|
{
|
|
(*outfun)(c); /* Stuff initial zero */
|
|
radix = 8; /* Assume it's octal */
|
|
c = get(); /* Look for an 'x' */
|
|
if (c == 'x' || c == 'X') /* Did we get one? */
|
|
{
|
|
radix = 16; /* Remember new radix */
|
|
(*outfun)(c); /* Stuff the 'x' */
|
|
c = get(); /* Get next character */
|
|
}
|
|
}
|
|
for (;;) /* Process curr. char. */
|
|
{
|
|
/*
|
|
* Note that this algorithm accepts "012e4" and "03.4"
|
|
* as legitimate floating-point numbers.
|
|
*/
|
|
if (radix != 16 && (c == 'e' || c == 'E'))
|
|
{
|
|
if (expseen) /* Already saw 'E'? */
|
|
break; /* Exit loop, bad nbr. */
|
|
expseen = TRUE; /* Set exponent seen */
|
|
signseen = FALSE; /* We can read '+' now */
|
|
radix = 10; /* Decimal exponent */
|
|
}
|
|
else if (radix != 16 && c == '.')
|
|
{
|
|
if (dotflag) /* Saw dot already? */
|
|
break; /* Exit loop, two dots */
|
|
dotflag = TRUE; /* Remember the dot */
|
|
radix = 10; /* Decimal fraction */
|
|
}
|
|
else if (c == '+' || c == '-') /* 1.0e+10 */
|
|
{
|
|
if (signseen) /* Sign in wrong place? */
|
|
break; /* Exit loop, not nbr. */
|
|
/* signseen = TRUE; */ /* Remember we saw it */
|
|
}
|
|
else /* Check the digit */
|
|
{
|
|
switch (c)
|
|
{
|
|
case '8': case '9': /* Sometimes wrong */
|
|
octal89 = TRUE; /* Do check later */
|
|
case '0': case '1': case '2': case '3':
|
|
case '4': case '5': case '6': case '7':
|
|
break; /* Always ok */
|
|
|
|
case 'a': case 'b': case 'c': case 'd': case 'e': case 'f':
|
|
case 'A': case 'B': case 'C': case 'D': case 'E': case 'F':
|
|
if (radix == 16) /* Alpha's are ok only */
|
|
break; /* if reading hex. */
|
|
default: /* At number end */
|
|
goto done; /* Break from for loop */
|
|
} /* End of switch */
|
|
} /* End general case */
|
|
(*outfun)(c); /* Accept the character */
|
|
signseen = TRUE; /* Don't read sign now */
|
|
c = get(); /* Read another char */
|
|
} /* End of scan loop */
|
|
/*
|
|
* When we break out of the scan loop, c contains the first
|
|
* character (maybe) not in the number. If the number is an
|
|
* integer, allow a trailing 'L' for long and/or a trailing 'U'
|
|
* for unsigned. If not those, push the trailing character back
|
|
* on the input stream. Floating point numbers accept a trailing
|
|
* 'L' for "long double".
|
|
*/
|
|
done:
|
|
if (dotflag || expseen) /* Floating point? */
|
|
{
|
|
if (c == 'l' || c == 'L')
|
|
{
|
|
(*outfun)(c);
|
|
get(); /* Ungotten later */
|
|
}
|
|
}
|
|
else /* Else it's an integer */
|
|
{
|
|
/*
|
|
* We know that dotflag and expseen are both zero, now:
|
|
* dotflag signals "saw 'L'", and
|
|
* expseen signals "saw 'U'".
|
|
*/
|
|
for (;;)
|
|
{
|
|
switch (c)
|
|
{
|
|
case 'l':
|
|
case 'L':
|
|
if (dotflag)
|
|
goto nomore;
|
|
dotflag = TRUE;
|
|
break;
|
|
|
|
case 'u':
|
|
case 'U':
|
|
if (expseen)
|
|
goto nomore;
|
|
expseen = TRUE;
|
|
break;
|
|
|
|
default:
|
|
goto nomore;
|
|
}
|
|
(*outfun)(c); /* Got 'L' or 'U'. */
|
|
c = get(); /* Look at next, too. */
|
|
}
|
|
}
|
|
nomore:
|
|
unget(); /* Not part of a number */
|
|
if (octal89 && radix == 8)
|
|
cwarn("Illegal digit in octal number", NULLST);
|
|
}
|
|
|
|
void save(int c)
|
|
{
|
|
if (workp >= &work[NWORK])
|
|
{
|
|
work[NWORK-1] = '\0';
|
|
cfatal("Work buffer overflow: %s", work);
|
|
}
|
|
else
|
|
*workp++ = (char)c;
|
|
}
|
|
|
|
/*
|
|
* Store a string into free memory.
|
|
*/
|
|
char* savestring(char* text)
|
|
{
|
|
char* result;
|
|
|
|
size_t size = strlen(text) + 1;
|
|
result = getmem(size);
|
|
strcpy(result, text);
|
|
return result;
|
|
}
|
|
|
|
/*
|
|
* Common FILEINFO buffer initialization for a new file or macro.
|
|
*/
|
|
FILEINFO* getfile(size_t bufsize, char* name)
|
|
{
|
|
FILEINFO* file;
|
|
size_t size;
|
|
|
|
size = strlen(name); /* File/macro name */
|
|
file = (FILEINFO*) getmem(sizeof (FILEINFO) + bufsize + size);
|
|
file->parent = infile; /* Chain files together */
|
|
file->fp = NULL; /* No file yet */
|
|
file->filename = savestring(name); /* Save file/macro name */
|
|
file->progname = NULL; /* No #line seen yet */
|
|
file->unrecur = 0; /* No macro fixup */
|
|
file->bptr = file->buffer; /* Initialize line ptr */
|
|
file->buffer[0] = EOS; /* Force first read */
|
|
file->line = 0; /* (Not used just yet) */
|
|
if (infile != NULL) /* If #include file */
|
|
infile->line = line; /* Save current line */
|
|
infile = file; /* New current file */
|
|
line = 1; /* Note first line */
|
|
return file; /* All done. */
|
|
}
|
|
|
|
/*
|
|
* Get a block of free memory.
|
|
*/
|
|
char* getmem(size_t size)
|
|
{
|
|
char* result;
|
|
|
|
if ((result = malloc((unsigned) size)) == NULL)
|
|
cfatal("Out of memory", NULLST);
|
|
return result;
|
|
}
|
|
|
|
/*
|
|
* Look for the next token in the symbol table. Returns token in "token".
|
|
* If found, returns the table pointer; Else returns NULL.
|
|
*/
|
|
DEFBUF* lookid(int c)
|
|
{
|
|
int nhash;
|
|
DEFBUF* dp;
|
|
char* np;
|
|
int temp = 0;
|
|
int isrecurse; /* For #define foo foo */
|
|
|
|
np = token;
|
|
nhash = 0;
|
|
if (0 != (isrecurse = (c == DEF_MAGIC)))/* If recursive macro */
|
|
c = get(); /* hack, skip DEF_MAGIC */
|
|
do
|
|
{
|
|
if (np < &token[IDMAX]) /* token dim is IDMAX+1 */
|
|
{
|
|
*np++ = (char)c; /* Store token byte */
|
|
nhash += c; /* Update hash value */
|
|
}
|
|
c = get(); /* And get another byte */
|
|
}
|
|
while (type[c] == LET || type[c] == DIG);
|
|
unget(); /* Rescan terminator */
|
|
*np = EOS; /* Terminate token */
|
|
if (isrecurse) /* Recursive definition */
|
|
return NULL; /* undefined just now */
|
|
nhash += (np - token); /* Fix hash value */
|
|
dp = symtab[nhash & SBMASK]; /* Starting bucket */
|
|
while (dp != (DEFBUF*) NULL) /* Search symbol table */
|
|
{
|
|
if (dp->hash == nhash && /* Fast precheck */
|
|
(temp = strcmp(dp->name, token)) >= 0)
|
|
{
|
|
break;
|
|
}
|
|
dp = dp->link; /* Nope, try next one */
|
|
}
|
|
return ((temp == 0) ? dp : NULL);
|
|
}
|
|
|
|
/*
|
|
* Enter this name in the lookup table (delete = FALSE)
|
|
* or delete this name (delete = TRUE).
|
|
* Returns a pointer to the define block (delete = FALSE)
|
|
* Returns NULL if the symbol wasn't defined (delete = TRUE).
|
|
*/
|
|
DEFBUF* defendel(char* name, int delete)
|
|
{
|
|
DEFBUF* dp;
|
|
DEFBUF** prevp;
|
|
char* np;
|
|
int nhash;
|
|
int temp=0;
|
|
int size;
|
|
|
|
for (nhash = 0, np = name; *np != EOS;)
|
|
nhash += *np++;
|
|
size = (np - name);
|
|
nhash += size;
|
|
prevp = &symtab[nhash & SBMASK];
|
|
while ((dp = *prevp) != (DEFBUF*) NULL)
|
|
{
|
|
if (dp->hash == nhash &&
|
|
(temp = strcmp(dp->name, name)) >= 0)
|
|
{
|
|
if (temp > 0)
|
|
dp = NULL; /* Not found */
|
|
else
|
|
{
|
|
*prevp = dp->link; /* Found, unlink and */
|
|
if (dp->repl != NULL) /* Free the replacement */
|
|
free(dp->repl); /* if any, and then */
|
|
free((char*) dp); /* Free the symbol */
|
|
dp = NULL;
|
|
}
|
|
break;
|
|
}
|
|
prevp = &dp->link;
|
|
}
|
|
if (!delete)
|
|
{
|
|
dp = (DEFBUF*) getmem(sizeof (DEFBUF) + size + 1);
|
|
dp->link = *prevp;
|
|
*prevp = dp;
|
|
dp->hash = nhash;
|
|
dp->repl = NULL;
|
|
dp->nargs = 0;
|
|
strcpy(dp->name, name);
|
|
}
|
|
return dp;
|
|
}
|
|
|
|
#if OSL_DEBUG_LEVEL > 1
|
|
|
|
void dumpdef(char* why)
|
|
{
|
|
DEFBUF* dp;
|
|
DEFBUF** syp;
|
|
FILE* pRememberOut = NULL;
|
|
|
|
if ( bDumpDefs ) /*ER */
|
|
{
|
|
pRememberOut = pCppOut;
|
|
pCppOut = pDefOut;
|
|
}
|
|
fprintf( pCppOut, "CPP symbol table dump %s\n", why);
|
|
for (syp = symtab; syp < &symtab[SBSIZE]; syp++)
|
|
{
|
|
if ((dp = *syp) != (DEFBUF*) NULL)
|
|
{
|
|
fprintf( pCppOut, "symtab[%" SAL_PRI_PTRDIFFT "d]\n", (syp - symtab));
|
|
do
|
|
{
|
|
dumpadef((char*) NULL, dp);
|
|
}
|
|
while ((dp = dp->link) != (DEFBUF*) NULL);
|
|
}
|
|
}
|
|
if ( bDumpDefs )
|
|
{
|
|
fprintf( pCppOut, "\n");
|
|
pCppOut = pRememberOut;
|
|
}
|
|
}
|
|
|
|
void dumpadef(char* why, DEFBUF* dp)
|
|
{
|
|
char* cp;
|
|
int c;
|
|
FILE* pRememberOut = NULL;
|
|
|
|
/*ER dump #define's to pDefOut */
|
|
if ( bDumpDefs )
|
|
{
|
|
pRememberOut = pCppOut;
|
|
pCppOut = pDefOut;
|
|
}
|
|
fprintf( pCppOut, " \"%s\" [%d]", dp->name, dp->nargs);
|
|
if (why != NULL)
|
|
fprintf( pCppOut, " (%s)", why);
|
|
if (dp->repl != NULL)
|
|
{
|
|
fprintf( pCppOut, " => ");
|
|
for (cp = dp->repl; (c = *cp++ & 0xFF) != EOS;)
|
|
{
|
|
#ifdef SOLAR
|
|
if (c == DEL)
|
|
{
|
|
c = *cp++ & 0xFF;
|
|
if( c == EOS ) break;
|
|
fprintf( pCppOut, "<%%%d>", c - MAC_PARM);
|
|
}
|
|
#else
|
|
if (c >= MAC_PARM && c <= (MAC_PARM + PAR_MAC))
|
|
fprintf( pCppOut, "<%%%d>", c - MAC_PARM);
|
|
#endif
|
|
else if (isprint(c) || c == '\n' || c == '\t')
|
|
PUTCHAR(c);
|
|
else if (c < ' ')
|
|
fprintf( pCppOut, "<^%c>", c + '@');
|
|
else
|
|
fprintf( pCppOut, "<\\0%o>", c);
|
|
}
|
|
/*ER evaluate macros to pDefOut */
|
|
#ifdef EVALDEFS
|
|
if ( bDumpDefs && !bIsInEval && dp->nargs <= 0 )
|
|
{
|
|
FILEINFO* infileSave = infile;
|
|
char* tokenSave = savestring( token );
|
|
char* workSave = savestring( work );
|
|
int lineSave = line;
|
|
int wronglineSave = wrongline;
|
|
int recursionSave = recursion;
|
|
FILEINFO* file;
|
|
EVALTYPE valEval;
|
|
|
|
bIsInEval = 1;
|
|
infile = NULL; /* start from scrap */
|
|
line = 0;
|
|
wrongline = 0;
|
|
*token = EOS;
|
|
*work = EOS;
|
|
recursion = 0;
|
|
file = getfile( strlen( dp->repl ), dp->name );
|
|
strcpy( file->buffer, dp->repl );
|
|
fprintf( pCppOut, " ===> ");
|
|
nEvalOff = 0;
|
|
cppmain(); /* get() frees also *file */
|
|
valEval = 0;
|
|
if ( 0 == evaluate( EvalBuf, &valEval ) )
|
|
{
|
|
#ifdef EVALFLOATS
|
|
if ( valEval != (EVALTYPE)((long)valEval ) )
|
|
fprintf( pCppOut, " ==eval=> %f", valEval );
|
|
else
|
|
#endif
|
|
fprintf( pCppOut, " ==eval=> %ld", (long)valEval );
|
|
}
|
|
recursion = recursionSave;
|
|
wrongline = wronglineSave;
|
|
line = lineSave;
|
|
strcpy( work, workSave );
|
|
free( workSave );
|
|
strcpy( token, tokenSave );
|
|
free( tokenSave );
|
|
infile = infileSave;
|
|
bIsInEval = 0;
|
|
}
|
|
#endif
|
|
}
|
|
else
|
|
{
|
|
fprintf( pCppOut, ", no replacement.");
|
|
}
|
|
PUTCHAR('\n');
|
|
if ( bDumpDefs )
|
|
pCppOut = pRememberOut;
|
|
}
|
|
#endif
|
|
|
|
/*
|
|
* G E T
|
|
*/
|
|
|
|
/*
|
|
* Return the next character from a macro or the current file.
|
|
* Handle end of file from #include files.
|
|
*/
|
|
int get()
|
|
{
|
|
int c;
|
|
FILEINFO* file;
|
|
int popped; /* Recursion fixup */
|
|
|
|
popped = 0;
|
|
get_from_file:
|
|
if ((file = infile) == NULL)
|
|
return EOF_CHAR;
|
|
newline:
|
|
|
|
/*
|
|
* Read a character from the current input line or macro.
|
|
* At EOS, either finish the current macro (freeing temp.
|
|
* storage) or read another line from the current input file.
|
|
* At EOF, exit the current file (#include) or, at EOF from
|
|
* the cpp input file, return EOF_CHAR to finish processing.
|
|
*/
|
|
if ((c = *file->bptr++ & 0xFF) == EOS)
|
|
{
|
|
/*
|
|
* Nothing in current line or macro. Get next line (if
|
|
* input from a file), or do end of file/macro processing.
|
|
* In the latter case, jump back to restart from the top.
|
|
*/
|
|
if (file->fp == NULL) /* NULL if macro */
|
|
{
|
|
popped++;
|
|
recursion -= file->unrecur;
|
|
if (recursion < 0)
|
|
recursion = 0;
|
|
infile = file->parent; /* Unwind file chain */
|
|
}
|
|
else /* Else get from a file */
|
|
{
|
|
if ((file->bptr = fgets(file->buffer, NBUFF, file->fp)) != NULL)
|
|
{
|
|
#if OSL_DEBUG_LEVEL > 1
|
|
if (debug > 1) /* Dump it to stdout */
|
|
{
|
|
fprintf( pCppOut, "\n#line %d (%s), %s",
|
|
line, file->filename, file->buffer);
|
|
}
|
|
#endif
|
|
goto newline; /* process the line */
|
|
}
|
|
else
|
|
{
|
|
if( file->fp != stdin )
|
|
fclose(file->fp); /* Close finished file */
|
|
if ((infile = file->parent) != NULL)
|
|
{
|
|
/*
|
|
* There is an "ungotten" newline in the current
|
|
* infile buffer (set there by doinclude() in
|
|
* cpp1.c). Thus, we know that the mainline code
|
|
* is skipping over blank lines and will do a
|
|
* #line at its convenience.
|
|
*/
|
|
wrongline = TRUE; /* Need a #line now */
|
|
}
|
|
}
|
|
}
|
|
/*
|
|
* Free up space used by the (finished) file or macro and
|
|
* restart input from the parent file/macro, if any.
|
|
*/
|
|
free(file->filename); /* Free name and */
|
|
if (file->progname != NULL) /* if a #line was seen, */
|
|
free(file->progname); /* free it, too. */
|
|
free((char*) file); /* Free file space */
|
|
if (infile == NULL) /* If at end of file */
|
|
return EOF_CHAR; /* Return end of file */
|
|
line = infile->line; /* Reset line number */
|
|
goto get_from_file; /* Get from the top. */
|
|
}
|
|
/*
|
|
* Common processing for the new character.
|
|
*/
|
|
if (c == DEF_MAGIC && file->fp != NULL) /* Don't allow delete */
|
|
goto newline; /* from a file */
|
|
if (file->parent != NULL) /* Macro or #include */
|
|
{
|
|
if (popped != 0)
|
|
file->parent->unrecur += popped;
|
|
else
|
|
{
|
|
recursion -= file->parent->unrecur;
|
|
if (recursion < 0)
|
|
recursion = 0;
|
|
file->parent->unrecur = 0;
|
|
}
|
|
}
|
|
#if (HOST == SYS_UNIX)
|
|
if (c == '\r')
|
|
return get(); /* DOS fuck */
|
|
#endif
|
|
if (c == '\n') /* Maintain current */
|
|
++line; /* line counter */
|
|
if (instring) /* Strings just return */
|
|
return c; /* the character. */
|
|
else if (c == '/') /* Comment? */
|
|
{
|
|
instring = TRUE; /* So get() won't loop */
|
|
|
|
c = get();
|
|
if ((c != '*') && (c != '/')) /* Next byte '*'? */
|
|
{
|
|
instring = FALSE; /* Nope, no comment */
|
|
unget(); /* Push the char. back */
|
|
return '/'; /* Return the slash */
|
|
}
|
|
if (keepcomments) /* If writing comments */
|
|
{
|
|
PUTCHAR('/'); /* Write out the */
|
|
/* initializer */
|
|
if( '*' == c )
|
|
PUTCHAR('*');
|
|
else
|
|
PUTCHAR('/');
|
|
}
|
|
if( '*' == c )
|
|
{
|
|
for (;;) /* Eat a comment */
|
|
{
|
|
c = get();
|
|
test:
|
|
if (keepcomments && c != EOF_CHAR)
|
|
cput(c);
|
|
switch (c)
|
|
{
|
|
case EOF_CHAR:
|
|
cerror("EOF in comment", NULLST);
|
|
return EOF_CHAR;
|
|
|
|
case '/':
|
|
if ((c = get()) != '*') /* Don't let comments */
|
|
goto test; /* Nest. */
|
|
#ifdef STRICT_COMMENTS
|
|
cwarn("Nested comments", NULLST);
|
|
#endif
|
|
/* Fall into * stuff */
|
|
case '*':
|
|
if ((c = get()) != '/') /* If comment doesn't */
|
|
goto test; /* end, look at next */
|
|
instring = FALSE; /* End of comment, */
|
|
if (keepcomments) /* Put out the comment */
|
|
{
|
|
cput(c); /* terminator, too */
|
|
}
|
|
/*
|
|
* A comment is syntactically "whitespace" --
|
|
* however, there are certain strange sequences
|
|
* such as
|
|
* #define foo(x) (something)
|
|
* foo|* comment *|(123)
|
|
* these are '/' ^ ^
|
|
* where just returning space (or COM_SEP) will cause
|
|
* problems. This can be "fixed" by overwriting the
|
|
* '/' in the input line buffer with ' ' (or COM_SEP)
|
|
* but that may mess up an error message.
|
|
* So, we peek ahead -- if the next character is
|
|
* "whitespace" we just get another character, if not,
|
|
* we modify the buffer. All in the name of purity.
|
|
*/
|
|
if (*file->bptr == '\n' || type[*file->bptr & 0xFF] == SPA)
|
|
goto newline;
|
|
return (file->bptr[-1] = ' ');
|
|
|
|
case '\n': /* we'll need a #line */
|
|
if (!keepcomments)
|
|
wrongline = TRUE; /* later... */
|
|
default: /* Anything else is */
|
|
break; /* Just a character */
|
|
} /* End switch */
|
|
} /* End comment loop */
|
|
}
|
|
else /* c++ comment */
|
|
{
|
|
for (;;) /* Eat a comment */
|
|
{
|
|
c = get();
|
|
if (keepcomments && c != EOF_CHAR)
|
|
cput(c);
|
|
if( EOF_CHAR == c )
|
|
return EOF_CHAR;
|
|
else if( '\n' == c )
|
|
{
|
|
instring = FALSE; /* End of comment, */
|
|
return c;
|
|
}
|
|
}
|
|
}
|
|
} /* End if in comment */
|
|
else if (!inmacro && c == '\\') /* If backslash, peek */
|
|
{
|
|
if ((c = get()) == '\n') /* for a <nl>. If so, */
|
|
{
|
|
wrongline = TRUE;
|
|
goto newline;
|
|
}
|
|
else /* Backslash anything */
|
|
{
|
|
unget(); /* Get it later */
|
|
return '\\'; /* Return the backslash */
|
|
}
|
|
}
|
|
else if (c == '\f' || c == VT) /* Form Feed, Vertical */
|
|
{
|
|
c = ' '; /* Tab are whitespace */
|
|
}
|
|
else if (c == 0xef) /* eat up UTF-8 BOM */
|
|
{
|
|
if((c = get()) == 0xbb)
|
|
{
|
|
if((c = get()) == 0xbf)
|
|
{
|
|
c = get();
|
|
return c;
|
|
}
|
|
else
|
|
{
|
|
unget();
|
|
unget();
|
|
return 0xef;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
unget();
|
|
return 0xef;
|
|
}
|
|
}
|
|
return c; /* Just return the char */
|
|
}
|
|
|
|
/*
|
|
* Backup the pointer to reread the last character. Fatal error
|
|
* (code bug) if we backup too far. unget() may be called,
|
|
* without problems, at end of file. Only one character may
|
|
* be ungotten. If you need to unget more, call ungetstring().
|
|
*/
|
|
void unget()
|
|
{
|
|
FILEINFO* file;
|
|
|
|
if ((file = infile) == NULL)
|
|
return; /* Unget after EOF */
|
|
if (--file->bptr < file->buffer)
|
|
cfatal("Too much pushback", NULLST);
|
|
if (*file->bptr == '\n') /* Ungetting a newline? */
|
|
--line; /* Unget the line number, too */
|
|
}
|
|
|
|
/*
|
|
* Push a string back on the input stream. This is done by treating
|
|
* the text as if it were a macro.
|
|
*/
|
|
void ungetstring(char* text)
|
|
{
|
|
FILEINFO* file;
|
|
file = getfile(strlen(text) + 1, "");
|
|
strcpy(file->buffer, text);
|
|
}
|
|
|
|
/*
|
|
* Get one character, absorb "funny space" after comments or
|
|
* token concatenation
|
|
*/
|
|
int cget()
|
|
{
|
|
int c;
|
|
|
|
do
|
|
{
|
|
c = get();
|
|
}
|
|
while (c == TOK_SEP);
|
|
return c;
|
|
}
|
|
|
|
/*
|
|
* Error messages and other hacks. The first byte of severity
|
|
* is 'S' for string arguments and 'I' for int arguments. This
|
|
* is needed for portability with machines that have int's that
|
|
* are shorter than char *'s.
|
|
*/
|
|
|
|
/*
|
|
* Print filenames, macro names, and line numbers for error messages.
|
|
*/
|
|
static void domsg(char* severity, char* format, void* arg)
|
|
{
|
|
char* tp;
|
|
FILEINFO* file;
|
|
|
|
fprintf(stderr, "%sline %d, %s: ", MSG_PREFIX, line, &severity[1]);
|
|
if (*severity == 'S')
|
|
fprintf(stderr, format, (char*)arg);
|
|
else
|
|
fprintf(stderr, format, *((int*)arg) );
|
|
putc('\n', stderr);
|
|
if ((file = infile) == NULL)
|
|
return; /* At end of file */
|
|
if (file->fp != NULL)
|
|
{
|
|
tp = file->buffer; /* Print current file */
|
|
fprintf(stderr, "%s", tp); /* name, making sure */
|
|
if (tp[strlen(tp) - 1] != '\n') /* there's a newline */
|
|
putc('\n', stderr);
|
|
}
|
|
while ((file = file->parent) != NULL) /* Print #includes, too */
|
|
{
|
|
if (file->fp == NULL)
|
|
fprintf(stderr, "from macro %s\n", file->filename);
|
|
else
|
|
{
|
|
tp = file->buffer;
|
|
fprintf(stderr, "from file %s, line %d:\n%s",
|
|
(file->progname != NULL)
|
|
? file->progname : file->filename,
|
|
file->line, tp);
|
|
if (tp[strlen(tp) - 1] != '\n')
|
|
putc('\n', stderr);
|
|
}
|
|
}
|
|
}
|
|
|
|
/*
|
|
* Print a normal error message, string argument.
|
|
*/
|
|
void cerror(char* format, char* sarg)
|
|
{
|
|
domsg("SError", format, sarg);
|
|
errors++;
|
|
}
|
|
|
|
/*
|
|
* Print a normal error message, numeric argument.
|
|
*/
|
|
void cierror(char* format, int narg)
|
|
{
|
|
domsg("IError", format, &narg);
|
|
errors++;
|
|
}
|
|
|
|
/*
|
|
* A real disaster
|
|
*/
|
|
void cfatal(char* format, char* sarg)
|
|
{
|
|
domsg("SFatal error", format, sarg);
|
|
exit(IO_ERROR);
|
|
}
|
|
|
|
/*
|
|
* A non-fatal error, string argument.
|
|
*/
|
|
void cwarn(char* format, char* sarg)
|
|
{
|
|
domsg("SWarning", format, sarg);
|
|
}
|
|
|
|
/*
|
|
* A non-fatal error, numeric argument.
|
|
*/
|
|
void ciwarn(char* format, int narg)
|
|
{
|
|
domsg("IWarning", format, &narg);
|
|
}
|
|
|
|
/* vim:set shiftwidth=4 softtabstop=4 expandtab: */
|