office-gobmx/rsc/source/rscpp/cpp6.c
Stephan Bergmann 7a77d77eff Use a C99 flexible array member
...so the following strcpy does not cause a false abort under _FORTIFY_SOURCE=2

Change-Id: I395136f11020064766db76f87ed8f5b01c083c3a
Reviewed-on: https://gerrit.libreoffice.org/18681
Tested-by: Jenkins <ci@libreoffice.org>
Reviewed-by: Stephan Bergmann <sbergman@redhat.com>
2015-09-18 13:15:27 +00:00

1135 lines
37 KiB
C

/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
/*
* This file is part of the LibreOffice project.
*
* This Source Code Form is subject to the terms of the Mozilla Public
* License, v. 2.0. If a copy of the MPL was not distributed with this
* file, You can obtain one at http://mozilla.org/MPL/2.0/.
*
* This file incorporates work covered by the following license notice:
*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed
* with this work for additional information regarding copyright
* ownership. The ASF licenses this file to you under the Apache
* License, Version 2.0 (the "License"); you may not use this file
* except in compliance with the License. You may obtain a copy of
* the License at http://www.apache.org/licenses/LICENSE-2.0 .
*/
#include <sal/types.h>
#include <stdio.h>
#include <ctype.h>
#include <string.h>
#include "cppdef.h"
#include "cpp.h"
/*ER evaluate macros to pDefOut */
/*
* skipnl() skips over input text to the end of the line.
* skipws() skips over "whitespace" (spaces or tabs), but
* does not skip over the end of the line. It skips over
* TOK_SEP, however (though that shouldn't happen).
* scanid() reads the next token (C identifier) into token[].
* The caller has already read the first character of
* the identifier. Unlike macroid(), the token is
* never expanded.
* macroid() reads the next token (C identifier) into token[].
* If it is a #defined macro, it is expanded, and
* macroid() returns TRUE, otherwise, FALSE.
* catenate() Does the dirty work of token concatenation, TRUE if it did.
* scanstring() Reads a string from the input stream, calling
* a user-supplied function for each character.
* This function may be output() to write the
* string to the output file, or save() to save
* the string in the work buffer.
* scannumber() Reads a C numeric constant from the input stream,
* calling the user-supplied function for each
* character. (output() or save() as noted above.)
* save() Save one character in the work[] buffer.
* savestring() Saves a string in malloc() memory.
* getfile() Initialize a new FILEINFO structure, called when
* #include opens a new file, or a macro is to be
* expanded.
* getmem() Get a specified number of bytes from malloc memory.
* output() Write one character to stdout (calling PUTCHAR) --
* implemented as a function so its address may be
* passed to scanstring() and scannumber().
* lookid() Scans the next token (identifier) from the input
* stream. Looks for it in the #defined symbol table.
* Returns a pointer to the definition, if found, or NULL
* if not present. The identifier is stored in token[].
* defendel() Define enter/delete subroutine. Updates the
* symbol table.
* get() Read the next byte from the current input stream,
* handling end of (macro/file) input and embedded
* comments appropriately. Note that the global
* instring is -- essentially -- a parameter to get().
* cget() Like get(), but skip over TOK_SEP.
* unget() Push last gotten character back on the input stream.
* cerror(), cwarn(), cfatal(), cierror(), ciwarn()
* These routines format and print messages to the user.
* cerror & cwarn take a format and a single string argument.
* cierror & ciwarn take a format and a single int (char) argument.
* cfatal takes a format and a single string argument.
*/
/*
* This table must be rewritten for a non-Ascii machine.
*
* Note that several "non-visible" characters have special meaning:
* Hex 1D DEF_MAGIC -- a flag to prevent #define recursion.
* Hex 1E TOK_SEP -- a delimiter for token concatenation
* Hex 1F COM_SEP -- a zero-width whitespace for comment concatenation
*/
#if TOK_SEP != 0x1E || COM_SEP != 0x1F || DEF_MAGIC != 0x1D
<< error type table is not correct >>
#endif
/* '$' (hex 24) gets the same class as a letter in the table below. */
#define DOL LET
/*
* Character classification table, indexed by the character code (0..255).
* Only entries 00..BF are listed explicitly; entries C0..FF have no
* initializer and are therefore zero, like the other unclassified codes.
*/
char type[256] = { /* Character type codes Hex */
END, 000, 000, 000, 000, 000, 000, 000, /* 00 */
000, SPA, 000, 000, 000, 000, 000, 000, /* 08 (09 = tab) */
000, 000, 000, 000, 000, 000, 000, 000, /* 10 */
000, 000, 000, 000, 000, LET, 000, SPA, /* 18 (1D = DEF_MAGIC, 1F = COM_SEP) */
SPA,OP_NOT, QUO, 000, DOL,OP_MOD,OP_AND, QUO, /* 20 !"#$%&' */
OP_LPA,OP_RPA,OP_MUL,OP_ADD, 000,OP_SUB, DOT,OP_DIV, /* 28 ()*+,-./ */
DIG, DIG, DIG, DIG, DIG, DIG, DIG, DIG, /* 30 01234567 */
DIG, DIG,OP_COL, 000, OP_LT, OP_EQ, OP_GT,OP_QUE, /* 38 89:;<=>? */
000, LET, LET, LET, LET, LET, LET, LET, /* 40 @ABCDEFG */
LET, LET, LET, LET, LET, LET, LET, LET, /* 48 HIJKLMNO */
LET, LET, LET, LET, LET, LET, LET, LET, /* 50 PQRSTUVW */
LET, LET, LET, 000, BSH, 000,OP_XOR, LET, /* 58 XYZ[\]^_ */
000, LET, LET, LET, LET, LET, LET, LET, /* 60 `abcdefg */
LET, LET, LET, LET, LET, LET, LET, LET, /* 68 hijklmno */
LET, LET, LET, LET, LET, LET, LET, LET, /* 70 pqrstuvw */
LET, LET, LET, 000, OP_OR, 000,OP_NOT, 000, /* 78 xyz{|}~ */
000, 000, 000, 000, 000, 000, 000, 000, /* 80 */
000, 000, 000, 000, 000, 000, 000, 000, /* 88 */
000, 000, 000, 000, 000, 000, 000, 000, /* 90 */
000, 000, 000, 000, 000, 000, 000, 000, /* 98 */
000, 000, 000, 000, 000, 000, 000, 000, /* A0 */
000, 000, 000, 000, 000, 000, 000, 000, /* A8 */
000, 000, 000, 000, 000, 000, 000, 000, /* B0 */
000, 000, 000, 000, 000, 000, 000, 000, /* B8; C0 .. FF default to 0 */
};
/*
* C P P S y m b o l T a b l e s
*/
/*
* SBSIZE defines the number of hash-table slots for the symbol table.
* It must be a power of 2.
*/
#ifndef SBSIZE
#define SBSIZE 64
#endif
#define SBMASK (SBSIZE - 1)
#if (SBSIZE ^ SBMASK) != ((SBSIZE * 2) - 1)
<< error, SBSIZE must be a power of 2 >>
#endif
static DEFBUF *symtab[SBSIZE]; /* Symbol table queue headers */

/*
 * Reset the symbol table: every hash bucket becomes an empty chain.
 */
void InitCpp6()
{
    DEFBUF** bucket;

    for (bucket = symtab; bucket < &symtab[SBSIZE]; ++bucket)
        *bucket = NULL;
}
/*
 * Discard input up to and including the next newline, or until
 * get() reports EOF_CHAR, whichever comes first.
 */
void skipnl()
{
    for (;;)
    {
        const int ch = get();

        if (ch == '\n' || ch == EOF_CHAR)
            return;
    }
}
/*
 * Read past every character whose class is SPA and return the first
 * character that is not.
 */
int skipws()
{
    int ch = get();

    while (type[ch] == SPA)
        ch = get();
    return ch;
}
/*
 * Collect an identifier into token[], starting with c (which the caller
 * has already read).  A leading DEF_MAGIC is dropped.  At most IDMAX
 * characters are stored; longer identifiers are read completely but
 * truncated.  The character that ends the identifier is pushed back.
 *
 * Note: lookid() contains the same scanning loop -- keep them in step.
 */
void scanid(int c)
{
    char* out = token;
    char* const limit = &token[IDMAX];  /* token dim is IDMAX+1 */

    if (c == DEF_MAGIC)                 /* Eat the magic token undefiner */
        c = get();
    for (;;)
    {
        if (out < limit)
            *out++ = (char)c;
        c = get();
        if (type[c] != LET && type[c] != DIG)
            break;
    }
    unget();
    *out = EOS;
}
/*
 * While c starts an identifier that lookid() finds in the symbol table,
 * expand that macro and read the next character.  Returns the first
 * character that does not start a defined macro; when its class is LET
 * the identifier itself has been left in token[].
 *
 * The recursion counter is cleared whenever input comes from a real file.
 */
int macroid(int c)
{
    if (infile != NULL && infile->fp != NULL)
        recursion = 0;
    for (;;)
    {
        DEFBUF* def;

        if (type[c] != LET)
            break;
        def = lookid(c);
        if (def == NULL)
            break;
        expand(def);
        c = get();
    }
    return c;
}
/*
* A token was just read (via macroid).
* If the next character is TOK_SEP, concatenate the next token
* return TRUE -- which should recall macroid after refreshing
* macroid's argument. If it is not TOK_SEP, unget() the character
* and return FALSE.
*/
int catenate()
{
int c;
char* token1;
if (get() != TOK_SEP) /* Token concatenation */
{
unget();
return FALSE;
}
else
{
token1 = savestring(token); /* Save first token */
c = macroid(get()); /* Scan next token */
switch(type[c]) /* What was it? */
{
case LET: /* An identifier, ... */
if (strlen(token1) + strlen(token) >= NWORK)
cfatal("work buffer overflow doing %s #", token1);
sprintf(work, "%s%s", token1, token);
break;
case DIG: /* A digit string */
strcpy(work, token1);
workp = work + strlen(work);
do
{
save(c);
}
while ((c = get()) != TOK_SEP);
/*
* The trailing TOK_SEP is no longer needed.
*/
save(EOS);
break;
default: /* An error, ... */
if (isprint(c))
cierror("Strange character '%c' after #", c);
else
cierror("Strange character (%d.) after #", c);
strcpy(work, token1);
unget();
break;
}
/*
* work has the concatenated token and token1 has
* the first token (no longer needed). Unget the
* new (concatenated) token after freeing token1.
* Finally, setup to read the new token.
*/
free(token1); /* Free up memory */
ungetstring(work); /* Unget the new thing, */
return TRUE;
}
}
/*
 * Copy a quoted string through outfun(), starting with the opening
 * delimiter.  Comment stripping is disabled while the string is read.
 * DEF_MAGIC bytes are not passed on; the character after a backslash is
 * passed on unexamined.
 *
 * Returns TRUE when the closing delimiter was found.  If a newline or
 * EOF_CHAR ends the string first, an error is reported, that character
 * is pushed back, and FALSE is returned.
 */
int scanstring(int delim,
#ifndef _NO_PROTO
               void (*outfun)( int ) /* BP */ /* Output function */
#else
               void (*outfun)() /* BP */
#endif
)
{
    int ch;

    instring = TRUE;                    /* Don't strip comments */
    outfun(delim);
    for (;;)
    {
        ch = get();
        if (ch == delim || ch == '\n' || ch == EOF_CHAR)
            break;
        if (ch != DEF_MAGIC)
            outfun(ch);
        if (ch == '\\')
            outfun(get());
    }
    instring = FALSE;

    if (ch != delim)
    {
        cerror("Unterminated string", NULLST);
        unget();
        return FALSE;
    }
    outfun(ch);
    return TRUE;
}
/*
* Process a number. We know that c is from 0 to 9 or dot.
* Algorithm from Dave Conroy's Decus C.
*
* c is the first character of the number (already read by the caller);
* outfun is called once for every character accepted as part of the
* number. The first character that does not belong to the number is
* pushed back with unget(). A lone '.' not followed by a digit is
* output by itself. A warning is issued if an '8' or '9' was seen and
* the number is still considered octal at the end.
*/
void scannumber(int c,
#ifndef _NO_PROTO
void (*outfun)( int ) /* BP */ /* Output/store func */
#else
void (*outfun)() /* BP */
#endif
)
{
int radix; /* 8, 10, or 16 */
int expseen; /* 'e' seen in floater */
int signseen; /* '+' or '-' seen */
int octal89; /* For bad octal test */
int dotflag; /* TRUE if '.' was seen */
expseen = FALSE; /* No exponent seen yet */
signseen = TRUE; /* No +/- allowed yet */
octal89 = FALSE; /* No bad octal yet */
radix = 10; /* Assume decimal */
if ((dotflag = (c == '.')) != FALSE) /* . something? */
{
(*outfun)('.'); /* Always out the dot */
if (type[(c = get())] != DIG) /* If not a float numb, */
{
unget(); /* Rescan strange char */
return; /* All done for now */
}
} /* End of float test */
else if (c == '0') /* Octal or hex? */
{
(*outfun)(c); /* Stuff initial zero */
radix = 8; /* Assume it's octal */
c = get(); /* Look for an 'x' */
if (c == 'x' || c == 'X') /* Did we get one? */
{
radix = 16; /* Remember new radix */
(*outfun)(c); /* Stuff the 'x' */
c = get(); /* Get next character */
}
}
for (;;) /* Process curr. char. */
{
/*
* Note that this algorithm accepts "012e4" and "03.4"
* as legitimate floating-point numbers.
*/
if (radix != 16 && (c == 'e' || c == 'E'))
{
if (expseen) /* Already saw 'E'? */
break; /* Exit loop, bad nbr. */
expseen = TRUE; /* Set exponent seen */
signseen = FALSE; /* We can read '+' now */
radix = 10; /* Decimal exponent */
}
else if (radix != 16 && c == '.')
{
if (dotflag) /* Saw dot already? */
break; /* Exit loop, two dots */
dotflag = TRUE; /* Remember the dot */
radix = 10; /* Decimal fraction */
}
else if (c == '+' || c == '-') /* 1.0e+10 */
{
if (signseen) /* Sign in wrong place? */
break; /* Exit loop, not nbr. */
/* signseen is set again below, after the sign has been output */
}
else /* Check the digit */
{
switch (c)
{
case '8': case '9': /* Sometimes wrong */
octal89 = TRUE; /* Do check later */
/* FALLTHROUGH -- 8 and 9 are otherwise handled like 0..7 */
case '0': case '1': case '2': case '3':
case '4': case '5': case '6': case '7':
break; /* Always ok */
case 'a': case 'b': case 'c': case 'd': case 'e': case 'f':
case 'A': case 'B': case 'C': case 'D': case 'E': case 'F':
if (radix == 16) /* Alpha's are ok only */
break; /* if reading hex. */
/* FALLTHROUGH -- a letter outside hex ends the number */
default: /* At number end */
goto done; /* Break from for loop */
} /* End of switch */
} /* End general case */
(*outfun)(c); /* Accept the character */
signseen = TRUE; /* Don't read sign now */
c = get(); /* Read another char */
} /* End of scan loop */
/*
* When we break out of the scan loop, c contains the first
* character (maybe) not in the number. If the number is an
* integer, allow a trailing 'L' for long and/or a trailing 'U'
* for unsigned. If not those, push the trailing character back
* on the input stream. Floating point numbers accept a trailing
* 'L' for "long double".
*/
done:
if (dotflag || expseen) /* Floating point? */
{
if (c == 'l' || c == 'L')
{
(*outfun)(c);
get(); /* Read one more so the unget() at nomore balances */
}
}
else /* Else it's an integer */
{
/*
* We know that dotflag and expseen are both zero, now:
* dotflag signals "saw 'L'", and
* expseen signals "saw 'U'".
*/
for (;;)
{
switch (c)
{
case 'l':
case 'L':
if (dotflag)
goto nomore;
dotflag = TRUE;
break;
case 'u':
case 'U':
if (expseen)
goto nomore;
expseen = TRUE;
break;
default:
goto nomore;
}
(*outfun)(c); /* Got 'L' or 'U'. */
c = get(); /* Look at next, too. */
}
}
nomore:
unget(); /* Not part of a number */
/* radix is still 8 only if no '.', exponent or 'x' was seen */
if (octal89 && radix == 8)
cwarn("Illegal digit in octal number", NULLST);
}
/*
 * Append one character to the work[] buffer at workp.  If the buffer is
 * already full, terminate it and abort via cfatal().
 */
void save(int c)
{
    if (workp < &work[NWORK])
    {
        *workp++ = (char)c;
        return;
    }
    work[NWORK-1] = '\0';
    cfatal("Work buffer overflow: %s", work);
}
/*
 * Return a copy of text in memory obtained from getmem().
 */
char* savestring(char* text)
{
    const size_t bytes = strlen(text) + 1;      /* include the terminator */
    char* copy = getmem(bytes);

    memcpy(copy, text, bytes);
    return copy;
}
/*
* Common FILEINFO buffer initialization for a new file or macro.
*/
FILEINFO* getfile(size_t bufsize, char* name)
{
FILEINFO* file;
size_t size;
size = strlen(name); /* File/macro name */
file = (FILEINFO*) getmem(sizeof (FILEINFO) + bufsize + size);
file->parent = infile; /* Chain files together */
file->fp = NULL; /* No file yet */
file->filename = savestring(name); /* Save file/macro name */
file->progname = NULL; /* No #line seen yet */
file->unrecur = 0; /* No macro fixup */
file->bptr = file->buffer; /* Initialize line ptr */
file->buffer[0] = EOS; /* Force first read */
file->line = 0; /* (Not used just yet) */
if (infile != NULL) /* If #include file */
infile->line = line; /* Save current line */
infile = file; /* New current file */
line = 1; /* Note first line */
return file; /* All done. */
}
/*
 * Get a block of free memory.
 *
 * size     number of bytes requested
 *
 * Returns the new block.  If malloc() fails, cfatal() is called with
 * "Out of memory".
 *
 * The request is passed to malloc() as a size_t.  The former cast to
 * unsigned silently truncated requests larger than UINT_MAX on platforms
 * where size_t is wider than unsigned, handing back a block smaller than
 * the caller asked for.
 */
char* getmem(size_t size)
{
    char* result = malloc(size);

    if (result == NULL)
        cfatal("Out of memory", NULLST);
    return result;
}
/*
* Look for the next token in the symbol table. Returns token in "token".
* If found, returns the table pointer; Else returns NULL.
*/
DEFBUF* lookid(int c)
{
int nhash;
DEFBUF* dp;
char* np;
int temp = 0;
int isrecurse; /* For #define foo foo */
np = token;
nhash = 0;
if (0 != (isrecurse = (c == DEF_MAGIC)))/* If recursive macro */
c = get(); /* hack, skip DEF_MAGIC */
do
{
if (np < &token[IDMAX]) /* token dim is IDMAX+1 */
{
*np++ = (char)c; /* Store token byte */
nhash += c; /* Update hash value */
}
c = get(); /* And get another byte */
}
while (type[c] == LET || type[c] == DIG);
unget(); /* Rescan terminator */
*np = EOS; /* Terminate token */
if (isrecurse) /* Recursive definition */
return NULL; /* undefined just now */
nhash += (np - token); /* Fix hash value */
dp = symtab[nhash & SBMASK]; /* Starting bucket */
while (dp != (DEFBUF*) NULL) /* Search symbol table */
{
if (dp->hash == nhash && /* Fast precheck */
(temp = strcmp(dp->name, token)) >= 0)
{
break;
}
dp = dp->link; /* Nope, try next one */
}
return ((temp == 0) ? dp : NULL);
}
/*
 * Enter a name in the symbol table (delete = FALSE) or remove it
 * (delete = TRUE).
 *
 * An existing definition of the same name is always unlinked and freed
 * first, together with its replacement text.  When entering, a fresh
 * block with no replacement and zero arguments is linked in at the
 * position where the search stopped and returned.  When deleting, the
 * function returns NULL.
 */
DEFBUF* defendel(char* name, int delete)
{
    DEFBUF** slot;
    DEFBUF*  cur;
    DEFBUF*  fresh = NULL;
    char*    p;
    int      hash = 0;
    int      len;

    for (p = name; *p != EOS; ++p)
        hash += *p;
    len = (p - name);
    hash += len;

    for (slot = &symtab[hash & SBMASK]; (cur = *slot) != NULL; slot = &cur->link)
    {
        int cmp;

        if (cur->hash != hash)
            continue;
        cmp = strcmp(cur->name, name);
        if (cmp < 0)
            continue;
        if (cmp == 0)                   /* Found: unlink and release it */
        {
            *slot = cur->link;
            if (cur->repl != NULL)
                free(cur->repl);
            free((char*) cur);
        }
        break;                          /* cmp > 0 means not present */
    }

    if (!delete)
    {
        fresh = (DEFBUF*) getmem(sizeof (DEFBUF) + len + 1);
        fresh->link  = *slot;
        *slot        = fresh;
        fresh->hash  = hash;
        fresh->repl  = NULL;
        fresh->nargs = 0;
        strcpy(fresh->name, name);
    }
    return fresh;
}
#if OSL_DEBUG_LEVEL > 1
void dumpdef(char* why)
{
DEFBUF* dp;
DEFBUF** syp;
FILE* pRememberOut = NULL;
if ( bDumpDefs ) /*ER */
{
pRememberOut = pCppOut;
pCppOut = pDefOut;
}
fprintf( pCppOut, "CPP symbol table dump %s\n", why);
for (syp = symtab; syp < &symtab[SBSIZE]; syp++)
{
if ((dp = *syp) != (DEFBUF*) NULL)
{
fprintf( pCppOut, "symtab[%" SAL_PRI_PTRDIFFT "d]\n", (syp - symtab));
do
{
dumpadef((char*) NULL, dp);
}
while ((dp = dp->link) != (DEFBUF*) NULL);
}
}
if ( bDumpDefs )
{
fprintf( pCppOut, "\n");
pCppOut = pRememberOut;
}
}
/*
* Debug aid: print one definition -- its name, argument count, the
* optional remark "why", and its replacement text (or a note that there
* is none). Macro parameter markers are shown as <%n>, control
* characters as <^X>, and other non-printable bytes in octal.
* While bDumpDefs is set the output goes to pDefOut instead of pCppOut.
*
* With EVALDEFS, a macro whose nargs is <= 0 is additionally run through
* cppmain() and evaluate(), and the resulting value is printed. The
* scanner globals touched by that are saved before and restored after.
*/
void dumpadef(char* why, DEFBUF* dp)
{
char* cp;
int c;
FILE* pRememberOut = NULL;
/*ER dump #define's to pDefOut */
if ( bDumpDefs )
{
pRememberOut = pCppOut;
pCppOut = pDefOut;
}
fprintf( pCppOut, " \"%s\" [%d]", dp->name, dp->nargs);
if (why != NULL)
fprintf( pCppOut, " (%s)", why);
if (dp->repl != NULL)
{
fprintf( pCppOut, " => ");
for (cp = dp->repl; (c = *cp++ & 0xFF) != EOS;)
{
/* Both preprocessor variants open an if-chain continued after #endif. */
#ifdef SOLAR
if (c == DEL)
{
/* The byte after DEL is printed as the parameter number */
c = *cp++ & 0xFF;
if( c == EOS ) break;
fprintf( pCppOut, "<%%%d>", c - MAC_PARM);
}
#else
if (c >= MAC_PARM && c <= (MAC_PARM + PAR_MAC))
fprintf( pCppOut, "<%%%d>", c - MAC_PARM);
#endif
else if (isprint(c) || c == '\n' || c == '\t')
PUTCHAR(c);
else if (c < ' ')
fprintf( pCppOut, "<^%c>", c + '@');
else
fprintf( pCppOut, "<\\0%o>", c);
}
/*ER evaluate macros to pDefOut */
#ifdef EVALDEFS
/* bIsInEval guards against re-entering this evaluation */
if ( bDumpDefs && !bIsInEval && dp->nargs <= 0 )
{
/* Save the scanner state that the nested cppmain() run will clobber */
FILEINFO* infileSave = infile;
char* tokenSave = savestring( token );
char* workSave = savestring( work );
int lineSave = line;
int wronglineSave = wrongline;
int recursionSave = recursion;
FILEINFO* file;
EVALTYPE valEval;
bIsInEval = 1;
infile = NULL; /* start from scrap */
line = 0;
wrongline = 0;
*token = EOS;
*work = EOS;
recursion = 0;
/* Feed the replacement text to the scanner as the only input */
file = getfile( strlen( dp->repl ), dp->name );
strcpy( file->buffer, dp->repl );
fprintf( pCppOut, " ===> ");
nEvalOff = 0;
cppmain(); /* get() frees also *file */
valEval = 0;
if ( 0 == evaluate( EvalBuf, &valEval ) )
{
#ifdef EVALFLOATS
/* Print as floating point only if the value is not integral */
if ( valEval != (EVALTYPE)((long)valEval ) )
fprintf( pCppOut, " ==eval=> %f", valEval );
else
#endif
fprintf( pCppOut, " ==eval=> %ld", (long)valEval );
}
/* Restore the saved scanner state */
recursion = recursionSave;
wrongline = wronglineSave;
line = lineSave;
strcpy( work, workSave );
free( workSave );
strcpy( token, tokenSave );
free( tokenSave );
infile = infileSave;
bIsInEval = 0;
}
#endif
}
else
{
fprintf( pCppOut, ", no replacement.");
}
PUTCHAR('\n');
if ( bDumpDefs )
pCppOut = pRememberOut;
}
#endif
/*
* G E T
*/
/*
* Return the next character from a macro or the current file.
* Handle end of file from #include files.
*
* Returns EOF_CHAR when no input source is left. Otherwise the result
* is the next input byte (0..255) after the following processing:
* - finished macros and files are popped and their FILEINFO is freed;
* - DEF_MAGIC bytes read from a real file are ignored;
* - carriage returns are dropped when HOST == SYS_UNIX;
* - while the global instring is set, characters are returned as is;
* - otherwise comments are consumed (and echoed if keepcomments),
* backslash-newline is removed when not in a macro, form feed and
* vertical tab become a space, and the byte sequence EF BB BF
* (UTF-8 BOM) is skipped.
*
* NOTE(review): the EOF_CHAR returns inside the comment loops leave
* instring set to TRUE -- confirm that callers do not depend on it being
* reset at end of input.
*/
int get()
{
int c;
FILEINFO* file;
int popped; /* Recursion fixup */
popped = 0;
get_from_file:
if ((file = infile) == NULL)
return EOF_CHAR;
newline:
/*
* Read a character from the current input line or macro.
* At EOS, either finish the current macro (freeing temp.
* storage) or read another line from the current input file.
* At EOF, exit the current file (#include) or, at EOF from
* the cpp input file, return EOF_CHAR to finish processing.
*/
if ((c = *file->bptr++ & 0xFF) == EOS)
{
/*
* Nothing in current line or macro. Get next line (if
* input from a file), or do end of file/macro processing.
* In the latter case, jump back to restart from the top.
*/
if (file->fp == NULL) /* NULL if macro */
{
popped++;
recursion -= file->unrecur;
if (recursion < 0)
recursion = 0;
infile = file->parent; /* Unwind file chain */
}
else /* Else get from a file */
{
if ((file->bptr = fgets(file->buffer, NBUFF, file->fp)) != NULL)
{
#if OSL_DEBUG_LEVEL > 1
if (debug > 1) /* Dump it to stdout */
{
fprintf( pCppOut, "\n#line %d (%s), %s",
line, file->filename, file->buffer);
}
#endif
goto newline; /* process the line */
}
else
{
if( file->fp != stdin )
fclose(file->fp); /* Close finished file */
if ((infile = file->parent) != NULL)
{
/*
* There is an "ungotten" newline in the current
* infile buffer (set there by doinclude() in
* cpp1.c). Thus, we know that the mainline code
* is skipping over blank lines and will do a
* #line at its convenience.
*/
wrongline = TRUE; /* Need a #line now */
}
}
}
/*
* Free up space used by the (finished) file or macro and
* restart input from the parent file/macro, if any.
*/
free(file->filename); /* Free name and */
if (file->progname != NULL) /* if a #line was seen, */
free(file->progname); /* free it, too. */
free((char*) file); /* Free file space */
if (infile == NULL) /* If at end of file */
return EOF_CHAR; /* Return end of file */
line = infile->line; /* Reset line number */
goto get_from_file; /* Get from the top. */
}
/*
* Common processing for the new character.
*/
if (c == DEF_MAGIC && file->fp != NULL) /* Don't allow delete */
goto newline; /* from a file */
if (file->parent != NULL) /* Macro or #include */
{
/* Hand the count of macros popped during this call to the parent */
if (popped != 0)
file->parent->unrecur += popped;
else
{
recursion -= file->parent->unrecur;
if (recursion < 0)
recursion = 0;
file->parent->unrecur = 0;
}
}
#if (HOST == SYS_UNIX)
if (c == '\r')
return get(); /* Drop CR of DOS line ends */
#endif
if (c == '\n') /* Maintain current */
++line; /* line counter */
if (instring) /* Strings just return */
return c; /* the character. */
else if (c == '/') /* Comment? */
{
instring = TRUE; /* So get() won't loop */
c = get();
if ((c != '*') && (c != '/')) /* Next byte '*'? */
{
instring = FALSE; /* Nope, no comment */
unget(); /* Push the char. back */
return '/'; /* Return the slash */
}
if (keepcomments) /* If writing comments */
{
PUTCHAR('/'); /* Write out the */
/* initializer */
if( '*' == c )
PUTCHAR('*');
else
PUTCHAR('/');
}
if( '*' == c )
{
for (;;) /* Eat a comment */
{
c = get();
test:
if (keepcomments && c != EOF_CHAR)
cput(c);
switch (c)
{
case EOF_CHAR:
cerror("EOF in comment", NULLST);
return EOF_CHAR;
case '/':
if ((c = get()) != '*') /* Don't let comments */
goto test; /* Nest. */
#ifdef STRICT_COMMENTS
cwarn("Nested comments", NULLST);
#endif
/* Fall into * stuff */
case '*':
if ((c = get()) != '/') /* If comment doesn't */
goto test; /* end, look at next */
instring = FALSE; /* End of comment, */
if (keepcomments) /* Put out the comment */
{
cput(c); /* terminator, too */
}
/*
* A comment is syntactically "whitespace" --
* however, there are certain strange sequences
* such as
* #define foo(x) (something)
* foo|* comment *|(123)
* these are '/' ^ ^
* where just returning space (or COM_SEP) will cause
* problems. This can be "fixed" by overwriting the
* '/' in the input line buffer with ' ' (or COM_SEP)
* but that may mess up an error message.
* So, we peek ahead -- if the next character is
* "whitespace" we just get another character, if not,
* we modify the buffer. All in the name of purity.
*/
if (*file->bptr == '\n' || type[*file->bptr & 0xFF] == SPA)
goto newline;
return (file->bptr[-1] = ' ');
case '\n': /* we'll need a #line */
if (!keepcomments)
wrongline = TRUE; /* later... */
/* FALLTHROUGH */
default: /* Anything else is */
break; /* Just a character */
} /* End switch */
} /* End comment loop */
}
else /* c++ comment */
{
for (;;) /* Eat a comment */
{
c = get();
if (keepcomments && c != EOF_CHAR)
cput(c);
if( EOF_CHAR == c )
return EOF_CHAR;
else if( '\n' == c )
{
instring = FALSE; /* End of comment, */
return c;
}
}
}
} /* End if in comment */
else if (!inmacro && c == '\\') /* If backslash, peek */
{
if ((c = get()) == '\n') /* for a <nl>. If so, */
{
wrongline = TRUE;
goto newline;
}
else /* Backslash anything */
{
unget(); /* Get it later */
return '\\'; /* Return the backslash */
}
}
else if (c == '\f' || c == VT) /* Form Feed, Vertical */
{
c = ' '; /* Tab are whitespace */
}
else if (c == 0xef) /* eat up UTF-8 BOM */
{
if((c = get()) == 0xbb)
{
if((c = get()) == 0xbf)
{
/* Full EF BB BF seen: return the character after it */
c = get();
return c;
}
else
{
/* Not a BOM: push back both bytes read after 0xef */
unget();
unget();
return 0xef;
}
}
else
{
unget();
return 0xef;
}
}
return c; /* Just return the char */
}
/*
 * Step the input pointer back so the last character is read again.
 * Calling this after end of input is harmless.  Backing up past the
 * start of the buffer is a fatal error (a bug in the caller); use
 * ungetstring() to push back more than the last character.
 */
void unget()
{
    FILEINFO* file = infile;

    if (file == NULL)                   /* Unget after EOF */
        return;
    --file->bptr;
    if (file->bptr < file->buffer)
        cfatal("Too much pushback", NULLST);
    if (*file->bptr == '\n')            /* A newline is read again later, */
        --line;                         /* so take its count back, too.   */
}
/*
 * Push a whole string back onto the input by making it the buffer of a
 * new, unnamed input source, exactly as is done for macro text.
 */
void ungetstring(char* text)
{
    const size_t bytes = strlen(text) + 1;      /* include the terminator */
    FILEINFO* pushed = getfile(bytes, "");

    memcpy(pushed->buffer, text, bytes);
}
/*
 * Like get(), but any TOK_SEP characters are silently skipped.
 */
int cget()
{
    int ch;

    while ((ch = get()) == TOK_SEP)
        continue;
    return ch;
}
/*
* Error messages and other hacks. The first byte of severity
* is 'S' for string arguments and 'I' for int arguments. This
* is needed for portability with machines that have int's that
* are shorter than char *'s.
*/
/*
 * Print a message to stderr, followed by the input context: the current
 * input line and the chain of enclosing macros and files.
 *
 * severity  The first byte selects how arg is read: 'S' means arg is a
 *           char* string, anything else means arg points to an int.
 *           The rest of the string is the label printed in the message.
 * format    printf-style format that consumes that one argument.
 * arg       The string, or a pointer to the int value.
 *
 * An input buffer may still be empty (getfile() starts it out that way),
 * so the "does it end in a newline" check must not index before the
 * start of the buffer.
 */
static void domsg(char* severity, char* format, void* arg)
{
    FILEINFO* file;
    char*     tp;
    size_t    len;

    fprintf(stderr, "%sline %d, %s: ", MSG_PREFIX, line, &severity[1]);
    if (*severity == 'S')
        fprintf(stderr, format, (char*)arg);
    else
        fprintf(stderr, format, *((int*)arg) );
    putc('\n', stderr);

    if ((file = infile) == NULL)
        return;                         /* At end of file */
    if (file->fp != NULL)
    {
        tp = file->buffer;              /* Echo the current input line, */
        fprintf(stderr, "%s", tp);      /* making sure it ends in a     */
        len = strlen(tp);               /* newline.                     */
        if (len > 0 && tp[len - 1] != '\n')
            putc('\n', stderr);
    }
    while ((file = file->parent) != NULL)   /* Print #includes, too */
    {
        if (file->fp == NULL)
            fprintf(stderr, "from macro %s\n", file->filename);
        else
        {
            tp = file->buffer;
            fprintf(stderr, "from file %s, line %d:\n%s",
                (file->progname != NULL)
                    ? file->progname : file->filename,
                file->line, tp);
            len = strlen(tp);
            if (len > 0 && tp[len - 1] != '\n')
                putc('\n', stderr);
        }
    }
}
/*
 * Report an error whose format takes one string argument and count it
 * in errors.
 */
void cerror(char* format, char* sarg)
{
    domsg("SError", format, sarg);
    ++errors;
}
/*
 * Report an error whose format takes one int argument and count it in
 * errors.
 */
void cierror(char* format, int narg)
{
    domsg("IError", format, &narg);
    ++errors;
}
/*
 * Report an unrecoverable error (format takes one string argument) and
 * terminate the program with exit status IO_ERROR.
 */
void cfatal(char* format, char* sarg)
{
    domsg("SFatal error", format, sarg);
    exit(IO_ERROR);
}
/*
 * Print a warning whose format takes one string argument.  The error
 * count is not changed.
 */
void cwarn(char* format, char* sarg)
{
    domsg("SWarning", format, sarg);
}
/*
 * Print a warning whose format takes one int argument.  The error count
 * is not changed.
 */
void ciwarn(char* format, int narg)
{
    domsg("IWarning", format, &narg);
}
/* vim:set shiftwidth=4 softtabstop=4 expandtab: */