aboutsummaryrefslogtreecommitdiff
path: root/tinycc/tccpp.c
diff options
context:
space:
mode:
Diffstat (limited to 'tinycc/tccpp.c')
-rw-r--r--tinycc/tccpp.c3999
1 files changed, 0 insertions, 3999 deletions
diff --git a/tinycc/tccpp.c b/tinycc/tccpp.c
deleted file mode 100644
index 717ab48..0000000
--- a/tinycc/tccpp.c
+++ /dev/null
@@ -1,3999 +0,0 @@
-/*
- * TCC - Tiny C Compiler
- *
- * Copyright (c) 2001-2004 Fabrice Bellard
- *
- * This library is free software; you can redistribute it and/or
- * modify it under the terms of the GNU Lesser General Public
- * License as published by the Free Software Foundation; either
- * version 2 of the License, or (at your option) any later version.
- *
- * This library is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
- * Lesser General Public License for more details.
- *
- * You should have received a copy of the GNU Lesser General Public
- * License along with this library; if not, write to the Free Software
- * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
- */
-
-#define USING_GLOBALS
-#include "tcc.h"
-
-/* #define to 1 to enable (see parse_pp_string()) */
-#define ACCEPT_LF_IN_STRINGS 0
-
-/********************************************************/
-/* global variables */
-
-ST_DATA int tok_flags;
-ST_DATA int parse_flags;
-
-ST_DATA struct BufferedFile *file;
-ST_DATA int tok;
-ST_DATA CValue tokc;
-ST_DATA const int *macro_ptr;
-ST_DATA CString tokcstr; /* current parsed string, if any */
-
-/* display benchmark infos */
-ST_DATA int tok_ident;
-ST_DATA TokenSym **table_ident;
-
-/* ------------------------------------------------------------------------- */
-
-static TokenSym *hash_ident[TOK_HASH_SIZE];
-static char token_buf[STRING_MAX_SIZE + 1];
-static CString cstr_buf;
-static TokenString tokstr_buf;
-static unsigned char isidnum_table[256 - CH_EOF];
-static int pp_debug_tok, pp_debug_symv;
-static int pp_once;
-static int pp_expr;
-static int pp_counter;
-static void tok_print(const char *msg, const int *str);
-
-static struct TinyAlloc *toksym_alloc;
-static struct TinyAlloc *tokstr_alloc;
-
-static TokenString *macro_stack;
-
-static const char tcc_keywords[] =
-#define DEF(id, str) str "\0"
-#include "tcctok.h"
-#undef DEF
-;
-
-/* WARNING: the content of this string encodes token numbers */
-static const unsigned char tok_two_chars[] =
-/* outdated -- gr
- "<=\236>=\235!=\225&&\240||\241++\244--\242==\224<<\1>>\2+=\253"
- "-=\255*=\252/=\257%=\245&=\246^=\336|=\374->\313..\250##\266";
-*/{
- '<','=', TOK_LE,
- '>','=', TOK_GE,
- '!','=', TOK_NE,
- '&','&', TOK_LAND,
- '|','|', TOK_LOR,
- '+','+', TOK_INC,
- '-','-', TOK_DEC,
- '=','=', TOK_EQ,
- '<','<', TOK_SHL,
- '>','>', TOK_SAR,
- '+','=', TOK_A_ADD,
- '-','=', TOK_A_SUB,
- '*','=', TOK_A_MUL,
- '/','=', TOK_A_DIV,
- '%','=', TOK_A_MOD,
- '&','=', TOK_A_AND,
- '^','=', TOK_A_XOR,
- '|','=', TOK_A_OR,
- '-','>', TOK_ARROW,
- '.','.', TOK_TWODOTS,
- '#','#', TOK_TWOSHARPS,
- '#','#', TOK_PPJOIN,
- 0
-};
-
-static void next_nomacro(void);
-
-ST_FUNC void skip(int c)
-{
- if (tok != c)
- tcc_error("'%c' expected (got \"%s\")", c, get_tok_str(tok, &tokc));
- next();
-}
-
-ST_FUNC void expect(const char *msg)
-{
- tcc_error("%s expected", msg);
-}
-
-/* ------------------------------------------------------------------------- */
-/* Custom allocator for tiny objects */
-
-#define USE_TAL
-
-#ifndef USE_TAL
-#define tal_free(al, p) tcc_free(p)
-#define tal_realloc(al, p, size) tcc_realloc(p, size)
-#define tal_new(a,b,c)
-#define tal_delete(a)
-#else
-#if !defined(MEM_DEBUG)
-#define tal_free(al, p) tal_free_impl(al, p)
-#define tal_realloc(al, p, size) tal_realloc_impl(&al, p, size)
-#define TAL_DEBUG_PARAMS
-#else
-#define TAL_DEBUG 1
-//#define TAL_INFO 1 /* collect and dump allocators stats */
-#define tal_free(al, p) tal_free_impl(al, p, __FILE__, __LINE__)
-#define tal_realloc(al, p, size) tal_realloc_impl(&al, p, size, __FILE__, __LINE__)
-#define TAL_DEBUG_PARAMS , const char *file, int line
-#define TAL_DEBUG_FILE_LEN 40
-#endif
-
-#define TOKSYM_TAL_SIZE (768 * 1024) /* allocator for tiny TokenSym in table_ident */
-#define TOKSTR_TAL_SIZE (768 * 1024) /* allocator for tiny TokenString instances */
-#define CSTR_TAL_SIZE (256 * 1024) /* allocator for tiny CString instances */
-#define TOKSYM_TAL_LIMIT 256 /* prefer unique limits to distinguish allocators debug msgs */
-#define TOKSTR_TAL_LIMIT 128 /* 32 * sizeof(int) */
-#define CSTR_TAL_LIMIT 1024
-
-typedef struct TinyAlloc {
- unsigned limit;
- unsigned size;
- uint8_t *buffer;
- uint8_t *p;
- unsigned nb_allocs;
- struct TinyAlloc *next, *top;
-#ifdef TAL_INFO
- unsigned nb_peak;
- unsigned nb_total;
- unsigned nb_missed;
- uint8_t *peak_p;
-#endif
-} TinyAlloc;
-
-typedef struct tal_header_t {
- unsigned size;
-#ifdef TAL_DEBUG
- int line_num; /* negative line_num used for double free check */
- char file_name[TAL_DEBUG_FILE_LEN + 1];
-#endif
-} tal_header_t;
-
-/* ------------------------------------------------------------------------- */
-
-static TinyAlloc *tal_new(TinyAlloc **pal, unsigned limit, unsigned size)
-{
- TinyAlloc *al = tcc_mallocz(sizeof(TinyAlloc));
- al->p = al->buffer = tcc_malloc(size);
- al->limit = limit;
- al->size = size;
- if (pal) *pal = al;
- return al;
-}
-
-static void tal_delete(TinyAlloc *al)
-{
- TinyAlloc *next;
-
-tail_call:
- if (!al)
- return;
-#ifdef TAL_INFO
- fprintf(stderr, "limit=%5d, size=%5g MB, nb_peak=%6d, nb_total=%8d, nb_missed=%6d, usage=%5.1f%%\n",
- al->limit, al->size / 1024.0 / 1024.0, al->nb_peak, al->nb_total, al->nb_missed,
- (al->peak_p - al->buffer) * 100.0 / al->size);
-#endif
-#ifdef TAL_DEBUG
- if (al->nb_allocs > 0) {
- uint8_t *p;
- fprintf(stderr, "TAL_DEBUG: memory leak %d chunk(s) (limit= %d)\n",
- al->nb_allocs, al->limit);
- p = al->buffer;
- while (p < al->p) {
- tal_header_t *header = (tal_header_t *)p;
- if (header->line_num > 0) {
- fprintf(stderr, "%s:%d: chunk of %d bytes leaked\n",
- header->file_name, header->line_num, header->size);
- }
- p += header->size + sizeof(tal_header_t);
- }
-#if MEM_DEBUG-0 == 2
- exit(2);
-#endif
- }
-#endif
- next = al->next;
- tcc_free(al->buffer);
- tcc_free(al);
- al = next;
- goto tail_call;
-}
-
-static void tal_free_impl(TinyAlloc *al, void *p TAL_DEBUG_PARAMS)
-{
- if (!p)
- return;
-tail_call:
- if (al->buffer <= (uint8_t *)p && (uint8_t *)p < al->buffer + al->size) {
-#ifdef TAL_DEBUG
- tal_header_t *header = (((tal_header_t *)p) - 1);
- if (header->line_num < 0) {
- fprintf(stderr, "%s:%d: TAL_DEBUG: double frees chunk from\n",
- file, line);
- fprintf(stderr, "%s:%d: %d bytes\n",
- header->file_name, (int)-header->line_num, (int)header->size);
- } else
- header->line_num = -header->line_num;
-#endif
- al->nb_allocs--;
- if (!al->nb_allocs)
- al->p = al->buffer;
- } else if (al->next) {
- al = al->next;
- goto tail_call;
- }
- else
- tcc_free(p);
-}
-
-static void *tal_realloc_impl(TinyAlloc **pal, void *p, unsigned size TAL_DEBUG_PARAMS)
-{
- tal_header_t *header;
- void *ret;
- int is_own;
- unsigned adj_size = (size + 3) & -4;
- TinyAlloc *al = *pal;
-
-tail_call:
- is_own = (al->buffer <= (uint8_t *)p && (uint8_t *)p < al->buffer + al->size);
- if ((!p || is_own) && size <= al->limit) {
- if (al->p - al->buffer + adj_size + sizeof(tal_header_t) < al->size) {
- header = (tal_header_t *)al->p;
- header->size = adj_size;
-#ifdef TAL_DEBUG
- { int ofs = strlen(file) - TAL_DEBUG_FILE_LEN;
- strncpy(header->file_name, file + (ofs > 0 ? ofs : 0), TAL_DEBUG_FILE_LEN);
- header->file_name[TAL_DEBUG_FILE_LEN] = 0;
- header->line_num = line; }
-#endif
- ret = al->p + sizeof(tal_header_t);
- al->p += adj_size + sizeof(tal_header_t);
- if (is_own) {
- header = (((tal_header_t *)p) - 1);
- if (p) memcpy(ret, p, header->size);
-#ifdef TAL_DEBUG
- header->line_num = -header->line_num;
-#endif
- } else {
- al->nb_allocs++;
- }
-#ifdef TAL_INFO
- if (al->nb_peak < al->nb_allocs)
- al->nb_peak = al->nb_allocs;
- if (al->peak_p < al->p)
- al->peak_p = al->p;
- al->nb_total++;
-#endif
- return ret;
- } else if (is_own) {
- al->nb_allocs--;
- ret = tal_realloc(*pal, 0, size);
- header = (((tal_header_t *)p) - 1);
- if (p) memcpy(ret, p, header->size);
-#ifdef TAL_DEBUG
- header->line_num = -header->line_num;
-#endif
- return ret;
- }
- if (al->next) {
- al = al->next;
- } else {
- TinyAlloc *bottom = al, *next = al->top ? al->top : al;
-
- al = tal_new(pal, next->limit, next->size * 2);
- al->next = next;
- bottom->top = al;
- }
- goto tail_call;
- }
- if (is_own) {
- al->nb_allocs--;
- ret = tcc_malloc(size);
- header = (((tal_header_t *)p) - 1);
- if (p) memcpy(ret, p, header->size);
-#ifdef TAL_DEBUG
- header->line_num = -header->line_num;
-#endif
- } else if (al->next) {
- al = al->next;
- goto tail_call;
- } else
- ret = tcc_realloc(p, size);
-#ifdef TAL_INFO
- al->nb_missed++;
-#endif
- return ret;
-}
-
-#endif /* USE_TAL */
-
-/* ------------------------------------------------------------------------- */
-/* CString handling */
-static void cstr_realloc(CString *cstr, int new_size)
-{
- int size;
-
- size = cstr->size_allocated;
- if (size < 8)
- size = 8; /* no need to allocate a too small first string */
- while (size < new_size)
- size = size * 2;
- cstr->data = tcc_realloc(cstr->data, size);
- cstr->size_allocated = size;
-}
-
-/* add a byte */
-ST_INLN void cstr_ccat(CString *cstr, int ch)
-{
- int size;
- size = cstr->size + 1;
- if (size > cstr->size_allocated)
- cstr_realloc(cstr, size);
- ((unsigned char *)cstr->data)[size - 1] = ch;
- cstr->size = size;
-}
-
-ST_INLN char *unicode_to_utf8 (char *b, uint32_t Uc)
-{
- if (Uc<0x80) *b++=Uc;
- else if (Uc<0x800) *b++=192+Uc/64, *b++=128+Uc%64;
- else if (Uc-0xd800u<0x800) goto error;
- else if (Uc<0x10000) *b++=224+Uc/4096, *b++=128+Uc/64%64, *b++=128+Uc%64;
- else if (Uc<0x110000) *b++=240+Uc/262144, *b++=128+Uc/4096%64, *b++=128+Uc/64%64, *b++=128+Uc%64;
- else error: tcc_error("0x%x is not a valid universal character", Uc);
- return b;
-}
-
-/* add a unicode character expanded into utf8 */
-ST_INLN void cstr_u8cat(CString *cstr, int ch)
-{
- char buf[4], *e;
- e = unicode_to_utf8(buf, (uint32_t)ch);
- cstr_cat(cstr, buf, e - buf);
-}
-
-ST_FUNC void cstr_cat(CString *cstr, const char *str, int len)
-{
- int size;
- if (len <= 0)
- len = strlen(str) + 1 + len;
- size = cstr->size + len;
- if (size > cstr->size_allocated)
- cstr_realloc(cstr, size);
- memmove(((unsigned char *)cstr->data) + cstr->size, str, len);
- cstr->size = size;
-}
-
-/* add a wide char */
-ST_FUNC void cstr_wccat(CString *cstr, int ch)
-{
- int size;
- size = cstr->size + sizeof(nwchar_t);
- if (size > cstr->size_allocated)
- cstr_realloc(cstr, size);
- *(nwchar_t *)(((unsigned char *)cstr->data) + size - sizeof(nwchar_t)) = ch;
- cstr->size = size;
-}
-
-ST_FUNC void cstr_new(CString *cstr)
-{
- memset(cstr, 0, sizeof(CString));
-}
-
-/* free string and reset it to NULL */
-ST_FUNC void cstr_free(CString *cstr)
-{
- tcc_free(cstr->data);
-}
-
-/* reset string to empty */
-ST_FUNC void cstr_reset(CString *cstr)
-{
- cstr->size = 0;
-}
-
-ST_FUNC int cstr_vprintf(CString *cstr, const char *fmt, va_list ap)
-{
- va_list v;
- int len, size = 80;
- for (;;) {
- size += cstr->size;
- if (size > cstr->size_allocated)
- cstr_realloc(cstr, size);
- size = cstr->size_allocated - cstr->size;
- va_copy(v, ap);
- len = vsnprintf((char*)cstr->data + cstr->size, size, fmt, v);
- va_end(v);
- if (len >= 0 && len < size)
- break;
- size *= 2;
- }
- cstr->size += len;
- return len;
-}
-
-ST_FUNC int cstr_printf(CString *cstr, const char *fmt, ...)
-{
- va_list ap; int len;
- va_start(ap, fmt);
- len = cstr_vprintf(cstr, fmt, ap);
- va_end(ap);
- return len;
-}
-
-/* XXX: unicode ? */
-static void add_char(CString *cstr, int c)
-{
- if (c == '\'' || c == '\"' || c == '\\') {
- /* XXX: could be more precise if char or string */
- cstr_ccat(cstr, '\\');
- }
- if (c >= 32 && c <= 126) {
- cstr_ccat(cstr, c);
- } else {
- cstr_ccat(cstr, '\\');
- if (c == '\n') {
- cstr_ccat(cstr, 'n');
- } else {
- cstr_ccat(cstr, '0' + ((c >> 6) & 7));
- cstr_ccat(cstr, '0' + ((c >> 3) & 7));
- cstr_ccat(cstr, '0' + (c & 7));
- }
- }
-}
-
-/* ------------------------------------------------------------------------- */
-/* allocate a new token */
-static TokenSym *tok_alloc_new(TokenSym **pts, const char *str, int len)
-{
- TokenSym *ts, **ptable;
- int i;
-
- if (tok_ident >= SYM_FIRST_ANOM)
- tcc_error("memory full (symbols)");
-
- /* expand token table if needed */
- i = tok_ident - TOK_IDENT;
- if ((i % TOK_ALLOC_INCR) == 0) {
- ptable = tcc_realloc(table_ident, (i + TOK_ALLOC_INCR) * sizeof(TokenSym *));
- table_ident = ptable;
- }
-
- ts = tal_realloc(toksym_alloc, 0, sizeof(TokenSym) + len);
- table_ident[i] = ts;
- ts->tok = tok_ident++;
- ts->sym_define = NULL;
- ts->sym_label = NULL;
- ts->sym_struct = NULL;
- ts->sym_identifier = NULL;
- ts->len = len;
- ts->hash_next = NULL;
- memcpy(ts->str, str, len);
- ts->str[len] = '\0';
- *pts = ts;
- return ts;
-}
-
-#define TOK_HASH_INIT 1
-#define TOK_HASH_FUNC(h, c) ((h) + ((h) << 5) + ((h) >> 27) + (c))
-
-
-/* find a token and add it if not found */
-ST_FUNC TokenSym *tok_alloc(const char *str, int len)
-{
- TokenSym *ts, **pts;
- int i;
- unsigned int h;
-
- h = TOK_HASH_INIT;
- for(i=0;i<len;i++)
- h = TOK_HASH_FUNC(h, ((unsigned char *)str)[i]);
- h &= (TOK_HASH_SIZE - 1);
-
- pts = &hash_ident[h];
- for(;;) {
- ts = *pts;
- if (!ts)
- break;
- if (ts->len == len && !memcmp(ts->str, str, len))
- return ts;
- pts = &(ts->hash_next);
- }
- return tok_alloc_new(pts, str, len);
-}
-
-ST_FUNC int tok_alloc_const(const char *str)
-{
- return tok_alloc(str, strlen(str))->tok;
-}
-
-
-/* XXX: buffer overflow */
-/* XXX: float tokens */
-ST_FUNC const char *get_tok_str(int v, CValue *cv)
-{
- char *p;
- int i, len;
-
- cstr_reset(&cstr_buf);
- p = cstr_buf.data;
-
- switch(v) {
- case TOK_CINT:
- case TOK_CUINT:
- case TOK_CLONG:
- case TOK_CULONG:
- case TOK_CLLONG:
- case TOK_CULLONG:
- /* XXX: not quite exact, but only useful for testing */
-#ifdef _WIN32
- sprintf(p, "%u", (unsigned)cv->i);
-#else
- sprintf(p, "%llu", (unsigned long long)cv->i);
-#endif
- break;
- case TOK_LCHAR:
- cstr_ccat(&cstr_buf, 'L');
- case TOK_CCHAR:
- cstr_ccat(&cstr_buf, '\'');
- add_char(&cstr_buf, cv->i);
- cstr_ccat(&cstr_buf, '\'');
- cstr_ccat(&cstr_buf, '\0');
- break;
- case TOK_PPNUM:
- case TOK_PPSTR:
- return (char*)cv->str.data;
- case TOK_LSTR:
- cstr_ccat(&cstr_buf, 'L');
- case TOK_STR:
- cstr_ccat(&cstr_buf, '\"');
- if (v == TOK_STR) {
- len = cv->str.size - 1;
- for(i=0;i<len;i++)
- add_char(&cstr_buf, ((unsigned char *)cv->str.data)[i]);
- } else {
- len = (cv->str.size / sizeof(nwchar_t)) - 1;
- for(i=0;i<len;i++)
- add_char(&cstr_buf, ((nwchar_t *)cv->str.data)[i]);
- }
- cstr_ccat(&cstr_buf, '\"');
- cstr_ccat(&cstr_buf, '\0');
- break;
-
- case TOK_CFLOAT:
- return strcpy(p, "<float>");
- case TOK_CDOUBLE:
- return strcpy(p, "<double>");
- case TOK_CLDOUBLE:
- return strcpy(p, "<long double>");
- case TOK_LINENUM:
- return strcpy(p, "<linenumber");
-
- /* above tokens have value, the ones below don't */
- case TOK_LT:
- v = '<';
- goto addv;
- case TOK_GT:
- v = '>';
- goto addv;
- case TOK_DOTS:
- return strcpy(p, "...");
- case TOK_A_SHL:
- return strcpy(p, "<<=");
- case TOK_A_SAR:
- return strcpy(p, ">>=");
- case TOK_EOF:
- return strcpy(p, "<eof>");
- case 0: /* anonymous nameless symbols */
- return strcpy(p, "<no name>");
- default:
- if (v < TOK_IDENT) {
- /* search in two bytes table */
- const unsigned char *q = tok_two_chars;
- while (*q) {
- if (q[2] == v) {
- *p++ = q[0];
- *p++ = q[1];
- *p = '\0';
- return cstr_buf.data;
- }
- q += 3;
- }
- if (v >= 127 || (v < 32 && !is_space(v) && v != '\n')) {
- sprintf(p, "<\\x%02x>", v);
- break;
- }
- addv:
- *p++ = v;
- *p = '\0';
- } else if (v < tok_ident) {
- return table_ident[v - TOK_IDENT]->str;
- } else if (v >= SYM_FIRST_ANOM) {
- /* special name for anonymous symbol */
- sprintf(p, "L.%u", v - SYM_FIRST_ANOM);
- } else {
- /* should never happen */
- return NULL;
- }
- break;
- }
- return cstr_buf.data;
-}
-
-static inline int check_space(int t, int *spc)
-{
- if (t < 256 && (isidnum_table[t - CH_EOF] & IS_SPC)) {
- if (*spc)
- return 1;
- *spc = 1;
- } else
- *spc = 0;
- return 0;
-}
-
-/* return the current character, handling end of block if necessary
- (but not stray) */
-static int handle_eob(void)
-{
- BufferedFile *bf = file;
- int len;
-
- /* only tries to read if really end of buffer */
- if (bf->buf_ptr >= bf->buf_end) {
- if (bf->fd >= 0) {
-#if defined(PARSE_DEBUG)
- len = 1;
-#else
- len = IO_BUF_SIZE;
-#endif
- len = read(bf->fd, bf->buffer, len);
- if (len < 0)
- len = 0;
- } else {
- len = 0;
- }
- total_bytes += len;
- bf->buf_ptr = bf->buffer;
- bf->buf_end = bf->buffer + len;
- *bf->buf_end = CH_EOB;
- }
- if (bf->buf_ptr < bf->buf_end) {
- return bf->buf_ptr[0];
- } else {
- bf->buf_ptr = bf->buf_end;
- return CH_EOF;
- }
-}
-
-/* read next char from current input file and handle end of input buffer */
-static int next_c(void)
-{
- int ch = *++file->buf_ptr;
- /* end of buffer/file handling */
- if (ch == CH_EOB && file->buf_ptr >= file->buf_end)
- ch = handle_eob();
- return ch;
-}
-
-/* input with '\[\r]\n' handling. */
-static int handle_stray_noerror(int err)
-{
- int ch;
- while ((ch = next_c()) == '\\') {
- ch = next_c();
- if (ch == '\n') {
- newl:
- file->line_num++;
- } else {
- if (ch == '\r') {
- ch = next_c();
- if (ch == '\n')
- goto newl;
- *--file->buf_ptr = '\r';
- }
- if (err)
- tcc_error("stray '\\' in program");
- /* may take advantage of 'BufferedFile.unget[4}' */
- return *--file->buf_ptr = '\\';
- }
- }
- return ch;
-}
-
-#define ninp() handle_stray_noerror(0)
-
-/* handle '\\' in strings, comments and skipped regions */
-static int handle_bs(uint8_t **p)
-{
- int c;
- file->buf_ptr = *p - 1;
- c = ninp();
- *p = file->buf_ptr;
- return c;
-}
-
-/* skip the stray and handle the \\n case. Output an error if
- incorrect char after the stray */
-static int handle_stray(uint8_t **p)
-{
- int c;
- file->buf_ptr = *p - 1;
- c = handle_stray_noerror(!(parse_flags & PARSE_FLAG_ACCEPT_STRAYS));
- *p = file->buf_ptr;
- return c;
-}
-
-/* handle the complicated stray case */
-#define PEEKC(c, p)\
-{\
- c = *++p;\
- if (c == '\\')\
- c = handle_stray(&p); \
-}
-
-static int skip_spaces(void)
-{
- int ch;
- --file->buf_ptr;
- do {
- ch = ninp();
- } while (isidnum_table[ch - CH_EOF] & IS_SPC);
- return ch;
-}
-
-/* single line C++ comments */
-static uint8_t *parse_line_comment(uint8_t *p)
-{
- int c;
- for(;;) {
- for (;;) {
- c = *++p;
- redo:
- if (c == '\n' || c == '\\')
- break;
- c = *++p;
- if (c == '\n' || c == '\\')
- break;
- }
- if (c == '\n')
- break;
- c = handle_bs(&p);
- if (c == CH_EOF)
- break;
- if (c != '\\')
- goto redo;
- }
- return p;
-}
-
-/* C comments */
-static uint8_t *parse_comment(uint8_t *p)
-{
- int c;
- for(;;) {
- /* fast skip loop */
- for(;;) {
- c = *++p;
- redo:
- if (c == '\n' || c == '*' || c == '\\')
- break;
- c = *++p;
- if (c == '\n' || c == '*' || c == '\\')
- break;
- }
- /* now we can handle all the cases */
- if (c == '\n') {
- file->line_num++;
- } else if (c == '*') {
- do {
- c = *++p;
- } while (c == '*');
- if (c == '\\')
- c = handle_bs(&p);
- if (c == '/')
- break;
- goto check_eof;
- } else {
- c = handle_bs(&p);
- check_eof:
- if (c == CH_EOF)
- tcc_error("unexpected end of file in comment");
- if (c != '\\')
- goto redo;
- }
- }
- return p + 1;
-}
-
-/* parse a string without interpreting escapes */
-static uint8_t *parse_pp_string(uint8_t *p, int sep, CString *str)
-{
- int c;
- for(;;) {
- c = *++p;
- redo:
- if (c == sep) {
- break;
- } else if (c == '\\') {
- c = handle_bs(&p);
- if (c == CH_EOF) {
- unterminated_string:
- /* XXX: indicate line number of start of string */
- tok_flags &= ~TOK_FLAG_BOL;
- tcc_error("missing terminating %c character", sep);
- } else if (c == '\\') {
- if (str)
- cstr_ccat(str, c);
- c = *++p;
- /* add char after '\\' unconditionally */
- if (c == '\\') {
- c = handle_bs(&p);
- if (c == CH_EOF)
- goto unterminated_string;
- }
- goto add_char;
- } else {
- goto redo;
- }
- } else if (c == '\n') {
- add_lf:
- if (ACCEPT_LF_IN_STRINGS) {
- file->line_num++;
- goto add_char;
- } else if (str) { /* not skipping */
- goto unterminated_string;
- } else {
- //tcc_warning("missing terminating %c character", sep);
- return p;
- }
- } else if (c == '\r') {
- c = *++p;
- if (c == '\\')
- c = handle_bs(&p);
- if (c == '\n')
- goto add_lf;
- if (c == CH_EOF)
- goto unterminated_string;
- if (str)
- cstr_ccat(str, '\r');
- goto redo;
- } else {
- add_char:
- if (str)
- cstr_ccat(str, c);
- }
- }
- p++;
- return p;
-}
-
-/* skip block of text until #else, #elif or #endif. skip also pairs of
- #if/#endif */
-static void preprocess_skip(void)
-{
- int a, start_of_line, c, in_warn_or_error;
- uint8_t *p;
-
- p = file->buf_ptr;
- a = 0;
-redo_start:
- start_of_line = 1;
- in_warn_or_error = 0;
- for(;;) {
- redo_no_start:
- c = *p;
- switch(c) {
- case ' ':
- case '\t':
- case '\f':
- case '\v':
- case '\r':
- p++;
- goto redo_no_start;
- case '\n':
- file->line_num++;
- p++;
- goto redo_start;
- case '\\':
- c = handle_bs(&p);
- if (c == CH_EOF)
- expect("#endif");
- if (c == '\\')
- ++p;
- goto redo_no_start;
- /* skip strings */
- case '\"':
- case '\'':
- if (in_warn_or_error)
- goto _default;
- tok_flags &= ~TOK_FLAG_BOL;
- p = parse_pp_string(p, c, NULL);
- break;
- /* skip comments */
- case '/':
- if (in_warn_or_error)
- goto _default;
- ++p;
- c = handle_bs(&p);
- if (c == '*') {
- p = parse_comment(p);
- } else if (c == '/') {
- p = parse_line_comment(p);
- }
- break;
- case '#':
- p++;
- if (start_of_line) {
- file->buf_ptr = p;
- next_nomacro();
- p = file->buf_ptr;
- if (a == 0 &&
- (tok == TOK_ELSE || tok == TOK_ELIF || tok == TOK_ENDIF))
- goto the_end;
- if (tok == TOK_IF || tok == TOK_IFDEF || tok == TOK_IFNDEF)
- a++;
- else if (tok == TOK_ENDIF)
- a--;
- else if( tok == TOK_ERROR || tok == TOK_WARNING)
- in_warn_or_error = 1;
- else if (tok == TOK_LINEFEED)
- goto redo_start;
- else if (parse_flags & PARSE_FLAG_ASM_FILE)
- p = parse_line_comment(p - 1);
- }
-#if !defined(TCC_TARGET_ARM)
- else if (parse_flags & PARSE_FLAG_ASM_FILE)
- p = parse_line_comment(p - 1);
-#else
- /* ARM assembly uses '#' for constants */
-#endif
- break;
-_default:
- default:
- p++;
- break;
- }
- start_of_line = 0;
- }
- the_end: ;
- file->buf_ptr = p;
-}
-
-#if 0
-/* return the number of additional 'ints' necessary to store the
- token */
-static inline int tok_size(const int *p)
-{
- switch(*p) {
- /* 4 bytes */
- case TOK_CINT:
- case TOK_CUINT:
- case TOK_CCHAR:
- case TOK_LCHAR:
- case TOK_CFLOAT:
- case TOK_LINENUM:
- return 1 + 1;
- case TOK_STR:
- case TOK_LSTR:
- case TOK_PPNUM:
- case TOK_PPSTR:
- return 1 + ((sizeof(CString) + ((CString *)(p+1))->size + 3) >> 2);
- case TOK_CLONG:
- case TOK_CULONG:
- return 1 + LONG_SIZE / 4;
- case TOK_CDOUBLE:
- case TOK_CLLONG:
- case TOK_CULLONG:
- return 1 + 2;
- case TOK_CLDOUBLE:
-#ifdef TCC_USING_DOUBLE_FOR_LDOUBLE
- return 1 + 8 / 4;
-#else
- return 1 + LDOUBLE_SIZE / 4;
-#endif
- default:
- return 1 + 0;
- }
-}
-#endif
-
-/* token string handling */
-ST_INLN void tok_str_new(TokenString *s)
-{
- s->str = NULL;
- s->len = s->lastlen = 0;
- s->allocated_len = 0;
- s->last_line_num = -1;
-}
-
-ST_FUNC TokenString *tok_str_alloc(void)
-{
- TokenString *str = tal_realloc(tokstr_alloc, 0, sizeof *str);
- tok_str_new(str);
- return str;
-}
-
-ST_FUNC int *tok_str_dup(TokenString *s)
-{
- int *str;
-
- str = tal_realloc(tokstr_alloc, 0, s->len * sizeof(int));
- memcpy(str, s->str, s->len * sizeof(int));
- return str;
-}
-
-ST_FUNC void tok_str_free_str(int *str)
-{
- tal_free(tokstr_alloc, str);
-}
-
-ST_FUNC void tok_str_free(TokenString *str)
-{
- tok_str_free_str(str->str);
- tal_free(tokstr_alloc, str);
-}
-
-ST_FUNC int *tok_str_realloc(TokenString *s, int new_size)
-{
- int *str, size;
-
- size = s->allocated_len;
- if (size < 16)
- size = 16;
- while (size < new_size)
- size = size * 2;
- if (size > s->allocated_len) {
- str = tal_realloc(tokstr_alloc, s->str, size * sizeof(int));
- s->allocated_len = size;
- s->str = str;
- }
- return s->str;
-}
-
-ST_FUNC void tok_str_add(TokenString *s, int t)
-{
- int len, *str;
-
- len = s->len;
- str = s->str;
- if (len >= s->allocated_len)
- str = tok_str_realloc(s, len + 1);
- str[len++] = t;
- s->len = len;
-}
-
-ST_FUNC void begin_macro(TokenString *str, int alloc)
-{
- str->alloc = alloc;
- str->prev = macro_stack;
- str->prev_ptr = macro_ptr;
- str->save_line_num = file->line_num;
- macro_ptr = str->str;
- macro_stack = str;
-}
-
-ST_FUNC void end_macro(void)
-{
- TokenString *str = macro_stack;
- macro_stack = str->prev;
- macro_ptr = str->prev_ptr;
- file->line_num = str->save_line_num;
- str->len = 0; /* matters if str not alloced, may be tokstr_buf */
- if (str->alloc != 0) {
- if (str->alloc == 2)
- str->str = NULL; /* don't free */
- tok_str_free(str);
- }
-}
-
-static void tok_str_add2(TokenString *s, int t, CValue *cv)
-{
- int len, *str;
-
- len = s->lastlen = s->len;
- str = s->str;
-
- /* allocate space for worst case */
- if (len + TOK_MAX_SIZE >= s->allocated_len)
- str = tok_str_realloc(s, len + TOK_MAX_SIZE + 1);
- str[len++] = t;
- switch(t) {
- case TOK_CINT:
- case TOK_CUINT:
- case TOK_CCHAR:
- case TOK_LCHAR:
- case TOK_CFLOAT:
- case TOK_LINENUM:
-#if LONG_SIZE == 4
- case TOK_CLONG:
- case TOK_CULONG:
-#endif
- str[len++] = cv->tab[0];
- break;
- case TOK_PPNUM:
- case TOK_PPSTR:
- case TOK_STR:
- case TOK_LSTR:
- {
- /* Insert the string into the int array. */
- size_t nb_words =
- 1 + (cv->str.size + sizeof(int) - 1) / sizeof(int);
- if (len + nb_words >= s->allocated_len)
- str = tok_str_realloc(s, len + nb_words + 1);
- str[len] = cv->str.size;
- memcpy(&str[len + 1], cv->str.data, cv->str.size);
- len += nb_words;
- }
- break;
- case TOK_CDOUBLE:
- case TOK_CLLONG:
- case TOK_CULLONG:
-#if LONG_SIZE == 8
- case TOK_CLONG:
- case TOK_CULONG:
-#endif
- str[len++] = cv->tab[0];
- str[len++] = cv->tab[1];
- break;
- case TOK_CLDOUBLE:
-#if LDOUBLE_SIZE == 8 || defined TCC_USING_DOUBLE_FOR_LDOUBLE
- str[len++] = cv->tab[0];
- str[len++] = cv->tab[1];
-#elif LDOUBLE_SIZE == 12
- str[len++] = cv->tab[0];
- str[len++] = cv->tab[1];
- str[len++] = cv->tab[2];
-#elif LDOUBLE_SIZE == 16
- str[len++] = cv->tab[0];
- str[len++] = cv->tab[1];
- str[len++] = cv->tab[2];
- str[len++] = cv->tab[3];
-#else
-#error add long double size support
-#endif
- break;
- default:
- break;
- }
- s->len = len;
-}
-
-/* add the current parse token in token string 's' */
-ST_FUNC void tok_str_add_tok(TokenString *s)
-{
- CValue cval;
-
- /* save line number info */
- if (file->line_num != s->last_line_num) {
- s->last_line_num = file->line_num;
- cval.i = s->last_line_num;
- tok_str_add2(s, TOK_LINENUM, &cval);
- }
- tok_str_add2(s, tok, &tokc);
-}
-
-/* get a token from an integer array and increment pointer. */
-static inline void tok_get(int *t, const int **pp, CValue *cv)
-{
- const int *p = *pp;
- int n, *tab;
-
- tab = cv->tab;
- switch(*t = *p++) {
-#if LONG_SIZE == 4
- case TOK_CLONG:
-#endif
- case TOK_CINT:
- case TOK_CCHAR:
- case TOK_LCHAR:
- case TOK_LINENUM:
- cv->i = *p++;
- break;
-#if LONG_SIZE == 4
- case TOK_CULONG:
-#endif
- case TOK_CUINT:
- cv->i = (unsigned)*p++;
- break;
- case TOK_CFLOAT:
- tab[0] = *p++;
- break;
- case TOK_STR:
- case TOK_LSTR:
- case TOK_PPNUM:
- case TOK_PPSTR:
- cv->str.size = *p++;
- cv->str.data = p;
- p += (cv->str.size + sizeof(int) - 1) / sizeof(int);
- break;
- case TOK_CDOUBLE:
- case TOK_CLLONG:
- case TOK_CULLONG:
-#if LONG_SIZE == 8
- case TOK_CLONG:
- case TOK_CULONG:
-#endif
- n = 2;
- goto copy;
- case TOK_CLDOUBLE:
-#if LDOUBLE_SIZE == 8 || defined TCC_USING_DOUBLE_FOR_LDOUBLE
- n = 2;
-#elif LDOUBLE_SIZE == 12
- n = 3;
-#elif LDOUBLE_SIZE == 16
- n = 4;
-#else
-# error add long double size support
-#endif
- copy:
- do
- *tab++ = *p++;
- while (--n);
- break;
- default:
- break;
- }
- *pp = p;
-}
-
-#if 0
-# define TOK_GET(t,p,c) tok_get(t,p,c)
-#else
-# define TOK_GET(t,p,c) do { \
- int _t = **(p); \
- if (TOK_HAS_VALUE(_t)) \
- tok_get(t, p, c); \
- else \
- *(t) = _t, ++*(p); \
- } while (0)
-#endif
-
-static int macro_is_equal(const int *a, const int *b)
-{
- CValue cv;
- int t;
-
- if (!a || !b)
- return 1;
-
- while (*a && *b) {
- cstr_reset(&tokcstr);
- TOK_GET(&t, &a, &cv);
- cstr_cat(&tokcstr, get_tok_str(t, &cv), 0);
- TOK_GET(&t, &b, &cv);
- if (strcmp(tokcstr.data, get_tok_str(t, &cv)))
- return 0;
- }
- return !(*a || *b);
-}
-
-/* defines handling */
-ST_INLN void define_push(int v, int macro_type, int *str, Sym *first_arg)
-{
- Sym *s, *o;
-
- o = define_find(v);
- s = sym_push2(&define_stack, v, macro_type, 0);
- s->d = str;
- s->next = first_arg;
- table_ident[v - TOK_IDENT]->sym_define = s;
-
- if (o && !macro_is_equal(o->d, s->d))
- tcc_warning("%s redefined", get_tok_str(v, NULL));
-}
-
-/* undefined a define symbol. Its name is just set to zero */
-ST_FUNC void define_undef(Sym *s)
-{
- int v = s->v;
- if (v >= TOK_IDENT && v < tok_ident)
- table_ident[v - TOK_IDENT]->sym_define = NULL;
-}
-
-ST_INLN Sym *define_find(int v)
-{
- v -= TOK_IDENT;
- if ((unsigned)v >= (unsigned)(tok_ident - TOK_IDENT))
- return NULL;
- return table_ident[v]->sym_define;
-}
-
-/* free define stack until top reaches 'b' */
-ST_FUNC void free_defines(Sym *b)
-{
- while (define_stack != b) {
- Sym *top = define_stack;
- define_stack = top->prev;
- tok_str_free_str(top->d);
- define_undef(top);
- sym_free(top);
- }
-}
-
-/* fake the nth "#if defined test_..." for tcc -dt -run */
-static void maybe_run_test(TCCState *s)
-{
- const char *p;
- if (s->include_stack_ptr != s->include_stack)
- return;
- p = get_tok_str(tok, NULL);
- if (0 != memcmp(p, "test_", 5))
- return;
- if (0 != --s->run_test)
- return;
- fprintf(s->ppfp, &"\n[%s]\n"[!(s->dflag & 32)], p), fflush(s->ppfp);
- define_push(tok, MACRO_OBJ, NULL, NULL);
-}
-
-static CachedInclude *
-search_cached_include(TCCState *s1, const char *filename, int add);
-
-static int parse_include(TCCState *s1, int do_next, int test)
-{
- int c, i;
- char name[1024], buf[1024], *p;
- CachedInclude *e;
-
- c = skip_spaces();
- if (c == '<' || c == '\"') {
- cstr_reset(&tokcstr);
- file->buf_ptr = parse_pp_string(file->buf_ptr, c == '<' ? '>' : c, &tokcstr);
- i = tokcstr.size;
- pstrncpy(name, tokcstr.data, i >= sizeof name ? sizeof name - 1 : i);
- next_nomacro();
- } else {
- /* computed #include : concatenate tokens until result is one of
- the two accepted forms. Don't convert pp-tokens to tokens here. */
- parse_flags = PARSE_FLAG_PREPROCESS
- | PARSE_FLAG_LINEFEED
- | (parse_flags & PARSE_FLAG_ASM_FILE);
- name[0] = 0;
- for (;;) {
- next();
- p = name, i = strlen(p) - 1;
- if (i > 0
- && ((p[0] == '"' && p[i] == '"')
- || (p[0] == '<' && p[i] == '>')))
- break;
- if (tok == TOK_LINEFEED)
- tcc_error("'#include' expects \"FILENAME\" or <FILENAME>");
- pstrcat(name, sizeof name, get_tok_str(tok, &tokc));
- }
- c = p[0];
- /* remove '<>|""' */
- memmove(p, p + 1, i - 1), p[i - 1] = 0;
- }
-
- i = do_next ? file->include_next_index : -1;
- for (;;) {
- ++i;
- if (i == 0) {
- /* check absolute include path */
- if (!IS_ABSPATH(name))
- continue;
- buf[0] = '\0';
- } else if (i == 1) {
- /* search in file's dir if "header.h" */
- if (c != '\"')
- continue;
- p = file->true_filename;
- pstrncpy(buf, p, tcc_basename(p) - p);
- } else {
- int j = i - 2, k = j - s1->nb_include_paths;
- if (k < 0)
- p = s1->include_paths[j];
- else if (k < s1->nb_sysinclude_paths)
- p = s1->sysinclude_paths[k];
- else if (test)
- return 0;
- else
- tcc_error("include file '%s' not found", name);
- pstrcpy(buf, sizeof buf, p);
- pstrcat(buf, sizeof buf, "/");
- }
- pstrcat(buf, sizeof buf, name);
- e = search_cached_include(s1, buf, 0);
- if (e && (define_find(e->ifndef_macro) || e->once == pp_once)) {
- /* no need to parse the include because the 'ifndef macro'
- is defined (or had #pragma once) */
-#ifdef INC_DEBUG
- printf("%s: skipping cached %s\n", file->filename, buf);
-#endif
- return 1;
- }
- if (tcc_open(s1, buf) >= 0)
- break;
- }
-
- if (test) {
- tcc_close();
- } else {
- if (s1->include_stack_ptr >= s1->include_stack + INCLUDE_STACK_SIZE)
- tcc_error("#include recursion too deep");
- /* push previous file on stack */
- *s1->include_stack_ptr++ = file->prev;
- file->include_next_index = i;
-#ifdef INC_DEBUG
- printf("%s: including %s\n", file->prev->filename, file->filename);
-#endif
- /* update target deps */
- if (s1->gen_deps) {
- BufferedFile *bf = file;
- while (i == 1 && (bf = bf->prev))
- i = bf->include_next_index;
- /* skip system include files */
- if (s1->include_sys_deps || i - 2 < s1->nb_include_paths)
- dynarray_add(&s1->target_deps, &s1->nb_target_deps,
- tcc_strdup(buf));
- }
- /* add include file debug info */
- tcc_debug_bincl(s1);
- tok_flags |= TOK_FLAG_BOF | TOK_FLAG_BOL;
- }
- return 1;
-}
-
-/* eval an expression for #if/#elif */
-static int expr_preprocess(TCCState *s1)
-{
- int c, t;
- TokenString *str;
-
- str = tok_str_alloc();
- pp_expr = 1;
- while (tok != TOK_LINEFEED && tok != TOK_EOF) {
- next(); /* do macro subst */
- redo:
- if (tok == TOK_DEFINED) {
- next_nomacro();
- t = tok;
- if (t == '(')
- next_nomacro();
- if (tok < TOK_IDENT)
- expect("identifier");
- if (s1->run_test)
- maybe_run_test(s1);
- c = 0;
- if (define_find(tok)
- || tok == TOK___HAS_INCLUDE
- || tok == TOK___HAS_INCLUDE_NEXT)
- c = 1;
- if (t == '(') {
- next_nomacro();
- if (tok != ')')
- expect("')'");
- }
- tok = TOK_CINT;
- tokc.i = c;
- } else if (tok == TOK___HAS_INCLUDE ||
- tok == TOK___HAS_INCLUDE_NEXT) {
- t = tok;
- next_nomacro();
- if (tok != '(')
- expect("(");
- c = parse_include(s1, t - TOK___HAS_INCLUDE, 1);
- if (tok != ')')
- expect("')'");
- tok = TOK_CINT;
- tokc.i = c;
- } else if (tok >= TOK_IDENT) {
- /* if undefined macro, replace with zero, check for func-like */
- t = tok;
- tok = TOK_CINT;
- tokc.i = 0;
- tok_str_add_tok(str);
- next();
- if (tok == '(')
- tcc_error("function-like macro '%s' is not defined",
- get_tok_str(t, NULL));
- goto redo;
- }
- tok_str_add_tok(str);
- }
- pp_expr = 0;
- tok_str_add(str, -1); /* simulate end of file */
- tok_str_add(str, 0);
- /* now evaluate C constant expression */
- begin_macro(str, 1);
- next();
- c = expr_const();
- end_macro();
- return c != 0;
-}
-
-
-/* parse after #define */
-ST_FUNC void parse_define(void)
-{
- Sym *s, *first, **ps;
- int v, t, varg, is_vaargs, spc;
- int saved_parse_flags = parse_flags;
-
- v = tok;
- if (v < TOK_IDENT || v == TOK_DEFINED)
- tcc_error("invalid macro name '%s'", get_tok_str(tok, &tokc));
- /* XXX: should check if same macro (ANSI) */
- first = NULL;
- t = MACRO_OBJ;
- /* We have to parse the whole define as if not in asm mode, in particular
- no line comment with '#' must be ignored. Also for function
- macros the argument list must be parsed without '.' being an ID
- character. */
- parse_flags = ((parse_flags & ~PARSE_FLAG_ASM_FILE) | PARSE_FLAG_SPACES);
- /* '(' must be just after macro definition for MACRO_FUNC */
- next_nomacro();
- parse_flags &= ~PARSE_FLAG_SPACES;
- if (tok == '(') {
- int dotid = set_idnum('.', 0);
- next_nomacro();
- ps = &first;
- if (tok != ')') for (;;) {
- varg = tok;
- next_nomacro();
- is_vaargs = 0;
- if (varg == TOK_DOTS) {
- varg = TOK___VA_ARGS__;
- is_vaargs = 1;
- } else if (tok == TOK_DOTS && gnu_ext) {
- is_vaargs = 1;
- next_nomacro();
- }
- if (varg < TOK_IDENT)
- bad_list:
- tcc_error("bad macro parameter list");
- s = sym_push2(&define_stack, varg | SYM_FIELD, is_vaargs, 0);
- *ps = s;
- ps = &s->next;
- if (tok == ')')
- break;
- if (tok != ',' || is_vaargs)
- goto bad_list;
- next_nomacro();
- }
- parse_flags |= PARSE_FLAG_SPACES;
- next_nomacro();
- t = MACRO_FUNC;
- set_idnum('.', dotid);
- }
-
- tokstr_buf.len = 0;
- spc = 2;
- parse_flags |= PARSE_FLAG_ACCEPT_STRAYS | PARSE_FLAG_SPACES | PARSE_FLAG_LINEFEED;
- /* The body of a macro definition should be parsed such that identifiers
- are parsed like the file mode determines (i.e. with '.' being an
- ID character in asm mode). But '#' should be retained instead of
- regarded as line comment leader, so still don't set ASM_FILE
- in parse_flags. */
- while (tok != TOK_LINEFEED && tok != TOK_EOF) {
- /* remove spaces around ## and after '#' */
- if (TOK_TWOSHARPS == tok) {
- if (2 == spc)
- goto bad_twosharp;
- if (1 == spc)
- --tokstr_buf.len;
- spc = 3;
- tok = TOK_PPJOIN;
- } else if ('#' == tok) {
- spc = 4;
- } else if (check_space(tok, &spc)) {
- goto skip;
- }
- tok_str_add2(&tokstr_buf, tok, &tokc);
- skip:
- next_nomacro();
- }
-
- parse_flags = saved_parse_flags;
- if (spc == 1)
- --tokstr_buf.len; /* remove trailing space */
- tok_str_add(&tokstr_buf, 0);
- if (3 == spc)
-bad_twosharp:
- tcc_error("'##' cannot appear at either end of macro");
- define_push(v, t, tok_str_dup(&tokstr_buf), first);
-}
-
-#ifdef _WIN32
-static unsigned long long calc_file_hash(const char *filename)
-{
- unsigned long long hash = 14695981039346656037ull; // FNV_offset_basis;
- int fd = open (filename, O_RDONLY | O_BINARY);
-
- if (fd < 0)
- return 0;
- for (;;) {
- unsigned char temp[IO_BUF_SIZE];
- int i, n = read(fd, temp, sizeof(temp));
-
- if (n <= 0)
- break;
- for (i = 0; i < n; i++)
- hash = hash * 1099511628211ull ^ temp[i]; // FNV_prime
- }
- close(fd);
- return hash ? hash : 1ull;
-}
-#endif
-
-static CachedInclude *search_cached_include(TCCState *s1, const char *filename, int add)
-{
- unsigned int h = 0;
- CachedInclude *e;
- int i;
- struct stat st;
-#ifdef _WIN32
- unsigned long long hash = 0;
-#endif
-
- /* This is needed for #pragmae once
- * We cannot use stat on windows because st_ino is not set correctly
- * so we calculate a hash of file contents.
- * This also works for hard/soft links as in gcc/clang.
- */
- memset (&st, 0, sizeof(st));
- if (stat (filename, &st))
- goto skip;
- h = st.st_size & (CACHED_INCLUDES_HASH_SIZE - 1);
-#ifdef _WIN32
- /* Only calculate file hash if file size same. */
- i = s1->cached_includes_hash[h];
- for(;;) {
- if (i == 0)
- break;
- e = s1->cached_includes[i - 1];
- if (e->st.st_size == st.st_size) {
- if (0 == PATHCMP(e->filename, filename)) {
- hash = e->hash;
- break;
- }
- if (e->hash == 0)
- e->hash = calc_file_hash(e->filename);
- if (hash == 0)
- hash = calc_file_hash(filename);
- }
- i = e->hash_next;
- }
-#endif
-
- i = s1->cached_includes_hash[h];
- for(;;) {
- if (i == 0)
- break;
- e = s1->cached_includes[i - 1];
-#ifdef _WIN32
- if (e->st.st_size == st.st_size && e->hash == hash)
-#else
- if (st.st_dev == e->st.st_dev && st.st_ino == e->st.st_ino)
-#endif
- return e;
- i = e->hash_next;
- }
-skip:
- if (!add)
- return NULL;
-
- e = tcc_malloc(sizeof(CachedInclude) + strlen(filename));
- e->st = st;
-#ifdef _WIN32
- e->hash = hash;
-#endif
- strcpy(e->filename, filename);
- e->ifndef_macro = e->once = 0;
- dynarray_add(&s1->cached_includes, &s1->nb_cached_includes, e);
- /* add in hash table */
- e->hash_next = s1->cached_includes_hash[h];
- s1->cached_includes_hash[h] = s1->nb_cached_includes;
-#ifdef INC_DEBUG
- printf("adding cached '%s'\n", filename);
-#endif
- return e;
-}
-
-static void pragma_parse(TCCState *s1)
-{
- next_nomacro();
- if (tok == TOK_push_macro || tok == TOK_pop_macro) {
- int t = tok, v;
- Sym *s;
-
- if (next(), tok != '(')
- goto pragma_err;
- if (next(), tok != TOK_STR)
- goto pragma_err;
- v = tok_alloc(tokc.str.data, tokc.str.size - 1)->tok;
- if (next(), tok != ')')
- goto pragma_err;
- if (t == TOK_push_macro) {
- while (NULL == (s = define_find(v)))
- define_push(v, 0, NULL, NULL);
- s->type.ref = s; /* set push boundary */
- } else {
- for (s = define_stack; s; s = s->prev)
- if (s->v == v && s->type.ref == s) {
- s->type.ref = NULL;
- break;
- }
- }
- if (s)
- table_ident[v - TOK_IDENT]->sym_define = s->d ? s : NULL;
- else
- tcc_warning("unbalanced #pragma pop_macro");
- pp_debug_tok = t, pp_debug_symv = v;
-
- } else if (tok == TOK_once) {
- search_cached_include(s1, file->filename, 1)->once = pp_once;
-
- } else if (s1->output_type == TCC_OUTPUT_PREPROCESS) {
- /* tcc -E: keep pragmas below unchanged */
- unget_tok(' ');
- unget_tok(TOK_PRAGMA);
- unget_tok('#');
- unget_tok(TOK_LINEFEED);
-
- } else if (tok == TOK_pack) {
- /* This may be:
- #pragma pack(1) // set
- #pragma pack() // reset to default
- #pragma pack(push) // push current
- #pragma pack(push,1) // push & set
- #pragma pack(pop) // restore previous */
- next();
- skip('(');
- if (tok == TOK_ASM_pop) {
- next();
- if (s1->pack_stack_ptr <= s1->pack_stack) {
- stk_error:
- tcc_error("out of pack stack");
- }
- s1->pack_stack_ptr--;
- } else {
- int val = 0;
- if (tok != ')') {
- if (tok == TOK_ASM_push) {
- next();
- if (s1->pack_stack_ptr >= s1->pack_stack + PACK_STACK_SIZE - 1)
- goto stk_error;
- val = *s1->pack_stack_ptr++;
- if (tok != ',')
- goto pack_set;
- next();
- }
- if (tok != TOK_CINT)
- goto pragma_err;
- val = tokc.i;
- if (val < 1 || val > 16 || (val & (val - 1)) != 0)
- goto pragma_err;
- next();
- }
- pack_set:
- *s1->pack_stack_ptr = val;
- }
- if (tok != ')')
- goto pragma_err;
-
- } else if (tok == TOK_comment) {
- char *p; int t;
- next();
- skip('(');
- t = tok;
- next();
- skip(',');
- if (tok != TOK_STR)
- goto pragma_err;
- p = tcc_strdup((char *)tokc.str.data);
- next();
- if (tok != ')')
- goto pragma_err;
- if (t == TOK_lib) {
- dynarray_add(&s1->pragma_libs, &s1->nb_pragma_libs, p);
- } else {
- if (t == TOK_option)
- tcc_set_options(s1, p);
- tcc_free(p);
- }
-
- } else
- tcc_warning_c(warn_unsupported)("#pragma %s ignored", get_tok_str(tok, &tokc));
- return;
-
-pragma_err:
- tcc_error("malformed #pragma directive");
- return;
-}
-
-/* is_bof is true if first non space token at beginning of file */
-ST_FUNC void preprocess(int is_bof)
-{
- TCCState *s1 = tcc_state;
- int c, n, saved_parse_flags;
- char buf[1024], *q;
- Sym *s;
-
- saved_parse_flags = parse_flags;
- parse_flags = PARSE_FLAG_PREPROCESS
- | PARSE_FLAG_TOK_NUM
- | PARSE_FLAG_TOK_STR
- | PARSE_FLAG_LINEFEED
- | (parse_flags & PARSE_FLAG_ASM_FILE)
- ;
-
- next_nomacro();
- redo:
- switch(tok) {
- case TOK_DEFINE:
- pp_debug_tok = tok;
- next_nomacro();
- pp_debug_symv = tok;
- parse_define();
- break;
- case TOK_UNDEF:
- pp_debug_tok = tok;
- next_nomacro();
- pp_debug_symv = tok;
- s = define_find(tok);
- /* undefine symbol by putting an invalid name */
- if (s)
- define_undef(s);
- break;
- case TOK_INCLUDE:
- case TOK_INCLUDE_NEXT:
- parse_include(s1, tok - TOK_INCLUDE, 0);
- break;
- case TOK_IFNDEF:
- c = 1;
- goto do_ifdef;
- case TOK_IF:
- c = expr_preprocess(s1);
- goto do_if;
- case TOK_IFDEF:
- c = 0;
- do_ifdef:
- next_nomacro();
- if (tok < TOK_IDENT)
- tcc_error("invalid argument for '#if%sdef'", c ? "n" : "");
- if (is_bof) {
- if (c) {
-#ifdef INC_DEBUG
- printf("#ifndef %s\n", get_tok_str(tok, NULL));
-#endif
- file->ifndef_macro = tok;
- }
- }
- if (define_find(tok)
- || tok == TOK___HAS_INCLUDE
- || tok == TOK___HAS_INCLUDE_NEXT)
- c ^= 1;
- do_if:
- if (s1->ifdef_stack_ptr >= s1->ifdef_stack + IFDEF_STACK_SIZE)
- tcc_error("memory full (ifdef)");
- *s1->ifdef_stack_ptr++ = c;
- goto test_skip;
- case TOK_ELSE:
- if (s1->ifdef_stack_ptr == s1->ifdef_stack)
- tcc_error("#else without matching #if");
- if (s1->ifdef_stack_ptr[-1] & 2)
- tcc_error("#else after #else");
- c = (s1->ifdef_stack_ptr[-1] ^= 3);
- goto test_else;
- case TOK_ELIF:
- if (s1->ifdef_stack_ptr == s1->ifdef_stack)
- tcc_error("#elif without matching #if");
- c = s1->ifdef_stack_ptr[-1];
- if (c > 1)
- tcc_error("#elif after #else");
- /* last #if/#elif expression was true: we skip */
- if (c == 1) {
- c = 0;
- } else {
- c = expr_preprocess(s1);
- s1->ifdef_stack_ptr[-1] = c;
- }
- test_else:
- if (s1->ifdef_stack_ptr == file->ifdef_stack_ptr + 1)
- file->ifndef_macro = 0;
- test_skip:
- if (!(c & 1)) {
- preprocess_skip();
- is_bof = 0;
- goto redo;
- }
- break;
- case TOK_ENDIF:
- if (s1->ifdef_stack_ptr <= file->ifdef_stack_ptr)
- tcc_error("#endif without matching #if");
- s1->ifdef_stack_ptr--;
- /* '#ifndef macro' was at the start of file. Now we check if
- an '#endif' is exactly at the end of file */
- if (file->ifndef_macro &&
- s1->ifdef_stack_ptr == file->ifdef_stack_ptr) {
- file->ifndef_macro_saved = file->ifndef_macro;
- /* need to set to zero to avoid false matches if another
- #ifndef at middle of file */
- file->ifndef_macro = 0;
- while (tok != TOK_LINEFEED)
- next_nomacro();
- tok_flags |= TOK_FLAG_ENDIF;
- goto the_end;
- }
- break;
- case TOK_PPNUM:
- n = strtoul((char*)tokc.str.data, &q, 10);
- goto _line_num;
- case TOK_LINE:
- next();
- if (tok != TOK_CINT)
- _line_err:
- tcc_error("wrong #line format");
- n = tokc.i;
- _line_num:
- next();
- if (tok != TOK_LINEFEED) {
- if (tok == TOK_STR) {
- if (file->true_filename == file->filename)
- file->true_filename = tcc_strdup(file->filename);
- q = (char *)tokc.str.data;
- buf[0] = 0;
- if (!IS_ABSPATH(q)) {
- /* prepend directory from real file */
- pstrcpy(buf, sizeof buf, file->true_filename);
- *tcc_basename(buf) = 0;
- }
- pstrcat(buf, sizeof buf, q);
- tcc_debug_putfile(s1, buf);
- } else if (parse_flags & PARSE_FLAG_ASM_FILE)
- break;
- else
- goto _line_err;
- --n;
- }
- if (file->fd > 0)
- total_lines += file->line_num - n;
- file->line_num = n;
- break;
- case TOK_ERROR:
- case TOK_WARNING:
- q = buf;
- c = skip_spaces();
- while (c != '\n' && c != CH_EOF) {
- if ((q - buf) < sizeof(buf) - 1)
- *q++ = c;
- c = ninp();
- }
- *q = '\0';
- if (tok == TOK_ERROR)
- tcc_error("#error %s", buf);
- else
- tcc_warning("#warning %s", buf);
- break;
- case TOK_PRAGMA:
- pragma_parse(s1);
- break;
- case TOK_LINEFEED:
- goto the_end;
- default:
- /* ignore gas line comment in an 'S' file. */
- if (saved_parse_flags & PARSE_FLAG_ASM_FILE)
- goto ignore;
- if (tok == '!' && is_bof)
- /* '!' is ignored at beginning to allow C scripts. */
- goto ignore;
- tcc_warning("Ignoring unknown preprocessing directive #%s", get_tok_str(tok, &tokc));
- ignore:
- file->buf_ptr = parse_line_comment(file->buf_ptr - 1);
- goto the_end;
- }
- /* ignore other preprocess commands or #! for C scripts */
- while (tok != TOK_LINEFEED)
- next_nomacro();
- the_end:
- parse_flags = saved_parse_flags;
-}
-
-/* evaluate escape codes in a string. */
-static void parse_escape_string(CString *outstr, const uint8_t *buf, int is_long)
-{
- int c, n, i;
- const uint8_t *p;
-
- p = buf;
- for(;;) {
- c = *p;
- if (c == '\0')
- break;
- if (c == '\\') {
- p++;
- /* escape */
- c = *p;
- switch(c) {
- case '0': case '1': case '2': case '3':
- case '4': case '5': case '6': case '7':
- /* at most three octal digits */
- n = c - '0';
- p++;
- c = *p;
- if (isoct(c)) {
- n = n * 8 + c - '0';
- p++;
- c = *p;
- if (isoct(c)) {
- n = n * 8 + c - '0';
- p++;
- }
- }
- c = n;
- goto add_char_nonext;
- case 'x': i = 0; goto parse_hex_or_ucn;
- case 'u': i = 4; goto parse_hex_or_ucn;
- case 'U': i = 8; goto parse_hex_or_ucn;
- parse_hex_or_ucn:
- p++;
- n = 0;
- do {
- c = *p;
- if (c >= 'a' && c <= 'f')
- c = c - 'a' + 10;
- else if (c >= 'A' && c <= 'F')
- c = c - 'A' + 10;
- else if (isnum(c))
- c = c - '0';
- else if (i > 0)
- expect("more hex digits in universal-character-name");
- else
- goto add_hex_or_ucn;
- n = n * 16 + c;
- p++;
- } while (--i);
- if (is_long) {
- add_hex_or_ucn:
- c = n;
- goto add_char_nonext;
- }
- cstr_u8cat(outstr, n);
- continue;
- case 'a':
- c = '\a';
- break;
- case 'b':
- c = '\b';
- break;
- case 'f':
- c = '\f';
- break;
- case 'n':
- c = '\n';
- break;
- case 'r':
- c = '\r';
- break;
- case 't':
- c = '\t';
- break;
- case 'v':
- c = '\v';
- break;
- case 'e':
- if (!gnu_ext)
- goto invalid_escape;
- c = 27;
- break;
- case '\'':
- case '\"':
- case '\\':
- case '?':
- break;
- default:
- invalid_escape:
- if (c >= '!' && c <= '~')
- tcc_warning("unknown escape sequence: \'\\%c\'", c);
- else
- tcc_warning("unknown escape sequence: \'\\x%x\'", c);
- break;
- }
- } else if (is_long && c >= 0x80) {
- /* assume we are processing UTF-8 sequence */
- /* reference: The Unicode Standard, Version 10.0, ch3.9 */
-
- int cont; /* count of continuation bytes */
- int skip; /* how many bytes should skip when error occurred */
- int i;
-
- /* decode leading byte */
- if (c < 0xC2) {
- skip = 1; goto invalid_utf8_sequence;
- } else if (c <= 0xDF) {
- cont = 1; n = c & 0x1f;
- } else if (c <= 0xEF) {
- cont = 2; n = c & 0xf;
- } else if (c <= 0xF4) {
- cont = 3; n = c & 0x7;
- } else {
- skip = 1; goto invalid_utf8_sequence;
- }
-
- /* decode continuation bytes */
- for (i = 1; i <= cont; i++) {
- int l = 0x80, h = 0xBF;
-
- /* adjust limit for second byte */
- if (i == 1) {
- switch (c) {
- case 0xE0: l = 0xA0; break;
- case 0xED: h = 0x9F; break;
- case 0xF0: l = 0x90; break;
- case 0xF4: h = 0x8F; break;
- }
- }
-
- if (p[i] < l || p[i] > h) {
- skip = i; goto invalid_utf8_sequence;
- }
-
- n = (n << 6) | (p[i] & 0x3f);
- }
-
- /* advance pointer */
- p += 1 + cont;
- c = n;
- goto add_char_nonext;
-
- /* error handling */
- invalid_utf8_sequence:
- tcc_warning("ill-formed UTF-8 subsequence starting with: \'\\x%x\'", c);
- c = 0xFFFD;
- p += skip;
- goto add_char_nonext;
-
- }
- p++;
- add_char_nonext:
- if (!is_long)
- cstr_ccat(outstr, c);
- else {
-#ifdef TCC_TARGET_PE
- /* store as UTF-16 */
- if (c < 0x10000) {
- cstr_wccat(outstr, c);
- } else {
- c -= 0x10000;
- cstr_wccat(outstr, (c >> 10) + 0xD800);
- cstr_wccat(outstr, (c & 0x3FF) + 0xDC00);
- }
-#else
- cstr_wccat(outstr, c);
-#endif
- }
- }
- /* add a trailing '\0' */
- if (!is_long)
- cstr_ccat(outstr, '\0');
- else
- cstr_wccat(outstr, '\0');
-}
-
-static void parse_string(const char *s, int len)
-{
- uint8_t buf[1000], *p = buf;
- int is_long, sep;
-
- if ((is_long = *s == 'L'))
- ++s, --len;
- sep = *s++;
- len -= 2;
- if (len >= sizeof buf)
- p = tcc_malloc(len + 1);
- memcpy(p, s, len);
- p[len] = 0;
-
- cstr_reset(&tokcstr);
- parse_escape_string(&tokcstr, p, is_long);
- if (p != buf)
- tcc_free(p);
-
- if (sep == '\'') {
- int char_size, i, n, c;
- /* XXX: make it portable */
- if (!is_long)
- tok = TOK_CCHAR, char_size = 1;
- else
- tok = TOK_LCHAR, char_size = sizeof(nwchar_t);
- n = tokcstr.size / char_size - 1;
- if (n < 1)
- tcc_error("empty character constant");
- if (n > 1)
- tcc_warning_c(warn_all)("multi-character character constant");
- for (c = i = 0; i < n; ++i) {
- if (is_long)
- c = ((nwchar_t *)tokcstr.data)[i];
- else
- c = (c << 8) | ((char *)tokcstr.data)[i];
- }
- tokc.i = c;
- } else {
- tokc.str.size = tokcstr.size;
- tokc.str.data = tokcstr.data;
- if (!is_long)
- tok = TOK_STR;
- else
- tok = TOK_LSTR;
- }
-}
-
-/* we use 64 bit numbers */
-#define BN_SIZE 2
-
-/* bn = (bn << shift) | or_val */
-static void bn_lshift(unsigned int *bn, int shift, int or_val)
-{
- int i;
- unsigned int v;
- for(i=0;i<BN_SIZE;i++) {
- v = bn[i];
- bn[i] = (v << shift) | or_val;
- or_val = v >> (32 - shift);
- }
-}
-
-static void bn_zero(unsigned int *bn)
-{
- int i;
- for(i=0;i<BN_SIZE;i++) {
- bn[i] = 0;
- }
-}
-
-/* parse number in null terminated string 'p' and return it in the
- current token */
-static void parse_number(const char *p)
-{
- int b, t, shift, frac_bits, s, exp_val, ch;
- char *q;
- unsigned int bn[BN_SIZE];
- double d;
-
- /* number */
- q = token_buf;
- ch = *p++;
- t = ch;
- ch = *p++;
- *q++ = t;
- b = 10;
- if (t == '.') {
- goto float_frac_parse;
- } else if (t == '0') {
- if (ch == 'x' || ch == 'X') {
- q--;
- ch = *p++;
- b = 16;
- } else if (tcc_state->tcc_ext && (ch == 'b' || ch == 'B')) {
- q--;
- ch = *p++;
- b = 2;
- }
- }
- /* parse all digits. cannot check octal numbers at this stage
- because of floating point constants */
- while (1) {
- if (ch >= 'a' && ch <= 'f')
- t = ch - 'a' + 10;
- else if (ch >= 'A' && ch <= 'F')
- t = ch - 'A' + 10;
- else if (isnum(ch))
- t = ch - '0';
- else
- break;
- if (t >= b)
- break;
- if (q >= token_buf + STRING_MAX_SIZE) {
- num_too_long:
- tcc_error("number too long");
- }
- *q++ = ch;
- ch = *p++;
- }
- if (ch == '.' ||
- ((ch == 'e' || ch == 'E') && b == 10) ||
- ((ch == 'p' || ch == 'P') && (b == 16 || b == 2))) {
- if (b != 10) {
- /* NOTE: strtox should support that for hexa numbers, but
- non ISOC99 libcs do not support it, so we prefer to do
- it by hand */
- /* hexadecimal or binary floats */
- /* XXX: handle overflows */
- *q = '\0';
- if (b == 16)
- shift = 4;
- else
- shift = 1;
- bn_zero(bn);
- q = token_buf;
- while (1) {
- t = *q++;
- if (t == '\0') {
- break;
- } else if (t >= 'a') {
- t = t - 'a' + 10;
- } else if (t >= 'A') {
- t = t - 'A' + 10;
- } else {
- t = t - '0';
- }
- bn_lshift(bn, shift, t);
- }
- frac_bits = 0;
- if (ch == '.') {
- ch = *p++;
- while (1) {
- t = ch;
- if (t >= 'a' && t <= 'f') {
- t = t - 'a' + 10;
- } else if (t >= 'A' && t <= 'F') {
- t = t - 'A' + 10;
- } else if (t >= '0' && t <= '9') {
- t = t - '0';
- } else {
- break;
- }
- if (t >= b)
- tcc_error("invalid digit");
- bn_lshift(bn, shift, t);
- frac_bits += shift;
- ch = *p++;
- }
- }
- if (ch != 'p' && ch != 'P')
- expect("exponent");
- ch = *p++;
- s = 1;
- exp_val = 0;
- if (ch == '+') {
- ch = *p++;
- } else if (ch == '-') {
- s = -1;
- ch = *p++;
- }
- if (ch < '0' || ch > '9')
- expect("exponent digits");
- while (ch >= '0' && ch <= '9') {
- exp_val = exp_val * 10 + ch - '0';
- ch = *p++;
- }
- exp_val = exp_val * s;
-
- /* now we can generate the number */
- /* XXX: should patch directly float number */
- d = (double)bn[1] * 4294967296.0 + (double)bn[0];
- d = ldexp(d, exp_val - frac_bits);
- t = toup(ch);
- if (t == 'F') {
- ch = *p++;
- tok = TOK_CFLOAT;
- /* float : should handle overflow */
- tokc.f = (float)d;
- } else if (t == 'L') {
- ch = *p++;
- tok = TOK_CLDOUBLE;
-#ifdef TCC_USING_DOUBLE_FOR_LDOUBLE
- tokc.d = d;
-#else
- /* XXX: not large enough */
- tokc.ld = (long double)d;
-#endif
- } else {
- tok = TOK_CDOUBLE;
- tokc.d = d;
- }
- } else {
- /* decimal floats */
- if (ch == '.') {
- if (q >= token_buf + STRING_MAX_SIZE)
- goto num_too_long;
- *q++ = ch;
- ch = *p++;
- float_frac_parse:
- while (ch >= '0' && ch <= '9') {
- if (q >= token_buf + STRING_MAX_SIZE)
- goto num_too_long;
- *q++ = ch;
- ch = *p++;
- }
- }
- if (ch == 'e' || ch == 'E') {
- if (q >= token_buf + STRING_MAX_SIZE)
- goto num_too_long;
- *q++ = ch;
- ch = *p++;
- if (ch == '-' || ch == '+') {
- if (q >= token_buf + STRING_MAX_SIZE)
- goto num_too_long;
- *q++ = ch;
- ch = *p++;
- }
- if (ch < '0' || ch > '9')
- expect("exponent digits");
- while (ch >= '0' && ch <= '9') {
- if (q >= token_buf + STRING_MAX_SIZE)
- goto num_too_long;
- *q++ = ch;
- ch = *p++;
- }
- }
- *q = '\0';
- t = toup(ch);
- errno = 0;
- if (t == 'F') {
- ch = *p++;
- tok = TOK_CFLOAT;
- tokc.f = strtof(token_buf, NULL);
- } else if (t == 'L') {
- ch = *p++;
- tok = TOK_CLDOUBLE;
-#ifdef TCC_USING_DOUBLE_FOR_LDOUBLE
- tokc.d = strtod(token_buf, NULL);
-#else
- tokc.ld = strtold(token_buf, NULL);
-#endif
- } else {
- tok = TOK_CDOUBLE;
- tokc.d = strtod(token_buf, NULL);
- }
- }
- } else {
- unsigned long long n, n1;
- int lcount, ucount, ov = 0;
- const char *p1;
-
- /* integer number */
- *q = '\0';
- q = token_buf;
- if (b == 10 && *q == '0') {
- b = 8;
- q++;
- }
- n = 0;
- while(1) {
- t = *q++;
- /* no need for checks except for base 10 / 8 errors */
- if (t == '\0')
- break;
- else if (t >= 'a')
- t = t - 'a' + 10;
- else if (t >= 'A')
- t = t - 'A' + 10;
- else
- t = t - '0';
- if (t >= b)
- tcc_error("invalid digit");
- n1 = n;
- n = n * b + t;
- /* detect overflow */
- if (n1 >= 0x1000000000000000ULL && n / b != n1)
- ov = 1;
- }
-
- /* Determine the characteristics (unsigned and/or 64bit) the type of
- the constant must have according to the constant suffix(es) */
- lcount = ucount = 0;
- p1 = p;
- for(;;) {
- t = toup(ch);
- if (t == 'L') {
- if (lcount >= 2)
- tcc_error("three 'l's in integer constant");
- if (lcount && *(p - 1) != ch)
- tcc_error("incorrect integer suffix: %s", p1);
- lcount++;
- ch = *p++;
- } else if (t == 'U') {
- if (ucount >= 1)
- tcc_error("two 'u's in integer constant");
- ucount++;
- ch = *p++;
- } else {
- break;
- }
- }
-
- /* Determine if it needs 64 bits and/or unsigned in order to fit */
- if (ucount == 0 && b == 10) {
- if (lcount <= (LONG_SIZE == 4)) {
- if (n >= 0x80000000U)
- lcount = (LONG_SIZE == 4) + 1;
- }
- if (n >= 0x8000000000000000ULL)
- ov = 1, ucount = 1;
- } else {
- if (lcount <= (LONG_SIZE == 4)) {
- if (n >= 0x100000000ULL)
- lcount = (LONG_SIZE == 4) + 1;
- else if (n >= 0x80000000U)
- ucount = 1;
- }
- if (n >= 0x8000000000000000ULL)
- ucount = 1;
- }
-
- if (ov)
- tcc_warning("integer constant overflow");
-
- tok = TOK_CINT;
- if (lcount) {
- tok = TOK_CLONG;
- if (lcount == 2)
- tok = TOK_CLLONG;
- }
- if (ucount)
- ++tok; /* TOK_CU... */
- tokc.i = n;
- }
- if (ch)
- tcc_error("invalid number");
-}
-
-
-#define PARSE2(c1, tok1, c2, tok2) \
- case c1: \
- PEEKC(c, p); \
- if (c == c2) { \
- p++; \
- tok = tok2; \
- } else { \
- tok = tok1; \
- } \
- break;
-
-/* return next token without macro substitution */
-static inline void next_nomacro1(void)
-{
- int t, c, is_long, len;
- TokenSym *ts;
- uint8_t *p, *p1;
- unsigned int h;
-
- p = file->buf_ptr;
- redo_no_start:
- c = *p;
- switch(c) {
- case ' ':
- case '\t':
- tok = c;
- p++;
- maybe_space:
- if (parse_flags & PARSE_FLAG_SPACES)
- goto keep_tok_flags;
- while (isidnum_table[*p - CH_EOF] & IS_SPC)
- ++p;
- goto redo_no_start;
- case '\f':
- case '\v':
- case '\r':
- p++;
- goto redo_no_start;
- case '\\':
- /* first look if it is in fact an end of buffer */
- c = handle_stray(&p);
- if (c == '\\')
- goto parse_simple;
- if (c == CH_EOF) {
- TCCState *s1 = tcc_state;
- if ((parse_flags & PARSE_FLAG_LINEFEED)
- && !(tok_flags & TOK_FLAG_EOF)) {
- tok_flags |= TOK_FLAG_EOF;
- tok = TOK_LINEFEED;
- goto keep_tok_flags;
- } else if (!(parse_flags & PARSE_FLAG_PREPROCESS)) {
- tok = TOK_EOF;
- } else if (s1->ifdef_stack_ptr != file->ifdef_stack_ptr) {
- tcc_error("missing #endif");
- } else if (s1->include_stack_ptr == s1->include_stack) {
- /* no include left : end of file. */
- tok = TOK_EOF;
- } else {
- tok_flags &= ~TOK_FLAG_EOF;
- /* pop include file */
-
- /* test if previous '#endif' was after a #ifdef at
- start of file */
- if (tok_flags & TOK_FLAG_ENDIF) {
-#ifdef INC_DEBUG
- printf("#endif %s\n", get_tok_str(file->ifndef_macro_saved, NULL));
-#endif
- search_cached_include(s1, file->filename, 1)
- ->ifndef_macro = file->ifndef_macro_saved;
- tok_flags &= ~TOK_FLAG_ENDIF;
- }
-
- /* add end of include file debug info */
- tcc_debug_eincl(tcc_state);
- /* pop include stack */
- tcc_close();
- s1->include_stack_ptr--;
- p = file->buf_ptr;
- if (p == file->buffer)
- tok_flags = TOK_FLAG_BOF;
- tok_flags |= TOK_FLAG_BOL;
- goto redo_no_start;
- }
- } else {
- goto redo_no_start;
- }
- break;
-
- case '\n':
- file->line_num++;
- tok_flags |= TOK_FLAG_BOL;
- p++;
-maybe_newline:
- if (0 == (parse_flags & PARSE_FLAG_LINEFEED))
- goto redo_no_start;
- tok = TOK_LINEFEED;
- goto keep_tok_flags;
-
- case '#':
- /* XXX: simplify */
- PEEKC(c, p);
- if ((tok_flags & TOK_FLAG_BOL) &&
- (parse_flags & PARSE_FLAG_PREPROCESS)) {
- file->buf_ptr = p;
- preprocess(tok_flags & TOK_FLAG_BOF);
- p = file->buf_ptr;
- goto maybe_newline;
- } else {
- if (c == '#') {
- p++;
- tok = TOK_TWOSHARPS;
- } else {
-#if !defined(TCC_TARGET_ARM)
- if (parse_flags & PARSE_FLAG_ASM_FILE) {
- p = parse_line_comment(p - 1);
- goto redo_no_start;
- } else
-#endif
- {
- tok = '#';
- }
- }
- }
- break;
-
- /* dollar is allowed to start identifiers when not parsing asm */
- case '$':
- if (!(isidnum_table[c - CH_EOF] & IS_ID)
- || (parse_flags & PARSE_FLAG_ASM_FILE))
- goto parse_simple;
-
- case 'a': case 'b': case 'c': case 'd':
- case 'e': case 'f': case 'g': case 'h':
- case 'i': case 'j': case 'k': case 'l':
- case 'm': case 'n': case 'o': case 'p':
- case 'q': case 'r': case 's': case 't':
- case 'u': case 'v': case 'w': case 'x':
- case 'y': case 'z':
- case 'A': case 'B': case 'C': case 'D':
- case 'E': case 'F': case 'G': case 'H':
- case 'I': case 'J': case 'K':
- case 'M': case 'N': case 'O': case 'P':
- case 'Q': case 'R': case 'S': case 'T':
- case 'U': case 'V': case 'W': case 'X':
- case 'Y': case 'Z':
- case '_':
- parse_ident_fast:
- p1 = p;
- h = TOK_HASH_INIT;
- h = TOK_HASH_FUNC(h, c);
- while (c = *++p, isidnum_table[c - CH_EOF] & (IS_ID|IS_NUM))
- h = TOK_HASH_FUNC(h, c);
- len = p - p1;
- if (c != '\\') {
- TokenSym **pts;
-
- /* fast case : no stray found, so we have the full token
- and we have already hashed it */
- h &= (TOK_HASH_SIZE - 1);
- pts = &hash_ident[h];
- for(;;) {
- ts = *pts;
- if (!ts)
- break;
- if (ts->len == len && !memcmp(ts->str, p1, len))
- goto token_found;
- pts = &(ts->hash_next);
- }
- ts = tok_alloc_new(pts, (char *) p1, len);
- token_found: ;
- } else {
- /* slower case */
- cstr_reset(&tokcstr);
- cstr_cat(&tokcstr, (char *) p1, len);
- p--;
- PEEKC(c, p);
- parse_ident_slow:
- while (isidnum_table[c - CH_EOF] & (IS_ID|IS_NUM))
- {
- cstr_ccat(&tokcstr, c);
- PEEKC(c, p);
- }
- ts = tok_alloc(tokcstr.data, tokcstr.size);
- }
- tok = ts->tok;
- break;
- case 'L':
- t = p[1];
- if (t != '\\' && t != '\'' && t != '\"') {
- /* fast case */
- goto parse_ident_fast;
- } else {
- PEEKC(c, p);
- if (c == '\'' || c == '\"') {
- is_long = 1;
- goto str_const;
- } else {
- cstr_reset(&tokcstr);
- cstr_ccat(&tokcstr, 'L');
- goto parse_ident_slow;
- }
- }
- break;
-
- case '0': case '1': case '2': case '3':
- case '4': case '5': case '6': case '7':
- case '8': case '9':
- t = c;
- PEEKC(c, p);
- /* after the first digit, accept digits, alpha, '.' or sign if
- prefixed by 'eEpP' */
- parse_num:
- cstr_reset(&tokcstr);
- for(;;) {
- cstr_ccat(&tokcstr, t);
- if (!((isidnum_table[c - CH_EOF] & (IS_ID|IS_NUM))
- || c == '.'
- || ((c == '+' || c == '-')
- && (((t == 'e' || t == 'E')
- && !(parse_flags & PARSE_FLAG_ASM_FILE
- /* 0xe+1 is 3 tokens in asm */
- && ((char*)tokcstr.data)[0] == '0'
- && toup(((char*)tokcstr.data)[1]) == 'X'))
- || t == 'p' || t == 'P'))))
- break;
- t = c;
- PEEKC(c, p);
- }
- /* We add a trailing '\0' to ease parsing */
- cstr_ccat(&tokcstr, '\0');
- tokc.str.size = tokcstr.size;
- tokc.str.data = tokcstr.data;
- tok = TOK_PPNUM;
- break;
-
- case '.':
- /* special dot handling because it can also start a number */
- PEEKC(c, p);
- if (isnum(c)) {
- t = '.';
- goto parse_num;
- } else if ((isidnum_table['.' - CH_EOF] & IS_ID)
- && (isidnum_table[c - CH_EOF] & (IS_ID|IS_NUM))) {
- *--p = c = '.';
- goto parse_ident_fast;
- } else if (c == '.') {
- PEEKC(c, p);
- if (c == '.') {
- p++;
- tok = TOK_DOTS;
- } else {
- *--p = '.'; /* may underflow into file->unget[] */
- tok = '.';
- }
- } else {
- tok = '.';
- }
- break;
- case '\'':
- case '\"':
- is_long = 0;
- str_const:
- cstr_reset(&tokcstr);
- if (is_long)
- cstr_ccat(&tokcstr, 'L');
- cstr_ccat(&tokcstr, c);
- p = parse_pp_string(p, c, &tokcstr);
- cstr_ccat(&tokcstr, c);
- cstr_ccat(&tokcstr, '\0');
- tokc.str.size = tokcstr.size;
- tokc.str.data = tokcstr.data;
- tok = TOK_PPSTR;
- break;
-
- case '<':
- PEEKC(c, p);
- if (c == '=') {
- p++;
- tok = TOK_LE;
- } else if (c == '<') {
- PEEKC(c, p);
- if (c == '=') {
- p++;
- tok = TOK_A_SHL;
- } else {
- tok = TOK_SHL;
- }
- } else {
- tok = TOK_LT;
- }
- break;
- case '>':
- PEEKC(c, p);
- if (c == '=') {
- p++;
- tok = TOK_GE;
- } else if (c == '>') {
- PEEKC(c, p);
- if (c == '=') {
- p++;
- tok = TOK_A_SAR;
- } else {
- tok = TOK_SAR;
- }
- } else {
- tok = TOK_GT;
- }
- break;
-
- case '&':
- PEEKC(c, p);
- if (c == '&') {
- p++;
- tok = TOK_LAND;
- } else if (c == '=') {
- p++;
- tok = TOK_A_AND;
- } else {
- tok = '&';
- }
- break;
-
- case '|':
- PEEKC(c, p);
- if (c == '|') {
- p++;
- tok = TOK_LOR;
- } else if (c == '=') {
- p++;
- tok = TOK_A_OR;
- } else {
- tok = '|';
- }
- break;
-
- case '+':
- PEEKC(c, p);
- if (c == '+') {
- p++;
- tok = TOK_INC;
- } else if (c == '=') {
- p++;
- tok = TOK_A_ADD;
- } else {
- tok = '+';
- }
- break;
-
- case '-':
- PEEKC(c, p);
- if (c == '-') {
- p++;
- tok = TOK_DEC;
- } else if (c == '=') {
- p++;
- tok = TOK_A_SUB;
- } else if (c == '>') {
- p++;
- tok = TOK_ARROW;
- } else {
- tok = '-';
- }
- break;
-
- PARSE2('!', '!', '=', TOK_NE)
- PARSE2('=', '=', '=', TOK_EQ)
- PARSE2('*', '*', '=', TOK_A_MUL)
- PARSE2('%', '%', '=', TOK_A_MOD)
- PARSE2('^', '^', '=', TOK_A_XOR)
-
- /* comments or operator */
- case '/':
- PEEKC(c, p);
- if (c == '*') {
- p = parse_comment(p);
- /* comments replaced by a blank */
- tok = ' ';
- goto maybe_space;
- } else if (c == '/') {
- p = parse_line_comment(p);
- tok = ' ';
- goto maybe_space;
- } else if (c == '=') {
- p++;
- tok = TOK_A_DIV;
- } else {
- tok = '/';
- }
- break;
-
- /* simple tokens */
- case '(':
- case ')':
- case '[':
- case ']':
- case '{':
- case '}':
- case ',':
- case ';':
- case ':':
- case '?':
- case '~':
- case '@': /* only used in assembler */
- parse_simple:
- tok = c;
- p++;
- break;
- default:
- if (c >= 0x80 && c <= 0xFF) /* utf8 identifiers */
- goto parse_ident_fast;
- if (parse_flags & PARSE_FLAG_ASM_FILE)
- goto parse_simple;
- tcc_error("unrecognized character \\x%02x", c);
- break;
- }
- tok_flags = 0;
-keep_tok_flags:
- file->buf_ptr = p;
-#if defined(PARSE_DEBUG)
- printf("token = %d %s\n", tok, get_tok_str(tok, &tokc));
-#endif
-}
-
-static void macro_subst(
- TokenString *tok_str,
- Sym **nested_list,
- const int *macro_str
- );
-
-/* substitute arguments in replacement lists in macro_str by the values in
- args (field d) and return allocated string */
-static int *macro_arg_subst(Sym **nested_list, const int *macro_str, Sym *args)
-{
- int t, t0, t1, spc;
- const int *st;
- Sym *s;
- CValue cval;
- TokenString str;
-
- tok_str_new(&str);
- t0 = t1 = 0;
- while(1) {
- TOK_GET(&t, &macro_str, &cval);
- if (!t)
- break;
- if (t == '#') {
- /* stringize */
- TOK_GET(&t, &macro_str, &cval);
- if (!t)
- goto bad_stringy;
- s = sym_find2(args, t);
- if (s) {
- cstr_reset(&tokcstr);
- cstr_ccat(&tokcstr, '\"');
- st = s->d;
- spc = 0;
- while (*st >= 0) {
- TOK_GET(&t, &st, &cval);
- if (t != TOK_PLCHLDR
- && t != TOK_NOSUBST
- && 0 == check_space(t, &spc)) {
- const char *s = get_tok_str(t, &cval);
- while (*s) {
- if (t == TOK_PPSTR && *s != '\'')
- add_char(&tokcstr, *s);
- else
- cstr_ccat(&tokcstr, *s);
- ++s;
- }
- }
- }
- tokcstr.size -= spc;
- cstr_ccat(&tokcstr, '\"');
- cstr_ccat(&tokcstr, '\0');
-#ifdef PP_DEBUG
- printf("\nstringize: <%s>\n", (char *)tokcstr.data);
-#endif
- /* add string */
- cval.str.size = tokcstr.size;
- cval.str.data = tokcstr.data;
- tok_str_add2(&str, TOK_PPSTR, &cval);
- } else {
- bad_stringy:
- expect("macro parameter after '#'");
- }
- } else if (t >= TOK_IDENT) {
- s = sym_find2(args, t);
- if (s) {
- st = s->d;
- /* if '##' is present before or after, no arg substitution */
- if (*macro_str == TOK_PPJOIN || t1 == TOK_PPJOIN) {
- /* special case for var arg macros : ## eats the ','
- if empty VA_ARGS variable. */
- if (t1 == TOK_PPJOIN && t0 == ',' && gnu_ext && s->type.t) {
- if (*st <= 0) {
- /* suppress ',' '##' */
- str.len -= 2;
- } else {
- /* suppress '##' and add variable */
- str.len--;
- goto add_var;
- }
- }
- } else {
- add_var:
- if (!s->next) {
- /* Expand arguments tokens and store them. In most
- cases we could also re-expand each argument if
- used multiple times, but not if the argument
- contains the __COUNTER__ macro. */
- TokenString str2;
- sym_push2(&s->next, s->v, s->type.t, 0);
- tok_str_new(&str2);
- macro_subst(&str2, nested_list, st);
- tok_str_add(&str2, 0);
- s->next->d = str2.str;
- }
- st = s->next->d;
- }
- if (*st <= 0) {
- /* expanded to empty string */
- tok_str_add(&str, TOK_PLCHLDR);
- } else for (;;) {
- int t2;
- TOK_GET(&t2, &st, &cval);
- if (t2 <= 0)
- break;
- tok_str_add2(&str, t2, &cval);
- }
- } else {
- tok_str_add(&str, t);
- }
- } else {
- tok_str_add2(&str, t, &cval);
- }
- t0 = t1, t1 = t;
- }
- tok_str_add(&str, 0);
- return str.str;
-}
-
-static char const ab_month_name[12][4] =
-{
- "Jan", "Feb", "Mar", "Apr", "May", "Jun",
- "Jul", "Aug", "Sep", "Oct", "Nov", "Dec"
-};
-
-static int paste_tokens(int t1, CValue *v1, int t2, CValue *v2)
-{
- int n, ret = 1;
-
- cstr_reset(&tokcstr);
- if (t1 != TOK_PLCHLDR)
- cstr_cat(&tokcstr, get_tok_str(t1, v1), -1);
- n = tokcstr.size;
- if (t2 != TOK_PLCHLDR)
- cstr_cat(&tokcstr, get_tok_str(t2, v2), -1);
- cstr_ccat(&tokcstr, '\0');
- //printf("paste <%s>\n", (char*)tokcstr.data);
-
- tcc_open_bf(tcc_state, ":paste:", tokcstr.size);
- memcpy(file->buffer, tokcstr.data, tokcstr.size);
- tok_flags = 0;
- for (;;) {
- next_nomacro1();
- if (0 == *file->buf_ptr)
- break;
- if (is_space(tok))
- continue;
- tcc_warning("pasting \"%.*s\" and \"%s\" does not give a valid"
- " preprocessing token", n, file->buffer, file->buffer + n);
- ret = 0;
- break;
- }
- tcc_close();
- return ret;
-}
-
-/* handle the '##' operator. Return NULL if no '##' seen. Otherwise
- return the resulting string (which must be freed). */
-static inline int *macro_twosharps(const int *ptr0)
-{
- int t;
- CValue cval;
- TokenString macro_str1;
- int start_of_nosubsts = -1;
- const int *ptr;
-
- /* we search the first '##' */
- for (ptr = ptr0;;) {
- TOK_GET(&t, &ptr, &cval);
- if (t == TOK_PPJOIN)
- break;
- if (t == 0)
- return NULL;
- }
-
- tok_str_new(&macro_str1);
-
- //tok_print(" $$$", ptr0);
- for (ptr = ptr0;;) {
- TOK_GET(&t, &ptr, &cval);
- if (t == 0)
- break;
- if (t == TOK_PPJOIN)
- continue;
- while (*ptr == TOK_PPJOIN) {
- int t1; CValue cv1;
- /* given 'a##b', remove nosubsts preceding 'a' */
- if (start_of_nosubsts >= 0)
- macro_str1.len = start_of_nosubsts;
- /* given 'a##b', remove nosubsts preceding 'b' */
- while ((t1 = *++ptr) == TOK_NOSUBST)
- ;
- if (t1 && t1 != TOK_PPJOIN) {
- TOK_GET(&t1, &ptr, &cv1);
- if (t != TOK_PLCHLDR || t1 != TOK_PLCHLDR) {
- if (paste_tokens(t, &cval, t1, &cv1)) {
- t = tok, cval = tokc;
- } else {
- tok_str_add2(&macro_str1, t, &cval);
- t = t1, cval = cv1;
- }
- }
- }
- }
- if (t == TOK_NOSUBST) {
- if (start_of_nosubsts < 0)
- start_of_nosubsts = macro_str1.len;
- } else {
- start_of_nosubsts = -1;
- }
- tok_str_add2(&macro_str1, t, &cval);
- }
- tok_str_add(&macro_str1, 0);
- //tok_print(" ###", macro_str1.str);
- return macro_str1.str;
-}
-
-/* peek or read [ws_str == NULL] next token from function macro call,
- walking up macro levels up to the file if necessary */
-static int next_argstream(Sym **nested_list, TokenString *ws_str)
-{
- int t;
- const int *p;
- Sym *sa;
-
- for (;;) {
- if (macro_ptr) {
- p = macro_ptr, t = *p;
- if (ws_str) {
- while (is_space(t) || TOK_LINEFEED == t || TOK_PLCHLDR == t)
- tok_str_add(ws_str, t), t = *++p;
- }
- if (t == 0) {
- end_macro();
- /* also, end of scope for nested defined symbol */
- sa = *nested_list;
- while (sa && sa->v == 0)
- sa = sa->prev;
- if (sa)
- sa->v = 0;
- continue;
- }
- } else {
- uint8_t *p = file->buf_ptr;
- int ch = handle_bs(&p);
- if (ws_str) {
- while (is_space(ch) || ch == '\n' || ch == '/') {
- if (ch == '/') {
- int c;
- PEEKC(c, p);
- if (c == '*') {
- p = parse_comment(p) - 1;
- } else if (c == '/') {
- p = parse_line_comment(p) - 1;
- } else {
- *--p = ch;
- break;
- }
- ch = ' ';
- }
- if (ch == '\n')
- file->line_num++;
- if (!(ch == '\f' || ch == '\v' || ch == '\r'))
- tok_str_add(ws_str, ch);
- PEEKC(ch, p);
- }
- }
- file->buf_ptr = p;
- t = ch;
- }
-
- if (ws_str)
- return t;
- next_nomacro();
- return tok;
- }
-}
-
-/* do macro substitution of current token with macro 's' and add
- result to (tok_str,tok_len). 'nested_list' is the list of all
- macros we got inside to avoid recursing. Return non zero if no
- substitution needs to be done */
-static int macro_subst_tok(
- TokenString *tok_str,
- Sym **nested_list,
- Sym *s)
-{
- Sym *args, *sa, *sa1;
- int parlevel, t, t1, spc;
- TokenString str;
- char *cstrval;
- CValue cval;
- char buf[32];
-
- /* if symbol is a macro, prepare substitution */
- /* special macros */
- if (tok == TOK___LINE__ || tok == TOK___COUNTER__) {
- t = tok == TOK___LINE__ ? file->line_num : pp_counter++;
- snprintf(buf, sizeof(buf), "%d", t);
- cstrval = buf;
- t1 = TOK_PPNUM;
- goto add_cstr1;
- } else if (tok == TOK___FILE__) {
- cstrval = file->filename;
- goto add_cstr;
- } else if (tok == TOK___DATE__ || tok == TOK___TIME__) {
- time_t ti;
- struct tm *tm;
-
- time(&ti);
- tm = localtime(&ti);
- if (tok == TOK___DATE__) {
- snprintf(buf, sizeof(buf), "%s %2d %d",
- ab_month_name[tm->tm_mon], tm->tm_mday, tm->tm_year + 1900);
- } else {
- snprintf(buf, sizeof(buf), "%02d:%02d:%02d",
- tm->tm_hour, tm->tm_min, tm->tm_sec);
- }
- cstrval = buf;
- add_cstr:
- t1 = TOK_STR;
- add_cstr1:
- cstr_reset(&tokcstr);
- cstr_cat(&tokcstr, cstrval, 0);
- cval.str.size = tokcstr.size;
- cval.str.data = tokcstr.data;
- tok_str_add2(tok_str, t1, &cval);
- } else if (s->d) {
- int saved_parse_flags = parse_flags;
- int *joined_str = NULL;
- int *mstr = s->d;
-
- if (s->type.t == MACRO_FUNC) {
- /* whitespace between macro name and argument list */
- TokenString ws_str;
- tok_str_new(&ws_str);
-
- spc = 0;
- parse_flags |= PARSE_FLAG_SPACES | PARSE_FLAG_LINEFEED
- | PARSE_FLAG_ACCEPT_STRAYS;
-
- /* get next token from argument stream */
- t = next_argstream(nested_list, &ws_str);
- if (t != '(') {
- /* not a macro substitution after all, restore the
- * macro token plus all whitespace we've read.
- * whitespace is intentionally not merged to preserve
- * newlines. */
- parse_flags = saved_parse_flags;
- tok_str_add(tok_str, tok);
- if (parse_flags & PARSE_FLAG_SPACES) {
- int i;
- for (i = 0; i < ws_str.len; i++)
- tok_str_add(tok_str, ws_str.str[i]);
- }
- if (ws_str.len && ws_str.str[ws_str.len - 1] == '\n')
- tok_flags |= TOK_FLAG_BOL;
- tok_str_free_str(ws_str.str);
- return 0;
- } else {
- tok_str_free_str(ws_str.str);
- }
- do {
- next_nomacro(); /* eat '(' */
- } while (tok == TOK_PLCHLDR || is_space(tok));
-
- /* argument macro */
- args = NULL;
- sa = s->next;
- /* NOTE: empty args are allowed, except if no args */
- for(;;) {
- do {
- next_argstream(nested_list, NULL);
- } while (tok == TOK_PLCHLDR || is_space(tok) ||
- TOK_LINEFEED == tok);
- empty_arg:
- /* handle '()' case */
- if (!args && !sa && tok == ')')
- break;
- if (!sa)
- tcc_error("macro '%s' used with too many args",
- get_tok_str(s->v, 0));
- tok_str_new(&str);
- parlevel = spc = 0;
- /* NOTE: non zero sa->t indicates VA_ARGS */
- while ((parlevel > 0 ||
- (tok != ')' &&
- (tok != ',' || sa->type.t)))) {
- if (tok == TOK_EOF || tok == 0)
- break;
- if (tok == '(')
- parlevel++;
- else if (tok == ')')
- parlevel--;
- if (tok == TOK_LINEFEED)
- tok = ' ';
- if (!check_space(tok, &spc))
- tok_str_add2(&str, tok, &tokc);
- next_argstream(nested_list, NULL);
- }
- if (parlevel)
- expect(")");
- str.len -= spc;
- tok_str_add(&str, -1);
- tok_str_add(&str, 0);
- sa1 = sym_push2(&args, sa->v & ~SYM_FIELD, sa->type.t, 0);
- sa1->d = str.str;
- sa = sa->next;
- if (tok == ')') {
- /* special case for gcc var args: add an empty
- var arg argument if it is omitted */
- if (sa && sa->type.t && gnu_ext)
- goto empty_arg;
- break;
- }
- if (tok != ',')
- expect(",");
- }
- if (sa) {
- tcc_error("macro '%s' used with too few args",
- get_tok_str(s->v, 0));
- }
-
- /* now subst each arg */
- mstr = macro_arg_subst(nested_list, mstr, args);
- /* free memory */
- sa = args;
- while (sa) {
- sa1 = sa->prev;
- tok_str_free_str(sa->d);
- if (sa->next) {
- tok_str_free_str(sa->next->d);
- sym_free(sa->next);
- }
- sym_free(sa);
- sa = sa1;
- }
- parse_flags = saved_parse_flags;
- }
-
- sym_push2(nested_list, s->v, 0, 0);
- parse_flags = saved_parse_flags;
- joined_str = macro_twosharps(mstr);
- macro_subst(tok_str, nested_list, joined_str ? joined_str : mstr);
-
- /* pop nested defined symbol */
- sa1 = *nested_list;
- *nested_list = sa1->prev;
- sym_free(sa1);
- if (joined_str)
- tok_str_free_str(joined_str);
- if (mstr != s->d)
- tok_str_free_str(mstr);
- }
- return 0;
-}
-
-/* do macro substitution of macro_str and add result to
- (tok_str,tok_len). 'nested_list' is the list of all macros we got
- inside to avoid recursing. */
-static void macro_subst(
- TokenString *tok_str,
- Sym **nested_list,
- const int *macro_str
- )
-{
- Sym *s;
- int t, spc, nosubst;
- CValue cval;
-
- spc = nosubst = 0;
-
- while (1) {
- TOK_GET(&t, &macro_str, &cval);
- if (t <= 0)
- break;
-
- if (t >= TOK_IDENT && 0 == nosubst) {
- s = define_find(t);
- if (s == NULL)
- goto no_subst;
-
- /* if nested substitution, do nothing */
- if (sym_find2(*nested_list, t)) {
- /* and mark it as TOK_NOSUBST, so it doesn't get subst'd again */
- tok_str_add2(tok_str, TOK_NOSUBST, NULL);
- goto no_subst;
- }
-
- {
- TokenString *str = tok_str_alloc();
- str->str = (int*)macro_str;
- begin_macro(str, 2);
-
- tok = t;
- macro_subst_tok(tok_str, nested_list, s);
-
- if (macro_stack != str) {
- /* already finished by reading function macro arguments */
- break;
- }
-
- macro_str = macro_ptr;
- end_macro ();
- }
- if (tok_str->len)
- spc = is_space(t = tok_str->str[tok_str->lastlen]);
- } else {
-no_subst:
- if (!check_space(t, &spc))
- tok_str_add2(tok_str, t, &cval);
-
- if (nosubst) {
- if (nosubst > 1 && (spc || (++nosubst == 3 && t == '(')))
- continue;
- nosubst = 0;
- }
- if (t == TOK_NOSUBST)
- nosubst = 1;
- }
- /* GCC supports 'defined' as result of a macro substitution */
- if (t == TOK_DEFINED && pp_expr)
- nosubst = 2;
- }
-}
-
-/* return next token without macro substitution. Can read input from
- macro_ptr buffer */
-static void next_nomacro(void)
-{
- int t;
- if (macro_ptr) {
- redo:
- t = *macro_ptr;
- if (TOK_HAS_VALUE(t)) {
- tok_get(&tok, &macro_ptr, &tokc);
- if (t == TOK_LINENUM) {
- file->line_num = tokc.i;
- goto redo;
- }
- } else {
- macro_ptr++;
- if (t < TOK_IDENT) {
- if (!(parse_flags & PARSE_FLAG_SPACES)
- && (isidnum_table[t - CH_EOF] & IS_SPC))
- goto redo;
- }
- tok = t;
- }
- } else {
- next_nomacro1();
- }
-}
-
-/* return next token with macro substitution */
-ST_FUNC void next(void)
-{
- int t;
- redo:
- next_nomacro();
- t = tok;
- if (macro_ptr) {
- if (!TOK_HAS_VALUE(t)) {
- if (t == TOK_NOSUBST || t == TOK_PLCHLDR) {
- /* discard preprocessor markers */
- goto redo;
- } else if (t == 0) {
- /* end of macro or unget token string */
- end_macro();
- goto redo;
- } else if (t == '\\') {
- if (!(parse_flags & PARSE_FLAG_ACCEPT_STRAYS))
- tcc_error("stray '\\' in program");
- }
- return;
- }
- } else if (t >= TOK_IDENT && (parse_flags & PARSE_FLAG_PREPROCESS)) {
- /* if reading from file, try to substitute macros */
- Sym *s = define_find(t);
- if (s) {
- Sym *nested_list = NULL;
- tokstr_buf.len = 0;
- macro_subst_tok(&tokstr_buf, &nested_list, s);
- tok_str_add(&tokstr_buf, 0);
- begin_macro(&tokstr_buf, 0);
- goto redo;
- }
- return;
- }
- /* convert preprocessor tokens into C tokens */
- if (t == TOK_PPNUM) {
- if (parse_flags & PARSE_FLAG_TOK_NUM)
- parse_number((char *)tokc.str.data);
- } else if (t == TOK_PPSTR) {
- if (parse_flags & PARSE_FLAG_TOK_STR)
- parse_string((char *)tokc.str.data, tokc.str.size - 1);
- }
-}
-
-/* push back current token and set current token to 'last_tok'. Only
- identifier case handled for labels. */
-ST_INLN void unget_tok(int last_tok)
-{
-
- TokenString *str = tok_str_alloc();
- tok_str_add2(str, tok, &tokc);
- tok_str_add(str, 0);
- begin_macro(str, 1);
- tok = last_tok;
-}
-
-/* ------------------------------------------------------------------------- */
-/* init preprocessor */
-
-static const char * const target_os_defs =
-#ifdef TCC_TARGET_PE
- "_WIN32\0"
-# if PTR_SIZE == 8
- "_WIN64\0"
-# endif
-#else
-# if defined TCC_TARGET_MACHO
- "__APPLE__\0"
-# elif TARGETOS_FreeBSD
- "__FreeBSD__ 12\0"
-# elif TARGETOS_FreeBSD_kernel
- "__FreeBSD_kernel__\0"
-# elif TARGETOS_NetBSD
- "__NetBSD__\0"
-# elif TARGETOS_OpenBSD
- "__OpenBSD__\0"
-# else
- "__linux__\0"
- "__linux\0"
-# if TARGETOS_ANDROID
- "__ANDROID__\0"
-# endif
-# endif
- "__unix__\0"
- "__unix\0"
-#endif
- ;
-
-static void putdef(CString *cs, const char *p)
-{
- cstr_printf(cs, "#define %s%s\n", p, &" 1"[!!strchr(p, ' ')*2]);
-}
-
-static void putdefs(CString *cs, const char *p)
-{
- while (*p)
- putdef(cs, p), p = strchr(p, 0) + 1;
-}
-
-static void tcc_predefs(TCCState *s1, CString *cs, int is_asm)
-{
- int a, b, c;
-
- sscanf(TCC_VERSION, "%d.%d.%d", &a, &b, &c);
- cstr_printf(cs, "#define __TINYC__ %d\n", a*10000 + b*100 + c);
-
- putdefs(cs, target_machine_defs);
- putdefs(cs, target_os_defs);
-
-#ifdef TCC_TARGET_ARM
- if (s1->float_abi == ARM_HARD_FLOAT)
- putdef(cs, "__ARM_PCS_VFP");
-#endif
- if (is_asm)
- putdef(cs, "__ASSEMBLER__");
- if (s1->output_type == TCC_OUTPUT_PREPROCESS)
- putdef(cs, "__TCC_PP__");
- if (s1->output_type == TCC_OUTPUT_MEMORY)
- putdef(cs, "__TCC_RUN__");
-#ifdef CONFIG_TCC_BACKTRACE
- if (s1->do_backtrace)
- putdef(cs, "__TCC_BACKTRACE__");
-#endif
-#ifdef CONFIG_TCC_BCHECK
- if (s1->do_bounds_check)
- putdef(cs, "__TCC_BCHECK__");
-#endif
- if (s1->char_is_unsigned)
- putdef(cs, "__CHAR_UNSIGNED__");
- if (s1->optimize > 0)
- putdef(cs, "__OPTIMIZE__");
- if (s1->option_pthread)
- putdef(cs, "_REENTRANT");
- if (s1->leading_underscore)
- putdef(cs, "__leading_underscore");
- cstr_printf(cs, "#define __SIZEOF_POINTER__ %d\n", PTR_SIZE);
- cstr_printf(cs, "#define __SIZEOF_LONG__ %d\n", LONG_SIZE);
- if (!is_asm) {
- putdef(cs, "__STDC__");
- cstr_printf(cs, "#define __STDC_VERSION__ %dL\n", s1->cversion);
- }
- cstr_printf(cs, "#define __BASE_FILE__ \"%s\"\n", file->filename);
-}
-
-ST_FUNC void preprocess_start(TCCState *s1, int filetype)
-{
- int is_asm = !!(filetype & (AFF_TYPE_ASM|AFF_TYPE_ASMPP));
-
- tccpp_new(s1);
-
- s1->include_stack_ptr = s1->include_stack;
- s1->ifdef_stack_ptr = s1->ifdef_stack;
- file->ifdef_stack_ptr = s1->ifdef_stack_ptr;
- pp_expr = 0;
- pp_counter = 0;
- pp_debug_tok = pp_debug_symv = 0;
- pp_once++;
- s1->pack_stack[0] = 0;
- s1->pack_stack_ptr = s1->pack_stack;
-
- set_idnum('$', !is_asm && s1->dollars_in_identifiers ? IS_ID : 0);
- set_idnum('.', is_asm ? IS_ID : 0);
-
- if (!(filetype & AFF_TYPE_ASM)) {
- CString cstr;
- cstr_new(&cstr);
- tcc_predefs(s1, &cstr, is_asm);
- if (s1->cmdline_defs.size)
- cstr_cat(&cstr, s1->cmdline_defs.data, s1->cmdline_defs.size);
- if (s1->cmdline_incl.size)
- cstr_cat(&cstr, s1->cmdline_incl.data, s1->cmdline_incl.size);
- //printf("%s\n", (char*)cstr.data);
- *s1->include_stack_ptr++ = file;
- tcc_open_bf(s1, "<command line>", cstr.size);
- memcpy(file->buffer, cstr.data, cstr.size);
- cstr_free(&cstr);
- }
-
- parse_flags = is_asm ? PARSE_FLAG_ASM_FILE : 0;
- tok_flags = TOK_FLAG_BOL | TOK_FLAG_BOF;
-}
-
-/* cleanup from error/setjmp */
-ST_FUNC void preprocess_end(TCCState *s1)
-{
- while (macro_stack)
- end_macro();
- macro_ptr = NULL;
- while (file)
- tcc_close();
- tccpp_delete(s1);
-}
-
-ST_FUNC int set_idnum(int c, int val)
-{
- int prev = isidnum_table[c - CH_EOF];
- isidnum_table[c - CH_EOF] = val;
- return prev;
-}
-
-ST_FUNC void tccpp_new(TCCState *s)
-{
- int i, c;
- const char *p, *r;
-
- /* init isid table */
- for(i = CH_EOF; i<128; i++)
- set_idnum(i,
- is_space(i) ? IS_SPC
- : isid(i) ? IS_ID
- : isnum(i) ? IS_NUM
- : 0);
-
- for(i = 128; i<256; i++)
- set_idnum(i, IS_ID);
-
- /* init allocators */
- tal_new(&toksym_alloc, TOKSYM_TAL_LIMIT, TOKSYM_TAL_SIZE);
- tal_new(&tokstr_alloc, TOKSTR_TAL_LIMIT, TOKSTR_TAL_SIZE);
-
- memset(hash_ident, 0, TOK_HASH_SIZE * sizeof(TokenSym *));
- memset(s->cached_includes_hash, 0, sizeof s->cached_includes_hash);
-
- cstr_new(&tokcstr);
- cstr_new(&cstr_buf);
- cstr_realloc(&cstr_buf, STRING_MAX_SIZE);
- tok_str_new(&tokstr_buf);
- tok_str_realloc(&tokstr_buf, TOKSTR_MAX_SIZE);
-
- tok_ident = TOK_IDENT;
- p = tcc_keywords;
- while (*p) {
- r = p;
- for(;;) {
- c = *r++;
- if (c == '\0')
- break;
- }
- tok_alloc(p, r - p - 1);
- p = r;
- }
-
- /* we add dummy defines for some special macros to speed up tests
- and to have working defined() */
- define_push(TOK___LINE__, MACRO_OBJ, NULL, NULL);
- define_push(TOK___FILE__, MACRO_OBJ, NULL, NULL);
- define_push(TOK___DATE__, MACRO_OBJ, NULL, NULL);
- define_push(TOK___TIME__, MACRO_OBJ, NULL, NULL);
- define_push(TOK___COUNTER__, MACRO_OBJ, NULL, NULL);
-}
-
-ST_FUNC void tccpp_delete(TCCState *s)
-{
- int i, n;
-
- dynarray_reset(&s->cached_includes, &s->nb_cached_includes);
-
- /* free tokens */
- n = tok_ident - TOK_IDENT;
- if (n > total_idents)
- total_idents = n;
- for(i = 0; i < n; i++)
- tal_free(toksym_alloc, table_ident[i]);
- tcc_free(table_ident);
- table_ident = NULL;
-
- /* free static buffers */
- cstr_free(&tokcstr);
- cstr_free(&cstr_buf);
- tok_str_free_str(tokstr_buf.str);
-
- /* free allocators */
- tal_delete(toksym_alloc);
- toksym_alloc = NULL;
- tal_delete(tokstr_alloc);
- tokstr_alloc = NULL;
-}
-
-/* ------------------------------------------------------------------------- */
-/* tcc -E [-P[1]] [-dD} support */
-
-static void tok_print(const char *msg, const int *str)
-{
- FILE *fp;
- int t, s = 0;
- CValue cval;
-
- fp = tcc_state->ppfp;
- fprintf(fp, "%s", msg);
- while (str) {
- TOK_GET(&t, &str, &cval);
- if (!t)
- break;
- fprintf(fp, &" %s"[s], get_tok_str(t, &cval)), s = 1;
- }
- fprintf(fp, "\n");
-}
-
-static void pp_line(TCCState *s1, BufferedFile *f, int level)
-{
- int d = f->line_num - f->line_ref;
-
- if (s1->dflag & 4)
- return;
-
- if (s1->Pflag == LINE_MACRO_OUTPUT_FORMAT_NONE) {
- ;
- } else if (level == 0 && f->line_ref && d < 8) {
- while (d > 0)
- fputs("\n", s1->ppfp), --d;
- } else if (s1->Pflag == LINE_MACRO_OUTPUT_FORMAT_STD) {
- fprintf(s1->ppfp, "#line %d \"%s\"\n", f->line_num, f->filename);
- } else {
- fprintf(s1->ppfp, "# %d \"%s\"%s\n", f->line_num, f->filename,
- level > 0 ? " 1" : level < 0 ? " 2" : "");
- }
- f->line_ref = f->line_num;
-}
-
-static void define_print(TCCState *s1, int v)
-{
- FILE *fp;
- Sym *s;
-
- s = define_find(v);
- if (NULL == s || NULL == s->d)
- return;
-
- fp = s1->ppfp;
- fprintf(fp, "#define %s", get_tok_str(v, NULL));
- if (s->type.t == MACRO_FUNC) {
- Sym *a = s->next;
- fprintf(fp,"(");
- if (a)
- for (;;) {
- fprintf(fp,"%s", get_tok_str(a->v & ~SYM_FIELD, NULL));
- if (!(a = a->next))
- break;
- fprintf(fp,",");
- }
- fprintf(fp,")");
- }
- tok_print("", s->d);
-}
-
-static void pp_debug_defines(TCCState *s1)
-{
- int v, t;
- const char *vs;
- FILE *fp;
-
- t = pp_debug_tok;
- if (t == 0)
- return;
-
- file->line_num--;
- pp_line(s1, file, 0);
- file->line_ref = ++file->line_num;
-
- fp = s1->ppfp;
- v = pp_debug_symv;
- vs = get_tok_str(v, NULL);
- if (t == TOK_DEFINE) {
- define_print(s1, v);
- } else if (t == TOK_UNDEF) {
- fprintf(fp, "#undef %s\n", vs);
- } else if (t == TOK_push_macro) {
- fprintf(fp, "#pragma push_macro(\"%s\")\n", vs);
- } else if (t == TOK_pop_macro) {
- fprintf(fp, "#pragma pop_macro(\"%s\")\n", vs);
- }
- pp_debug_tok = 0;
-}
-
-static void pp_debug_builtins(TCCState *s1)
-{
- int v;
- for (v = TOK_IDENT; v < tok_ident; ++v)
- define_print(s1, v);
-}
-
-/* Add a space between tokens a and b to avoid unwanted textual pasting */
-static int pp_need_space(int a, int b)
-{
- return 'E' == a ? '+' == b || '-' == b
- : '+' == a ? TOK_INC == b || '+' == b
- : '-' == a ? TOK_DEC == b || '-' == b
- : a >= TOK_IDENT ? b >= TOK_IDENT
- : a == TOK_PPNUM ? b >= TOK_IDENT
- : 0;
-}
-
-/* maybe hex like 0x1e */
-static int pp_check_he0xE(int t, const char *p)
-{
- if (t == TOK_PPNUM && toup(strchr(p, 0)[-1]) == 'E')
- return 'E';
- return t;
-}
-
-/* Preprocess the current file */
-ST_FUNC int tcc_preprocess(TCCState *s1)
-{
- BufferedFile **iptr;
- int token_seen, spcs, level;
- const char *p;
- char white[400];
-
- parse_flags = PARSE_FLAG_PREPROCESS
- | (parse_flags & PARSE_FLAG_ASM_FILE)
- | PARSE_FLAG_LINEFEED
- | PARSE_FLAG_SPACES
- | PARSE_FLAG_ACCEPT_STRAYS
- ;
- /* Credits to Fabrice Bellard's initial revision to demonstrate its
- capability to compile and run itself, provided all numbers are
- given as decimals. tcc -E -P10 will do. */
- if (s1->Pflag == LINE_MACRO_OUTPUT_FORMAT_P10)
- parse_flags |= PARSE_FLAG_TOK_NUM, s1->Pflag = 1;
-
- if (s1->do_bench) {
- /* for PP benchmarks */
- do next(); while (tok != TOK_EOF);
- return 0;
- }
-
- if (s1->dflag & 1) {
- pp_debug_builtins(s1);
- s1->dflag &= ~1;
- }
-
- token_seen = TOK_LINEFEED, spcs = 0, level = 0;
- if (file->prev)
- pp_line(s1, file->prev, level++);
- pp_line(s1, file, level);
- for (;;) {
- iptr = s1->include_stack_ptr;
- next();
- if (tok == TOK_EOF)
- break;
-
- level = s1->include_stack_ptr - iptr;
- if (level) {
- if (level > 0)
- pp_line(s1, *iptr, 0);
- pp_line(s1, file, level);
- }
- if (s1->dflag & 7) {
- pp_debug_defines(s1);
- if (s1->dflag & 4)
- continue;
- }
-
- if (is_space(tok)) {
- if (spcs < sizeof white - 1)
- white[spcs++] = tok;
- continue;
- } else if (tok == TOK_LINEFEED) {
- spcs = 0;
- if (token_seen == TOK_LINEFEED)
- continue;
- ++file->line_ref;
- } else if (token_seen == TOK_LINEFEED) {
- pp_line(s1, file, 0);
- } else if (spcs == 0 && pp_need_space(token_seen, tok)) {
- white[spcs++] = ' ';
- }
-
- white[spcs] = 0, fputs(white, s1->ppfp), spcs = 0;
- fputs(p = get_tok_str(tok, &tokc), s1->ppfp);
- token_seen = pp_check_he0xE(tok, p);
- }
- return 0;
-}
-
-/* ------------------------------------------------------------------------- */