c5a047348d
2000-04-25 Zack Weinberg <zack@wolery.cumb.org> * cpplib.h (struct cpp_buffer): Add 'mapped' flag; fix commentary. 2000-04-25 Neil Booth <NeilB@earthling.net> Restore previous patch, plus the following fixes: * cpphash.c (_cpp_create_definition): Test PREV_WHITESPACE in flags, not CPP_OPEN_PAREN. * cpplex.c (expand_token_space, init_token_list, cpp_free_token_list): Put the dummy token at list->tokens[-1]. (_cpp_lex_line, _cpp_lex_file): token list is 0-based. From-SVN: r33419
323 lines
13 KiB
C
323 lines
13 KiB
C
/* Part of CPP library.
|
|
Copyright (C) 1997, 1998, 1999, 2000 Free Software Foundation, Inc.
|
|
|
|
This program is free software; you can redistribute it and/or modify it
|
|
under the terms of the GNU General Public License as published by the
|
|
Free Software Foundation; either version 2, or (at your option) any
|
|
later version.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program; if not, write to the Free Software
|
|
Foundation, 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. */
|
|
|
|
/* This header defines all the internal data structures and functions
|
|
that need to be visible across files. It's called cpphash.h for
|
|
historical reasons. */
|
|
|
|
#ifndef __GCC_CPPHASH__
|
|
#define __GCC_CPPHASH__
|
|
|
|
/* Unsigned byte type used by this header for preprocessor text, e.g.
   macro expansions and identifier names.  */
typedef unsigned char U_CHAR;
|
|
|
|
/* Structure allocated for every #define.  For a simple replacement
   such as
	#define foo bar ,
   nargs = -1, the `pattern' list is null, and the expansion is just
   the replacement text.  Nargs = 0 means a function-like macro with
   no args, e.g.,
	#define getchar() getc (stdin) .
   When there are args, the expansion is the replacement text with the
   args squashed out, and the reflist is a list describing how to
   build the output from the input: e.g., "3 chars, then the 1st arg,
   then 9 chars, then the 3rd arg, then 0 chars, then the 2nd arg".
   The chars here come from the expansion.  Whatever is left of the
   expansion after the last arg-occurrence is copied after that arg.
   Note that the reflist can be arbitrarily long---
   its length depends on the number of times the arguments appear in
   the replacement text, not how many args there are.  Example:
   #define f(x) x+x+x+x+x+x+x would have replacement text "++++++" and
   pattern list
     { (0, 1), (1, 1), (1, 1), ..., (1, 1), NULL }
   where (x, y) means (nchars, argno).  */
|
|
|
|
/* One node of a macro's substitution pattern.  Each node says: copy
   NCHARS literal characters, then substitute argument ARGNO.  Nodes
   are chained through NEXT.  */
struct reflist
{
  struct reflist *next;		/* Next node in the pattern list.  */
  char stringify;		/* Nonzero if this arg was preceded by a
				   # operator.  */
  char raw_before;		/* Nonzero if a ## operator before arg.  */
  char raw_after;		/* Nonzero if a ## operator after arg.  */
  char rest_args;		/* Nonzero if this arg. absorbs the rest.  */
  int nchars;			/* Number of literal chars to copy before
				   this arg occurrence.  */
  int argno;			/* Number of arg to substitute (origin-0).  */
};
|
|
|
|
typedef struct definition DEFINITION;
|
|
struct definition
|
|
{
|
|
int nargs;
|
|
int length; /* length of expansion string */
|
|
U_CHAR *expansion;
|
|
char rest_args; /* Nonzero if last arg. absorbs the rest */
|
|
struct reflist *pattern;
|
|
|
|
/* Names of macro args, concatenated in order with \0 between
|
|
them. The only use of this is that we warn on redefinition if
|
|
this differs between the old and new definitions. */
|
|
U_CHAR *argnames;
|
|
};
|
|
|
|
/* The structure of a node in the hash table.  The hash table
   has entries for all tokens defined by #define commands (type T_MACRO),
   plus some special tokens like __LINE__ (these each have their own
   type, and the appropriate code is run when that type of node is seen).
   It does not contain control words like "#define", which are recognized
   by a separate piece of code.  */
|
|
|
|
/* Different flavors of hash nodes.  T_VOID is explicitly 0; the
   remaining enumerators take consecutive values in declaration
   order.  */
enum node_type
{
  T_VOID = 0,	   /* no definition yet */
  T_SPECLINE,	   /* `__LINE__' */
  T_DATE,	   /* `__DATE__' */
  T_FILE,	   /* `__FILE__' */
  T_BASE_FILE,	   /* `__BASE_FILE__' */
  T_INCLUDE_LEVEL, /* `__INCLUDE_LEVEL__' */
  T_TIME,	   /* `__TIME__' */
  T_STDC,	   /* `__STDC__' */
  T_CONST,	   /* Constant string, used by `__SIZE_TYPE__' etc */
  T_XCONST,	   /* Ditto, but the string is malloced memory */
  T_POISON,	   /* poisoned identifier */
  T_MCONST,	   /* object-like macro defined to a single identifier */
  T_MACRO,	   /* general object-like macro */
  T_FMACRO,	   /* general function-like macro */
  T_IDENTITY,	   /* macro defined to itself */
  T_EMPTY	   /* macro defined to nothing */
};
|
|
|
|
/* different kinds of things that can appear in the value field
|
|
of a hash node. */
|
|
union hashval
|
|
{
|
|
const char *cpval; /* some predefined macros */
|
|
DEFINITION *defn; /* #define */
|
|
struct hashnode *aschain; /* #assert */
|
|
};
|
|
|
|
typedef struct hashnode HASHNODE;
|
|
struct hashnode
|
|
{
|
|
const U_CHAR *name; /* the actual name */
|
|
size_t length; /* length of token, for quick comparison */
|
|
unsigned long hash; /* cached hash value */
|
|
union hashval value; /* pointer to expansion, or whatever */
|
|
enum node_type type; /* type of special token */
|
|
int disabled; /* macro turned off for rescan? */
|
|
|
|
const char *file; /* File, line, column of definition; */
|
|
int line;
|
|
int col;
|
|
};
|
|
|
|
/* List of directories to look for include files in.  Entries are
   chained through NEXT.  */
struct file_name_list
{
  struct file_name_list *next;
  struct file_name_list *alloc; /* for the cache of
				   current directory entries */
  char *name;			/* Directory name.  */
  unsigned int nlen;		/* NOTE(review): presumably the length of
				   NAME -- confirm where it is set.  */
  /* We use these to tell if the directory mentioned here is a duplicate
     of an earlier directory on the search path.  */
  ino_t ino;
  dev_t dev;
  /* If the following is nonzero, it is a C-language system include
     directory.  */
  int sysp;
  /* Mapping of file names for this directory.
     Only used on MS-DOS and related platforms.  */
  struct file_name_map *name_map;
};
|
|
/* A `struct file_name_list *' value made by casting -1 to the pointer
   type, so it is a marker rather than the address of a list entry.
   NOTE(review): the name suggests it tags files named by absolute
   path -- confirm against the users in cppfiles.c.  */
#define ABSOLUTE_PATH ((struct file_name_list *)-1)
|
|
|
|
/* This structure is used for the table of all includes. It is
|
|
indexed by the `short name' (the name as it appeared in the
|
|
#include statement) which is stored in *nshort. */
|
|
struct ihash
|
|
{
|
|
/* Next file with the same short name but a
|
|
different (partial) pathname). */
|
|
struct ihash *next_this_file;
|
|
|
|
/* Location of the file in the include search path.
|
|
Used for include_next */
|
|
struct file_name_list *foundhere;
|
|
|
|
unsigned long hash; /* save hash value for future reference */
|
|
const char *nshort; /* name of file as referenced in #include;
|
|
points into name[] */
|
|
const U_CHAR *control_macro; /* macro, if any, preventing reinclusion -
|
|
see redundant_include_p */
|
|
const char name[1]; /* (partial) pathname of file */
|
|
};
|
|
typedef struct ihash IHASH;
|
|
|
|
/* Character classes.  Each class is a distinct bit, so one table
   entry can record membership in several classes at once.
   If the definition of `numchar' looks odd to you, please look up the
   definition of a pp-number in the C standard [section 6.4.8 of C99].  */
#define ISidnum		0x01	/* a-zA-Z0-9_ */
#define ISidstart	0x02	/* _a-zA-Z */
#define ISnumstart	0x04	/* 0-9 */
#define IShspace	0x08	/* ' ' \t \f \v */
#define ISspace		0x10	/* ' ' \t \f \v \n */
|
|
|
|
/* Nonzero if X is '$' and the dollars_in_ident option is enabled.
   This expands to a reference to a variable named `pfile', so one
   must be in scope wherever this macro (or is_idchar / is_idstart,
   which use it) is expanded.  */
#define _dollar_ok(x)	((x) == '$' && CPP_OPTION (pfile, dollars_in_ident))

/* Character-class predicates.  Each one indexes _cpp_IStable with X
   and tests one class bit; the result is zero or nonzero, not
   necessarily 1.  is_idchar and is_idstart additionally accept '$'
   when _dollar_ok allows it, and so evaluate X more than once.  */
#define is_idchar(x)	((_cpp_IStable[x] & ISidnum) || _dollar_ok(x))
#define is_idstart(x)	((_cpp_IStable[x] & ISidstart) || _dollar_ok(x))
#define is_numchar(x)	(_cpp_IStable[x] & ISidnum)
#define is_numstart(x)	(_cpp_IStable[x] & ISnumstart)
#define is_hspace(x)	(_cpp_IStable[x] & IShspace)
#define is_space(x)	(_cpp_IStable[x] & ISspace)
|
|
|
|
/* The 256-entry character-class table.  This table is constant if it
   can be initialized at compile time, which is the case if cpp was
   compiled with GCC >=2.7, or another compiler that supports C99.
   Otherwise it is declared without const.  */
#if (GCC_VERSION >= 2007) || (__STDC_VERSION__ >= 199901L)
extern const unsigned char _cpp_IStable[256];
#else
extern unsigned char _cpp_IStable[256];
#endif
|
|
|
|
/* Macros. */
|
|
|
|
/* One character lookahead in the input buffer.  Yields the character
   at BUFFER->cur without advancing, or EOF when cur has reached
   rlimit.  Note that if this returns EOF, it does *not* necessarily
   mean the file's end has been reached.  BUFFER is evaluated more
   than once.  */
#define CPP_BUF_PEEK(BUFFER) \
  ((BUFFER)->cur < (BUFFER)->rlimit ? *(BUFFER)->cur : EOF)
|
|
|
|
/* Make sure PFILE->token_buffer has space for at least N more characters.
   The buffer is grown via _cpp_grow_token_buffer only when the bytes
   already written plus N exceed token_buffer_size.  The expression
   always evaluates to 0; PFILE and N may be evaluated more than once.  */
#define CPP_RESERVE(PFILE, N) \
  (CPP_WRITTEN (PFILE) + (size_t)(N) > (PFILE)->token_buffer_size \
   && (_cpp_grow_token_buffer (PFILE, N), 0))
|
|
|
|
/* Append string STR (of length N) to PFILE's output buffer.
   Assume there is enough space.  Copies at PFILE->limit and advances
   limit by N; N is evaluated twice.  */
#define CPP_PUTS_Q(PFILE, STR, N) \
  (memcpy ((PFILE)->limit, STR, (N)), (PFILE)->limit += (N))
/* Append string STR (of length N) to PFILE's output buffer.  Make space.
   The expansion is parenthesized, like CPP_PUTC, so that the comma
   expression stays a single operand wherever the macro is used.  */
#define CPP_PUTS(PFILE, STR, N) \
  (CPP_RESERVE (PFILE, N), CPP_PUTS_Q (PFILE, STR, N))
/* Append character CH to PFILE's output buffer.  Assume sufficient space.  */
#define CPP_PUTC_Q(PFILE, CH) (*(PFILE)->limit++ = (CH))
/* Append character CH to PFILE's output buffer.  Make space if need be.  */
#define CPP_PUTC(PFILE, CH) (CPP_RESERVE (PFILE, 1), CPP_PUTC_Q (PFILE, CH))
|
|
|
|
/* Advance the current line by one: increment PBUF->lineno and record
   the buffer's current position as the start of the new line.  */
#define CPP_BUMP_BUFFER_LINE(PBUF) ((PBUF)->lineno++,\
				    (PBUF)->line_base = (PBUF)->cur)
/* Likewise, for PFILE's current buffer.  */
#define CPP_BUMP_LINE(PFILE) CPP_BUMP_BUFFER_LINE(CPP_BUFFER(PFILE))
/* As CPP_BUMP_BUFFER_LINE, but the new line starts at CUR instead of
   at PBUF->cur.  CUR is parenthesized so that any expression may be
   passed.  */
#define CPP_BUMP_BUFFER_LINE_CUR(PBUF, CUR) ((PBUF)->lineno++,\
					     (PBUF)->line_base = (CUR))
/* Likewise, for PFILE's current buffer.  */
#define CPP_BUMP_LINE_CUR(PFILE, CUR) \
  CPP_BUMP_BUFFER_LINE_CUR(CPP_BUFFER(PFILE), CUR)
/* The buffer linked from BUFFER through its `prev' member.  */
#define CPP_PREV_BUFFER(BUFFER) ((BUFFER)->prev)
|
|
|
|
/* Are we in column 1 right now?  Used mainly for -traditional handling
   of directives.  True when the current buffer's read position is
   exactly one character past the start of the current line.  */
#define CPP_IN_COLUMN_1(PFILE) \
  (CPP_BUFFER (PFILE)->cur - CPP_BUFFER (PFILE)->line_base == 1)
|
|
|
|
/* Shorthands for querying reader options.  CPP_PRINT_DEPS and
   CPP_TRADITIONAL read an option directly.  CPP_PEDANTIC and
   CPP_WTRADITIONAL are additionally false whenever the current buffer
   is flagged as a system header.  */
#define CPP_PRINT_DEPS(PFILE) CPP_OPTION (PFILE, print_deps)
#define CPP_TRADITIONAL(PFILE) CPP_OPTION (PFILE, traditional)
#define CPP_PEDANTIC(PFILE) \
  (CPP_OPTION (PFILE, pedantic) && !CPP_BUFFER (PFILE)->system_header_p)
#define CPP_WTRADITIONAL(PF) \
  (CPP_OPTION (PF, warn_traditional) && !CPP_BUFFER (PF)->system_header_p)
|
|
|
|
/* CPP_IS_MACRO_BUFFER is true if the buffer contains macro expansion,
   which is detected by PBUF->macro being non-null.
   (Note that it is false while we're expanding macro *arguments*.)  */
#define CPP_IS_MACRO_BUFFER(PBUF) ((PBUF)->macro != NULL)
|
|
|
|
/* Remember the current position of PFILE so it may be returned to
   after looking ahead a bit.

   Note that when you set a mark, you _must_ return to that mark.  You
   may not forget about it and continue parsing.  You may not pop a
   buffer with an active mark.  You may not call CPP_BUMP_LINE while a
   mark is active.

   The *_BUF_* forms operate on a buffer IP directly: setting a mark
   saves IP->cur in IP->mark, and going to the mark restores IP->cur
   and then clears the mark to 0.  The other two forms apply them to
   PFILE's current buffer.  */
#define CPP_SET_BUF_MARK(IP)   ((IP)->mark = (IP)->cur)
#define CPP_GOTO_BUF_MARK(IP)  ((IP)->cur = (IP)->mark, (IP)->mark = 0)
#define CPP_SET_MARK(PFILE)  CPP_SET_BUF_MARK(CPP_BUFFER(PFILE))
#define CPP_GOTO_MARK(PFILE) CPP_GOTO_BUF_MARK(CPP_BUFFER(PFILE))
|
|
|
|
/* ACTIVE_MARK_P is true if there's a live mark in the buffer, i.e.
   the current buffer's mark is nonzero.  */
#define ACTIVE_MARK_P(PFILE) (CPP_BUFFER (PFILE)->mark != 0)

/* Are mark and point adjacent characters?  Used mostly to deal with
   the somewhat annoying semantic of #define.  True when the read
   position is exactly one character past the mark.  */
#define ADJACENT_TO_MARK(PFILE) \
 (CPP_BUFFER(PFILE)->cur - CPP_BUFFER(PFILE)->mark == 1)
|
|
|
|
/* In cpphash.c */
|
|
extern HASHNODE *_cpp_make_hashnode PARAMS ((const U_CHAR *, size_t,
|
|
enum node_type,
|
|
unsigned long));
|
|
extern unsigned int _cpp_calc_hash PARAMS ((const U_CHAR *, size_t));
|
|
extern HASHNODE *_cpp_lookup PARAMS ((cpp_reader *,
|
|
const U_CHAR *, int));
|
|
extern HASHNODE **_cpp_lookup_slot PARAMS ((cpp_reader *,
|
|
const U_CHAR *, int,
|
|
enum insert_option,
|
|
unsigned long *));
|
|
extern void _cpp_free_definition PARAMS ((DEFINITION *));
|
|
extern int _cpp_create_definition PARAMS ((cpp_reader *,
|
|
cpp_toklist *, HASHNODE *));
|
|
extern void _cpp_dump_definition PARAMS ((cpp_reader *, HASHNODE *));
|
|
extern void _cpp_quote_string PARAMS ((cpp_reader *, const char *));
|
|
extern void _cpp_macroexpand PARAMS ((cpp_reader *, HASHNODE *));
|
|
extern void _cpp_init_macro_hash PARAMS ((cpp_reader *));
|
|
extern void _cpp_dump_macro_hash PARAMS ((cpp_reader *));
|
|
|
|
/* In cppfiles.c */
|
|
extern void _cpp_simplify_pathname PARAMS ((char *));
|
|
extern void _cpp_execute_include PARAMS ((cpp_reader *, char *,
|
|
unsigned int, int,
|
|
struct file_name_list *));
|
|
extern void _cpp_init_include_hash PARAMS ((cpp_reader *));
|
|
extern const char *_cpp_fake_ihash PARAMS ((cpp_reader *, const char *));
|
|
|
|
/* In cppexp.c */
|
|
extern int _cpp_parse_expr PARAMS ((cpp_reader *));
|
|
|
|
/* In cpplex.c */
|
|
extern void _cpp_parse_name PARAMS ((cpp_reader *, int));
|
|
extern void _cpp_skip_rest_of_line PARAMS ((cpp_reader *));
|
|
extern void _cpp_skip_hspace PARAMS ((cpp_reader *));
|
|
extern void _cpp_expand_to_buffer PARAMS ((cpp_reader *,
|
|
const unsigned char *, int));
|
|
extern int _cpp_parse_assertion PARAMS ((cpp_reader *));
|
|
extern enum cpp_ttype _cpp_lex_token PARAMS ((cpp_reader *));
|
|
extern long _cpp_read_and_prescan PARAMS ((cpp_reader *, cpp_buffer *,
|
|
int, size_t));
|
|
extern void _cpp_init_input_buffer PARAMS ((cpp_reader *));
|
|
extern void _cpp_grow_token_buffer PARAMS ((cpp_reader *, long));
|
|
extern enum cpp_ttype _cpp_get_directive_token
|
|
PARAMS ((cpp_reader *));
|
|
extern enum cpp_ttype _cpp_get_define_token
|
|
PARAMS ((cpp_reader *));
|
|
extern void _cpp_scan_line PARAMS ((cpp_reader *, cpp_toklist *));
|
|
|
|
/* In cpplib.c */
|
|
extern int _cpp_handle_directive PARAMS ((cpp_reader *));
|
|
extern void _cpp_handle_eof PARAMS ((cpp_reader *));
|
|
extern void _cpp_check_directive PARAMS((cpp_toklist *, cpp_token *));
|
|
|
|
#endif
|