1 /* Part of CPP library.
2 Copyright (C) 1997, 1998, 1999, 2000, 2001 Free Software Foundation, Inc.
4 This program is free software; you can redistribute it and/or modify it
5 under the terms of the GNU General Public License as published by the
6 Free Software Foundation; either version 2, or (at your option) any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program; if not, write to the Free Software
16 Foundation, 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. */
18 /* This header defines all the internal data structures and functions
19 that need to be visible across files. It's called cpphash.h for
20 historical reasons. */
25 #include "hashtable.h"
27 struct directive; /* Deliberately incomplete. */
29 /* Test if a sign is valid within a preprocessing number.  C is the
   candidate sign character; PREVC is presumably the character that
   precedes it.  The result is true when C is '+' or '-' and PREVC is
   'e' or 'E', or when PREVC is 'p' or 'P' and the extended_numbers
   option is set.  The expansion names `pfile' directly, so a variable
   of that name must be in scope wherever this macro is used.  */
30 #define VALID_SIGN(c, prevc) \
31 (((c) == '+' || (c) == '-') && \
32 ((prevc) == 'e' || (prevc) == 'E' \
33 || (((prevc) == 'p' || (prevc) == 'P') \
34 && CPP_OPTION (pfile, extended_numbers))))
/* Field accessors.  CPP_OPTION reads member OPTION of PFILE's `opts';
   CPP_BUFFER yields PFILE's `buffer' member.  CPP_BUF_COLUMN turns the
   pointer CUR into a column by subtracting BUF's line_base and adding
   its col_adjust; CPP_BUF_COL does the same for BUF's own `cur'
   pointer.  BUF appears more than once in the last two expansions, so
   the argument must be free of side effects.  */
36 #define CPP_OPTION(PFILE, OPTION) ((PFILE)->opts.OPTION)
37 #define CPP_BUFFER(PFILE) ((PFILE)->buffer)
38 #define CPP_BUF_COLUMN(BUF, CUR) ((CUR) - (BUF)->line_base + (BUF)->col_adjust)
39 #define CPP_BUF_COL(BUF) CPP_BUF_COLUMN(BUF, (BUF)->cur)
41 /* Maximum nesting of cpp_buffers. We use a static limit, partly for
42 efficiency, and partly to limit runaway recursion. */
43 #define CPP_STACK_MAX 200
/* Memory-pool helpers.  POOL_ALIGN rounds SIZE up to a multiple of
   ALIGN; the mask arithmetic is only correct when ALIGN is a power of
   two.  The remaining macros take a pool P and work on its current
   chunk, P->cur.  POOL_FRONT, POOL_LIMIT and POOL_BASE yield that
   chunk's front, limit and base members.  POOL_SIZE, POOL_ROOM and
   POOL_USED are the differences limit - base, limit - front and
   front - base.  POOL_COMMIT advances front by LEN rounded up to
   P->align, then calls abort () if front has moved past limit.  P is
   evaluated several times in POOL_COMMIT, so it must be free of side
   effects.  */
46 #define POOL_ALIGN(size, align) (((size) + ((align) - 1)) & ~((align) - 1))
47 #define POOL_FRONT(p) ((p)->cur->front)
48 #define POOL_LIMIT(p) ((p)->cur->limit)
49 #define POOL_BASE(p) ((p)->cur->base)
50 #define POOL_SIZE(p) ((p)->cur->limit - (p)->cur->base)
51 #define POOL_ROOM(p) ((p)->cur->limit - (p)->cur->front)
52 #define POOL_USED(p) ((p)->cur->front - (p)->cur->base)
53 #define POOL_COMMIT(p, len) do {\
54 ((p)->cur->front += POOL_ALIGN (len, (p)->align));\
55 if ((p)->cur->front > (p)->cur->limit) abort ();} while (0)
57 typedef struct cpp_chunk cpp_chunk;
66 typedef struct cpp_pool cpp_pool;
69 struct cpp_chunk *cur, *locked, *first;
70 unsigned char *pos; /* Current position. */
75 /* List of directories to look for include files in. */
78 struct search_path *next;
80 /* NOTE: NAME may not be null terminated for the case of the current file's directory. */
84 /* We use these to tell if the directory mentioned here is a duplicate
85 of an earlier directory on the search path. */
88 /* Non-zero if it is a system include directory. */
90 /* Mapping of file names for this directory. Only used on MS-DOS
91 and related platforms. */
92 struct file_name_map *name_map;
/* Kinds of inclusion request.  NOTE(review): the enumerator names
   suggest #include, #include_next, #import and an include requested on
   the command line; confirm against the code that consumes this enum,
   which is not visible here.  */
96 enum include_type {IT_INCLUDE, IT_INCLUDE_NEXT, IT_IMPORT, IT_CMDLINE};
98 typedef struct toklist toklist;
105 typedef struct tokenrun tokenrun;
109 cpp_token *base, *limit;
112 typedef struct cpp_context cpp_context;
115 /* Doubly-linked list. */
116 cpp_context *next, *prev;
118 /* Contexts other than the base context are contiguous tokens.
119 e.g. macro expansions, expanded argument tokens. */
122 /* For a macro context, these are the macro and its arguments. */
128 /* Nonzero if first token on line is CPP_HASH. */
129 unsigned char in_directive;
131 /* True if we are skipping a failed conditional group. */
132 unsigned char skipping;
134 /* Nonzero if next token is the start of a line. */
137 /* Nonzero if in a directive that takes angle-bracketed headers. */
138 unsigned char angled_headers;
140 /* Nonzero to save comments. Turned off if discard_comments, and in
141 all directives apart from #define. */
142 unsigned char save_comments;
144 /* Nonzero if we're mid-comment. */
145 unsigned char lexing_comment;
147 /* Nonzero if lexing __VA_ARGS__ is valid. */
148 unsigned char va_args_ok;
150 /* Nonzero if lexing poisoned identifiers is valid. */
151 unsigned char poisoned_ok;
153 /* Nonzero to prevent macro expansion. */
154 unsigned char prevent_expansion;
156 /* Nonzero when parsing arguments to a function-like macro. */
157 unsigned char parsing_args;
159 /* Nonzero when in a # NUMBER directive. */
160 unsigned char line_extension;
163 /* Special nodes - identifiers with predefined significance. */
166 cpp_hashnode *n_L; /* L"str" */
167 cpp_hashnode *n_defined; /* defined operator */
168 cpp_hashnode *n_true; /* C++ keyword true */
169 cpp_hashnode *n_false; /* C++ keyword false */
170 cpp_hashnode *n__Pragma; /* _Pragma operator */
171 cpp_hashnode *n__STRICT_ANSI__; /* STDC_0_IN_SYSTEM_HEADERS */
172 cpp_hashnode *n__CHAR_UNSIGNED__; /* plain char is unsigned */
173 cpp_hashnode *n__VA_ARGS__; /* C99 vararg macros */
178 const unsigned char *cur; /* current position */
179 const unsigned char *rlimit; /* end of valid data */
180 const unsigned char *line_base; /* start of current line */
181 cppchar_t read_ahead; /* read ahead character */
182 cppchar_t extra_char; /* extra read-ahead for long tokens. */
184 struct cpp_buffer *prev;
186 const unsigned char *buf; /* Entire buffer. */
188 /* Pointer into the include table; non-NULL if this is a file
189 buffer. Used for include_next and to record control macros. */
190 struct include_file *inc;
192 /* Value of if_stack at start of this file.
193 Used to prohibit unmatched #endif (etc) in an include file. */
194 struct if_stack *if_stack;
196 /* Token column position adjustment owing to tabs in whitespace. */
197 unsigned int col_adjust;
199 /* Contains PREV_WHITE and/or AVOID_LPASTE. */
200 unsigned char saved_flags;
202 /* Because of the way the lexer works, -Wtrigraphs can sometimes
203 warn twice for the same trigraph. This helps prevent that. */
204 const unsigned char *last_Wtrigraphs;
206 /* True if we have already warned about C++ comments in this file.
207 The warning happens only for C89 extended mode with -pedantic on,
208 or for -Wtraditional, and only once per file (otherwise it would
209 be far too noisy). */
210 unsigned char warned_cplusplus_comments;
212 /* True if we don't process trigraphs and escaped newlines. True
213 for preprocessed input, command line directives, and _Pragma buffers. */
215 unsigned char from_stage3;
217 /* Nonzero means that the directory to start searching for ""
218 include files has been calculated and stored in "dir" below. */
219 unsigned char search_cached;
221 /* At EOF, a buffer is automatically popped. If RETURN_AT_EOF is
222 true, a CPP_EOF token is then returned. Otherwise, the next
223 token from the enclosing buffer is returned. */
226 /* The directory of this buffer's file. Its NAME member is not
227 allocated, so we don't need to worry about freeing it. */
228 struct search_path dir;
231 /* A cpp_reader encapsulates the "state" of a pre-processor run.
232 Applying cpp_get_token repeatedly yields a stream of pre-processor
233 tokens. Usually, there is only one cpp_reader object active. */
237 /* Top of buffer stack. */
241 struct lexer_state state;
243 /* Source line tracking. */
244 struct line_maps line_maps;
245 const struct line_map *map;
248 /* The position of the last lexed token and last lexed directive. */
249 cpp_lexer_pos lexer_pos;
250 cpp_lexer_pos directive_pos;
251 unsigned int directive_line;
254 cpp_pool ident_pool; /* For all identifiers, and permanent
255 numbers and strings. */
256 cpp_pool macro_pool; /* For macro definitions. Permanent. */
257 cpp_pool argument_pool; /* For macro arguments. Temporary. */
260 struct cpp_context base_context;
261 struct cpp_context *context;
263 /* If in_directive, the directive if known. */
264 const struct directive *directive;
266 /* Multiple include optimisation. */
267 const cpp_hashnode *mi_cmacro;
268 const cpp_hashnode *mi_ind_cmacro;
272 cpp_token *cur_token;
273 tokenrun base_run, *cur_run;
275 /* Non-zero prevents the lexer from re-using the token runs. */
276 unsigned int keep_tokens;
278 /* Token lookahead. */
279 struct cpp_lookahead *la_read; /* Read from this lookahead. */
280 struct cpp_lookahead *la_write; /* Write to this lookahead. */
281 struct cpp_lookahead *la_unused; /* Free store. */
282 struct cpp_lookahead *la_saved; /* Backup when entering directive. */
284 /* Error counter for exit code. */
287 /* Line and column where a newline was first seen in a string
288 constant (multi-line strings). */
289 cpp_lexer_pos mlstring_pos;
291 /* Buffer to hold macro definition string. */
292 unsigned char *macro_buffer;
293 unsigned int macro_buffer_len;
295 /* Tree of other included files. See cppfiles.c. */
296 struct splay_tree_s *all_include_files;
298 /* Current maximum length of directory names in the search path
299 for include files. (Altered as we get more of them.) */
300 unsigned int max_include_len;
302 /* Date and time tokens. Calculated together if either is requested. */
306 /* Opaque handle to the dependencies of mkdeps.c. Used by -M etc. */
309 /* Obstack holding all macro hash nodes. This never shrinks. */
311 struct obstack hash_ob;
313 /* Obstack holding buffer and conditional structures. This is a
314 real stack. See cpplib.c. */
315 struct obstack buffer_ob;
317 /* Pragma table - dynamic, because a library user can add to the
318 list of recognized pragmas. */
319 struct pragma_entry *pragmas;
322 struct cpp_callbacks cb;
324 /* Identifier hash table. */
325 struct ht *hash_table;
327 /* User visible options. */
328 struct cpp_options opts;
330 /* Special nodes - identifiers with predefined significance to the preprocessor. */
332 struct spec_nodes spec_nodes;
334 /* Whether to print our version number. Done this way so
335 we don't get it twice for -v -version. */
336 unsigned char print_version;
338 /* Whether cpplib owns the hashtable. */
339 unsigned char our_hashtable;
342 /* Character classes. Based on the more primitive macros in safe-ctype.h.
343 If the definition of `numchar' looks odd to you, please look up the
344 definition of a pp-number in the C standard [section 6.4.8 of C99].
346 In the unlikely event that characters other than \r and \n enter
347 the set is_vspace, the macro handle_newline() in cpplex.c must be updated. */
/* _dollar_ok accepts '$' only when the dollars_in_ident option is set.
   It names `pfile' directly, so is_idchar and is_idstart can only be
   used where a variable of that name is in scope; both also evaluate
   their argument twice.  is_numchar is the is_idchar test without the
   '$' case.  The remaining macros forward directly to ISDIGIT, ISBLANK,
   IS_VSPACE, IS_NVSPACE and IS_SPACE_OR_NUL.  */
349 #define _dollar_ok(x) ((x) == '$' && CPP_OPTION (pfile, dollars_in_ident))
351 #define is_idchar(x) (ISIDNUM(x) || _dollar_ok(x))
352 #define is_numchar(x) ISIDNUM(x)
353 #define is_idstart(x) (ISIDST(x) || _dollar_ok(x))
354 #define is_numstart(x) ISDIGIT(x)
355 #define is_hspace(x) ISBLANK(x)
356 #define is_vspace(x) IS_VSPACE(x)
357 #define is_nvspace(x) IS_NVSPACE(x)
358 #define is_space(x) IS_SPACE_OR_NUL(x)
360 /* This table is constant if it can be initialized at compile time,
361 which is the case if cpp was compiled with GCC >=2.7, or another
362 compiler that supports C99. */
363 #if HAVE_DESIGNATED_INITIALIZERS
364 extern const unsigned char _cpp_trigraph_map[UCHAR_MAX + 1];
366 extern unsigned char _cpp_trigraph_map[UCHAR_MAX + 1];
/* Shorthand queries on a reader.  CPP_PRINT_DEPS, CPP_PEDANTIC and
   CPP_WTRADITIONAL read the print_deps, pedantic and warn_traditional
   options through CPP_OPTION.  CPP_IN_SYSTEM_HEADER is nonzero when
   PFILE's `map' pointer is non-null and the map it points to has sysp
   set; the null test makes it usable while `map' is still null.  */
371 #define CPP_PRINT_DEPS(PFILE) CPP_OPTION (PFILE, print_deps)
372 #define CPP_IN_SYSTEM_HEADER(PFILE) ((PFILE)->map && (PFILE)->map->sysp)
373 #define CPP_PEDANTIC(PF) CPP_OPTION (PF, pedantic)
374 #define CPP_WTRADITIONAL(PF) CPP_OPTION (PF, warn_traditional)
/* Diagnostic categories accepted by _cpp_begin_message, numbered from
   WARNING = 0.  NOTE(review): the enumerators look as if they are
   listed in order of increasing severity, and ICE presumably stands
   for an internal error; confirm against the definition of
   _cpp_begin_message, which is not visible here.  */
377 enum error_type { WARNING = 0, WARNING_SYSHDR, PEDWARN, ERROR, FATAL, ICE };
378 extern int _cpp_begin_message PARAMS ((cpp_reader *, enum error_type,
379 const cpp_lexer_pos *));
382 extern void _cpp_free_definition PARAMS ((cpp_hashnode *));
383 extern int _cpp_create_definition PARAMS ((cpp_reader *, cpp_hashnode *));
384 extern void _cpp_pop_context PARAMS ((cpp_reader *));
385 extern void _cpp_free_lookaheads PARAMS ((cpp_reader *));
386 extern void _cpp_release_lookahead PARAMS ((cpp_reader *));
387 extern void _cpp_push_token PARAMS ((cpp_reader *, const cpp_token *,
388 const cpp_lexer_pos *));
391 extern void _cpp_init_hashtable PARAMS ((cpp_reader *, hash_table *));
392 extern void _cpp_destroy_hashtable PARAMS ((cpp_reader *));
395 extern void _cpp_fake_include PARAMS ((cpp_reader *, const char *));
396 extern void _cpp_never_reread PARAMS ((struct include_file *));
397 extern char *_cpp_simplify_pathname PARAMS ((char *));
398 extern bool _cpp_read_file PARAMS ((cpp_reader *, const char *));
399 extern bool _cpp_execute_include PARAMS ((cpp_reader *,
402 extern int _cpp_compare_file_date PARAMS ((cpp_reader *,
404 extern void _cpp_report_missing_guards PARAMS ((cpp_reader *));
405 extern void _cpp_init_includes PARAMS ((cpp_reader *));
406 extern void _cpp_cleanup_includes PARAMS ((cpp_reader *));
407 extern void _cpp_pop_file_buffer PARAMS ((cpp_reader *,
408 struct include_file *));
411 extern int _cpp_parse_expr PARAMS ((cpp_reader *));
414 extern void _cpp_lex_token PARAMS ((cpp_reader *, cpp_token *));
415 extern int _cpp_equiv_tokens PARAMS ((const cpp_token *,
417 extern void _cpp_init_tokenrun PARAMS ((tokenrun *, unsigned int));
418 extern void _cpp_init_pool PARAMS ((cpp_pool *, unsigned int,
419 unsigned int, unsigned int));
420 extern void _cpp_free_pool PARAMS ((cpp_pool *));
421 extern unsigned char *_cpp_pool_reserve PARAMS ((cpp_pool *, unsigned int));
422 extern unsigned char *_cpp_pool_alloc PARAMS ((cpp_pool *, unsigned int));
423 extern unsigned char *_cpp_next_chunk PARAMS ((cpp_pool *, unsigned int,
425 extern void _cpp_lock_pool PARAMS ((cpp_pool *));
426 extern void _cpp_unlock_pool PARAMS ((cpp_pool *));
429 extern bool _cpp_push_next_buffer PARAMS ((cpp_reader *));
432 extern int _cpp_test_assertion PARAMS ((cpp_reader *, int *));
433 extern int _cpp_handle_directive PARAMS ((cpp_reader *, int));
434 extern void _cpp_define_builtin PARAMS ((cpp_reader *, const char *));
435 extern void _cpp_do__Pragma PARAMS ((cpp_reader *));
436 extern void _cpp_init_directives PARAMS ((cpp_reader *));
437 extern void _cpp_init_internal_pragmas PARAMS ((cpp_reader *));
438 extern void _cpp_do_file_change PARAMS ((cpp_reader *, enum lc_reason,
440 unsigned int, unsigned int));
441 extern void _cpp_pop_buffer PARAMS ((cpp_reader *));
/* Utility routines and macros.

   DSC ("literal") expands to TWO comma-separated arguments: the
   literal cast to `const U_CHAR *' and its length without the
   terminating NUL.  It is only meaningful for string literals and
   arrays, since the length comes from sizeof.

   xnew and xcnew allocate one object of type T with xmalloc and
   xcalloc respectively; xnewvec and xcnewvec allocate N of them;
   xobnew allocates one T from obstack O.  Each expansion is wrapped in
   parentheses so the result can be followed directly by `[i]' or `->'
   and still refer to the T pointer rather than to the allocator's
   untyped return value.  */
#define DSC(str) (const U_CHAR *) (str), sizeof (str) - 1
#define xnew(T) ((T *) xmalloc (sizeof (T)))
#define xcnew(T) ((T *) xcalloc (1, sizeof (T)))
#define xnewvec(T, N) ((T *) xmalloc (sizeof (T) * (N)))
#define xcnewvec(T, N) ((T *) xcalloc ((N), sizeof (T)))
#define xobnew(O, T) ((T *) obstack_alloc ((O), sizeof (T)))
451 /* These are inline functions instead of macros so we can get type checking. */
/* Unsigned character type taken by the ustr* helpers declared below.  */
453 typedef unsigned char U_CHAR;
454 #define U (const U_CHAR *) /* Intended use: U"string".  NOTE(review):
   from C11 on, U"string" written with no space is a single char32_t
   string-literal token, so this macro is not expanded there; write
   U "string" if this header is ever compiled as C11 or later.  */
456 static inline int ustrcmp PARAMS ((const U_CHAR *, const U_CHAR *));
457 static inline int ustrncmp PARAMS ((const U_CHAR *, const U_CHAR *,
459 static inline size_t ustrlen PARAMS ((const U_CHAR *));
460 static inline U_CHAR *uxstrdup PARAMS ((const U_CHAR *));
461 static inline U_CHAR *ustrchr PARAMS ((const U_CHAR *, int));
462 static inline int ufputs PARAMS ((const U_CHAR *, FILE *));
466 const U_CHAR *s1, *s2;
468 return strcmp ((const char *)s1, (const char *)s2);
473 const U_CHAR *s1, *s2;
476 return strncmp ((const char *)s1, (const char *)s2, n);
483 return strlen ((const char *)s1);
486 static inline U_CHAR *
490 return (U_CHAR *) xstrdup ((const char *)s1);
493 static inline U_CHAR *
498 return (U_CHAR *) strchr ((const char *)s1, c);
506 return fputs ((const char *)s, f);
509 #endif /* ! GCC_CPPHASH_H */