/* CPP Library.
   Copyright (C) 1986-2022 Free Software Foundation, Inc.
   Contributed by Per Bothner, 1994-95.
   Based on CCCP program by Paul Rubin, June 1986
   Adapted to ANSI C, Richard Stallman, Jan 1987

This program is free software; you can redistribute it and/or modify it
under the terms of the GNU General Public License as published by the
Free Software Foundation; either version 3, or (at your option) any
later version.

This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with this program; see the file COPYING3.  If not see
<http://www.gnu.org/licenses/>.  */
#include "config.h"
#include "system.h"
#include "cpplib.h"
#include "internal.h"
#include "mkdeps.h"
#include "localedir.h"
#include "filenames.h"
/* Default for the canonical_system_headers option when the build did
   not configure it explicitly: enabled on DOS-based file systems,
   disabled everywhere else.  */
#ifndef ENABLE_CANONICAL_SYSTEM_HEADERS
#ifdef HAVE_DOS_BASED_FILE_SYSTEM
#define ENABLE_CANONICAL_SYSTEM_HEADERS 1
#else
#define ENABLE_CANONICAL_SYSTEM_HEADERS 0
#endif
#endif
37 static void init_library (void);
38 static void mark_named_operators (cpp_reader *, int);
39 static bool read_original_filename (cpp_reader *);
40 static void read_original_directory (cpp_reader *);
41 static void post_options (cpp_reader *);
43 /* If we have designated initializers (GCC >2.7) these tables can be
44 initialized, constant data. Otherwise, they have to be filled in at
46 #if HAVE_DESIGNATED_INITIALIZERS
48 #define init_trigraph_map() /* Nothing. */
49 #define TRIGRAPH_MAP \
50 __extension__ const uchar _cpp_trigraph_map[UCHAR_MAX + 1] = {
53 #define s(p, v) [p] = v,
57 #define TRIGRAPH_MAP uchar _cpp_trigraph_map[UCHAR_MAX + 1] = { 0 }; \
58 static void init_trigraph_map (void) { \
59 unsigned char *x = _cpp_trigraph_map;
62 #define s(p, v) x[p] = v;
67 s('=', '#') s(')', ']') s('!', '|')
68 s('(', '[') s('\'', '^') s('>', '}')
69 s('/', '\\') s('<', '{') s('-', '~')
/* A set of booleans indicating what CPP features each source language
   requires.  The field order must match the column order of the
   lang_defaults table below; cpp_set_lang copies every field into the
   reader's option block.  */
struct lang_flags
{
  char c99;
  char cplusplus;
  char extended_numbers;
  char extended_identifiers;
  char c11_identifiers;
  char std;
  char digraphs;
  char uliterals;
  char rliterals;
  char user_literals;
  char binary_constants;
  char digit_separators;
  char trigraphs;
  char utf8_char_literals;
  char va_opt;
  char scope;
  char dfp_constants;
  char size_t_literals;
  char elifdef;
  char warning_directive;
  char delimited_escape_seqs;
};

/* One row per language, indexed by the enum c_lang value passed to
   cpp_set_lang.  */
static const struct lang_flags lang_defaults[] =
{ /*              c99 c++ xnum xid c11 std digr ulit rlit udlit bincst digsep trig u8chlit vaopt scope dfp szlit elifdef warndir delim */
  /* GNUC89   */  { 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0 },
  /* GNUC99   */  { 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0 },
  /* GNUC11   */  { 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0 },
  /* GNUC17   */  { 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0 },
  /* GNUC2X   */  { 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0 },
  /* STDC89   */  { 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0 },
  /* STDC94   */  { 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0 },
  /* STDC99   */  { 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0 },
  /* STDC11   */  { 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0 },
  /* STDC17   */  { 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0 },
  /* STDC2X   */  { 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0 },
  /* GNUCXX   */  { 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0 },
  /* CXX98    */  { 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0 },
  /* GNUCXX11 */  { 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0 },
  /* CXX11    */  { 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0 },
  /* GNUCXX14 */  { 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0 },
  /* CXX14    */  { 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0 },
  /* GNUCXX17 */  { 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0 },
  /* CXX17    */  { 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0 },
  /* GNUCXX20 */  { 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0 },
  /* CXX20    */  { 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0 },
  /* GNUCXX23 */  { 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1 },
  /* CXX23    */  { 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1 },
  /* ASM      */  { 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 }
};
131 /* Sets internal flags correctly for a given language. */
133 cpp_set_lang (cpp_reader *pfile, enum c_lang lang)
135 const struct lang_flags *l = &lang_defaults[(int) lang];
137 CPP_OPTION (pfile, lang) = lang;
139 CPP_OPTION (pfile, c99) = l->c99;
140 CPP_OPTION (pfile, cplusplus) = l->cplusplus;
141 CPP_OPTION (pfile, extended_numbers) = l->extended_numbers;
142 CPP_OPTION (pfile, extended_identifiers) = l->extended_identifiers;
143 CPP_OPTION (pfile, c11_identifiers) = l->c11_identifiers;
144 CPP_OPTION (pfile, std) = l->std;
145 CPP_OPTION (pfile, digraphs) = l->digraphs;
146 CPP_OPTION (pfile, uliterals) = l->uliterals;
147 CPP_OPTION (pfile, rliterals) = l->rliterals;
148 CPP_OPTION (pfile, user_literals) = l->user_literals;
149 CPP_OPTION (pfile, binary_constants) = l->binary_constants;
150 CPP_OPTION (pfile, digit_separators) = l->digit_separators;
151 CPP_OPTION (pfile, trigraphs) = l->trigraphs;
152 CPP_OPTION (pfile, utf8_char_literals) = l->utf8_char_literals;
153 CPP_OPTION (pfile, va_opt) = l->va_opt;
154 CPP_OPTION (pfile, scope) = l->scope;
155 CPP_OPTION (pfile, dfp_constants) = l->dfp_constants;
156 CPP_OPTION (pfile, size_t_literals) = l->size_t_literals;
157 CPP_OPTION (pfile, elifdef) = l->elifdef;
158 CPP_OPTION (pfile, warning_directive) = l->warning_directive;
159 CPP_OPTION (pfile, delimited_escape_seqs) = l->delimited_escape_seqs;
162 /* Initialize library global state. */
166 static int initialized = 0;
174 /* Set up the trigraph map. This doesn't need to do anything if
175 we were compiled with a compiler that supports C99 designated
177 init_trigraph_map ();
180 (void) bindtextdomain (PACKAGE, LOCALEDIR);
185 /* Initialize a cpp_reader structure. */
187 cpp_create_reader (enum c_lang lang, cpp_hash_table *table,
188 class line_maps *line_table)
192 /* Initialize this instance of the library if it hasn't been already. */
195 pfile = XCNEW (cpp_reader);
196 memset (&pfile->base_context, 0, sizeof (pfile->base_context));
198 cpp_set_lang (pfile, lang);
199 CPP_OPTION (pfile, warn_multichar) = 1;
200 CPP_OPTION (pfile, discard_comments) = 1;
201 CPP_OPTION (pfile, discard_comments_in_macro_exp) = 1;
202 CPP_OPTION (pfile, max_include_depth) = 200;
203 CPP_OPTION (pfile, operator_names) = 1;
204 CPP_OPTION (pfile, warn_trigraphs) = 2;
205 CPP_OPTION (pfile, warn_endif_labels) = 1;
206 CPP_OPTION (pfile, cpp_warn_c90_c99_compat) = -1;
207 CPP_OPTION (pfile, cpp_warn_c11_c2x_compat) = -1;
208 CPP_OPTION (pfile, cpp_warn_cxx11_compat) = 0;
209 CPP_OPTION (pfile, cpp_warn_cxx20_compat) = 0;
210 CPP_OPTION (pfile, cpp_warn_deprecated) = 1;
211 CPP_OPTION (pfile, cpp_warn_long_long) = 0;
212 CPP_OPTION (pfile, dollars_in_ident) = 1;
213 CPP_OPTION (pfile, warn_dollars) = 1;
214 CPP_OPTION (pfile, warn_variadic_macros) = 1;
215 CPP_OPTION (pfile, warn_builtin_macro_redefined) = 1;
216 CPP_OPTION (pfile, cpp_warn_implicit_fallthrough) = 0;
217 /* By default, track locations of tokens resulting from macro
218 expansion. The '2' means, track the locations with the highest
219 accuracy. Read the comments for struct
220 cpp_options::track_macro_expansion to learn about the other
222 CPP_OPTION (pfile, track_macro_expansion) = 2;
223 CPP_OPTION (pfile, warn_normalize) = normalized_C;
224 CPP_OPTION (pfile, warn_literal_suffix) = 1;
225 CPP_OPTION (pfile, canonical_system_headers)
226 = ENABLE_CANONICAL_SYSTEM_HEADERS;
227 CPP_OPTION (pfile, ext_numeric_literals) = 1;
228 CPP_OPTION (pfile, warn_date_time) = 0;
229 CPP_OPTION (pfile, cpp_warn_bidirectional) = bidirectional_unpaired;
230 CPP_OPTION (pfile, cpp_warn_invalid_utf8) = 0;
231 CPP_OPTION (pfile, cpp_warn_unicode) = 1;
232 CPP_OPTION (pfile, cpp_input_charset_explicit) = 0;
234 /* Default CPP arithmetic to something sensible for the host for the
235 benefit of dumb users like fix-header. */
236 CPP_OPTION (pfile, precision) = CHAR_BIT * sizeof (long);
237 CPP_OPTION (pfile, char_precision) = CHAR_BIT;
238 CPP_OPTION (pfile, wchar_precision) = CHAR_BIT * sizeof (int);
239 CPP_OPTION (pfile, int_precision) = CHAR_BIT * sizeof (int);
240 CPP_OPTION (pfile, unsigned_char) = 0;
241 CPP_OPTION (pfile, unsigned_wchar) = 1;
242 CPP_OPTION (pfile, unsigned_utf8char) = 1;
243 CPP_OPTION (pfile, bytes_big_endian) = 1; /* does not matter */
245 /* Default to no charset conversion. */
246 CPP_OPTION (pfile, narrow_charset) = _cpp_default_encoding ();
247 CPP_OPTION (pfile, wide_charset) = 0;
249 /* Default the input character set to UTF-8. */
250 CPP_OPTION (pfile, input_charset) = _cpp_default_encoding ();
252 /* A fake empty "directory" used as the starting point for files
253 looked up without a search path. Name cannot be '/' because we
254 don't want to prepend anything at all to filenames using it. All
255 other entries are correct zero-initialized. */
256 pfile->no_search_path.name = (char *) "";
258 /* Initialize the line map. */
259 pfile->line_table = line_table;
261 /* Initialize lexer state. */
262 pfile->state.save_comments = ! CPP_OPTION (pfile, discard_comments);
264 /* Set up static tokens. */
265 pfile->avoid_paste.type = CPP_PADDING;
266 pfile->avoid_paste.val.source = NULL;
267 pfile->avoid_paste.src_loc = 0;
268 pfile->endarg.type = CPP_EOF;
269 pfile->endarg.flags = 0;
270 pfile->endarg.src_loc = 0;
272 /* Create a token buffer for the lexer. */
273 _cpp_init_tokenrun (&pfile->base_run, 250);
274 pfile->cur_run = &pfile->base_run;
275 pfile->cur_token = pfile->base_run.base;
277 /* Initialize the base context. */
278 pfile->context = &pfile->base_context;
279 pfile->base_context.c.macro = 0;
280 pfile->base_context.prev = pfile->base_context.next = 0;
282 /* Aligned and unaligned storage. */
283 pfile->a_buff = _cpp_get_buff (pfile, 0);
284 pfile->u_buff = _cpp_get_buff (pfile, 0);
286 /* Initialize table for push_macro/pop_macro. */
287 pfile->pushed_macros = 0;
289 /* Do not force token locations by default. */
290 pfile->forced_token_location = 0;
292 /* Note the timestamp is unset. */
293 pfile->time_stamp = time_t (-1);
294 pfile->time_stamp_kind = 0;
296 /* The expression parser stack. */
297 _cpp_expand_op_stack (pfile);
299 /* Initialize the buffer obstack. */
300 obstack_specify_allocation (&pfile->buffer_ob, 0, 0, xmalloc, free);
302 _cpp_init_files (pfile);
304 _cpp_init_hashtable (pfile, table);
309 /* Set the line_table entry in PFILE. This is called after reading a
310 PCH file, as the old line_table will be incorrect. */
312 cpp_set_line_map (cpp_reader *pfile, class line_maps *line_table)
314 pfile->line_table = line_table;
317 /* Free resources used by PFILE. Accessing PFILE after this function
318 returns leads to undefined behavior. Returns the error count. */
320 cpp_destroy (cpp_reader *pfile)
322 cpp_context *context, *contextn;
323 struct def_pragma_macro *pmacro;
324 tokenrun *run, *runn;
327 free (pfile->op_stack);
329 while (CPP_BUFFER (pfile) != NULL)
330 _cpp_pop_buffer (pfile);
332 free (pfile->out.base);
334 if (pfile->macro_buffer)
336 free (pfile->macro_buffer);
337 pfile->macro_buffer = NULL;
338 pfile->macro_buffer_len = 0;
342 deps_free (pfile->deps);
343 obstack_free (&pfile->buffer_ob, 0);
345 _cpp_destroy_hashtable (pfile);
346 _cpp_cleanup_files (pfile);
347 _cpp_destroy_iconv (pfile);
349 _cpp_free_buff (pfile->a_buff);
350 _cpp_free_buff (pfile->u_buff);
351 _cpp_free_buff (pfile->free_buffs);
353 for (run = &pfile->base_run; run; run = runn)
357 if (run != &pfile->base_run)
361 for (context = pfile->base_context.next; context; context = contextn)
363 contextn = context->next;
367 if (pfile->comments.entries)
369 for (i = 0; i < pfile->comments.count; i++)
370 free (pfile->comments.entries[i].comment);
372 free (pfile->comments.entries);
374 if (pfile->pushed_macros)
378 pmacro = pfile->pushed_macros;
379 pfile->pushed_macros = pmacro->next;
383 while (pfile->pushed_macros);
389 /* This structure defines one built-in identifier. A node will be
390 entered in the hash table under the name NAME, with value VALUE.
392 There are two tables of these. builtin_array holds all the
393 "builtin" macros: these are handled by builtin_macro() in
394 macro.cc. Builtin is somewhat of a misnomer -- the property of
395 interest is that these macros require special code to compute their
396 expansions. The value is a "cpp_builtin_type" enumerator.
398 operator_array holds the C++ named operators. These are keywords
399 which act as aliases for punctuators. In C++, they cannot be
400 altered through #define, and #if recognizes them as operators. In
401 C, these are not entered into the hash table at all (but see
402 <iso646.h>). The value is a token-type enumerator. */
405 const uchar *const name;
406 const unsigned short len;
407 const unsigned short value;
408 const bool always_warn_if_redefined;
411 #define B(n, t, f) { DSC(n), t, f }
412 static const struct builtin_macro builtin_array[] =
414 B("__TIMESTAMP__", BT_TIMESTAMP, false),
415 B("__TIME__", BT_TIME, false),
416 B("__DATE__", BT_DATE, false),
417 B("__FILE__", BT_FILE, false),
418 B("__FILE_NAME__", BT_FILE_NAME, false),
419 B("__BASE_FILE__", BT_BASE_FILE, false),
420 B("__LINE__", BT_SPECLINE, true),
421 B("__INCLUDE_LEVEL__", BT_INCLUDE_LEVEL, true),
422 B("__COUNTER__", BT_COUNTER, true),
423 /* Make sure to update the list of built-in
424 function-like macros in traditional.cc:
425 fun_like_macro() when adding more following */
426 B("__has_attribute", BT_HAS_ATTRIBUTE, true),
427 B("__has_c_attribute", BT_HAS_STD_ATTRIBUTE, true),
428 B("__has_cpp_attribute", BT_HAS_ATTRIBUTE, true),
429 B("__has_builtin", BT_HAS_BUILTIN, true),
430 B("__has_include", BT_HAS_INCLUDE, true),
431 B("__has_include_next",BT_HAS_INCLUDE_NEXT, true),
432 /* Keep builtins not used for -traditional-cpp at the end, and
433 update init_builtins() if any more are added. */
434 B("_Pragma", BT_PRAGMA, true),
435 B("__STDC__", BT_STDC, true),
439 struct builtin_operator
441 const uchar *const name;
442 const unsigned short len;
443 const unsigned short value;
446 #define B(n, t) { DSC(n), t }
447 static const struct builtin_operator operator_array[] =
449 B("and", CPP_AND_AND),
450 B("and_eq", CPP_AND_EQ),
451 B("bitand", CPP_AND),
453 B("compl", CPP_COMPL),
455 B("not_eq", CPP_NOT_EQ),
457 B("or_eq", CPP_OR_EQ),
459 B("xor_eq", CPP_XOR_EQ)
463 /* Mark the C++ named operators in the hash table. */
465 mark_named_operators (cpp_reader *pfile, int flags)
467 const struct builtin_operator *b;
469 for (b = operator_array;
470 b < (operator_array + ARRAY_SIZE (operator_array));
473 cpp_hashnode *hp = cpp_lookup (pfile, b->name, b->len);
475 hp->is_directive = 0;
476 hp->directive_index = b->value;
480 /* Helper function of cpp_type2name. Return the string associated with
481 named operator TYPE. */
483 cpp_named_operator2name (enum cpp_ttype type)
485 const struct builtin_operator *b;
487 for (b = operator_array;
488 b < (operator_array + ARRAY_SIZE (operator_array));
491 if (type == b->value)
492 return (const char *) b->name;
499 cpp_init_special_builtins (cpp_reader *pfile)
501 const struct builtin_macro *b;
502 size_t n = ARRAY_SIZE (builtin_array);
504 if (CPP_OPTION (pfile, traditional))
506 else if (! CPP_OPTION (pfile, stdc_0_in_system_headers)
507 || CPP_OPTION (pfile, std))
510 for (b = builtin_array; b < builtin_array + n; b++)
512 if ((b->value == BT_HAS_ATTRIBUTE
513 || b->value == BT_HAS_STD_ATTRIBUTE
514 || b->value == BT_HAS_BUILTIN)
515 && (CPP_OPTION (pfile, lang) == CLK_ASM
516 || pfile->cb.has_attribute == NULL))
518 cpp_hashnode *hp = cpp_lookup (pfile, b->name, b->len);
519 hp->type = NT_BUILTIN_MACRO;
520 if (b->always_warn_if_redefined)
521 hp->flags |= NODE_WARN;
522 hp->value.builtin = (enum cpp_builtin_type) b->value;
526 /* Restore macro C to builtin macro definition. */
529 _cpp_restore_special_builtin (cpp_reader *pfile, struct def_pragma_macro *c)
531 size_t len = strlen (c->name);
533 for (const struct builtin_macro *b = builtin_array;
534 b < builtin_array + ARRAY_SIZE (builtin_array); b++)
535 if (b->len == len && memcmp (c->name, b->name, len + 1) == 0)
537 cpp_hashnode *hp = cpp_lookup (pfile, b->name, b->len);
538 hp->type = NT_BUILTIN_MACRO;
539 if (b->always_warn_if_redefined)
540 hp->flags |= NODE_WARN;
541 hp->value.builtin = (enum cpp_builtin_type) b->value;
545 /* Read the builtins table above and enter them, and language-specific
546 macros, into the hash table. HOSTED is true if this is a hosted
549 cpp_init_builtins (cpp_reader *pfile, int hosted)
551 cpp_init_special_builtins (pfile);
553 if (!CPP_OPTION (pfile, traditional)
554 && (! CPP_OPTION (pfile, stdc_0_in_system_headers)
555 || CPP_OPTION (pfile, std)))
556 _cpp_define_builtin (pfile, "__STDC__ 1");
558 if (CPP_OPTION (pfile, cplusplus))
560 /* C++23 is not yet a standard. For now, use an invalid
561 * year/month, 202100L, which is larger than 202002L. */
562 if (CPP_OPTION (pfile, lang) == CLK_CXX23
563 || CPP_OPTION (pfile, lang) == CLK_GNUCXX23)
564 _cpp_define_builtin (pfile, "__cplusplus 202100L");
565 else if (CPP_OPTION (pfile, lang) == CLK_CXX20
566 || CPP_OPTION (pfile, lang) == CLK_GNUCXX20)
567 _cpp_define_builtin (pfile, "__cplusplus 202002L");
568 else if (CPP_OPTION (pfile, lang) == CLK_CXX17
569 || CPP_OPTION (pfile, lang) == CLK_GNUCXX17)
570 _cpp_define_builtin (pfile, "__cplusplus 201703L");
571 else if (CPP_OPTION (pfile, lang) == CLK_CXX14
572 || CPP_OPTION (pfile, lang) == CLK_GNUCXX14)
573 _cpp_define_builtin (pfile, "__cplusplus 201402L");
574 else if (CPP_OPTION (pfile, lang) == CLK_CXX11
575 || CPP_OPTION (pfile, lang) == CLK_GNUCXX11)
576 _cpp_define_builtin (pfile, "__cplusplus 201103L");
578 _cpp_define_builtin (pfile, "__cplusplus 199711L");
580 else if (CPP_OPTION (pfile, lang) == CLK_ASM)
581 _cpp_define_builtin (pfile, "__ASSEMBLER__ 1");
582 else if (CPP_OPTION (pfile, lang) == CLK_STDC94)
583 _cpp_define_builtin (pfile, "__STDC_VERSION__ 199409L");
584 else if (CPP_OPTION (pfile, lang) == CLK_STDC2X
585 || CPP_OPTION (pfile, lang) == CLK_GNUC2X)
586 _cpp_define_builtin (pfile, "__STDC_VERSION__ 202000L");
587 else if (CPP_OPTION (pfile, lang) == CLK_STDC17
588 || CPP_OPTION (pfile, lang) == CLK_GNUC17)
589 _cpp_define_builtin (pfile, "__STDC_VERSION__ 201710L");
590 else if (CPP_OPTION (pfile, lang) == CLK_STDC11
591 || CPP_OPTION (pfile, lang) == CLK_GNUC11)
592 _cpp_define_builtin (pfile, "__STDC_VERSION__ 201112L");
593 else if (CPP_OPTION (pfile, c99))
594 _cpp_define_builtin (pfile, "__STDC_VERSION__ 199901L");
596 if (CPP_OPTION (pfile, uliterals)
597 && !(CPP_OPTION (pfile, cplusplus)
598 && (CPP_OPTION (pfile, lang) == CLK_GNUCXX
599 || CPP_OPTION (pfile, lang) == CLK_CXX98)))
601 _cpp_define_builtin (pfile, "__STDC_UTF_16__ 1");
602 _cpp_define_builtin (pfile, "__STDC_UTF_32__ 1");
606 _cpp_define_builtin (pfile, "__STDC_HOSTED__ 1");
608 _cpp_define_builtin (pfile, "__STDC_HOSTED__ 0");
610 if (CPP_OPTION (pfile, objc))
611 _cpp_define_builtin (pfile, "__OBJC__ 1");
/* Sanity-checks are dependent on command-line options, so it is
   called as a subroutine of cpp_read_main_file.  Each failed check is
   reported through cpp_error at CPP_DL_ICE level.  In builds without
   checking, sanity_checks expands to nothing.  */
#if CHECKING_P
static void sanity_checks (cpp_reader *);
static void sanity_checks (cpp_reader *pfile)
{
  cppchar_t test = 0;
  size_t max_precision = 2 * CHAR_BIT * sizeof (cpp_num_part);

  /* Sanity checks for assumptions about CPP arithmetic and target
     type precisions made by cpplib.  */
  test--;
  /* Decrementing zero wraps to a large value only for an unsigned
     type.  */
  if (test < 1)
    cpp_error (pfile, CPP_DL_ICE, "cppchar_t must be an unsigned type");

  if (CPP_OPTION (pfile, precision) > max_precision)
    cpp_error (pfile, CPP_DL_ICE,
               "preprocessor arithmetic has maximum precision of %lu bits;"
               " target requires %lu bits",
               (unsigned long) max_precision,
               (unsigned long) CPP_OPTION (pfile, precision));

  if (CPP_OPTION (pfile, precision) < CPP_OPTION (pfile, int_precision))
    cpp_error (pfile, CPP_DL_ICE,
               "CPP arithmetic must be at least as precise as a target int");

  if (CPP_OPTION (pfile, char_precision) < 8)
    cpp_error (pfile, CPP_DL_ICE, "target char is less than 8 bits wide");

  if (CPP_OPTION (pfile, wchar_precision) < CPP_OPTION (pfile, char_precision))
    cpp_error (pfile, CPP_DL_ICE,
               "target wchar_t is narrower than target char");

  if (CPP_OPTION (pfile, int_precision) < CPP_OPTION (pfile, char_precision))
    cpp_error (pfile, CPP_DL_ICE,
               "target int is narrower than target char");

  /* This is assumed in eval_token() and could be fixed if necessary.  */
  if (sizeof (cppchar_t) > sizeof (cpp_num_part))
    cpp_error (pfile, CPP_DL_ICE,
               "CPP half-integer narrower than CPP character");

  if (CPP_OPTION (pfile, wchar_precision) > BITS_PER_CPPCHAR_T)
    cpp_error (pfile, CPP_DL_ICE,
               "CPP on this host cannot handle wide character constants over"
               " %lu bits, but the target requires %lu bits",
               (unsigned long) BITS_PER_CPPCHAR_T,
               (unsigned long) CPP_OPTION (pfile, wchar_precision));
}
#else
# define sanity_checks(PFILE)
#endif
667 /* This is called after options have been parsed, and partially
670 cpp_post_options (cpp_reader *pfile)
674 sanity_checks (pfile);
676 post_options (pfile);
678 /* Mark named operators before handling command line macros. */
680 if (CPP_OPTION (pfile, cplusplus) && CPP_OPTION (pfile, operator_names))
681 flags |= NODE_OPERATOR;
682 if (CPP_OPTION (pfile, warn_cxx_operator_names))
683 flags |= NODE_DIAGNOSTIC | NODE_WARN_OPERATOR;
685 mark_named_operators (pfile, flags);
688 /* Setup for processing input from the file named FNAME, or stdin if
689 it is the empty string. Return the original filename on success
690 (e.g. foo.i->foo.c), or NULL on failure. INJECTING is true if
691 there may be injected headers before line 1 of the main file. */
693 cpp_read_main_file (cpp_reader *pfile, const char *fname, bool injecting)
695 if (mkdeps *deps = cpp_get_deps (pfile))
696 /* Set the default target (if there is none already). */
697 deps_add_default_target (deps, fname);
700 = _cpp_find_file (pfile, fname,
701 CPP_OPTION (pfile, preprocessed) ? &pfile->no_search_path
702 : CPP_OPTION (pfile, main_search) == CMS_user
703 ? pfile->quote_include
704 : CPP_OPTION (pfile, main_search) == CMS_system
705 ? pfile->bracket_include : &pfile->no_search_path,
706 /*angle=*/0, _cpp_FFK_NORMAL, 0);
708 if (_cpp_find_failed (pfile->main_file))
711 _cpp_stack_file (pfile, pfile->main_file,
712 injecting || CPP_OPTION (pfile, preprocessed)
713 ? IT_PRE_MAIN : IT_MAIN, 0);
715 /* For foo.i, read the original filename foo.c now, for the benefit
716 of the front ends. */
717 if (CPP_OPTION (pfile, preprocessed))
718 if (!read_original_filename (pfile))
720 /* We're on line 1 after all. */
721 auto *last = linemap_check_ordinary
722 (LINEMAPS_LAST_MAP (pfile->line_table, false));
724 /* Inform of as-if a file change. */
725 _cpp_do_file_change (pfile, LC_RENAME_VERBATIM, LINEMAP_FILE (last),
726 LINEMAP_LINE (last), LINEMAP_SYSP (last));
729 auto *map = LINEMAPS_LAST_ORDINARY_MAP (pfile->line_table);
730 pfile->main_loc = MAP_START_LOCATION (map);
732 return ORDINARY_MAP_FILE_NAME (map);
736 cpp_main_loc (const cpp_reader *pfile)
738 return pfile->main_loc;
741 /* For preprocessed files, if the very first characters are
742 '#<SPACE>[01]<SPACE>', then handle a line directive so we know the
743 original file name. This will generate file_change callbacks,
744 which the front ends must handle appropriately given their state of
745 initialization. We peek directly into the character buffer, so
746 that we're not confused by otherwise-skipped white space &
747 comments. We can be very picky, because this should have been
748 machine-generated text (by us, no less). This way we do not
749 interfere with the module directive state machine. */
752 read_original_filename (cpp_reader *pfile)
754 auto *buf = pfile->buffer->next_line;
756 if (pfile->buffer->rlimit - buf > 4
759 // Also permit '1', as that's what used to be here
760 && (buf[2] == '0' || buf[2] == '1')
763 const cpp_token *token = _cpp_lex_direct (pfile);
764 gcc_checking_assert (token->type == CPP_HASH);
765 if (_cpp_handle_directive (pfile, token->flags & PREV_WHITE))
767 read_original_directory (pfile);
769 auto *penult = &linemap_check_ordinary
770 (LINEMAPS_LAST_MAP (pfile->line_table, false))[-1];
771 if (penult[1].reason == LC_RENAME_VERBATIM)
773 /* Expunge any evidence of the original linemap. */
774 pfile->line_table->highest_location
775 = pfile->line_table->highest_line
776 = penult[0].start_location;
778 penult[1].start_location = penult[0].start_location;
779 penult[1].reason = penult[0].reason;
780 penult[0] = penult[1];
781 pfile->line_table->info_ordinary.used--;
782 pfile->line_table->info_ordinary.cache = 0;
792 /* For preprocessed files, if the tokens following the first filename
793 line is of the form # <line> "/path/name//", handle the
794 directive so we know the original current directory.
796 As with the first line peeking, we can do this without lexing by
799 read_original_directory (cpp_reader *pfile)
801 auto *buf = pfile->buffer->next_line;
803 if (pfile->buffer->rlimit - buf > 4
806 // Also permit '1', as that's what used to be here
807 && (buf[2] == '0' || buf[2] == '1')
810 const cpp_token *hash = _cpp_lex_direct (pfile);
811 gcc_checking_assert (hash->type == CPP_HASH);
812 pfile->state.in_directive = 1;
813 const cpp_token *number = _cpp_lex_direct (pfile);
814 gcc_checking_assert (number->type == CPP_NUMBER);
815 const cpp_token *string = _cpp_lex_direct (pfile);
816 pfile->state.in_directive = 0;
818 const unsigned char *text = nullptr;
820 if (string->type == CPP_STRING)
822 /* The string value includes the quotes. */
823 text = string->val.str.text;
824 len = string->val.str.len;
827 || !IS_DIR_SEPARATOR (text[len - 2])
828 || !IS_DIR_SEPARATOR (text[len - 3]))
830 /* That didn't work out, back out. */
831 _cpp_backup_tokens (pfile, 3);
835 if (pfile->cb.dir_change)
837 /* Smash the string directly, it's dead at this point */
838 char *smashy = (char *)text;
841 pfile->cb.dir_change (pfile, smashy + 1);
844 /* We should be at EOL. */
848 /* This is called at the end of preprocessing. It pops the last
849 buffer and writes dependency output.
851 Maybe it should also reset state, such that you could call
852 cpp_start_read with a new filename to restart processing. */
854 cpp_finish (cpp_reader *pfile, FILE *deps_stream)
856 /* Warn about unused macros before popping the final buffer. */
857 if (CPP_OPTION (pfile, warn_unused_macros))
858 cpp_forall_identifiers (pfile, _cpp_warn_if_unused_macro, NULL);
860 /* lex.cc leaves the final buffer on the stack. This it so that
861 it returns an unending stream of CPP_EOFs to the client. If we
862 popped the buffer, we'd dereference a NULL buffer pointer and
863 segfault. It's nice to allow the client to do worry-free excess
864 cpp_get_token calls. */
865 while (pfile->buffer)
866 _cpp_pop_buffer (pfile);
869 deps_write (pfile, deps_stream, 72);
871 /* Report on headers that could use multiple include guards. */
872 if (CPP_OPTION (pfile, print_include_names))
873 _cpp_report_missing_guards (pfile);
877 post_options (cpp_reader *pfile)
879 /* -Wtraditional is not useful in C++ mode. */
880 if (CPP_OPTION (pfile, cplusplus))
881 CPP_OPTION (pfile, cpp_warn_traditional) = 0;
883 /* Permanently disable macro expansion if we are rescanning
884 preprocessed text. Read preprocesed source in ISO mode. */
885 if (CPP_OPTION (pfile, preprocessed))
887 if (!CPP_OPTION (pfile, directives_only))
888 pfile->state.prevent_expansion = 1;
889 CPP_OPTION (pfile, traditional) = 0;
892 if (CPP_OPTION (pfile, warn_trigraphs) == 2)
893 CPP_OPTION (pfile, warn_trigraphs) = !CPP_OPTION (pfile, trigraphs);
895 if (CPP_OPTION (pfile, traditional))
897 CPP_OPTION (pfile, trigraphs) = 0;
898 CPP_OPTION (pfile, warn_trigraphs) = 0;
901 if (CPP_OPTION (pfile, module_directives))
903 /* These unspellable tokens have a leading space. */
904 const char *const inits[spec_nodes::M_HWM]
905 = {"export ", "module ", "import ", "__import"};
907 for (int ix = 0; ix != spec_nodes::M_HWM; ix++)
909 cpp_hashnode *node = cpp_lookup (pfile, UC (inits[ix]),
912 /* Token we pass to the compiler. */
913 pfile->spec_nodes.n_modules[ix][1] = node;
915 if (ix != spec_nodes::M__IMPORT)
916 /* Token we recognize when lexing, drop the trailing ' '. */
917 node = cpp_lookup (pfile, NODE_NAME (node), NODE_LEN (node) - 1);
919 node->flags |= NODE_MODULE;
920 pfile->spec_nodes.n_modules[ix][0] = node;