]> git.ipfire.org Git - thirdparty/gcc.git/blob - libcpp/init.cc
x86: Handle V16BF in ix86_avx256_split_vector_move_misalign
[thirdparty/gcc.git] / libcpp / init.cc
1 /* CPP Library.
2 Copyright (C) 1986-2022 Free Software Foundation, Inc.
3 Contributed by Per Bothner, 1994-95.
4 Based on CCCP program by Paul Rubin, June 1986
5 Adapted to ANSI C, Richard Stallman, Jan 1987
6
7 This program is free software; you can redistribute it and/or modify it
8 under the terms of the GNU General Public License as published by the
9 Free Software Foundation; either version 3, or (at your option) any
10 later version.
11
12 This program is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
16
17 You should have received a copy of the GNU General Public License
18 along with this program; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
20
21 #include "config.h"
22 #include "system.h"
23 #include "cpplib.h"
24 #include "internal.h"
25 #include "mkdeps.h"
26 #include "localedir.h"
27 #include "filenames.h"
28
/* Default value for the canonical_system_headers option when the build
   configuration has not chosen one: on for DOS-based file systems,
   off everywhere else.  */
#if !defined (ENABLE_CANONICAL_SYSTEM_HEADERS)
# if defined (HAVE_DOS_BASED_FILE_SYSTEM)
#  define ENABLE_CANONICAL_SYSTEM_HEADERS 1
# else
#  define ENABLE_CANONICAL_SYSTEM_HEADERS 0
# endif
#endif
36
37 static void init_library (void);
38 static void mark_named_operators (cpp_reader *, int);
39 static bool read_original_filename (cpp_reader *);
40 static void read_original_directory (cpp_reader *);
41 static void post_options (cpp_reader *);
42
43 /* If we have designated initializers (GCC >2.7) these tables can be
44 initialized, constant data. Otherwise, they have to be filled in at
45 runtime. */
46 #if HAVE_DESIGNATED_INITIALIZERS
47
48 #define init_trigraph_map() /* Nothing. */
49 #define TRIGRAPH_MAP \
50 __extension__ const uchar _cpp_trigraph_map[UCHAR_MAX + 1] = {
51
52 #define END };
53 #define s(p, v) [p] = v,
54
55 #else
56
57 #define TRIGRAPH_MAP uchar _cpp_trigraph_map[UCHAR_MAX + 1] = { 0 }; \
58 static void init_trigraph_map (void) { \
59 unsigned char *x = _cpp_trigraph_map;
60
61 #define END }
62 #define s(p, v) x[p] = v;
63
64 #endif
65
66 TRIGRAPH_MAP
67 s('=', '#') s(')', ']') s('!', '|')
68 s('(', '[') s('\'', '^') s('>', '}')
69 s('/', '\\') s('<', '{') s('-', '~')
70 END
71
72 #undef s
73 #undef END
74 #undef TRIGRAPH_MAP
75
/* Per-language feature switches.  Each member is used as a boolean
   and names the cpp option that cpp_set_lang copies it into.

   The member order is significant: the rows of lang_defaults are
   positional initializers, so a member added or moved here needs the
   matching column added or moved in every row of that table.  */
struct lang_flags
{
  char c99;
  char cplusplus;
  char extended_numbers;
  char extended_identifiers;
  char c11_identifiers;
  char std;
  char digraphs;
  char uliterals;
  char rliterals;
  char user_literals;
  char binary_constants;
  char digit_separators;
  char trigraphs;
  char utf8_char_literals;
  char va_opt;
  char scope;
  char dfp_constants;
  char size_t_literals;
  char elifdef;
  char warning_directive;
  char delimited_escape_seqs;
};
102
103 static const struct lang_flags lang_defaults[] =
104 { /* c99 c++ xnum xid c11 std digr ulit rlit udlit bincst digsep trig u8chlit vaopt scope dfp szlit elifdef warndir delim */
105 /* GNUC89 */ { 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0 },
106 /* GNUC99 */ { 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0 },
107 /* GNUC11 */ { 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0 },
108 /* GNUC17 */ { 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0 },
109 /* GNUC2X */ { 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 0 },
110 /* STDC89 */ { 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0 },
111 /* STDC94 */ { 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0 },
112 /* STDC99 */ { 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0 },
113 /* STDC11 */ { 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0 },
114 /* STDC17 */ { 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0 },
115 /* STDC2X */ { 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0 },
116 /* GNUCXX */ { 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0 },
117 /* CXX98 */ { 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0 },
118 /* GNUCXX11 */ { 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0 },
119 /* CXX11 */ { 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0 },
120 /* GNUCXX14 */ { 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0 },
121 /* CXX14 */ { 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0 },
122 /* GNUCXX17 */ { 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0 },
123 /* CXX17 */ { 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0 },
124 /* GNUCXX20 */ { 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0 },
125 /* CXX20 */ { 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0 },
126 /* GNUCXX23 */ { 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1 },
127 /* CXX23 */ { 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1 },
128 /* ASM */ { 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 }
129 };
130
131 /* Sets internal flags correctly for a given language. */
132 void
133 cpp_set_lang (cpp_reader *pfile, enum c_lang lang)
134 {
135 const struct lang_flags *l = &lang_defaults[(int) lang];
136
137 CPP_OPTION (pfile, lang) = lang;
138
139 CPP_OPTION (pfile, c99) = l->c99;
140 CPP_OPTION (pfile, cplusplus) = l->cplusplus;
141 CPP_OPTION (pfile, extended_numbers) = l->extended_numbers;
142 CPP_OPTION (pfile, extended_identifiers) = l->extended_identifiers;
143 CPP_OPTION (pfile, c11_identifiers) = l->c11_identifiers;
144 CPP_OPTION (pfile, std) = l->std;
145 CPP_OPTION (pfile, digraphs) = l->digraphs;
146 CPP_OPTION (pfile, uliterals) = l->uliterals;
147 CPP_OPTION (pfile, rliterals) = l->rliterals;
148 CPP_OPTION (pfile, user_literals) = l->user_literals;
149 CPP_OPTION (pfile, binary_constants) = l->binary_constants;
150 CPP_OPTION (pfile, digit_separators) = l->digit_separators;
151 CPP_OPTION (pfile, trigraphs) = l->trigraphs;
152 CPP_OPTION (pfile, utf8_char_literals) = l->utf8_char_literals;
153 CPP_OPTION (pfile, va_opt) = l->va_opt;
154 CPP_OPTION (pfile, scope) = l->scope;
155 CPP_OPTION (pfile, dfp_constants) = l->dfp_constants;
156 CPP_OPTION (pfile, size_t_literals) = l->size_t_literals;
157 CPP_OPTION (pfile, elifdef) = l->elifdef;
158 CPP_OPTION (pfile, warning_directive) = l->warning_directive;
159 CPP_OPTION (pfile, delimited_escape_seqs) = l->delimited_escape_seqs;
160 }
161
162 /* Initialize library global state. */
163 static void
164 init_library (void)
165 {
166 static int initialized = 0;
167
168 if (! initialized)
169 {
170 initialized = 1;
171
172 _cpp_init_lexer ();
173
174 /* Set up the trigraph map. This doesn't need to do anything if
175 we were compiled with a compiler that supports C99 designated
176 initializers. */
177 init_trigraph_map ();
178
179 #ifdef ENABLE_NLS
180 (void) bindtextdomain (PACKAGE, LOCALEDIR);
181 #endif
182 }
183 }
184
185 /* Initialize a cpp_reader structure. */
186 cpp_reader *
187 cpp_create_reader (enum c_lang lang, cpp_hash_table *table,
188 class line_maps *line_table)
189 {
190 cpp_reader *pfile;
191
192 /* Initialize this instance of the library if it hasn't been already. */
193 init_library ();
194
195 pfile = XCNEW (cpp_reader);
196 memset (&pfile->base_context, 0, sizeof (pfile->base_context));
197
198 cpp_set_lang (pfile, lang);
199 CPP_OPTION (pfile, warn_multichar) = 1;
200 CPP_OPTION (pfile, discard_comments) = 1;
201 CPP_OPTION (pfile, discard_comments_in_macro_exp) = 1;
202 CPP_OPTION (pfile, max_include_depth) = 200;
203 CPP_OPTION (pfile, operator_names) = 1;
204 CPP_OPTION (pfile, warn_trigraphs) = 2;
205 CPP_OPTION (pfile, warn_endif_labels) = 1;
206 CPP_OPTION (pfile, cpp_warn_c90_c99_compat) = -1;
207 CPP_OPTION (pfile, cpp_warn_c11_c2x_compat) = -1;
208 CPP_OPTION (pfile, cpp_warn_cxx11_compat) = 0;
209 CPP_OPTION (pfile, cpp_warn_cxx20_compat) = 0;
210 CPP_OPTION (pfile, cpp_warn_deprecated) = 1;
211 CPP_OPTION (pfile, cpp_warn_long_long) = 0;
212 CPP_OPTION (pfile, dollars_in_ident) = 1;
213 CPP_OPTION (pfile, warn_dollars) = 1;
214 CPP_OPTION (pfile, warn_variadic_macros) = 1;
215 CPP_OPTION (pfile, warn_builtin_macro_redefined) = 1;
216 CPP_OPTION (pfile, cpp_warn_implicit_fallthrough) = 0;
217 /* By default, track locations of tokens resulting from macro
218 expansion. The '2' means, track the locations with the highest
219 accuracy. Read the comments for struct
220 cpp_options::track_macro_expansion to learn about the other
221 values. */
222 CPP_OPTION (pfile, track_macro_expansion) = 2;
223 CPP_OPTION (pfile, warn_normalize) = normalized_C;
224 CPP_OPTION (pfile, warn_literal_suffix) = 1;
225 CPP_OPTION (pfile, canonical_system_headers)
226 = ENABLE_CANONICAL_SYSTEM_HEADERS;
227 CPP_OPTION (pfile, ext_numeric_literals) = 1;
228 CPP_OPTION (pfile, warn_date_time) = 0;
229 CPP_OPTION (pfile, cpp_warn_bidirectional) = bidirectional_unpaired;
230
231 /* Default CPP arithmetic to something sensible for the host for the
232 benefit of dumb users like fix-header. */
233 CPP_OPTION (pfile, precision) = CHAR_BIT * sizeof (long);
234 CPP_OPTION (pfile, char_precision) = CHAR_BIT;
235 CPP_OPTION (pfile, wchar_precision) = CHAR_BIT * sizeof (int);
236 CPP_OPTION (pfile, int_precision) = CHAR_BIT * sizeof (int);
237 CPP_OPTION (pfile, unsigned_char) = 0;
238 CPP_OPTION (pfile, unsigned_wchar) = 1;
239 CPP_OPTION (pfile, unsigned_utf8char) = 1;
240 CPP_OPTION (pfile, bytes_big_endian) = 1; /* does not matter */
241
242 /* Default to no charset conversion. */
243 CPP_OPTION (pfile, narrow_charset) = _cpp_default_encoding ();
244 CPP_OPTION (pfile, wide_charset) = 0;
245
246 /* Default the input character set to UTF-8. */
247 CPP_OPTION (pfile, input_charset) = _cpp_default_encoding ();
248
249 /* A fake empty "directory" used as the starting point for files
250 looked up without a search path. Name cannot be '/' because we
251 don't want to prepend anything at all to filenames using it. All
252 other entries are correct zero-initialized. */
253 pfile->no_search_path.name = (char *) "";
254
255 /* Initialize the line map. */
256 pfile->line_table = line_table;
257
258 /* Initialize lexer state. */
259 pfile->state.save_comments = ! CPP_OPTION (pfile, discard_comments);
260
261 /* Set up static tokens. */
262 pfile->avoid_paste.type = CPP_PADDING;
263 pfile->avoid_paste.val.source = NULL;
264 pfile->avoid_paste.src_loc = 0;
265 pfile->endarg.type = CPP_EOF;
266 pfile->endarg.flags = 0;
267 pfile->endarg.src_loc = 0;
268
269 /* Create a token buffer for the lexer. */
270 _cpp_init_tokenrun (&pfile->base_run, 250);
271 pfile->cur_run = &pfile->base_run;
272 pfile->cur_token = pfile->base_run.base;
273
274 /* Initialize the base context. */
275 pfile->context = &pfile->base_context;
276 pfile->base_context.c.macro = 0;
277 pfile->base_context.prev = pfile->base_context.next = 0;
278
279 /* Aligned and unaligned storage. */
280 pfile->a_buff = _cpp_get_buff (pfile, 0);
281 pfile->u_buff = _cpp_get_buff (pfile, 0);
282
283 /* Initialize table for push_macro/pop_macro. */
284 pfile->pushed_macros = 0;
285
286 /* Do not force token locations by default. */
287 pfile->forced_token_location = 0;
288
289 /* Note the timestamp is unset. */
290 pfile->time_stamp = time_t (-1);
291 pfile->time_stamp_kind = 0;
292
293 /* The expression parser stack. */
294 _cpp_expand_op_stack (pfile);
295
296 /* Initialize the buffer obstack. */
297 obstack_specify_allocation (&pfile->buffer_ob, 0, 0, xmalloc, free);
298
299 _cpp_init_files (pfile);
300
301 _cpp_init_hashtable (pfile, table);
302
303 return pfile;
304 }
305
306 /* Set the line_table entry in PFILE. This is called after reading a
307 PCH file, as the old line_table will be incorrect. */
308 void
309 cpp_set_line_map (cpp_reader *pfile, class line_maps *line_table)
310 {
311 pfile->line_table = line_table;
312 }
313
314 /* Free resources used by PFILE. Accessing PFILE after this function
315 returns leads to undefined behavior. Returns the error count. */
316 void
317 cpp_destroy (cpp_reader *pfile)
318 {
319 cpp_context *context, *contextn;
320 struct def_pragma_macro *pmacro;
321 tokenrun *run, *runn;
322 int i;
323
324 free (pfile->op_stack);
325
326 while (CPP_BUFFER (pfile) != NULL)
327 _cpp_pop_buffer (pfile);
328
329 free (pfile->out.base);
330
331 if (pfile->macro_buffer)
332 {
333 free (pfile->macro_buffer);
334 pfile->macro_buffer = NULL;
335 pfile->macro_buffer_len = 0;
336 }
337
338 if (pfile->deps)
339 deps_free (pfile->deps);
340 obstack_free (&pfile->buffer_ob, 0);
341
342 _cpp_destroy_hashtable (pfile);
343 _cpp_cleanup_files (pfile);
344 _cpp_destroy_iconv (pfile);
345
346 _cpp_free_buff (pfile->a_buff);
347 _cpp_free_buff (pfile->u_buff);
348 _cpp_free_buff (pfile->free_buffs);
349
350 for (run = &pfile->base_run; run; run = runn)
351 {
352 runn = run->next;
353 free (run->base);
354 if (run != &pfile->base_run)
355 free (run);
356 }
357
358 for (context = pfile->base_context.next; context; context = contextn)
359 {
360 contextn = context->next;
361 free (context);
362 }
363
364 if (pfile->comments.entries)
365 {
366 for (i = 0; i < pfile->comments.count; i++)
367 free (pfile->comments.entries[i].comment);
368
369 free (pfile->comments.entries);
370 }
371 if (pfile->pushed_macros)
372 {
373 do
374 {
375 pmacro = pfile->pushed_macros;
376 pfile->pushed_macros = pmacro->next;
377 free (pmacro->name);
378 free (pmacro);
379 }
380 while (pfile->pushed_macros);
381 }
382
383 free (pfile);
384 }
385
386 /* This structure defines one built-in identifier. A node will be
387 entered in the hash table under the name NAME, with value VALUE.
388
389 There are two tables of these. builtin_array holds all the
390 "builtin" macros: these are handled by builtin_macro() in
391 macro.cc. Builtin is somewhat of a misnomer -- the property of
392 interest is that these macros require special code to compute their
393 expansions. The value is a "cpp_builtin_type" enumerator.
394
395 operator_array holds the C++ named operators. These are keywords
396 which act as aliases for punctuators. In C++, they cannot be
397 altered through #define, and #if recognizes them as operators. In
398 C, these are not entered into the hash table at all (but see
399 <iso646.h>). The value is a token-type enumerator. */
400 struct builtin_macro
401 {
402 const uchar *const name;
403 const unsigned short len;
404 const unsigned short value;
405 const bool always_warn_if_redefined;
406 };
407
408 #define B(n, t, f) { DSC(n), t, f }
409 static const struct builtin_macro builtin_array[] =
410 {
411 B("__TIMESTAMP__", BT_TIMESTAMP, false),
412 B("__TIME__", BT_TIME, false),
413 B("__DATE__", BT_DATE, false),
414 B("__FILE__", BT_FILE, false),
415 B("__FILE_NAME__", BT_FILE_NAME, false),
416 B("__BASE_FILE__", BT_BASE_FILE, false),
417 B("__LINE__", BT_SPECLINE, true),
418 B("__INCLUDE_LEVEL__", BT_INCLUDE_LEVEL, true),
419 B("__COUNTER__", BT_COUNTER, true),
420 /* Make sure to update the list of built-in
421 function-like macros in traditional.cc:
422 fun_like_macro() when adding more following */
423 B("__has_attribute", BT_HAS_ATTRIBUTE, true),
424 B("__has_c_attribute", BT_HAS_STD_ATTRIBUTE, true),
425 B("__has_cpp_attribute", BT_HAS_ATTRIBUTE, true),
426 B("__has_builtin", BT_HAS_BUILTIN, true),
427 B("__has_include", BT_HAS_INCLUDE, true),
428 B("__has_include_next",BT_HAS_INCLUDE_NEXT, true),
429 /* Keep builtins not used for -traditional-cpp at the end, and
430 update init_builtins() if any more are added. */
431 B("_Pragma", BT_PRAGMA, true),
432 B("__STDC__", BT_STDC, true),
433 };
434 #undef B
435
436 struct builtin_operator
437 {
438 const uchar *const name;
439 const unsigned short len;
440 const unsigned short value;
441 };
442
443 #define B(n, t) { DSC(n), t }
444 static const struct builtin_operator operator_array[] =
445 {
446 B("and", CPP_AND_AND),
447 B("and_eq", CPP_AND_EQ),
448 B("bitand", CPP_AND),
449 B("bitor", CPP_OR),
450 B("compl", CPP_COMPL),
451 B("not", CPP_NOT),
452 B("not_eq", CPP_NOT_EQ),
453 B("or", CPP_OR_OR),
454 B("or_eq", CPP_OR_EQ),
455 B("xor", CPP_XOR),
456 B("xor_eq", CPP_XOR_EQ)
457 };
458 #undef B
459
460 /* Mark the C++ named operators in the hash table. */
461 static void
462 mark_named_operators (cpp_reader *pfile, int flags)
463 {
464 const struct builtin_operator *b;
465
466 for (b = operator_array;
467 b < (operator_array + ARRAY_SIZE (operator_array));
468 b++)
469 {
470 cpp_hashnode *hp = cpp_lookup (pfile, b->name, b->len);
471 hp->flags |= flags;
472 hp->is_directive = 0;
473 hp->directive_index = b->value;
474 }
475 }
476
477 /* Helper function of cpp_type2name. Return the string associated with
478 named operator TYPE. */
479 const char *
480 cpp_named_operator2name (enum cpp_ttype type)
481 {
482 const struct builtin_operator *b;
483
484 for (b = operator_array;
485 b < (operator_array + ARRAY_SIZE (operator_array));
486 b++)
487 {
488 if (type == b->value)
489 return (const char *) b->name;
490 }
491
492 return NULL;
493 }
494
495 void
496 cpp_init_special_builtins (cpp_reader *pfile)
497 {
498 const struct builtin_macro *b;
499 size_t n = ARRAY_SIZE (builtin_array);
500
501 if (CPP_OPTION (pfile, traditional))
502 n -= 2;
503 else if (! CPP_OPTION (pfile, stdc_0_in_system_headers)
504 || CPP_OPTION (pfile, std))
505 n--;
506
507 for (b = builtin_array; b < builtin_array + n; b++)
508 {
509 if ((b->value == BT_HAS_ATTRIBUTE
510 || b->value == BT_HAS_STD_ATTRIBUTE
511 || b->value == BT_HAS_BUILTIN)
512 && (CPP_OPTION (pfile, lang) == CLK_ASM
513 || pfile->cb.has_attribute == NULL))
514 continue;
515 cpp_hashnode *hp = cpp_lookup (pfile, b->name, b->len);
516 hp->type = NT_BUILTIN_MACRO;
517 if (b->always_warn_if_redefined)
518 hp->flags |= NODE_WARN;
519 hp->value.builtin = (enum cpp_builtin_type) b->value;
520 }
521 }
522
523 /* Restore macro C to builtin macro definition. */
524
525 void
526 _cpp_restore_special_builtin (cpp_reader *pfile, struct def_pragma_macro *c)
527 {
528 size_t len = strlen (c->name);
529
530 for (const struct builtin_macro *b = builtin_array;
531 b < builtin_array + ARRAY_SIZE (builtin_array); b++)
532 if (b->len == len && memcmp (c->name, b->name, len + 1) == 0)
533 {
534 cpp_hashnode *hp = cpp_lookup (pfile, b->name, b->len);
535 hp->type = NT_BUILTIN_MACRO;
536 if (b->always_warn_if_redefined)
537 hp->flags |= NODE_WARN;
538 hp->value.builtin = (enum cpp_builtin_type) b->value;
539 }
540 }
541
542 /* Read the builtins table above and enter them, and language-specific
543 macros, into the hash table. HOSTED is true if this is a hosted
544 environment. */
545 void
546 cpp_init_builtins (cpp_reader *pfile, int hosted)
547 {
548 cpp_init_special_builtins (pfile);
549
550 if (!CPP_OPTION (pfile, traditional)
551 && (! CPP_OPTION (pfile, stdc_0_in_system_headers)
552 || CPP_OPTION (pfile, std)))
553 _cpp_define_builtin (pfile, "__STDC__ 1");
554
555 if (CPP_OPTION (pfile, cplusplus))
556 {
557 /* C++23 is not yet a standard. For now, use an invalid
558 * year/month, 202100L, which is larger than 202002L. */
559 if (CPP_OPTION (pfile, lang) == CLK_CXX23
560 || CPP_OPTION (pfile, lang) == CLK_GNUCXX23)
561 _cpp_define_builtin (pfile, "__cplusplus 202100L");
562 else if (CPP_OPTION (pfile, lang) == CLK_CXX20
563 || CPP_OPTION (pfile, lang) == CLK_GNUCXX20)
564 _cpp_define_builtin (pfile, "__cplusplus 202002L");
565 else if (CPP_OPTION (pfile, lang) == CLK_CXX17
566 || CPP_OPTION (pfile, lang) == CLK_GNUCXX17)
567 _cpp_define_builtin (pfile, "__cplusplus 201703L");
568 else if (CPP_OPTION (pfile, lang) == CLK_CXX14
569 || CPP_OPTION (pfile, lang) == CLK_GNUCXX14)
570 _cpp_define_builtin (pfile, "__cplusplus 201402L");
571 else if (CPP_OPTION (pfile, lang) == CLK_CXX11
572 || CPP_OPTION (pfile, lang) == CLK_GNUCXX11)
573 _cpp_define_builtin (pfile, "__cplusplus 201103L");
574 else
575 _cpp_define_builtin (pfile, "__cplusplus 199711L");
576 }
577 else if (CPP_OPTION (pfile, lang) == CLK_ASM)
578 _cpp_define_builtin (pfile, "__ASSEMBLER__ 1");
579 else if (CPP_OPTION (pfile, lang) == CLK_STDC94)
580 _cpp_define_builtin (pfile, "__STDC_VERSION__ 199409L");
581 else if (CPP_OPTION (pfile, lang) == CLK_STDC2X
582 || CPP_OPTION (pfile, lang) == CLK_GNUC2X)
583 _cpp_define_builtin (pfile, "__STDC_VERSION__ 202000L");
584 else if (CPP_OPTION (pfile, lang) == CLK_STDC17
585 || CPP_OPTION (pfile, lang) == CLK_GNUC17)
586 _cpp_define_builtin (pfile, "__STDC_VERSION__ 201710L");
587 else if (CPP_OPTION (pfile, lang) == CLK_STDC11
588 || CPP_OPTION (pfile, lang) == CLK_GNUC11)
589 _cpp_define_builtin (pfile, "__STDC_VERSION__ 201112L");
590 else if (CPP_OPTION (pfile, c99))
591 _cpp_define_builtin (pfile, "__STDC_VERSION__ 199901L");
592
593 if (CPP_OPTION (pfile, uliterals)
594 && !(CPP_OPTION (pfile, cplusplus)
595 && (CPP_OPTION (pfile, lang) == CLK_GNUCXX
596 || CPP_OPTION (pfile, lang) == CLK_CXX98)))
597 {
598 _cpp_define_builtin (pfile, "__STDC_UTF_16__ 1");
599 _cpp_define_builtin (pfile, "__STDC_UTF_32__ 1");
600 }
601
602 if (hosted)
603 _cpp_define_builtin (pfile, "__STDC_HOSTED__ 1");
604 else
605 _cpp_define_builtin (pfile, "__STDC_HOSTED__ 0");
606
607 if (CPP_OPTION (pfile, objc))
608 _cpp_define_builtin (pfile, "__OBJC__ 1");
609 }
610
/* The sanity checks depend on command-line options, so they are run
   from cpp_post_options.  Each violated assumption is reported as an
   internal error (CPP_DL_ICE).  Without CHECKING_P the call expands to
   nothing.  */
#if CHECKING_P
static void
sanity_checks (cpp_reader *pfile)
{
  const size_t max_precision = 2 * CHAR_BIT * sizeof (cpp_num_part);

  /* Decrementing zero stays at least 1 only for an unsigned type.  */
  cppchar_t probe = 0;
  probe--;
  if (probe < 1)
    cpp_error (pfile, CPP_DL_ICE, "cppchar_t must be an unsigned type");

  /* Assumptions cpplib makes about CPP arithmetic and about the
     precisions of the target types.  */
  if (CPP_OPTION (pfile, precision) > max_precision)
    cpp_error (pfile, CPP_DL_ICE,
               "preprocessor arithmetic has maximum precision of %lu bits;"
               " target requires %lu bits",
               (unsigned long) max_precision,
               (unsigned long) CPP_OPTION (pfile, precision));

  if (CPP_OPTION (pfile, precision) < CPP_OPTION (pfile, int_precision))
    cpp_error (pfile, CPP_DL_ICE,
               "CPP arithmetic must be at least as precise as a target int");

  if (CPP_OPTION (pfile, char_precision) < 8)
    cpp_error (pfile, CPP_DL_ICE, "target char is less than 8 bits wide");

  if (CPP_OPTION (pfile, wchar_precision) < CPP_OPTION (pfile, char_precision))
    cpp_error (pfile, CPP_DL_ICE,
               "target wchar_t is narrower than target char");

  if (CPP_OPTION (pfile, int_precision) < CPP_OPTION (pfile, char_precision))
    cpp_error (pfile, CPP_DL_ICE,
               "target int is narrower than target char");

  /* eval_token () relies on this; it could be fixed if necessary.  */
  if (sizeof (cppchar_t) > sizeof (cpp_num_part))
    cpp_error (pfile, CPP_DL_ICE,
               "CPP half-integer narrower than CPP character");

  if (CPP_OPTION (pfile, wchar_precision) > BITS_PER_CPPCHAR_T)
    cpp_error (pfile, CPP_DL_ICE,
               "CPP on this host cannot handle wide character constants over"
               " %lu bits, but the target requires %lu bits",
               (unsigned long) BITS_PER_CPPCHAR_T,
               (unsigned long) CPP_OPTION (pfile, wchar_precision));
}
#else
# define sanity_checks(PFILE)
#endif
663
664 /* This is called after options have been parsed, and partially
665 processed. */
666 void
667 cpp_post_options (cpp_reader *pfile)
668 {
669 int flags;
670
671 sanity_checks (pfile);
672
673 post_options (pfile);
674
675 /* Mark named operators before handling command line macros. */
676 flags = 0;
677 if (CPP_OPTION (pfile, cplusplus) && CPP_OPTION (pfile, operator_names))
678 flags |= NODE_OPERATOR;
679 if (CPP_OPTION (pfile, warn_cxx_operator_names))
680 flags |= NODE_DIAGNOSTIC | NODE_WARN_OPERATOR;
681 if (flags != 0)
682 mark_named_operators (pfile, flags);
683 }
684
685 /* Setup for processing input from the file named FNAME, or stdin if
686 it is the empty string. Return the original filename on success
687 (e.g. foo.i->foo.c), or NULL on failure. INJECTING is true if
688 there may be injected headers before line 1 of the main file. */
689 const char *
690 cpp_read_main_file (cpp_reader *pfile, const char *fname, bool injecting)
691 {
692 if (mkdeps *deps = cpp_get_deps (pfile))
693 /* Set the default target (if there is none already). */
694 deps_add_default_target (deps, fname);
695
696 pfile->main_file
697 = _cpp_find_file (pfile, fname,
698 CPP_OPTION (pfile, preprocessed) ? &pfile->no_search_path
699 : CPP_OPTION (pfile, main_search) == CMS_user
700 ? pfile->quote_include
701 : CPP_OPTION (pfile, main_search) == CMS_system
702 ? pfile->bracket_include : &pfile->no_search_path,
703 /*angle=*/0, _cpp_FFK_NORMAL, 0);
704
705 if (_cpp_find_failed (pfile->main_file))
706 return NULL;
707
708 _cpp_stack_file (pfile, pfile->main_file,
709 injecting || CPP_OPTION (pfile, preprocessed)
710 ? IT_PRE_MAIN : IT_MAIN, 0);
711
712 /* For foo.i, read the original filename foo.c now, for the benefit
713 of the front ends. */
714 if (CPP_OPTION (pfile, preprocessed))
715 if (!read_original_filename (pfile))
716 {
717 /* We're on line 1 after all. */
718 auto *last = linemap_check_ordinary
719 (LINEMAPS_LAST_MAP (pfile->line_table, false));
720 last->to_line = 1;
721 /* Inform of as-if a file change. */
722 _cpp_do_file_change (pfile, LC_RENAME_VERBATIM, LINEMAP_FILE (last),
723 LINEMAP_LINE (last), LINEMAP_SYSP (last));
724 }
725
726 auto *map = LINEMAPS_LAST_ORDINARY_MAP (pfile->line_table);
727 pfile->main_loc = MAP_START_LOCATION (map);
728
729 return ORDINARY_MAP_FILE_NAME (map);
730 }
731
732 location_t
733 cpp_main_loc (const cpp_reader *pfile)
734 {
735 return pfile->main_loc;
736 }
737
738 /* For preprocessed files, if the very first characters are
739 '#<SPACE>[01]<SPACE>', then handle a line directive so we know the
740 original file name. This will generate file_change callbacks,
741 which the front ends must handle appropriately given their state of
742 initialization. We peek directly into the character buffer, so
743 that we're not confused by otherwise-skipped white space &
744 comments. We can be very picky, because this should have been
745 machine-generated text (by us, no less). This way we do not
746 interfere with the module directive state machine. */
747
748 static bool
749 read_original_filename (cpp_reader *pfile)
750 {
751 auto *buf = pfile->buffer->next_line;
752
753 if (pfile->buffer->rlimit - buf > 4
754 && buf[0] == '#'
755 && buf[1] == ' '
756 // Also permit '1', as that's what used to be here
757 && (buf[2] == '0' || buf[2] == '1')
758 && buf[3] == ' ')
759 {
760 const cpp_token *token = _cpp_lex_direct (pfile);
761 gcc_checking_assert (token->type == CPP_HASH);
762 if (_cpp_handle_directive (pfile, token->flags & PREV_WHITE))
763 {
764 read_original_directory (pfile);
765
766 auto *penult = &linemap_check_ordinary
767 (LINEMAPS_LAST_MAP (pfile->line_table, false))[-1];
768 if (penult[1].reason == LC_RENAME_VERBATIM)
769 {
770 /* Expunge any evidence of the original linemap. */
771 pfile->line_table->highest_location
772 = pfile->line_table->highest_line
773 = penult[0].start_location;
774
775 penult[1].start_location = penult[0].start_location;
776 penult[1].reason = penult[0].reason;
777 penult[0] = penult[1];
778 pfile->line_table->info_ordinary.used--;
779 pfile->line_table->info_ordinary.cache = 0;
780 }
781
782 return true;
783 }
784 }
785
786 return false;
787 }
788
789 /* For preprocessed files, if the tokens following the first filename
790 line is of the form # <line> "/path/name//", handle the
791 directive so we know the original current directory.
792
793 As with the first line peeking, we can do this without lexing by
794 being picky. */
795 static void
796 read_original_directory (cpp_reader *pfile)
797 {
798 auto *buf = pfile->buffer->next_line;
799
800 if (pfile->buffer->rlimit - buf > 4
801 && buf[0] == '#'
802 && buf[1] == ' '
803 // Also permit '1', as that's what used to be here
804 && (buf[2] == '0' || buf[2] == '1')
805 && buf[3] == ' ')
806 {
807 const cpp_token *hash = _cpp_lex_direct (pfile);
808 gcc_checking_assert (hash->type == CPP_HASH);
809 pfile->state.in_directive = 1;
810 const cpp_token *number = _cpp_lex_direct (pfile);
811 gcc_checking_assert (number->type == CPP_NUMBER);
812 const cpp_token *string = _cpp_lex_direct (pfile);
813 pfile->state.in_directive = 0;
814
815 const unsigned char *text = nullptr;
816 size_t len = 0;
817 if (string->type == CPP_STRING)
818 {
819 /* The string value includes the quotes. */
820 text = string->val.str.text;
821 len = string->val.str.len;
822 }
823 if (len < 5
824 || !IS_DIR_SEPARATOR (text[len - 2])
825 || !IS_DIR_SEPARATOR (text[len - 3]))
826 {
827 /* That didn't work out, back out. */
828 _cpp_backup_tokens (pfile, 3);
829 return;
830 }
831
832 if (pfile->cb.dir_change)
833 {
834 /* Smash the string directly, it's dead at this point */
835 char *smashy = (char *)text;
836 smashy[len - 3] = 0;
837
838 pfile->cb.dir_change (pfile, smashy + 1);
839 }
840
841 /* We should be at EOL. */
842 }
843 }
844
845 /* This is called at the end of preprocessing. It pops the last
846 buffer and writes dependency output.
847
848 Maybe it should also reset state, such that you could call
849 cpp_start_read with a new filename to restart processing. */
850 void
851 cpp_finish (cpp_reader *pfile, FILE *deps_stream)
852 {
853 /* Warn about unused macros before popping the final buffer. */
854 if (CPP_OPTION (pfile, warn_unused_macros))
855 cpp_forall_identifiers (pfile, _cpp_warn_if_unused_macro, NULL);
856
857 /* lex.cc leaves the final buffer on the stack. This it so that
858 it returns an unending stream of CPP_EOFs to the client. If we
859 popped the buffer, we'd dereference a NULL buffer pointer and
860 segfault. It's nice to allow the client to do worry-free excess
861 cpp_get_token calls. */
862 while (pfile->buffer)
863 _cpp_pop_buffer (pfile);
864
865 if (deps_stream)
866 deps_write (pfile, deps_stream, 72);
867
868 /* Report on headers that could use multiple include guards. */
869 if (CPP_OPTION (pfile, print_include_names))
870 _cpp_report_missing_guards (pfile);
871 }
872
873 static void
874 post_options (cpp_reader *pfile)
875 {
876 /* -Wtraditional is not useful in C++ mode. */
877 if (CPP_OPTION (pfile, cplusplus))
878 CPP_OPTION (pfile, cpp_warn_traditional) = 0;
879
880 /* Permanently disable macro expansion if we are rescanning
881 preprocessed text. Read preprocesed source in ISO mode. */
882 if (CPP_OPTION (pfile, preprocessed))
883 {
884 if (!CPP_OPTION (pfile, directives_only))
885 pfile->state.prevent_expansion = 1;
886 CPP_OPTION (pfile, traditional) = 0;
887 }
888
889 if (CPP_OPTION (pfile, warn_trigraphs) == 2)
890 CPP_OPTION (pfile, warn_trigraphs) = !CPP_OPTION (pfile, trigraphs);
891
892 if (CPP_OPTION (pfile, traditional))
893 {
894 CPP_OPTION (pfile, trigraphs) = 0;
895 CPP_OPTION (pfile, warn_trigraphs) = 0;
896 }
897
898 if (CPP_OPTION (pfile, module_directives))
899 {
900 /* These unspellable tokens have a leading space. */
901 const char *const inits[spec_nodes::M_HWM]
902 = {"export ", "module ", "import ", "__import"};
903
904 for (int ix = 0; ix != spec_nodes::M_HWM; ix++)
905 {
906 cpp_hashnode *node = cpp_lookup (pfile, UC (inits[ix]),
907 strlen (inits[ix]));
908
909 /* Token we pass to the compiler. */
910 pfile->spec_nodes.n_modules[ix][1] = node;
911
912 if (ix != spec_nodes::M__IMPORT)
913 /* Token we recognize when lexing, drop the trailing ' '. */
914 node = cpp_lookup (pfile, NODE_NAME (node), NODE_LEN (node) - 1);
915
916 node->flags |= NODE_MODULE;
917 pfile->spec_nodes.n_modules[ix][0] = node;
918 }
919 }
920 }