]>
Commit | Line | Data |
---|---|---|
1e8b9746 | 1 | /* Part of CPP library. |
806a3d45 | 2 | Copyright (C) 1997-2014 Free Software Foundation, Inc. |
a8cffe11 | 3 | |
4 | This program is free software; you can redistribute it and/or modify it | |
5 | under the terms of the GNU General Public License as published by the | |
6bc9506f | 6 | Free Software Foundation; either version 3, or (at your option) any |
a8cffe11 | 7 | later version. |
8 | ||
9 | This program is distributed in the hope that it will be useful, | |
10 | but WITHOUT ANY WARRANTY; without even the implied warranty of | |
11 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
12 | GNU General Public License for more details. | |
13 | ||
14 | You should have received a copy of the GNU General Public License | |
6bc9506f | 15 | along with this program; see the file COPYING3. If not see |
16 | <http://www.gnu.org/licenses/>. */ | |
a8cffe11 | 17 | |
1e8b9746 | 18 | /* This header defines all the internal data structures and functions |
d856c8a6 | 19 | that need to be visible across files. It should not be used outside |
20 | cpplib. */ | |
1e8b9746 | 21 | |
d856c8a6 | 22 | #ifndef LIBCPP_INTERNAL_H |
23 | #define LIBCPP_INTERNAL_H | |
73a17672 | 24 | |
d856c8a6 | 25 | #include "symtab.h" |
c39ed964 | 26 | #include "cpp-id-data.h" |
0d086e18 | 27 | |
39b83bdb | 28 | #if HAVE_ICONV |
ebc03810 | 29 | #include <iconv.h> |
30 | #else | |
31 | #define HAVE_ICONV 0 | |
32 | typedef int iconv_t; /* dummy */ | |
33 | #endif | |
34 | ||
e61157d7 | 35 | #ifdef __cplusplus |
36 | extern "C" { | |
37 | #endif | |
38 | ||
0d086e18 | 39 | struct directive; /* Deliberately incomplete. */ |
02516fb9 | 40 | struct pending_option; |
5bbf045f | 41 | struct op; |
f579c40a | 42 | struct _cpp_strbuf; |
9a432f9a | 43 | |
44 | typedef bool (*convert_f) (iconv_t, const unsigned char *, size_t, | |
f579c40a | 45 | struct _cpp_strbuf *); |
9a432f9a | 46 | struct cset_converter |
47 | { | |
48 | convert_f func; | |
49 | iconv_t cd; | |
924bbf02 | 50 | int width; |
9a432f9a | 51 | }; |
28898f20 | 52 | |
13c457e1 | 53 | #define BITS_PER_CPPCHAR_T (CHAR_BIT * sizeof (cppchar_t)) |
54 | ||
79bd622b | 55 | /* Test if a sign is valid within a preprocessing number. */ |
56 | #define VALID_SIGN(c, prevc) \ | |
57 | (((c) == '+' || (c) == '-') && \ | |
58 | ((prevc) == 'e' || (prevc) == 'E' \ | |
5db5d057 | 59 | || (((prevc) == 'p' || (prevc) == 'P') \ |
60 | && CPP_OPTION (pfile, extended_numbers)))) | |
79bd622b | 61 | |
4d6f7dd4 | 62 | #define DIGIT_SEP(c) ((c) == '\'' && CPP_OPTION (pfile, digit_separators)) |
63 | ||
28898f20 | 64 | #define CPP_OPTION(PFILE, OPTION) ((PFILE)->opts.OPTION) |
65 | #define CPP_BUFFER(PFILE) ((PFILE)->buffer) | |
a54e0bf8 | 66 | #define CPP_BUF_COLUMN(BUF, CUR) ((CUR) - (BUF)->line_base) |
28898f20 | 67 | #define CPP_BUF_COL(BUF) CPP_BUF_COLUMN(BUF, (BUF)->cur) |
68 | ||
610625e3 | 69 | #define CPP_INCREMENT_LINE(PFILE, COLS_HINT) do { \ |
dbddc569 | 70 | const struct line_maps *line_table = PFILE->line_table; \ |
97bfb9ef | 71 | const struct line_map *map = \ |
72 | LINEMAPS_LAST_ORDINARY_MAP (line_table); \ | |
4999c35b | 73 | linenum_type line = SOURCE_LINE (map, line_table->highest_line); \ |
dbddc569 | 74 | linemap_line_start (PFILE->line_table, line + 1, COLS_HINT); \ |
610625e3 | 75 | } while (0) |
76 | ||
28898f20 | 77 | /* Maximum nesting of cpp_buffers. We use a static limit, partly for |
78 | efficiency, and partly to limit runaway recursion. */ | |
79 | #define CPP_STACK_MAX 200 | |
80 | ||
198b48a0 | 81 | /* Host alignment handling. */ |
82 | struct dummy | |
83 | { | |
84 | char c; | |
85 | union | |
86 | { | |
87 | double d; | |
88 | int *p; | |
89 | } u; | |
90 | }; | |
91 | ||
92 | #define DEFAULT_ALIGNMENT offsetof (struct dummy, u) | |
93 | #define CPP_ALIGN2(size, align) (((size) + ((align) - 1)) & ~((align) - 1)) | |
94 | #define CPP_ALIGN(size) CPP_ALIGN2 (size, DEFAULT_ALIGNMENT) | |
95 | ||
71a7c282 | 96 | #define _cpp_mark_macro_used(NODE) do { \ |
97 | if ((NODE)->type == NT_MACRO && !((NODE)->flags & NODE_BUILTIN)) \ | |
98 | (NODE)->value.macro->used = 1; } while (0) | |
99 | ||
c7e5d924 | 100 | /* A generic memory buffer, and operations on it. */ |
06c92cbc | 101 | typedef struct _cpp_buff _cpp_buff; |
102 | struct _cpp_buff | |
103 | { | |
104 | struct _cpp_buff *next; | |
1fdf6039 | 105 | unsigned char *base, *cur, *limit; |
06c92cbc | 106 | }; |
107 | ||
f7fdd7a1 | 108 | extern _cpp_buff *_cpp_get_buff (cpp_reader *, size_t); |
109 | extern void _cpp_release_buff (cpp_reader *, _cpp_buff *); | |
110 | extern void _cpp_extend_buff (cpp_reader *, _cpp_buff **, size_t); | |
111 | extern _cpp_buff *_cpp_append_extend_buff (cpp_reader *, _cpp_buff *, size_t); | |
112 | extern void _cpp_free_buff (_cpp_buff *); | |
113 | extern unsigned char *_cpp_aligned_alloc (cpp_reader *, size_t); | |
114 | extern unsigned char *_cpp_unaligned_alloc (cpp_reader *, size_t); | |
c7e5d924 | 115 | |
e6a5f963 | 116 | #define BUFF_ROOM(BUFF) (size_t) ((BUFF)->limit - (BUFF)->cur) |
1fdf6039 | 117 | #define BUFF_FRONT(BUFF) ((BUFF)->cur) |
118 | #define BUFF_LIMIT(BUFF) ((BUFF)->limit) | |
06c92cbc | 119 | |
0d6d8dc0 | 120 | /* #include types. */ |
6adc88f8 | 121 | enum include_type {IT_INCLUDE, IT_INCLUDE_NEXT, IT_IMPORT, IT_CMDLINE, IT_DEFAULT}; |
0d6d8dc0 | 122 | |
f9b5f742 | 123 | union utoken |
28898f20 | 124 | { |
f9b5f742 | 125 | const cpp_token *token; |
126 | const cpp_token **ptoken; | |
28898f20 | 127 | }; |
128 | ||
e484a1cc | 129 | /* A "run" of tokens; part of a chain of runs. */ |
83dcbb5c | 130 | typedef struct tokenrun tokenrun; |
131 | struct tokenrun | |
132 | { | |
fb5ab82c | 133 | tokenrun *next, *prev; |
83dcbb5c | 134 | cpp_token *base, *limit; |
135 | }; | |
136 | ||
a854276a | 137 | /* Accessor macros for struct cpp_context. */ |
878d9b47 | 138 | #define FIRST(c) ((c)->u.iso.first) |
139 | #define LAST(c) ((c)->u.iso.last) | |
140 | #define CUR(c) ((c)->u.trad.cur) | |
141 | #define RLIMIT(c) ((c)->u.trad.rlimit) | |
a854276a | 142 | |
ce70f433 | 143 | /* This describes some additional data that is added to the macro |
144 | token context of type cpp_context, when -ftrack-macro-expansion is | |
145 | on. */ | |
146 | typedef struct | |
147 | { | |
148 | /* The node of the macro we are referring to. */ | |
149 | cpp_hashnode *macro_node; | |
150 | /* This buffer contains an array of virtual locations. The virtual | |
151 | location at index 0 is the virtual location of the token at index | |
152 | 0 in the current instance of cpp_context; similarly for all the | |
153 | other virtual locations. */ | |
154 | source_location *virt_locs; | |
155 | /* This is a pointer to the current virtual location. This is used | |
156 | to iterate over the virtual locations while we iterate over the | |
157 | tokens they belong to. */ | |
158 | source_location *cur_virt_loc; | |
159 | } macro_context; | |
160 | ||
161 | /* The kind of tokens carried by a cpp_context. */ | |
162 | enum context_tokens_kind { | |
163 | /* This is the value of cpp_context::tokens_kind if u.iso.first | |
164 | contains an instance of cpp_token **. */ | |
165 | TOKENS_KIND_INDIRECT, | |
166 | /* This is the value of cpp_context::tokens_kind if u.iso.first | |
167 | contains an instance of cpp_token *. */ | |
168 | TOKENS_KIND_DIRECT, | |
169 | /* This is the value of cpp_context::tokens_kind when the token | |
170 | context contains tokens resulting from macro expansion. In that | |
171 | case cpp_context::c.mc points to an instance of | |
172 | macro_context. This is used only when the | |
173 | -ftrack-macro-expansion flag is on. */ | |
174 | TOKENS_KIND_EXTENDED | |
175 | }; | |
176 | ||
28898f20 | 177 | typedef struct cpp_context cpp_context; |
178 | struct cpp_context | |
179 | { | |
180 | /* Doubly-linked list. */ | |
181 | cpp_context *next, *prev; | |
182 | ||
a854276a | 183 | union |
184 | { | |
185 | /* For ISO macro expansion. Contexts other than the base context | |
186 | are contiguous tokens. e.g. macro expansions, expanded | |
187 | argument tokens. */ | |
188 | struct | |
189 | { | |
190 | union utoken first; | |
191 | union utoken last; | |
192 | } iso; | |
193 | ||
194 | /* For traditional macro expansion. */ | |
195 | struct | |
196 | { | |
fe4dcd90 | 197 | const unsigned char *cur; |
198 | const unsigned char *rlimit; | |
a854276a | 199 | } trad; |
200 | } u; | |
28898f20 | 201 | |
084163dc | 202 | /* If non-NULL, a buffer used for storage related to this context. |
1785b647 | 203 | When the context is popped, the buffer is released. */ |
084163dc | 204 | _cpp_buff *buff; |
205 | ||
ce70f433 | 206 | /* If tokens_kind is TOKENS_KIND_EXTENDED, then (as we thus are in a |
207 | macro context) this is a pointer to an instance of macro_context. | |
208 | Otherwise if tokens_kind is *not* TOKENS_KIND_EXTENDED, then, if | |
209 | we are in a macro context, this is a pointer to an instance of | |
210 | cpp_hashnode, representing the name of the macro this context is | |
211 | for. If we are not in a macro context, then this is just NULL. | |
212 | Note that when tokens_kind is TOKENS_KIND_EXTENDED, the memory | |
213 | used by the instance of macro_context pointed to by this member | |
214 | is de-allocated upon de-allocation of the instance of struct | |
215 | cpp_context. */ | |
216 | union | |
217 | { | |
218 | macro_context *mc; | |
219 | cpp_hashnode *macro; | |
220 | } c; | |
f9b5f742 | 221 | |
ce70f433 | 222 | /* This determines the type of tokens held by this context. */ |
223 | enum context_tokens_kind tokens_kind; | |
28898f20 | 224 | }; |
225 | ||
226 | struct lexer_state | |
227 | { | |
228 | /* Nonzero if first token on line is CPP_HASH. */ | |
229 | unsigned char in_directive; | |
230 | ||
7825551f | 231 | /* Nonzero if in a directive that will handle padding tokens itself. |
232 | #include needs this to avoid problems with computed include and | |
233 | spacing between tokens. */ | |
234 | unsigned char directive_wants_padding; | |
235 | ||
5e878517 | 236 | /* True if we are skipping a failed conditional group. */ |
237 | unsigned char skipping; | |
238 | ||
28898f20 | 239 | /* Nonzero if in a directive that takes angle-bracketed headers. */ |
240 | unsigned char angled_headers; | |
241 | ||
bab5e68f | 242 | /* Nonzero if in a #if or #elif directive. */ |
243 | unsigned char in_expression; | |
244 | ||
28898f20 | 245 | /* Nonzero to save comments. Turned off if discard_comments, and in |
246 | all directives apart from #define. */ | |
247 | unsigned char save_comments; | |
248 | ||
28898f20 | 249 | /* Nonzero if lexing __VA_ARGS__ is valid. */ |
250 | unsigned char va_args_ok; | |
251 | ||
252 | /* Nonzero if lexing poisoned identifiers is valid. */ | |
253 | unsigned char poisoned_ok; | |
254 | ||
255 | /* Nonzero to prevent macro expansion. */ | |
b1a9ff83 | 256 | unsigned char prevent_expansion; |
28898f20 | 257 | |
258 | /* Nonzero when parsing arguments to a function-like macro. */ | |
259 | unsigned char parsing_args; | |
5bbf045f | 260 | |
f6751ff2 | 261 | /* Nonzero if in a __has_include__ or __has_include_next__ statement. */ |
262 | unsigned char in__has_include__; | |
263 | ||
3eb3f293 | 264 | /* Nonzero if prevent_expansion is true only because output is |
265 | being discarded. */ | |
266 | unsigned char discarding_output; | |
267 | ||
5bbf045f | 268 | /* Nonzero to skip evaluating part of an expression. */ |
269 | unsigned int skip_eval; | |
b75b98aa | 270 | |
271 | /* Nonzero when handling a deferred pragma. */ | |
272 | unsigned char in_deferred_pragma; | |
273 | ||
274 | /* Nonzero if the deferred pragma being handled allows macro expansion. */ | |
275 | unsigned char pragma_allow_expansion; | |
28898f20 | 276 | }; |
277 | ||
278 | /* Special nodes - identifiers with predefined significance. */ | |
279 | struct spec_nodes | |
280 | { | |
28898f20 | 281 | cpp_hashnode *n_defined; /* defined operator */ |
528671b3 | 282 | cpp_hashnode *n_true; /* C++ keyword true */ |
283 | cpp_hashnode *n_false; /* C++ keyword false */ | |
28898f20 | 284 | cpp_hashnode *n__VA_ARGS__; /* C99 vararg macros */ |
f6751ff2 | 285 | cpp_hashnode *n__has_include__; /* __has_include__ operator */ |
286 | cpp_hashnode *n__has_include_next__; /* __has_include_next__ operator */ | |
28898f20 | 287 | }; |
288 | ||
a54e0bf8 | 289 | typedef struct _cpp_line_note _cpp_line_note; |
290 | struct _cpp_line_note | |
291 | { | |
292 | /* Location in the clean line the note refers to. */ | |
fe4dcd90 | 293 | const unsigned char *pos; |
a54e0bf8 | 294 | |
aad4a87f | 295 | /* Type of note. The 9 'from' trigraph characters represent those |
296 | trigraphs, '\\' an escaped newline, ' ' an escaped newline with | |
3a45011c | 297 | intervening space, 0 represents a note that has already been handled, |
298 | and anything else is invalid. */ | |
aad4a87f | 299 | unsigned int type; |
a54e0bf8 | 300 | }; |
301 | ||
e484a1cc | 302 | /* Represents the contents of a file cpplib has read in. */ |
d7503801 | 303 | struct cpp_buffer |
304 | { | |
fe4dcd90 | 305 | const unsigned char *cur; /* Current location. */ |
306 | const unsigned char *line_base; /* Start of current physical line. */ | |
307 | const unsigned char *next_line; /* Start of to-be-cleaned logical line. */ | |
787c3d1a | 308 | |
fe4dcd90 | 309 | const unsigned char *buf; /* Entire character buffer. */ |
310 | const unsigned char *rlimit; /* Writable byte at end of file. */ | |
914db4b7 | 311 | const unsigned char *to_free; /* Pointer that should be freed when |
312 | popping the buffer. */ | |
a54e0bf8 | 313 | |
fe4dcd90 | 314 | _cpp_line_note *notes; /* Array of notes. */ |
315 | unsigned int cur_note; /* Next note to process. */ | |
316 | unsigned int notes_used; /* Number of notes. */ | |
317 | unsigned int notes_cap; /* Size of allocated array. */ | |
d7503801 | 318 | |
d7503801 | 319 | struct cpp_buffer *prev; |
320 | ||
1824e2bd | 321 | /* Pointer into the file table; non-NULL if this is a file buffer. |
322 | Used for include_next and to record control macros. */ | |
323 | struct _cpp_file *file; | |
d7503801 | 324 | |
cca5dddc | 325 | /* Saved value of __TIMESTAMP__ macro - date and time of last modification |
326 | of the associated file. */ | |
327 | const unsigned char *timestamp; | |
328 | ||
d7503801 | 329 | /* Value of if_stack at start of this file. |
330 | Used to prohibit unmatched #endif (etc) in an include file. */ | |
331 | struct if_stack *if_stack; | |
332 | ||
a54e0bf8 | 333 | /* True if we need to get the next clean line. */ |
334 | bool need_line; | |
d7503801 | 335 | |
336 | /* True if we have already warned about C++ comments in this file. | |
337 | The warning happens only for C89 extended mode with -pedantic on, | |
338 | or for -Wtraditional, and only once per file (otherwise it would | |
339 | be far too noisy). */ | |
610625e3 | 340 | unsigned int warned_cplusplus_comments : 1; |
d7503801 | 341 | |
342 | /* True if we don't process trigraphs and escaped newlines. True | |
343 | for preprocessed input, command line directives, and _Pragma | |
344 | buffers. */ | |
610625e3 | 345 | unsigned int from_stage3 : 1; |
d7503801 | 346 | |
6e04daf1 | 347 | /* At EOF, a buffer is automatically popped. If RETURN_AT_EOF is |
348 | true, a CPP_EOF token is then returned. Otherwise, the next | |
349 | token from the enclosing buffer is returned. */ | |
350 | unsigned int return_at_eof : 1; | |
0d6d8dc0 | 351 | |
610625e3 | 352 | /* One for a system header, two for a C system header file that therefore |
7c2df241 | 353 | needs to be extern "C" protected in C++, and zero otherwise. */ |
610625e3 | 354 | unsigned char sysp; |
355 | ||
3ec84a0b | 356 | /* The directory of this buffer's file. Its NAME member is not |
357 | allocated, so we don't need to worry about freeing it. */ | |
1824e2bd | 358 | struct cpp_dir dir; |
0bb65704 | 359 | |
787c3d1a | 360 | /* Descriptor for converting from the input character set to the |
361 | source character set. */ | |
362 | struct cset_converter input_cset_desc; | |
d7503801 | 363 | }; |
364 | ||
038c21f1 | 365 | /* The list of saved macros by push_macro pragma. */ |
366 | struct def_pragma_macro { | |
367 | /* Chain element to previous saved macro. */ | |
368 | struct def_pragma_macro *next; | |
369 | /* Name of the macro. */ | |
370 | char *name; | |
371 | /* The stored macro content. */ | |
0d601ff4 | 372 | unsigned char *definition; |
373 | ||
374 | /* Definition line number. */ | |
375 | source_location line; | |
376 | /* If macro defined in system header. */ | |
377 | unsigned int syshdr : 1; | |
378 | /* Nonzero if it has been expanded or had its existence tested. */ | |
379 | unsigned int used : 1; | |
380 | ||
381 | /* Mark if we save an undefined macro. */ | |
382 | unsigned int is_undef : 1; | |
038c21f1 | 383 | }; |
384 | ||
28898f20 | 385 | /* A cpp_reader encapsulates the "state" of a pre-processor run. |
386 | Applying cpp_get_token repeatedly yields a stream of pre-processor | |
387 | tokens. Usually, there is only one cpp_reader object active. */ | |
28898f20 | 388 | struct cpp_reader |
389 | { | |
390 | /* Top of buffer stack. */ | |
391 | cpp_buffer *buffer; | |
392 | ||
bab5e68f | 393 | /* Overlaid buffer (can be different after processing #include). */ |
394 | cpp_buffer *overlaid_buffer; | |
395 | ||
28898f20 | 396 | /* Lexer state. */ |
397 | struct lexer_state state; | |
398 | ||
1ea7ed21 | 399 | /* Source line tracking. */ |
ceec9c13 | 400 | struct line_maps *line_table; |
36a0aa7c | 401 | |
729d2022 | 402 | /* The line of the '#' of the current directive. */ |
ed000086 | 403 | source_location directive_line; |
28898f20 | 404 | |
06c92cbc | 405 | /* Memory buffers. */ |
e6a5f963 | 406 | _cpp_buff *a_buff; /* Aligned permanent storage. */ |
1fdf6039 | 407 | _cpp_buff *u_buff; /* Unaligned permanent storage. */ |
408 | _cpp_buff *free_buffs; /* Free buffer chain. */ | |
06c92cbc | 409 | |
28898f20 | 410 | /* Context stack. */ |
411 | struct cpp_context base_context; | |
412 | struct cpp_context *context; | |
413 | ||
414 | /* If in_directive, the directive if known. */ | |
415 | const struct directive *directive; | |
416 | ||
d6d3c909 | 417 | /* Token generated while handling a directive, if any. */ |
418 | cpp_token directive_result; | |
419 | ||
931b0a0f | 420 | /* When expanding a macro at top-level, this is the location of the |
421 | macro invocation. */ | |
422 | source_location invocation_location; | |
423 | ||
8c6425eb | 424 | /* Nonzero if we are about to expand a macro. Note that if we are |
425 | really expanding a macro, the function macro_of_context returns | |
426 | the macro being expanded and this flag is set to false. Client | |
427 | code should use the function in_macro_expansion_p to know if we | |
428 | are either about to expand a macro, or are actually expanding | |
429 | one. */ | |
430 | bool about_to_expand_macro_p; | |
931b0a0f | 431 | |
e69f4d0e | 432 | /* Search paths for include files. */ |
1824e2bd | 433 | struct cpp_dir *quote_include; /* "" */ |
434 | struct cpp_dir *bracket_include; /* <> */ | |
435 | struct cpp_dir no_search_path; /* No path. */ | |
436 | ||
68faebf4 | 437 | /* Chain of all hashed _cpp_file instances. */ |
438 | struct _cpp_file *all_files; | |
1824e2bd | 439 | |
64386834 | 440 | struct _cpp_file *main_file; |
441 | ||
1824e2bd | 442 | /* File and directory hash table. */ |
aab5b9fa | 443 | struct htab *file_hash; |
821fa045 | 444 | struct htab *dir_hash; |
64cb8c90 | 445 | struct file_hash_entry_pool *file_hash_entries; |
1824e2bd | 446 | |
248dfc42 | 447 | /* Negative path lookup hash table. */ |
448 | struct htab *nonexistent_file_hash; | |
449 | struct obstack nonexistent_file_ob; | |
450 | ||
1824e2bd | 451 | /* Nonzero means don't look for #include "foo" the source-file |
452 | directory. */ | |
453 | bool quote_ignores_source_dir; | |
454 | ||
678704be | 455 | /* Nonzero if any file has contained #pragma once or #import has |
68faebf4 | 456 | been used. */ |
457 | bool seen_once_only; | |
e69f4d0e | 458 | |
7ef5b942 | 459 | /* Multiple include optimization. */ |
28898f20 | 460 | const cpp_hashnode *mi_cmacro; |
461 | const cpp_hashnode *mi_ind_cmacro; | |
fa233610 | 462 | bool mi_valid; |
28898f20 | 463 | |
83dcbb5c | 464 | /* Lexing. */ |
465 | cpp_token *cur_token; | |
466 | tokenrun base_run, *cur_run; | |
fb5ab82c | 467 | unsigned int lookaheads; |
83dcbb5c | 468 | |
d10cfa8d | 469 | /* Nonzero prevents the lexer from re-using the token runs. */ |
83dcbb5c | 470 | unsigned int keep_tokens; |
471 | ||
28898f20 | 472 | /* Buffer to hold macro definition string. */ |
473 | unsigned char *macro_buffer; | |
474 | unsigned int macro_buffer_len; | |
475 | ||
9a432f9a | 476 | /* Descriptor for converting from the source character set to the |
477 | execution character set. */ | |
478 | struct cset_converter narrow_cset_desc; | |
ebc03810 | 479 | |
538ba11a | 480 | /* Descriptor for converting from the source character set to the |
481 | UTF-8 execution character set. */ | |
482 | struct cset_converter utf8_cset_desc; | |
483 | ||
924bbf02 | 484 | /* Descriptor for converting from the source character set to the |
485 | UTF-16 execution character set. */ | |
486 | struct cset_converter char16_cset_desc; | |
487 | ||
488 | /* Descriptor for converting from the source character set to the | |
489 | UTF-32 execution character set. */ | |
490 | struct cset_converter char32_cset_desc; | |
491 | ||
9a432f9a | 492 | /* Descriptor for converting from the source character set to the |
493 | wide execution character set. */ | |
494 | struct cset_converter wide_cset_desc; | |
ebc03810 | 495 | |
9c343313 | 496 | /* Date and time text. Calculated together if either is requested. */ |
fe4dcd90 | 497 | const unsigned char *date; |
498 | const unsigned char *time; | |
28898f20 | 499 | |
f9b5f742 | 500 | /* A token forcing paste avoidance, and the EOF token. */ |
501 | cpp_token avoid_paste; | |
502 | cpp_token eof; | |
503 | ||
61191376 | 504 | /* Opaque handle to the dependencies of mkdeps.c. */ |
28898f20 | 505 | struct deps *deps; |
506 | ||
507 | /* Obstack holding all macro hash nodes. This never shrinks. | |
f03668bd | 508 | See identifiers.c */ |
0d086e18 | 509 | struct obstack hash_ob; |
28898f20 | 510 | |
511 | /* Obstack holding buffer and conditional structures. This is a | |
f03668bd | 512 | real stack. See directives.c. */ |
0d086e18 | 513 | struct obstack buffer_ob; |
28898f20 | 514 | |
515 | /* Pragma table - dynamic, because a library user can add to the | |
516 | list of recognized pragmas. */ | |
517 | struct pragma_entry *pragmas; | |
518 | ||
5c120a72 | 519 | /* Call backs to cpplib client. */ |
28898f20 | 520 | struct cpp_callbacks cb; |
521 | ||
b1a9ff83 | 522 | /* Identifier hash table. */ |
0d086e18 | 523 | struct ht *hash_table; |
524 | ||
5bbf045f | 525 | /* Expression parser stack. */ |
526 | struct op *op_stack, *op_limit; | |
527 | ||
28898f20 | 528 | /* User visible options. */ |
529 | struct cpp_options opts; | |
530 | ||
531 | /* Special nodes - identifiers with predefined significance to the | |
532 | preprocessor. */ | |
533 | struct spec_nodes spec_nodes; | |
534 | ||
0d086e18 | 535 | /* Whether cpplib owns the hashtable. */ |
1824e2bd | 536 | bool our_hashtable; |
0bb65704 | 537 | |
fb83e0d6 | 538 | /* Traditional preprocessing output buffer (a logical line). */ |
539 | struct | |
540 | { | |
fe4dcd90 | 541 | unsigned char *base; |
542 | unsigned char *limit; | |
543 | unsigned char *cur; | |
ed000086 | 544 | source_location first_line; |
fb83e0d6 | 545 | } out; |
546 | ||
f03668bd | 547 | /* Used for buffer overlays by traditional.c. */ |
fe4dcd90 | 548 | const unsigned char *saved_cur, *saved_rlimit, *saved_line_base; |
610625e3 | 549 | |
573aba85 | 550 | /* A saved list of the defined macros, for dependency checking |
551 | of precompiled headers. */ | |
552 | struct cpp_savedstate *savedstate; | |
ce079f70 | 553 | |
554 | /* Next value of __COUNTER__ macro. */ | |
555 | unsigned int counter; | |
956c6108 | 556 | |
557 | /* Table of comments, when state.save_comments is true. */ | |
558 | cpp_comment_table comments; | |
038c21f1 | 559 | |
560 | /* List of saved macros by push_macro. */ | |
561 | struct def_pragma_macro *pushed_macros; | |
6ea2c7a3 | 562 | |
563 | /* If non-null, the lexer will use this location for the next token | |
564 | instead of getting a location from the linemap. */ | |
565 | source_location *forced_token_location_p; | |
28898f20 | 566 | }; |
567 | ||
93ce8ce4 | 568 | /* Character classes. Based on the more primitive macros in safe-ctype.h. |
1e8b9746 | 569 | If the definition of `numchar' looks odd to you, please look up the |
78719282 | 570 | definition of a pp-number in the C standard [section 6.4.8 of C99]. |
571 | ||
572 | In the unlikely event that characters other than \r and \n enter | |
f03668bd | 573 | the set is_vspace, the macro handle_newline() in lex.c must be |
78719282 | 574 | updated. */ |
2ff3ad1d | 575 | #define _dollar_ok(x) ((x) == '$' && CPP_OPTION (pfile, dollars_in_ident)) |
1e8b9746 | 576 | |
93ce8ce4 | 577 | #define is_idchar(x) (ISIDNUM(x) || _dollar_ok(x)) |
578 | #define is_numchar(x) ISIDNUM(x) | |
579 | #define is_idstart(x) (ISIDST(x) || _dollar_ok(x)) | |
580 | #define is_numstart(x) ISDIGIT(x) | |
581 | #define is_hspace(x) ISBLANK(x) | |
582 | #define is_vspace(x) IS_VSPACE(x) | |
583 | #define is_nvspace(x) IS_NVSPACE(x) | |
584 | #define is_space(x) IS_SPACE_OR_NUL(x) | |
1e8b9746 | 585 | |
93ce8ce4 | 586 | /* This table is constant if it can be initialized at compile time, |
1e8b9746 | 587 | which is the case if cpp was compiled with GCC >=2.7, or another |
588 | compiler that supports C99. */ | |
b3954366 | 589 | #if HAVE_DESIGNATED_INITIALIZERS |
b3954366 | 590 | extern const unsigned char _cpp_trigraph_map[UCHAR_MAX + 1]; |
1e8b9746 | 591 | #else |
b3954366 | 592 | extern unsigned char _cpp_trigraph_map[UCHAR_MAX + 1]; |
1e8b9746 | 593 | #endif |
594 | ||
595 | /* Macros. */ | |
596 | ||
610625e3 | 597 | static inline int cpp_in_system_header (cpp_reader *); |
598 | static inline int | |
599 | cpp_in_system_header (cpp_reader *pfile) | |
600 | { | |
601 | return pfile->buffer ? pfile->buffer->sysp : 0; | |
602 | } | |
5ae82d58 | 603 | #define CPP_PEDANTIC(PF) CPP_OPTION (PF, cpp_pedantic) |
604 | #define CPP_WTRADITIONAL(PF) CPP_OPTION (PF, cpp_warn_traditional) | |
1e8b9746 | 605 | |
927b511f | 606 | static inline int cpp_in_primary_file (cpp_reader *); |
607 | static inline int | |
608 | cpp_in_primary_file (cpp_reader *pfile) | |
609 | { | |
610 | return pfile->line_table->depth == 1; | |
611 | } | |
612 | ||
f03668bd | 613 | /* In macro.c */ |
f7fdd7a1 | 614 | extern void _cpp_free_definition (cpp_hashnode *); |
615 | extern bool _cpp_create_definition (cpp_reader *, cpp_hashnode *); | |
616 | extern void _cpp_pop_context (cpp_reader *); | |
617 | extern void _cpp_push_text_context (cpp_reader *, cpp_hashnode *, | |
fe4dcd90 | 618 | const unsigned char *, size_t); |
109ca87a | 619 | extern bool _cpp_save_parameter (cpp_reader *, cpp_macro *, cpp_hashnode *, |
620 | cpp_hashnode *); | |
f7fdd7a1 | 621 | extern bool _cpp_arguments_ok (cpp_reader *, cpp_macro *, const cpp_hashnode *, |
622 | unsigned int); | |
fe4dcd90 | 623 | extern const unsigned char *_cpp_builtin_macro_text (cpp_reader *, |
624 | cpp_hashnode *); | |
b75b98aa | 625 | extern int _cpp_warn_if_unused_macro (cpp_reader *, cpp_hashnode *, void *); |
626 | extern void _cpp_push_token_context (cpp_reader *, cpp_hashnode *, | |
627 | const cpp_token *, unsigned int); | |
89768577 | 628 | extern void _cpp_backup_tokens_direct (cpp_reader *, unsigned int); |
b75b98aa | 629 | |
f03668bd | 630 | /* In identifiers.c */ |
2b15d2ba | 631 | extern void _cpp_init_hashtable (cpp_reader *, cpp_hash_table *); |
f7fdd7a1 | 632 | extern void _cpp_destroy_hashtable (cpp_reader *); |
73a17672 | 633 | |
f03668bd | 634 | /* In files.c */ |
64386834 | 635 | typedef struct _cpp_file _cpp_file; |
04c0bfd0 | 636 | extern _cpp_file *_cpp_find_file (cpp_reader *, const char *, cpp_dir *, |
6adc88f8 | 637 | bool, int, bool); |
64386834 | 638 | extern bool _cpp_find_failed (_cpp_file *); |
68faebf4 | 639 | extern void _cpp_mark_file_once_only (cpp_reader *, struct _cpp_file *); |
f7fdd7a1 | 640 | extern void _cpp_fake_include (cpp_reader *, const char *); |
64386834 | 641 | extern bool _cpp_stack_file (cpp_reader *, _cpp_file*, bool); |
1824e2bd | 642 | extern bool _cpp_stack_include (cpp_reader *, const char *, int, |
643 | enum include_type); | |
f7fdd7a1 | 644 | extern int _cpp_compare_file_date (cpp_reader *, const char *, int); |
645 | extern void _cpp_report_missing_guards (cpp_reader *); | |
1824e2bd | 646 | extern void _cpp_init_files (cpp_reader *); |
647 | extern void _cpp_cleanup_files (cpp_reader *); | |
914db4b7 | 648 | extern void _cpp_pop_file_buffer (cpp_reader *, struct _cpp_file *, |
649 | const unsigned char *); | |
9f787687 | 650 | extern bool _cpp_save_file_entries (cpp_reader *pfile, FILE *f); |
651 | extern bool _cpp_read_file_entries (cpp_reader *, FILE *); | |
5e791406 | 652 | extern const char *_cpp_get_file_name (_cpp_file *); |
cca5dddc | 653 | extern struct stat *_cpp_get_file_stat (_cpp_file *); |
f6751ff2 | 654 | extern bool _cpp_has_header (cpp_reader *, const char *, int, |
655 | enum include_type); | |
1e8b9746 | 656 | |
f03668bd | 657 | /* In expr.c */ |
536a48ee | 658 | extern bool _cpp_parse_expr (cpp_reader *, bool); |
f7fdd7a1 | 659 | extern struct op *_cpp_expand_op_stack (cpp_reader *); |
1e8b9746 | 660 | |
f03668bd | 661 | /* In lex.c */ |
f7fdd7a1 | 662 | extern void _cpp_process_line_notes (cpp_reader *, int); |
663 | extern void _cpp_clean_line (cpp_reader *); | |
664 | extern bool _cpp_get_fresh_line (cpp_reader *); | |
665 | extern bool _cpp_skip_block_comment (cpp_reader *); | |
666 | extern cpp_token *_cpp_temp_token (cpp_reader *); | |
667 | extern const cpp_token *_cpp_lex_token (cpp_reader *); | |
668 | extern cpp_token *_cpp_lex_direct (cpp_reader *); | |
109ca87a | 669 | extern unsigned char *_cpp_spell_ident_ucns (unsigned char *, cpp_hashnode *); |
f7fdd7a1 | 670 | extern int _cpp_equiv_tokens (const cpp_token *, const cpp_token *); |
671 | extern void _cpp_init_tokenrun (tokenrun *, unsigned int); | |
038c21f1 | 672 | extern cpp_hashnode *_cpp_lex_identifier (cpp_reader *, const char *); |
a2eb22f0 | 673 | extern int _cpp_remaining_tokens_num_in_context (cpp_context *); |
b735cc56 | 674 | extern void _cpp_init_lexer (void); |
0578f103 | 675 | |
f03668bd | 676 | /* In init.c. */ |
f7fdd7a1 | 677 | extern void _cpp_maybe_push_include_file (cpp_reader *); |
ba99525e | 678 | extern const char *cpp_named_operator2name (enum cpp_ttype type); |
fe560637 | 679 | |
f03668bd | 680 | /* In directives.c */ |
f7fdd7a1 | 681 | extern int _cpp_test_assertion (cpp_reader *, unsigned int *); |
682 | extern int _cpp_handle_directive (cpp_reader *, int); | |
683 | extern void _cpp_define_builtin (cpp_reader *, const char *); | |
684 | extern char ** _cpp_save_pragma_names (cpp_reader *); | |
685 | extern void _cpp_restore_pragma_names (cpp_reader *, char **); | |
2d507e67 | 686 | extern int _cpp_do__Pragma (cpp_reader *); |
f7fdd7a1 | 687 | extern void _cpp_init_directives (cpp_reader *); |
688 | extern void _cpp_init_internal_pragmas (cpp_reader *); | |
689 | extern void _cpp_do_file_change (cpp_reader *, enum lc_reason, const char *, | |
4999c35b | 690 | linenum_type, unsigned int); |
f7fdd7a1 | 691 | extern void _cpp_pop_buffer (cpp_reader *); |
f6751ff2 | 692 | extern char *_cpp_bracket_include (cpp_reader *); |
e057cf7c | 693 | |
fcde64dc | 694 | /* In directives.c */ |
695 | struct _cpp_dir_only_callbacks | |
696 | { | |
697 | /* Called to print a block of lines. */ | |
698 | void (*print_lines) (int, const void *, size_t); | |
699 | void (*maybe_print_line) (source_location); | |
700 | }; | |
701 | ||
702 | extern void _cpp_preprocess_dir_only (cpp_reader *, | |
703 | const struct _cpp_dir_only_callbacks *); | |
704 | ||
f03668bd | 705 | /* In traditional.c. */ |
69edc0b3 | 706 | extern bool _cpp_scan_out_logical_line (cpp_reader *, cpp_macro *); |
f7fdd7a1 | 707 | extern bool _cpp_read_logical_line_trad (cpp_reader *); |
fe4dcd90 | 708 | extern void _cpp_overlay_buffer (cpp_reader *pfile, const unsigned char *, |
709 | size_t); | |
f7fdd7a1 | 710 | extern void _cpp_remove_overlay (cpp_reader *); |
711 | extern bool _cpp_create_trad_definition (cpp_reader *, cpp_macro *); | |
712 | extern bool _cpp_expansions_different_trad (const cpp_macro *, | |
713 | const cpp_macro *); | |
fe4dcd90 | 714 | extern unsigned char *_cpp_copy_replacement_text (const cpp_macro *, |
715 | unsigned char *); | |
f7fdd7a1 | 716 | extern size_t _cpp_replacement_text_len (const cpp_macro *); |
0bb65704 | 717 | |
f03668bd | 718 | /* In charset.c. */ |
bce47149 | 719 | |
720 | /* The normalization state at this point in the sequence. | |
721 | It starts initialized to all zeros, and at the end | |
722 | 'level' is the normalization level of the sequence. */ | |
723 | ||
724 | struct normalize_state | |
725 | { | |
460f52aa | 726 | /* The previous starter character. */ |
bce47149 | 727 | cppchar_t previous; |
460f52aa | 728 | /* The combining class of the previous character (whether or not a |
729 | starter). */ | |
bce47149 | 730 | unsigned char prev_class; |
731 | /* The lowest normalization level so far. */ | |
732 | enum cpp_normalize_level level; | |
733 | }; | |
734 | #define INITIAL_NORMALIZE_STATE { 0, 0, normalized_KC } /* Initializer in field order: previous, prev_class, level. */ | |
735 | #define NORMALIZE_STATE_RESULT(st) ((st)->level) /* The 'level' field of the state pointed to by ST. */ | |
736 | ||
460f52aa | 737 | /* We saw a character C that matches ISIDNUM(); update the normalize_state |
bce47149 | 738 | pointed to by ST: record C as 'previous' and reset 'prev_class' to 0. */ |
460f52aa | 739 | #define NORMALIZE_STATE_UPDATE_IDNUM(st, c) \ |
740 | ((st)->previous = (c), (st)->prev_class = 0) | |
bce47149 | 741 | |
fe4dcd90 | 742 | extern cppchar_t _cpp_valid_ucn (cpp_reader *, const unsigned char **, |
bce47149 | 743 | const unsigned char *, int, |
744 | struct normalize_state *state); | |
9a432f9a | 745 | extern void _cpp_destroy_iconv (cpp_reader *); |
fe4dcd90 | 746 | extern unsigned char *_cpp_convert_input (cpp_reader *, const char *, |
747 | unsigned char *, size_t, size_t, | |
d656d07a | 748 | const unsigned char **, off_t *); |
57ba96e9 | 749 | extern const char *_cpp_default_encoding (void); |
bb1fa6bb | 750 | extern cpp_hashnode * _cpp_interpret_identifier (cpp_reader *pfile, |
751 | const unsigned char *id, | |
752 | size_t len); | |
2cbf1359 | 753 | |
/* Utility routines and macros.  */

/* Expand to two comma-separated expressions for the string STR: STR
   converted to const unsigned char *, followed by its length excluding
   the terminating NUL.  The length is computed with sizeof, so STR
   must be a string literal or a char array, never a pointer.  The
   parameter is parenthesized so the cast and the sizeof both apply to
   the whole argument.  */
#define DSC(str) (const unsigned char *) (str), sizeof (str) - 1
c95d8aaa | 756 | |
28898f20 | 757 | /* These are inline functions instead of macros so we can get type |
758 | checking. */ | |
fe4dcd90 | 759 | static inline int ustrcmp (const unsigned char *, const unsigned char *); |
760 | static inline int ustrncmp (const unsigned char *, const unsigned char *, | |
761 | size_t); | |
762 | static inline size_t ustrlen (const unsigned char *); | |
d8954404 | 763 | static inline const unsigned char *uxstrdup (const unsigned char *); |
764 | static inline const unsigned char *ustrchr (const unsigned char *, int); | |
fe4dcd90 | 765 | static inline int ufputs (const unsigned char *, FILE *); |
28898f20 | 766 | |
bb30d1f4 | 767 | /* Use a const char for the second parameter since it is usually a literal. */ |
768 | static inline int ustrcspn (const unsigned char *, const char *); | |
769 | ||
/* Compare the NUL-terminated strings S1 and S2 exactly as strcmp
   does, keeping the casts away from unsigned char in one place.  */
static inline int
ustrcmp (const unsigned char *s1, const unsigned char *s2)
{
  const char *lhs = (const char *) s1;
  const char *rhs = (const char *) s2;

  return strcmp (lhs, rhs);
}
775 | ||
/* Compare at most N characters of S1 and S2 exactly as strncmp
   does.  */
static inline int
ustrncmp (const unsigned char *s1, const unsigned char *s2, size_t n)
{
  const char *lhs = (const char *) s1;
  const char *rhs = (const char *) s2;

  return strncmp (lhs, rhs, n);
}
781 | ||
/* Return the length of the initial part of S1 that contains none of
   the characters in S2, as computed by strcspn.  The size_t result is
   narrowed to the int return type of this wrapper.  */
static inline int
ustrcspn (const unsigned char *s1, const char *s2)
{
  size_t span = strcspn ((const char *) s1, s2);

  return (int) span;
}
787 | ||
/* Return the length of the NUL-terminated string S1, as strlen
   does.  */
static inline size_t
ustrlen (const unsigned char *s1)
{
  const char *str = (const char *) s1;

  return strlen (str);
}
793 | ||
/* Duplicate the NUL-terminated string S1 with xstrdup and hand the
   copy back as a const unsigned char pointer.  */
static inline const unsigned char *
uxstrdup (const unsigned char *s1)
{
  const char *src = (const char *) s1;

  return (const unsigned char *) xstrdup (src);
}
799 | ||
/* Locate the first occurrence of the character C in the
   NUL-terminated string S1, as strchr does; the result of strchr is
   returned unchanged apart from the pointer type.  */
static inline const unsigned char *
ustrchr (const unsigned char *s1, int c)
{
  const char *hit = strchr ((const char *) s1, c);

  return (const unsigned char *) hit;
}
805 | ||
/* Write the NUL-terminated string S to the stream F with fputs and
   return whatever fputs returns.  */
static inline int
ufputs (const unsigned char *s, FILE *f)
{
  const char *text = (const char *) s;

  return fputs (text, f);
}
811 | ||
97bfb9ef | 812 | /* In line-map.c. */ |
813 | ||
814 | /* Create a macro map. A macro map encodes source locations of tokens | |
815 | that are part of a macro replacement-list, at a macro expansion | |
816 | point. See the extensive comments of struct line_map and struct | |
817 | line_map_macro, in line-map.h. | |
818 | ||
819 | This map shall be created when the macro is expanded. The map | |
820 | encodes the source location of the expansion point of the macro as | |
821 | well as the "original" source location of each token that is part | |
822 | of the macro replacement-list. If a macro is defined but never | |
823 | expanded, it has no macro map. SET is the set of maps the macro | |
824 | map should be part of. MACRO_NODE is the macro which the new macro | |
825 | map should encode source locations for. EXPANSION is the location | |
826 | of the expansion point of MACRO. For function-like macro | |
827 | invocations, it's best to make it point to the closing parenthesis | |
828 | of the macro, rather than the location of the first character | |
829 | of the macro. NUM_TOKENS is the number of tokens that are part of | |
830 | the replacement-list of MACRO. */ | |
831 | const struct line_map *linemap_enter_macro (struct line_maps *, | |
832 | struct cpp_hashnode*, | |
833 | source_location, | |
834 | unsigned int); | |
835 | ||
836 | /* Create and return a virtual location for a token that is part of a | |
837 | macro expansion-list at a macro expansion point. See the comment | |
838 | inside struct line_map_macro to see what an expansion-list exactly | |
839 | is. | |
840 | ||
841 | A call to this function must come after a call to | |
842 | linemap_enter_macro. | |
843 | ||
844 | MAP is the map into which the source location is created. TOKEN_NO | |
845 | is the index of the token in the macro replacement-list, starting | |
846 | at number 0. | |
847 | ||
848 | ORIG_LOC is the location of the token outside of this macro | |
849 | expansion. If the token comes originally from the macro | |
850 | definition, it is the locus in the macro definition; otherwise it | |
851 | is a location in the context of the caller of this macro expansion | |
852 | (which is a virtual location or a source location if the caller is | |
853 | itself a macro expansion or not). | |
854 | ||
855 | MACRO_DEFINITION_LOC is the location in the macro definition, | |
856 | either of the token itself or of a macro parameter that it | |
857 | replaces. */ | |
858 | source_location linemap_add_macro_token (const struct line_map *, | |
859 | unsigned int, | |
860 | source_location, | |
861 | source_location); | |
862 | ||
863 | /* Return the source line number corresponding to source location | |
864 | LOCATION. SET is the line map set LOCATION comes from. If | |
865 | LOCATION is the location of a token that is part of the | |
866 | expansion-list of a macro expansion return the line number of the | |
867 | macro expansion point. */ | |
868 | int linemap_get_expansion_line (struct line_maps *, | |
869 | source_location); | |
870 | ||
871 | /* Return the path of the file corresponding to source code location | |
872 | LOCATION. | |
873 | ||
874 | If LOCATION is the location of a token that is part of the | |
875 | replacement-list of a macro expansion return the file path of the | |
876 | macro expansion point. | |
877 | ||
878 | SET is the line map set LOCATION comes from. */ | |
879 | const char* linemap_get_expansion_filename (struct line_maps *, | |
880 | source_location); | |
881 | ||
e61157d7 | 882 | #ifdef __cplusplus |
883 | } | |
884 | #endif | |
885 | ||
d856c8a6 | 886 | #endif /* ! LIBCPP_INTERNAL_H */ |