/* Part of CPP library.
   Copyright (C) 1997-2017 Free Software Foundation, Inc.

This program is free software; you can redistribute it and/or modify it
under the terms of the GNU General Public License as published by the
Free Software Foundation; either version 3, or (at your option) any
later version.

This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with this program; see the file COPYING3.  If not see
<http://www.gnu.org/licenses/>.  */

/* This header defines all the internal data structures and functions
   that need to be visible across files.  It should not be used outside
   cpplib.  */

22 #ifndef LIBCPP_INTERNAL_H
23 #define LIBCPP_INTERNAL_H
24
25 #include "symtab.h"
26 #include "cpp-id-data.h"
27
28 #if HAVE_ICONV
29 #include <iconv.h>
30 #else
31 #define HAVE_ICONV 0
32 typedef int iconv_t; /* dummy */
33 #endif
34
35 #ifdef __cplusplus
36 extern "C" {
37 #endif
38
39 struct directive; /* Deliberately incomplete. */
40 struct pending_option;
41 struct op;
42 struct _cpp_strbuf;
43
44 typedef bool (*convert_f) (iconv_t, const unsigned char *, size_t,
45 struct _cpp_strbuf *);
46 struct cset_converter
47 {
48 convert_f func;
49 iconv_t cd;
50 int width;
51 };
52
/* Number of bits in a cppchar_t.  */
#define BITS_PER_CPPCHAR_T (CHAR_BIT * sizeof (cppchar_t))

/* Test if a sign is valid within a preprocessing number.  A '+' or
   '-' is accepted after 'e'/'E', and after 'p'/'P' only when the
   extended_numbers option is set.  Note: reads a variable named
   `pfile' from the scope in which the macro is used.  */
#define VALID_SIGN(c, prevc) \
  (((c) == '+' || (c) == '-') && \
   ((prevc) == 'e' || (prevc) == 'E' \
    || (((prevc) == 'p' || (prevc) == 'P') \
        && CPP_OPTION (pfile, extended_numbers))))

/* True if C is a single quote and the digit_separators option is set.
   Also reads `pfile' from the enclosing scope.  */
#define DIGIT_SEP(c) ((c) == '\'' && CPP_OPTION (pfile, digit_separators))

/* Accessors for a reader's options and buffer, and for the column of
   a position within a buffer's current line.  */
#define CPP_OPTION(PFILE, OPTION) ((PFILE)->opts.OPTION)
#define CPP_BUFFER(PFILE) ((PFILE)->buffer)
#define CPP_BUF_COLUMN(BUF, CUR) ((CUR) - (BUF)->line_base)
#define CPP_BUF_COL(BUF) CPP_BUF_COLUMN(BUF, (BUF)->cur)

/* Start a new line in PFILE's line table: look up the source line of
   the table's highest_line in the last ordinary map and call
   linemap_line_start for the line after it, passing COLS_HINT
   through.  PFILE is evaluated more than once, so it must be free of
   side effects.  */
#define CPP_INCREMENT_LINE(PFILE, COLS_HINT) do { \
    const struct line_maps *line_table = (PFILE)->line_table; \
    const struct line_map_ordinary *map = \
      LINEMAPS_LAST_ORDINARY_MAP (line_table); \
    linenum_type line = SOURCE_LINE (map, line_table->highest_line); \
    linemap_line_start ((PFILE)->line_table, line + 1, (COLS_HINT)); \
  } while (0)

/* Maximum nesting of cpp_buffers.  We use a static limit, partly for
   efficiency, and partly to limit runaway recursion.  */
#define CPP_STACK_MAX 200

/* Host alignment handling.  The offset of the union inside struct
   dummy is the alignment the host requires for a double or a
   pointer, whichever is stricter.  */
struct dummy
{
  char c;
  union
  {
    double d;
    int *p;
  } u;
};

#define DEFAULT_ALIGNMENT offsetof (struct dummy, u)
/* Round SIZE up to a multiple of ALIGN.  The mask arithmetic is only
   correct when ALIGN is a power of two.  */
#define CPP_ALIGN2(size, align) (((size) + ((align) - 1)) & ~((align) - 1))
#define CPP_ALIGN(size) CPP_ALIGN2 (size, DEFAULT_ALIGNMENT)

/* Set the `used' flag of NODE's macro, provided NODE is an NT_MACRO
   node without the NODE_BUILTIN flag.  NODE is evaluated more than
   once.  */
#define _cpp_mark_macro_used(NODE) do { \
    if ((NODE)->type == NT_MACRO && !((NODE)->flags & NODE_BUILTIN)) \
      (NODE)->value.macro->used = 1; } while (0)

100 /* A generic memory buffer, and operations on it. */
101 typedef struct _cpp_buff _cpp_buff;
102 struct _cpp_buff
103 {
104 struct _cpp_buff *next;
105 unsigned char *base, *cur, *limit;
106 };
107
108 extern _cpp_buff *_cpp_get_buff (cpp_reader *, size_t);
109 extern void _cpp_release_buff (cpp_reader *, _cpp_buff *);
110 extern void _cpp_extend_buff (cpp_reader *, _cpp_buff **, size_t);
111 extern _cpp_buff *_cpp_append_extend_buff (cpp_reader *, _cpp_buff *, size_t);
112 extern void _cpp_free_buff (_cpp_buff *);
113 extern unsigned char *_cpp_aligned_alloc (cpp_reader *, size_t);
114 extern unsigned char *_cpp_unaligned_alloc (cpp_reader *, size_t);
115
/* Bytes left between CUR and LIMIT, and accessors for those two
   pointers.  BUFF_ROOM is fully parenthesized so that it can be used
   safely as an operand of any operator, including sizeof.  */
#define BUFF_ROOM(BUFF) ((size_t) ((BUFF)->limit - (BUFF)->cur))
#define BUFF_FRONT(BUFF) ((BUFF)->cur)
#define BUFF_LIMIT(BUFF) ((BUFF)->limit)

/* #include types.  */
enum include_type {IT_INCLUDE, IT_INCLUDE_NEXT, IT_IMPORT, IT_CMDLINE, IT_DEFAULT};

123 union utoken
124 {
125 const cpp_token *token;
126 const cpp_token **ptoken;
127 };
128
129 /* A "run" of tokens; part of a chain of runs. */
130 typedef struct tokenrun tokenrun;
131 struct tokenrun
132 {
133 tokenrun *next, *prev;
134 cpp_token *base, *limit;
135 };
136
/* Accessor macros for struct cpp_context.  FIRST and LAST select the
   `iso' arm of the union; CUR and RLIMIT select the `trad' arm.  */
#define FIRST(c) ((c)->u.iso.first)
#define LAST(c) ((c)->u.iso.last)
#define CUR(c) ((c)->u.trad.cur)
#define RLIMIT(c) ((c)->u.trad.rlimit)

143 /* This describes some additional data that is added to the macro
144 token context of type cpp_context, when -ftrack-macro-expansion is
145 on. */
146 typedef struct
147 {
148 /* The node of the macro we are referring to. */
149 cpp_hashnode *macro_node;
150 /* This buffer contains an array of virtual locations. The virtual
151 location at index 0 is the virtual location of the token at index
152 0 in the current instance of cpp_context; similarly for all the
153 other virtual locations. */
154 source_location *virt_locs;
155 /* This is a pointer to the current virtual location. This is used
156 to iterate over the virtual locations while we iterate over the
157 tokens they belong to. */
158 source_location *cur_virt_loc;
159 } macro_context;
160
/* The kind of tokens carried by a cpp_context.  */
enum context_tokens_kind {
  /* This is the value of cpp_context::tokens_kind if u.iso.first
     contains an instance of cpp_token **.  */
  TOKENS_KIND_INDIRECT,
  /* This is the value of cpp_context::tokens_kind if u.iso.first
     contains an instance of cpp_token *.  */
  TOKENS_KIND_DIRECT,
  /* This is the value of cpp_context::tokens_kind when the token
     context contains tokens resulting from macro expansion.  In that
     case struct cpp_context::macro points to an instance of struct
     macro_context.  This is used only when the
     -ftrack-macro-expansion flag is on.  */
  TOKENS_KIND_EXTENDED
};

177 typedef struct cpp_context cpp_context;
178 struct cpp_context
179 {
180 /* Doubly-linked list. */
181 cpp_context *next, *prev;
182
183 union
184 {
185 /* For ISO macro expansion. Contexts other than the base context
186 are contiguous tokens. e.g. macro expansions, expanded
187 argument tokens. */
188 struct
189 {
190 union utoken first;
191 union utoken last;
192 } iso;
193
194 /* For traditional macro expansion. */
195 struct
196 {
197 const unsigned char *cur;
198 const unsigned char *rlimit;
199 } trad;
200 } u;
201
202 /* If non-NULL, a buffer used for storage related to this context.
203 When the context is popped, the buffer is released. */
204 _cpp_buff *buff;
205
206 /* If tokens_kind is TOKEN_KIND_EXTENDED, then (as we thus are in a
207 macro context) this is a pointer to an instance of macro_context.
208 Otherwise if tokens_kind is *not* TOKEN_KIND_EXTENDED, then, if
209 we are in a macro context, this is a pointer to an instance of
210 cpp_hashnode, representing the name of the macro this context is
211 for. If we are not in a macro context, then this is just NULL.
212 Note that when tokens_kind is TOKEN_KIND_EXTENDED, the memory
213 used by the instance of macro_context pointed to by this member
214 is de-allocated upon de-allocation of the instance of struct
215 cpp_context. */
216 union
217 {
218 macro_context *mc;
219 cpp_hashnode *macro;
220 } c;
221
222 /* This determines the type of tokens held by this context. */
223 enum context_tokens_kind tokens_kind;
224 };
225
/* Flags describing what the lexer is currently doing.  */
struct lexer_state
{
  /* Nonzero if first token on line is CPP_HASH.  */
  unsigned char in_directive;

  /* Nonzero if we are collecting macro arguments.  */
  unsigned char collecting_args;

  /* Nonzero if in a directive that will handle padding tokens itself.
     #include needs this to avoid problems with computed include and
     spacing between tokens.  */
  unsigned char directive_wants_padding;

  /* True if we are skipping a failed conditional group.  */
  unsigned char skipping;

  /* Nonzero if in a directive that takes angle-bracketed headers.  */
  unsigned char angled_headers;

  /* Nonzero if in a #if or #elif directive.  */
  unsigned char in_expression;

  /* Nonzero to save comments.  Turned off if discard_comments, and in
     all directives apart from #define.  */
  unsigned char save_comments;

  /* Nonzero if lexing __VA_ARGS__ is valid.  */
  unsigned char va_args_ok;

  /* Nonzero if lexing poisoned identifiers is valid.  */
  unsigned char poisoned_ok;

  /* Nonzero to prevent macro expansion.  */
  unsigned char prevent_expansion;

  /* Nonzero when parsing arguments to a function-like macro.  */
  unsigned char parsing_args;

  /* Nonzero if in a __has_include__ or __has_include_next__ statement.  */
  unsigned char in__has_include__;

  /* Nonzero if prevent_expansion is true only because output is
     being discarded.  */
  unsigned char discarding_output;

  /* Nonzero to skip evaluating part of an expression.  */
  unsigned int skip_eval;

  /* Nonzero when handling a deferred pragma.  */
  unsigned char in_deferred_pragma;

  /* Nonzero if the deferred pragma being handled allows macro expansion.  */
  unsigned char pragma_allow_expansion;
};

281 /* Special nodes - identifiers with predefined significance. */
282 struct spec_nodes
283 {
284 cpp_hashnode *n_defined; /* defined operator */
285 cpp_hashnode *n_true; /* C++ keyword true */
286 cpp_hashnode *n_false; /* C++ keyword false */
287 cpp_hashnode *n__VA_ARGS__; /* C99 vararg macros */
288 cpp_hashnode *n__has_include__; /* __has_include__ operator */
289 cpp_hashnode *n__has_include_next__; /* __has_include_next__ operator */
290 };
291
/* A note attached to a position in a cleaned line.  */
typedef struct _cpp_line_note _cpp_line_note;
struct _cpp_line_note
{
  /* Location in the clean line the note refers to.  */
  const unsigned char *pos;

  /* Type of note.  The 9 'from' trigraph characters represent those
     trigraphs, '\\' an escaped newline, ' ' an escaped newline with
     intervening space, 0 represents a note that has already been handled,
     and anything else is invalid.  */
  unsigned int type;
};

305 /* Represents the contents of a file cpplib has read in. */
306 struct cpp_buffer
307 {
308 const unsigned char *cur; /* Current location. */
309 const unsigned char *line_base; /* Start of current physical line. */
310 const unsigned char *next_line; /* Start of to-be-cleaned logical line. */
311
312 const unsigned char *buf; /* Entire character buffer. */
313 const unsigned char *rlimit; /* Writable byte at end of file. */
314 const unsigned char *to_free; /* Pointer that should be freed when
315 popping the buffer. */
316
317 _cpp_line_note *notes; /* Array of notes. */
318 unsigned int cur_note; /* Next note to process. */
319 unsigned int notes_used; /* Number of notes. */
320 unsigned int notes_cap; /* Size of allocated array. */
321
322 struct cpp_buffer *prev;
323
324 /* Pointer into the file table; non-NULL if this is a file buffer.
325 Used for include_next and to record control macros. */
326 struct _cpp_file *file;
327
328 /* Saved value of __TIMESTAMP__ macro - date and time of last modification
329 of the assotiated file. */
330 const unsigned char *timestamp;
331
332 /* Value of if_stack at start of this file.
333 Used to prohibit unmatched #endif (etc) in an include file. */
334 struct if_stack *if_stack;
335
336 /* True if we need to get the next clean line. */
337 bool need_line;
338
339 /* True if we have already warned about C++ comments in this file.
340 The warning happens only for C89 extended mode with -pedantic on,
341 or for -Wtraditional, and only once per file (otherwise it would
342 be far too noisy). */
343 unsigned int warned_cplusplus_comments : 1;
344
345 /* True if we don't process trigraphs and escaped newlines. True
346 for preprocessed input, command line directives, and _Pragma
347 buffers. */
348 unsigned int from_stage3 : 1;
349
350 /* At EOF, a buffer is automatically popped. If RETURN_AT_EOF is
351 true, a CPP_EOF token is then returned. Otherwise, the next
352 token from the enclosing buffer is returned. */
353 unsigned int return_at_eof : 1;
354
355 /* One for a system header, two for a C system header file that therefore
356 needs to be extern "C" protected in C++, and zero otherwise. */
357 unsigned char sysp;
358
359 /* The directory of the this buffer's file. Its NAME member is not
360 allocated, so we don't need to worry about freeing it. */
361 struct cpp_dir dir;
362
363 /* Descriptor for converting from the input character set to the
364 source character set. */
365 struct cset_converter input_cset_desc;
366 };
367
368 /* The list of saved macros by push_macro pragma. */
369 struct def_pragma_macro {
370 /* Chain element to previous saved macro. */
371 struct def_pragma_macro *next;
372 /* Name of the macro. */
373 char *name;
374 /* The stored macro content. */
375 unsigned char *definition;
376
377 /* Definition line number. */
378 source_location line;
379 /* If macro defined in system header. */
380 unsigned int syshdr : 1;
381 /* Nonzero if it has been expanded or had its existence tested. */
382 unsigned int used : 1;
383
384 /* Mark if we save an undefined macro. */
385 unsigned int is_undef : 1;
386 /* Nonzero if it was a builtin macro. */
387 unsigned int is_builtin : 1;
388 };
389
390 /* A cpp_reader encapsulates the "state" of a pre-processor run.
391 Applying cpp_get_token repeatedly yields a stream of pre-processor
392 tokens. Usually, there is only one cpp_reader object active. */
393 struct cpp_reader
394 {
395 /* Top of buffer stack. */
396 cpp_buffer *buffer;
397
398 /* Overlaid buffer (can be different after processing #include). */
399 cpp_buffer *overlaid_buffer;
400
401 /* Lexer state. */
402 struct lexer_state state;
403
404 /* Source line tracking. */
405 struct line_maps *line_table;
406
407 /* The line of the '#' of the current directive. */
408 source_location directive_line;
409
410 /* Memory buffers. */
411 _cpp_buff *a_buff; /* Aligned permanent storage. */
412 _cpp_buff *u_buff; /* Unaligned permanent storage. */
413 _cpp_buff *free_buffs; /* Free buffer chain. */
414
415 /* Context stack. */
416 struct cpp_context base_context;
417 struct cpp_context *context;
418
419 /* If in_directive, the directive if known. */
420 const struct directive *directive;
421
422 /* Token generated while handling a directive, if any. */
423 cpp_token directive_result;
424
425 /* When expanding a macro at top-level, this is the location of the
426 macro invocation. */
427 source_location invocation_location;
428
429 /* This is the node representing the macro being expanded at
430 top-level. The value of this data member is valid iff
431 in_macro_expansion_p() returns TRUE. */
432 cpp_hashnode *top_most_macro_node;
433
434 /* Nonzero if we are about to expand a macro. Note that if we are
435 really expanding a macro, the function macro_of_context returns
436 the macro being expanded and this flag is set to false. Client
437 code should use the function in_macro_expansion_p to know if we
438 are either about to expand a macro, or are actually expanding
439 one. */
440 bool about_to_expand_macro_p;
441
442 /* Search paths for include files. */
443 struct cpp_dir *quote_include; /* "" */
444 struct cpp_dir *bracket_include; /* <> */
445 struct cpp_dir no_search_path; /* No path. */
446
447 /* Chain of all hashed _cpp_file instances. */
448 struct _cpp_file *all_files;
449
450 struct _cpp_file *main_file;
451
452 /* File and directory hash table. */
453 struct htab *file_hash;
454 struct htab *dir_hash;
455 struct file_hash_entry_pool *file_hash_entries;
456
457 /* Negative path lookup hash table. */
458 struct htab *nonexistent_file_hash;
459 struct obstack nonexistent_file_ob;
460
461 /* Nonzero means don't look for #include "foo" the source-file
462 directory. */
463 bool quote_ignores_source_dir;
464
465 /* Nonzero if any file has contained #pragma once or #import has
466 been used. */
467 bool seen_once_only;
468
469 /* Multiple include optimization. */
470 const cpp_hashnode *mi_cmacro;
471 const cpp_hashnode *mi_ind_cmacro;
472 bool mi_valid;
473
474 /* Lexing. */
475 cpp_token *cur_token;
476 tokenrun base_run, *cur_run;
477 unsigned int lookaheads;
478
479 /* Nonzero prevents the lexer from re-using the token runs. */
480 unsigned int keep_tokens;
481
482 /* Buffer to hold macro definition string. */
483 unsigned char *macro_buffer;
484 unsigned int macro_buffer_len;
485
486 /* Descriptor for converting from the source character set to the
487 execution character set. */
488 struct cset_converter narrow_cset_desc;
489
490 /* Descriptor for converting from the source character set to the
491 UTF-8 execution character set. */
492 struct cset_converter utf8_cset_desc;
493
494 /* Descriptor for converting from the source character set to the
495 UTF-16 execution character set. */
496 struct cset_converter char16_cset_desc;
497
498 /* Descriptor for converting from the source character set to the
499 UTF-32 execution character set. */
500 struct cset_converter char32_cset_desc;
501
502 /* Descriptor for converting from the source character set to the
503 wide execution character set. */
504 struct cset_converter wide_cset_desc;
505
506 /* Date and time text. Calculated together if either is requested. */
507 const unsigned char *date;
508 const unsigned char *time;
509
510 /* Externally set timestamp to replace current date and time useful for
511 reproducibility. It should be initialized to -2 (not yet set) and
512 set to -1 to disable it or to a non-negative value to enable it. */
513 time_t source_date_epoch;
514
515 /* EOF token, and a token forcing paste avoidance. */
516 cpp_token avoid_paste;
517 cpp_token eof;
518
519 /* Opaque handle to the dependencies of mkdeps.c. */
520 struct deps *deps;
521
522 /* Obstack holding all macro hash nodes. This never shrinks.
523 See identifiers.c */
524 struct obstack hash_ob;
525
526 /* Obstack holding buffer and conditional structures. This is a
527 real stack. See directives.c. */
528 struct obstack buffer_ob;
529
530 /* Pragma table - dynamic, because a library user can add to the
531 list of recognized pragmas. */
532 struct pragma_entry *pragmas;
533
534 /* Call backs to cpplib client. */
535 struct cpp_callbacks cb;
536
537 /* Identifier hash table. */
538 struct ht *hash_table;
539
540 /* Expression parser stack. */
541 struct op *op_stack, *op_limit;
542
543 /* User visible options. */
544 struct cpp_options opts;
545
546 /* Special nodes - identifiers with predefined significance to the
547 preprocessor. */
548 struct spec_nodes spec_nodes;
549
550 /* Whether cpplib owns the hashtable. */
551 bool our_hashtable;
552
553 /* Traditional preprocessing output buffer (a logical line). */
554 struct
555 {
556 unsigned char *base;
557 unsigned char *limit;
558 unsigned char *cur;
559 source_location first_line;
560 } out;
561
562 /* Used for buffer overlays by traditional.c. */
563 const unsigned char *saved_cur, *saved_rlimit, *saved_line_base;
564
565 /* A saved list of the defined macros, for dependency checking
566 of precompiled headers. */
567 struct cpp_savedstate *savedstate;
568
569 /* Next value of __COUNTER__ macro. */
570 unsigned int counter;
571
572 /* Table of comments, when state.save_comments is true. */
573 cpp_comment_table comments;
574
575 /* List of saved macros by push_macro. */
576 struct def_pragma_macro *pushed_macros;
577
578 /* If non-null, the lexer will use this location for the next token
579 instead of getting a location from the linemap. */
580 source_location *forced_token_location_p;
581 };
582
/* Character classes.  Based on the more primitive macros in safe-ctype.h.
   If the definition of `numchar' looks odd to you, please look up the
   definition of a pp-number in the C standard [section 6.4.8 of C99].

   In the unlikely event that characters other than \r and \n enter
   the set is_vspace, the macro handle_newline() in lex.c must be
   updated.

   _dollar_ok, and therefore is_idchar and is_idstart, read a variable
   named `pfile' from the scope in which they are used.  */
#define _dollar_ok(x)   ((x) == '$' && CPP_OPTION (pfile, dollars_in_ident))

#define is_idchar(x)    (ISIDNUM(x) || _dollar_ok(x))
#define is_numchar(x)   ISIDNUM(x)
#define is_idstart(x)   (ISIDST(x) || _dollar_ok(x))
#define is_numstart(x)  ISDIGIT(x)
#define is_hspace(x)    ISBLANK(x)
#define is_vspace(x)    IS_VSPACE(x)
#define is_nvspace(x)   IS_NVSPACE(x)
#define is_space(x)     IS_SPACE_OR_NUL(x)

/* This table is constant if it can be initialized at compile time,
   which is the case if cpp was compiled with GCC >=2.7, or another
   compiler that supports C99.  */
#if HAVE_DESIGNATED_INITIALIZERS
extern const unsigned char _cpp_trigraph_map[UCHAR_MAX + 1];
#else
extern unsigned char _cpp_trigraph_map[UCHAR_MAX + 1];
#endif

610 /* Macros. */
611
612 static inline int cpp_in_system_header (cpp_reader *);
613 static inline int
614 cpp_in_system_header (cpp_reader *pfile)
615 {
616 return pfile->buffer ? pfile->buffer->sysp : 0;
617 }
/* Shorthands for the cpp_pedantic and cpp_warn_traditional options.  */
#define CPP_PEDANTIC(PF) CPP_OPTION (PF, cpp_pedantic)
#define CPP_WTRADITIONAL(PF) CPP_OPTION (PF, cpp_warn_traditional)

621 static inline int cpp_in_primary_file (cpp_reader *);
622 static inline int
623 cpp_in_primary_file (cpp_reader *pfile)
624 {
625 return pfile->line_table->depth == 1;
626 }
627
628 /* In macro.c */
629 extern void _cpp_free_definition (cpp_hashnode *);
630 extern bool _cpp_create_definition (cpp_reader *, cpp_hashnode *);
631 extern void _cpp_pop_context (cpp_reader *);
632 extern void _cpp_push_text_context (cpp_reader *, cpp_hashnode *,
633 const unsigned char *, size_t);
634 extern bool _cpp_save_parameter (cpp_reader *, cpp_macro *, cpp_hashnode *,
635 cpp_hashnode *);
636 extern bool _cpp_arguments_ok (cpp_reader *, cpp_macro *, const cpp_hashnode *,
637 unsigned int);
638 extern const unsigned char *_cpp_builtin_macro_text (cpp_reader *,
639 cpp_hashnode *,
640 source_location = 0);
641 extern int _cpp_warn_if_unused_macro (cpp_reader *, cpp_hashnode *, void *);
642 extern void _cpp_push_token_context (cpp_reader *, cpp_hashnode *,
643 const cpp_token *, unsigned int);
644 extern void _cpp_backup_tokens_direct (cpp_reader *, unsigned int);
645
646 /* In identifiers.c */
647 extern void _cpp_init_hashtable (cpp_reader *, cpp_hash_table *);
648 extern void _cpp_destroy_hashtable (cpp_reader *);
649
650 /* In files.c */
651 typedef struct _cpp_file _cpp_file;
652 extern _cpp_file *_cpp_find_file (cpp_reader *, const char *, cpp_dir *,
653 bool, int, bool, source_location);
654 extern bool _cpp_find_failed (_cpp_file *);
655 extern void _cpp_mark_file_once_only (cpp_reader *, struct _cpp_file *);
656 extern void _cpp_fake_include (cpp_reader *, const char *);
657 extern bool _cpp_stack_file (cpp_reader *, _cpp_file*, bool,
658 source_location);
659 extern bool _cpp_stack_include (cpp_reader *, const char *, int,
660 enum include_type, source_location);
661 extern int _cpp_compare_file_date (cpp_reader *, const char *, int);
662 extern void _cpp_report_missing_guards (cpp_reader *);
663 extern void _cpp_init_files (cpp_reader *);
664 extern void _cpp_cleanup_files (cpp_reader *);
665 extern void _cpp_pop_file_buffer (cpp_reader *, struct _cpp_file *,
666 const unsigned char *);
667 extern bool _cpp_save_file_entries (cpp_reader *pfile, FILE *f);
668 extern bool _cpp_read_file_entries (cpp_reader *, FILE *);
669 extern const char *_cpp_get_file_name (_cpp_file *);
670 extern struct stat *_cpp_get_file_stat (_cpp_file *);
671 extern bool _cpp_has_header (cpp_reader *, const char *, int,
672 enum include_type);
673
674 /* In expr.c */
675 extern bool _cpp_parse_expr (cpp_reader *, bool);
676 extern struct op *_cpp_expand_op_stack (cpp_reader *);
677
678 /* In lex.c */
679 extern void _cpp_process_line_notes (cpp_reader *, int);
680 extern void _cpp_clean_line (cpp_reader *);
681 extern bool _cpp_get_fresh_line (cpp_reader *);
682 extern bool _cpp_skip_block_comment (cpp_reader *);
683 extern cpp_token *_cpp_temp_token (cpp_reader *);
684 extern const cpp_token *_cpp_lex_token (cpp_reader *);
685 extern cpp_token *_cpp_lex_direct (cpp_reader *);
686 extern unsigned char *_cpp_spell_ident_ucns (unsigned char *, cpp_hashnode *);
687 extern int _cpp_equiv_tokens (const cpp_token *, const cpp_token *);
688 extern void _cpp_init_tokenrun (tokenrun *, unsigned int);
689 extern cpp_hashnode *_cpp_lex_identifier (cpp_reader *, const char *);
690 extern int _cpp_remaining_tokens_num_in_context (cpp_context *);
691 extern void _cpp_init_lexer (void);
692
693 /* In init.c. */
694 extern void _cpp_maybe_push_include_file (cpp_reader *);
695 extern const char *cpp_named_operator2name (enum cpp_ttype type);
696 extern void _cpp_restore_special_builtin (cpp_reader *pfile,
697 struct def_pragma_macro *);
698
699 /* In directives.c */
700 extern int _cpp_test_assertion (cpp_reader *, unsigned int *);
701 extern int _cpp_handle_directive (cpp_reader *, int);
702 extern void _cpp_define_builtin (cpp_reader *, const char *);
703 extern char ** _cpp_save_pragma_names (cpp_reader *);
704 extern void _cpp_restore_pragma_names (cpp_reader *, char **);
705 extern int _cpp_do__Pragma (cpp_reader *, source_location);
706 extern void _cpp_init_directives (cpp_reader *);
707 extern void _cpp_init_internal_pragmas (cpp_reader *);
708 extern void _cpp_do_file_change (cpp_reader *, enum lc_reason, const char *,
709 linenum_type, unsigned int);
710 extern void _cpp_pop_buffer (cpp_reader *);
711 extern char *_cpp_bracket_include (cpp_reader *);
712
713 /* In directives.c */
714 struct _cpp_dir_only_callbacks
715 {
716 /* Called to print a block of lines. */
717 void (*print_lines) (int, const void *, size_t);
718 void (*maybe_print_line) (source_location);
719 };
720
721 extern void _cpp_preprocess_dir_only (cpp_reader *,
722 const struct _cpp_dir_only_callbacks *);
723
724 /* In traditional.c. */
725 extern bool _cpp_scan_out_logical_line (cpp_reader *, cpp_macro *, bool);
726 extern bool _cpp_read_logical_line_trad (cpp_reader *);
727 extern void _cpp_overlay_buffer (cpp_reader *pfile, const unsigned char *,
728 size_t);
729 extern void _cpp_remove_overlay (cpp_reader *);
730 extern bool _cpp_create_trad_definition (cpp_reader *, cpp_macro *);
731 extern bool _cpp_expansions_different_trad (const cpp_macro *,
732 const cpp_macro *);
733 extern unsigned char *_cpp_copy_replacement_text (const cpp_macro *,
734 unsigned char *);
735 extern size_t _cpp_replacement_text_len (const cpp_macro *);
736
737 /* In charset.c. */
738
739 /* The normalization state at this point in the sequence.
740 It starts initialized to all zeros, and at the end
741 'level' is the normalization level of the sequence. */
742
743 struct normalize_state
744 {
745 /* The previous starter character. */
746 cppchar_t previous;
747 /* The combining class of the previous character (whether or not a
748 starter). */
749 unsigned char prev_class;
750 /* The lowest normalization level so far. */
751 enum cpp_normalize_level level;
752 };
753 #define INITIAL_NORMALIZE_STATE { 0, 0, normalized_KC }
754 #define NORMALIZE_STATE_RESULT(st) ((st)->level)
755
756 /* We saw a character C that matches ISIDNUM(), update a
757 normalize_state appropriately. */
758 #define NORMALIZE_STATE_UPDATE_IDNUM(st, c) \
759 ((st)->previous = (c), (st)->prev_class = 0)
760
761 extern bool _cpp_valid_ucn (cpp_reader *, const unsigned char **,
762 const unsigned char *, int,
763 struct normalize_state *state,
764 cppchar_t *,
765 source_range *char_range,
766 cpp_string_location_reader *loc_reader);
767 extern void _cpp_destroy_iconv (cpp_reader *);
768 extern unsigned char *_cpp_convert_input (cpp_reader *, const char *,
769 unsigned char *, size_t, size_t,
770 const unsigned char **, off_t *);
771 extern const char *_cpp_default_encoding (void);
772 extern cpp_hashnode * _cpp_interpret_identifier (cpp_reader *pfile,
773 const unsigned char *id,
774 size_t len);
775
/* Utility routines and macros.  */

/* Expand the array STR (normally a string literal) into TWO
   comma-separated items: a pointer to its bytes and its size minus
   one, i.e. the length without the terminating NUL.  STR must be an
   array, not a pointer, for the sizeof to give the length.  */
#define DSC(str) (const unsigned char *) (str), sizeof (str) - 1

/* These are inline functions instead of macros so we can get type
   checking.  */
static inline int ustrcmp (const unsigned char *, const unsigned char *);
static inline int ustrncmp (const unsigned char *, const unsigned char *,
                            size_t);
static inline size_t ustrlen (const unsigned char *);
static inline const unsigned char *uxstrdup (const unsigned char *);
static inline const unsigned char *ustrchr (const unsigned char *, int);
static inline int ufputs (const unsigned char *, FILE *);

/* Use a const char for the second parameter since it is usually a literal.  */
static inline int ustrcspn (const unsigned char *, const char *);

/* strcmp for unsigned char strings: returns whatever strcmp returns
   for S1 and S2 viewed as plain char strings.  */
static inline int
ustrcmp (const unsigned char *s1, const unsigned char *s2)
{
  return strcmp ((const char *) s1, (const char *) s2);
}

/* strncmp for unsigned char strings: compares at most N characters
   of S1 and S2.  */
static inline int
ustrncmp (const unsigned char *s1, const unsigned char *s2, size_t n)
{
  return strncmp ((const char *) s1, (const char *) s2, n);
}

/* strcspn for an unsigned char string S1: length of the initial
   segment of S1 containing none of the characters in S2.  The size_t
   result of strcspn is narrowed to int, as the declared return type
   requires.  */
static inline int
ustrcspn (const unsigned char *s1, const char *s2)
{
  return (int) strcspn ((const char *) s1, s2);
}

/* strlen for an unsigned char string.  */
static inline size_t
ustrlen (const unsigned char *s1)
{
  return strlen ((const char *) s1);
}

/* xstrdup for an unsigned char string: returns the result of xstrdup
   on S1, viewed as const unsigned char *.  */
static inline const unsigned char *
uxstrdup (const unsigned char *s1)
{
  return (const unsigned char *) xstrdup ((const char *) s1);
}

/* strchr for an unsigned char string: pointer to the first occurrence
   of C in S1, or a null pointer if there is none.  */
static inline const unsigned char *
ustrchr (const unsigned char *s1, int c)
{
  return (const unsigned char *) strchr ((const char *) s1, c);
}

/* fputs for an unsigned char string: writes S to F and returns what
   fputs returns.  */
static inline int
ufputs (const unsigned char *s, FILE *f)
{
  return fputs ((const char *) s, f);
}

834 /* In line-map.c. */
835
836 /* Create a macro map. A macro map encodes source locations of tokens
837 that are part of a macro replacement-list, at a macro expansion
838 point. See the extensive comments of struct line_map and struct
839 line_map_macro, in line-map.h.
840
841 This map shall be created when the macro is expanded. The map
842 encodes the source location of the expansion point of the macro as
843 well as the "original" source location of each token that is part
844 of the macro replacement-list. If a macro is defined but never
845 expanded, it has no macro map. SET is the set of maps the macro
846 map should be part of. MACRO_NODE is the macro which the new macro
847 map should encode source locations for. EXPANSION is the location
848 of the expansion point of MACRO. For function-like macros
849 invocations, it's best to make it point to the closing parenthesis
850 of the macro, rather than the the location of the first character
851 of the macro. NUM_TOKENS is the number of tokens that are part of
852 the replacement-list of MACRO. */
853 const line_map_macro *linemap_enter_macro (struct line_maps *,
854 struct cpp_hashnode*,
855 source_location,
856 unsigned int);
857
858 /* Create and return a virtual location for a token that is part of a
859 macro expansion-list at a macro expansion point. See the comment
860 inside struct line_map_macro to see what an expansion-list exactly
861 is.
862
863 A call to this function must come after a call to
864 linemap_enter_macro.
865
866 MAP is the map into which the source location is created. TOKEN_NO
867 is the index of the token in the macro replacement-list, starting
868 at number 0.
869
870 ORIG_LOC is the location of the token outside of this macro
871 expansion. If the token comes originally from the macro
872 definition, it is the locus in the macro definition; otherwise it
873 is a location in the context of the caller of this macro expansion
874 (which is a virtual location or a source location if the caller is
875 itself a macro expansion or not).
876
877 MACRO_DEFINITION_LOC is the location in the macro definition,
878 either of the token itself or of a macro parameter that it
879 replaces. */
880 source_location linemap_add_macro_token (const line_map_macro *,
881 unsigned int,
882 source_location,
883 source_location);
884
885 /* Return the source line number corresponding to source location
886 LOCATION. SET is the line map set LOCATION comes from. If
887 LOCATION is the location of token that is part of the
888 expansion-list of a macro expansion return the line number of the
889 macro expansion point. */
890 int linemap_get_expansion_line (struct line_maps *,
891 source_location);
892
893 /* Return the path of the file corresponding to source code location
894 LOCATION.
895
896 If LOCATION is the location of a token that is part of the
897 replacement-list of a macro expansion return the file path of the
898 macro expansion point.
899
900 SET is the line map set LOCATION comes from. */
901 const char* linemap_get_expansion_filename (struct line_maps *,
902 source_location);
903
904 #ifdef __cplusplus
905 }
906 #endif
907
908 #endif /* ! LIBCPP_INTERNAL_H */
909