Home | History | Annotate | Line # | Download | only in libcpp
internal.h revision 1.5.4.2
      1 /* Part of CPP library.
      2    Copyright (C) 1997-2017 Free Software Foundation, Inc.
      3 
      4 This program is free software; you can redistribute it and/or modify it
      5 under the terms of the GNU General Public License as published by the
      6 Free Software Foundation; either version 3, or (at your option) any
      7 later version.
      8 
      9 This program is distributed in the hope that it will be useful,
     10 but WITHOUT ANY WARRANTY; without even the implied warranty of
     11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
     12 GNU General Public License for more details.
     13 
     14 You should have received a copy of the GNU General Public License
     15 along with this program; see the file COPYING3.  If not see
     16 <http://www.gnu.org/licenses/>.  */
     17 
     18 /* This header defines all the internal data structures and functions
     19    that need to be visible across files.  It should not be used outside
     20    cpplib.  */
     21 
     22 #ifndef LIBCPP_INTERNAL_H
     23 #define LIBCPP_INTERNAL_H
     24 
     25 #include "symtab.h"
     26 #include "cpp-id-data.h"
     27 
     28 #if HAVE_ICONV
     29 #include <iconv.h>
     30 #else
     31 #define HAVE_ICONV 0
     32 typedef int iconv_t;  /* dummy */
     33 #endif
     34 
     35 #ifdef __cplusplus
     36 extern "C" {
     37 #endif
     38 
     39 struct directive;		/* Deliberately incomplete.  */
     40 struct pending_option;
     41 struct op;
     42 struct _cpp_strbuf;
     43 
        /* Signature shared by the character-set conversion routines stored in
           struct cset_converter: an iconv_t, a pointer to const bytes with a
           size_t, and a _cpp_strbuf (opaque in this header).
           NOTE(review): the meaning of the bool result is not visible here
           -- confirm in charset.c.  */
     44 typedef bool (*convert_f) (iconv_t, const unsigned char *, size_t,
     45 			   struct _cpp_strbuf *);
        /* A conversion descriptor: a convert_f routine paired with an iconv_t.
           cpp_buffer and cpp_reader embed one of these per conversion they
           need.  */
     46 struct cset_converter
     47 {
     48   convert_f func;	/* The conversion routine.  */
     49   iconv_t cd;	/* Presumably the descriptor handed to FUNC -- TODO confirm.  */
     50   int width;	/* NOTE(review): units not visible here; presumably the
        		   target character width -- confirm in charset.c.  */
     51 };
     52 
     53 #define BITS_PER_CPPCHAR_T (CHAR_BIT * sizeof (cppchar_t))	/* Size of cppchar_t in bits.  */
     54 
     55 /* Test if a sign is valid within a preprocessing number: C must be
           '+' or '-', and PREVC (the character before it) must be 'e' or
           'E', or else 'p' or 'P' with the extended_numbers option set.
           The expansion refers to a variable named `pfile' that is not a
           macro parameter, so one must be in scope wherever this is used.  */
     56 #define VALID_SIGN(c, prevc) \
     57   (((c) == '+' || (c) == '-') && \
     58    ((prevc) == 'e' || (prevc) == 'E' \
     59     || (((prevc) == 'p' || (prevc) == 'P') \
     60         && CPP_OPTION (pfile, extended_numbers))))
     61 
        /* True if C is a single quote and the digit_separators option is set.
           Like VALID_SIGN, this relies on a `pfile' variable being in scope.  */
     62 #define DIGIT_SEP(c) ((c) == '\'' && CPP_OPTION (pfile, digit_separators))
     63 
        /* CPP_OPTION reads member OPTION of PFILE's `opts'; CPP_BUFFER is
           PFILE's current buffer.  CPP_BUF_COLUMN is the distance of CUR from
           BUF's line_base, and CPP_BUF_COL is that distance for BUF's own
           `cur' pointer (so BUF is evaluated twice there).  */
     64 #define CPP_OPTION(PFILE, OPTION) ((PFILE)->opts.OPTION)
     65 #define CPP_BUFFER(PFILE) ((PFILE)->buffer)
     66 #define CPP_BUF_COLUMN(BUF, CUR) ((CUR) - (BUF)->line_base)
     67 #define CPP_BUF_COL(BUF) CPP_BUF_COLUMN(BUF, (BUF)->cur)
     68 
     69 #define CPP_INCREMENT_LINE(PFILE, COLS_HINT) do { \
     70     const struct line_maps *line_table = PFILE->line_table; \
     71     const struct line_map_ordinary *map = \
     72       LINEMAPS_LAST_ORDINARY_MAP (line_table); \
     73     linenum_type line = SOURCE_LINE (map, line_table->highest_line); \
     74     linemap_line_start (PFILE->line_table, line + 1, COLS_HINT); \
     75   } while (0)
     76 
     77 /* Maximum nesting of cpp_buffers.  We use a static limit, partly for
     78    efficiency, and partly to limit runaway recursion.  */
     79 #define CPP_STACK_MAX 200
     80 
     81 /* Host alignment handling.  struct dummy exists only so that the
           offset of its member U can be measured: DEFAULT_ALIGNMENT is the
           offset at which the host compiler places a union of double and
           int * after a single char.  */
     82 struct dummy
     83 {
     84   char c;
     85   union
     86   {
     87     double d;
     88     int *p;
     89   } u;
     90 };
     91 
     92 #define DEFAULT_ALIGNMENT offsetof (struct dummy, u)
        /* Round SIZE up to a multiple of ALIGN.  The mask arithmetic is only
           correct when ALIGN is a power of two; ALIGN is evaluated twice.  */
     93 #define CPP_ALIGN2(size, align) (((size) + ((align) - 1)) & ~((align) - 1))
        /* Round SIZE up to a multiple of DEFAULT_ALIGNMENT.  */
     94 #define CPP_ALIGN(size) CPP_ALIGN2 (size, DEFAULT_ALIGNMENT)
     95 
        /* Set the `used' flag of NODE's macro definition, but only when NODE
           has type NT_MACRO and does not have NODE_BUILTIN set in its flags.
           NODE is evaluated up to three times.  */
     96 #define _cpp_mark_macro_used(NODE) do {					\
     97   if ((NODE)->type == NT_MACRO && !((NODE)->flags & NODE_BUILTIN))	\
     98     (NODE)->value.macro->used = 1; } while (0)
     99 
    100 /* A generic memory buffer, and operations on it.  The BUFF_ROOM,
           BUFF_FRONT and BUFF_LIMIT macros that follow read the `cur' and
           `limit' members.  */
    101 typedef struct _cpp_buff _cpp_buff;
    102 struct _cpp_buff
    103 {
    104   struct _cpp_buff *next;	/* Link to another buffer.  */
    105   unsigned char *base, *cur, *limit;	/* BUFF_ROOM is limit - cur.  */
    106 };
    107 
        /* NOTE(review): the definitions of these routines are not in this
           header; which of them may allocate or release memory should be
           confirmed at the definitions before relying on it.  */
    108 extern _cpp_buff *_cpp_get_buff (cpp_reader *, size_t);
    109 extern void _cpp_release_buff (cpp_reader *, _cpp_buff *);
    110 extern void _cpp_extend_buff (cpp_reader *, _cpp_buff **, size_t);
    111 extern _cpp_buff *_cpp_append_extend_buff (cpp_reader *, _cpp_buff *, size_t);
    112 extern void _cpp_free_buff (_cpp_buff *);
    113 extern unsigned char *_cpp_aligned_alloc (cpp_reader *, size_t);
    114 extern unsigned char *_cpp_unaligned_alloc (cpp_reader *, size_t);
    115 
    116 #define BUFF_ROOM(BUFF) (size_t) ((BUFF)->limit - (BUFF)->cur)
    117 #define BUFF_FRONT(BUFF) ((BUFF)->cur)
    118 #define BUFF_LIMIT(BUFF) ((BUFF)->limit)
    119 
    120 /* #include types.  _cpp_stack_include and _cpp_has_header, declared
           further down, take one of these.  */
    121 enum include_type {IT_INCLUDE, IT_INCLUDE_NEXT, IT_IMPORT, IT_CMDLINE, IT_DEFAULT};
    122 
        /* A reference to a token held either directly (`token') or through
           one more level of indirection (`ptoken').  Per the comments on
           enum context_tokens_kind below, cpp_context::tokens_kind records
           which form u.iso.first holds.  */
    123 union utoken
    124 {
    125   const cpp_token *token;
    126   const cpp_token **ptoken;
    127 };
    128 
    129 /* A "run" of tokens; part of a chain of runs.  cpp_reader holds the
           first run (base_run) and a pointer to the current one (cur_run).  */
    130 typedef struct tokenrun tokenrun;
    131 struct tokenrun
    132 {
    133   tokenrun *next, *prev;	/* Neighbours in the chain of runs.  */
    134   cpp_token *base, *limit;	/* Presumably the bounds of this run's token
        				   array -- TODO confirm in lex.c.  */
    135 };
    136 
    137 /* Accessor macros for struct cpp_context.  FIRST and LAST yield the
           union utoken members of the ISO variant (u.iso); CUR and RLIMIT
           yield the byte pointers of the traditional variant (u.trad).  C is
           a pointer to the context.  */
    138 #define FIRST(c) ((c)->u.iso.first)
    139 #define LAST(c) ((c)->u.iso.last)
    140 #define CUR(c) ((c)->u.trad.cur)
    141 #define RLIMIT(c) ((c)->u.trad.rlimit)
    142 
    143 /* This describes some additional data that is added to the macro
    144    token context of type cpp_context, when -ftrack-macro-expansion is
    145    on.  The context reaches it through its c.mc member.  */
    146 typedef struct
    147 {
    148   /* The node of the macro we are referring to.  */
    149   cpp_hashnode *macro_node;
    150   /* This buffer contains an array of virtual locations.  The virtual
    151      location at index 0 is the virtual location of the token at index
    152      0 in the current instance of cpp_context; similarly for all the
    153      other virtual locations.  */
    154   source_location *virt_locs;
    155   /* This is a pointer to the current virtual location.  This is used
    156      to iterate over the virtual locations while we iterate over the
    157      tokens they belong to.  */
    158   source_location *cur_virt_loc;
    159 } macro_context;
    160 
    161 /* The kind of tokens carried by a cpp_context.  */
    162 enum context_tokens_kind {
    163   /* This is the value of cpp_context::tokens_kind if u.iso.first
    164      contains an instance of cpp_token **.  */
    165   TOKENS_KIND_INDIRECT,
    166   /* This is the value of cpp_context::tokens_kind if u.iso.first
    167      contains an instance of cpp_token *.  */
    168   TOKENS_KIND_DIRECT,
    169   /* This is the value of cpp_context::tokens_kind when the token
    170      context contains tokens resulting from macro expansion.  In that
    171      case cpp_context::c.mc points to an instance of
    172      macro_context.  This is used only when the
    173      -ftrack-macro-expansion flag is on.  */
    174   TOKENS_KIND_EXTENDED
    175 };
    176 
    177 typedef struct cpp_context cpp_context;
    178 struct cpp_context
    179 {
    180   /* Doubly-linked list.  */
    181   cpp_context *next, *prev;
    182 
          /* Token storage; read through the FIRST, LAST, CUR and RLIMIT
             accessor macros.  */
    183   union
    184   {
    185     /* For ISO macro expansion.  Contexts other than the base context
    186        are contiguous tokens.  e.g. macro expansions, expanded
    187        argument tokens.  */
    188     struct
    189     {
    190       union utoken first;
    191       union utoken last;
    192     } iso;
    193 
    194     /* For traditional macro expansion.  */
    195     struct
    196     {
    197       const unsigned char *cur;
    198       const unsigned char *rlimit;
    199     } trad;
    200   } u;
    201 
    202   /* If non-NULL, a buffer used for storage related to this context.
    203      When the context is popped, the buffer is released.  */
    204   _cpp_buff *buff;
    205 
    206   /* If tokens_kind is TOKENS_KIND_EXTENDED, then (as we thus are in a
    207      macro context) this is a pointer to an instance of macro_context.
    208      Otherwise if tokens_kind is *not* TOKENS_KIND_EXTENDED, then, if
    209      we are in a macro context, this is a pointer to an instance of
    210      cpp_hashnode, representing the name of the macro this context is
    211      for.  If we are not in a macro context, then this is just NULL.
    212      Note that when tokens_kind is TOKENS_KIND_EXTENDED, the memory
    213      used by the instance of macro_context pointed to by this member
    214      is de-allocated upon de-allocation of the instance of struct
    215      cpp_context.  */
    216   union
    217   {
    218     macro_context *mc;	/* Used when tokens_kind is TOKENS_KIND_EXTENDED.  */
    219     cpp_hashnode *macro;	/* Used for every other tokens_kind.  */
    220   } c;
    221 
    222   /* This determines the type of tokens held by this context.  */
    223   enum context_tokens_kind tokens_kind;
    224 };
    225 
    226 struct lexer_state
    227 {
          /* Flags describing what the lexer is currently doing; cpp_reader
             embeds one instance as its `state' member.  Every member is an
             unsigned char except skip_eval, which is an unsigned int.  */

    228   /* Nonzero if first token on line is CPP_HASH.  */
    229   unsigned char in_directive;
    230 
    231   /* Nonzero if we are collecting macro arguments.  */
    232   unsigned char collecting_args;
    233 
    234   /* Nonzero if in a directive that will handle padding tokens itself.
    235      #include needs this to avoid problems with computed include and
    236      spacing between tokens.  */
    237   unsigned char directive_wants_padding;
    238 
    239   /* True if we are skipping a failed conditional group.  */
    240   unsigned char skipping;
    241 
    242   /* Nonzero if in a directive that takes angle-bracketed headers.  */
    243   unsigned char angled_headers;
    244 
    245   /* Nonzero if in a #if or #elif directive.  */
    246   unsigned char in_expression;
    247 
    248   /* Nonzero to save comments.  Turned off if discard_comments, and in
    249      all directives apart from #define.  */
    250   unsigned char save_comments;
    251 
    252   /* Nonzero if lexing __VA_ARGS__ is valid.  */
    253   unsigned char va_args_ok;
    254 
    255   /* Nonzero if lexing poisoned identifiers is valid.  */
    256   unsigned char poisoned_ok;
    257 
    258   /* Nonzero to prevent macro expansion.  */
    259   unsigned char prevent_expansion;
    260 
    261   /* Nonzero when parsing arguments to a function-like macro.  */
    262   unsigned char parsing_args;
    263 
    264   /* Nonzero if in a __has_include__ or __has_include_next__ statement.  */
    265   unsigned char in__has_include__;
    266 
    267   /* Nonzero if prevent_expansion is true only because output is
    268      being discarded.  */
    269   unsigned char discarding_output;
    270 
    271   /* Nonzero to skip evaluating part of an expression.  */
    272   unsigned int skip_eval;
    273 
    274   /* Nonzero when handling a deferred pragma.  */
    275   unsigned char in_deferred_pragma;
    276 
    277   /* Nonzero if the deferred pragma being handled allows macro expansion.  */
    278   unsigned char pragma_allow_expansion;
    279 };
    280 
    281 /* Special nodes - identifiers with predefined significance.  Each
           member is the hash node for the identifier named in its trailing
           comment; cpp_reader embeds one instance as `spec_nodes'.  */
    282 struct spec_nodes
    283 {
    284   cpp_hashnode *n_defined;		/* defined operator */
    285   cpp_hashnode *n_true;			/* C++ keyword true */
    286   cpp_hashnode *n_false;		/* C++ keyword false */
    287   cpp_hashnode *n__VA_ARGS__;		/* C99 vararg macros */
    288   cpp_hashnode *n__has_include__;	/* __has_include__ operator */
    289   cpp_hashnode *n__has_include_next__;	/* __has_include_next__ operator */
    290 };
    291 
    292 typedef struct _cpp_line_note _cpp_line_note;
        /* One note attached to a position in a cleaned line.  cpp_buffer keeps
           an array of these in its `notes' member.  */
    293 struct _cpp_line_note
    294 {
    295   /* Location in the clean line the note refers to.  */
    296   const unsigned char *pos;
    297 
    298   /* Type of note.  The 9 'from' trigraph characters represent those
    299      trigraphs, '\\' an escaped newline, ' ' an escaped newline with
    300      intervening space, 0 represents a note that has already been handled,
    301      and anything else is invalid.  */
    302   unsigned int type;
    303 };
    304 
    305 /* Represents the contents of a file cpplib has read in.  Buffers are
           stacked through `prev'; cpp_reader::buffer is the top of the
           stack.  */
    306 struct cpp_buffer
    307 {
    308   const unsigned char *cur;        /* Current location.  */
    309   const unsigned char *line_base;  /* Start of current physical line.  */
    310   const unsigned char *next_line;  /* Start of to-be-cleaned logical line.  */
    311 
    312   const unsigned char *buf;        /* Entire character buffer.  */
    313   const unsigned char *rlimit;     /* Writable byte at end of file.  */
    314   const unsigned char *to_free;	   /* Pointer that should be freed when
    315 				      popping the buffer.  */
    316 
    317   _cpp_line_note *notes;           /* Array of notes.  */
    318   unsigned int cur_note;           /* Next note to process.  */
    319   unsigned int notes_used;         /* Number of notes.  */
    320   unsigned int notes_cap;          /* Size of allocated array.  */
    321 
    322   struct cpp_buffer *prev;
    323 
    324   /* Pointer into the file table; non-NULL if this is a file buffer.
    325      Used for include_next and to record control macros.  */
    326   struct _cpp_file *file;
    327 
    328   /* Saved value of __TIMESTAMP__ macro - date and time of last modification
    329      of the associated file.  */
    330   const unsigned char *timestamp;
    331 
    332   /* Value of if_stack at start of this file.
    333      Used to prohibit unmatched #endif (etc) in an include file.  */
    334   struct if_stack *if_stack;
    335 
    336   /* True if we need to get the next clean line.  */
    337   bool need_line;
    338 
    339   /* True if we have already warned about C++ comments in this file.
    340      The warning happens only for C89 extended mode with -pedantic on,
    341      or for -Wtraditional, and only once per file (otherwise it would
    342      be far too noisy).  */
    343   unsigned int warned_cplusplus_comments : 1;
    344 
    345   /* True if we don't process trigraphs and escaped newlines.  True
    346      for preprocessed input, command line directives, and _Pragma
    347      buffers.  */
    348   unsigned int from_stage3 : 1;
    349 
    350   /* At EOF, a buffer is automatically popped.  If RETURN_AT_EOF is
    351      true, a CPP_EOF token is then returned.  Otherwise, the next
    352      token from the enclosing buffer is returned.  */
    353   unsigned int return_at_eof : 1;
    354 
    355   /* One for a system header, two for a C system header file that therefore
    356      needs to be extern "C" protected in C++, and zero otherwise.
             cpp_in_system_header returns this value for the current buffer.  */
    357   unsigned char sysp;
    358 
    359   /* The directory of this buffer's file.  Its NAME member is not
    360      allocated, so we don't need to worry about freeing it.  */
    361   struct cpp_dir dir;
    362 
    363   /* Descriptor for converting from the input character set to the
    364      source character set.  */
    365   struct cset_converter input_cset_desc;
    366 };
    367 
    368 /* The list of macros saved by the push_macro pragma.  The head of the
           list is cpp_reader::pushed_macros.  */
    369 struct def_pragma_macro {
    370   /* Chain element to previous saved macro.  */
    371   struct def_pragma_macro *next;
    372   /* Name of the macro.  */
    373   char *name;
    374   /* The stored macro content.  */
    375   unsigned char *definition;
    376 
    377   /* Definition line number.  */
    378   source_location line;
    379   /* If macro defined in system header.  */
    380   unsigned int syshdr   : 1;
    381   /* Nonzero if it has been expanded or had its existence tested.  */
    382   unsigned int used     : 1;
    383 
    384   /* Mark if we save an undefined macro.  */
    385   unsigned int is_undef : 1;
    386   /* Nonzero if it was a builtin macro.  */
    387   unsigned int is_builtin : 1;
    388 };
    389 
    390 /* A cpp_reader encapsulates the "state" of a pre-processor run.
    391    Applying cpp_get_token repeatedly yields a stream of pre-processor
    392    tokens.  Usually, there is only one cpp_reader object active.  */
    393 struct cpp_reader
    394 {
    395   /* Top of buffer stack.  */
    396   cpp_buffer *buffer;
    397 
    398   /* Overlaid buffer (can be different after processing #include).  */
    399   cpp_buffer *overlaid_buffer;
    400 
    401   /* Lexer state.  */
    402   struct lexer_state state;
    403 
    404   /* Source line tracking.  */
    405   struct line_maps *line_table;
    406 
    407   /* The line of the '#' of the current directive.  */
    408   source_location directive_line;
    409 
    410   /* Memory buffers.  */
    411   _cpp_buff *a_buff;		/* Aligned permanent storage.  */
    412   _cpp_buff *u_buff;		/* Unaligned permanent storage.  */
    413   _cpp_buff *free_buffs;	/* Free buffer chain.  */
    414 
    415   /* Context stack.  */
    416   struct cpp_context base_context;
    417   struct cpp_context *context;
    418 
    419   /* If in_directive, the directive if known.  */
    420   const struct directive *directive;
    421 
    422   /* Token generated while handling a directive, if any. */
    423   cpp_token directive_result;
    424 
    425   /* When expanding a macro at top-level, this is the location of the
    426      macro invocation.  */
    427   source_location invocation_location;
    428 
    429   /* This is the node representing the macro being expanded at
    430      top-level.  The value of this data member is valid iff
    431      in_macro_expansion_p() returns TRUE.  */
    432   cpp_hashnode *top_most_macro_node;
    433 
    434   /* Nonzero if we are about to expand a macro.  Note that if we are
    435      really expanding a macro, the function macro_of_context returns
    436      the macro being expanded and this flag is set to false.  Client
    437      code should use the function in_macro_expansion_p to know if we
    438      are either about to expand a macro, or are actually expanding
    439      one.  */
    440   bool about_to_expand_macro_p;
    441 
    442   /* Search paths for include files.  */
    443   struct cpp_dir *quote_include;	/* "" */
    444   struct cpp_dir *bracket_include;	/* <> */
    445   struct cpp_dir no_search_path;	/* No path.  */
    446 
    447   /* Chain of all hashed _cpp_file instances.  */
    448   struct _cpp_file *all_files;
    449 
    450   struct _cpp_file *main_file;
    451 
    452   /* File and directory hash table.  */
    453   struct htab *file_hash;
    454   struct htab *dir_hash;
    455   struct file_hash_entry_pool *file_hash_entries;
    456 
    457   /* Negative path lookup hash table.  */
    458   struct htab *nonexistent_file_hash;
    459   struct obstack nonexistent_file_ob;
    460 
    461   /* Nonzero means don't look for #include "foo" in the source-file
    462      directory.  */
    463   bool quote_ignores_source_dir;
    464 
    465   /* Nonzero if any file has contained #pragma once or #import has
    466      been used.  */
    467   bool seen_once_only;
    468 
    469   /* Multiple include optimization.  */
    470   const cpp_hashnode *mi_cmacro;
    471   const cpp_hashnode *mi_ind_cmacro;
    472   bool mi_valid;
    473 
    474   /* Lexing.  */
    475   cpp_token *cur_token;
    476   tokenrun base_run, *cur_run;
    477   unsigned int lookaheads;
    478 
    479   /* Nonzero prevents the lexer from re-using the token runs.  */
    480   unsigned int keep_tokens;
    481 
    482   /* Buffer to hold macro definition string.  */
    483   unsigned char *macro_buffer;
    484   unsigned int macro_buffer_len;
    485 
    486   /* Descriptor for converting from the source character set to the
    487      execution character set.  */
    488   struct cset_converter narrow_cset_desc;
    489 
    490   /* Descriptor for converting from the source character set to the
    491      UTF-8 execution character set.  */
    492   struct cset_converter utf8_cset_desc;
    493 
    494   /* Descriptor for converting from the source character set to the
    495      UTF-16 execution character set.  */
    496   struct cset_converter char16_cset_desc;
    497 
    498   /* Descriptor for converting from the source character set to the
    499      UTF-32 execution character set.  */
    500   struct cset_converter char32_cset_desc;
    501 
    502   /* Descriptor for converting from the source character set to the
    503      wide execution character set.  */
    504   struct cset_converter wide_cset_desc;
    505 
    506   /* Date and time text.  Calculated together if either is requested.  */
    507   const unsigned char *date;
    508   const unsigned char *time;
    509 
    510   /* Externally set timestamp to replace current date and time useful for
    511      reproducibility.  It should be initialized to -2 (not yet set) and
    512      set to -1 to disable it or to a non-negative value to enable it.  */
    513   time_t source_date_epoch;
    514 
    515   /* A token forcing paste avoidance, and the EOF token.  */
    516   cpp_token avoid_paste;
    517   cpp_token eof;
    518 
    519   /* Opaque handle to the dependencies of mkdeps.c.  */
    520   struct deps *deps;
    521 
    522   /* Obstack holding all macro hash nodes.  This never shrinks.
    523      See identifiers.c */
    524   struct obstack hash_ob;
    525 
    526   /* Obstack holding buffer and conditional structures.  This is a
    527      real stack.  See directives.c.  */
    528   struct obstack buffer_ob;
    529 
    530   /* Pragma table - dynamic, because a library user can add to the
    531      list of recognized pragmas.  */
    532   struct pragma_entry *pragmas;
    533 
    534   /* Call backs to cpplib client.  */
    535   struct cpp_callbacks cb;
    536 
    537   /* Identifier hash table.  */
    538   struct ht *hash_table;
    539 
    540   /* Expression parser stack.  */
    541   struct op *op_stack, *op_limit;
    542 
    543   /* User visible options.  Read through the CPP_OPTION macro.  */
    544   struct cpp_options opts;
    545 
    546   /* Special nodes - identifiers with predefined significance to the
    547      preprocessor.  */
    548   struct spec_nodes spec_nodes;
    549 
    550   /* Whether cpplib owns the hashtable.  */
    551   bool our_hashtable;
    552 
    553   /* Traditional preprocessing output buffer (a logical line).  */
    554   struct
    555   {
    556     unsigned char *base;
    557     unsigned char *limit;
    558     unsigned char *cur;
    559     source_location first_line;
    560   } out;
    561 
    562   /* Used for buffer overlays by traditional.c.  */
    563   const unsigned char *saved_cur, *saved_rlimit, *saved_line_base;
    564 
    565   /* A saved list of the defined macros, for dependency checking
    566      of precompiled headers.  */
    567   struct cpp_savedstate *savedstate;
    568 
    569   /* Next value of __COUNTER__ macro. */
    570   unsigned int counter;
    571 
    572   /* Table of comments, when state.save_comments is true.  */
    573   cpp_comment_table comments;
    574 
    575   /* List of saved macros by push_macro.  */
    576   struct def_pragma_macro *pushed_macros;
    577 
    578   /* If non-null, the lexer will use this location for the next token
    579      instead of getting a location from the linemap.  */
    580   source_location *forced_token_location_p;
    581 };
    582 
    583 /* Character classes.  Based on the more primitive macros in safe-ctype.h.
    584    If the definition of `numchar' looks odd to you, please look up the
    585    definition of a pp-number in the C standard [section 6.4.8 of C99].
    586 
    587    In the unlikely event that characters other than \r and \n enter
    588    the set is_vspace, the macro handle_newline() in lex.c must be
    589    updated.
        
           _dollar_ok, and therefore is_idchar and is_idstart, expand to a
           reference to a variable named `pfile' that is not a macro
           parameter; one must be in scope wherever they are used.  */
    590 #define _dollar_ok(x)	((x) == '$' && CPP_OPTION (pfile, dollars_in_ident))
    591 
    592 #define is_idchar(x)	(ISIDNUM(x) || _dollar_ok(x))
    593 #define is_numchar(x)	ISIDNUM(x)
    594 #define is_idstart(x)	(ISIDST(x) || _dollar_ok(x))
    595 #define is_numstart(x)	ISDIGIT(x)
    596 #define is_hspace(x)	ISBLANK(x)
    597 #define is_vspace(x)	IS_VSPACE(x)
    598 #define is_nvspace(x)	IS_NVSPACE(x)
    599 #define is_space(x)	IS_SPACE_OR_NUL(x)
    600 
    601 /* This table is constant if it can be initialized at compile time,
    602    which is the case if cpp was compiled with GCC >=2.7, or another
    603    compiler that supports C99.  It has one entry for every unsigned
           char value (UCHAR_MAX + 1 entries); only the const qualifier
           differs between the two declarations.  */
    604 #if HAVE_DESIGNATED_INITIALIZERS
    605 extern const unsigned char _cpp_trigraph_map[UCHAR_MAX + 1];
    606 #else
    607 extern unsigned char _cpp_trigraph_map[UCHAR_MAX + 1];
    608 #endif
    609 
    610 /* Macros and small inline helpers.  */
    611 
    612 static inline int cpp_in_system_header (cpp_reader *);
    613 static inline int
    614 cpp_in_system_header (cpp_reader *pfile)
    615 {
    616   return pfile->buffer ? pfile->buffer->sysp : 0;
    617 }
    618 #define CPP_PEDANTIC(PF) CPP_OPTION (PF, cpp_pedantic)	/* PF's cpp_pedantic option.  */
    619 #define CPP_WTRADITIONAL(PF) CPP_OPTION (PF, cpp_warn_traditional)	/* PF's cpp_warn_traditional option.  */
    620 
    621 static inline int cpp_in_primary_file (cpp_reader *);
    622 static inline int
    623 cpp_in_primary_file (cpp_reader *pfile)
    624 {
    625   return pfile->line_table->depth == 1;
    626 }
    627 
    628 /* In macro.c */
    629 extern void _cpp_free_definition (cpp_hashnode *);
    630 extern bool _cpp_create_definition (cpp_reader *, cpp_hashnode *);
    631 extern void _cpp_pop_context (cpp_reader *);
    632 extern void _cpp_push_text_context (cpp_reader *, cpp_hashnode *,
    633 				    const unsigned char *, size_t);
    634 extern bool _cpp_save_parameter (cpp_reader *, cpp_macro *, cpp_hashnode *,
    635 				 cpp_hashnode *);
    636 extern bool _cpp_arguments_ok (cpp_reader *, cpp_macro *, const cpp_hashnode *,
    637 			       unsigned int);
        /* The trailing source_location parameter has a default argument of 0.
           Default arguments are C++ syntax, so this header can only be
           compiled as C++ as written.  */
    638 extern const unsigned char *_cpp_builtin_macro_text (cpp_reader *,
    639 						     cpp_hashnode *,
    640 						     source_location = 0);
    641 extern int _cpp_warn_if_unused_macro (cpp_reader *, cpp_hashnode *, void *);
    642 extern void _cpp_push_token_context (cpp_reader *, cpp_hashnode *,
    643 				     const cpp_token *, unsigned int);
    644 extern void _cpp_backup_tokens_direct (cpp_reader *, unsigned int);
    645 
    646 /* In identifiers.c */
    647 extern void _cpp_init_hashtable (cpp_reader *, cpp_hash_table *);
    648 extern void _cpp_destroy_hashtable (cpp_reader *);
    649 
    650 /* In files.c */
        /* struct _cpp_file is only forward-declared in the visible part of
           this header, so it is handled purely through pointers here.  */
    651 typedef struct _cpp_file _cpp_file;
    652 extern _cpp_file *_cpp_find_file (cpp_reader *, const char *, cpp_dir *,
    653 				  bool, int, bool, source_location);
    654 extern bool _cpp_find_failed (_cpp_file *);
    655 extern void _cpp_mark_file_once_only (cpp_reader *, struct _cpp_file *);
    656 extern void _cpp_fake_include (cpp_reader *, const char *);
    657 extern bool _cpp_stack_file (cpp_reader *, _cpp_file*, bool,
    658 			     source_location);
    659 extern bool _cpp_stack_include (cpp_reader *, const char *, int,
    660 				enum include_type, source_location);
    661 extern int _cpp_compare_file_date (cpp_reader *, const char *, int);
    662 extern void _cpp_report_missing_guards (cpp_reader *);
    663 extern void _cpp_init_files (cpp_reader *);
    664 extern void _cpp_cleanup_files (cpp_reader *);
    665 extern void _cpp_pop_file_buffer (cpp_reader *, struct _cpp_file *,
    666 				  const unsigned char *);
        /* Some prototypes below use FILE and struct stat, which this header
           does not declare itself -- presumably the including file has
           already pulled in the system headers that provide them.  */
    667 extern bool _cpp_save_file_entries (cpp_reader *pfile, FILE *f);
    668 extern bool _cpp_read_file_entries (cpp_reader *, FILE *);
    669 extern const char *_cpp_get_file_name (_cpp_file *);
    670 extern struct stat *_cpp_get_file_stat (_cpp_file *);
    671 extern bool _cpp_has_header (cpp_reader *, const char *, int,
    672 			     enum include_type);
    673 
    674 /* In expr.c */
    675 extern bool _cpp_parse_expr (cpp_reader *, bool);
        /* struct op is only forward-declared in this header; cpp_reader keeps
           op_stack and op_limit pointers of the same type.  */
    676 extern struct op *_cpp_expand_op_stack (cpp_reader *);
    677 
    678 /* In lex.c */
    679 extern void _cpp_process_line_notes (cpp_reader *, int);
    680 extern void _cpp_clean_line (cpp_reader *);
    681 extern bool _cpp_get_fresh_line (cpp_reader *);
    682 extern bool _cpp_skip_block_comment (cpp_reader *);
        /* Note the constness: _cpp_lex_token hands back a const token, while
           _cpp_temp_token and _cpp_lex_direct return a writable one.  */
    683 extern cpp_token *_cpp_temp_token (cpp_reader *);
    684 extern const cpp_token *_cpp_lex_token (cpp_reader *);
    685 extern cpp_token *_cpp_lex_direct (cpp_reader *);
    686 extern unsigned char *_cpp_spell_ident_ucns (unsigned char *, cpp_hashnode *);
    687 extern int _cpp_equiv_tokens (const cpp_token *, const cpp_token *);
    688 extern void _cpp_init_tokenrun (tokenrun *, unsigned int);
    689 extern cpp_hashnode *_cpp_lex_identifier (cpp_reader *, const char *);
    690 extern int _cpp_remaining_tokens_num_in_context (cpp_context *);
    691 extern void _cpp_init_lexer (void);
    692 
    693 /* In init.c.  */
    694 extern void _cpp_maybe_push_include_file (cpp_reader *);
        /* Unlike its neighbours, this one is named without the `_cpp_'
           prefix.  */
    695 extern const char *cpp_named_operator2name (enum cpp_ttype type);
    696 extern void _cpp_restore_special_builtin (cpp_reader *pfile,
    697 					  struct def_pragma_macro *);
    698 
    699 /* In directives.c */
    700 extern int _cpp_test_assertion (cpp_reader *, unsigned int *);
    701 extern int _cpp_handle_directive (cpp_reader *, int);
    702 extern void _cpp_define_builtin (cpp_reader *, const char *);
        /* The char ** returned by _cpp_save_pragma_names has the same type as
           the second argument of _cpp_restore_pragma_names -- presumably the
           two are meant to be used as a pair; confirm in directives.c.  */
    703 extern char ** _cpp_save_pragma_names (cpp_reader *);
    704 extern void _cpp_restore_pragma_names (cpp_reader *, char **);
    705 extern int _cpp_do__Pragma (cpp_reader *, source_location);
    706 extern void _cpp_init_directives (cpp_reader *);
    707 extern void _cpp_init_internal_pragmas (cpp_reader *);
    708 extern void _cpp_do_file_change (cpp_reader *, enum lc_reason, const char *,
    709 				 linenum_type, unsigned int);
    710 extern void _cpp_pop_buffer (cpp_reader *);
    711 extern char *_cpp_bracket_include (cpp_reader *);
    712 
    713 /* In directives.c */
        /* Callback table passed (by const pointer) to
           _cpp_preprocess_dir_only.  */
    714 struct _cpp_dir_only_callbacks
    715 {
    716   /* Called to print a block of lines. */
    717   void (*print_lines) (int, const void *, size_t);
          /* NOTE(review): purpose not documented here; it receives a single
             source_location -- confirm at the call sites.  */
    718   void (*maybe_print_line) (source_location);
    719 };
    720 
    721 extern void _cpp_preprocess_dir_only (cpp_reader *,
    722 				      const struct _cpp_dir_only_callbacks *);
    723 
    724 /* In traditional.c.  */
    725 extern bool _cpp_scan_out_logical_line (cpp_reader *, cpp_macro *, bool);
    726 extern bool _cpp_read_logical_line_trad (cpp_reader *);
        /* cpp_reader's saved_cur, saved_rlimit and saved_line_base members are
           described as "used for buffer overlays by traditional.c" --
           presumably by the two overlay routines below; TODO confirm.  */
    727 extern void _cpp_overlay_buffer (cpp_reader *pfile, const unsigned char *,
    728 				 size_t);
    729 extern void _cpp_remove_overlay (cpp_reader *);
    730 extern bool _cpp_create_trad_definition (cpp_reader *, cpp_macro *);
    731 extern bool _cpp_expansions_different_trad (const cpp_macro *,
    732 					    const cpp_macro *);
    733 extern unsigned char *_cpp_copy_replacement_text (const cpp_macro *,
    734 						  unsigned char *);
    735 extern size_t _cpp_replacement_text_len (const cpp_macro *);
    736 
    737 /* In charset.c.  */
    738 
    739 /* The normalization state at this point in the sequence.
    740    It starts initialized to all zeros, and at the end
    741    'level' is the normalization level of the sequence.  */
    742 
    743 struct normalize_state
    744 {
    745   /* The previous starter character.  */
    746   cppchar_t previous;
    747   /* The combining class of the previous character (whether or not a
    748      starter).  */
    749   unsigned char prev_class;
    750   /* The lowest normalization level so far.  */
    751   enum cpp_normalize_level level;
    752 };
    753 #define INITIAL_NORMALIZE_STATE { 0, 0, normalized_KC }  /* Positional: previous, prev_class, level.  */
    754 #define NORMALIZE_STATE_RESULT(st) ((st)->level)  /* ST is a pointer to a struct normalize_state.  */
    755 
    756 /* We saw a character C that matches ISIDNUM(); update the
    757    normalize_state that ST points to: C is stored as the previous
           character and the previous combining class is reset to 0.  The
           'level' member is left untouched.  The expansion is a comma
           expression, so it can be used wherever an expression is allowed;
           ST is evaluated twice.  */
    758 #define NORMALIZE_STATE_UPDATE_IDNUM(st, c)	\
    759   ((st)->previous = (c), (st)->prev_class = 0)
    760 
    761 extern bool _cpp_valid_ucn (cpp_reader *, const unsigned char **,
    762 			    const unsigned char *, int,
    763 			    struct normalize_state *state,
    764 			    cppchar_t *,
    765 			    source_range *char_range,
    766 			    cpp_string_location_reader *loc_reader);
        /* In the prototype above, STATE, the cppchar_t *, CHAR_RANGE and
           LOC_READER are all pointers to non-const objects.  NOTE(review):
           presumably they are updated by the callee -- confirm at the
           definition.  */
    767 extern void _cpp_destroy_iconv (cpp_reader *);
        /* Returns a non-const unsigned char *.  NOTE(review): the roles of
           the two size_t arguments and the ownership of the returned buffer
           are not visible from this header -- confirm before use.  */
    768 extern unsigned char *_cpp_convert_input (cpp_reader *, const char *,
    769 					  unsigned char *, size_t, size_t,
    770 					  const unsigned char **, off_t *);
    771 extern const char *_cpp_default_encoding (void);
        /* ID is passed together with an explicit LEN.  NOTE(review):
           presumably ID need not be NUL-terminated -- confirm.  */
    772 extern cpp_hashnode * _cpp_interpret_identifier (cpp_reader *pfile,
    773 						 const unsigned char *id,
    774 						 size_t len);
    775 
    776 /* Utility routines and macros.  */
    777 #define DSC(str) (const unsigned char *)str, sizeof str - 1
        /* DSC expands to TWO comma-separated arguments: STR cast to
           const unsigned char *, followed by sizeof STR minus one.  Because
           the length comes from sizeof, STR must be a string literal or a
           char array (for which the result excludes the terminating NUL);
           passing a pointer would yield the pointer's size instead.  STR is
           not parenthesized in the expansion, so pass only a simple
           operand.  */
    778 
    779 /* These are inline functions instead of macros so we can get type
    780    checking.  Each one is defined further down in this header and
           forwards to the char-based routine whose name is the same without
           the leading 'u', casting its unsigned char arguments to plain
           char.  */
    781 static inline int ustrcmp (const unsigned char *, const unsigned char *);
    782 static inline int ustrncmp (const unsigned char *, const unsigned char *,
    783 			    size_t);
    784 static inline size_t ustrlen (const unsigned char *);
    785 static inline const unsigned char *uxstrdup (const unsigned char *);
    786 static inline const unsigned char *ustrchr (const unsigned char *, int);
    787 static inline int ufputs (const unsigned char *, FILE *);
    788 
    789 /* Use a const char for the second parameter since it is usually a literal.  */
    790 static inline int ustrcspn (const unsigned char *, const char *);
    791 
    792 static inline int
    793 ustrcmp (const unsigned char *s1, const unsigned char *s2)
    794 {
          /* Compare S1 and S2 with strcmp after viewing both as
             const char *; strcmp's result is returned unchanged.  */
    795   return strcmp ((const char *)s1, (const char *)s2);
    796 }
    797 
    798 static inline int
    799 ustrncmp (const unsigned char *s1, const unsigned char *s2, size_t n)
    800 {
          /* Compare at most N characters of S1 and S2 with strncmp after
             viewing both as const char *; strncmp's result is returned
             unchanged.  */
    801   return strncmp ((const char *)s1, (const char *)s2, n);
    802 }
    803 
    804 static inline int
    805 ustrcspn (const unsigned char *s1, const char *s2)
    806 {
          /* S2 is already plain char, so only S1 is cast.  strcspn yields a
             size_t; returning it through this function's int return type
             converts the value, so callers receive an int.  */
    807   return strcspn ((const char *)s1, s2);
    808 }
    809 
    810 static inline size_t
    811 ustrlen (const unsigned char *s1)
    812 {
          /* Length of S1 as reported by strlen on the same bytes viewed as
             const char *.  */
    813   return strlen ((const char *)s1);
    814 }
    815 
    816 static inline const unsigned char *
    817 uxstrdup (const unsigned char *s1)
    818 {
          /* Hand S1 to xstrdup (declared outside this header) and cast the
             result to const unsigned char *.  NOTE(review): presumably the
             result is a newly allocated copy owned by the caller -- confirm
             against xstrdup.  The return type is const-qualified, so a
             caller that releases the storage has to cast the qualifier
             away.  */
    819   return (const unsigned char *) xstrdup ((const char *)s1);
    820 }
    821 
    822 static inline const unsigned char *
    823 ustrchr (const unsigned char *s1, int c)
    824 {
          /* Search S1 for C with strchr and return its result (a null
             pointer when strchr finds no match) as const unsigned char *.  */
    825   return (const unsigned char *) strchr ((const char *)s1, c);
    826 }
    827 
    828 static inline int
    829 ufputs (const unsigned char *s, FILE *f)
    830 {
          /* Write S to stream F via fputs and return fputs's result
             unchanged.  */
    831   return fputs ((const char *)s, f);
    832 }
    833 
    834   /* In line-map.c.  */
    835 
    836 /* Create a macro map.  A macro map encodes source locations of tokens
    837    that are part of a macro replacement-list, at a macro expansion
    838    point. See the extensive comments of struct line_map and struct
    839    line_map_macro, in line-map.h.
    840 
    841    This map shall be created when the macro is expanded. The map
    842    encodes the source location of the expansion point of the macro as
    843    well as the "original" source location of each token that is part
    844    of the macro replacement-list. If a macro is defined but never
    845    expanded, it has no macro map.  SET is the set of maps the macro
    846    map should be part of.  MACRO_NODE is the macro which the new macro
    847    map should encode source locations for.  EXPANSION is the location
    848    of the expansion point of MACRO. For function-like macro
    849    invocations, it's best to make it point to the closing parenthesis
    850    of the macro, rather than the location of the first character
    851    of the macro.  NUM_TOKENS is the number of tokens that are part of
    852    the replacement-list of MACRO.  */
    853 const line_map_macro *linemap_enter_macro (struct line_maps * /* SET */,
    854 					   struct cpp_hashnode* /* MACRO_NODE */,
    855 					   source_location /* EXPANSION */,
    856 					   unsigned int /* NUM_TOKENS */);
    857 
    858 /* Create and return a virtual location for a token that is part of a
    859    macro expansion-list at a macro expansion point.  See the comment
    860    inside struct line_map_macro to see what an expansion-list exactly
    861    is.
    862 
    863    A call to this function must come after a call to
    864    linemap_enter_macro.
    865 
    866    MAP is the map into which the source location is created.  TOKEN_NO
    867    is the index of the token in the macro replacement-list, starting
    868    at number 0.
    869 
    870    ORIG_LOC is the location of the token outside of this macro
    871    expansion.  If the token comes originally from the macro
    872    definition, it is the locus in the macro definition; otherwise it
    873    is a location in the context of the caller of this macro expansion
    874    (which is a virtual location or a source location if the caller is
    875    itself a macro expansion or not).
    876 
    877    MACRO_DEFINITION_LOC is the location in the macro definition,
    878    either of the token itself or of a macro parameter that it
    879    replaces.  */
    880 source_location linemap_add_macro_token (const line_map_macro * /* MAP */,
    881 					 unsigned int /* TOKEN_NO */,
    882 					 source_location /* presumably ORIG_LOC -- order follows the comment above; confirm */,
    883 					 source_location /* presumably MACRO_DEFINITION_LOC -- confirm */);
    884 
    885 /* Return the source line number corresponding to source location
    886    LOCATION.  SET is the line map set LOCATION comes from.  If
    887    LOCATION is the location of a token that is part of the
    888    expansion-list of a macro expansion return the line number of the
    889    macro expansion point.  */
    890 int linemap_get_expansion_line (struct line_maps * /* SET */,
    891 				source_location /* LOCATION */);
    892 
    893 /* Return the path of the file corresponding to source code location
    894    LOCATION.
    895 
    896    If LOCATION is the location of a token that is part of the
    897    replacement-list of a macro expansion return the file path of the
    898    macro expansion point.
    899 
    900    SET is the line map set LOCATION comes from.  */
    901 const char* linemap_get_expansion_filename (struct line_maps * /* SET */,
    902 					    source_location /* LOCATION */);
    903 
    904 #ifdef __cplusplus
    905 }
    906 #endif
    907 
    908 #endif /* ! LIBCPP_INTERNAL_H */
    909