Home | History | Annotate | Line # | Download | only in libcpp
internal.h revision 1.12
      1 /* Part of CPP library.
      2    Copyright (C) 1997-2022 Free Software Foundation, Inc.
      3 
      4 This program is free software; you can redistribute it and/or modify it
      5 under the terms of the GNU General Public License as published by the
      6 Free Software Foundation; either version 3, or (at your option) any
      7 later version.
      8 
      9 This program is distributed in the hope that it will be useful,
     10 but WITHOUT ANY WARRANTY; without even the implied warranty of
     11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
     12 GNU General Public License for more details.
     13 
     14 You should have received a copy of the GNU General Public License
     15 along with this program; see the file COPYING3.  If not see
     16 <http://www.gnu.org/licenses/>.  */
     17 
     18 /* This header defines all the internal data structures and functions
     19    that need to be visible across files.  It should not be used outside
     20    cpplib.  */
     21 
     22 #ifndef LIBCPP_INTERNAL_H
     23 #define LIBCPP_INTERNAL_H
     24 
     25 #include "symtab.h"
     26 #include "cpplib.h"
     27 
     28 #if HAVE_ICONV
     29 #include <iconv.h>
     30 #else
     31 #define HAVE_ICONV 0
     32 typedef int iconv_t;  /* dummy */
     33 #endif
     34 
     35 #ifdef __cplusplus
     36 extern "C" {
     37 #endif
     38 
     39 struct directive;		/* Deliberately incomplete.  */
     40 struct pending_option;		/* Likewise incomplete here.  */
     41 struct op;			/* Likewise; only used through pointers.  */
     42 struct _cpp_strbuf;		/* Likewise; last parameter of convert_f.  */
     43 
        /* convert_f is the type of a conversion routine: it is passed an
           iconv_t, a byte pointer, a size_t and a struct _cpp_strbuf *, and
           returns bool.  NOTE(review): presumably (descriptor, input, input
           length, output buffer) -> success; confirm against charset.cc.  */
     44 typedef bool (*convert_f) (iconv_t, const unsigned char *, size_t,
     45 			   struct _cpp_strbuf *);
        /* Descriptor for one character set conversion.  cpp_buffer and
           cpp_reader below each embed instances of it.
           NOTE(review): the member meanings are not visible in this header;
           presumably FUNC is called with CD, WIDTH is a character width, and
           FROM/TO name the two character sets -- confirm before relying
           on it.  */
     46 struct cset_converter
     47 {
     48   convert_f func;
     49   iconv_t cd;
     50   int width;
     51   const char* from;
     52   const char* to;
     53 };
     54 
     55 #define BITS_PER_CPPCHAR_T (CHAR_BIT * sizeof (cppchar_t))	/* Number of bits in a cppchar_t.  */
     56 
     57 /* Test if a sign is valid within a preprocessing number: C must be
           '+' or '-', and PREVC must be 'e' or 'E', or else 'p' or 'P' with
           the extended_numbers option set.  The expansion refers to a
           variable named pfile, which must be in scope where the macro is
           used.  */
     58 #define VALID_SIGN(c, prevc) \
     59   (((c) == '+' || (c) == '-') && \
     60    ((prevc) == 'e' || (prevc) == 'E' \
     61     || (((prevc) == 'p' || (prevc) == 'P') \
     62         && CPP_OPTION (pfile, extended_numbers))))
     63 
        /* True if C is an apostrophe and the digit_separators option is set.
           The expansion refers to a variable named pfile, which must be in
           scope where the macro is used.  */
     64 #define DIGIT_SEP(c) ((c) == '\'' && CPP_OPTION (pfile, digit_separators))
     65 
        /* Accessors.  CPP_OPTION names field OPTION of PFILE's opts member,
           and CPP_BUFFER names PFILE's buffer member.  CPP_BUF_COLUMN is the
           pointer difference between CUR and BUF's line_base; CPP_BUF_COL is
           that difference for BUF's own cur pointer.  */
     66 #define CPP_OPTION(PFILE, OPTION) ((PFILE)->opts.OPTION)
     67 #define CPP_BUFFER(PFILE) ((PFILE)->buffer)
     68 #define CPP_BUF_COLUMN(BUF, CUR) ((CUR) - (BUF)->line_base)
     69 #define CPP_BUF_COL(BUF) CPP_BUF_COLUMN(BUF, (BUF)->cur)
     70 
     71 #define CPP_INCREMENT_LINE(PFILE, COLS_HINT) do { \
     72     const class line_maps *line_table = PFILE->line_table; \
     73     const struct line_map_ordinary *map = \
     74       LINEMAPS_LAST_ORDINARY_MAP (line_table); \
     75     linenum_type line = SOURCE_LINE (map, line_table->highest_line); \
     76     linemap_line_start (PFILE->line_table, line + 1, COLS_HINT); \
     77   } while (0)
     78 
     79 /* Host alignment handling.  struct dummy exists only so that the
           offset of its member u can be measured: u follows a single char,
           so its offset is the alignment the host gives to a union of a
           double and a pointer.  */
     80 struct dummy
     81 {
     82   char c;
     83   union
     84   {
     85     double d;
     86     int *p;
     87   } u;
     88 };
     89 
     90 #define DEFAULT_ALIGNMENT offsetof (struct dummy, u)
        /* CPP_ALIGN2 rounds SIZE up to a multiple of ALIGN.  The mask
           arithmetic is only correct when ALIGN is a power of two.  CPP_ALIGN
           does the same with DEFAULT_ALIGNMENT.  */
     91 #define CPP_ALIGN2(size, align) (((size) + ((align) - 1)) & ~((align) - 1))
     92 #define CPP_ALIGN(size) CPP_ALIGN2 (size, DEFAULT_ALIGNMENT)
     93 
        /* If cpp_user_macro_p (NODE) holds, set the used field of NODE's macro
           to 1 (the expression then has value 1); otherwise the expression is
           0.  NODE is evaluated more than once.  */
     94 #define _cpp_mark_macro_used(NODE) 					\
     95   (cpp_user_macro_p (NODE) ? (NODE)->value.macro->used = 1 : 0)
     96 
     97 /* A generic memory buffer, and operations on it.  Buffers can be
           chained through NEXT.  CUR is what BUFF_FRONT yields, and
           LIMIT - CUR is what BUFF_ROOM reports as the room left.
           NOTE(review): BASE is presumably the start of the storage --
           confirm against the allocator.  */
     98 typedef struct _cpp_buff _cpp_buff;
     99 struct _cpp_buff
    100 {
    101   struct _cpp_buff *next;
    102   unsigned char *base, *cur, *limit;
    103 };
    104 
        /* Only the prototypes are given here; the definitions are not part of
           this header.  */
    105 extern _cpp_buff *_cpp_get_buff (cpp_reader *, size_t);
    106 extern void _cpp_release_buff (cpp_reader *, _cpp_buff *);
    107 extern void _cpp_extend_buff (cpp_reader *, _cpp_buff **, size_t);
    108 extern _cpp_buff *_cpp_append_extend_buff (cpp_reader *, _cpp_buff *, size_t);
    109 extern void _cpp_free_buff (_cpp_buff *);
    110 extern unsigned char *_cpp_aligned_alloc (cpp_reader *, size_t);
    111 extern unsigned char *_cpp_unaligned_alloc (cpp_reader *, size_t);
    112 
    113 #define BUFF_ROOM(BUFF) (size_t) ((BUFF)->limit - (BUFF)->cur)
    114 #define BUFF_FRONT(BUFF) ((BUFF)->cur)
    115 #define BUFF_LIMIT(BUFF) ((BUFF)->limit)
    116 
    117 /* #include types.  The enumerators are ordered so that the two
           high-water marks at the end can classify a value with one
           comparison: values below IT_DIRECTIVE_HWM are the directive-based
           kinds, values below IT_HEADER_HWM additionally include IT_CMDLINE
           and IT_DEFAULT.  */
    118 enum include_type
    119   {
    120    /* Directive-based including mechanisms.  */
    121    IT_INCLUDE,  /* #include */
    122    IT_INCLUDE_NEXT,  /* #include_next */
    123    IT_IMPORT,   /* #import  */
    124 
    125    /* Non-directive including mechanisms.  */
    126    IT_CMDLINE,  /* -include */
    127    IT_DEFAULT,  /* forced header  */
    128    IT_MAIN,     /* main, start on line 1 */
    129    IT_PRE_MAIN,  /* main, but there will be a preamble before line
    130 		    1 */
    131 
    132    IT_DIRECTIVE_HWM = IT_IMPORT + 1,  /* Directives below this.  */
    133    IT_HEADER_HWM = IT_DEFAULT + 1     /* Header files below this.  */
    134   };
    135 
        /* A token reference in either of the two forms a cpp_context can
           hold: a pointer to a token, or a pointer to such a pointer.  Which
           member is live is recorded by cpp_context's tokens_kind.  */
    136 union utoken
    137 {
    138   const cpp_token *token;
    139   const cpp_token **ptoken;
    140 };
    141 
    142 /* A "run" of tokens; part of a chain of runs.  NEXT and PREV link the
           chain.  NOTE(review): BASE and LIMIT presumably delimit the run's
           token array (first token, one past the last) -- confirm in
           lex.cc.  */
    143 typedef struct tokenrun tokenrun;
    144 struct tokenrun
    145 {
    146   tokenrun *next, *prev;
    147   cpp_token *base, *limit;
    148 };
    149 
    150 /* Accessor macros for struct cpp_context.  FIRST and LAST name the
           members of the ISO arm of its union u; CUR and RLIMIT name the
           members of the traditional arm.  */
    151 #define FIRST(c) ((c)->u.iso.first)
    152 #define LAST(c) ((c)->u.iso.last)
    153 #define CUR(c) ((c)->u.trad.cur)
    154 #define RLIMIT(c) ((c)->u.trad.rlimit)
    155 
    156 /* This describes some additional data that is added to the macro
    157    token context of type cpp_context, when -ftrack-macro-expansion is
    158    on.  A cpp_context refers to an instance through its c.mc member
           when its tokens_kind is TOKENS_KIND_EXTENDED.  */
    159 typedef struct
    160 {
    161   /* The node of the macro we are referring to.  */
    162   cpp_hashnode *macro_node;
    163   /* This buffer contains an array of virtual locations.  The virtual
    164      location at index 0 is the virtual location of the token at index
    165      0 in the current instance of cpp_context; similarly for all the
    166      other virtual locations.  */
    167   location_t *virt_locs;
    168   /* This is a pointer to the current virtual location.  This is used
    169      to iterate over the virtual locations while we iterate over the
    170      tokens they belong to.  */
    171   location_t *cur_virt_loc;
    172 } macro_context;
    173 
    174 /* The kind of tokens carried by a cpp_context.  */
    175 enum context_tokens_kind {
    176   /* This is the value of cpp_context::tokens_kind if u.iso.first
    177      contains an instance of cpp_token **.  */
    178   TOKENS_KIND_INDIRECT,
    179   /* This is the value of cpp_context::tokens_kind if u.iso.first
    180      contains an instance of cpp_token *.  */
    181   TOKENS_KIND_DIRECT,
    182   /* This is the value of cpp_context::tokens_kind when the token
    183      context contains tokens resulting from macro expansion.  In that
    184      case cpp_context::c.mc points to an instance of struct
    185      macro_context.  This is used only when the
    186      -ftrack-macro-expansion flag is on.  */
    187   TOKENS_KIND_EXTENDED
    188 };
    189 
        /* One entry in the reader's stack of token contexts.  cpp_reader
           embeds the base context and keeps a pointer to the current one.  */
    190 typedef struct cpp_context cpp_context;
    191 struct cpp_context
    192 {
    193   /* Doubly-linked list.  */
    194   cpp_context *next, *prev;
    195 
    196   union
    197   {
    198     /* For ISO macro expansion.  Contexts other than the base context
    199        are contiguous tokens.  e.g. macro expansions, expanded
    200        argument tokens.  */
    201     struct
    202     {
    203       union utoken first;
    204       union utoken last;
    205     } iso;
    206 
    207     /* For traditional macro expansion.  */
    208     struct
    209     {
    210       const unsigned char *cur;
    211       const unsigned char *rlimit;
    212     } trad;
    213   } u;
    214 
    215   /* If non-NULL, a buffer used for storage related to this context.
    216      When the context is popped, the buffer is released.  */
    217   _cpp_buff *buff;
    218 
    219   /* If tokens_kind is TOKENS_KIND_EXTENDED, then (as we thus are in a
    220      macro context) this is a pointer to an instance of macro_context
         (member mc).
    221      Otherwise if tokens_kind is *not* TOKENS_KIND_EXTENDED, then, if
    222      we are in a macro context, this is a pointer to an instance of
    223      cpp_hashnode (member macro), representing the name of the macro
         this context is
    224      for.  If we are not in a macro context, then this is just NULL.
    225      Note that when tokens_kind is TOKENS_KIND_EXTENDED, the memory
    226      used by the instance of macro_context pointed to by this member
    227      is de-allocated upon de-allocation of the instance of struct
    228      cpp_context.  */
    229   union
    230   {
    231     macro_context *mc;
    232     cpp_hashnode *macro;
    233   } c;
    234 
    235   /* This determines the type of tokens held by this context.  */
    236   enum context_tokens_kind tokens_kind;
    237 };
    238 
        /* Flags and counters describing what the lexer is currently doing.
           cpp_reader embeds one instance as its state member.  */
    239 struct lexer_state
    240 {
    241   /* 1 if we're handling a directive.  2 if it's an include-like
    242      directive.  */
    243   unsigned char in_directive;
    244 
    245   /* Nonzero if in a directive that will handle padding tokens itself.
    246      #include needs this to avoid problems with computed include and
    247      spacing between tokens.  */
    248   unsigned char directive_wants_padding;
    249 
    250   /* True if we are skipping a failed conditional group.  */
    251   unsigned char skipping;
    252 
    253   /* Nonzero if in a directive that takes angle-bracketed headers.  */
    254   unsigned char angled_headers;
    255 
    256   /* Nonzero if in a #if or #elif directive.  */
    257   unsigned char in_expression;
    258 
    259   /* Nonzero to save comments.  Turned off if discard_comments, and in
    260      all directives apart from #define.  */
    261   unsigned char save_comments;
    262 
    263   /* Nonzero if lexing __VA_ARGS__ and __VA_OPT__ is valid.  */
    264   unsigned char va_args_ok;
    265 
    266   /* Nonzero if lexing poisoned identifiers is valid.  */
    267   unsigned char poisoned_ok;
    268 
    269   /* Nonzero to prevent macro expansion.  */
    270   unsigned char prevent_expansion;
    271 
    272   /* Nonzero when parsing arguments to a function-like macro.  */
    273   unsigned char parsing_args;
    274 
    275   /* Nonzero if prevent_expansion is true only because output is
    276      being discarded.  */
    277   unsigned char discarding_output;
    278 
    279   /* Nonzero to skip evaluating part of an expression.  Unlike the
         other members this is an unsigned int.  */
    280   unsigned int skip_eval;
    281 
    282   /* Nonzero when tokenizing a deferred pragma.  */
    283   unsigned char in_deferred_pragma;
    284 
    285   /* Count to token that is a header-name.  */
    286   unsigned char directive_file_token;
    287 
    288   /* Nonzero if the deferred pragma being handled allows macro expansion.  */
    289   unsigned char pragma_allow_expansion;
    290 
    291   /* Nonzero if _Pragma should not be interpreted.  */
    292   unsigned char ignore__Pragma;
    293 };
    294 
    295 /* Special nodes - identifiers with predefined significance.  */
    296 struct spec_nodes
    297 {
    298   cpp_hashnode *n_defined;		/* defined operator */
    299   cpp_hashnode *n_true;			/* C++ keyword true */
    300   cpp_hashnode *n_false;		/* C++ keyword false */
    301   cpp_hashnode *n__VA_ARGS__;		/* C99 vararg macros */
    302   cpp_hashnode *n__VA_OPT__;		/* C++ vararg macros */
    303 
          /* Row indices for n_modules below; M_HWM is the number of rows.  */
    304   enum {M_EXPORT, M_MODULE, M_IMPORT, M__IMPORT, M_HWM};
    305 
    306   /* C++20 modules, only set when module_directives is in effect.
    307      incoming variants [0], outgoing ones [1] */
    308   cpp_hashnode *n_modules[M_HWM][2];
    309 };
    310 
        /* A note attached to a position in a cleaned line.  cpp_buffer keeps
           an array of these in its notes member.  */
    311 typedef struct _cpp_line_note _cpp_line_note;
    312 struct _cpp_line_note
    313 {
    314   /* Location in the clean line the note refers to.  */
    315   const unsigned char *pos;
    316 
    317   /* Type of note.  The 9 'from' trigraph characters represent those
    318      trigraphs, '\\' an escaped newline, ' ' an escaped newline with
    319      intervening space, 0 represents a note that has already been handled,
    320      and anything else is invalid.  */
    321   unsigned int type;
    322 };
    323 
    324 /* Represents the contents of a file cpplib has read in.  Buffers are
           linked through PREV; cpp_reader's buffer member is the top of that
           stack.  */
    325 struct cpp_buffer
    326 {
    327   const unsigned char *cur;        /* Current location.  */
    328   const unsigned char *line_base;  /* Start of current physical line.  */
    329   const unsigned char *next_line;  /* Start of to-be-cleaned logical line.  */
    330 
    331   const unsigned char *buf;        /* Entire character buffer.  */
    332   const unsigned char *rlimit;     /* Writable byte at end of file.  */
    333   const unsigned char *to_free;	   /* Pointer that should be freed when
    334 				      popping the buffer.  */
    335 
    336   _cpp_line_note *notes;           /* Array of notes.  */
    337   unsigned int cur_note;           /* Next note to process.  */
    338   unsigned int notes_used;         /* Number of notes.  */
    339   unsigned int notes_cap;          /* Size of allocated array.  */
    340 
    341   struct cpp_buffer *prev;
    342 
    343   /* Pointer into the file table; non-NULL if this is a file buffer.
    344      Used for include_next and to record control macros.  */
    345   struct _cpp_file *file;
    346 
    347   /* Saved value of __TIMESTAMP__ macro - date and time of last modification
    348      of the associated file.  */
    349   const unsigned char *timestamp;
    350 
    351   /* Value of if_stack at start of this file.
    352      Used to prohibit unmatched #endif (etc) in an include file.  */
    353   struct if_stack *if_stack;
    354 
    355   /* True if we need to get the next clean line.  */
    356   bool need_line : 1;
    357 
    358   /* True if we have already warned about C++ comments in this file.
    359      The warning happens only for C89 extended mode with -pedantic on,
    360      or for -Wtraditional, and only once per file (otherwise it would
    361      be far too noisy).  */
    362   bool warned_cplusplus_comments : 1;
    363 
    364   /* True if we don't process trigraphs and escaped newlines.  True
    365      for preprocessed input, command line directives, and _Pragma
    366      buffers.  */
    367   bool from_stage3 : 1;
    368 
    369   /* At EOF, a buffer is automatically popped.  If RETURN_AT_EOF is
    370      true, a CPP_EOF token is then returned.  Otherwise, the next
    371      token from the enclosing buffer is returned.  */
    372   bool return_at_eof : 1;
    373 
    374   /* One for a system header, two for a C system header file that therefore
    375      needs to be extern "C" protected in C++, and zero otherwise.  */
    376   unsigned char sysp;
    377 
    378   /* The directory of this buffer's file.  Its NAME member is not
    379      allocated, so we don't need to worry about freeing it.  */
    380   struct cpp_dir dir;
    381 
    382   /* Descriptor for converting from the input character set to the
    383      source character set.  */
    384   struct cset_converter input_cset_desc;
    385 };
    386 
    387 /* The list of saved macros by push_macro pragma.  cpp_reader's
           pushed_macros member points to the head of this list.  */
    388 struct def_pragma_macro {
    389   /* Chain element to previous saved macro.  */
    390   struct def_pragma_macro *next;
    391   /* Name of the macro.  */
    392   char *name;
    393   /* The stored macro content.  */
    394   unsigned char *definition;
    395 
    396   /* Definition line number.  */
    397   location_t line;
    398   /* If macro defined in system header.  */
    399   unsigned int syshdr   : 1;
    400   /* Nonzero if it has been expanded or had its existence tested.  */
    401   unsigned int used     : 1;
    402 
    403   /* Mark if we save an undefined macro.  */
    404   unsigned int is_undef : 1;
    405   /* Nonzero if it was a builtin macro.  */
    406   unsigned int is_builtin : 1;
    407 };
    408 
    409 /* A cpp_reader encapsulates the "state" of a pre-processor run.
    410    Applying cpp_get_token repeatedly yields a stream of pre-processor
    411    tokens.  Usually, there is only one cpp_reader object active.
           The struct refers to class types and has a member function, so
           this header needs a C++ compiler.  */
    412 struct cpp_reader
    413 {
    414   /* Top of buffer stack.  */
    415   cpp_buffer *buffer;
    416 
    417   /* Overlaid buffer (can be different after processing #include).  */
    418   cpp_buffer *overlaid_buffer;
    419 
    420   /* Lexer state.  */
    421   struct lexer_state state;
    422 
    423   /* Source line tracking.  */
    424   class line_maps *line_table;
    425 
    426   /* The line of the '#' of the current directive.  */
    427   location_t directive_line;
    428 
    429   /* Memory buffers.  */
    430   _cpp_buff *a_buff;		/* Aligned permanent storage.  */
    431   _cpp_buff *u_buff;		/* Unaligned permanent storage.  */
    432   _cpp_buff *free_buffs;	/* Free buffer chain.  */
    433 
    434   /* Context stack.  */
    435   struct cpp_context base_context;
    436   struct cpp_context *context;
    437 
    438   /* If in_directive, the directive if known.  */
    439   const struct directive *directive;
    440 
    441   /* Token generated while handling a directive, if any. */
    442   cpp_token directive_result;
    443 
    444   /* When expanding a macro at top-level, this is the location of the
    445      macro invocation.  */
    446   location_t invocation_location;
    447 
    448   /* This is the node representing the macro being expanded at
    449      top-level.  The value of this data member is valid iff
    450      cpp_in_macro_expansion_p() returns TRUE.  */
    451   cpp_hashnode *top_most_macro_node;
    452 
    453   /* Nonzero if we are about to expand a macro.  Note that if we are
    454      really expanding a macro, the function macro_of_context returns
    455      the macro being expanded and this flag is set to false.  Client
    456      code should use the function cpp_in_macro_expansion_p to know if we
    457      are either about to expand a macro, or are actually expanding
    458      one.  */
    459   bool about_to_expand_macro_p;
    460 
    461   /* Search paths for include files.  */
    462   struct cpp_dir *quote_include;	/* "" */
    463   struct cpp_dir *bracket_include;	/* <> */
    464   struct cpp_dir no_search_path;	/* No path.  */
    465 
    466   /* Chain of all hashed _cpp_file instances.  */
    467   struct _cpp_file *all_files;
    468 
    469   struct _cpp_file *main_file;
    470 
    471   /* File and directory hash table.  */
    472   struct htab *file_hash;
    473   struct htab *dir_hash;
    474   struct file_hash_entry_pool *file_hash_entries;
    475 
    476   /* Negative path lookup hash table.  */
    477   struct htab *nonexistent_file_hash;
    478   struct obstack nonexistent_file_ob;
    479 
    480   /* Nonzero means don't look for #include "foo" in the source-file
    481      directory.  */
    482   bool quote_ignores_source_dir;
    483 
    484   /* Nonzero if any file has contained #pragma once or #import has
    485      been used.  */
    486   bool seen_once_only;
    487 
    488   /* Multiple include optimization.  */
    489   const cpp_hashnode *mi_cmacro;
    490   const cpp_hashnode *mi_ind_cmacro;
    491   bool mi_valid;
    492 
    493   /* Lexing.  */
    494   cpp_token *cur_token;
    495   tokenrun base_run, *cur_run;
    496   unsigned int lookaheads;
    497 
    498   /* Nonzero prevents the lexer from re-using the token runs.  */
    499   unsigned int keep_tokens;
    500 
    501   /* Buffer to hold macro definition string.  */
    502   unsigned char *macro_buffer;
    503   unsigned int macro_buffer_len;
    504 
    505   /* Descriptor for converting from the source character set to the
    506      execution character set.  */
    507   struct cset_converter narrow_cset_desc;
    508 
    509   /* Descriptor for converting from the source character set to the
    510      UTF-8 execution character set.  */
    511   struct cset_converter utf8_cset_desc;
    512 
    513   /* Descriptor for converting from the source character set to the
    514      UTF-16 execution character set.  */
    515   struct cset_converter char16_cset_desc;
    516 
    517   /* Descriptor for converting from the source character set to the
    518      UTF-32 execution character set.  */
    519   struct cset_converter char32_cset_desc;
    520 
    521   /* Descriptor for converting from the source character set to the
    522      wide execution character set.  */
    523   struct cset_converter wide_cset_desc;
    524 
    525   /* Date and time text.  Calculated together if either is requested.  */
    526   const unsigned char *date;
    527   const unsigned char *time;
    528 
    529   /* Time stamp, set idempotently lazily.  */
    530   time_t time_stamp;
    531   int time_stamp_kind; /* Or errno.  */
    532 
    533   /* A token forcing paste avoidance, and one demarking macro arguments.  */
    534   cpp_token avoid_paste;
    535   cpp_token endarg;
    536 
    537   /* Opaque handle to the dependencies of mkdeps.cc.  */
    538   class mkdeps *deps;
    539 
    540   /* Obstack holding all macro hash nodes.  This never shrinks.
    541      See identifiers.cc */
    542   struct obstack hash_ob;
    543 
    544   /* Obstack holding buffer and conditional structures.  This is a
    545      real stack.  See directives.cc.  */
    546   struct obstack buffer_ob;
    547 
    548   /* Pragma table - dynamic, because a library user can add to the
    549      list of recognized pragmas.  */
    550   struct pragma_entry *pragmas;
    551 
    552   /* Call backs to cpplib client.  */
    553   struct cpp_callbacks cb;
    554 
    555   /* Identifier hash table.  */
    556   struct ht *hash_table;
    557 
    558   /* Expression parser stack.  */
    559   struct op *op_stack, *op_limit;
    560 
    561   /* User visible options.  */
    562   struct cpp_options opts;
    563 
    564   /* Special nodes - identifiers with predefined significance to the
    565      preprocessor.  */
    566   struct spec_nodes spec_nodes;
    567 
    568   /* Whether cpplib owns the hashtable.  */
    569   bool our_hashtable;
    570 
    571   /* Traditional preprocessing output buffer (a logical line).  */
    572   struct
    573   {
    574     unsigned char *base;
    575     unsigned char *limit;
    576     unsigned char *cur;
    577     location_t first_line;
    578   } out;
    579 
    580   /* Used for buffer overlays by traditional.cc.  */
    581   const unsigned char *saved_cur, *saved_rlimit, *saved_line_base;
    582 
    583   /* A saved list of the defined macros, for dependency checking
    584      of precompiled headers.  */
    585   struct cpp_savedstate *savedstate;
    586 
    587   /* Next value of __COUNTER__ macro. */
    588   unsigned int counter;
    589 
    590   /* Table of comments, when state.save_comments is true.  */
    591   cpp_comment_table comments;
    592 
    593   /* List of saved macros by push_macro.  */
    594   struct def_pragma_macro *pushed_macros;
    595 
    596   /* If non-zero, the lexer will use this location for the next token
    597      instead of getting a location from the linemap.  */
    598   location_t forced_token_location;
    599 
    600   /* Location identifying the main source file -- intended to be line
    601      zero of said file.  */
    602   location_t main_loc;
    603 
    604   /* Returns true iff we should warn about UTF-8 bidirectional control
    605      characters, i.e. iff the cpp_warn_bidirectional option has either
         the bidirectional_unpaired or the bidirectional_any bit set.  */
    606   bool warn_bidi_p () const
    607   {
    608     return (CPP_OPTION (this, cpp_warn_bidirectional)
    609 	    & (bidirectional_unpaired|bidirectional_any));
    610   }
    611 };
    612 
    613 /* Character classes.  Based on the more primitive macros in safe-ctype.h.
    614    If the definition of `numchar' looks odd to you, please look up the
    615    definition of a pp-number in the C standard [section 6.4.8 of C99].
    616 
    617    In the unlikely event that characters other than \r and \n enter
    618    the set is_vspace, the macro handle_newline() in lex.cc must be
    619    updated.

           _dollar_ok, and through it is_idchar and is_idstart, expand to a use
           of a variable named pfile, which must be in scope at the point of
           use.  */
    620 #define _dollar_ok(x)	((x) == '$' && CPP_OPTION (pfile, dollars_in_ident))
    621 
    622 #define is_idchar(x)	(ISIDNUM(x) || _dollar_ok(x))
    623 #define is_numchar(x)	ISIDNUM(x)
    624 #define is_idstart(x)	(ISIDST(x) || _dollar_ok(x))
    625 #define is_numstart(x)	ISDIGIT(x)
    626 #define is_hspace(x)	ISBLANK(x)
    627 #define is_vspace(x)	IS_VSPACE(x)
    628 #define is_nvspace(x)	IS_NVSPACE(x)
    629 #define is_space(x)	IS_SPACE_OR_NUL(x)
    630 
        /* True if the token just before pfile->cur_token has type CPP_EOF.
           This also needs a variable named pfile in scope.  */
    631 #define SEEN_EOL() (pfile->cur_token[-1].type == CPP_EOF)
    632 
    633 /* This table is constant if it can be initialized at compile time,
    634    which is the case if cpp was compiled with GCC >=2.7, or another
    635    compiler that supports C99.  It has one entry per unsigned char
           value.  */
    636 #if HAVE_DESIGNATED_INITIALIZERS
    637 extern const unsigned char _cpp_trigraph_map[UCHAR_MAX + 1];
    638 #else
    639 extern unsigned char _cpp_trigraph_map[UCHAR_MAX + 1];
    640 #endif
    641 
    642 #if !defined (HAVE_UCHAR) && !defined (IN_GCC)
    643 typedef unsigned char uchar;	/* Only when neither macro is defined.  */
    644 #endif
    645 
    646 #define UC (const uchar *)  /* Intended use: UC"string" */
    647 
    648 /* Accessors.  */
    649 
    650 inline int
    651 _cpp_in_system_header (cpp_reader *pfile)
    652 {
    653   return pfile->buffer ? pfile->buffer->sysp : 0;
    654 }
    655 #define CPP_PEDANTIC(PF) CPP_OPTION (PF, cpp_pedantic)	/* The cpp_pedantic option of PF.  */
    656 #define CPP_WTRADITIONAL(PF) CPP_OPTION (PF, cpp_warn_traditional)	/* The cpp_warn_traditional option of PF.  */
    657 
    658 /* Return true if we're in the main file (unless it's considered to be
    659    an include file in its own right.  */
    660 inline int
    661 _cpp_in_main_source_file (cpp_reader *pfile)
    662 {
    663   return (!CPP_OPTION (pfile, main_search)
    664 	  && pfile->buffer->file == pfile->main_file);
    665 }
    666 
    667 /* True if NODE is a macro for the purposes of ifdef, defined etc.  */
    668 inline bool _cpp_defined_macro_p (cpp_hashnode *node)
    669 {
    670   /* Do not treat conditional macros as being defined.  This is due to
    671      the powerpc port using conditional macros for 'vector', 'bool',
    672      and 'pixel' to act as conditional keywords.  This messes up tests
    673      like #ifndef bool.  */
    674   return cpp_macro_p (node) && !(node->flags & NODE_CONDITIONAL);
    675 }
    676 
    677 /* In macro.cc.  Called by _cpp_maybe_notify_macro_use when NODE does
           not yet have NODE_USED set; its bool result is passed back to that
           caller.  */
    678 extern bool _cpp_notify_macro_use (cpp_reader *pfile, cpp_hashnode *node,
    679 				   location_t);
    680 inline bool _cpp_maybe_notify_macro_use (cpp_reader *pfile, cpp_hashnode *node,
    681 					 location_t loc)
    682 {
    683   if (!(node->flags & NODE_USED))
    684     return _cpp_notify_macro_use (pfile, node, loc);
    685   return true;
    686 }
    687 extern cpp_macro *_cpp_new_macro (cpp_reader *, cpp_macro_kind, void *);
    688 extern void _cpp_free_definition (cpp_hashnode *);
    689 extern bool _cpp_create_definition (cpp_reader *, cpp_hashnode *);
    690 extern void _cpp_pop_context (cpp_reader *);
    691 extern void _cpp_push_text_context (cpp_reader *, cpp_hashnode *,
    692 				    const unsigned char *, size_t);
    693 extern bool _cpp_save_parameter (cpp_reader *, unsigned, cpp_hashnode *,
    694 				 cpp_hashnode *);
    695 extern void _cpp_unsave_parameters (cpp_reader *, unsigned);
    696 extern bool _cpp_arguments_ok (cpp_reader *, cpp_macro *, const cpp_hashnode *,
    697 			       unsigned int);
        /* The location_t parameter has a default argument of 0, which is
           C++-only syntax.  */
    698 extern const unsigned char *_cpp_builtin_macro_text (cpp_reader *,
    699 						     cpp_hashnode *,
    700 						     location_t = 0);
    701 extern int _cpp_warn_if_unused_macro (cpp_reader *, cpp_hashnode *, void *);
    702 extern void _cpp_push_token_context (cpp_reader *, cpp_hashnode *,
    703 				     const cpp_token *, unsigned int);
    704 extern void _cpp_backup_tokens_direct (cpp_reader *, unsigned int);
    705 
    706 /* In identifiers.cc.  NOTE(review): by their names these set up and
           tear down the reader's identifier hash table (cpp_reader's
           hash_table member) -- confirm in identifiers.cc.  */
    707 extern void _cpp_init_hashtable (cpp_reader *, cpp_hash_table *);
    708 extern void _cpp_destroy_hashtable (cpp_reader *);
    709 
    710 /* In files.cc.  The type _cpp_file is only ever used through pointers
           in this header; its definition is not visible here.  */
    711 enum _cpp_find_file_kind
    712   { _cpp_FFK_NORMAL, _cpp_FFK_FAKE, _cpp_FFK_PRE_INCLUDE, _cpp_FFK_HAS_INCLUDE };
    713 extern _cpp_file *_cpp_find_file (cpp_reader *, const char *, cpp_dir *,
    714 				  int angle, _cpp_find_file_kind, location_t);
    715 extern bool _cpp_find_failed (_cpp_file *);
    716 extern void _cpp_mark_file_once_only (cpp_reader *, struct _cpp_file *);
    717 extern const char *_cpp_find_header_unit (cpp_reader *, const char *file,
    718 					  bool angle_p,  location_t);
    719 extern void _cpp_fake_include (cpp_reader *, const char *);
    720 extern bool _cpp_stack_file (cpp_reader *, _cpp_file*, include_type, location_t);
    721 extern bool _cpp_stack_include (cpp_reader *, const char *, int,
    722 				enum include_type, location_t);
    723 extern int _cpp_compare_file_date (cpp_reader *, const char *, int);
    724 extern void _cpp_report_missing_guards (cpp_reader *);
    725 extern void _cpp_init_files (cpp_reader *);
    726 extern void _cpp_cleanup_files (cpp_reader *);
    727 extern void _cpp_pop_file_buffer (cpp_reader *, struct _cpp_file *,
    728 				  const unsigned char *);
    729 extern bool _cpp_save_file_entries (cpp_reader *pfile, FILE *f);
    730 extern bool _cpp_read_file_entries (cpp_reader *, FILE *);
    731 extern const char *_cpp_get_file_name (_cpp_file *);
    732 extern struct stat *_cpp_get_file_stat (_cpp_file *);
    733 extern bool _cpp_has_header (cpp_reader *, const char *, int,
    734 			     enum include_type);
    735 
    736 /* In expr.cc.  NOTE(review): _cpp_expand_op_stack presumably grows the
           expression parser stack held in cpp_reader's op_stack and op_limit
           members and returns a pointer into it -- confirm in expr.cc.  */
    737 extern bool _cpp_parse_expr (cpp_reader *, bool);
    738 extern struct op *_cpp_expand_op_stack (cpp_reader *);
    739 
    740 /* In lex.cc.  Prototypes only; none of these is defined in this
           header.  */
    741 extern void _cpp_process_line_notes (cpp_reader *, int);
    742 extern void _cpp_clean_line (cpp_reader *);
    743 extern bool _cpp_get_fresh_line (cpp_reader *);
    744 extern bool _cpp_skip_block_comment (cpp_reader *);
    745 extern cpp_token *_cpp_temp_token (cpp_reader *);
    746 extern const cpp_token *_cpp_lex_token (cpp_reader *);
    747 extern cpp_token *_cpp_lex_direct (cpp_reader *);
    748 extern unsigned char *_cpp_spell_ident_ucns (unsigned char *, cpp_hashnode *);
    749 extern int _cpp_equiv_tokens (const cpp_token *, const cpp_token *);
    750 extern void _cpp_init_tokenrun (tokenrun *, unsigned int);
    751 extern cpp_hashnode *_cpp_lex_identifier (cpp_reader *, const char *);
    752 extern int _cpp_remaining_tokens_num_in_context (cpp_context *);
    753 extern void _cpp_init_lexer (void);
    754 static inline void *_cpp_reserve_room (cpp_reader *pfile, size_t have,
    755 				       size_t extra)
    756 {
    757   if (BUFF_ROOM (pfile->a_buff) < (have + extra))
    758     _cpp_extend_buff (pfile, &pfile->a_buff, extra);
    759   return BUFF_FRONT (pfile->a_buff);
    760 }
    761 extern void *_cpp_commit_buff (cpp_reader *pfile, size_t size);	/* Prototype only; defined elsewhere.  */
    762 
    763 /* In init.cc.  Note that cpp_named_operator2name, unlike its
           neighbours, has no leading underscore in its name.  */
    764 extern void _cpp_maybe_push_include_file (cpp_reader *);
    765 extern const char *cpp_named_operator2name (enum cpp_ttype type);
    766 extern void _cpp_restore_special_builtin (cpp_reader *pfile,
    767 					  struct def_pragma_macro *);
    768 
    769 /* In directives.cc */
    770 extern int _cpp_test_assertion (cpp_reader *, unsigned int *);
    771 extern int _cpp_handle_directive (cpp_reader *, bool);
    772 extern void _cpp_define_builtin (cpp_reader *, const char *);
    773 extern char ** _cpp_save_pragma_names (cpp_reader *);
    774 extern void _cpp_restore_pragma_names (cpp_reader *, char **);
    775 extern int _cpp_do__Pragma (cpp_reader *, location_t);
    776 extern void _cpp_init_directives (cpp_reader *);
    777 extern void _cpp_init_internal_pragmas (cpp_reader *);
    778 extern void _cpp_do_file_change (cpp_reader *, enum lc_reason, const char *,
    779 				 linenum_type, unsigned int);
    780 extern void _cpp_pop_buffer (cpp_reader *);
    781 extern char *_cpp_bracket_include (cpp_reader *);
    782 
    783 /* In errors.cc  */
    784 extern location_t cpp_diagnostic_get_current_location (cpp_reader *);
    785 
    786 /* In traditional.cc.  */
    787 extern bool _cpp_scan_out_logical_line (cpp_reader *, cpp_macro *, bool);
    788 extern bool _cpp_read_logical_line_trad (cpp_reader *);
    789 extern void _cpp_overlay_buffer (cpp_reader *pfile, const unsigned char *,
    790 				 size_t);
    791 extern void _cpp_remove_overlay (cpp_reader *);
    792 extern cpp_macro *_cpp_create_trad_definition (cpp_reader *);
    793 extern bool _cpp_expansions_different_trad (const cpp_macro *,
    794 					    const cpp_macro *);
    795 extern unsigned char *_cpp_copy_replacement_text (const cpp_macro *,
    796 						  unsigned char *);
    797 extern size_t _cpp_replacement_text_len (const cpp_macro *);
    798 
    799 /* In charset.cc.  */
    800 
    801 /* The normalization state at this point in the sequence.
    802    It starts initialized to all zeros (see INITIAL_NORMALIZE_STATE),
    803    and at the end 'level' is the normalization level of the
           sequence (read it with NORMALIZE_STATE_RESULT).  */
    804 
    805 struct normalize_state
    806 {
    807   /* The previous starter character.  */
    808   cppchar_t previous;
    809   /* The combining class of the previous character (whether or not a
    810      starter).  */
    811   unsigned char prev_class;
    812   /* The lowest normalization level so far.  */
    813   enum cpp_normalize_level level;
    814 };
    815 #define INITIAL_NORMALIZE_STATE { 0, 0, normalized_KC }
    816 #define NORMALIZE_STATE_RESULT(st) ((st)->level)
    817 
    818 /* We saw a character C that matches ISIDNUM(); update the
    819    normalize_state ST accordingly.  */
    820 #define NORMALIZE_STATE_UPDATE_IDNUM(st, c)	\
    821   ((st)->previous = (c), (st)->prev_class = 0)
    822 
    823 extern bool _cpp_valid_ucn (cpp_reader *, const unsigned char **,
    824 			    const unsigned char *, int,
    825 			    struct normalize_state *state,
    826 			    cppchar_t *,
    827 			    source_range *char_range,
    828 			    cpp_string_location_reader *loc_reader);
    829 
    830 extern bool _cpp_valid_utf8 (cpp_reader *pfile,
    831 			     const uchar **pstr,
    832 			     const uchar *limit,
    833 			     int identifier_pos,
    834 			     struct normalize_state *nst,
    835 			     cppchar_t *cp);
    836 
    837 extern void _cpp_destroy_iconv (cpp_reader *);
    838 extern unsigned char *_cpp_convert_input (cpp_reader *, const char *,
    839 					  unsigned char *, size_t, size_t,
    840 					  const unsigned char **, off_t *);
    841 extern const char *_cpp_default_encoding (void);
    842 extern cpp_hashnode * _cpp_interpret_identifier (cpp_reader *pfile,
    843 						 const unsigned char *id,
    844 						 size_t len);
    845 
    846 /* Utility routines and macros.  */
        /* DSC (STR) expands to two comma-separated arguments: STR cast to
           const unsigned char *, followed by sizeof STR - 1 (for a string
           literal, its length without the terminating NUL).  STR is pasted
           into the expansion unparenthesized, so pass a plain string
           literal or array name.  */
    847 #define DSC(str) (const unsigned char *)str, sizeof str - 1
    848 
    849 /* These are inline functions instead of macros so we can get type
    850    checking.  */
    851 static inline int ustrcmp (const unsigned char *, const unsigned char *);
    852 static inline int ustrncmp (const unsigned char *, const unsigned char *,
    853 			    size_t);
    854 static inline size_t ustrlen (const unsigned char *);
    855 static inline const unsigned char *uxstrdup (const unsigned char *);
    856 static inline const unsigned char *ustrchr (const unsigned char *, int);
    857 static inline int ufputs (const unsigned char *, FILE *);
    858 
    859 /* Use a const char for the second parameter since it is usually a literal.  */
    860 static inline int ustrcspn (const unsigned char *, const char *);
    861 
/* Compare the NUL-terminated strings S1 and S2 by handing both to
   strcmp as plain char strings; the result is strcmp's result.  */
static inline int
ustrcmp (const unsigned char *s1, const unsigned char *s2)
{
  const char *lhs = (const char *) s1;
  const char *rhs = (const char *) s2;

  return strcmp (lhs, rhs);
}
    867 
/* Compare at most N bytes of S1 and S2 by handing both to strncmp as
   plain char strings; the result is strncmp's result.  */
static inline int
ustrncmp (const unsigned char *s1, const unsigned char *s2, size_t n)
{
  const char *lhs = (const char *) s1;
  const char *rhs = (const char *) s2;

  return strncmp (lhs, rhs, n);
}
    873 
/* Run strcspn on S1 (viewed as a char string) with the reject set S2
   and return its result.  S2 is a plain const char * because callers
   usually pass a literal.  */
static inline int
ustrcspn (const unsigned char *s1, const char *s2)
{
  const char *text = (const char *) s1;
  size_t span = strcspn (text, s2);

  /* The size_t result is converted to the int return type here.  */
  return span;
}
    879 
/* Return strlen of S1, viewed as a plain char string.  */
static inline size_t
ustrlen (const unsigned char *s1)
{
  const char *text = (const char *) s1;

  return strlen (text);
}
    885 
/* Pass S1 (viewed as a plain char string) to xstrdup and return the
   result as a const unsigned char pointer.  */
static inline const unsigned char *
uxstrdup (const unsigned char *s1)
{
  const char *text = (const char *) s1;
  char *copy = xstrdup (text);

  return (const unsigned char *) copy;
}
    891 
/* Search S1 (viewed as a plain char string) for C with strchr and
   return strchr's result as a const unsigned char pointer.  */
static inline const unsigned char *
ustrchr (const unsigned char *s1, int c)
{
  const char *text = (const char *) s1;
  const char *hit = strchr (text, c);

  return (const unsigned char *) hit;
}
    897 
/* Write S (viewed as a plain char string) to F with fputs and return
   fputs's result.  */
static inline int
ufputs (const unsigned char *s, FILE *f)
{
  const char *text = (const char *) s;

  return fputs (text, f);
}
    903 
    904 /* In line-map.cc.  */
    905 
    906 /* Create and return a virtual location for a token that is part of a
    907    macro expansion-list at a macro expansion point.  See the comment
    908    inside struct line_map_macro to see what an expansion-list exactly
    909    is.
    910 
    911    A call to this function must come after a call to
    912    linemap_enter_macro.
    913 
    914    MAP is the map into which the source location is created.  TOKEN_NO
    915    is the index of the token in the macro replacement-list, starting
    916    at number 0.
    917 
    918    ORIG_LOC is the location of the token outside of this macro
    919    expansion.  If the token comes originally from the macro
    920    definition, it is the locus in the macro definition; otherwise it
    921    is a location in the context of the caller of this macro expansion
    922    (a virtual location if the caller is itself a macro expansion,
    923    or a source location otherwise).
    924 
    925    MACRO_DEFINITION_LOC is the location in the macro definition,
    926    either of the token itself or of a macro parameter that it
    927    replaces.  */
    928 location_t linemap_add_macro_token (const line_map_macro *,
    929 				    unsigned int,
    930 				    location_t,
    931 				    location_t);
    932 
    933 /* Return the source line number corresponding to source location
    934    LOCATION.  SET is the line map set LOCATION comes from.  If
    935    LOCATION is the location of a token that is part of the
    936    expansion-list of a macro expansion, return the line number of
    937    the macro expansion point.  */
    938 int linemap_get_expansion_line (class line_maps *,
    939 				location_t);
    940 
    941 /* Return the path of the file corresponding to source code location
    942    LOCATION.
    943 
    944    If LOCATION is the location of a token that is part of the
    945    replacement-list of a macro expansion, return the file path of
    946    the macro expansion point.
    947 
    948    SET is the line map set LOCATION comes from.  */
    949 const char* linemap_get_expansion_filename (class line_maps *,
    950 					    location_t);
    951 
    952 /* A subclass of rich_location for emitting a diagnostic
    953    at the current location of the reader, but flagging
    954    it with set_escape_on_output (true).  */
    955 class encoding_rich_location : public rich_location
    956 {
    957  public:
    958   encoding_rich_location (cpp_reader *pfile)
    959   : rich_location (pfile->line_table,
    960 		   cpp_diagnostic_get_current_location (pfile))
    961   {
    962     set_escape_on_output (true);
    963   }
    964 
    965   encoding_rich_location (cpp_reader *pfile, location_t loc)
    966   : rich_location (pfile->line_table, loc)
    967   {
    968     set_escape_on_output (true);
    969   }
    970 };
    971 
    972 #ifdef __cplusplus
    973 }
    974 #endif
    975 
    976 #endif /* ! LIBCPP_INTERNAL_H */
    977