1/* Part of CPP library.
2   Copyright (C) 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2007,
3   2008, 2009 Free Software Foundation, Inc.
4
5This program is free software; you can redistribute it and/or modify it
6under the terms of the GNU General Public License as published by the
7Free Software Foundation; either version 3, or (at your option) any
8later version.
9
10This program is distributed in the hope that it will be useful,
11but WITHOUT ANY WARRANTY; without even the implied warranty of
12MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
13GNU General Public License for more details.
14
15You should have received a copy of the GNU General Public License
16along with this program; see the file COPYING3.  If not see
17<http://www.gnu.org/licenses/>.  */
18
19/* This header defines all the internal data structures and functions
20   that need to be visible across files.  It should not be used outside
21   cpplib.  */
22
23#ifndef LIBCPP_INTERNAL_H
24#define LIBCPP_INTERNAL_H
25
26#include "symtab.h"
27#include "cpp-id-data.h"
28
29#if HAVE_ICONV
30#include <iconv.h>
31#else
32#define HAVE_ICONV 0
33typedef int iconv_t;  /* dummy */
34#endif
35
36#ifdef __cplusplus
37extern "C" {
38#endif
39
/* Structure tags that this header only ever refers to through
   pointers; they are declared here and not defined in this file.  */
struct _cpp_strbuf;
struct directive;		/* Deliberately incomplete.  */
struct op;
struct pending_option;
44
/* Pointer to a character set conversion routine.  It is handed an
   iconv_t, a byte pointer together with a size_t (presumably the
   input and its length -- confirm against charset.c) and a
   struct _cpp_strbuf pointer, and yields a bool.  */
typedef bool (*convert_f) (iconv_t,
			   const unsigned char *,
			   size_t,
			   struct _cpp_strbuf *);

/* A conversion routine bundled with the iconv_t and the width that
   go with it.  */
struct cset_converter
{
  convert_f func;
  iconv_t cd;
  int width;
};
53
/* Number of bits occupied by a cppchar_t.  */
#define BITS_PER_CPPCHAR_T (sizeof (cppchar_t) * CHAR_BIT)
55
/* Nonzero if CH is a sign that may appear inside a preprocessing
   number directly after PREV: CH must be '+' or '-', and PREV must be
   'e' or 'E', or else 'p' or 'P' while the extended_numbers option is
   enabled.  The option is read through a variable named pfile, which
   must be in scope wherever this macro is used.  */
#define VALID_SIGN(CH, PREV)					\
  (((CH) == '+' || (CH) == '-')					\
   && ((PREV) == 'e' || (PREV) == 'E'				\
       || (((PREV) == 'p' || (PREV) == 'P')			\
	   && CPP_OPTION (pfile, extended_numbers))))
62
/* Shorthand accessors.  CPP_OPTION reads member NAME of the opts
   member of READER; CPP_BUFFER reads READER's buffer member.
   CPP_BUF_COLUMN is the distance from B's line_base to POS, and
   CPP_BUF_COL is that distance for B's own cur pointer.  */
#define CPP_OPTION(READER, NAME) ((READER)->opts.NAME)
#define CPP_BUFFER(READER) ((READER)->buffer)
#define CPP_BUF_COLUMN(B, POS) ((POS) - (B)->line_base)
#define CPP_BUF_COL(B) CPP_BUF_COLUMN (B, (B)->cur)
67
/* Start the line that follows the highest line recorded so far.
   Looks up the last map in use in PFILE's line table, converts the
   table's highest_line to a source line number with SOURCE_LINE, and
   calls linemap_line_start for that number plus one, passing
   COLS_HINT through.

   PFILE is evaluated twice.  Both macro arguments are parenthesized
   in the expansion so that any expression (for example `&reader')
   can be passed safely.  */
#define CPP_INCREMENT_LINE(PFILE, COLS_HINT) do { \
    const struct line_maps *line_table = (PFILE)->line_table; \
    const struct line_map *map = &line_table->maps[line_table->used - 1]; \
    linenum_type line = SOURCE_LINE (map, line_table->highest_line); \
    linemap_line_start ((PFILE)->line_table, line + 1, (COLS_HINT)); \
  } while (0)
74
/* Upper bound on how deeply cpp_buffers may nest.  The limit is a
   compile-time constant, in part for efficiency and in part so that
   runaway recursion is cut short.  */
#define CPP_STACK_MAX 200
78
/* Host alignment handling.  struct dummy puts a union of a double and
   a pointer right after a single char; the offset the compiler gives
   that union is used as the default alignment.  */
struct dummy
{
  char c;
  union
  {
    double d;
    int *p;
  } u;
};

#define DEFAULT_ALIGNMENT offsetof (struct dummy, u)

/* Add ALIGN - 1 to SIZE and clear the bits below ALIGN, which rounds
   SIZE up to a multiple of ALIGN when ALIGN is a power of two.  */
#define CPP_ALIGN2(SIZE, ALIGN) (((SIZE) + ((ALIGN) - 1)) & ~((ALIGN) - 1))

/* CPP_ALIGN2 using the default alignment.  */
#define CPP_ALIGN(SIZE) CPP_ALIGN2 (SIZE, DEFAULT_ALIGNMENT)
93
/* If NODE's type is NT_MACRO and its flags do not include
   NODE_BUILTIN, set the used member of the macro it points to.
   NODE is evaluated more than once.  */
#define _cpp_mark_macro_used(NODE) do {					\
  if ((NODE)->type == NT_MACRO && !((NODE)->flags & NODE_BUILTIN))	\
    (NODE)->value.macro->used = 1;					\
} while (0)
97
/* A generic memory buffer.  Buffers are chained through NEXT; BASE,
   CUR and LIMIT are byte pointers into the buffer (the BUFF_ROOM,
   BUFF_FRONT and BUFF_LIMIT macros read CUR and LIMIT).  */
typedef struct _cpp_buff _cpp_buff;
struct _cpp_buff
{
  struct _cpp_buff *next;
  unsigned char *base;
  unsigned char *cur;
  unsigned char *limit;
};
105
106extern _cpp_buff *_cpp_get_buff (cpp_reader *, size_t);
107extern void _cpp_release_buff (cpp_reader *, _cpp_buff *);
108extern void _cpp_extend_buff (cpp_reader *, _cpp_buff **, size_t);
109extern _cpp_buff *_cpp_append_extend_buff (cpp_reader *, _cpp_buff *, size_t);
110extern void _cpp_free_buff (_cpp_buff *);
111extern unsigned char *_cpp_aligned_alloc (cpp_reader *, size_t);
112extern unsigned char *_cpp_unaligned_alloc (cpp_reader *, size_t);
113
/* BUFF_ROOM is the number of bytes between BUFF's cur and limit
   pointers, as a size_t; the whole expansion is parenthesized so it
   behaves as a single operand in any context (for instance as the
   operand of sizeof).  BUFF_FRONT and BUFF_LIMIT read the cur and
   limit pointers themselves.  BUFF_ROOM evaluates BUFF twice.  */
#define BUFF_ROOM(BUFF) ((size_t) ((BUFF)->limit - (BUFF)->cur))
#define BUFF_FRONT(BUFF) ((BUFF)->cur)
#define BUFF_LIMIT(BUFF) ((BUFF)->limit)
117
/* The kinds of #include.  */
enum include_type
{
  IT_INCLUDE,
  IT_INCLUDE_NEXT,
  IT_IMPORT,
  IT_CMDLINE
};
120
121union utoken
122{
123  const cpp_token *token;
124  const cpp_token **ptoken;
125};
126
127/* A "run" of tokens; part of a chain of runs.  */
128typedef struct tokenrun tokenrun;
129struct tokenrun
130{
131  tokenrun *next, *prev;
132  cpp_token *base, *limit;
133};
134
/* Accessors for the union inside struct cpp_context: FIRST and LAST
   read the iso member, CUR and RLIMIT the trad member.  */
#define FIRST(CTX) ((CTX)->u.iso.first)
#define LAST(CTX) ((CTX)->u.iso.last)
#define CUR(CTX) ((CTX)->u.trad.cur)
#define RLIMIT(CTX) ((CTX)->u.trad.rlimit)
140
141typedef struct cpp_context cpp_context;
142struct cpp_context
143{
144  /* Doubly-linked list.  */
145  cpp_context *next, *prev;
146
147  union
148  {
149    /* For ISO macro expansion.  Contexts other than the base context
150       are contiguous tokens.  e.g. macro expansions, expanded
151       argument tokens.  */
152    struct
153    {
154      union utoken first;
155      union utoken last;
156    } iso;
157
158    /* For traditional macro expansion.  */
159    struct
160    {
161      const unsigned char *cur;
162      const unsigned char *rlimit;
163    } trad;
164  } u;
165
166  /* If non-NULL, a buffer used for storage related to this context.
167     When the context is popped, the buffer is released.  */
168  _cpp_buff *buff;
169
170  /* For a macro context, the macro node, otherwise NULL.  */
171  cpp_hashnode *macro;
172
173  /* True if utoken element is token, else ptoken.  */
174  bool direct_p;
175};
176
/* Flags and counters describing what the lexer is currently doing.  */
struct lexer_state
{
  /* Set when the first token on the line is CPP_HASH.  */
  unsigned char in_directive;

  /* Set while macro arguments are being collected.  */
  unsigned char collecting_args;

  /* Set inside a directive that deals with padding tokens on its own.
     #include relies on this to avoid trouble with computed includes
     and with the spacing between tokens.  */
  unsigned char directive_wants_padding;

  /* Set while a failed conditional group is being skipped.  */
  unsigned char skipping;

  /* Set inside a directive that accepts angle-bracketed headers.  */
  unsigned char angled_headers;

  /* Set inside a #if or #elif directive.  */
  unsigned char in_expression;

  /* Set when comments are to be saved.  Cleared if discard_comments
     is in effect, and in every directive other than #define.  */
  unsigned char save_comments;

  /* Set when __VA_ARGS__ may legitimately be lexed.  */
  unsigned char va_args_ok;

  /* Set when poisoned identifiers may legitimately be lexed.  */
  unsigned char poisoned_ok;

  /* Set to suppress macro expansion.  */
  unsigned char prevent_expansion;

  /* Set while the arguments of a function-like macro are parsed.  */
  unsigned char parsing_args;

  /* Set when prevent_expansion is on solely because the output is
     being thrown away.  */
  unsigned char discarding_output;

  /* Nonzero while part of an expression is not to be evaluated.  */
  unsigned int skip_eval;

  /* Set while a deferred pragma is being handled.  */
  unsigned char in_deferred_pragma;

  /* Set when the deferred pragma being handled permits macro
     expansion.  */
  unsigned char pragma_allow_expansion;
};
228
229/* Special nodes - identifiers with predefined significance.  */
230struct spec_nodes
231{
232  cpp_hashnode *n_defined;		/* defined operator */
233  cpp_hashnode *n_true;			/* C++ keyword true */
234  cpp_hashnode *n_false;		/* C++ keyword false */
235  cpp_hashnode *n__VA_ARGS__;		/* C99 vararg macros */
236};
237
/* A note attached to a position in a cleaned line.  */
typedef struct _cpp_line_note _cpp_line_note;
struct _cpp_line_note
{
  /* The place in the clean line that this note is about.  */
  const unsigned char *pos;

  /* What kind of note this is.  Each of the 9 'from' trigraph
     characters stands for that trigraph, '\\' for an escaped newline,
     ' ' for an escaped newline with intervening space, and 0 for a
     note that has already been dealt with.  Any other value is
     invalid.  */
  unsigned int type;
};
250
251/* Represents the contents of a file cpplib has read in.  */
252struct cpp_buffer
253{
254  const unsigned char *cur;        /* Current location.  */
255  const unsigned char *line_base;  /* Start of current physical line.  */
256  const unsigned char *next_line;  /* Start of to-be-cleaned logical line.  */
257
258  const unsigned char *buf;        /* Entire character buffer.  */
259  const unsigned char *rlimit;     /* Writable byte at end of file.  */
260
261  _cpp_line_note *notes;           /* Array of notes.  */
262  unsigned int cur_note;           /* Next note to process.  */
263  unsigned int notes_used;         /* Number of notes.  */
264  unsigned int notes_cap;          /* Size of allocated array.  */
265
266  struct cpp_buffer *prev;
267
268  /* Pointer into the file table; non-NULL if this is a file buffer.
269     Used for include_next and to record control macros.  */
270  struct _cpp_file *file;
271
272  /* Saved value of __TIMESTAMP__ macro - date and time of last modification
273     of the assotiated file.  */
274  const unsigned char *timestamp;
275
276  /* Value of if_stack at start of this file.
277     Used to prohibit unmatched #endif (etc) in an include file.  */
278  struct if_stack *if_stack;
279
280  /* True if we need to get the next clean line.  */
281  bool need_line;
282
283  /* True if we have already warned about C++ comments in this file.
284     The warning happens only for C89 extended mode with -pedantic on,
285     or for -Wtraditional, and only once per file (otherwise it would
286     be far too noisy).  */
287  unsigned int warned_cplusplus_comments : 1;
288
289  /* True if we don't process trigraphs and escaped newlines.  True
290     for preprocessed input, command line directives, and _Pragma
291     buffers.  */
292  unsigned int from_stage3 : 1;
293
294  /* At EOF, a buffer is automatically popped.  If RETURN_AT_EOF is
295     true, a CPP_EOF token is then returned.  Otherwise, the next
296     token from the enclosing buffer is returned.  */
297  unsigned int return_at_eof : 1;
298
299  /* One for a system header, two for a C system header file that therefore
300     needs to be extern "C" protected in C++, and zero otherwise.  */
301  unsigned char sysp;
302
303  /* The directory of the this buffer's file.  Its NAME member is not
304     allocated, so we don't need to worry about freeing it.  */
305  struct cpp_dir dir;
306
307  /* Descriptor for converting from the input character set to the
308     source character set.  */
309  struct cset_converter input_cset_desc;
310};
311
312/* The list of saved macros by push_macro pragma.  */
313struct def_pragma_macro {
314  /* Chain element to previous saved macro.  */
315  struct def_pragma_macro *next;
316  /* Name of the macro.  */
317  char *name;
318  /* The stored macro content.  */
319  cpp_macro *value;
320};
321
322/* A cpp_reader encapsulates the "state" of a pre-processor run.
323   Applying cpp_get_token repeatedly yields a stream of pre-processor
324   tokens.  Usually, there is only one cpp_reader object active.  */
325struct cpp_reader
326{
327  /* Top of buffer stack.  */
328  cpp_buffer *buffer;
329
330  /* Overlaid buffer (can be different after processing #include).  */
331  cpp_buffer *overlaid_buffer;
332
333  /* Lexer state.  */
334  struct lexer_state state;
335
336  /* Source line tracking.  */
337  struct line_maps *line_table;
338
339  /* The line of the '#' of the current directive.  */
340  source_location directive_line;
341
342  /* Memory buffers.  */
343  _cpp_buff *a_buff;		/* Aligned permanent storage.  */
344  _cpp_buff *u_buff;		/* Unaligned permanent storage.  */
345  _cpp_buff *free_buffs;	/* Free buffer chain.  */
346
347  /* Context stack.  */
348  struct cpp_context base_context;
349  struct cpp_context *context;
350
351  /* If in_directive, the directive if known.  */
352  const struct directive *directive;
353
354  /* Token generated while handling a directive, if any. */
355  cpp_token directive_result;
356
357  /* When expanding a macro at top-level, this is the location of the
358     macro invocation.  */
359  source_location invocation_location;
360
361  /* True if this call to cpp_get_token should consider setting
362     invocation_location.  */
363  bool set_invocation_location;
364
365  /* Search paths for include files.  */
366  struct cpp_dir *quote_include;	/* "" */
367  struct cpp_dir *bracket_include;	/* <> */
368  struct cpp_dir no_search_path;	/* No path.  */
369
370  /* Chain of all hashed _cpp_file instances.  */
371  struct _cpp_file *all_files;
372
373  struct _cpp_file *main_file;
374
375  /* File and directory hash table.  */
376  struct htab *file_hash;
377  struct htab *dir_hash;
378  struct file_hash_entry_pool *file_hash_entries;
379
380  /* Negative path lookup hash table.  */
381  struct htab *nonexistent_file_hash;
382  struct obstack nonexistent_file_ob;
383
384  /* Nonzero means don't look for #include "foo" the source-file
385     directory.  */
386  bool quote_ignores_source_dir;
387
388  /* Nonzero if any file has contained #pragma once or #import has
389     been used.  */
390  bool seen_once_only;
391
392  /* Multiple include optimization.  */
393  const cpp_hashnode *mi_cmacro;
394  const cpp_hashnode *mi_ind_cmacro;
395  bool mi_valid;
396
397  /* Lexing.  */
398  cpp_token *cur_token;
399  tokenrun base_run, *cur_run;
400  unsigned int lookaheads;
401
402  /* Nonzero prevents the lexer from re-using the token runs.  */
403  unsigned int keep_tokens;
404
405  /* Buffer to hold macro definition string.  */
406  unsigned char *macro_buffer;
407  unsigned int macro_buffer_len;
408
409  /* Descriptor for converting from the source character set to the
410     execution character set.  */
411  struct cset_converter narrow_cset_desc;
412
413  /* Descriptor for converting from the source character set to the
414     UTF-8 execution character set.  */
415  struct cset_converter utf8_cset_desc;
416
417  /* Descriptor for converting from the source character set to the
418     UTF-16 execution character set.  */
419  struct cset_converter char16_cset_desc;
420
421  /* Descriptor for converting from the source character set to the
422     UTF-32 execution character set.  */
423  struct cset_converter char32_cset_desc;
424
425  /* Descriptor for converting from the source character set to the
426     wide execution character set.  */
427  struct cset_converter wide_cset_desc;
428
429  /* Date and time text.  Calculated together if either is requested.  */
430  const unsigned char *date;
431  const unsigned char *time;
432
433  /* EOF token, and a token forcing paste avoidance.  */
434  cpp_token avoid_paste;
435  cpp_token eof;
436
437  /* Opaque handle to the dependencies of mkdeps.c.  */
438  struct deps *deps;
439
440  /* Obstack holding all macro hash nodes.  This never shrinks.
441     See identifiers.c */
442  struct obstack hash_ob;
443
444  /* Obstack holding buffer and conditional structures.  This is a
445     real stack.  See directives.c.  */
446  struct obstack buffer_ob;
447
448  /* Pragma table - dynamic, because a library user can add to the
449     list of recognized pragmas.  */
450  struct pragma_entry *pragmas;
451
452  /* Call backs to cpplib client.  */
453  struct cpp_callbacks cb;
454
455  /* Identifier hash table.  */
456  struct ht *hash_table;
457
458  /* Expression parser stack.  */
459  struct op *op_stack, *op_limit;
460
461  /* User visible options.  */
462  struct cpp_options opts;
463
464  /* Special nodes - identifiers with predefined significance to the
465     preprocessor.  */
466  struct spec_nodes spec_nodes;
467
468  /* Whether cpplib owns the hashtable.  */
469  bool our_hashtable;
470
471  /* Traditional preprocessing output buffer (a logical line).  */
472  struct
473  {
474    unsigned char *base;
475    unsigned char *limit;
476    unsigned char *cur;
477    source_location first_line;
478  } out;
479
480  /* Used for buffer overlays by traditional.c.  */
481  const unsigned char *saved_cur, *saved_rlimit, *saved_line_base;
482
483  /* A saved list of the defined macros, for dependency checking
484     of precompiled headers.  */
485  struct cpp_savedstate *savedstate;
486
487  /* Next value of __COUNTER__ macro. */
488  unsigned int counter;
489
490  /* Table of comments, when state.save_comments is true.  */
491  cpp_comment_table comments;
492
493  /* List of saved macros by push_macro.  */
494  struct def_pragma_macro *pushed_macros;
495};
496
/* Character classes, built on the more primitive macros of
   safe-ctype.h.  Should the definition of `numchar' look odd, see the
   definition of a pp-number in the C standard [section 6.4.8 of C99].

   If characters other than \r and \n ever become part of the set
   is_vspace, the macro handle_newline() in lex.c has to be updated
   as well.

   _dollar_ok reads the dollars_in_ident option through a variable
   named pfile, so is_idchar and is_idstart need pfile in scope.  */
#define _dollar_ok(ch)	((ch) == '$' && CPP_OPTION (pfile, dollars_in_ident))

#define is_idchar(ch)	(ISIDNUM(ch) || _dollar_ok(ch))
#define is_numchar(ch)	ISIDNUM(ch)
#define is_idstart(ch)	(ISIDST(ch) || _dollar_ok(ch))
#define is_numstart(ch)	ISDIGIT(ch)
#define is_hspace(ch)	ISBLANK(ch)
#define is_vspace(ch)	IS_VSPACE(ch)
#define is_nvspace(ch)	IS_NVSPACE(ch)
#define is_space(ch)	IS_SPACE_OR_NUL(ch)
514
/* The trigraph map is declared const when it can be initialized at
   compile time, i.e. when cpp was compiled with GCC >=2.7 or with
   another compiler that supports C99; otherwise it is declared
   without const.  */
#if !HAVE_DESIGNATED_INITIALIZERS
extern unsigned char _cpp_trigraph_map[UCHAR_MAX + 1];
#else
extern const unsigned char _cpp_trigraph_map[UCHAR_MAX + 1];
#endif
523
524/* Macros.  */
525
526static inline int cpp_in_system_header (cpp_reader *);
527static inline int
528cpp_in_system_header (cpp_reader *pfile)
529{
530  return pfile->buffer ? pfile->buffer->sysp : 0;
531}
/* Shorthands for the pedantic and warn_traditional options of
   READER.  */
#define CPP_PEDANTIC(READER) CPP_OPTION (READER, pedantic)
#define CPP_WTRADITIONAL(READER) CPP_OPTION (READER, warn_traditional)
534
535static inline int cpp_in_primary_file (cpp_reader *);
536static inline int
537cpp_in_primary_file (cpp_reader *pfile)
538{
539  return pfile->line_table->depth == 1;
540}
541
542/* In macro.c */
543extern void _cpp_free_definition (cpp_hashnode *);
544extern bool _cpp_create_definition (cpp_reader *, cpp_hashnode *);
545extern void _cpp_pop_context (cpp_reader *);
546extern void _cpp_push_text_context (cpp_reader *, cpp_hashnode *,
547				    const unsigned char *, size_t);
548extern bool _cpp_save_parameter (cpp_reader *, cpp_macro *, cpp_hashnode *);
549extern bool _cpp_arguments_ok (cpp_reader *, cpp_macro *, const cpp_hashnode *,
550			       unsigned int);
551extern const unsigned char *_cpp_builtin_macro_text (cpp_reader *,
552						     cpp_hashnode *);
553extern int _cpp_warn_if_unused_macro (cpp_reader *, cpp_hashnode *, void *);
554extern void _cpp_push_token_context (cpp_reader *, cpp_hashnode *,
555				     const cpp_token *, unsigned int);
556extern void _cpp_backup_tokens_direct (cpp_reader *, unsigned int);
557
558/* In identifiers.c */
559extern void _cpp_init_hashtable (cpp_reader *, hash_table *);
560extern void _cpp_destroy_hashtable (cpp_reader *);
561
562/* In files.c */
563typedef struct _cpp_file _cpp_file;
564extern _cpp_file *_cpp_find_file (cpp_reader *, const char *, cpp_dir *,
565				  bool, int);
566extern bool _cpp_find_failed (_cpp_file *);
567extern void _cpp_mark_file_once_only (cpp_reader *, struct _cpp_file *);
568extern void _cpp_fake_include (cpp_reader *, const char *);
569extern bool _cpp_stack_file (cpp_reader *, _cpp_file*, bool);
570extern bool _cpp_stack_include (cpp_reader *, const char *, int,
571				enum include_type);
572extern int _cpp_compare_file_date (cpp_reader *, const char *, int);
573extern void _cpp_report_missing_guards (cpp_reader *);
574extern void _cpp_init_files (cpp_reader *);
575extern void _cpp_cleanup_files (cpp_reader *);
576extern void _cpp_pop_file_buffer (cpp_reader *, struct _cpp_file *);
577extern bool _cpp_save_file_entries (cpp_reader *pfile, FILE *f);
578extern bool _cpp_read_file_entries (cpp_reader *, FILE *);
579extern struct stat *_cpp_get_file_stat (_cpp_file *);
580
581/* In expr.c */
582extern bool _cpp_parse_expr (cpp_reader *, bool);
583extern struct op *_cpp_expand_op_stack (cpp_reader *);
584
585/* In lex.c */
586extern void _cpp_process_line_notes (cpp_reader *, int);
587extern void _cpp_clean_line (cpp_reader *);
588extern bool _cpp_get_fresh_line (cpp_reader *);
589extern bool _cpp_skip_block_comment (cpp_reader *);
590extern cpp_token *_cpp_temp_token (cpp_reader *);
591extern const cpp_token *_cpp_lex_token (cpp_reader *);
592extern cpp_token *_cpp_lex_direct (cpp_reader *);
593extern int _cpp_equiv_tokens (const cpp_token *, const cpp_token *);
594extern void _cpp_init_tokenrun (tokenrun *, unsigned int);
595extern cpp_hashnode *_cpp_lex_identifier (cpp_reader *, const char *);
596
597/* In init.c.  */
598extern void _cpp_maybe_push_include_file (cpp_reader *);
599extern const char *cpp_named_operator2name (enum cpp_ttype type);
600
601/* In directives.c */
602extern int _cpp_test_assertion (cpp_reader *, unsigned int *);
603extern int _cpp_handle_directive (cpp_reader *, int);
604extern void _cpp_define_builtin (cpp_reader *, const char *);
605extern char ** _cpp_save_pragma_names (cpp_reader *);
606extern void _cpp_restore_pragma_names (cpp_reader *, char **);
607extern int _cpp_do__Pragma (cpp_reader *);
608extern void _cpp_init_directives (cpp_reader *);
609extern void _cpp_init_internal_pragmas (cpp_reader *);
610extern void _cpp_do_file_change (cpp_reader *, enum lc_reason, const char *,
611				 linenum_type, unsigned int);
612extern void _cpp_pop_buffer (cpp_reader *);
613
614/* In directives.c */
615struct _cpp_dir_only_callbacks
616{
617  /* Called to print a block of lines. */
618  void (*print_lines) (int, const void *, size_t);
619  void (*maybe_print_line) (source_location);
620};
621
622extern void _cpp_preprocess_dir_only (cpp_reader *,
623				      const struct _cpp_dir_only_callbacks *);
624
625/* In traditional.c.  */
626extern bool _cpp_scan_out_logical_line (cpp_reader *, cpp_macro *);
627extern bool _cpp_read_logical_line_trad (cpp_reader *);
628extern void _cpp_overlay_buffer (cpp_reader *pfile, const unsigned char *,
629				 size_t);
630extern void _cpp_remove_overlay (cpp_reader *);
631extern bool _cpp_create_trad_definition (cpp_reader *, cpp_macro *);
632extern bool _cpp_expansions_different_trad (const cpp_macro *,
633					    const cpp_macro *);
634extern unsigned char *_cpp_copy_replacement_text (const cpp_macro *,
635						  unsigned char *);
636extern size_t _cpp_replacement_text_len (const cpp_macro *);
637
638/* In charset.c.  */
639
640/* The normalization state at this point in the sequence.
641   It starts initialized to all zeros, and at the end
642   'level' is the normalization level of the sequence.  */
643
644struct normalize_state
645{
646  /* The previous character.  */
647  cppchar_t previous;
648  /* The combining class of the previous character.  */
649  unsigned char prev_class;
650  /* The lowest normalization level so far.  */
651  enum cpp_normalize_level level;
652};
653#define INITIAL_NORMALIZE_STATE { 0, 0, normalized_KC }
654#define NORMALIZE_STATE_RESULT(st) ((st)->level)
655
656/* We saw a character that matches ISIDNUM(), update a
657   normalize_state appropriately.  */
658#define NORMALIZE_STATE_UPDATE_IDNUM(st) \
659  ((st)->previous = 0, (st)->prev_class = 0)
660
661extern cppchar_t _cpp_valid_ucn (cpp_reader *, const unsigned char **,
662				 const unsigned char *, int,
663				 struct normalize_state *state);
664extern void _cpp_destroy_iconv (cpp_reader *);
665extern unsigned char *_cpp_convert_input (cpp_reader *, const char *,
666					  unsigned char *, size_t, size_t,
667					  const unsigned char **, off_t *);
668extern const char *_cpp_default_encoding (void);
669extern cpp_hashnode * _cpp_interpret_identifier (cpp_reader *pfile,
670						 const unsigned char *id,
671						 size_t len);
672
/* Utility routines and macros.  */

/* Expand to two comma-separated expressions: STR cast to a pointer
   to const unsigned char, and sizeof STR minus one.  For a string
   literal or char array the second value is its length without the
   terminating NUL.  STR is parenthesized in both places so the cast
   and sizeof always apply to the whole argument.  */
#define DSC(str) (const unsigned char *)(str), sizeof (str) - 1
675
/* The helpers below are inline functions and not macros so that
   their arguments are type checked.  */
static inline int ustrcmp (const unsigned char *, const unsigned char *);
static inline int ustrncmp (const unsigned char *, const unsigned char *,
			    size_t);

/* The second parameter is a const char because it is usually a
   literal.  */
static inline int ustrcspn (const unsigned char *, const char *);

static inline size_t ustrlen (const unsigned char *);
static inline unsigned char *uxstrdup (const unsigned char *);
static inline unsigned char *ustrchr (const unsigned char *, int);
static inline int ufputs (const unsigned char *, FILE *);
688
/* strcmp for unsigned char strings: compare S1 with S2 and return
   what strcmp returns.  */
static inline int
ustrcmp (const unsigned char *s1, const unsigned char *s2)
{
  const char *lhs = (const char *) s1;
  const char *rhs = (const char *) s2;

  return strcmp (lhs, rhs);
}
694
/* strncmp for unsigned char strings: compare at most N characters of
   S1 and S2 and return what strncmp returns.  */
static inline int
ustrncmp (const unsigned char *s1, const unsigned char *s2, size_t n)
{
  const char *lhs = (const char *) s1;
  const char *rhs = (const char *) s2;

  return strncmp (lhs, rhs, n);
}
700
/* strcspn for an unsigned char string S1 against the reject set S2.
   The size_t produced by strcspn is converted to the int return
   type.  */
static inline int
ustrcspn (const unsigned char *s1, const char *s2)
{
  size_t span = strcspn ((const char *) s1, s2);

  return span;
}
706
/* strlen for an unsigned char string.  */
static inline size_t
ustrlen (const unsigned char *s1)
{
  const char *text = (const char *) s1;

  return strlen (text);
}
712
/* xstrdup for an unsigned char string: pass S1 to xstrdup and return
   its result as an unsigned char pointer.  */
static inline unsigned char *
uxstrdup (const unsigned char *s1)
{
  char *copy = xstrdup ((const char *) s1);

  return (unsigned char *) copy;
}
718
/* strchr for an unsigned char string: look for C in S1 and return
   strchr's result as a pointer to (non-const) unsigned char.  */
static inline unsigned char *
ustrchr (const unsigned char *s1, int c)
{
  char *hit = strchr ((const char *) s1, c);

  return (unsigned char *) hit;
}
724
/* fputs for an unsigned char string: write S to F and return what
   fputs returns.  */
static inline int
ufputs (const unsigned char *s, FILE *f)
{
  const char *text = (const char *) s;

  return fputs (text, f);
}
730
731#ifdef __cplusplus
732}
733#endif
734
735#endif /* ! LIBCPP_INTERNAL_H */
736