gcclibs/libcpp/lex.c

169695Skan/* CPP Library - lexical analysis.
169695Skan   Copyright (C) 2000, 2001, 2002, 2003, 2004, 2005 Free Software Foundation, Inc.
169695Skan   Contributed by Per Bothner, 1994-95.
169695Skan   Based on CCCP program by Paul Rubin, June 1986
169695Skan   Adapted to ANSI C, Richard Stallman, Jan 1987
169695Skan   Broken out to separate file, Zack Weinberg, Mar 2000
169695Skan
169695SkanThis program is free software; you can redistribute it and/or modify it
169695Skanunder the terms of the GNU General Public License as published by the
169695SkanFree Software Foundation; either version 2, or (at your option) any
169695Skanlater version.
169695Skan
169695SkanThis program is distributed in the hope that it will be useful,
169695Skanbut WITHOUT ANY WARRANTY; without even the implied warranty of
169695SkanMERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
169695SkanGNU General Public License for more details.
169695Skan
169695SkanYou should have received a copy of the GNU General Public License
169695Skanalong with this program; if not, write to the Free Software
169695SkanFoundation, 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.  */
169695Skan
169695Skan#include "config.h"
169695Skan#include "system.h"
169695Skan#include "cpplib.h"
169695Skan#include "internal.h"
169695Skan
169695Skanenum spell_type	/* Spelling category stored for each token type in the
169695Skan			   token_spellings table.  */
169695Skan{
169695Skan  SPELL_OPERATOR = 0,	/* Given to every OP() entry of TTYPE_TABLE; the
169695Skan			   entry's name field is the operator's text.  */
169695Skan  SPELL_IDENT,		/* This and the two values below are selected by
169695Skan			   TK() entries, which paste SPELL_ onto their
169695Skan			   second argument.  */
169695Skan  SPELL_LITERAL,
169695Skan  SPELL_NONE
169695Skan};
169695Skan
169695Skanstruct token_spelling	/* One row of the token_spellings table.  */
169695Skan{
169695Skan  enum spell_type category;	/* Read through TOKEN_SPELL.  */
169695Skan  const unsigned char *name;	/* Read through TOKEN_NAME.  */
169695Skan};
169695Skan
169695Skanstatic const unsigned char *const digraph_spellings[] =	/* Spellings of the digraph tokens; the code that
169695Skan								   indexes this array is outside this part of
169695Skan								   the file.  */
169695Skan{ U"%:", U"%:%:", U"<:", U":>", U"<%", U"%>" };
169695Skan
169695Skan#define OP(e, s) { SPELL_OPERATOR, U s  },	/* Operator row: category SPELL_OPERATOR, name S.  */
169695Skan#define TK(e, s) { SPELL_ ## s,    U #e },	/* Other row: category SPELL_<S>, name is E stringified.  */
169695Skanstatic const struct token_spelling token_spellings[N_TTYPES] = { TTYPE_TABLE };	/* One row per TTYPE_TABLE entry.  */
169695Skan#undef OP
169695Skan#undef TK
169695Skan
169695Skan#define TOKEN_SPELL(token) (token_spellings[(token)->type].category)	/* Category for TOKEN's type.  */
169695Skan#define TOKEN_NAME(token) (token_spellings[(token)->type].name)	/* Table name for TOKEN's type.  */
169695Skan
169695Skanstatic void add_line_note (cpp_buffer *, const uchar *, unsigned int);
169695Skanstatic int skip_line_comment (cpp_reader *);
169695Skanstatic void skip_whitespace (cpp_reader *, cppchar_t);
169695Skanstatic void lex_string (cpp_reader *, cpp_token *, const uchar *);
169695Skanstatic void save_comment (cpp_reader *, cpp_token *, const uchar *, cppchar_t);
169695Skanstatic void create_literal (cpp_reader *, cpp_token *, const uchar *,
169695Skan			    unsigned int, enum cpp_ttype);
169695Skanstatic bool warn_in_comment (cpp_reader *, _cpp_line_note *);
169695Skanstatic int name_p (cpp_reader *, const cpp_string *);
169695Skanstatic tokenrun *next_tokenrun (tokenrun *);
169695Skan
169695Skanstatic _cpp_buff *new_buff (size_t);
169695Skan
169695Skan
169695Skan/* Utility routine:
169695Skan
169695Skan   Compares, the token TOKEN to the NUL-terminated string STRING.
169695Skan   TOKEN must be a CPP_NAME.  Returns 1 for equal, 0 for unequal.  */
169695Skanint
169695Skancpp_ideq (const cpp_token *token, const char *string)
169695Skan{
169695Skan  if (token->type != CPP_NAME)
169695Skan    return 0;
169695Skan
169695Skan  return !ustrcmp (NODE_NAME (token->val.node), (const uchar *) string);
169695Skan}
169695Skan
169695Skan/* Record a note TYPE at byte POS into the current cleaned logical
169695Skan   line.  */
169695Skanstatic void
169695Skanadd_line_note (cpp_buffer *buffer, const uchar *pos, unsigned int type)
169695Skan{
169695Skan  if (buffer->notes_used == buffer->notes_cap)
169695Skan    {
169695Skan      buffer->notes_cap = buffer->notes_cap * 2 + 200;
169695Skan      buffer->notes = XRESIZEVEC (_cpp_line_note, buffer->notes,
169695Skan                                  buffer->notes_cap);
169695Skan    }
169695Skan
169695Skan  buffer->notes[buffer->notes_used].pos = pos;
169695Skan  buffer->notes[buffer->notes_used].type = type;
169695Skan  buffer->notes_used++;
169695Skan}
169695Skan
169695Skan/* Returns with a logical line that contains no escaped newlines or
169695Skan   trigraphs.  This is a time-critical inner loop.
169695Skan
169695Skan   The physical line(s) starting at buffer->next_line are rewritten in
169695Skan   place.  A note is recorded through add_line_note for every escaped
169695Skan   newline and for every trigraph; a trigraph is only replaced when
169695Skan   the trigraphs option is set.  On return buffer->cur and
169695Skan   buffer->line_base point at the start of the cleaned line, the line
169695Skan   ends in a single '\n' followed by a sentinel note, and
169695Skan   buffer->next_line points just past the line ending that was
169695Skan   consumed.  For buffers marked from_stage3 only the line ending is
169695Skan   located.  */
169695Skanvoid
169695Skan_cpp_clean_line (cpp_reader *pfile)
169695Skan{
169695Skan  cpp_buffer *buffer;
169695Skan  const uchar *s;	/* Read position.  */
169695Skan  uchar c, *d, *p;	/* D is the write position; P walks backwards from
169695Skan			   a line ending looking for a backslash.  */
169695Skan
169695Skan  buffer = pfile->buffer;
169695Skan  buffer->cur_note = buffer->notes_used = 0;	/* Drop the previous line's notes.  */
169695Skan  buffer->cur = buffer->line_base = buffer->next_line;
169695Skan  buffer->need_line = false;
169695Skan  s = buffer->next_line - 1;	/* Every loop below pre-increments S.  */
169695Skan
169695Skan  if (!buffer->from_stage3)
169695Skan    {
169695Skan      /* Short circuit for the common case of an un-escaped line with
169695Skan	 no trigraphs.  The primary win here is by not writing any
169695Skan	 data back to memory until we have to.  */
169695Skan      for (;;)
169695Skan	{
169695Skan	  c = *++s;
169695Skan	  if (c == '\n' || c == '\r')
169695Skan	    {
169695Skan	      d = (uchar *) s;
169695Skan
169695Skan	      if (s == buffer->rlimit)	/* Line ending sits at the buffer limit.  */
169695Skan		goto done;
169695Skan
169695Skan	      /* DOS line ending? */
169695Skan	      if (c == '\r' && s[1] == '\n')
169695Skan		s++;
169695Skan
169695Skan	      if (s == buffer->rlimit)
169695Skan		goto done;
169695Skan
169695Skan	      /* check for escaped newline: step back over any horizontal
169695Skan		 white space in front of the line ending, but never past
169695Skan		 the start of the line, and see whether a backslash
169695Skan		 precedes it.  */
169695Skan	      p = d;
169695Skan	      while (p != buffer->next_line && is_nvspace (p[-1]))
169695Skan		p--;
169695Skan	      if (p == buffer->next_line || p[-1] != '\\')
169695Skan		goto done;
169695Skan
169695Skan	      /* Have an escaped newline; process it and proceed to
169695Skan		 the slow path.  The note type is ' ' when white space
169695Skan		 was stepped over above, '\\' otherwise.  */
169695Skan	      add_line_note (buffer, p - 1, p != d ? ' ' : '\\');
169695Skan	      d = p - 2;	/* The slow path pre-increments D, so its first
169695Skan			   store overwrites the backslash.  */
169695Skan	      buffer->next_line = p - 1;	/* Lower bound for later backward
169695Skan					   scans; reset at `done'.  */
169695Skan	      break;
169695Skan	    }
169695Skan	  if (c == '?' && s[1] == '?' && _cpp_trigraph_map[s[2]])
169695Skan	    {
169695Skan	      /* Have a trigraph.  We may or may not have to convert
169695Skan		 it.  Add a line note regardless, for -Wtrigraphs.  */
169695Skan	      add_line_note (buffer, s, s[2]);
169695Skan	      if (CPP_OPTION (pfile, trigraphs))
169695Skan		{
169695Skan		  /* We do, and that means we have to switch to the
169695Skan		     slow path.  The first '?' is overwritten with the
169695Skan		     replacement and S skips the other two characters.  */
169695Skan		  d = (uchar *) s;
169695Skan		  *d = _cpp_trigraph_map[s[2]];
169695Skan		  s += 2;
169695Skan		  break;
169695Skan		}
169695Skan	    }
169695Skan	}
169695Skan
169695Skan
169695Skan      for (;;)	/* Slow path: copy from S down to D, which now lags behind.  */
169695Skan	{
169695Skan	  c = *++s;
169695Skan	  *++d = c;
169695Skan
169695Skan	  if (c == '\n' || c == '\r')
169695Skan	    {
169695Skan		  /* Handle DOS line endings.  */
169695Skan	      if (c == '\r' && s != buffer->rlimit && s[1] == '\n')
169695Skan		s++;
169695Skan	      if (s == buffer->rlimit)
169695Skan		break;
169695Skan
169695Skan	      /* Escaped?  Same backward scan as in the fast path, but
169695Skan		 over the already cleaned text ending at D.  */
169695Skan	      p = d;
169695Skan	      while (p != buffer->next_line && is_nvspace (p[-1]))
169695Skan		p--;
169695Skan	      if (p == buffer->next_line || p[-1] != '\\')
169695Skan		break;
169695Skan
169695Skan	      add_line_note (buffer, p - 1, p != d ? ' ': '\\');
169695Skan	      d = p - 2;
169695Skan	      buffer->next_line = p - 1;
169695Skan	    }
169695Skan	  else if (c == '?' && s[1] == '?' && _cpp_trigraph_map[s[2]])
169695Skan	    {
169695Skan	      /* Add a note regardless, for the benefit of -Wtrigraphs.
169695Skan		 The note position is D, i.e. in the cleaned text.  */
169695Skan	      add_line_note (buffer, d, s[2]);
169695Skan	      if (CPP_OPTION (pfile, trigraphs))
169695Skan		{
169695Skan		  *d = _cpp_trigraph_map[s[2]];
169695Skan		  s += 2;
169695Skan		}
169695Skan	    }
169695Skan	}
169695Skan    }
169695Skan  else
169695Skan    {
169695Skan      do	/* No cleaning here: just find the line ending.  */
169695Skan	s++;
169695Skan      while (*s != '\n' && *s != '\r');
169695Skan      d = (uchar *) s;
169695Skan
169695Skan      /* Handle DOS line endings.  */
169695Skan      if (*s == '\r' && s != buffer->rlimit && s[1] == '\n')
169695Skan	s++;
169695Skan    }
169695Skan
169695Skan done:
169695Skan  *d = '\n';	/* Whatever ended the line, the cleaned line ends in '\n'.  */
169695Skan  /* A sentinel note that should never be processed.  */
169695Skan  add_line_note (buffer, d + 1, '\n');
169695Skan  buffer->next_line = s + 1;
169695Skan}
169695Skan
169695Skan/* Return true if the trigraph indicated by NOTE should be warned
169695Skan   about in a comment.  */
169695Skanstatic bool
169695Skanwarn_in_comment (cpp_reader *pfile, _cpp_line_note *note)
169695Skan{
169695Skan  const uchar *p;
169695Skan
169695Skan  /* Within comments we don't warn about trigraphs, unless the
169695Skan     trigraph forms an escaped newline, as that may change
169695Skan     behavior.  */
169695Skan  if (note->type != '/')
169695Skan    return false;
169695Skan
169695Skan  /* If -trigraphs, then this was an escaped newline iff the next note
169695Skan     is coincident.  */
169695Skan  if (CPP_OPTION (pfile, trigraphs))
169695Skan    return note[1].pos == note->pos;
169695Skan
169695Skan  /* Otherwise, see if this forms an escaped newline.  */
169695Skan  p = note->pos + 3;
169695Skan  while (is_nvspace (*p))
169695Skan    p++;
169695Skan
169695Skan  /* There might have been escaped newlines between the trigraph and the
169695Skan     newline we found.  Hence the position test.  */
169695Skan  return (*p == '\n' && p < note[1].pos);
169695Skan}
169695Skan
169695Skan/* Process the notes created by add_line_note as far as the current
169695Skan   location.  */
169695Skanvoid
169695Skan_cpp_process_line_notes (cpp_reader *pfile, int in_comment)
169695Skan{
169695Skan  cpp_buffer *buffer = pfile->buffer;
169695Skan
169695Skan  for (;;)
169695Skan    {
169695Skan      _cpp_line_note *note = &buffer->notes[buffer->cur_note];
169695Skan      unsigned int col;
169695Skan
169695Skan      if (note->pos > buffer->cur)
169695Skan	break;
169695Skan
169695Skan      buffer->cur_note++;
169695Skan      col = CPP_BUF_COLUMN (buffer, note->pos + 1);
169695Skan
169695Skan      if (note->type == '\\' || note->type == ' ')
169695Skan	{
169695Skan	  if (note->type == ' ' && !in_comment)
169695Skan	    cpp_error_with_line (pfile, CPP_DL_WARNING, pfile->line_table->highest_line, col,
169695Skan				 "backslash and newline separated by space");
169695Skan
169695Skan	  if (buffer->next_line > buffer->rlimit)
169695Skan	    {
169695Skan	      cpp_error_with_line (pfile, CPP_DL_PEDWARN, pfile->line_table->highest_line, col,
169695Skan				   "backslash-newline at end of file");
169695Skan	      /* Prevent "no newline at end of file" warning.  */
169695Skan	      buffer->next_line = buffer->rlimit;
169695Skan	    }
169695Skan
169695Skan	  buffer->line_base = note->pos;
169695Skan	  CPP_INCREMENT_LINE (pfile, 0);
169695Skan	}
169695Skan      else if (_cpp_trigraph_map[note->type])
169695Skan	{
169695Skan	  if (CPP_OPTION (pfile, warn_trigraphs)
169695Skan	      && (!in_comment || warn_in_comment (pfile, note)))
169695Skan	    {
169695Skan	      if (CPP_OPTION (pfile, trigraphs))
169695Skan		cpp_error_with_line (pfile, CPP_DL_WARNING, pfile->line_table->highest_line, col,
169695Skan				     "trigraph ??%c converted to %c",
169695Skan				     note->type,
169695Skan				     (int) _cpp_trigraph_map[note->type]);
169695Skan	      else
169695Skan		{
169695Skan		  cpp_error_with_line
169695Skan		    (pfile, CPP_DL_WARNING, pfile->line_table->highest_line, col,
169695Skan		     "trigraph ??%c ignored, use -trigraphs to enable",
169695Skan		     note->type);
169695Skan		}
169695Skan	    }
169695Skan	}
169695Skan      else
169695Skan	abort ();
169695Skan    }
169695Skan}
169695Skan
169695Skan/* Skip a C-style block comment.  We find the end of the comment by
169695Skan   seeing if an asterisk is before every '/' we encounter.  Returns
169695Skan   nonzero if comment terminated by EOF, zero otherwise.
169695Skan
169695Skan   Buffer->cur points to the initial asterisk of the comment.  */
169695Skanbool
169695Skan_cpp_skip_block_comment (cpp_reader *pfile)
169695Skan{
169695Skan  cpp_buffer *buffer = pfile->buffer;
169695Skan  const uchar *cur = buffer->cur;
169695Skan  uchar c;
169695Skan
169695Skan  cur++;
169695Skan  if (*cur == '/')
169695Skan    cur++;
169695Skan
169695Skan  for (;;)
169695Skan    {
169695Skan      /* People like decorating comments with '*', so check for '/'
169695Skan	 instead for efficiency.  */
169695Skan      c = *cur++;
169695Skan
169695Skan      if (c == '/')
169695Skan	{
169695Skan	  if (cur[-2] == '*')
169695Skan	    break;
169695Skan
169695Skan	  /* Warn about potential nested comments, but not if the '/'
169695Skan	     comes immediately before the true comment delimiter.
169695Skan	     Don't bother to get it right across escaped newlines.  */
169695Skan	  if (CPP_OPTION (pfile, warn_comments)
169695Skan	      && cur[0] == '*' && cur[1] != '/')
169695Skan	    {
169695Skan	      buffer->cur = cur;
169695Skan	      cpp_error_with_line (pfile, CPP_DL_WARNING,
169695Skan				   pfile->line_table->highest_line, CPP_BUF_COL (buffer),
169695Skan				   "\"/*\" within comment");
169695Skan	    }
169695Skan	}
169695Skan      else if (c == '\n')
169695Skan	{
169695Skan	  unsigned int cols;
169695Skan	  buffer->cur = cur - 1;
169695Skan	  _cpp_process_line_notes (pfile, true);
169695Skan	  if (buffer->next_line >= buffer->rlimit)
169695Skan	    return true;
169695Skan	  _cpp_clean_line (pfile);
169695Skan
169695Skan	  cols = buffer->next_line - buffer->line_base;
169695Skan	  CPP_INCREMENT_LINE (pfile, cols);
169695Skan
169695Skan	  cur = buffer->cur;
169695Skan	}
169695Skan    }
169695Skan
169695Skan  buffer->cur = cur;
169695Skan  _cpp_process_line_notes (pfile, true);
169695Skan  return false;
169695Skan}
169695Skan
169695Skan/* Skip a C++ line comment, leaving buffer->cur pointing to the
169695Skan   terminating newline.  Handles escaped newlines.  Returns nonzero
169695Skan   if a multiline comment.  */
169695Skanstatic int
169695Skanskip_line_comment (cpp_reader *pfile)
169695Skan{
169695Skan  cpp_buffer *buffer = pfile->buffer;
169695Skan  unsigned int orig_line = pfile->line_table->highest_line;
169695Skan
169695Skan  while (*buffer->cur != '\n')
169695Skan    buffer->cur++;
169695Skan
169695Skan  _cpp_process_line_notes (pfile, true);
169695Skan  return orig_line != pfile->line_table->highest_line;
169695Skan}
169695Skan
169695Skan/* Skips whitespace, saving the next non-whitespace character.  */
169695Skanstatic void
169695Skanskip_whitespace (cpp_reader *pfile, cppchar_t c)
169695Skan{
169695Skan  cpp_buffer *buffer = pfile->buffer;
169695Skan  bool saw_NUL = false;
169695Skan
169695Skan  do
169695Skan    {
169695Skan      /* Horizontal space always OK.  */
169695Skan      if (c == ' ' || c == '\t')
169695Skan	;
169695Skan      /* Just \f \v or \0 left.  */
169695Skan      else if (c == '\0')
169695Skan	saw_NUL = true;
169695Skan      else if (pfile->state.in_directive && CPP_PEDANTIC (pfile))
169695Skan	cpp_error_with_line (pfile, CPP_DL_PEDWARN, pfile->line_table->highest_line,
169695Skan			     CPP_BUF_COL (buffer),
169695Skan			     "%s in preprocessing directive",
169695Skan			     c == '\f' ? "form feed" : "vertical tab");
169695Skan
169695Skan      c = *buffer->cur++;
169695Skan    }
169695Skan  /* We only want non-vertical space, i.e. ' ' \t \f \v \0.  */
169695Skan  while (is_nvspace (c));
169695Skan
169695Skan  if (saw_NUL)
169695Skan    cpp_error (pfile, CPP_DL_WARNING, "null character(s) ignored");
169695Skan
169695Skan  buffer->cur--;
169695Skan}
169695Skan
169695Skan/* See if the characters of a number token are valid in a name (no
169695Skan   '.', '+' or '-').  */
169695Skanstatic int
169695Skanname_p (cpp_reader *pfile, const cpp_string *string)
169695Skan{
169695Skan  unsigned int i;
169695Skan
169695Skan  for (i = 0; i < string->len; i++)
169695Skan    if (!is_idchar (string->text[i]))
169695Skan      return 0;
169695Skan
169695Skan  return 1;
169695Skan}
169695Skan
169695Skan/* After parsing an identifier or other sequence, produce a warning about
169695Skan   sequences not in NFC/NFKC.  */
169695Skanstatic void
169695Skanwarn_about_normalization (cpp_reader *pfile,
169695Skan			  const cpp_token *token,
169695Skan			  const struct normalize_state *s)
169695Skan{
169695Skan  if (CPP_OPTION (pfile, warn_normalize) < NORMALIZE_STATE_RESULT (s)
169695Skan      && !pfile->state.skipping)
169695Skan    {
169695Skan      /* Make sure that the token is printed using UCNs, even
169695Skan	 if we'd otherwise happily print UTF-8.  */
169695Skan      unsigned char *buf = XNEWVEC (unsigned char, cpp_token_len (token));
169695Skan      size_t sz;
169695Skan
169695Skan      sz = cpp_spell_token (pfile, token, buf, false) - buf;
169695Skan      if (NORMALIZE_STATE_RESULT (s) == normalized_C)
169695Skan	cpp_error_with_line (pfile, CPP_DL_WARNING, token->src_loc, 0,
169695Skan			     "`%.*s' is not in NFKC", (int) sz, buf);
169695Skan      else
169695Skan	cpp_error_with_line (pfile, CPP_DL_WARNING, token->src_loc, 0,
169695Skan			     "`%.*s' is not in NFC", (int) sz, buf);
169695Skan    }
169695Skan}
169695Skan
169695Skan/* Returns TRUE if the sequence starting at buffer->cur is invalid in
169695Skan   an identifier.  FIRST is TRUE if this starts an identifier.  */
169695Skanstatic bool
169695Skanforms_identifier_p (cpp_reader *pfile, int first,
169695Skan		    struct normalize_state *state)
169695Skan{
169695Skan  cpp_buffer *buffer = pfile->buffer;
169695Skan
169695Skan  if (*buffer->cur == '$')
169695Skan    {
169695Skan      if (!CPP_OPTION (pfile, dollars_in_ident))
169695Skan	return false;
169695Skan
169695Skan      buffer->cur++;
169695Skan      if (CPP_OPTION (pfile, warn_dollars) && !pfile->state.skipping)
169695Skan	{
169695Skan	  CPP_OPTION (pfile, warn_dollars) = 0;
169695Skan	  cpp_error (pfile, CPP_DL_PEDWARN, "'$' in identifier or number");
169695Skan	}
169695Skan
169695Skan      return true;
169695Skan    }
169695Skan
169695Skan  /* Is this a syntactically valid UCN?  */
169695Skan  if (CPP_OPTION (pfile, extended_identifiers)
169695Skan      && *buffer->cur == '\\'
169695Skan      && (buffer->cur[1] == 'u' || buffer->cur[1] == 'U'))
169695Skan    {
169695Skan      buffer->cur += 2;
169695Skan      if (_cpp_valid_ucn (pfile, &buffer->cur, buffer->rlimit, 1 + !first,
169695Skan			  state))
169695Skan	return true;
169695Skan      buffer->cur -= 2;
169695Skan    }
169695Skan
169695Skan  return false;
169695Skan}
169695Skan
169695Skan/* Lex an identifier starting at BUFFER->CUR - 1.  */
169695Skanstatic cpp_hashnode *
169695Skanlex_identifier (cpp_reader *pfile, const uchar *base, bool starts_ucn,
169695Skan		struct normalize_state *nst)
169695Skan{
169695Skan  cpp_hashnode *result;
169695Skan  const uchar *cur;
169695Skan  unsigned int len;
169695Skan  unsigned int hash = HT_HASHSTEP (0, *base);
169695Skan
169695Skan  cur = pfile->buffer->cur;
169695Skan  if (! starts_ucn)
169695Skan    while (ISIDNUM (*cur))
169695Skan      {
169695Skan	hash = HT_HASHSTEP (hash, *cur);
169695Skan	cur++;
169695Skan      }
169695Skan  pfile->buffer->cur = cur;
169695Skan  if (starts_ucn || forms_identifier_p (pfile, false, nst))
169695Skan    {
169695Skan      /* Slower version for identifiers containing UCNs (or $).  */
169695Skan      do {
169695Skan	while (ISIDNUM (*pfile->buffer->cur))
169695Skan	  {
169695Skan	    pfile->buffer->cur++;
169695Skan	    NORMALIZE_STATE_UPDATE_IDNUM (nst);
169695Skan	  }
169695Skan      } while (forms_identifier_p (pfile, false, nst));
169695Skan      result = _cpp_interpret_identifier (pfile, base,
169695Skan					  pfile->buffer->cur - base);
169695Skan    }
169695Skan  else
169695Skan    {
169695Skan      len = cur - base;
169695Skan      hash = HT_HASHFINISH (hash, len);
169695Skan
169695Skan      result = (cpp_hashnode *)
169695Skan	ht_lookup_with_hash (pfile->hash_table, base, len, hash, HT_ALLOC);
169695Skan    }
169695Skan
169695Skan  /* Rarely, identifiers require diagnostics when lexed.  */
169695Skan  if (__builtin_expect ((result->flags & NODE_DIAGNOSTIC)
169695Skan			&& !pfile->state.skipping, 0))
169695Skan    {
169695Skan      /* It is allowed to poison the same identifier twice.  */
169695Skan      if ((result->flags & NODE_POISONED) && !pfile->state.poisoned_ok)
169695Skan	cpp_error (pfile, CPP_DL_ERROR, "attempt to use poisoned \"%s\"",
169695Skan		   NODE_NAME (result));
169695Skan
169695Skan      /* Constraint 6.10.3.5: __VA_ARGS__ should only appear in the
169695Skan	 replacement list of a variadic macro.  */
169695Skan      if (result == pfile->spec_nodes.n__VA_ARGS__
169695Skan	  && !pfile->state.va_args_ok)
169695Skan	cpp_error (pfile, CPP_DL_PEDWARN,
169695Skan		   "__VA_ARGS__ can only appear in the expansion"
169695Skan		   " of a C99 variadic macro");
169695Skan    }
169695Skan
169695Skan  return result;
169695Skan}
169695Skan
169695Skan/* Lex a number to NUMBER starting at BUFFER->CUR - 1.  */
169695Skanstatic void
169695Skanlex_number (cpp_reader *pfile, cpp_string *number,
169695Skan	    struct normalize_state *nst)
169695Skan{
169695Skan  const uchar *cur;
169695Skan  const uchar *base;
169695Skan  uchar *dest;
169695Skan
169695Skan  base = pfile->buffer->cur - 1;
169695Skan  do
169695Skan    {
169695Skan      cur = pfile->buffer->cur;
169695Skan
169695Skan      /* N.B. ISIDNUM does not include $.  */
169695Skan      while (ISIDNUM (*cur) || *cur == '.' || VALID_SIGN (*cur, cur[-1]))
169695Skan	{
169695Skan	  cur++;
169695Skan	  NORMALIZE_STATE_UPDATE_IDNUM (nst);
169695Skan	}
169695Skan
169695Skan      pfile->buffer->cur = cur;
169695Skan    }
169695Skan  while (forms_identifier_p (pfile, false, nst));
169695Skan
169695Skan  number->len = cur - base;
169695Skan  dest = _cpp_unaligned_alloc (pfile, number->len + 1);
169695Skan  memcpy (dest, base, number->len);
169695Skan  dest[number->len] = '\0';
169695Skan  number->text = dest;
169695Skan}
169695Skan
169695Skan/* Create a token of type TYPE with a literal spelling.  */
169695Skanstatic void
169695Skancreate_literal (cpp_reader *pfile, cpp_token *token, const uchar *base,
169695Skan		unsigned int len, enum cpp_ttype type)
169695Skan{
169695Skan  uchar *dest = _cpp_unaligned_alloc (pfile, len + 1);
169695Skan
169695Skan  memcpy (dest, base, len);
169695Skan  dest[len] = '\0';
169695Skan  token->type = type;
169695Skan  token->val.str.len = len;
169695Skan  token->val.str.text = dest;
169695Skan}
169695Skan
169695Skan/* Lexes a string, character constant, or angle-bracketed header file
169695Skan   name.  The stored string contains the spelling, including opening
169695Skan   quote and leading any leading 'L'.  It returns the type of the
169695Skan   literal, or CPP_OTHER if it was not properly terminated.
169695Skan
169695Skan   The spelling is NUL-terminated, but it is not guaranteed that this
169695Skan   is the first NUL since embedded NULs are preserved.  */
169695Skanstatic void
169695Skanlex_string (cpp_reader *pfile, cpp_token *token, const uchar *base)
169695Skan{
169695Skan  bool saw_NUL = false;
169695Skan  const uchar *cur;
169695Skan  cppchar_t terminator;
169695Skan  enum cpp_ttype type;
169695Skan
169695Skan  cur = base;
169695Skan  terminator = *cur++;
169695Skan  if (terminator == 'L')
169695Skan    terminator = *cur++;
169695Skan  if (terminator == '\"')
169695Skan    type = *base == 'L' ? CPP_WSTRING: CPP_STRING;
169695Skan  else if (terminator == '\'')
169695Skan    type = *base == 'L' ? CPP_WCHAR: CPP_CHAR;
169695Skan  else
169695Skan    terminator = '>', type = CPP_HEADER_NAME;
169695Skan
169695Skan  for (;;)
169695Skan    {
169695Skan      cppchar_t c = *cur++;
169695Skan
169695Skan      /* In #include-style directives, terminators are not escapable.  */
169695Skan      if (c == '\\' && !pfile->state.angled_headers && *cur != '\n')
169695Skan	cur++;
169695Skan      else if (c == terminator)
169695Skan	break;
169695Skan      else if (c == '\n')
169695Skan	{
169695Skan	  cur--;
169695Skan	  type = CPP_OTHER;
169695Skan	  break;
169695Skan	}
169695Skan      else if (c == '\0')
169695Skan	saw_NUL = true;
169695Skan    }
169695Skan
169695Skan  if (saw_NUL && !pfile->state.skipping)
169695Skan    cpp_error (pfile, CPP_DL_WARNING,
169695Skan	       "null character(s) preserved in literal");
169695Skan
169695Skan  if (type == CPP_OTHER && CPP_OPTION (pfile, lang) != CLK_ASM)
169695Skan    cpp_error (pfile, CPP_DL_PEDWARN, "missing terminating %c character",
169695Skan	       (int) terminator);
169695Skan
169695Skan  pfile->buffer->cur = cur;
169695Skan  create_literal (pfile, token, base, cur - base, type);
169695Skan}
169695Skan
169695Skan/* The stored comment includes the comment start and any terminator.  */
169695Skanstatic void
169695Skansave_comment (cpp_reader *pfile, cpp_token *token, const unsigned char *from,
169695Skan	      cppchar_t type)
169695Skan{
169695Skan  unsigned char *buffer;
169695Skan  unsigned int len, clen;
169695Skan
169695Skan  len = pfile->buffer->cur - from + 1; /* + 1 for the initial '/'.  */
169695Skan
169695Skan  /* C++ comments probably (not definitely) have moved past a new
169695Skan     line, which we don't want to save in the comment.  */
169695Skan  if (is_vspace (pfile->buffer->cur[-1]))
169695Skan    len--;
169695Skan
169695Skan  /* If we are currently in a directive, then we need to store all
169695Skan     C++ comments as C comments internally, and so we need to
169695Skan     allocate a little extra space in that case.
169695Skan
169695Skan     Note that the only time we encounter a directive here is
169695Skan     when we are saving comments in a "#define".  */
169695Skan  clen = (pfile->state.in_directive && type == '/') ? len + 2 : len;
169695Skan
169695Skan  buffer = _cpp_unaligned_alloc (pfile, clen);
169695Skan
169695Skan  token->type = CPP_COMMENT;
169695Skan  token->val.str.len = clen;
169695Skan  token->val.str.text = buffer;
169695Skan
169695Skan  buffer[0] = '/';
169695Skan  memcpy (buffer + 1, from, len - 1);
169695Skan
169695Skan  /* Finish conversion to a C comment, if necessary.  */
169695Skan  if (pfile->state.in_directive && type == '/')
169695Skan    {
169695Skan      buffer[1] = '*';
169695Skan      buffer[clen - 2] = '*';
169695Skan      buffer[clen - 1] = '/';
169695Skan    }
169695Skan}
169695Skan
169695Skan/* Allocate COUNT tokens for RUN.  */
169695Skanvoid
169695Skan_cpp_init_tokenrun (tokenrun *run, unsigned int count)
169695Skan{
169695Skan  run->base = XNEWVEC (cpp_token, count);
169695Skan  run->limit = run->base + count;
169695Skan  run->next = NULL;
169695Skan}
169695Skan
169695Skan/* Returns the next tokenrun, or creates one if there is none.  */
169695Skanstatic tokenrun *
169695Skannext_tokenrun (tokenrun *run)
169695Skan{
169695Skan  if (run->next == NULL)
169695Skan    {
169695Skan      run->next = XNEW (tokenrun);
169695Skan      run->next->prev = run;
169695Skan      _cpp_init_tokenrun (run->next, 250);
169695Skan    }
169695Skan
169695Skan  return run->next;
169695Skan}
169695Skan
169695Skan/* Allocate a single token that is invalidated at the same time as the
169695Skan   rest of the tokens on the line.  Has its line and col set to the
169695Skan   same as the last lexed token, so that diagnostics appear in the
169695Skan   right place.  */
169695Skancpp_token *
169695Skan_cpp_temp_token (cpp_reader *pfile)
169695Skan{
169695Skan  cpp_token *old, *result;
169695Skan
169695Skan  old = pfile->cur_token - 1;
169695Skan  if (pfile->cur_token == pfile->cur_run->limit)
169695Skan    {
169695Skan      pfile->cur_run = next_tokenrun (pfile->cur_run);
169695Skan      pfile->cur_token = pfile->cur_run->base;
169695Skan    }
169695Skan
169695Skan  result = pfile->cur_token++;
169695Skan  result->src_loc = old->src_loc;
169695Skan  return result;
169695Skan}
169695Skan
169695Skan/* Lex a token into RESULT (external interface).  Takes care of issues
169695Skan   like directive handling, token lookahead, multiple include
169695Skan   optimization and skipping.  */
169695Skanconst cpp_token *
169695Skan_cpp_lex_token (cpp_reader *pfile)
169695Skan{
169695Skan  cpp_token *result;
169695Skan
169695Skan  for (;;)
169695Skan    {
169695Skan      if (pfile->cur_token == pfile->cur_run->limit)
169695Skan	{
169695Skan	  pfile->cur_run = next_tokenrun (pfile->cur_run);
169695Skan	  pfile->cur_token = pfile->cur_run->base;
169695Skan	}
169695Skan
169695Skan      if (pfile->lookaheads)
169695Skan	{
169695Skan	  pfile->lookaheads--;
169695Skan	  result = pfile->cur_token++;
169695Skan	}
169695Skan      else
169695Skan	result = _cpp_lex_direct (pfile);
169695Skan
169695Skan      if (result->flags & BOL)
169695Skan	{
169695Skan	  /* Is this a directive.  If _cpp_handle_directive returns
169695Skan	     false, it is an assembler #.  */
169695Skan	  if (result->type == CPP_HASH
169695Skan	      /* 6.10.3 p 11: Directives in a list of macro arguments
169695Skan		 gives undefined behavior.  This implementation
169695Skan		 handles the directive as normal.  */
169695Skan	      && pfile->state.parsing_args != 1)
169695Skan	    {
169695Skan	      if (_cpp_handle_directive (pfile, result->flags & PREV_WHITE))
169695Skan		{
169695Skan		  if (pfile->directive_result.type == CPP_PADDING)
169695Skan		    continue;
169695Skan		  result = &pfile->directive_result;
169695Skan		}
169695Skan	    }
169695Skan	  else if (pfile->state.in_deferred_pragma)
169695Skan	    result = &pfile->directive_result;
169695Skan
169695Skan	  if (pfile->cb.line_change && !pfile->state.skipping)
169695Skan	    pfile->cb.line_change (pfile, result, pfile->state.parsing_args);
169695Skan	}
169695Skan
169695Skan      /* We don't skip tokens in directives.  */
169695Skan      if (pfile->state.in_directive || pfile->state.in_deferred_pragma)
169695Skan	break;
169695Skan
169695Skan      /* Outside a directive, invalidate controlling macros.  At file
169695Skan	 EOF, _cpp_lex_direct takes care of popping the buffer, so we never
169695Skan	 get here and MI optimization works.  */
169695Skan      pfile->mi_valid = false;
169695Skan
169695Skan      if (!pfile->state.skipping || result->type == CPP_EOF)
169695Skan	break;
169695Skan    }
169695Skan
169695Skan  return result;
169695Skan}
169695Skan
169695Skan/* Returns true if a fresh line has been loaded.  */
169695Skanbool
169695Skan_cpp_get_fresh_line (cpp_reader *pfile)
169695Skan{
169695Skan  int return_at_eof;
169695Skan
169695Skan  /* We can't get a new line until we leave the current directive.  */
169695Skan  if (pfile->state.in_directive)
169695Skan    return false;
169695Skan
169695Skan  for (;;)
169695Skan    {
169695Skan      cpp_buffer *buffer = pfile->buffer;
169695Skan
169695Skan      if (!buffer->need_line)
169695Skan	return true;
169695Skan
169695Skan      if (buffer->next_line < buffer->rlimit)
169695Skan	{
169695Skan	  _cpp_clean_line (pfile);
169695Skan	  return true;
169695Skan	}
169695Skan
169695Skan      /* First, get out of parsing arguments state.  */
169695Skan      if (pfile->state.parsing_args)
169695Skan	return false;
169695Skan
169695Skan      /* End of buffer.  Non-empty files should end in a newline.  */
169695Skan      if (buffer->buf != buffer->rlimit
169695Skan	  && buffer->next_line > buffer->rlimit
169695Skan	  && !buffer->from_stage3)
169695Skan	{
169695Skan	  /* Only warn once.  */
169695Skan	  buffer->next_line = buffer->rlimit;
169695Skan	  cpp_error_with_line (pfile, CPP_DL_PEDWARN, pfile->line_table->highest_line,
169695Skan			       CPP_BUF_COLUMN (buffer, buffer->cur),
169695Skan			       "no newline at end of file");
169695Skan	}
169695Skan
169695Skan      return_at_eof = buffer->return_at_eof;
169695Skan      _cpp_pop_buffer (pfile);
169695Skan      if (pfile->buffer == NULL || return_at_eof)
169695Skan	return false;
169695Skan    }
169695Skan}
169695Skan
/* Choose between two token types by peeking at the next character.
   Expects `buffer' and `result' to be in scope where it is expanded:
   result->type becomes ELSE_TYPE, unless the character at buffer->cur
   is CHAR, in which case that character is consumed and result->type
   becomes THEN_TYPE.  */
#define IF_NEXT_IS(CHAR, THEN_TYPE, ELSE_TYPE)          \
  do                                                    \
    {                                                   \
      result->type = ELSE_TYPE;                         \
      if (*buffer->cur == CHAR)                         \
        {                                               \
          buffer->cur++;                                \
          result->type = THEN_TYPE;                     \
        }                                               \
    }                                                   \
  while (0)
169695Skan
169695Skan/* Lex a token into pfile->cur_token, which is also incremented, to
169695Skan   get diagnostics pointing to the correct location.
169695Skan
169695Skan   Does not handle issues such as token lookahead, multiple-include
169695Skan   optimization, directives, skipping etc.  This function is only
169695Skan   suitable for use by _cpp_lex_token, and in special cases like
169695Skan   lex_expansion_token which doesn't care for any of these issues.
169695Skan
169695Skan   When meeting a newline, returns CPP_EOF if parsing a directive,
169695Skan   otherwise returns to the start of the token buffer if permissible.
169695Skan   Returns a pointer to the lexed token.
169695Skan
169695Skan   Three labels drive the function:
169695Skan     fresh_line          - clear the flags and, if the buffer needs a
169695Skan                           line, obtain one (or return CPP_PRAGMA_EOL /
169695Skan                           CPP_EOF);
169695Skan     update_tokens_line  - reload the token's location from the line
169695Skan                           table, e.g. after a skipped comment;
169695Skan     skipped_white       - process pending line notes, read the next
169695Skan                           character and dispatch on it.  */
169695Skancpp_token *
169695Skan_cpp_lex_direct (cpp_reader *pfile)
169695Skan{
169695Skan  cppchar_t c;
169695Skan  cpp_buffer *buffer;
169695Skan  const unsigned char *comment_start;
169695Skan  cpp_token *result = pfile->cur_token++;  /* Claim the next token slot.  */
169695Skan
169695Skan fresh_line:  /* Entered initially and again after every newline.  */
169695Skan  result->flags = 0;
169695Skan  buffer = pfile->buffer;
169695Skan  if (buffer->need_line)
169695Skan    {
169695Skan      if (pfile->state.in_deferred_pragma)
169695Skan	{
169695Skan	  /* The line of a deferred pragma is over: report that as a
169695Skan	     token of its own and leave deferred-pragma state.  */
169695Skan	  result->type = CPP_PRAGMA_EOL;
169695Skan	  pfile->state.in_deferred_pragma = false;
169695Skan	  if (!pfile->state.pragma_allow_expansion)
169695Skan	    pfile->state.prevent_expansion--;
169695Skan	  return result;
169695Skan	}
169695Skan      if (!_cpp_get_fresh_line (pfile))
169695Skan	{
169695Skan	  result->type = CPP_EOF;
169695Skan	  if (!pfile->state.in_directive)
169695Skan	    {
169695Skan	      /* Tell the compiler the line number of the EOF token.  */
169695Skan	      result->src_loc = pfile->line_table->highest_line;
169695Skan	      result->flags = BOL;
169695Skan	    }
169695Skan	  return result;
169695Skan	}
169695Skan      if (!pfile->keep_tokens)
169695Skan	{
169695Skan	  /* Earlier tokens need not be kept: start over at the base of
169695Skan	     the first token run and lex into its first slot.  */
169695Skan	  pfile->cur_run = &pfile->base_run;
169695Skan	  result = pfile->base_run.base;
169695Skan	  pfile->cur_token = result + 1;
169695Skan	}
169695Skan      result->flags = BOL;
169695Skan      if (pfile->state.parsing_args == 2)
169695Skan	result->flags |= PREV_WHITE;
169695Skan    }
169695Skan  buffer = pfile->buffer;  /* Re-read: the code above may have switched buffers.  */
169695Skan update_tokens_line:
169695Skan  result->src_loc = pfile->line_table->highest_line;
169695Skan
169695Skan skipped_white:
169695Skan  /* Handle line notes once the read position has reached the next
169695Skan     one, unless an overlaid buffer is in use; afterwards refresh
169695Skan     the token's line.  */
169695Skan  if (buffer->cur >= buffer->notes[buffer->cur_note].pos
169695Skan      && !pfile->overlaid_buffer)
169695Skan    {
169695Skan      _cpp_process_line_notes (pfile, false);
169695Skan      result->src_loc = pfile->line_table->highest_line;
169695Skan    }
169695Skan  c = *buffer->cur++;
169695Skan
169695Skan  LINEMAP_POSITION_FOR_COLUMN (result->src_loc, pfile->line_table,
169695Skan			       CPP_BUF_COLUMN (buffer, buffer->cur));
169695Skan
169695Skan  switch (c)
169695Skan    {
169695Skan    /* Horizontal whitespace, NUL included: flag it and try again.  */
169695Skan    case ' ': case '\t': case '\f': case '\v': case '\0':
169695Skan      result->flags |= PREV_WHITE;
169695Skan      skip_whitespace (pfile, c);
169695Skan      goto skipped_white;
169695Skan
169695Skan    case '\n':
169695Skan      /* The line counter is only advanced when more text follows in
169695Skan	 the buffer.  */
169695Skan      if (buffer->cur < buffer->rlimit)
169695Skan	CPP_INCREMENT_LINE (pfile, 0);
169695Skan      buffer->need_line = true;
169695Skan      goto fresh_line;
169695Skan
169695Skan    case '0': case '1': case '2': case '3': case '4':
169695Skan    case '5': case '6': case '7': case '8': case '9':
169695Skan      {
169695Skan	struct normalize_state nst = INITIAL_NORMALIZE_STATE;
169695Skan	result->type = CPP_NUMBER;
169695Skan	lex_number (pfile, &result->val.str, &nst);
169695Skan	warn_about_normalization (pfile, result, &nst);
169695Skan	break;
169695Skan      }
169695Skan
169695Skan    case 'L':
169695Skan      /* 'L' may introduce wide characters or strings.  */
169695Skan      if (*buffer->cur == '\'' || *buffer->cur == '"')
169695Skan	{
169695Skan	  lex_string (pfile, result, buffer->cur - 1);
169695Skan	  break;
169695Skan	}
169695Skan      /* Fall through.  */
169695Skan
169695Skan    case '_':
169695Skan    case 'a': case 'b': case 'c': case 'd': case 'e': case 'f':
169695Skan    case 'g': case 'h': case 'i': case 'j': case 'k': case 'l':
169695Skan    case 'm': case 'n': case 'o': case 'p': case 'q': case 'r':
169695Skan    case 's': case 't': case 'u': case 'v': case 'w': case 'x':
169695Skan    case 'y': case 'z':
169695Skan    case 'A': case 'B': case 'C': case 'D': case 'E': case 'F':
169695Skan    case 'G': case 'H': case 'I': case 'J': case 'K':  /* 'L' is handled above.  */
169695Skan    case 'M': case 'N': case 'O': case 'P': case 'Q': case 'R':
169695Skan    case 'S': case 'T': case 'U': case 'V': case 'W': case 'X':
169695Skan    case 'Y': case 'Z':
169695Skan      result->type = CPP_NAME;
169695Skan      {
169695Skan	struct normalize_state nst = INITIAL_NORMALIZE_STATE;
169695Skan	result->val.node = lex_identifier (pfile, buffer->cur - 1, false,
169695Skan					   &nst);
169695Skan	warn_about_normalization (pfile, result, &nst);
169695Skan      }
169695Skan
169695Skan      /* Convert named operators to their proper types.  */
169695Skan      if (result->val.node->flags & NODE_OPERATOR)
169695Skan	{
169695Skan	  result->flags |= NAMED_OP;
169695Skan	  result->type = (enum cpp_ttype) result->val.node->directive_index;
169695Skan	}
169695Skan      break;
169695Skan
169695Skan    case '\'':
169695Skan    case '"':
169695Skan      lex_string (pfile, result, buffer->cur - 1);
169695Skan      break;
169695Skan
169695Skan    case '/':
169695Skan      /* A potential block or line comment.  */
169695Skan      comment_start = buffer->cur;
169695Skan      c = *buffer->cur;
169695Skan
169695Skan      if (c == '*')
169695Skan	{
169695Skan	  if (_cpp_skip_block_comment (pfile))
169695Skan	    cpp_error (pfile, CPP_DL_ERROR, "unterminated comment");
169695Skan	}
169695Skan      else if (c == '/' && (CPP_OPTION (pfile, cplusplus_comments)
169695Skan			    || cpp_in_system_header (pfile)))
169695Skan	{
169695Skan	  /* Warn about comments only if pedantically GNUC89, and not
169695Skan	     in system headers.  */
169695Skan	  if (CPP_OPTION (pfile, lang) == CLK_GNUC89 && CPP_PEDANTIC (pfile)
169695Skan	      && ! buffer->warned_cplusplus_comments)
169695Skan	    {
169695Skan	      cpp_error (pfile, CPP_DL_PEDWARN,
169695Skan			 "C++ style comments are not allowed in ISO C90");
169695Skan	      cpp_error (pfile, CPP_DL_PEDWARN,
169695Skan			 "(this will be reported only once per input file)");
169695Skan	      buffer->warned_cplusplus_comments = 1;
169695Skan	    }
169695Skan
169695Skan	  if (skip_line_comment (pfile) && CPP_OPTION (pfile, warn_comments))
169695Skan	    cpp_error (pfile, CPP_DL_WARNING, "multi-line comment");
169695Skan	}
169695Skan      else if (c == '=')
169695Skan	{
169695Skan	  buffer->cur++;
169695Skan	  result->type = CPP_DIV_EQ;
169695Skan	  break;
169695Skan	}
169695Skan      else
169695Skan	{
169695Skan	  result->type = CPP_DIV;
169695Skan	  break;
169695Skan	}
169695Skan
169695Skan      /* Only the two comment branches get here.  A comment that is
169695Skan	 not being saved counts as whitespace before the next token.  */
169695Skan      if (!pfile->state.save_comments)
169695Skan	{
169695Skan	  result->flags |= PREV_WHITE;
169695Skan	  goto update_tokens_line;
169695Skan	}
169695Skan
169695Skan      /* Save the comment as a token in its own right.  */
169695Skan      save_comment (pfile, result, comment_start, c);
169695Skan      break;
169695Skan
169695Skan    case '<':
169695Skan      /* With angled_headers set, '<' is handed to lex_string rather
169695Skan	 than being treated as an operator.  */
169695Skan      if (pfile->state.angled_headers)
169695Skan	{
169695Skan	  lex_string (pfile, result, buffer->cur - 1);
169695Skan	  break;
169695Skan	}
169695Skan
169695Skan      result->type = CPP_LESS;
169695Skan      if (*buffer->cur == '=')
169695Skan	buffer->cur++, result->type = CPP_LESS_EQ;
169695Skan      else if (*buffer->cur == '<')
169695Skan	{
169695Skan	  buffer->cur++;
169695Skan	  IF_NEXT_IS ('=', CPP_LSHIFT_EQ, CPP_LSHIFT);
169695Skan	}
169695Skan      else if (CPP_OPTION (pfile, digraphs))
169695Skan	{
169695Skan	  if (*buffer->cur == ':')  /* "<:" is the digraph for '['.  */
169695Skan	    {
169695Skan	      buffer->cur++;
169695Skan	      result->flags |= DIGRAPH;
169695Skan	      result->type = CPP_OPEN_SQUARE;
169695Skan	    }
169695Skan	  else if (*buffer->cur == '%')  /* "<%" is the digraph for '{'.  */
169695Skan	    {
169695Skan	      buffer->cur++;
169695Skan	      result->flags |= DIGRAPH;
169695Skan	      result->type = CPP_OPEN_BRACE;
169695Skan	    }
169695Skan	}
169695Skan      break;
169695Skan
169695Skan    case '>':
169695Skan      result->type = CPP_GREATER;
169695Skan      if (*buffer->cur == '=')
169695Skan	buffer->cur++, result->type = CPP_GREATER_EQ;
169695Skan      else if (*buffer->cur == '>')
169695Skan	{
169695Skan	  buffer->cur++;
169695Skan	  IF_NEXT_IS ('=', CPP_RSHIFT_EQ, CPP_RSHIFT);
169695Skan	}
169695Skan      break;
169695Skan
169695Skan    case '%':
169695Skan      result->type = CPP_MOD;
169695Skan      if (*buffer->cur == '=')
169695Skan	buffer->cur++, result->type = CPP_MOD_EQ;
169695Skan      else if (CPP_OPTION (pfile, digraphs))
169695Skan	{
169695Skan	  if (*buffer->cur == ':')  /* "%:" is '#'; "%:%:" is "##".  */
169695Skan	    {
169695Skan	      buffer->cur++;
169695Skan	      result->flags |= DIGRAPH;
169695Skan	      result->type = CPP_HASH;
169695Skan	      if (*buffer->cur == '%' && buffer->cur[1] == ':')
169695Skan		buffer->cur += 2, result->type = CPP_PASTE;
169695Skan	    }
169695Skan	  else if (*buffer->cur == '>')  /* "%>" is the digraph for '}'.  */
169695Skan	    {
169695Skan	      buffer->cur++;
169695Skan	      result->flags |= DIGRAPH;
169695Skan	      result->type = CPP_CLOSE_BRACE;
169695Skan	    }
169695Skan	}
169695Skan      break;
169695Skan
169695Skan    case '.':
169695Skan      /* A plain dot, the start of a number such as ".5", "...", or
169695Skan	 ".*" when lexing C++.  */
169695Skan      result->type = CPP_DOT;
169695Skan      if (ISDIGIT (*buffer->cur))
169695Skan	{
169695Skan	  struct normalize_state nst = INITIAL_NORMALIZE_STATE;
169695Skan	  result->type = CPP_NUMBER;
169695Skan	  lex_number (pfile, &result->val.str, &nst);
169695Skan	  warn_about_normalization (pfile, result, &nst);
169695Skan	}
169695Skan      else if (*buffer->cur == '.' && buffer->cur[1] == '.')
169695Skan	buffer->cur += 2, result->type = CPP_ELLIPSIS;
169695Skan      else if (*buffer->cur == '*' && CPP_OPTION (pfile, cplusplus))
169695Skan	buffer->cur++, result->type = CPP_DOT_STAR;
169695Skan      break;
169695Skan
169695Skan    case '+':
169695Skan      result->type = CPP_PLUS;
169695Skan      if (*buffer->cur == '+')
169695Skan	buffer->cur++, result->type = CPP_PLUS_PLUS;
169695Skan      else if (*buffer->cur == '=')
169695Skan	buffer->cur++, result->type = CPP_PLUS_EQ;
169695Skan      break;
169695Skan
169695Skan    case '-':
169695Skan      result->type = CPP_MINUS;
169695Skan      if (*buffer->cur == '>')
169695Skan	{
169695Skan	  buffer->cur++;
169695Skan	  result->type = CPP_DEREF;
169695Skan	  if (*buffer->cur == '*' && CPP_OPTION (pfile, cplusplus))
169695Skan	    buffer->cur++, result->type = CPP_DEREF_STAR;
169695Skan	}
169695Skan      else if (*buffer->cur == '-')
169695Skan	buffer->cur++, result->type = CPP_MINUS_MINUS;
169695Skan      else if (*buffer->cur == '=')
169695Skan	buffer->cur++, result->type = CPP_MINUS_EQ;
169695Skan      break;
169695Skan
169695Skan    case '&':
169695Skan      result->type = CPP_AND;
169695Skan      if (*buffer->cur == '&')
169695Skan	buffer->cur++, result->type = CPP_AND_AND;
169695Skan      else if (*buffer->cur == '=')
169695Skan	buffer->cur++, result->type = CPP_AND_EQ;
169695Skan      break;
169695Skan
169695Skan    case '|':
169695Skan      result->type = CPP_OR;
169695Skan      if (*buffer->cur == '|')
169695Skan	buffer->cur++, result->type = CPP_OR_OR;
169695Skan      else if (*buffer->cur == '=')
169695Skan	buffer->cur++, result->type = CPP_OR_EQ;
169695Skan      break;
169695Skan
169695Skan    case ':':
169695Skan      result->type = CPP_COLON;
169695Skan      if (*buffer->cur == ':' && CPP_OPTION (pfile, cplusplus))
169695Skan	buffer->cur++, result->type = CPP_SCOPE;
169695Skan      else if (*buffer->cur == '>' && CPP_OPTION (pfile, digraphs))
169695Skan	{
169695Skan	  /* ":>" is the digraph for ']'.  */
169695Skan	  buffer->cur++;
169695Skan	  result->flags |= DIGRAPH;
169695Skan	  result->type = CPP_CLOSE_SQUARE;
169695Skan	}
169695Skan      break;
169695Skan
169695Skan    case '*': IF_NEXT_IS ('=', CPP_MULT_EQ, CPP_MULT); break;
169695Skan    case '=': IF_NEXT_IS ('=', CPP_EQ_EQ, CPP_EQ); break;
169695Skan    case '!': IF_NEXT_IS ('=', CPP_NOT_EQ, CPP_NOT); break;
169695Skan    case '^': IF_NEXT_IS ('=', CPP_XOR_EQ, CPP_XOR); break;
169695Skan    case '#': IF_NEXT_IS ('#', CPP_PASTE, CPP_HASH); break;
169695Skan
169695Skan    case '?': result->type = CPP_QUERY; break;
169695Skan    case '~': result->type = CPP_COMPL; break;
169695Skan    case ',': result->type = CPP_COMMA; break;
169695Skan    case '(': result->type = CPP_OPEN_PAREN; break;
169695Skan    case ')': result->type = CPP_CLOSE_PAREN; break;
169695Skan    case '[': result->type = CPP_OPEN_SQUARE; break;
169695Skan    case ']': result->type = CPP_CLOSE_SQUARE; break;
169695Skan    case '{': result->type = CPP_OPEN_BRACE; break;
169695Skan    case '}': result->type = CPP_CLOSE_BRACE; break;
169695Skan    case ';': result->type = CPP_SEMICOLON; break;
169695Skan
169695Skan      /* @ is a punctuator in Objective-C.  */
169695Skan    case '@': result->type = CPP_ATSIGN; break;
169695Skan
169695Skan    case '$':
169695Skan    case '\\':
169695Skan      {
169695Skan	/* Step back onto the character so that forms_identifier_p
169695Skan	   can decide whether an identifier starts here.  */
169695Skan	const uchar *base = --buffer->cur;
169695Skan	struct normalize_state nst = INITIAL_NORMALIZE_STATE;
169695Skan
169695Skan	if (forms_identifier_p (pfile, true, &nst))
169695Skan	  {
169695Skan	    result->type = CPP_NAME;
169695Skan	    result->val.node = lex_identifier (pfile, base, true, &nst);
169695Skan	    warn_about_normalization (pfile, result, &nst);
169695Skan	    break;
169695Skan	  }
169695Skan	buffer->cur++;  /* No identifier: step past the character again.  */
169695Skan      }
169695Skan      /* Fall through.  */
169695Skan
169695Skan    default:
169695Skan      /* Anything else becomes a one-character CPP_OTHER token.  */
169695Skan      create_literal (pfile, result, buffer->cur - 1, 1, CPP_OTHER);
169695Skan      break;
169695Skan    }
169695Skan
169695Skan  return result;
169695Skan}
169695Skan
169695Skan/* An upper bound on the number of bytes needed to spell TOKEN.
169695Skan   Does not include preceding whitespace.  */
169695Skanunsigned int
169695Skancpp_token_len (const cpp_token *token)
169695Skan{
169695Skan  unsigned int len;
169695Skan
169695Skan  switch (TOKEN_SPELL (token))
169695Skan    {
169695Skan    default:		len = 4;				break;
169695Skan    case SPELL_LITERAL:	len = token->val.str.len;		break;
169695Skan    case SPELL_IDENT:	len = NODE_LEN (token->val.node) * 10;	break;
169695Skan    }
169695Skan
169695Skan  return len;
169695Skan}
169695Skan
/* Decode the UTF-8 sequence that starts at NAME and store the
   matching universal character name, "\U" followed by eight
   lowercase hexadecimal digits, in BUFFER.  Exactly 10 bytes are
   written to BUFFER; no terminating NUL is added.  Returns the
   number of bytes the sequence occupies in NAME, as announced by its
   first byte.  Calls abort if a trailing byte is not a UTF-8
   continuation byte.  */

static size_t
utf8_to_ucn (unsigned char *buffer, const unsigned char *name)
{
  static const char hex_digits[] = "0123456789abcdef";
  const unsigned char *src = name;
  unsigned long code_point;
  unsigned lead;
  int seq_len = 0;
  int remaining;
  int shift;

  /* The number of leading 1 bits in the first byte is the length of
     the whole sequence.  */
  lead = *src;
  while (lead & 0x80)
    {
      seq_len++;
      lead <<= 1;
    }

  /* What is left of the first byte below those length bits is the
     most significant part of the code point.  */
  code_point = *src & (0x7F >> seq_len);

  /* Every further byte contributes six more bits.  */
  for (remaining = seq_len - 1; remaining > 0; remaining--)
    {
      src++;

      /* Ill-formed UTF-8.  */
      if ((*src & ~0x3F) != 0x80)
	abort ();

      code_point = (code_point << 6) | (*src & 0x3F);
    }

  *buffer++ = '\\';
  *buffer++ = 'U';
  for (shift = 28; shift >= 0; shift -= 4)
    *buffer++ = hex_digits[(code_point >> shift) & 0xF];

  return seq_len;
}
169695Skan
169695Skan
169695Skan/* Write the spelling of a token TOKEN to BUFFER.  The buffer must
169695Skan   already contain the enough space to hold the token's spelling.
169695Skan   Returns a pointer to the character after the last character written.
169695Skan   FORSTRING is true if this is to be the spelling after translation
169695Skan   phase 1 (this is different for UCNs).
169695Skan   FIXME: Would be nice if we didn't need the PFILE argument.  */
169695Skanunsigned char *
169695Skancpp_spell_token (cpp_reader *pfile, const cpp_token *token,
169695Skan		 unsigned char *buffer, bool forstring)
169695Skan{
169695Skan  switch (TOKEN_SPELL (token))
169695Skan    {
169695Skan    case SPELL_OPERATOR:
169695Skan      {
169695Skan	const unsigned char *spelling;
169695Skan	unsigned char c;
169695Skan
169695Skan	if (token->flags & DIGRAPH)
169695Skan	  spelling
169695Skan	    = digraph_spellings[(int) token->type - (int) CPP_FIRST_DIGRAPH];
169695Skan	else if (token->flags & NAMED_OP)
169695Skan	  goto spell_ident;
169695Skan	else
169695Skan	  spelling = TOKEN_NAME (token);
169695Skan
169695Skan	while ((c = *spelling++) != '\0')
169695Skan	  *buffer++ = c;
169695Skan      }
169695Skan      break;
169695Skan
169695Skan    spell_ident:
169695Skan    case SPELL_IDENT:
169695Skan      if (forstring)
169695Skan	{
169695Skan	  memcpy (buffer, NODE_NAME (token->val.node),
169695Skan		  NODE_LEN (token->val.node));
169695Skan	  buffer += NODE_LEN (token->val.node);
169695Skan	}
169695Skan      else
169695Skan	{
169695Skan	  size_t i;
169695Skan	  const unsigned char * name = NODE_NAME (token->val.node);
169695Skan
169695Skan	  for (i = 0; i < NODE_LEN (token->val.node); i++)
169695Skan	    if (name[i] & ~0x7F)
169695Skan	      {
169695Skan		i += utf8_to_ucn (buffer, name + i) - 1;
169695Skan		buffer += 10;
169695Skan	      }
169695Skan	    else
169695Skan	      *buffer++ = NODE_NAME (token->val.node)[i];
169695Skan	}
169695Skan      break;
169695Skan
169695Skan    case SPELL_LITERAL:
169695Skan      memcpy (buffer, token->val.str.text, token->val.str.len);
169695Skan      buffer += token->val.str.len;
169695Skan      break;
169695Skan
169695Skan    case SPELL_NONE:
169695Skan      cpp_error (pfile, CPP_DL_ICE,
169695Skan		 "unspellable token %s", TOKEN_NAME (token));
169695Skan      break;
169695Skan    }
169695Skan
169695Skan  return buffer;
169695Skan}
169695Skan
169695Skan/* Returns TOKEN spelt as a null-terminated string.  The string is
169695Skan   freed when the reader is destroyed.  Useful for diagnostics.  */
169695Skanunsigned char *
169695Skancpp_token_as_text (cpp_reader *pfile, const cpp_token *token)
169695Skan{
169695Skan  unsigned int len = cpp_token_len (token) + 1;
169695Skan  unsigned char *start = _cpp_unaligned_alloc (pfile, len), *end;
169695Skan
169695Skan  end = cpp_spell_token (pfile, token, start, false);
169695Skan  end[0] = '\0';
169695Skan
169695Skan  return start;
169695Skan}
169695Skan
169695Skan/* Used by C front ends, which really should move to using
169695Skan   cpp_token_as_text.  */
169695Skanconst char *
169695Skancpp_type2name (enum cpp_ttype type)
169695Skan{
169695Skan  return (const char *) token_spellings[type].name;
169695Skan}
169695Skan
169695Skan/* Writes the spelling of token to FP, without any preceding space.
169695Skan   Separated from cpp_spell_token for efficiency - to avoid stdio
169695Skan   double-buffering.  */
169695Skanvoid
169695Skancpp_output_token (const cpp_token *token, FILE *fp)
169695Skan{
169695Skan  switch (TOKEN_SPELL (token))
169695Skan    {
169695Skan    case SPELL_OPERATOR:
169695Skan      {
169695Skan	const unsigned char *spelling;
169695Skan	int c;
169695Skan
169695Skan	if (token->flags & DIGRAPH)
169695Skan	  spelling
169695Skan	    = digraph_spellings[(int) token->type - (int) CPP_FIRST_DIGRAPH];
169695Skan	else if (token->flags & NAMED_OP)
169695Skan	  goto spell_ident;
169695Skan	else
169695Skan	  spelling = TOKEN_NAME (token);
169695Skan
169695Skan	c = *spelling;
169695Skan	do
169695Skan	  putc (c, fp);
169695Skan	while ((c = *++spelling) != '\0');
169695Skan      }
169695Skan      break;
169695Skan
169695Skan    spell_ident:
169695Skan    case SPELL_IDENT:
169695Skan      {
169695Skan	size_t i;
169695Skan	const unsigned char * name = NODE_NAME (token->val.node);
169695Skan
169695Skan	for (i = 0; i < NODE_LEN (token->val.node); i++)
169695Skan	  if (name[i] & ~0x7F)
169695Skan	    {
169695Skan	      unsigned char buffer[10];
169695Skan	      i += utf8_to_ucn (buffer, name + i) - 1;
169695Skan	      fwrite (buffer, 1, 10, fp);
169695Skan	    }
169695Skan	  else
169695Skan	    fputc (NODE_NAME (token->val.node)[i], fp);
169695Skan      }
169695Skan      break;
169695Skan
169695Skan    case SPELL_LITERAL:
169695Skan      fwrite (token->val.str.text, 1, token->val.str.len, fp);
169695Skan      break;
169695Skan
169695Skan    case SPELL_NONE:
169695Skan      /* An error, most probably.  */
169695Skan      break;
169695Skan    }
169695Skan}
169695Skan
169695Skan/* Compare two tokens.  */
169695Skanint
169695Skan_cpp_equiv_tokens (const cpp_token *a, const cpp_token *b)
169695Skan{
169695Skan  if (a->type == b->type && a->flags == b->flags)
169695Skan    switch (TOKEN_SPELL (a))
169695Skan      {
169695Skan      default:			/* Keep compiler happy.  */
169695Skan      case SPELL_OPERATOR:
169695Skan	return 1;
169695Skan      case SPELL_NONE:
169695Skan	return (a->type != CPP_MACRO_ARG || a->val.arg_no == b->val.arg_no);
169695Skan      case SPELL_IDENT:
169695Skan	return a->val.node == b->val.node;
169695Skan      case SPELL_LITERAL:
169695Skan	return (a->val.str.len == b->val.str.len
169695Skan		&& !memcmp (a->val.str.text, b->val.str.text,
169695Skan			    a->val.str.len));
169695Skan      }
169695Skan
169695Skan  return 0;
169695Skan}
169695Skan
169695Skan/* Returns nonzero if a space should be inserted to avoid an
169695Skan   accidental token paste for output.  For simplicity, it is
169695Skan   conservative, and occasionally advises a space where one is not
169695Skan   needed, e.g. "." and ".2".  */
169695Skanint
169695Skancpp_avoid_paste (cpp_reader *pfile, const cpp_token *token1,
169695Skan		 const cpp_token *token2)
169695Skan{
169695Skan  enum cpp_ttype a = token1->type, b = token2->type;
169695Skan  cppchar_t c;
169695Skan
169695Skan  if (token1->flags & NAMED_OP)
169695Skan    a = CPP_NAME;
169695Skan  if (token2->flags & NAMED_OP)
169695Skan    b = CPP_NAME;
169695Skan
169695Skan  c = EOF;
169695Skan  if (token2->flags & DIGRAPH)
169695Skan    c = digraph_spellings[(int) b - (int) CPP_FIRST_DIGRAPH][0];
169695Skan  else if (token_spellings[b].category == SPELL_OPERATOR)
169695Skan    c = token_spellings[b].name[0];
169695Skan
169695Skan  /* Quickly get everything that can paste with an '='.  */
169695Skan  if ((int) a <= (int) CPP_LAST_EQ && c == '=')
169695Skan    return 1;
169695Skan
169695Skan  switch (a)
169695Skan    {
169695Skan    case CPP_GREATER:	return c == '>';
169695Skan    case CPP_LESS:	return c == '<' || c == '%' || c == ':';
169695Skan    case CPP_PLUS:	return c == '+';
169695Skan    case CPP_MINUS:	return c == '-' || c == '>';
169695Skan    case CPP_DIV:	return c == '/' || c == '*'; /* Comments.  */
169695Skan    case CPP_MOD:	return c == ':' || c == '>';
169695Skan    case CPP_AND:	return c == '&';
169695Skan    case CPP_OR:	return c == '|';
169695Skan    case CPP_COLON:	return c == ':' || c == '>';
169695Skan    case CPP_DEREF:	return c == '*';
169695Skan    case CPP_DOT:	return c == '.' || c == '%' || b == CPP_NUMBER;
169695Skan    case CPP_HASH:	return c == '#' || c == '%'; /* Digraph form.  */
169695Skan    case CPP_NAME:	return ((b == CPP_NUMBER
169695Skan				 && name_p (pfile, &token2->val.str))
169695Skan				|| b == CPP_NAME
169695Skan				|| b == CPP_CHAR || b == CPP_STRING); /* L */
169695Skan    case CPP_NUMBER:	return (b == CPP_NUMBER || b == CPP_NAME
169695Skan				|| c == '.' || c == '+' || c == '-');
169695Skan				      /* UCNs */
169695Skan    case CPP_OTHER:	return ((token1->val.str.text[0] == '\\'
169695Skan				 && b == CPP_NAME)
169695Skan				|| (CPP_OPTION (pfile, objc)
169695Skan				    && token1->val.str.text[0] == '@'
169695Skan				    && (b == CPP_NAME || b == CPP_STRING)));
169695Skan    default:		break;
169695Skan    }
169695Skan
169695Skan  return 0;
169695Skan}
169695Skan
169695Skan/* Output all the remaining tokens on the current line, and a newline
169695Skan   character, to FP.  Leading whitespace is removed.  If there are
169695Skan   macros, special token padding is not performed.  */
169695Skanvoid
169695Skancpp_output_line (cpp_reader *pfile, FILE *fp)
169695Skan{
169695Skan  const cpp_token *token;
169695Skan
169695Skan  token = cpp_get_token (pfile);
169695Skan  while (token->type != CPP_EOF)
169695Skan    {
169695Skan      cpp_output_token (token, fp);
169695Skan      token = cpp_get_token (pfile);
169695Skan      if (token->flags & PREV_WHITE)
169695Skan	putc (' ', fp);
169695Skan    }
169695Skan
169695Skan  putc ('\n', fp);
169695Skan}
169695Skan
/* Memory buffers.  Changing these three constants can have a dramatic
   effect on performance.  The values here are reasonable defaults,
   but might be tuned.  If you adjust them, be sure to test across a
   range of uses of cpplib, including heavy nested function-like macro
   expansion.  Also check the change in peak memory usage (NJAMD is a
   good tool for this).

   MIN_BUFF_SIZE is the smallest buffer new_buff will create.
   BUFF_SIZE_UPPER_BOUND (MIN_SIZE) is the largest free buffer that
   _cpp_get_buff will hand out for a request of MIN_SIZE bytes.
   EXTENDED_BUFF_SIZE (BUFF, MIN_EXTRA) is the size requested when
   BUFF is extended: MIN_EXTRA plus twice the number of bytes between
   BUFF->cur and BUFF->limit.  Every macro argument is parenthesized
   so that arbitrary expressions can be passed safely.  */
#define MIN_BUFF_SIZE 8000
#define BUFF_SIZE_UPPER_BOUND(MIN_SIZE) (MIN_BUFF_SIZE + (MIN_SIZE) * 3 / 2)
#define EXTENDED_BUFF_SIZE(BUFF, MIN_EXTRA) \
	((MIN_EXTRA) + ((BUFF)->limit - (BUFF)->cur) * 2)

#if MIN_BUFF_SIZE > BUFF_SIZE_UPPER_BOUND (0)
  #error BUFF_SIZE_UPPER_BOUND must be at least as large as MIN_BUFF_SIZE!
#endif
169695Skan
169695Skan/* Create a new allocation buffer.  Place the control block at the end
169695Skan   of the buffer, so that buffer overflows will cause immediate chaos.  */
169695Skanstatic _cpp_buff *
169695Skannew_buff (size_t len)
169695Skan{
169695Skan  _cpp_buff *result;
169695Skan  unsigned char *base;
169695Skan
169695Skan  if (len < MIN_BUFF_SIZE)
169695Skan    len = MIN_BUFF_SIZE;
169695Skan  len = CPP_ALIGN (len);
169695Skan
169695Skan  base = XNEWVEC (unsigned char, len + sizeof (_cpp_buff));
169695Skan  result = (_cpp_buff *) (base + len);
169695Skan  result->base = base;
169695Skan  result->cur = base;
169695Skan  result->limit = base + len;
169695Skan  result->next = NULL;
169695Skan  return result;
169695Skan}
169695Skan
169695Skan/* Place a chain of unwanted allocation buffers on the free list.  */
169695Skanvoid
169695Skan_cpp_release_buff (cpp_reader *pfile, _cpp_buff *buff)
169695Skan{
169695Skan  _cpp_buff *end = buff;
169695Skan
169695Skan  while (end->next)
169695Skan    end = end->next;
169695Skan  end->next = pfile->free_buffs;
169695Skan  pfile->free_buffs = buff;
169695Skan}
169695Skan
169695Skan/* Return a free buffer of size at least MIN_SIZE.  */
169695Skan_cpp_buff *
169695Skan_cpp_get_buff (cpp_reader *pfile, size_t min_size)
169695Skan{
169695Skan  _cpp_buff *result, **p;
169695Skan
169695Skan  for (p = &pfile->free_buffs;; p = &(*p)->next)
169695Skan    {
169695Skan      size_t size;
169695Skan
169695Skan      if (*p == NULL)
169695Skan	return new_buff (min_size);
169695Skan      result = *p;
169695Skan      size = result->limit - result->base;
169695Skan      /* Return a buffer that's big enough, but don't waste one that's
169695Skan         way too big.  */
169695Skan      if (size >= min_size && size <= BUFF_SIZE_UPPER_BOUND (min_size))
169695Skan	break;
169695Skan    }
169695Skan
169695Skan  *p = result->next;
169695Skan  result->next = NULL;
169695Skan  result->cur = result->base;
169695Skan  return result;
169695Skan}
169695Skan
169695Skan/* Creates a new buffer with enough space to hold the uncommitted
169695Skan   remaining bytes of BUFF, and at least MIN_EXTRA more bytes.  Copies
169695Skan   the excess bytes to the new buffer.  Chains the new buffer after
169695Skan   BUFF, and returns the new buffer.  */
169695Skan_cpp_buff *
169695Skan_cpp_append_extend_buff (cpp_reader *pfile, _cpp_buff *buff, size_t min_extra)
169695Skan{
169695Skan  size_t size = EXTENDED_BUFF_SIZE (buff, min_extra);
169695Skan  _cpp_buff *new_buff = _cpp_get_buff (pfile, size);
169695Skan
169695Skan  buff->next = new_buff;
169695Skan  memcpy (new_buff->base, buff->cur, BUFF_ROOM (buff));
169695Skan  return new_buff;
169695Skan}
169695Skan
169695Skan/* Creates a new buffer with enough space to hold the uncommitted
169695Skan   remaining bytes of the buffer pointed to by BUFF, and at least
169695Skan   MIN_EXTRA more bytes.  Copies the excess bytes to the new buffer.
169695Skan   Chains the new buffer before the buffer pointed to by BUFF, and
169695Skan   updates the pointer to point to the new buffer.  */
169695Skanvoid
169695Skan_cpp_extend_buff (cpp_reader *pfile, _cpp_buff **pbuff, size_t min_extra)
169695Skan{
169695Skan  _cpp_buff *new_buff, *old_buff = *pbuff;
169695Skan  size_t size = EXTENDED_BUFF_SIZE (old_buff, min_extra);
169695Skan
169695Skan  new_buff = _cpp_get_buff (pfile, size);
169695Skan  memcpy (new_buff->base, old_buff->cur, BUFF_ROOM (old_buff));
169695Skan  new_buff->next = old_buff;
169695Skan  *pbuff = new_buff;
169695Skan}
169695Skan
169695Skan/* Free a chain of buffers starting at BUFF.  */
169695Skanvoid
169695Skan_cpp_free_buff (_cpp_buff *buff)
169695Skan{
169695Skan  _cpp_buff *next;
169695Skan
169695Skan  for (; buff; buff = next)
169695Skan    {
169695Skan      next = buff->next;
169695Skan      free (buff->base);
169695Skan    }
169695Skan}
169695Skan
169695Skan/* Allocate permanent, unaligned storage of length LEN.  */
169695Skanunsigned char *
169695Skan_cpp_unaligned_alloc (cpp_reader *pfile, size_t len)
169695Skan{
169695Skan  _cpp_buff *buff = pfile->u_buff;
169695Skan  unsigned char *result = buff->cur;
169695Skan
169695Skan  if (len > (size_t) (buff->limit - result))
169695Skan    {
169695Skan      buff = _cpp_get_buff (pfile, len);
169695Skan      buff->next = pfile->u_buff;
169695Skan      pfile->u_buff = buff;
169695Skan      result = buff->cur;
169695Skan    }
169695Skan
169695Skan  buff->cur = result + len;
169695Skan  return result;
169695Skan}
169695Skan
169695Skan/* Allocate permanent, unaligned storage of length LEN from a_buff.
169695Skan   That buffer is used for growing allocations when saving macro
169695Skan   replacement lists in a #define, and when parsing an answer to an
169695Skan   assertion in #assert, #unassert or #if (and therefore possibly
169695Skan   whilst expanding macros).  It therefore must not be used by any
169695Skan   code that they might call: specifically the lexer and the guts of
169695Skan   the macro expander.
169695Skan
169695Skan   All existing other uses clearly fit this restriction: storing
169695Skan   registered pragmas during initialization.  */
169695Skanunsigned char *
169695Skan_cpp_aligned_alloc (cpp_reader *pfile, size_t len)
169695Skan{
169695Skan  _cpp_buff *buff = pfile->a_buff;
169695Skan  unsigned char *result = buff->cur;
169695Skan
169695Skan  if (len > (size_t) (buff->limit - result))
169695Skan    {
169695Skan      buff = _cpp_get_buff (pfile, len);
169695Skan      buff->next = pfile->a_buff;
169695Skan      pfile->a_buff = buff;
169695Skan      result = buff->cur;
169695Skan    }
169695Skan
169695Skan  buff->cur = result + len;
169695Skan  return result;
169695Skan}
169695Skan
169695Skan/* Say which field of TOK is in use.  */
169695Skan
169695Skanenum cpp_token_fld_kind
169695Skancpp_token_val_index (cpp_token *tok)
169695Skan{
169695Skan  switch (TOKEN_SPELL (tok))
169695Skan    {
169695Skan    case SPELL_IDENT:
169695Skan      return CPP_TOKEN_FLD_NODE;
169695Skan    case SPELL_LITERAL:
169695Skan      return CPP_TOKEN_FLD_STR;
169695Skan    case SPELL_NONE:
169695Skan      if (tok->type == CPP_MACRO_ARG)
169695Skan	return CPP_TOKEN_FLD_ARG_NO;
169695Skan      else if (tok->type == CPP_PADDING)
169695Skan	return CPP_TOKEN_FLD_SOURCE;
169695Skan      else if (tok->type == CPP_PRAGMA)
169695Skan	return CPP_TOKEN_FLD_PRAGMA;
169695Skan      /* else fall through */
169695Skan    default:
169695Skan      return CPP_TOKEN_FLD_NONE;
169695Skan    }
169695Skan}