gcc/gcc/cpplex.c

/* CPP Library - lexical analysis.
   Copyright (C) 2000, 2001, 2002 Free Software Foundation, Inc.
   Contributed by Per Bothner, 1994-95.
   Based on CCCP program by Paul Rubin, June 1986
   Adapted to ANSI C, Richard Stallman, Jan 1987
   Broken out to separate file, Zack Weinberg, Mar 2000
   Single-pass line tokenization by Neil Booth, April 2000

This program is free software; you can redistribute it and/or modify it
under the terms of the GNU General Public License as published by the
Free Software Foundation; either version 2, or (at your option) any
later version.

This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.  */
*c87b03e5Sespie
*c87b03e5Sespie#include "config.h"
*c87b03e5Sespie#include "system.h"
*c87b03e5Sespie#include "cpplib.h"
*c87b03e5Sespie#include "cpphash.h"
*c87b03e5Sespie
*c87b03e5Sespie#ifdef MULTIBYTE_CHARS
*c87b03e5Sespie#include "mbchar.h"
*c87b03e5Sespie#include <locale.h>
*c87b03e5Sespie#endif
*c87b03e5Sespie
/* Spelling categories recorded per token type.  Tokens with
   SPELL_STRING store their spelling in the token list, and its length
   in the token->val.name.len.  */
enum spell_type
{
  SPELL_OPERATOR = 0,
  SPELL_CHAR     = 1,
  SPELL_IDENT    = 2,
  SPELL_NUMBER   = 3,
  SPELL_STRING   = 4,
  SPELL_NONE     = 5
};
*c87b03e5Sespie
*c87b03e5Sespiestruct token_spelling
*c87b03e5Sespie{
*c87b03e5Sespie  enum spell_type category;
*c87b03e5Sespie  const unsigned char *name;
*c87b03e5Sespie};
*c87b03e5Sespie
*c87b03e5Sespiestatic const unsigned char *const digraph_spellings[] =
*c87b03e5Sespie{ U"%:", U"%:%:", U"<:", U":>", U"<%", U"%>" };
*c87b03e5Sespie
*c87b03e5Sespie#define OP(e, s) { SPELL_OPERATOR, U s           },
*c87b03e5Sespie#define TK(e, s) { s,              U STRINGX (e) },
*c87b03e5Sespiestatic const struct token_spelling token_spellings[N_TTYPES] = { TTYPE_TABLE };
*c87b03e5Sespie#undef OP
*c87b03e5Sespie#undef TK
*c87b03e5Sespie
/* Look up the spelling category / name string for TOKEN's type.  */
#define TOKEN_SPELL(token) \
  (token_spellings[(token)->type].category)
#define TOKEN_NAME(token) \
  (token_spellings[(token)->type].name)

/* Rewind the read position to the saved backup point.  Relies on a
   local variable named `buffer' being in scope at the point of use.  */
#define BACKUP() \
  do { buffer->cur = buffer->backup_to; } while (0)
*c87b03e5Sespie
*c87b03e5Sespiestatic void handle_newline PARAMS ((cpp_reader *));
*c87b03e5Sespiestatic cppchar_t skip_escaped_newlines PARAMS ((cpp_reader *));
*c87b03e5Sespiestatic cppchar_t get_effective_char PARAMS ((cpp_reader *));
*c87b03e5Sespie
*c87b03e5Sespiestatic int skip_block_comment PARAMS ((cpp_reader *));
*c87b03e5Sespiestatic int skip_line_comment PARAMS ((cpp_reader *));
*c87b03e5Sespiestatic void adjust_column PARAMS ((cpp_reader *));
*c87b03e5Sespiestatic int skip_whitespace PARAMS ((cpp_reader *, cppchar_t));
*c87b03e5Sespiestatic cpp_hashnode *parse_identifier PARAMS ((cpp_reader *));
*c87b03e5Sespiestatic uchar *parse_slow PARAMS ((cpp_reader *, const uchar *, int,
*c87b03e5Sespie				  unsigned int *));
*c87b03e5Sespiestatic void parse_number PARAMS ((cpp_reader *, cpp_string *, int));
*c87b03e5Sespiestatic int unescaped_terminator_p PARAMS ((cpp_reader *, const uchar *));
*c87b03e5Sespiestatic void parse_string PARAMS ((cpp_reader *, cpp_token *, cppchar_t));
*c87b03e5Sespiestatic bool trigraph_p PARAMS ((cpp_reader *));
*c87b03e5Sespiestatic void save_comment PARAMS ((cpp_reader *, cpp_token *, const uchar *,
*c87b03e5Sespie				  cppchar_t));
*c87b03e5Sespiestatic bool continue_after_nul PARAMS ((cpp_reader *));
*c87b03e5Sespiestatic int name_p PARAMS ((cpp_reader *, const cpp_string *));
*c87b03e5Sespiestatic int maybe_read_ucs PARAMS ((cpp_reader *, const unsigned char **,
*c87b03e5Sespie				   const unsigned char *, cppchar_t *));
*c87b03e5Sespiestatic tokenrun *next_tokenrun PARAMS ((tokenrun *));
*c87b03e5Sespie
*c87b03e5Sespiestatic unsigned int hex_digit_value PARAMS ((unsigned int));
*c87b03e5Sespiestatic _cpp_buff *new_buff PARAMS ((size_t));
*c87b03e5Sespie
*c87b03e5Sespie/* Utility routine:
*c87b03e5Sespie
*c87b03e5Sespie   Compares, the token TOKEN to the NUL-terminated string STRING.
*c87b03e5Sespie   TOKEN must be a CPP_NAME.  Returns 1 for equal, 0 for unequal.  */
*c87b03e5Sespieint
*c87b03e5Sespiecpp_ideq (token, string)
*c87b03e5Sespie     const cpp_token *token;
*c87b03e5Sespie     const char *string;
*c87b03e5Sespie{
*c87b03e5Sespie  if (token->type != CPP_NAME)
*c87b03e5Sespie    return 0;
*c87b03e5Sespie
*c87b03e5Sespie  return !ustrcmp (NODE_NAME (token->val.node), (const uchar *) string);
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Call when meeting a newline, assumed to be in buffer->cur[-1].
*c87b03e5Sespie   Returns with buffer->cur pointing to the character immediately
*c87b03e5Sespie   following the newline (combination).  */
*c87b03e5Sespiestatic void
*c87b03e5Sespiehandle_newline (pfile)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie{
*c87b03e5Sespie  cpp_buffer *buffer = pfile->buffer;
*c87b03e5Sespie
*c87b03e5Sespie  /* Handle CR-LF and LF-CR.  Most other implementations (e.g. java)
*c87b03e5Sespie     only accept CR-LF; maybe we should fall back to that behavior?  */
*c87b03e5Sespie  if (buffer->cur[-1] + buffer->cur[0] == '\r' + '\n')
*c87b03e5Sespie    buffer->cur++;
*c87b03e5Sespie
*c87b03e5Sespie  buffer->line_base = buffer->cur;
*c87b03e5Sespie  buffer->col_adjust = 0;
*c87b03e5Sespie  pfile->line++;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Subroutine of skip_escaped_newlines; called when a 3-character
*c87b03e5Sespie   sequence beginning with "??" is encountered.  buffer->cur points to
*c87b03e5Sespie   the second '?'.
*c87b03e5Sespie
*c87b03e5Sespie   Warn if necessary, and returns true if the sequence forms a
*c87b03e5Sespie   trigraph and the trigraph should be honored.  */
*c87b03e5Sespiestatic bool
*c87b03e5Sespietrigraph_p (pfile)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie{
*c87b03e5Sespie  cpp_buffer *buffer = pfile->buffer;
*c87b03e5Sespie  cppchar_t from_char = buffer->cur[1];
*c87b03e5Sespie  bool accept;
*c87b03e5Sespie
*c87b03e5Sespie  if (!_cpp_trigraph_map[from_char])
*c87b03e5Sespie    return false;
*c87b03e5Sespie
*c87b03e5Sespie  accept = CPP_OPTION (pfile, trigraphs);
*c87b03e5Sespie
*c87b03e5Sespie  /* Don't warn about trigraphs in comments.  */
*c87b03e5Sespie  if (CPP_OPTION (pfile, warn_trigraphs) && !pfile->state.lexing_comment)
*c87b03e5Sespie    {
*c87b03e5Sespie      if (accept)
*c87b03e5Sespie	cpp_error_with_line (pfile, DL_WARNING,
*c87b03e5Sespie			     pfile->line, CPP_BUF_COL (buffer) - 1,
*c87b03e5Sespie			     "trigraph ??%c converted to %c",
*c87b03e5Sespie			     (int) from_char,
*c87b03e5Sespie			     (int) _cpp_trigraph_map[from_char]);
*c87b03e5Sespie      else if (buffer->cur != buffer->last_Wtrigraphs)
*c87b03e5Sespie	{
*c87b03e5Sespie	  buffer->last_Wtrigraphs = buffer->cur;
*c87b03e5Sespie	  cpp_error_with_line (pfile, DL_WARNING,
*c87b03e5Sespie			       pfile->line, CPP_BUF_COL (buffer) - 1,
*c87b03e5Sespie			       "trigraph ??%c ignored", (int) from_char);
*c87b03e5Sespie	}
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  return accept;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Skips any escaped newlines introduced by '?' or a '\\', assumed to
*c87b03e5Sespie   lie in buffer->cur[-1].  Returns the next byte, which will be in
*c87b03e5Sespie   buffer->cur[-1].  This routine performs preprocessing stages 1 and
*c87b03e5Sespie   2 of the ISO C standard.  */
*c87b03e5Sespiestatic cppchar_t
*c87b03e5Sespieskip_escaped_newlines (pfile)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie{
*c87b03e5Sespie  cpp_buffer *buffer = pfile->buffer;
*c87b03e5Sespie  cppchar_t next = buffer->cur[-1];
*c87b03e5Sespie
*c87b03e5Sespie  /* Only do this if we apply stages 1 and 2.  */
*c87b03e5Sespie  if (!buffer->from_stage3)
*c87b03e5Sespie    {
*c87b03e5Sespie      const unsigned char *saved_cur;
*c87b03e5Sespie      cppchar_t next1;
*c87b03e5Sespie
*c87b03e5Sespie      do
*c87b03e5Sespie	{
*c87b03e5Sespie	  if (next == '?')
*c87b03e5Sespie	    {
*c87b03e5Sespie	      if (buffer->cur[0] != '?' || !trigraph_p (pfile))
*c87b03e5Sespie		break;
*c87b03e5Sespie
*c87b03e5Sespie	      /* Translate the trigraph.  */
*c87b03e5Sespie	      next = _cpp_trigraph_map[buffer->cur[1]];
*c87b03e5Sespie	      buffer->cur += 2;
*c87b03e5Sespie	      if (next != '\\')
*c87b03e5Sespie		break;
*c87b03e5Sespie	    }
*c87b03e5Sespie
*c87b03e5Sespie	  if (buffer->cur == buffer->rlimit)
*c87b03e5Sespie	    break;
*c87b03e5Sespie
*c87b03e5Sespie	  /* We have a backslash, and room for at least one more
*c87b03e5Sespie	     character.  Skip horizontal whitespace.  */
*c87b03e5Sespie	  saved_cur = buffer->cur;
*c87b03e5Sespie	  do
*c87b03e5Sespie	    next1 = *buffer->cur++;
*c87b03e5Sespie	  while (is_nvspace (next1) && buffer->cur < buffer->rlimit);
*c87b03e5Sespie
*c87b03e5Sespie	  if (!is_vspace (next1))
*c87b03e5Sespie	    {
*c87b03e5Sespie	      buffer->cur = saved_cur;
*c87b03e5Sespie	      break;
*c87b03e5Sespie	    }
*c87b03e5Sespie
*c87b03e5Sespie	  if (saved_cur != buffer->cur - 1
*c87b03e5Sespie	      && !pfile->state.lexing_comment)
*c87b03e5Sespie	    cpp_error (pfile, DL_WARNING,
*c87b03e5Sespie		       "backslash and newline separated by space");
*c87b03e5Sespie
*c87b03e5Sespie	  handle_newline (pfile);
*c87b03e5Sespie	  buffer->backup_to = buffer->cur;
*c87b03e5Sespie	  if (buffer->cur == buffer->rlimit)
*c87b03e5Sespie	    {
*c87b03e5Sespie	      cpp_error (pfile, DL_PEDWARN,
*c87b03e5Sespie			 "backslash-newline at end of file");
*c87b03e5Sespie	      next = EOF;
*c87b03e5Sespie	    }
*c87b03e5Sespie	  else
*c87b03e5Sespie	    next = *buffer->cur++;
*c87b03e5Sespie	}
*c87b03e5Sespie      while (next == '\\' || next == '?');
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  return next;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Obtain the next character, after trigraph conversion and skipping
*c87b03e5Sespie   an arbitrarily long string of escaped newlines.  The common case of
*c87b03e5Sespie   no trigraphs or escaped newlines falls through quickly.  On return,
*c87b03e5Sespie   buffer->backup_to points to where to return to if the character is
*c87b03e5Sespie   not to be processed.  */
*c87b03e5Sespiestatic cppchar_t
*c87b03e5Sespieget_effective_char (pfile)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie{
*c87b03e5Sespie  cppchar_t next;
*c87b03e5Sespie  cpp_buffer *buffer = pfile->buffer;
*c87b03e5Sespie
*c87b03e5Sespie  buffer->backup_to = buffer->cur;
*c87b03e5Sespie  next = *buffer->cur++;
*c87b03e5Sespie  if (__builtin_expect (next == '?' || next == '\\', 0))
*c87b03e5Sespie    next = skip_escaped_newlines (pfile);
*c87b03e5Sespie
*c87b03e5Sespie  return next;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Skip a C-style block comment.  We find the end of the comment by
*c87b03e5Sespie   seeing if an asterisk is before every '/' we encounter.  Returns
*c87b03e5Sespie   nonzero if comment terminated by EOF, zero otherwise.  */
*c87b03e5Sespiestatic int
*c87b03e5Sespieskip_block_comment (pfile)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie{
*c87b03e5Sespie  cpp_buffer *buffer = pfile->buffer;
*c87b03e5Sespie  cppchar_t c = EOF, prevc = EOF;
*c87b03e5Sespie
*c87b03e5Sespie  pfile->state.lexing_comment = 1;
*c87b03e5Sespie  while (buffer->cur != buffer->rlimit)
*c87b03e5Sespie    {
*c87b03e5Sespie      prevc = c, c = *buffer->cur++;
*c87b03e5Sespie
*c87b03e5Sespie      /* FIXME: For speed, create a new character class of characters
*c87b03e5Sespie	 of interest inside block comments.  */
*c87b03e5Sespie      if (c == '?' || c == '\\')
*c87b03e5Sespie	c = skip_escaped_newlines (pfile);
*c87b03e5Sespie
*c87b03e5Sespie      /* People like decorating comments with '*', so check for '/'
*c87b03e5Sespie	 instead for efficiency.  */
*c87b03e5Sespie      if (c == '/')
*c87b03e5Sespie	{
*c87b03e5Sespie	  if (prevc == '*')
*c87b03e5Sespie	    break;
*c87b03e5Sespie
*c87b03e5Sespie	  /* Warn about potential nested comments, but not if the '/'
*c87b03e5Sespie	     comes immediately before the true comment delimiter.
*c87b03e5Sespie	     Don't bother to get it right across escaped newlines.  */
*c87b03e5Sespie	  if (CPP_OPTION (pfile, warn_comments)
*c87b03e5Sespie	      && buffer->cur[0] == '*' && buffer->cur[1] != '/')
*c87b03e5Sespie	    cpp_error_with_line (pfile, DL_WARNING,
*c87b03e5Sespie				 pfile->line, CPP_BUF_COL (buffer),
*c87b03e5Sespie				 "\"/*\" within comment");
*c87b03e5Sespie	}
*c87b03e5Sespie      else if (is_vspace (c))
*c87b03e5Sespie	handle_newline (pfile);
*c87b03e5Sespie      else if (c == '\t')
*c87b03e5Sespie	adjust_column (pfile);
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  pfile->state.lexing_comment = 0;
*c87b03e5Sespie  return c != '/' || prevc != '*';
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Skip a C++ line comment, leaving buffer->cur pointing to the
*c87b03e5Sespie   terminating newline.  Handles escaped newlines.  Returns nonzero
*c87b03e5Sespie   if a multiline comment.  */
*c87b03e5Sespiestatic int
*c87b03e5Sespieskip_line_comment (pfile)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie{
*c87b03e5Sespie  cpp_buffer *buffer = pfile->buffer;
*c87b03e5Sespie  unsigned int orig_line = pfile->line;
*c87b03e5Sespie  cppchar_t c;
*c87b03e5Sespie#ifdef MULTIBYTE_CHARS
*c87b03e5Sespie  wchar_t wc;
*c87b03e5Sespie  int char_len;
*c87b03e5Sespie#endif
*c87b03e5Sespie
*c87b03e5Sespie  pfile->state.lexing_comment = 1;
*c87b03e5Sespie#ifdef MULTIBYTE_CHARS
*c87b03e5Sespie  /* Reset multibyte conversion state.  */
*c87b03e5Sespie  (void) local_mbtowc (NULL, NULL, 0);
*c87b03e5Sespie#endif
*c87b03e5Sespie  do
*c87b03e5Sespie    {
*c87b03e5Sespie      if (buffer->cur == buffer->rlimit)
*c87b03e5Sespie	goto at_eof;
*c87b03e5Sespie
*c87b03e5Sespie#ifdef MULTIBYTE_CHARS
*c87b03e5Sespie      char_len = local_mbtowc (&wc, (const char *) buffer->cur,
*c87b03e5Sespie			       buffer->rlimit - buffer->cur);
*c87b03e5Sespie      if (char_len == -1)
*c87b03e5Sespie	{
*c87b03e5Sespie	  cpp_error (pfile, DL_WARNING,
*c87b03e5Sespie		     "ignoring invalid multibyte character");
*c87b03e5Sespie	  char_len = 1;
*c87b03e5Sespie	  c = *buffer->cur++;
*c87b03e5Sespie	}
*c87b03e5Sespie      else
*c87b03e5Sespie	{
*c87b03e5Sespie	  buffer->cur += char_len;
*c87b03e5Sespie	  c = wc;
*c87b03e5Sespie	}
*c87b03e5Sespie#else
*c87b03e5Sespie      c = *buffer->cur++;
*c87b03e5Sespie#endif
*c87b03e5Sespie      if (c == '?' || c == '\\')
*c87b03e5Sespie	c = skip_escaped_newlines (pfile);
*c87b03e5Sespie    }
*c87b03e5Sespie  while (!is_vspace (c));
*c87b03e5Sespie
*c87b03e5Sespie  /* Step back over the newline, except at EOF.  */
*c87b03e5Sespie  buffer->cur--;
*c87b03e5Sespie at_eof:
*c87b03e5Sespie
*c87b03e5Sespie  pfile->state.lexing_comment = 0;
*c87b03e5Sespie  return orig_line != pfile->line;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* pfile->buffer->cur is one beyond the \t character.  Update
*c87b03e5Sespie   col_adjust so we track the column correctly.  */
*c87b03e5Sespiestatic void
*c87b03e5Sespieadjust_column (pfile)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie{
*c87b03e5Sespie  cpp_buffer *buffer = pfile->buffer;
*c87b03e5Sespie  unsigned int col = CPP_BUF_COL (buffer) - 1; /* Zero-based column.  */
*c87b03e5Sespie
*c87b03e5Sespie  /* Round it up to multiple of the tabstop, but subtract 1 since the
*c87b03e5Sespie     tab itself occupies a character position.  */
*c87b03e5Sespie  buffer->col_adjust += (CPP_OPTION (pfile, tabstop)
*c87b03e5Sespie			 - col % CPP_OPTION (pfile, tabstop)) - 1;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Skips whitespace, saving the next non-whitespace character.
*c87b03e5Sespie   Adjusts pfile->col_adjust to account for tabs.  Without this,
*c87b03e5Sespie   tokens might be assigned an incorrect column.  */
*c87b03e5Sespiestatic int
*c87b03e5Sespieskip_whitespace (pfile, c)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie     cppchar_t c;
*c87b03e5Sespie{
*c87b03e5Sespie  cpp_buffer *buffer = pfile->buffer;
*c87b03e5Sespie  unsigned int warned = 0;
*c87b03e5Sespie
*c87b03e5Sespie  do
*c87b03e5Sespie    {
*c87b03e5Sespie      /* Horizontal space always OK.  */
*c87b03e5Sespie      if (c == ' ')
*c87b03e5Sespie	;
*c87b03e5Sespie      else if (c == '\t')
*c87b03e5Sespie	adjust_column (pfile);
*c87b03e5Sespie      /* Just \f \v or \0 left.  */
*c87b03e5Sespie      else if (c == '\0')
*c87b03e5Sespie	{
*c87b03e5Sespie	  if (buffer->cur - 1 == buffer->rlimit)
*c87b03e5Sespie	    return 0;
*c87b03e5Sespie	  if (!warned)
*c87b03e5Sespie	    {
*c87b03e5Sespie	      cpp_error (pfile, DL_WARNING, "null character(s) ignored");
*c87b03e5Sespie	      warned = 1;
*c87b03e5Sespie	    }
*c87b03e5Sespie	}
*c87b03e5Sespie      else if (pfile->state.in_directive && CPP_PEDANTIC (pfile))
*c87b03e5Sespie	cpp_error_with_line (pfile, DL_PEDWARN, pfile->line,
*c87b03e5Sespie			     CPP_BUF_COL (buffer),
*c87b03e5Sespie			     "%s in preprocessing directive",
*c87b03e5Sespie			     c == '\f' ? "form feed" : "vertical tab");
*c87b03e5Sespie
*c87b03e5Sespie      c = *buffer->cur++;
*c87b03e5Sespie    }
*c87b03e5Sespie  /* We only want non-vertical space, i.e. ' ' \t \f \v \0.  */
*c87b03e5Sespie  while (is_nvspace (c));
*c87b03e5Sespie
*c87b03e5Sespie  buffer->cur--;
*c87b03e5Sespie  return 1;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* See if the characters of a number token are valid in a name (no
*c87b03e5Sespie   '.', '+' or '-').  */
*c87b03e5Sespiestatic int
*c87b03e5Sespiename_p (pfile, string)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie     const cpp_string *string;
*c87b03e5Sespie{
*c87b03e5Sespie  unsigned int i;
*c87b03e5Sespie
*c87b03e5Sespie  for (i = 0; i < string->len; i++)
*c87b03e5Sespie    if (!is_idchar (string->text[i]))
*c87b03e5Sespie      return 0;
*c87b03e5Sespie
*c87b03e5Sespie  return 1;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Parse an identifier, skipping embedded backslash-newlines.  This is
*c87b03e5Sespie   a critical inner loop.  The common case is an identifier which has
*c87b03e5Sespie   not been split by backslash-newline, does not contain a dollar
*c87b03e5Sespie   sign, and has already been scanned (roughly 10:1 ratio of
*c87b03e5Sespie   seen:unseen identifiers in normal code; the distribution is
*c87b03e5Sespie   Poisson-like).  Second most common case is a new identifier, not
*c87b03e5Sespie   split and no dollar sign.  The other possibilities are rare and
*c87b03e5Sespie   have been relegated to parse_slow.  */
*c87b03e5Sespiestatic cpp_hashnode *
*c87b03e5Sespieparse_identifier (pfile)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie{
*c87b03e5Sespie  cpp_hashnode *result;
*c87b03e5Sespie  const uchar *cur, *base;
*c87b03e5Sespie
*c87b03e5Sespie  /* Fast-path loop.  Skim over a normal identifier.
*c87b03e5Sespie     N.B. ISIDNUM does not include $.  */
*c87b03e5Sespie  cur = pfile->buffer->cur;
*c87b03e5Sespie  while (ISIDNUM (*cur))
*c87b03e5Sespie    cur++;
*c87b03e5Sespie
*c87b03e5Sespie  /* Check for slow-path cases.  */
*c87b03e5Sespie  if (*cur == '?' || *cur == '\\' || *cur == '$')
*c87b03e5Sespie    {
*c87b03e5Sespie      unsigned int len;
*c87b03e5Sespie
*c87b03e5Sespie      base = parse_slow (pfile, cur, 0, &len);
*c87b03e5Sespie      result = (cpp_hashnode *)
*c87b03e5Sespie	ht_lookup (pfile->hash_table, base, len, HT_ALLOCED);
*c87b03e5Sespie    }
*c87b03e5Sespie  else
*c87b03e5Sespie    {
*c87b03e5Sespie      base = pfile->buffer->cur - 1;
*c87b03e5Sespie      pfile->buffer->cur = cur;
*c87b03e5Sespie      result = (cpp_hashnode *)
*c87b03e5Sespie	ht_lookup (pfile->hash_table, base, cur - base, HT_ALLOC);
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  /* Rarely, identifiers require diagnostics when lexed.
*c87b03e5Sespie     XXX Has to be forced out of the fast path.  */
*c87b03e5Sespie  if (__builtin_expect ((result->flags & NODE_DIAGNOSTIC)
*c87b03e5Sespie			&& !pfile->state.skipping, 0))
*c87b03e5Sespie    {
*c87b03e5Sespie      /* It is allowed to poison the same identifier twice.  */
*c87b03e5Sespie      if ((result->flags & NODE_POISONED) && !pfile->state.poisoned_ok)
*c87b03e5Sespie	cpp_error (pfile, DL_ERROR, "attempt to use poisoned \"%s\"",
*c87b03e5Sespie		   NODE_NAME (result));
*c87b03e5Sespie
*c87b03e5Sespie      /* Constraint 6.10.3.5: __VA_ARGS__ should only appear in the
*c87b03e5Sespie	 replacement list of a variadic macro.  */
*c87b03e5Sespie      if (result == pfile->spec_nodes.n__VA_ARGS__
*c87b03e5Sespie	  && !pfile->state.va_args_ok)
*c87b03e5Sespie	cpp_error (pfile, DL_PEDWARN,
*c87b03e5Sespie	"__VA_ARGS__ can only appear in the expansion of a C99 variadic macro");
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  return result;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Slow path.  This handles numbers and identifiers which have been
*c87b03e5Sespie   split, or contain dollar signs.  The part of the token from
*c87b03e5Sespie   PFILE->buffer->cur-1 to CUR has already been scanned.  NUMBER_P is
*c87b03e5Sespie   1 if it's a number, and 2 if it has a leading period.  Returns a
*c87b03e5Sespie   pointer to the token's NUL-terminated spelling in permanent
*c87b03e5Sespie   storage, and sets PLEN to its length.  */
*c87b03e5Sespiestatic uchar *
*c87b03e5Sespieparse_slow (pfile, cur, number_p, plen)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie     const uchar *cur;
*c87b03e5Sespie     int number_p;
*c87b03e5Sespie     unsigned int *plen;
*c87b03e5Sespie{
*c87b03e5Sespie  cpp_buffer *buffer = pfile->buffer;
*c87b03e5Sespie  const uchar *base = buffer->cur - 1;
*c87b03e5Sespie  struct obstack *stack = &pfile->hash_table->stack;
*c87b03e5Sespie  unsigned int c, prevc, saw_dollar = 0;
*c87b03e5Sespie
*c87b03e5Sespie  /* Place any leading period.  */
*c87b03e5Sespie  if (number_p == 2)
*c87b03e5Sespie    obstack_1grow (stack, '.');
*c87b03e5Sespie
*c87b03e5Sespie  /* Copy the part of the token which is known to be okay.  */
*c87b03e5Sespie  obstack_grow (stack, base, cur - base);
*c87b03e5Sespie
*c87b03e5Sespie  /* Now process the part which isn't.  We are looking at one of
*c87b03e5Sespie     '$', '\\', or '?' on entry to this loop.  */
*c87b03e5Sespie  prevc = cur[-1];
*c87b03e5Sespie  c = *cur++;
*c87b03e5Sespie  buffer->cur = cur;
*c87b03e5Sespie  for (;;)
*c87b03e5Sespie    {
*c87b03e5Sespie      /* Potential escaped newline?  */
*c87b03e5Sespie      buffer->backup_to = buffer->cur - 1;
*c87b03e5Sespie      if (c == '?' || c == '\\')
*c87b03e5Sespie	c = skip_escaped_newlines (pfile);
*c87b03e5Sespie
*c87b03e5Sespie      if (!is_idchar (c))
*c87b03e5Sespie	{
*c87b03e5Sespie	  if (!number_p)
*c87b03e5Sespie	    break;
*c87b03e5Sespie	  if (c != '.' && !VALID_SIGN (c, prevc))
*c87b03e5Sespie	    break;
*c87b03e5Sespie	}
*c87b03e5Sespie
*c87b03e5Sespie      /* Handle normal identifier characters in this loop.  */
*c87b03e5Sespie      do
*c87b03e5Sespie	{
*c87b03e5Sespie	  prevc = c;
*c87b03e5Sespie	  obstack_1grow (stack, c);
*c87b03e5Sespie
*c87b03e5Sespie	  if (c == '$')
*c87b03e5Sespie	    saw_dollar++;
*c87b03e5Sespie
*c87b03e5Sespie	  c = *buffer->cur++;
*c87b03e5Sespie	}
*c87b03e5Sespie      while (is_idchar (c));
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  /* Step back over the unwanted char.  */
*c87b03e5Sespie  BACKUP ();
*c87b03e5Sespie
*c87b03e5Sespie  /* $ is not an identifier character in the standard, but is commonly
*c87b03e5Sespie     accepted as an extension.  Don't warn about it in skipped
*c87b03e5Sespie     conditional blocks.  */
*c87b03e5Sespie  if (saw_dollar && CPP_PEDANTIC (pfile) && ! pfile->state.skipping)
*c87b03e5Sespie    cpp_error (pfile, DL_PEDWARN, "'$' character(s) in identifier or number");
*c87b03e5Sespie
*c87b03e5Sespie  /* Identifiers and numbers are null-terminated.  */
*c87b03e5Sespie  *plen = obstack_object_size (stack);
*c87b03e5Sespie  obstack_1grow (stack, '\0');
*c87b03e5Sespie  return obstack_finish (stack);
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Parse a number, beginning with character C, skipping embedded
*c87b03e5Sespie   backslash-newlines.  LEADING_PERIOD is nonzero if there was a "."
*c87b03e5Sespie   before C.  Place the result in NUMBER.  */
*c87b03e5Sespiestatic void
*c87b03e5Sespieparse_number (pfile, number, leading_period)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie     cpp_string *number;
*c87b03e5Sespie     int leading_period;
*c87b03e5Sespie{
*c87b03e5Sespie  const uchar *cur;
*c87b03e5Sespie
*c87b03e5Sespie  /* Fast-path loop.  Skim over a normal number.
*c87b03e5Sespie     N.B. ISIDNUM does not include $.  */
*c87b03e5Sespie  cur = pfile->buffer->cur;
*c87b03e5Sespie  while (ISIDNUM (*cur) || *cur == '.' || VALID_SIGN (*cur, cur[-1]))
*c87b03e5Sespie    cur++;
*c87b03e5Sespie
*c87b03e5Sespie  /* Check for slow-path cases.  */
*c87b03e5Sespie  if (*cur == '?' || *cur == '\\' || *cur == '$')
*c87b03e5Sespie    number->text = parse_slow (pfile, cur, 1 + leading_period, &number->len);
*c87b03e5Sespie  else
*c87b03e5Sespie    {
*c87b03e5Sespie      const uchar *base = pfile->buffer->cur - 1;
*c87b03e5Sespie      uchar *dest;
*c87b03e5Sespie
*c87b03e5Sespie      number->len = cur - base + leading_period;
*c87b03e5Sespie      dest = _cpp_unaligned_alloc (pfile, number->len + 1);
*c87b03e5Sespie      dest[number->len] = '\0';
*c87b03e5Sespie      number->text = dest;
*c87b03e5Sespie
*c87b03e5Sespie      if (leading_period)
*c87b03e5Sespie	*dest++ = '.';
*c87b03e5Sespie      memcpy (dest, base, cur - base);
*c87b03e5Sespie      pfile->buffer->cur = cur;
*c87b03e5Sespie    }
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Subroutine of parse_string.  */
*c87b03e5Sespiestatic int
*c87b03e5Sespieunescaped_terminator_p (pfile, dest)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie     const unsigned char *dest;
*c87b03e5Sespie{
*c87b03e5Sespie  const unsigned char *start, *temp;
*c87b03e5Sespie
*c87b03e5Sespie  /* In #include-style directives, terminators are not escapeable.  */
*c87b03e5Sespie  if (pfile->state.angled_headers)
*c87b03e5Sespie    return 1;
*c87b03e5Sespie
*c87b03e5Sespie  start = BUFF_FRONT (pfile->u_buff);
*c87b03e5Sespie
*c87b03e5Sespie  /* An odd number of consecutive backslashes represents an escaped
*c87b03e5Sespie     terminator.  */
*c87b03e5Sespie  for (temp = dest; temp > start && temp[-1] == '\\'; temp--)
*c87b03e5Sespie    ;
*c87b03e5Sespie
*c87b03e5Sespie  return ((dest - temp) & 1) == 0;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Parses a string, character constant, or angle-bracketed header file
*c87b03e5Sespie   name.  Handles embedded trigraphs and escaped newlines.  The stored
*c87b03e5Sespie   string is guaranteed NUL-terminated, but it is not guaranteed that
*c87b03e5Sespie   this is the first NUL since embedded NULs are preserved.
*c87b03e5Sespie
*c87b03e5Sespie   When this function returns, buffer->cur points to the next
*c87b03e5Sespie   character to be processed.  */
*c87b03e5Sespiestatic void
*c87b03e5Sespieparse_string (pfile, token, terminator)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie     cpp_token *token;
*c87b03e5Sespie     cppchar_t terminator;
*c87b03e5Sespie{
*c87b03e5Sespie  cpp_buffer *buffer = pfile->buffer;
*c87b03e5Sespie  unsigned char *dest, *limit;
*c87b03e5Sespie  cppchar_t c;
*c87b03e5Sespie  bool warned_nulls = false;
*c87b03e5Sespie#ifdef MULTIBYTE_CHARS
*c87b03e5Sespie  wchar_t wc;
*c87b03e5Sespie  int char_len;
*c87b03e5Sespie#endif
*c87b03e5Sespie
*c87b03e5Sespie  dest = BUFF_FRONT (pfile->u_buff);
*c87b03e5Sespie  limit = BUFF_LIMIT (pfile->u_buff);
*c87b03e5Sespie
*c87b03e5Sespie#ifdef MULTIBYTE_CHARS
*c87b03e5Sespie  /* Reset multibyte conversion state.  */
*c87b03e5Sespie  (void) local_mbtowc (NULL, NULL, 0);
*c87b03e5Sespie#endif
*c87b03e5Sespie  for (;;)
*c87b03e5Sespie    {
*c87b03e5Sespie      /* We need room for another char, possibly the terminating NUL.  */
*c87b03e5Sespie      if ((size_t) (limit - dest) < 1)
*c87b03e5Sespie	{
*c87b03e5Sespie	  size_t len_so_far = dest - BUFF_FRONT (pfile->u_buff);
*c87b03e5Sespie	  _cpp_extend_buff (pfile, &pfile->u_buff, 2);
*c87b03e5Sespie	  dest = BUFF_FRONT (pfile->u_buff) + len_so_far;
*c87b03e5Sespie	  limit = BUFF_LIMIT (pfile->u_buff);
*c87b03e5Sespie	}
*c87b03e5Sespie
*c87b03e5Sespie#ifdef MULTIBYTE_CHARS
*c87b03e5Sespie      char_len = local_mbtowc (&wc, (const char *) buffer->cur,
*c87b03e5Sespie			       buffer->rlimit - buffer->cur);
*c87b03e5Sespie      if (char_len == -1)
*c87b03e5Sespie	{
*c87b03e5Sespie	  cpp_error (pfile, DL_WARNING,
*c87b03e5Sespie		     "ignoring invalid multibyte character");
*c87b03e5Sespie	  char_len = 1;
*c87b03e5Sespie	  c = *buffer->cur++;
*c87b03e5Sespie	}
*c87b03e5Sespie      else
*c87b03e5Sespie	{
*c87b03e5Sespie	  buffer->cur += char_len;
*c87b03e5Sespie	  c = wc;
*c87b03e5Sespie	}
*c87b03e5Sespie#else
*c87b03e5Sespie      c = *buffer->cur++;
*c87b03e5Sespie#endif
*c87b03e5Sespie
*c87b03e5Sespie      /* Handle trigraphs, escaped newlines etc.  */
*c87b03e5Sespie      if (c == '?' || c == '\\')
*c87b03e5Sespie	c = skip_escaped_newlines (pfile);
*c87b03e5Sespie
*c87b03e5Sespie      if (c == terminator)
*c87b03e5Sespie	{
*c87b03e5Sespie	  if (unescaped_terminator_p (pfile, dest))
*c87b03e5Sespie	    break;
*c87b03e5Sespie	}
*c87b03e5Sespie      else if (is_vspace (c))
*c87b03e5Sespie	{
*c87b03e5Sespie	  /* No string literal may extend over multiple lines.  In
*c87b03e5Sespie	     assembly language, suppress the error except for <>
*c87b03e5Sespie	     includes.  This is a kludge around not knowing where
*c87b03e5Sespie	     comments are.  */
*c87b03e5Sespie	unterminated:
*c87b03e5Sespie	  if (CPP_OPTION (pfile, lang) != CLK_ASM || terminator == '>')
*c87b03e5Sespie	    cpp_error (pfile, DL_ERROR, "missing terminating %c character",
*c87b03e5Sespie		       (int) terminator);
*c87b03e5Sespie	  buffer->cur--;
*c87b03e5Sespie	  break;
*c87b03e5Sespie	}
*c87b03e5Sespie      else if (c == '\0')
*c87b03e5Sespie	{
*c87b03e5Sespie	  if (buffer->cur - 1 == buffer->rlimit)
*c87b03e5Sespie	    goto unterminated;
*c87b03e5Sespie	  if (!warned_nulls)
*c87b03e5Sespie	    {
*c87b03e5Sespie	      warned_nulls = true;
*c87b03e5Sespie	      cpp_error (pfile, DL_WARNING,
*c87b03e5Sespie			 "null character(s) preserved in literal");
*c87b03e5Sespie	    }
*c87b03e5Sespie	}
*c87b03e5Sespie#ifdef MULTIBYTE_CHARS
*c87b03e5Sespie      if (char_len > 1)
*c87b03e5Sespie	{
*c87b03e5Sespie	  for ( ; char_len > 0; --char_len)
*c87b03e5Sespie	    *dest++ = (*buffer->cur - char_len);
*c87b03e5Sespie	}
*c87b03e5Sespie      else
*c87b03e5Sespie#endif
*c87b03e5Sespie	*dest++ = c;
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  *dest = '\0';
*c87b03e5Sespie
*c87b03e5Sespie  token->val.str.text = BUFF_FRONT (pfile->u_buff);
*c87b03e5Sespie  token->val.str.len = dest - BUFF_FRONT (pfile->u_buff);
*c87b03e5Sespie  BUFF_FRONT (pfile->u_buff) = dest + 1;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* The stored comment includes the comment start and any terminator.  */
*c87b03e5Sespiestatic void
*c87b03e5Sespiesave_comment (pfile, token, from, type)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie     cpp_token *token;
*c87b03e5Sespie     const unsigned char *from;
*c87b03e5Sespie     cppchar_t type;
*c87b03e5Sespie{
*c87b03e5Sespie  unsigned char *buffer;
*c87b03e5Sespie  unsigned int len, clen;
*c87b03e5Sespie
*c87b03e5Sespie  len = pfile->buffer->cur - from + 1; /* + 1 for the initial '/'.  */
*c87b03e5Sespie
*c87b03e5Sespie  /* C++ comments probably (not definitely) have moved past a new
*c87b03e5Sespie     line, which we don't want to save in the comment.  */
*c87b03e5Sespie  if (is_vspace (pfile->buffer->cur[-1]))
*c87b03e5Sespie    len--;
*c87b03e5Sespie
*c87b03e5Sespie  /* If we are currently in a directive, then we need to store all
*c87b03e5Sespie     C++ comments as C comments internally, and so we need to
*c87b03e5Sespie     allocate a little extra space in that case.
*c87b03e5Sespie
*c87b03e5Sespie     Note that the only time we encounter a directive here is
*c87b03e5Sespie     when we are saving comments in a "#define".  */
*c87b03e5Sespie  clen = (pfile->state.in_directive && type == '/') ? len + 2 : len;
*c87b03e5Sespie
*c87b03e5Sespie  buffer = _cpp_unaligned_alloc (pfile, clen);
*c87b03e5Sespie
*c87b03e5Sespie  token->type = CPP_COMMENT;
*c87b03e5Sespie  token->val.str.len = clen;
*c87b03e5Sespie  token->val.str.text = buffer;
*c87b03e5Sespie
*c87b03e5Sespie  buffer[0] = '/';
*c87b03e5Sespie  memcpy (buffer + 1, from, len - 1);
*c87b03e5Sespie
*c87b03e5Sespie  /* Finish conversion to a C comment, if necessary.  */
*c87b03e5Sespie  if (pfile->state.in_directive && type == '/')
*c87b03e5Sespie    {
*c87b03e5Sespie      buffer[1] = '*';
*c87b03e5Sespie      buffer[clen - 2] = '*';
*c87b03e5Sespie      buffer[clen - 1] = '/';
*c87b03e5Sespie    }
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Allocate COUNT tokens for RUN.  */
*c87b03e5Sespievoid
*c87b03e5Sespie_cpp_init_tokenrun (run, count)
*c87b03e5Sespie     tokenrun *run;
*c87b03e5Sespie     unsigned int count;
*c87b03e5Sespie{
*c87b03e5Sespie  run->base = xnewvec (cpp_token, count);
*c87b03e5Sespie  run->limit = run->base + count;
*c87b03e5Sespie  run->next = NULL;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Returns the next tokenrun, or creates one if there is none.  */
*c87b03e5Sespiestatic tokenrun *
*c87b03e5Sespienext_tokenrun (run)
*c87b03e5Sespie     tokenrun *run;
*c87b03e5Sespie{
*c87b03e5Sespie  if (run->next == NULL)
*c87b03e5Sespie    {
*c87b03e5Sespie      run->next = xnew (tokenrun);
*c87b03e5Sespie      run->next->prev = run;
*c87b03e5Sespie      _cpp_init_tokenrun (run->next, 250);
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  return run->next;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Allocate a single token that is invalidated at the same time as the
*c87b03e5Sespie   rest of the tokens on the line.  Has its line and col set to the
*c87b03e5Sespie   same as the last lexed token, so that diagnostics appear in the
*c87b03e5Sespie   right place.  */
*c87b03e5Sespiecpp_token *
*c87b03e5Sespie_cpp_temp_token (pfile)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie{
*c87b03e5Sespie  cpp_token *old, *result;
*c87b03e5Sespie
*c87b03e5Sespie  old = pfile->cur_token - 1;
*c87b03e5Sespie  if (pfile->cur_token == pfile->cur_run->limit)
*c87b03e5Sespie    {
*c87b03e5Sespie      pfile->cur_run = next_tokenrun (pfile->cur_run);
*c87b03e5Sespie      pfile->cur_token = pfile->cur_run->base;
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  result = pfile->cur_token++;
*c87b03e5Sespie  result->line = old->line;
*c87b03e5Sespie  result->col = old->col;
*c87b03e5Sespie  return result;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Lex a token into RESULT (external interface).  Takes care of issues
*c87b03e5Sespie   like directive handling, token lookahead, multiple include
*c87b03e5Sespie   optimization and skipping.  */
*c87b03e5Sespieconst cpp_token *
*c87b03e5Sespie_cpp_lex_token (pfile)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie{
*c87b03e5Sespie  cpp_token *result;
*c87b03e5Sespie
*c87b03e5Sespie  for (;;)
*c87b03e5Sespie    {
*c87b03e5Sespie      if (pfile->cur_token == pfile->cur_run->limit)
*c87b03e5Sespie	{
*c87b03e5Sespie	  pfile->cur_run = next_tokenrun (pfile->cur_run);
*c87b03e5Sespie	  pfile->cur_token = pfile->cur_run->base;
*c87b03e5Sespie	}
*c87b03e5Sespie
*c87b03e5Sespie      if (pfile->lookaheads)
*c87b03e5Sespie	{
*c87b03e5Sespie	  pfile->lookaheads--;
*c87b03e5Sespie	  result = pfile->cur_token++;
*c87b03e5Sespie	}
*c87b03e5Sespie      else
*c87b03e5Sespie	result = _cpp_lex_direct (pfile);
*c87b03e5Sespie
*c87b03e5Sespie      if (result->flags & BOL)
*c87b03e5Sespie	{
*c87b03e5Sespie	  /* Is this a directive.  If _cpp_handle_directive returns
*c87b03e5Sespie	     false, it is an assembler #.  */
*c87b03e5Sespie	  if (result->type == CPP_HASH
*c87b03e5Sespie	      /* 6.10.3 p 11: Directives in a list of macro arguments
*c87b03e5Sespie		 gives undefined behavior.  This implementation
*c87b03e5Sespie		 handles the directive as normal.  */
*c87b03e5Sespie	      && pfile->state.parsing_args != 1
*c87b03e5Sespie	      && _cpp_handle_directive (pfile, result->flags & PREV_WHITE))
*c87b03e5Sespie	    continue;
*c87b03e5Sespie	  if (pfile->cb.line_change && !pfile->state.skipping)
*c87b03e5Sespie	    (*pfile->cb.line_change)(pfile, result, pfile->state.parsing_args);
*c87b03e5Sespie	}
*c87b03e5Sespie
*c87b03e5Sespie      /* We don't skip tokens in directives.  */
*c87b03e5Sespie      if (pfile->state.in_directive)
*c87b03e5Sespie	break;
*c87b03e5Sespie
*c87b03e5Sespie      /* Outside a directive, invalidate controlling macros.  At file
*c87b03e5Sespie	 EOF, _cpp_lex_direct takes care of popping the buffer, so we never
*c87b03e5Sespie	 get here and MI optimisation works.  */
*c87b03e5Sespie      pfile->mi_valid = false;
*c87b03e5Sespie
*c87b03e5Sespie      if (!pfile->state.skipping || result->type == CPP_EOF)
*c87b03e5Sespie	break;
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  return result;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* A NUL terminates the current buffer.  For ISO preprocessing this is
*c87b03e5Sespie   EOF, but for traditional preprocessing it indicates we need a line
*c87b03e5Sespie   refill.  Returns TRUE to continue preprocessing a new buffer, FALSE
*c87b03e5Sespie   to return a CPP_EOF to the caller.  */
*c87b03e5Sespiestatic bool
*c87b03e5Sespiecontinue_after_nul (pfile)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie{
*c87b03e5Sespie  cpp_buffer *buffer = pfile->buffer;
*c87b03e5Sespie  bool more = false;
*c87b03e5Sespie
*c87b03e5Sespie  buffer->saved_flags = BOL;
*c87b03e5Sespie  if (CPP_OPTION (pfile, traditional))
*c87b03e5Sespie    {
*c87b03e5Sespie      if (pfile->state.in_directive)
*c87b03e5Sespie	return false;
*c87b03e5Sespie
*c87b03e5Sespie      _cpp_remove_overlay (pfile);
*c87b03e5Sespie      more = _cpp_read_logical_line_trad (pfile);
*c87b03e5Sespie      _cpp_overlay_buffer (pfile, pfile->out.base,
*c87b03e5Sespie			   pfile->out.cur - pfile->out.base);
*c87b03e5Sespie      pfile->line = pfile->out.first_line;
*c87b03e5Sespie    }
*c87b03e5Sespie  else
*c87b03e5Sespie    {
*c87b03e5Sespie      /* Stop parsing arguments with a CPP_EOF.  When we finally come
*c87b03e5Sespie	 back here, do the work of popping the buffer.  */
*c87b03e5Sespie      if (!pfile->state.parsing_args)
*c87b03e5Sespie	{
*c87b03e5Sespie	  if (buffer->cur != buffer->line_base)
*c87b03e5Sespie	    {
*c87b03e5Sespie	      /* Non-empty files should end in a newline.  Don't warn
*c87b03e5Sespie		 for command line and _Pragma buffers.  */
*c87b03e5Sespie	      handle_newline (pfile);
*c87b03e5Sespie	    }
*c87b03e5Sespie
*c87b03e5Sespie	  /* Similarly, finish an in-progress directive with CPP_EOF
*c87b03e5Sespie	     before popping the buffer.  */
*c87b03e5Sespie	  if (!pfile->state.in_directive && buffer->prev)
*c87b03e5Sespie	    {
*c87b03e5Sespie	      more = !buffer->return_at_eof;
*c87b03e5Sespie	      _cpp_pop_buffer (pfile);
*c87b03e5Sespie	    }
*c87b03e5Sespie	}
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  return more;
*c87b03e5Sespie}
*c87b03e5Sespie
/* Set result->type to THEN_TYPE if get_effective_char (pfile) returns
   CHAR; otherwise invoke BACKUP () and set result->type to ELSE_TYPE.
   Relies on `pfile' and `result' being in scope where it is expanded.
   The parameters are parenthesized so that any expression can be
   passed safely.  */
#define IF_NEXT_IS(CHAR, THEN_TYPE, ELSE_TYPE)	\
  do {						\
    if (get_effective_char (pfile) == (CHAR))	\
      result->type = (THEN_TYPE);		\
    else					\
      {						\
        BACKUP ();				\
        result->type = (ELSE_TYPE);		\
      }						\
  } while (0)
*c87b03e5Sespie
*c87b03e5Sespie/* Lex a token into pfile->cur_token, which is also incremented, to
*c87b03e5Sespie   get diagnostics pointing to the correct location.
*c87b03e5Sespie
*c87b03e5Sespie   Does not handle issues such as token lookahead, multiple-include
*c87b03e5Sespie   optimisation, directives, skipping etc.  This function is only
*c87b03e5Sespie   suitable for use by _cpp_lex_token, and in special cases like
*c87b03e5Sespie   lex_expansion_token which doesn't care for any of these issues.
*c87b03e5Sespie
*c87b03e5Sespie   When meeting a newline, returns CPP_EOF if parsing a directive,
*c87b03e5Sespie   otherwise returns to the start of the token buffer if permissible.
*c87b03e5Sespie   Returns the location of the lexed token.
*c87b03e5Sespie
*c87b03e5Sespie   The body is a single switch on the first character of the token,
*c87b03e5Sespie   which is re-entered through these labels:
*c87b03e5Sespie
*c87b03e5Sespie     fresh_line          reload the current buffer and move its
*c87b03e5Sespie                         saved_flags into the token's flags.
*c87b03e5Sespie     update_tokens_line  record pfile->line as the token's line.
*c87b03e5Sespie     skipped_white       read the next character and record the
*c87b03e5Sespie                         token's column.
*c87b03e5Sespie     trigraph            dispatch again on a character handed back
*c87b03e5Sespie                         by skip_escaped_newlines that is neither
*c87b03e5Sespie                         a question mark nor a backslash.
*c87b03e5Sespie     start_ident         lex an identifier; also reached for a
*c87b03e5Sespie                         dollar sign when dollars_in_ident is set.
*c87b03e5Sespie     random_char         produce a CPP_OTHER token that holds the
*c87b03e5Sespie                         character.
*c87b03e5Sespie
*c87b03e5Sespie   A comment is either skipped, in which case the token gets
*c87b03e5Sespie   PREV_WHITE and lexing continues at update_tokens_line, or, when
*c87b03e5Sespie   pfile->state.save_comments is set, returned as a token of its own
*c87b03e5Sespie   via save_comment.  */
*c87b03e5Sespiecpp_token *
*c87b03e5Sespie_cpp_lex_direct (pfile)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie{
*c87b03e5Sespie  cppchar_t c;
*c87b03e5Sespie  cpp_buffer *buffer;
*c87b03e5Sespie  const unsigned char *comment_start;
*c87b03e5Sespie  cpp_token *result = pfile->cur_token++;
*c87b03e5Sespie
*c87b03e5Sespie fresh_line:
*c87b03e5Sespie  buffer = pfile->buffer;
*c87b03e5Sespie  result->flags = buffer->saved_flags;
*c87b03e5Sespie  buffer->saved_flags = 0;
*c87b03e5Sespie update_tokens_line:
*c87b03e5Sespie  result->line = pfile->line;
*c87b03e5Sespie
*c87b03e5Sespie skipped_white:
*c87b03e5Sespie  c = *buffer->cur++;
*c87b03e5Sespie  result->col = CPP_BUF_COLUMN (buffer, buffer->cur);
*c87b03e5Sespie
*c87b03e5Sespie trigraph:
*c87b03e5Sespie  switch (c)
*c87b03e5Sespie    {
*c87b03e5Sespie    case ' ': case '\t': case '\f': case '\v': case '\0':
*c87b03e5Sespie      result->flags |= PREV_WHITE;
*c87b03e5Sespie      if (skip_whitespace (pfile, c))
*c87b03e5Sespie	goto skipped_white;
*c87b03e5Sespie
*c87b03e5Sespie      /* End of buffer.  Back up one character and let
*c87b03e5Sespie	 continue_after_nul decide whether lexing resumes on a fresh
*c87b03e5Sespie	 line or the caller gets CPP_EOF.  */
*c87b03e5Sespie      buffer->cur--;
*c87b03e5Sespie      if (continue_after_nul (pfile))
*c87b03e5Sespie	goto fresh_line;
*c87b03e5Sespie      result->type = CPP_EOF;
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case '\n': case '\r':
*c87b03e5Sespie      handle_newline (pfile);
*c87b03e5Sespie      buffer->saved_flags = BOL;
*c87b03e5Sespie      if (! pfile->state.in_directive)
*c87b03e5Sespie	{
*c87b03e5Sespie	  if (pfile->state.parsing_args == 2)
*c87b03e5Sespie	    buffer->saved_flags |= PREV_WHITE;
*c87b03e5Sespie	  if (!pfile->keep_tokens)
*c87b03e5Sespie	    {
*c87b03e5Sespie	      pfile->cur_run = &pfile->base_run;
*c87b03e5Sespie	      result = pfile->base_run.base;
*c87b03e5Sespie	      pfile->cur_token = result + 1;
*c87b03e5Sespie	    }
*c87b03e5Sespie	  goto fresh_line;
*c87b03e5Sespie	}
*c87b03e5Sespie      result->type = CPP_EOF;
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case '?':
*c87b03e5Sespie    case '\\':
*c87b03e5Sespie      /* These could start an escaped newline, or '?' a trigraph.  Let
*c87b03e5Sespie	 skip_escaped_newlines do all the work.  */
*c87b03e5Sespie      {
*c87b03e5Sespie	unsigned int line = pfile->line;
*c87b03e5Sespie
*c87b03e5Sespie	c = skip_escaped_newlines (pfile);
*c87b03e5Sespie	if (line != pfile->line)
*c87b03e5Sespie	  {
*c87b03e5Sespie	    buffer->cur--;
*c87b03e5Sespie	    /* We had at least one escaped newline of some sort.
*c87b03e5Sespie	       Update the token's line and column.  */
*c87b03e5Sespie	    goto update_tokens_line;
*c87b03e5Sespie	  }
*c87b03e5Sespie      }
*c87b03e5Sespie
*c87b03e5Sespie      /* We are either the original '?' or '\\', or a trigraph.  */
*c87b03e5Sespie      if (c == '?')
*c87b03e5Sespie	result->type = CPP_QUERY;
*c87b03e5Sespie      else if (c == '\\')
*c87b03e5Sespie	goto random_char;
*c87b03e5Sespie      else
*c87b03e5Sespie	goto trigraph;
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case '0': case '1': case '2': case '3': case '4':
*c87b03e5Sespie    case '5': case '6': case '7': case '8': case '9':
*c87b03e5Sespie      result->type = CPP_NUMBER;
*c87b03e5Sespie      parse_number (pfile, &result->val.str, 0);
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case 'L':
*c87b03e5Sespie      /* 'L' may introduce wide characters or strings.  */
*c87b03e5Sespie      {
*c87b03e5Sespie	const unsigned char *pos = buffer->cur;
*c87b03e5Sespie
*c87b03e5Sespie	c = get_effective_char (pfile);
*c87b03e5Sespie	if (c == '\'' || c == '"')
*c87b03e5Sespie	  {
*c87b03e5Sespie	    result->type = (c == '"' ? CPP_WSTRING: CPP_WCHAR);
*c87b03e5Sespie	    parse_string (pfile, result, c);
*c87b03e5Sespie	    break;
*c87b03e5Sespie	  }
*c87b03e5Sespie	buffer->cur = pos;
*c87b03e5Sespie      }
*c87b03e5Sespie      /* Fall through: with the read position restored, a plain 'L'
*c87b03e5Sespie	 is lexed as the start of an identifier.  */
*c87b03e5Sespie
*c87b03e5Sespie    start_ident:
*c87b03e5Sespie    case '_':
*c87b03e5Sespie    case 'a': case 'b': case 'c': case 'd': case 'e': case 'f':
*c87b03e5Sespie    case 'g': case 'h': case 'i': case 'j': case 'k': case 'l':
*c87b03e5Sespie    case 'm': case 'n': case 'o': case 'p': case 'q': case 'r':
*c87b03e5Sespie    case 's': case 't': case 'u': case 'v': case 'w': case 'x':
*c87b03e5Sespie    case 'y': case 'z':
*c87b03e5Sespie    case 'A': case 'B': case 'C': case 'D': case 'E': case 'F':
*c87b03e5Sespie    case 'G': case 'H': case 'I': case 'J': case 'K':
*c87b03e5Sespie    case 'M': case 'N': case 'O': case 'P': case 'Q': case 'R':
*c87b03e5Sespie    case 'S': case 'T': case 'U': case 'V': case 'W': case 'X':
*c87b03e5Sespie    case 'Y': case 'Z':
*c87b03e5Sespie      result->type = CPP_NAME;
*c87b03e5Sespie      result->val.node = parse_identifier (pfile);
*c87b03e5Sespie
*c87b03e5Sespie      /* Convert named operators to their proper types.  */
*c87b03e5Sespie      if (result->val.node->flags & NODE_OPERATOR)
*c87b03e5Sespie	{
*c87b03e5Sespie	  result->flags |= NAMED_OP;
*c87b03e5Sespie	  result->type = result->val.node->value.operator;
*c87b03e5Sespie	}
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case '\'':
*c87b03e5Sespie    case '"':
*c87b03e5Sespie      result->type = c == '"' ? CPP_STRING: CPP_CHAR;
*c87b03e5Sespie      parse_string (pfile, result, c);
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case '/':
*c87b03e5Sespie      /* A potential block or line comment.  */
*c87b03e5Sespie      comment_start = buffer->cur;
*c87b03e5Sespie      c = get_effective_char (pfile);
*c87b03e5Sespie
*c87b03e5Sespie      if (c == '*')
*c87b03e5Sespie	{
*c87b03e5Sespie	  if (skip_block_comment (pfile))
*c87b03e5Sespie	    cpp_error (pfile, DL_ERROR, "unterminated comment");
*c87b03e5Sespie	}
*c87b03e5Sespie      else if (c == '/' && (CPP_OPTION (pfile, cplusplus_comments)
*c87b03e5Sespie			    || CPP_IN_SYSTEM_HEADER (pfile)))
*c87b03e5Sespie	{
*c87b03e5Sespie	  /* Warn about comments only if pedantically GNUC89, and not
*c87b03e5Sespie	     in system headers.  */
*c87b03e5Sespie	  if (CPP_OPTION (pfile, lang) == CLK_GNUC89 && CPP_PEDANTIC (pfile)
*c87b03e5Sespie	      && ! buffer->warned_cplusplus_comments)
*c87b03e5Sespie	    {
*c87b03e5Sespie	      cpp_error (pfile, DL_PEDWARN,
*c87b03e5Sespie			 "C++ style comments are not allowed in ISO C90");
*c87b03e5Sespie	      cpp_error (pfile, DL_PEDWARN,
*c87b03e5Sespie			 "(this will be reported only once per input file)");
*c87b03e5Sespie	      buffer->warned_cplusplus_comments = 1;
*c87b03e5Sespie	    }
*c87b03e5Sespie
*c87b03e5Sespie	  if (skip_line_comment (pfile) && CPP_OPTION (pfile, warn_comments))
*c87b03e5Sespie	    cpp_error (pfile, DL_WARNING, "multi-line comment");
*c87b03e5Sespie	}
*c87b03e5Sespie      else if (c == '=')
*c87b03e5Sespie	{
*c87b03e5Sespie	  result->type = CPP_DIV_EQ;
*c87b03e5Sespie	  break;
*c87b03e5Sespie	}
*c87b03e5Sespie      else
*c87b03e5Sespie	{
*c87b03e5Sespie	  BACKUP ();
*c87b03e5Sespie	  result->type = CPP_DIV;
*c87b03e5Sespie	  break;
*c87b03e5Sespie	}
*c87b03e5Sespie
*c87b03e5Sespie      if (!pfile->state.save_comments)
*c87b03e5Sespie	{
*c87b03e5Sespie	  result->flags |= PREV_WHITE;
*c87b03e5Sespie	  goto update_tokens_line;
*c87b03e5Sespie	}
*c87b03e5Sespie
*c87b03e5Sespie      /* Save the comment as a token in its own right.  */
*c87b03e5Sespie      save_comment (pfile, result, comment_start, c);
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case '<':
*c87b03e5Sespie      if (pfile->state.angled_headers)
*c87b03e5Sespie	{
*c87b03e5Sespie	  result->type = CPP_HEADER_NAME;
*c87b03e5Sespie	  parse_string (pfile, result, '>');
*c87b03e5Sespie	  break;
*c87b03e5Sespie	}
*c87b03e5Sespie
*c87b03e5Sespie      c = get_effective_char (pfile);
*c87b03e5Sespie      if (c == '=')
*c87b03e5Sespie	result->type = CPP_LESS_EQ;
*c87b03e5Sespie      else if (c == '<')
*c87b03e5Sespie	IF_NEXT_IS ('=', CPP_LSHIFT_EQ, CPP_LSHIFT);
*c87b03e5Sespie      else if (c == '?' && CPP_OPTION (pfile, cplusplus))
*c87b03e5Sespie	IF_NEXT_IS ('=', CPP_MIN_EQ, CPP_MIN);
*c87b03e5Sespie      else if (c == ':' && CPP_OPTION (pfile, digraphs))
*c87b03e5Sespie	{
*c87b03e5Sespie	  result->type = CPP_OPEN_SQUARE;
*c87b03e5Sespie	  result->flags |= DIGRAPH;
*c87b03e5Sespie	}
*c87b03e5Sespie      else if (c == '%' && CPP_OPTION (pfile, digraphs))
*c87b03e5Sespie	{
*c87b03e5Sespie	  result->type = CPP_OPEN_BRACE;
*c87b03e5Sespie	  result->flags |= DIGRAPH;
*c87b03e5Sespie	}
*c87b03e5Sespie      else
*c87b03e5Sespie	{
*c87b03e5Sespie	  BACKUP ();
*c87b03e5Sespie	  result->type = CPP_LESS;
*c87b03e5Sespie	}
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case '>':
*c87b03e5Sespie      c = get_effective_char (pfile);
*c87b03e5Sespie      if (c == '=')
*c87b03e5Sespie	result->type = CPP_GREATER_EQ;
*c87b03e5Sespie      else if (c == '>')
*c87b03e5Sespie	IF_NEXT_IS ('=', CPP_RSHIFT_EQ, CPP_RSHIFT);
*c87b03e5Sespie      else if (c == '?' && CPP_OPTION (pfile, cplusplus))
*c87b03e5Sespie	IF_NEXT_IS ('=', CPP_MAX_EQ, CPP_MAX);
*c87b03e5Sespie      else
*c87b03e5Sespie	{
*c87b03e5Sespie	  BACKUP ();
*c87b03e5Sespie	  result->type = CPP_GREATER;
*c87b03e5Sespie	}
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case '%':
*c87b03e5Sespie      c = get_effective_char (pfile);
*c87b03e5Sespie      if (c == '=')
*c87b03e5Sespie	result->type = CPP_MOD_EQ;
*c87b03e5Sespie      else if (CPP_OPTION (pfile, digraphs) && c == ':')
*c87b03e5Sespie	{
*c87b03e5Sespie	  result->flags |= DIGRAPH;
*c87b03e5Sespie	  result->type = CPP_HASH;
*c87b03e5Sespie	  if (get_effective_char (pfile) == '%')
*c87b03e5Sespie	    {
*c87b03e5Sespie	      const unsigned char *pos = buffer->cur;
*c87b03e5Sespie
*c87b03e5Sespie	      if (get_effective_char (pfile) == ':')
*c87b03e5Sespie		result->type = CPP_PASTE;
*c87b03e5Sespie	      else
*c87b03e5Sespie		buffer->cur = pos - 1;
*c87b03e5Sespie	    }
*c87b03e5Sespie	  else
*c87b03e5Sespie	    BACKUP ();
*c87b03e5Sespie	}
*c87b03e5Sespie      else if (CPP_OPTION (pfile, digraphs) && c == '>')
*c87b03e5Sespie	{
*c87b03e5Sespie	  result->flags |= DIGRAPH;
*c87b03e5Sespie	  result->type = CPP_CLOSE_BRACE;
*c87b03e5Sespie	}
*c87b03e5Sespie      else
*c87b03e5Sespie	{
*c87b03e5Sespie	  BACKUP ();
*c87b03e5Sespie	  result->type = CPP_MOD;
*c87b03e5Sespie	}
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case '.':
*c87b03e5Sespie      result->type = CPP_DOT;
*c87b03e5Sespie      c = get_effective_char (pfile);
*c87b03e5Sespie      if (c == '.')
*c87b03e5Sespie	{
*c87b03e5Sespie	  const unsigned char *pos = buffer->cur;
*c87b03e5Sespie
*c87b03e5Sespie	  if (get_effective_char (pfile) == '.')
*c87b03e5Sespie	    result->type = CPP_ELLIPSIS;
*c87b03e5Sespie	  else
*c87b03e5Sespie	    buffer->cur = pos - 1;
*c87b03e5Sespie	}
*c87b03e5Sespie      /* All known character sets have 0...9 contiguous.  */
*c87b03e5Sespie      else if (ISDIGIT (c))
*c87b03e5Sespie	{
*c87b03e5Sespie	  result->type = CPP_NUMBER;
*c87b03e5Sespie	  parse_number (pfile, &result->val.str, 1);
*c87b03e5Sespie	}
*c87b03e5Sespie      else if (c == '*' && CPP_OPTION (pfile, cplusplus))
*c87b03e5Sespie	result->type = CPP_DOT_STAR;
*c87b03e5Sespie      else
*c87b03e5Sespie	BACKUP ();
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case '+':
*c87b03e5Sespie      c = get_effective_char (pfile);
*c87b03e5Sespie      if (c == '+')
*c87b03e5Sespie	result->type = CPP_PLUS_PLUS;
*c87b03e5Sespie      else if (c == '=')
*c87b03e5Sespie	result->type = CPP_PLUS_EQ;
*c87b03e5Sespie      else
*c87b03e5Sespie	{
*c87b03e5Sespie	  BACKUP ();
*c87b03e5Sespie	  result->type = CPP_PLUS;
*c87b03e5Sespie	}
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case '-':
*c87b03e5Sespie      c = get_effective_char (pfile);
*c87b03e5Sespie      if (c == '>')
*c87b03e5Sespie	{
*c87b03e5Sespie	  result->type = CPP_DEREF;
*c87b03e5Sespie	  if (CPP_OPTION (pfile, cplusplus))
*c87b03e5Sespie	    {
*c87b03e5Sespie	      if (get_effective_char (pfile) == '*')
*c87b03e5Sespie		result->type = CPP_DEREF_STAR;
*c87b03e5Sespie	      else
*c87b03e5Sespie		BACKUP ();
*c87b03e5Sespie	    }
*c87b03e5Sespie	}
*c87b03e5Sespie      else if (c == '-')
*c87b03e5Sespie	result->type = CPP_MINUS_MINUS;
*c87b03e5Sespie      else if (c == '=')
*c87b03e5Sespie	result->type = CPP_MINUS_EQ;
*c87b03e5Sespie      else
*c87b03e5Sespie	{
*c87b03e5Sespie	  BACKUP ();
*c87b03e5Sespie	  result->type = CPP_MINUS;
*c87b03e5Sespie	}
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case '&':
*c87b03e5Sespie      c = get_effective_char (pfile);
*c87b03e5Sespie      if (c == '&')
*c87b03e5Sespie	result->type = CPP_AND_AND;
*c87b03e5Sespie      else if (c == '=')
*c87b03e5Sespie	result->type = CPP_AND_EQ;
*c87b03e5Sespie      else
*c87b03e5Sespie	{
*c87b03e5Sespie	  BACKUP ();
*c87b03e5Sespie	  result->type = CPP_AND;
*c87b03e5Sespie	}
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case '|':
*c87b03e5Sespie      c = get_effective_char (pfile);
*c87b03e5Sespie      if (c == '|')
*c87b03e5Sespie	result->type = CPP_OR_OR;
*c87b03e5Sespie      else if (c == '=')
*c87b03e5Sespie	result->type = CPP_OR_EQ;
*c87b03e5Sespie      else
*c87b03e5Sespie	{
*c87b03e5Sespie	  BACKUP ();
*c87b03e5Sespie	  result->type = CPP_OR;
*c87b03e5Sespie	}
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case ':':
*c87b03e5Sespie      c = get_effective_char (pfile);
*c87b03e5Sespie      if (c == ':' && CPP_OPTION (pfile, cplusplus))
*c87b03e5Sespie	result->type = CPP_SCOPE;
*c87b03e5Sespie      else if (c == '>' && CPP_OPTION (pfile, digraphs))
*c87b03e5Sespie	{
*c87b03e5Sespie	  result->flags |= DIGRAPH;
*c87b03e5Sespie	  result->type = CPP_CLOSE_SQUARE;
*c87b03e5Sespie	}
*c87b03e5Sespie      else
*c87b03e5Sespie	{
*c87b03e5Sespie	  BACKUP ();
*c87b03e5Sespie	  result->type = CPP_COLON;
*c87b03e5Sespie	}
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case '*': IF_NEXT_IS ('=', CPP_MULT_EQ, CPP_MULT); break;
*c87b03e5Sespie    case '=': IF_NEXT_IS ('=', CPP_EQ_EQ, CPP_EQ); break;
*c87b03e5Sespie    case '!': IF_NEXT_IS ('=', CPP_NOT_EQ, CPP_NOT); break;
*c87b03e5Sespie    case '^': IF_NEXT_IS ('=', CPP_XOR_EQ, CPP_XOR); break;
*c87b03e5Sespie    case '#': IF_NEXT_IS ('#', CPP_PASTE, CPP_HASH); break;
*c87b03e5Sespie
*c87b03e5Sespie    case '~': result->type = CPP_COMPL; break;
*c87b03e5Sespie    case ',': result->type = CPP_COMMA; break;
*c87b03e5Sespie    case '(': result->type = CPP_OPEN_PAREN; break;
*c87b03e5Sespie    case ')': result->type = CPP_CLOSE_PAREN; break;
*c87b03e5Sespie    case '[': result->type = CPP_OPEN_SQUARE; break;
*c87b03e5Sespie    case ']': result->type = CPP_CLOSE_SQUARE; break;
*c87b03e5Sespie    case '{': result->type = CPP_OPEN_BRACE; break;
*c87b03e5Sespie    case '}': result->type = CPP_CLOSE_BRACE; break;
*c87b03e5Sespie    case ';': result->type = CPP_SEMICOLON; break;
*c87b03e5Sespie
*c87b03e5Sespie      /* @ is a punctuator in Objective-C.  */
*c87b03e5Sespie    case '@': result->type = CPP_ATSIGN; break;
*c87b03e5Sespie
*c87b03e5Sespie    case '$':
*c87b03e5Sespie      if (CPP_OPTION (pfile, dollars_in_ident))
*c87b03e5Sespie	goto start_ident;
*c87b03e5Sespie      /* Fall through...  */
*c87b03e5Sespie
*c87b03e5Sespie    random_char:
*c87b03e5Sespie    default:
*c87b03e5Sespie      result->type = CPP_OTHER;
*c87b03e5Sespie      result->val.c = c;
*c87b03e5Sespie      break;
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  return result;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* An upper bound on the number of bytes needed to spell TOKEN,
*c87b03e5Sespie   including preceding whitespace.  */
*c87b03e5Sespieunsigned int
*c87b03e5Sespiecpp_token_len (token)
*c87b03e5Sespie     const cpp_token *token;
*c87b03e5Sespie{
*c87b03e5Sespie  unsigned int len;
*c87b03e5Sespie
*c87b03e5Sespie  switch (TOKEN_SPELL (token))
*c87b03e5Sespie    {
*c87b03e5Sespie    default:		len = 0;				break;
*c87b03e5Sespie    case SPELL_NUMBER:
*c87b03e5Sespie    case SPELL_STRING:	len = token->val.str.len;		break;
*c87b03e5Sespie    case SPELL_IDENT:	len = NODE_LEN (token->val.node);	break;
*c87b03e5Sespie    }
*c87b03e5Sespie  /* 1 for whitespace, 4 for comment delimiters.  */
*c87b03e5Sespie  return len + 5;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Write the spelling of a token TOKEN to BUFFER.  The buffer must
*c87b03e5Sespie   already contain the enough space to hold the token's spelling.
*c87b03e5Sespie   Returns a pointer to the character after the last character
*c87b03e5Sespie   written.  */
*c87b03e5Sespieunsigned char *
*c87b03e5Sespiecpp_spell_token (pfile, token, buffer)
*c87b03e5Sespie     cpp_reader *pfile;		/* Would be nice to be rid of this...  */
*c87b03e5Sespie     const cpp_token *token;
*c87b03e5Sespie     unsigned char *buffer;
*c87b03e5Sespie{
*c87b03e5Sespie  switch (TOKEN_SPELL (token))
*c87b03e5Sespie    {
*c87b03e5Sespie    case SPELL_OPERATOR:
*c87b03e5Sespie      {
*c87b03e5Sespie	const unsigned char *spelling;
*c87b03e5Sespie	unsigned char c;
*c87b03e5Sespie
*c87b03e5Sespie	if (token->flags & DIGRAPH)
*c87b03e5Sespie	  spelling
*c87b03e5Sespie	    = digraph_spellings[(int) token->type - (int) CPP_FIRST_DIGRAPH];
*c87b03e5Sespie	else if (token->flags & NAMED_OP)
*c87b03e5Sespie	  goto spell_ident;
*c87b03e5Sespie	else
*c87b03e5Sespie	  spelling = TOKEN_NAME (token);
*c87b03e5Sespie
*c87b03e5Sespie	while ((c = *spelling++) != '\0')
*c87b03e5Sespie	  *buffer++ = c;
*c87b03e5Sespie      }
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case SPELL_CHAR:
*c87b03e5Sespie      *buffer++ = token->val.c;
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    spell_ident:
*c87b03e5Sespie    case SPELL_IDENT:
*c87b03e5Sespie      memcpy (buffer, NODE_NAME (token->val.node), NODE_LEN (token->val.node));
*c87b03e5Sespie      buffer += NODE_LEN (token->val.node);
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case SPELL_NUMBER:
*c87b03e5Sespie      memcpy (buffer, token->val.str.text, token->val.str.len);
*c87b03e5Sespie      buffer += token->val.str.len;
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case SPELL_STRING:
*c87b03e5Sespie      {
*c87b03e5Sespie	int left, right, tag;
*c87b03e5Sespie	switch (token->type)
*c87b03e5Sespie	  {
*c87b03e5Sespie	  case CPP_STRING:	left = '"';  right = '"';  tag = '\0'; break;
*c87b03e5Sespie	  case CPP_WSTRING:	left = '"';  right = '"';  tag = 'L';  break;
*c87b03e5Sespie	  case CPP_CHAR:	left = '\''; right = '\''; tag = '\0'; break;
*c87b03e5Sespie    	  case CPP_WCHAR:	left = '\''; right = '\''; tag = 'L';  break;
*c87b03e5Sespie	  case CPP_HEADER_NAME:	left = '<';  right = '>';  tag = '\0'; break;
*c87b03e5Sespie	  default:
*c87b03e5Sespie	    cpp_error (pfile, DL_ICE, "unknown string token %s\n",
*c87b03e5Sespie		       TOKEN_NAME (token));
*c87b03e5Sespie	    return buffer;
*c87b03e5Sespie	  }
*c87b03e5Sespie	if (tag) *buffer++ = tag;
*c87b03e5Sespie	*buffer++ = left;
*c87b03e5Sespie	memcpy (buffer, token->val.str.text, token->val.str.len);
*c87b03e5Sespie	buffer += token->val.str.len;
*c87b03e5Sespie	*buffer++ = right;
*c87b03e5Sespie      }
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case SPELL_NONE:
*c87b03e5Sespie      cpp_error (pfile, DL_ICE, "unspellable token %s", TOKEN_NAME (token));
*c87b03e5Sespie      break;
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  return buffer;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Returns TOKEN spelt as a null-terminated string.  The string is
*c87b03e5Sespie   freed when the reader is destroyed.  Useful for diagnostics.  */
*c87b03e5Sespieunsigned char *
*c87b03e5Sespiecpp_token_as_text (pfile, token)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie     const cpp_token *token;
*c87b03e5Sespie{
*c87b03e5Sespie  unsigned int len = cpp_token_len (token);
*c87b03e5Sespie  unsigned char *start = _cpp_unaligned_alloc (pfile, len), *end;
*c87b03e5Sespie
*c87b03e5Sespie  end = cpp_spell_token (pfile, token, start);
*c87b03e5Sespie  end[0] = '\0';
*c87b03e5Sespie
*c87b03e5Sespie  return start;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Used by C front ends, which really should move to using
*c87b03e5Sespie   cpp_token_as_text.  */
*c87b03e5Sespieconst char *
*c87b03e5Sespiecpp_type2name (type)
*c87b03e5Sespie     enum cpp_ttype type;
*c87b03e5Sespie{
*c87b03e5Sespie  return (const char *) token_spellings[type].name;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Writes the spelling of token to FP, without any preceding space.
*c87b03e5Sespie   Separated from cpp_spell_token for efficiency - to avoid stdio
*c87b03e5Sespie   double-buffering.  */
*c87b03e5Sespievoid
*c87b03e5Sespiecpp_output_token (token, fp)
*c87b03e5Sespie     const cpp_token *token;
*c87b03e5Sespie     FILE *fp;
*c87b03e5Sespie{
*c87b03e5Sespie  switch (TOKEN_SPELL (token))
*c87b03e5Sespie    {
*c87b03e5Sespie    case SPELL_OPERATOR:
*c87b03e5Sespie      {
*c87b03e5Sespie	const unsigned char *spelling;
*c87b03e5Sespie	int c;
*c87b03e5Sespie
*c87b03e5Sespie	if (token->flags & DIGRAPH)
*c87b03e5Sespie	  spelling
*c87b03e5Sespie	    = digraph_spellings[(int) token->type - (int) CPP_FIRST_DIGRAPH];
*c87b03e5Sespie	else if (token->flags & NAMED_OP)
*c87b03e5Sespie	  goto spell_ident;
*c87b03e5Sespie	else
*c87b03e5Sespie	  spelling = TOKEN_NAME (token);
*c87b03e5Sespie
*c87b03e5Sespie	c = *spelling;
*c87b03e5Sespie	do
*c87b03e5Sespie	  putc (c, fp);
*c87b03e5Sespie	while ((c = *++spelling) != '\0');
*c87b03e5Sespie      }
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case SPELL_CHAR:
*c87b03e5Sespie      putc (token->val.c, fp);
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    spell_ident:
*c87b03e5Sespie    case SPELL_IDENT:
*c87b03e5Sespie      fwrite (NODE_NAME (token->val.node), 1, NODE_LEN (token->val.node), fp);
*c87b03e5Sespie    break;
*c87b03e5Sespie
*c87b03e5Sespie    case SPELL_NUMBER:
*c87b03e5Sespie      fwrite (token->val.str.text, 1, token->val.str.len, fp);
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case SPELL_STRING:
*c87b03e5Sespie      {
*c87b03e5Sespie	int left, right, tag;
*c87b03e5Sespie	switch (token->type)
*c87b03e5Sespie	  {
*c87b03e5Sespie	  case CPP_STRING:	left = '"';  right = '"';  tag = '\0'; break;
*c87b03e5Sespie	  case CPP_WSTRING:	left = '"';  right = '"';  tag = 'L';  break;
*c87b03e5Sespie	  case CPP_CHAR:	left = '\''; right = '\''; tag = '\0'; break;
*c87b03e5Sespie    	  case CPP_WCHAR:	left = '\''; right = '\''; tag = 'L';  break;
*c87b03e5Sespie	  case CPP_HEADER_NAME:	left = '<';  right = '>';  tag = '\0'; break;
*c87b03e5Sespie	  default:
*c87b03e5Sespie	    fprintf (stderr, "impossible STRING token %s\n", TOKEN_NAME (token));
*c87b03e5Sespie	    return;
*c87b03e5Sespie	  }
*c87b03e5Sespie	if (tag) putc (tag, fp);
*c87b03e5Sespie	putc (left, fp);
*c87b03e5Sespie	fwrite (token->val.str.text, 1, token->val.str.len, fp);
*c87b03e5Sespie	putc (right, fp);
*c87b03e5Sespie      }
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case SPELL_NONE:
*c87b03e5Sespie      /* An error, most probably.  */
*c87b03e5Sespie      break;
*c87b03e5Sespie    }
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Compare two tokens.  */
*c87b03e5Sespieint
*c87b03e5Sespie_cpp_equiv_tokens (a, b)
*c87b03e5Sespie     const cpp_token *a, *b;
*c87b03e5Sespie{
*c87b03e5Sespie  if (a->type == b->type && a->flags == b->flags)
*c87b03e5Sespie    switch (TOKEN_SPELL (a))
*c87b03e5Sespie      {
*c87b03e5Sespie      default:			/* Keep compiler happy.  */
*c87b03e5Sespie      case SPELL_OPERATOR:
*c87b03e5Sespie	return 1;
*c87b03e5Sespie      case SPELL_CHAR:
*c87b03e5Sespie	return a->val.c == b->val.c; /* Character.  */
*c87b03e5Sespie      case SPELL_NONE:
*c87b03e5Sespie	return (a->type != CPP_MACRO_ARG || a->val.arg_no == b->val.arg_no);
*c87b03e5Sespie      case SPELL_IDENT:
*c87b03e5Sespie	return a->val.node == b->val.node;
*c87b03e5Sespie      case SPELL_NUMBER:
*c87b03e5Sespie      case SPELL_STRING:
*c87b03e5Sespie	return (a->val.str.len == b->val.str.len
*c87b03e5Sespie		&& !memcmp (a->val.str.text, b->val.str.text,
*c87b03e5Sespie			    a->val.str.len));
*c87b03e5Sespie      }
*c87b03e5Sespie
*c87b03e5Sespie  return 0;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Returns nonzero if a space should be inserted to avoid an
*c87b03e5Sespie   accidental token paste for output.  For simplicity, it is
*c87b03e5Sespie   conservative, and occasionally advises a space where one is not
*c87b03e5Sespie   needed, e.g. "." and ".2".  */
*c87b03e5Sespieint
*c87b03e5Sespiecpp_avoid_paste (pfile, token1, token2)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie     const cpp_token *token1, *token2;
*c87b03e5Sespie{
*c87b03e5Sespie  enum cpp_ttype a = token1->type, b = token2->type;
*c87b03e5Sespie  cppchar_t c;
*c87b03e5Sespie
*c87b03e5Sespie  if (token1->flags & NAMED_OP)
*c87b03e5Sespie    a = CPP_NAME;
*c87b03e5Sespie  if (token2->flags & NAMED_OP)
*c87b03e5Sespie    b = CPP_NAME;
*c87b03e5Sespie
*c87b03e5Sespie  c = EOF;
*c87b03e5Sespie  if (token2->flags & DIGRAPH)
*c87b03e5Sespie    c = digraph_spellings[(int) b - (int) CPP_FIRST_DIGRAPH][0];
*c87b03e5Sespie  else if (token_spellings[b].category == SPELL_OPERATOR)
*c87b03e5Sespie    c = token_spellings[b].name[0];
*c87b03e5Sespie
*c87b03e5Sespie  /* Quickly get everything that can paste with an '='.  */
*c87b03e5Sespie  if ((int) a <= (int) CPP_LAST_EQ && c == '=')
*c87b03e5Sespie    return 1;
*c87b03e5Sespie
*c87b03e5Sespie  switch (a)
*c87b03e5Sespie    {
*c87b03e5Sespie    case CPP_GREATER:	return c == '>' || c == '?';
*c87b03e5Sespie    case CPP_LESS:	return c == '<' || c == '?' || c == '%' || c == ':';
*c87b03e5Sespie    case CPP_PLUS:	return c == '+';
*c87b03e5Sespie    case CPP_MINUS:	return c == '-' || c == '>';
*c87b03e5Sespie    case CPP_DIV:	return c == '/' || c == '*'; /* Comments.  */
*c87b03e5Sespie    case CPP_MOD:	return c == ':' || c == '>';
*c87b03e5Sespie    case CPP_AND:	return c == '&';
*c87b03e5Sespie    case CPP_OR:	return c == '|';
*c87b03e5Sespie    case CPP_COLON:	return c == ':' || c == '>';
*c87b03e5Sespie    case CPP_DEREF:	return c == '*';
*c87b03e5Sespie    case CPP_DOT:	return c == '.' || c == '%' || b == CPP_NUMBER;
*c87b03e5Sespie    case CPP_HASH:	return c == '#' || c == '%'; /* Digraph form.  */
*c87b03e5Sespie    case CPP_NAME:	return ((b == CPP_NUMBER
*c87b03e5Sespie				 && name_p (pfile, &token2->val.str))
*c87b03e5Sespie				|| b == CPP_NAME
*c87b03e5Sespie				|| b == CPP_CHAR || b == CPP_STRING); /* L */
*c87b03e5Sespie    case CPP_NUMBER:	return (b == CPP_NUMBER || b == CPP_NAME
*c87b03e5Sespie				|| c == '.' || c == '+' || c == '-');
*c87b03e5Sespie    case CPP_OTHER:	return (CPP_OPTION (pfile, objc)
*c87b03e5Sespie				&& token1->val.c == '@'
*c87b03e5Sespie				&& (b == CPP_NAME || b == CPP_STRING));
*c87b03e5Sespie    default:		break;
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  return 0;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Output all the remaining tokens on the current line, and a newline
*c87b03e5Sespie   character, to FP.  Leading whitespace is removed.  If there are
*c87b03e5Sespie   macros, special token padding is not performed.  */
*c87b03e5Sespievoid
*c87b03e5Sespiecpp_output_line (pfile, fp)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie     FILE *fp;
*c87b03e5Sespie{
*c87b03e5Sespie  const cpp_token *token;
*c87b03e5Sespie
*c87b03e5Sespie  token = cpp_get_token (pfile);
*c87b03e5Sespie  while (token->type != CPP_EOF)
*c87b03e5Sespie    {
*c87b03e5Sespie      cpp_output_token (token, fp);
*c87b03e5Sespie      token = cpp_get_token (pfile);
*c87b03e5Sespie      if (token->flags & PREV_WHITE)
*c87b03e5Sespie	putc (' ', fp);
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  putc ('\n', fp);
*c87b03e5Sespie}
*c87b03e5Sespie
/* Returns the value of the hexadecimal digit C, as reported by
   hex_value.  Aborts if hex_p says that C is not a hexadecimal
   digit.  */
static unsigned int
hex_digit_value (c)
     unsigned int c;
{
  if (!hex_p (c))
    abort ();

  return hex_value (c);
}
*c87b03e5Sespie
*c87b03e5Sespie/* Parse a '\uNNNN' or '\UNNNNNNNN' sequence.  Returns 1 to indicate
*c87b03e5Sespie   failure if cpplib is not parsing C++ or C99.  Such failure is
*c87b03e5Sespie   silent, and no variables are updated.  Otherwise returns 0, and
*c87b03e5Sespie   warns if -Wtraditional.
*c87b03e5Sespie
*c87b03e5Sespie   [lex.charset]: The character designated by the universal character
*c87b03e5Sespie   name \UNNNNNNNN is that character whose character short name in
*c87b03e5Sespie   ISO/IEC 10646 is NNNNNNNN; the character designated by the
*c87b03e5Sespie   universal character name \uNNNN is that character whose character
*c87b03e5Sespie   short name in ISO/IEC 10646 is 0000NNNN.  If the hexadecimal value
*c87b03e5Sespie   for a universal character name is less than 0x20 or in the range
*c87b03e5Sespie   0x7F-0x9F (inclusive), or if the universal character name
*c87b03e5Sespie   designates a character in the basic source character set, then the
*c87b03e5Sespie   program is ill-formed.
*c87b03e5Sespie
*c87b03e5Sespie   We assume that wchar_t is Unicode, so we don't need to do any
*c87b03e5Sespie   mapping.  Is this ever wrong?
*c87b03e5Sespie
*c87b03e5Sespie   PC points to the 'u' or 'U', PSTR is points to the byte after PC,
*c87b03e5Sespie   LIMIT is the end of the string or charconst.  PSTR is updated to
*c87b03e5Sespie   point after the UCS on return, and the UCS is written into PC.  */
*c87b03e5Sespie
*c87b03e5Sespiestatic int
*c87b03e5Sespiemaybe_read_ucs (pfile, pstr, limit, pc)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie     const unsigned char **pstr;
*c87b03e5Sespie     const unsigned char *limit;
*c87b03e5Sespie     cppchar_t *pc;
*c87b03e5Sespie{
*c87b03e5Sespie  const unsigned char *p = *pstr;
*c87b03e5Sespie  unsigned int code = 0;
*c87b03e5Sespie  unsigned int c = *pc, length;
*c87b03e5Sespie
*c87b03e5Sespie  /* Only attempt to interpret a UCS for C++ and C99.  */
*c87b03e5Sespie  if (! (CPP_OPTION (pfile, cplusplus) || CPP_OPTION (pfile, c99)))
*c87b03e5Sespie    return 1;
*c87b03e5Sespie
*c87b03e5Sespie  if (CPP_WTRADITIONAL (pfile))
*c87b03e5Sespie    cpp_error (pfile, DL_WARNING,
*c87b03e5Sespie	       "the meaning of '\\%c' is different in traditional C", c);
*c87b03e5Sespie
*c87b03e5Sespie  length = (c == 'u' ? 4: 8);
*c87b03e5Sespie
*c87b03e5Sespie  if ((size_t) (limit - p) < length)
*c87b03e5Sespie    {
*c87b03e5Sespie      cpp_error (pfile, DL_ERROR, "incomplete universal-character-name");
*c87b03e5Sespie      /* Skip to the end to avoid more diagnostics.  */
*c87b03e5Sespie      p = limit;
*c87b03e5Sespie    }
*c87b03e5Sespie  else
*c87b03e5Sespie    {
*c87b03e5Sespie      for (; length; length--, p++)
*c87b03e5Sespie	{
*c87b03e5Sespie	  c = *p;
*c87b03e5Sespie	  if (ISXDIGIT (c))
*c87b03e5Sespie	    code = (code << 4) + hex_digit_value (c);
*c87b03e5Sespie	  else
*c87b03e5Sespie	    {
*c87b03e5Sespie	      cpp_error (pfile, DL_ERROR,
*c87b03e5Sespie			 "non-hex digit '%c' in universal-character-name", c);
*c87b03e5Sespie	      /* We shouldn't skip in case there are multibyte chars.  */
*c87b03e5Sespie	      break;
*c87b03e5Sespie	    }
*c87b03e5Sespie	}
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie#ifdef TARGET_EBCDIC
*c87b03e5Sespie  cpp_error (pfile, DL_ERROR, "universal-character-name on EBCDIC target");
*c87b03e5Sespie  code = 0x3f;  /* EBCDIC invalid character */
*c87b03e5Sespie#else
*c87b03e5Sespie /* True extended characters are OK.  */
*c87b03e5Sespie  if (code >= 0xa0
*c87b03e5Sespie      && !(code & 0x80000000)
*c87b03e5Sespie      && !(code >= 0xD800 && code <= 0xDFFF))
*c87b03e5Sespie    ;
*c87b03e5Sespie  /* The standard permits $, @ and ` to be specified as UCNs.  We use
*c87b03e5Sespie     hex escapes so that this also works with EBCDIC hosts.  */
*c87b03e5Sespie  else if (code == 0x24 || code == 0x40 || code == 0x60)
*c87b03e5Sespie    ;
*c87b03e5Sespie  /* Don't give another error if one occurred above.  */
*c87b03e5Sespie  else if (length == 0)
*c87b03e5Sespie    cpp_error (pfile, DL_ERROR, "universal-character-name out of range");
*c87b03e5Sespie#endif
*c87b03e5Sespie
*c87b03e5Sespie  *pstr = p;
*c87b03e5Sespie  *pc = code;
*c87b03e5Sespie  return 0;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Returns the value of an escape sequence, truncated to the correct
*c87b03e5Sespie   target precision.  PSTR points to the input pointer, which is just
*c87b03e5Sespie   after the backslash.  LIMIT is how much text we have.  WIDE is true
*c87b03e5Sespie   if the escape sequence is part of a wide character constant or
*c87b03e5Sespie   string literal.  Handles all relevant diagnostics.  */
*c87b03e5Sespiecppchar_t
*c87b03e5Sespiecpp_parse_escape (pfile, pstr, limit, wide)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie     const unsigned char **pstr;
*c87b03e5Sespie     const unsigned char *limit;
*c87b03e5Sespie     int wide;
*c87b03e5Sespie{
*c87b03e5Sespie  int unknown = 0;
*c87b03e5Sespie  const unsigned char *str = *pstr;
*c87b03e5Sespie  cppchar_t c, mask;
*c87b03e5Sespie  unsigned int width;
*c87b03e5Sespie
*c87b03e5Sespie  if (wide)
*c87b03e5Sespie    width = CPP_OPTION (pfile, wchar_precision);
*c87b03e5Sespie  else
*c87b03e5Sespie    width = CPP_OPTION (pfile, char_precision);
*c87b03e5Sespie  if (width < BITS_PER_CPPCHAR_T)
*c87b03e5Sespie    mask = ((cppchar_t) 1 << width) - 1;
*c87b03e5Sespie  else
*c87b03e5Sespie    mask = ~0;
*c87b03e5Sespie
*c87b03e5Sespie  c = *str++;
*c87b03e5Sespie  switch (c)
*c87b03e5Sespie    {
*c87b03e5Sespie    case '\\': case '\'': case '"': case '?': break;
*c87b03e5Sespie    case 'b': c = TARGET_BS;	  break;
*c87b03e5Sespie    case 'f': c = TARGET_FF;	  break;
*c87b03e5Sespie    case 'n': c = TARGET_NEWLINE; break;
*c87b03e5Sespie    case 'r': c = TARGET_CR;	  break;
*c87b03e5Sespie    case 't': c = TARGET_TAB;	  break;
*c87b03e5Sespie    case 'v': c = TARGET_VT;	  break;
*c87b03e5Sespie
*c87b03e5Sespie    case '(': case '{': case '[': case '%':
*c87b03e5Sespie      /* '\(', etc, are used at beginning of line to avoid confusing Emacs.
*c87b03e5Sespie	 '\%' is used to prevent SCCS from getting confused.  */
*c87b03e5Sespie      unknown = CPP_PEDANTIC (pfile);
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case 'a':
*c87b03e5Sespie      if (CPP_WTRADITIONAL (pfile))
*c87b03e5Sespie	cpp_error (pfile, DL_WARNING,
*c87b03e5Sespie		   "the meaning of '\\a' is different in traditional C");
*c87b03e5Sespie      c = TARGET_BELL;
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case 'e': case 'E':
*c87b03e5Sespie      if (CPP_PEDANTIC (pfile))
*c87b03e5Sespie	cpp_error (pfile, DL_PEDWARN,
*c87b03e5Sespie		   "non-ISO-standard escape sequence, '\\%c'", (int) c);
*c87b03e5Sespie      c = TARGET_ESC;
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case 'u': case 'U':
*c87b03e5Sespie      unknown = maybe_read_ucs (pfile, &str, limit, &c);
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case 'x':
*c87b03e5Sespie      if (CPP_WTRADITIONAL (pfile))
*c87b03e5Sespie	cpp_error (pfile, DL_WARNING,
*c87b03e5Sespie		   "the meaning of '\\x' is different in traditional C");
*c87b03e5Sespie
*c87b03e5Sespie      {
*c87b03e5Sespie	cppchar_t i = 0, overflow = 0;
*c87b03e5Sespie	int digits_found = 0;
*c87b03e5Sespie
*c87b03e5Sespie	while (str < limit)
*c87b03e5Sespie	  {
*c87b03e5Sespie	    c = *str;
*c87b03e5Sespie	    if (! ISXDIGIT (c))
*c87b03e5Sespie	      break;
*c87b03e5Sespie	    str++;
*c87b03e5Sespie	    overflow |= i ^ (i << 4 >> 4);
*c87b03e5Sespie	    i = (i << 4) + hex_digit_value (c);
*c87b03e5Sespie	    digits_found = 1;
*c87b03e5Sespie	  }
*c87b03e5Sespie
*c87b03e5Sespie	if (!digits_found)
*c87b03e5Sespie	  cpp_error (pfile, DL_ERROR,
*c87b03e5Sespie		       "\\x used with no following hex digits");
*c87b03e5Sespie
*c87b03e5Sespie	if (overflow | (i != (i & mask)))
*c87b03e5Sespie	  {
*c87b03e5Sespie	    cpp_error (pfile, DL_PEDWARN,
*c87b03e5Sespie		       "hex escape sequence out of range");
*c87b03e5Sespie	    i &= mask;
*c87b03e5Sespie	  }
*c87b03e5Sespie	c = i;
*c87b03e5Sespie      }
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    case '0':  case '1':  case '2':  case '3':
*c87b03e5Sespie    case '4':  case '5':  case '6':  case '7':
*c87b03e5Sespie      {
*c87b03e5Sespie	size_t count = 0;
*c87b03e5Sespie	cppchar_t i = c - '0';
*c87b03e5Sespie
*c87b03e5Sespie	while (str < limit && ++count < 3)
*c87b03e5Sespie	  {
*c87b03e5Sespie	    c = *str;
*c87b03e5Sespie	    if (c < '0' || c > '7')
*c87b03e5Sespie	      break;
*c87b03e5Sespie	    str++;
*c87b03e5Sespie	    i = (i << 3) + c - '0';
*c87b03e5Sespie	  }
*c87b03e5Sespie
*c87b03e5Sespie	if (i != (i & mask))
*c87b03e5Sespie	  {
*c87b03e5Sespie	    cpp_error (pfile, DL_PEDWARN,
*c87b03e5Sespie		       "octal escape sequence out of range");
*c87b03e5Sespie	    i &= mask;
*c87b03e5Sespie	  }
*c87b03e5Sespie	c = i;
*c87b03e5Sespie      }
*c87b03e5Sespie      break;
*c87b03e5Sespie
*c87b03e5Sespie    default:
*c87b03e5Sespie      unknown = 1;
*c87b03e5Sespie      break;
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  if (unknown)
*c87b03e5Sespie    {
*c87b03e5Sespie      if (ISGRAPH (c))
*c87b03e5Sespie	cpp_error (pfile, DL_PEDWARN,
*c87b03e5Sespie		   "unknown escape sequence '\\%c'", (int) c);
*c87b03e5Sespie      else
*c87b03e5Sespie	cpp_error (pfile, DL_PEDWARN,
*c87b03e5Sespie		   "unknown escape sequence: '\\%03o'", (int) c);
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  if (c > mask)
*c87b03e5Sespie    {
*c87b03e5Sespie      cpp_error (pfile, DL_PEDWARN, "escape sequence out of range for its type");
*c87b03e5Sespie      c &= mask;
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  *pstr = str;
*c87b03e5Sespie  return c;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Interpret a (possibly wide) character constant in TOKEN.
*c87b03e5Sespie   WARN_MULTI warns about multi-character charconsts.  PCHARS_SEEN
*c87b03e5Sespie   points to a variable that is filled in with the number of
*c87b03e5Sespie   characters seen, and UNSIGNEDP to a variable that indicates whether
*c87b03e5Sespie   the result has signed type.  */
*c87b03e5Sespiecppchar_t
*c87b03e5Sespiecpp_interpret_charconst (pfile, token, pchars_seen, unsignedp)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie     const cpp_token *token;
*c87b03e5Sespie     unsigned int *pchars_seen;
*c87b03e5Sespie     int *unsignedp;
*c87b03e5Sespie{
*c87b03e5Sespie  const unsigned char *str = token->val.str.text;
*c87b03e5Sespie  const unsigned char *limit = str + token->val.str.len;
*c87b03e5Sespie  unsigned int chars_seen = 0;
*c87b03e5Sespie  size_t width, max_chars;
*c87b03e5Sespie  cppchar_t c, mask, result = 0;
*c87b03e5Sespie  bool unsigned_p;
*c87b03e5Sespie
*c87b03e5Sespie#ifdef MULTIBYTE_CHARS
*c87b03e5Sespie  (void) local_mbtowc (NULL, NULL, 0);
*c87b03e5Sespie#endif
*c87b03e5Sespie
*c87b03e5Sespie  /* Width in bits.  */
*c87b03e5Sespie  if (token->type == CPP_CHAR)
*c87b03e5Sespie    {
*c87b03e5Sespie      width = CPP_OPTION (pfile, char_precision);
*c87b03e5Sespie      max_chars = CPP_OPTION (pfile, int_precision) / width;
*c87b03e5Sespie      unsigned_p = CPP_OPTION (pfile, unsigned_char);
*c87b03e5Sespie    }
*c87b03e5Sespie  else
*c87b03e5Sespie    {
*c87b03e5Sespie      width = CPP_OPTION (pfile, wchar_precision);
*c87b03e5Sespie      max_chars = 1;
*c87b03e5Sespie      unsigned_p = CPP_OPTION (pfile, unsigned_wchar);
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  if (width < BITS_PER_CPPCHAR_T)
*c87b03e5Sespie    mask = ((cppchar_t) 1 << width) - 1;
*c87b03e5Sespie  else
*c87b03e5Sespie    mask = ~0;
*c87b03e5Sespie
*c87b03e5Sespie  while (str < limit)
*c87b03e5Sespie    {
*c87b03e5Sespie#ifdef MULTIBYTE_CHARS
*c87b03e5Sespie      wchar_t wc;
*c87b03e5Sespie      int char_len;
*c87b03e5Sespie
*c87b03e5Sespie      char_len = local_mbtowc (&wc, str, limit - str);
*c87b03e5Sespie      if (char_len == -1)
*c87b03e5Sespie	{
*c87b03e5Sespie	  cpp_error (pfile, DL_WARNING,
*c87b03e5Sespie		     "ignoring invalid multibyte character");
*c87b03e5Sespie	  c = *str++;
*c87b03e5Sespie	}
*c87b03e5Sespie      else
*c87b03e5Sespie	{
*c87b03e5Sespie	  str += char_len;
*c87b03e5Sespie	  c = wc;
*c87b03e5Sespie	}
*c87b03e5Sespie#else
*c87b03e5Sespie      c = *str++;
*c87b03e5Sespie#endif
*c87b03e5Sespie
*c87b03e5Sespie      if (c == '\\')
*c87b03e5Sespie	c = cpp_parse_escape (pfile, &str, limit, token->type == CPP_WCHAR);
*c87b03e5Sespie
*c87b03e5Sespie#ifdef MAP_CHARACTER
*c87b03e5Sespie      if (ISPRINT (c))
*c87b03e5Sespie	c = MAP_CHARACTER (c);
*c87b03e5Sespie#endif
*c87b03e5Sespie
*c87b03e5Sespie      chars_seen++;
*c87b03e5Sespie
*c87b03e5Sespie      /* Truncate the character, scale the result and merge the two.  */
*c87b03e5Sespie      c &= mask;
*c87b03e5Sespie      if (width < BITS_PER_CPPCHAR_T)
*c87b03e5Sespie	result = (result << width) | c;
*c87b03e5Sespie      else
*c87b03e5Sespie	result = c;
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  if (chars_seen == 0)
*c87b03e5Sespie    cpp_error (pfile, DL_ERROR, "empty character constant");
*c87b03e5Sespie  else if (chars_seen > 1)
*c87b03e5Sespie    {
*c87b03e5Sespie      /* Multichar charconsts are of type int and therefore signed.  */
*c87b03e5Sespie      unsigned_p = 0;
*c87b03e5Sespie
*c87b03e5Sespie      if (chars_seen > max_chars)
*c87b03e5Sespie	{
*c87b03e5Sespie	  chars_seen = max_chars;
*c87b03e5Sespie	  cpp_error (pfile, DL_WARNING,
*c87b03e5Sespie		     "character constant too long for its type");
*c87b03e5Sespie	}
*c87b03e5Sespie      else if (CPP_OPTION (pfile, warn_multichar))
*c87b03e5Sespie	cpp_error (pfile, DL_WARNING, "multi-character character constant");
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  /* Sign-extend or truncate the constant to cppchar_t.  The value is
*c87b03e5Sespie     in WIDTH bits, but for multi-char charconsts it's value is the
*c87b03e5Sespie     full target type's width.  */
*c87b03e5Sespie  if (chars_seen > 1)
*c87b03e5Sespie    width *= max_chars;
*c87b03e5Sespie  if (width < BITS_PER_CPPCHAR_T)
*c87b03e5Sespie    {
*c87b03e5Sespie      mask = ((cppchar_t) 1 << width) - 1;
*c87b03e5Sespie      if (unsigned_p || !(result & (1 << (width - 1))))
*c87b03e5Sespie	result &= mask;
*c87b03e5Sespie      else
*c87b03e5Sespie	result |= ~mask;
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  *pchars_seen = chars_seen;
*c87b03e5Sespie  *unsignedp = unsigned_p;
*c87b03e5Sespie  return result;
*c87b03e5Sespie}
*c87b03e5Sespie
/* Memory buffers.  Changing these three constants can have a dramatic
   effect on performance.  The values here are reasonable defaults,
   but might be tuned.  If you adjust them, be sure to test across a
   range of uses of cpplib, including heavy nested function-like macro
   expansion.  Also check the change in peak memory usage (NJAMD is a
   good tool for this).

   MIN_BUFF_SIZE is the smallest buffer ever allocated.
   BUFF_SIZE_UPPER_BOUND (MIN_SIZE) is the largest free buffer that
   will be reused for a request of MIN_SIZE bytes.
   EXTENDED_BUFF_SIZE (BUFF, MIN_EXTRA) is the size requested when
   BUFF is extended: MIN_EXTRA plus twice the room left in BUFF.  */
#define MIN_BUFF_SIZE 8000
#define BUFF_SIZE_UPPER_BOUND(MIN_SIZE) (MIN_BUFF_SIZE + (MIN_SIZE) * 3 / 2)
/* Every macro argument is parenthesized so that an expression passed
   as MIN_EXTRA cannot re-associate with the surrounding '+'.  */
#define EXTENDED_BUFF_SIZE(BUFF, MIN_EXTRA) \
	((MIN_EXTRA) + ((BUFF)->limit - (BUFF)->cur) * 2)

#if MIN_BUFF_SIZE > BUFF_SIZE_UPPER_BOUND (0)
  #error BUFF_SIZE_UPPER_BOUND must be at least as large as MIN_BUFF_SIZE!
#endif
*c87b03e5Sespie
*c87b03e5Sespie/* Create a new allocation buffer.  Place the control block at the end
*c87b03e5Sespie   of the buffer, so that buffer overflows will cause immediate chaos.  */
*c87b03e5Sespiestatic _cpp_buff *
*c87b03e5Sespienew_buff (len)
*c87b03e5Sespie     size_t len;
*c87b03e5Sespie{
*c87b03e5Sespie  _cpp_buff *result;
*c87b03e5Sespie  unsigned char *base;
*c87b03e5Sespie
*c87b03e5Sespie  if (len < MIN_BUFF_SIZE)
*c87b03e5Sespie    len = MIN_BUFF_SIZE;
*c87b03e5Sespie  len = CPP_ALIGN (len);
*c87b03e5Sespie
*c87b03e5Sespie  base = xmalloc (len + sizeof (_cpp_buff));
*c87b03e5Sespie  result = (_cpp_buff *) (base + len);
*c87b03e5Sespie  result->base = base;
*c87b03e5Sespie  result->cur = base;
*c87b03e5Sespie  result->limit = base + len;
*c87b03e5Sespie  result->next = NULL;
*c87b03e5Sespie  return result;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Place a chain of unwanted allocation buffers on the free list.  */
*c87b03e5Sespievoid
*c87b03e5Sespie_cpp_release_buff (pfile, buff)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie     _cpp_buff *buff;
*c87b03e5Sespie{
*c87b03e5Sespie  _cpp_buff *end = buff;
*c87b03e5Sespie
*c87b03e5Sespie  while (end->next)
*c87b03e5Sespie    end = end->next;
*c87b03e5Sespie  end->next = pfile->free_buffs;
*c87b03e5Sespie  pfile->free_buffs = buff;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Return a free buffer of size at least MIN_SIZE.  */
*c87b03e5Sespie_cpp_buff *
*c87b03e5Sespie_cpp_get_buff (pfile, min_size)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie     size_t min_size;
*c87b03e5Sespie{
*c87b03e5Sespie  _cpp_buff *result, **p;
*c87b03e5Sespie
*c87b03e5Sespie  for (p = &pfile->free_buffs;; p = &(*p)->next)
*c87b03e5Sespie    {
*c87b03e5Sespie      size_t size;
*c87b03e5Sespie
*c87b03e5Sespie      if (*p == NULL)
*c87b03e5Sespie	return new_buff (min_size);
*c87b03e5Sespie      result = *p;
*c87b03e5Sespie      size = result->limit - result->base;
*c87b03e5Sespie      /* Return a buffer that's big enough, but don't waste one that's
*c87b03e5Sespie         way too big.  */
*c87b03e5Sespie      if (size >= min_size && size <= BUFF_SIZE_UPPER_BOUND (min_size))
*c87b03e5Sespie	break;
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  *p = result->next;
*c87b03e5Sespie  result->next = NULL;
*c87b03e5Sespie  result->cur = result->base;
*c87b03e5Sespie  return result;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Creates a new buffer with enough space to hold the uncommitted
*c87b03e5Sespie   remaining bytes of BUFF, and at least MIN_EXTRA more bytes.  Copies
*c87b03e5Sespie   the excess bytes to the new buffer.  Chains the new buffer after
*c87b03e5Sespie   BUFF, and returns the new buffer.  */
*c87b03e5Sespie_cpp_buff *
*c87b03e5Sespie_cpp_append_extend_buff (pfile, buff, min_extra)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie     _cpp_buff *buff;
*c87b03e5Sespie     size_t min_extra;
*c87b03e5Sespie{
*c87b03e5Sespie  size_t size = EXTENDED_BUFF_SIZE (buff, min_extra);
*c87b03e5Sespie  _cpp_buff *new_buff = _cpp_get_buff (pfile, size);
*c87b03e5Sespie
*c87b03e5Sespie  buff->next = new_buff;
*c87b03e5Sespie  memcpy (new_buff->base, buff->cur, BUFF_ROOM (buff));
*c87b03e5Sespie  return new_buff;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Creates a new buffer with enough space to hold the uncommitted
*c87b03e5Sespie   remaining bytes of the buffer pointed to by BUFF, and at least
*c87b03e5Sespie   MIN_EXTRA more bytes.  Copies the excess bytes to the new buffer.
*c87b03e5Sespie   Chains the new buffer before the buffer pointed to by BUFF, and
*c87b03e5Sespie   updates the pointer to point to the new buffer.  */
*c87b03e5Sespievoid
*c87b03e5Sespie_cpp_extend_buff (pfile, pbuff, min_extra)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie     _cpp_buff **pbuff;
*c87b03e5Sespie     size_t min_extra;
*c87b03e5Sespie{
*c87b03e5Sespie  _cpp_buff *new_buff, *old_buff = *pbuff;
*c87b03e5Sespie  size_t size = EXTENDED_BUFF_SIZE (old_buff, min_extra);
*c87b03e5Sespie
*c87b03e5Sespie  new_buff = _cpp_get_buff (pfile, size);
*c87b03e5Sespie  memcpy (new_buff->base, old_buff->cur, BUFF_ROOM (old_buff));
*c87b03e5Sespie  new_buff->next = old_buff;
*c87b03e5Sespie  *pbuff = new_buff;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Free a chain of buffers starting at BUFF.  */
*c87b03e5Sespievoid
*c87b03e5Sespie_cpp_free_buff (buff)
*c87b03e5Sespie     _cpp_buff *buff;
*c87b03e5Sespie{
*c87b03e5Sespie  _cpp_buff *next;
*c87b03e5Sespie
*c87b03e5Sespie  for (; buff; buff = next)
*c87b03e5Sespie    {
*c87b03e5Sespie      next = buff->next;
*c87b03e5Sespie      free (buff->base);
*c87b03e5Sespie    }
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Allocate permanent, unaligned storage of length LEN.  */
*c87b03e5Sespieunsigned char *
*c87b03e5Sespie_cpp_unaligned_alloc (pfile, len)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie     size_t len;
*c87b03e5Sespie{
*c87b03e5Sespie  _cpp_buff *buff = pfile->u_buff;
*c87b03e5Sespie  unsigned char *result = buff->cur;
*c87b03e5Sespie
*c87b03e5Sespie  if (len > (size_t) (buff->limit - result))
*c87b03e5Sespie    {
*c87b03e5Sespie      buff = _cpp_get_buff (pfile, len);
*c87b03e5Sespie      buff->next = pfile->u_buff;
*c87b03e5Sespie      pfile->u_buff = buff;
*c87b03e5Sespie      result = buff->cur;
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  buff->cur = result + len;
*c87b03e5Sespie  return result;
*c87b03e5Sespie}
*c87b03e5Sespie
*c87b03e5Sespie/* Allocate permanent, unaligned storage of length LEN from a_buff.
*c87b03e5Sespie   That buffer is used for growing allocations when saving macro
*c87b03e5Sespie   replacement lists in a #define, and when parsing an answer to an
*c87b03e5Sespie   assertion in #assert, #unassert or #if (and therefore possibly
*c87b03e5Sespie   whilst expanding macros).  It therefore must not be used by any
*c87b03e5Sespie   code that they might call: specifically the lexer and the guts of
*c87b03e5Sespie   the macro expander.
*c87b03e5Sespie
*c87b03e5Sespie   All existing other uses clearly fit this restriction: storing
*c87b03e5Sespie   registered pragmas during initialization.  */
*c87b03e5Sespieunsigned char *
*c87b03e5Sespie_cpp_aligned_alloc (pfile, len)
*c87b03e5Sespie     cpp_reader *pfile;
*c87b03e5Sespie     size_t len;
*c87b03e5Sespie{
*c87b03e5Sespie  _cpp_buff *buff = pfile->a_buff;
*c87b03e5Sespie  unsigned char *result = buff->cur;
*c87b03e5Sespie
*c87b03e5Sespie  if (len > (size_t) (buff->limit - result))
*c87b03e5Sespie    {
*c87b03e5Sespie      buff = _cpp_get_buff (pfile, len);
*c87b03e5Sespie      buff->next = pfile->a_buff;
*c87b03e5Sespie      pfile->a_buff = buff;
*c87b03e5Sespie      result = buff->cur;
*c87b03e5Sespie    }
*c87b03e5Sespie
*c87b03e5Sespie  buff->cur = result + len;
*c87b03e5Sespie  return result;
*c87b03e5Sespie}