clang/Lex/TokenConcatenation.h

193326Sed//===--- TokenConcatenation.h - Token Concatenation Avoidance ---*- C++ -*-===//
193326Sed//
193326Sed//                     The LLVM Compiler Infrastructure
193326Sed//
193326Sed// This file is distributed under the University of Illinois Open Source
193326Sed// License. See LICENSE.TXT for details.
193326Sed//
193326Sed//===----------------------------------------------------------------------===//
193326Sed//
193326Sed// This file defines the TokenConcatenation class.
193326Sed//
193326Sed//===----------------------------------------------------------------------===//
193326Sed
193326Sed#ifndef CLANG_LEX_TOKEN_CONCATENATION_H
193326Sed#define CLANG_LEX_TOKEN_CONCATENATION_H
193326Sed
193326Sed#include "clang/Basic/TokenKinds.h"
193326Sed
193326Sednamespace clang {
  // Forward declarations are sufficient here: this header only refers to
  // these types through references.
193326Sed  class Preprocessor;
193326Sed  class Token;
198092Srdivacky
193326Sed  /// TokenConcatenation class, which answers the question of
193326Sed  ///   "Is it safe to emit two tokens without a whitespace between them, or
193326Sed  ///    would that cause implicit concatenation of the tokens?"
193326Sed  ///
193326Sed  /// For example, emitting two identifiers "foo" and "bar" next to each
193326Sed  /// other would cause the lexer to produce one "foobar" token.  Emitting "1"
193326Sed  /// and ")" next to each other is safe.
193326Sed  ///
  /// Only declarations appear in this header; every member function is
  /// defined out of line.
  ///
193326Sed  class TokenConcatenation {
    /// PP - A reference to a Preprocessor.  Because this is a reference
    /// member, the referenced object must outlive this TokenConcatenation.
    /// NOTE(review): presumably bound to the constructor argument - confirm
    /// against the out-of-line constructor definition.
193326Sed    Preprocessor &PP;
198092Srdivacky
    /// AvoidConcatInfo - The kinds of concatenation handling a token may
    /// need.  The non-zero enumerators are distinct bits (1, 2, 4), which
    /// suggests they can be OR'ed together in one TokenInfo entry - TODO
    /// confirm against the implementation.
193326Sed    enum AvoidConcatInfo {
193326Sed      /// By default, a token never needs to avoid concatenation.  Most tokens
193326Sed      /// (e.g. ',', ')', etc) don't cause a problem when concatenated.
193326Sed      aci_never_avoid_concat = 0,
198092Srdivacky
193326Sed      /// aci_custom_firstchar - AvoidConcat contains custom code to handle this
193326Sed      /// token's requirements, and it needs to know the first character of the
193326Sed      /// token.
193326Sed      aci_custom_firstchar = 1,
198092Srdivacky
193326Sed      /// aci_custom - AvoidConcat contains custom code to handle this token's
193326Sed      /// requirements, but it doesn't need to know the first character of the
193326Sed      /// token.
193326Sed      aci_custom = 2,
198092Srdivacky
193326Sed      /// aci_avoid_equal - Many tokens cannot be safely followed by an '='
193326Sed      /// character.  For example, "<<" turns into "<<=" when followed by an =.
193326Sed      aci_avoid_equal = 4
193326Sed    };
198092Srdivacky
193326Sed    /// TokenInfo - This array contains information for each token on what
193326Sed    /// action to take when avoiding concatenation of tokens in the AvoidConcat
193326Sed    /// method.  It has tok::NUM_TOKENS entries, i.e. one slot per token kind.
193326Sed    char TokenInfo[tok::NUM_TOKENS];
193326Sed  public:
    /// Construct a TokenConcatenation from the given Preprocessor.
    /// NOTE(review): this single-argument constructor is not 'explicit', so a
    /// Preprocessor lvalue converts implicitly to a TokenConcatenation.  Left
    /// unchanged here because callers are not visible from this header.
193326Sed    TokenConcatenation(Preprocessor &PP);
198092Srdivacky
    /// AvoidConcat - Query over three consecutive tokens, passed oldest first
    /// (PrevPrevTok, PrevTok, Tok).  Does not modify this object (const).
    /// Presumably returns true when whitespace has to be emitted between
    /// PrevTok and Tok to keep them from being lexed as a single token, as
    /// described in the class comment - the definition is not in this header,
    /// so confirm the exact contract there.
207619Srdivacky    bool AvoidConcat(const Token &PrevPrevTok,
207619Srdivacky                     const Token &PrevTok,
207619Srdivacky                     const Token &Tok) const;
193326Sed
193326Sed  private:
226633Sdim    /// IsIdentifierStringPrefix - Return true if the spelling of the token
226633Sdim    /// is literally 'L', 'u', 'U', or 'u8'.
226633Sdim    bool IsIdentifierStringPrefix(const Token &Tok) const;
193326Sed  };
193326Sed  } // end clang namespace
193326Sed
193326Sed#endif