TokenAnnotator.cpp revision 363496
1//===--- TokenAnnotator.cpp - Format C++ code -----------------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8///
9/// \file
10/// This file implements a token annotator, i.e. creates
11/// \c AnnotatedTokens out of \c FormatTokens with required extra information.
12///
13//===----------------------------------------------------------------------===//
14
15#include "TokenAnnotator.h"
16#include "FormatToken.h"
17#include "clang/Basic/SourceManager.h"
18#include "clang/Basic/TokenKinds.h"
19#include "llvm/ADT/SmallPtrSet.h"
20#include "llvm/Support/Debug.h"
21
22#define DEBUG_TYPE "format-token-annotator"
23
24namespace clang {
25namespace format {
26
27namespace {
28
29/// Returns \c true if the token can be used as an identifier in
30/// an Objective-C \c @selector, \c false otherwise.
31///
32/// Because getFormattingLangOpts() always lexes source code as
33/// Objective-C++, C++ keywords like \c new and \c delete are
34/// lexed as tok::kw_*, not tok::identifier, even for Objective-C.
35///
36/// For Objective-C and Objective-C++, both identifiers and keywords
37/// are valid inside @selector(...) (or a macro which
38/// invokes @selector(...)). So, we allow treat any identifier or
39/// keyword as a potential Objective-C selector component.
40static bool canBeObjCSelectorComponent(const FormatToken &Tok) {
41  return Tok.Tok.getIdentifierInfo() != nullptr;
42}
43
44/// With `Left` being '(', check if we're at either `[...](` or
45/// `[...]<...>(`, where the [ opens a lambda capture list.
46static bool isLambdaParameterList(const FormatToken *Left) {
47  // Skip <...> if present.
48  if (Left->Previous && Left->Previous->is(tok::greater) &&
49      Left->Previous->MatchingParen &&
50      Left->Previous->MatchingParen->is(TT_TemplateOpener))
51    Left = Left->Previous->MatchingParen;
52
53  // Check for `[...]`.
54  return Left->Previous && Left->Previous->is(tok::r_square) &&
55         Left->Previous->MatchingParen &&
56         Left->Previous->MatchingParen->is(TT_LambdaLSquare);
57}
58
59/// A parser that gathers additional information about tokens.
60///
61/// The \c TokenAnnotator tries to match parenthesis and square brakets and
62/// store a parenthesis levels. It also tries to resolve matching "<" and ">"
63/// into template parameter lists.
64class AnnotatingParser {
65public:
66  AnnotatingParser(const FormatStyle &Style, AnnotatedLine &Line,
67                   const AdditionalKeywords &Keywords)
68      : Style(Style), Line(Line), CurrentToken(Line.First), AutoFound(false),
69        Keywords(Keywords) {
70    Contexts.push_back(Context(tok::unknown, 1, /*IsExpression=*/false));
71    resetTokenMetadata(CurrentToken);
72  }
73
74private:
75  bool parseAngle() {
76    if (!CurrentToken || !CurrentToken->Previous)
77      return false;
78    if (NonTemplateLess.count(CurrentToken->Previous))
79      return false;
80
81    const FormatToken &Previous = *CurrentToken->Previous; // The '<'.
82    if (Previous.Previous) {
83      if (Previous.Previous->Tok.isLiteral())
84        return false;
85      if (Previous.Previous->is(tok::r_paren) && Contexts.size() > 1 &&
86          (!Previous.Previous->MatchingParen ||
87           !Previous.Previous->MatchingParen->is(TT_OverloadedOperatorLParen)))
88        return false;
89    }
90
91    FormatToken *Left = CurrentToken->Previous;
92    Left->ParentBracket = Contexts.back().ContextKind;
93    ScopedContextCreator ContextCreator(*this, tok::less, 12);
94
95    // If this angle is in the context of an expression, we need to be more
96    // hesitant to detect it as opening template parameters.
97    bool InExprContext = Contexts.back().IsExpression;
98
99    Contexts.back().IsExpression = false;
100    // If there's a template keyword before the opening angle bracket, this is a
101    // template parameter, not an argument.
102    Contexts.back().InTemplateArgument =
103        Left->Previous && Left->Previous->Tok.isNot(tok::kw_template);
104
105    if (Style.Language == FormatStyle::LK_Java &&
106        CurrentToken->is(tok::question))
107      next();
108
109    while (CurrentToken) {
110      if (CurrentToken->is(tok::greater)) {
111        Left->MatchingParen = CurrentToken;
112        CurrentToken->MatchingParen = Left;
113        // In TT_Proto, we must distignuish between:
114        //   map<key, value>
115        //   msg < item: data >
116        //   msg: < item: data >
117        // In TT_TextProto, map<key, value> does not occur.
118        if (Style.Language == FormatStyle::LK_TextProto ||
119            (Style.Language == FormatStyle::LK_Proto && Left->Previous &&
120             Left->Previous->isOneOf(TT_SelectorName, TT_DictLiteral)))
121          CurrentToken->Type = TT_DictLiteral;
122        else
123          CurrentToken->Type = TT_TemplateCloser;
124        next();
125        return true;
126      }
127      if (CurrentToken->is(tok::question) &&
128          Style.Language == FormatStyle::LK_Java) {
129        next();
130        continue;
131      }
132      if (CurrentToken->isOneOf(tok::r_paren, tok::r_square, tok::r_brace) ||
133          (CurrentToken->isOneOf(tok::colon, tok::question) && InExprContext &&
134           Style.Language != FormatStyle::LK_Proto &&
135           Style.Language != FormatStyle::LK_TextProto))
136        return false;
137      // If a && or || is found and interpreted as a binary operator, this set
138      // of angles is likely part of something like "a < b && c > d". If the
139      // angles are inside an expression, the ||/&& might also be a binary
140      // operator that was misinterpreted because we are parsing template
141      // parameters.
142      // FIXME: This is getting out of hand, write a decent parser.
143      if (CurrentToken->Previous->isOneOf(tok::pipepipe, tok::ampamp) &&
144          CurrentToken->Previous->is(TT_BinaryOperator) &&
145          Contexts[Contexts.size() - 2].IsExpression &&
146          !Line.startsWith(tok::kw_template))
147        return false;
148      updateParameterCount(Left, CurrentToken);
149      if (Style.Language == FormatStyle::LK_Proto) {
150        if (FormatToken *Previous = CurrentToken->getPreviousNonComment()) {
151          if (CurrentToken->is(tok::colon) ||
152              (CurrentToken->isOneOf(tok::l_brace, tok::less) &&
153               Previous->isNot(tok::colon)))
154            Previous->Type = TT_SelectorName;
155        }
156      }
157      if (!consumeToken())
158        return false;
159    }
160    return false;
161  }
162
163  bool parseParens(bool LookForDecls = false) {
164    if (!CurrentToken)
165      return false;
166    FormatToken *Left = CurrentToken->Previous;
167    Left->ParentBracket = Contexts.back().ContextKind;
168    ScopedContextCreator ContextCreator(*this, tok::l_paren, 1);
169
170    // FIXME: This is a bit of a hack. Do better.
171    Contexts.back().ColonIsForRangeExpr =
172        Contexts.size() == 2 && Contexts[0].ColonIsForRangeExpr;
173
174    bool StartsObjCMethodExpr = false;
175    if (FormatToken *MaybeSel = Left->Previous) {
176      // @selector( starts a selector.
177      if (MaybeSel->isObjCAtKeyword(tok::objc_selector) && MaybeSel->Previous &&
178          MaybeSel->Previous->is(tok::at)) {
179        StartsObjCMethodExpr = true;
180      }
181    }
182
183    if (Left->is(TT_OverloadedOperatorLParen)) {
184      Contexts.back().IsExpression = false;
185    } else if (Style.Language == FormatStyle::LK_JavaScript &&
186               (Line.startsWith(Keywords.kw_type, tok::identifier) ||
187                Line.startsWith(tok::kw_export, Keywords.kw_type,
188                                tok::identifier))) {
189      // type X = (...);
190      // export type X = (...);
191      Contexts.back().IsExpression = false;
192    } else if (Left->Previous &&
193               (Left->Previous->isOneOf(tok::kw_static_assert, tok::kw_decltype,
194                                        tok::kw_while, tok::l_paren,
195                                        tok::comma) ||
196                Left->Previous->isIf() ||
197                Left->Previous->is(TT_BinaryOperator))) {
198      // static_assert, if and while usually contain expressions.
199      Contexts.back().IsExpression = true;
200    } else if (Style.Language == FormatStyle::LK_JavaScript && Left->Previous &&
201               (Left->Previous->is(Keywords.kw_function) ||
202                (Left->Previous->endsSequence(tok::identifier,
203                                              Keywords.kw_function)))) {
204      // function(...) or function f(...)
205      Contexts.back().IsExpression = false;
206    } else if (Style.Language == FormatStyle::LK_JavaScript && Left->Previous &&
207               Left->Previous->is(TT_JsTypeColon)) {
208      // let x: (SomeType);
209      Contexts.back().IsExpression = false;
210    } else if (isLambdaParameterList(Left)) {
211      // This is a parameter list of a lambda expression.
212      Contexts.back().IsExpression = false;
213    } else if (Line.InPPDirective &&
214               (!Left->Previous || !Left->Previous->is(tok::identifier))) {
215      Contexts.back().IsExpression = true;
216    } else if (Contexts[Contexts.size() - 2].CaretFound) {
217      // This is the parameter list of an ObjC block.
218      Contexts.back().IsExpression = false;
219    } else if (Left->Previous && Left->Previous->is(tok::kw___attribute)) {
220      Left->Type = TT_AttributeParen;
221    } else if (Left->Previous && Left->Previous->is(TT_ForEachMacro)) {
222      // The first argument to a foreach macro is a declaration.
223      Contexts.back().IsForEachMacro = true;
224      Contexts.back().IsExpression = false;
225    } else if (Left->Previous && Left->Previous->MatchingParen &&
226               Left->Previous->MatchingParen->is(TT_ObjCBlockLParen)) {
227      Contexts.back().IsExpression = false;
228    } else if (!Line.MustBeDeclaration && !Line.InPPDirective) {
229      bool IsForOrCatch =
230          Left->Previous && Left->Previous->isOneOf(tok::kw_for, tok::kw_catch);
231      Contexts.back().IsExpression = !IsForOrCatch;
232    }
233
234    if (StartsObjCMethodExpr) {
235      Contexts.back().ColonIsObjCMethodExpr = true;
236      Left->Type = TT_ObjCMethodExpr;
237    }
238
239    // MightBeFunctionType and ProbablyFunctionType are used for
240    // function pointer and reference types as well as Objective-C
241    // block types:
242    //
243    // void (*FunctionPointer)(void);
244    // void (&FunctionReference)(void);
245    // void (^ObjCBlock)(void);
246    bool MightBeFunctionType = !Contexts[Contexts.size() - 2].IsExpression;
247    bool ProbablyFunctionType =
248        CurrentToken->isOneOf(tok::star, tok::amp, tok::caret);
249    bool HasMultipleLines = false;
250    bool HasMultipleParametersOnALine = false;
251    bool MightBeObjCForRangeLoop =
252        Left->Previous && Left->Previous->is(tok::kw_for);
253    FormatToken *PossibleObjCForInToken = nullptr;
254    while (CurrentToken) {
255      // LookForDecls is set when "if (" has been seen. Check for
256      // 'identifier' '*' 'identifier' followed by not '=' -- this
257      // '*' has to be a binary operator but determineStarAmpUsage() will
258      // categorize it as an unary operator, so set the right type here.
259      if (LookForDecls && CurrentToken->Next) {
260        FormatToken *Prev = CurrentToken->getPreviousNonComment();
261        if (Prev) {
262          FormatToken *PrevPrev = Prev->getPreviousNonComment();
263          FormatToken *Next = CurrentToken->Next;
264          if (PrevPrev && PrevPrev->is(tok::identifier) &&
265              Prev->isOneOf(tok::star, tok::amp, tok::ampamp) &&
266              CurrentToken->is(tok::identifier) && Next->isNot(tok::equal)) {
267            Prev->Type = TT_BinaryOperator;
268            LookForDecls = false;
269          }
270        }
271      }
272
273      if (CurrentToken->Previous->is(TT_PointerOrReference) &&
274          CurrentToken->Previous->Previous->isOneOf(tok::l_paren,
275                                                    tok::coloncolon))
276        ProbablyFunctionType = true;
277      if (CurrentToken->is(tok::comma))
278        MightBeFunctionType = false;
279      if (CurrentToken->Previous->is(TT_BinaryOperator))
280        Contexts.back().IsExpression = true;
281      if (CurrentToken->is(tok::r_paren)) {
282        if (MightBeFunctionType && ProbablyFunctionType && CurrentToken->Next &&
283            (CurrentToken->Next->is(tok::l_paren) ||
284             (CurrentToken->Next->is(tok::l_square) && Line.MustBeDeclaration)))
285          Left->Type = Left->Next->is(tok::caret) ? TT_ObjCBlockLParen
286                                                  : TT_FunctionTypeLParen;
287        Left->MatchingParen = CurrentToken;
288        CurrentToken->MatchingParen = Left;
289
290        if (CurrentToken->Next && CurrentToken->Next->is(tok::l_brace) &&
291            Left->Previous && Left->Previous->is(tok::l_paren)) {
292          // Detect the case where macros are used to generate lambdas or
293          // function bodies, e.g.:
294          //   auto my_lambda = MARCO((Type *type, int i) { .. body .. });
295          for (FormatToken *Tok = Left; Tok != CurrentToken; Tok = Tok->Next) {
296            if (Tok->is(TT_BinaryOperator) &&
297                Tok->isOneOf(tok::star, tok::amp, tok::ampamp))
298              Tok->Type = TT_PointerOrReference;
299          }
300        }
301
302        if (StartsObjCMethodExpr) {
303          CurrentToken->Type = TT_ObjCMethodExpr;
304          if (Contexts.back().FirstObjCSelectorName) {
305            Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
306                Contexts.back().LongestObjCSelectorName;
307          }
308        }
309
310        if (Left->is(TT_AttributeParen))
311          CurrentToken->Type = TT_AttributeParen;
312        if (Left->Previous && Left->Previous->is(TT_JavaAnnotation))
313          CurrentToken->Type = TT_JavaAnnotation;
314        if (Left->Previous && Left->Previous->is(TT_LeadingJavaAnnotation))
315          CurrentToken->Type = TT_LeadingJavaAnnotation;
316        if (Left->Previous && Left->Previous->is(TT_AttributeSquare))
317          CurrentToken->Type = TT_AttributeSquare;
318
319        if (!HasMultipleLines)
320          Left->PackingKind = PPK_Inconclusive;
321        else if (HasMultipleParametersOnALine)
322          Left->PackingKind = PPK_BinPacked;
323        else
324          Left->PackingKind = PPK_OnePerLine;
325
326        next();
327        return true;
328      }
329      if (CurrentToken->isOneOf(tok::r_square, tok::r_brace))
330        return false;
331
332      if (CurrentToken->is(tok::l_brace))
333        Left->Type = TT_Unknown; // Not TT_ObjCBlockLParen
334      if (CurrentToken->is(tok::comma) && CurrentToken->Next &&
335          !CurrentToken->Next->HasUnescapedNewline &&
336          !CurrentToken->Next->isTrailingComment())
337        HasMultipleParametersOnALine = true;
338      if ((CurrentToken->Previous->isOneOf(tok::kw_const, tok::kw_auto) ||
339           CurrentToken->Previous->isSimpleTypeSpecifier()) &&
340          !CurrentToken->is(tok::l_brace))
341        Contexts.back().IsExpression = false;
342      if (CurrentToken->isOneOf(tok::semi, tok::colon)) {
343        MightBeObjCForRangeLoop = false;
344        if (PossibleObjCForInToken) {
345          PossibleObjCForInToken->Type = TT_Unknown;
346          PossibleObjCForInToken = nullptr;
347        }
348      }
349      if (MightBeObjCForRangeLoop && CurrentToken->is(Keywords.kw_in)) {
350        PossibleObjCForInToken = CurrentToken;
351        PossibleObjCForInToken->Type = TT_ObjCForIn;
352      }
353      // When we discover a 'new', we set CanBeExpression to 'false' in order to
354      // parse the type correctly. Reset that after a comma.
355      if (CurrentToken->is(tok::comma))
356        Contexts.back().CanBeExpression = true;
357
358      FormatToken *Tok = CurrentToken;
359      if (!consumeToken())
360        return false;
361      updateParameterCount(Left, Tok);
362      if (CurrentToken && CurrentToken->HasUnescapedNewline)
363        HasMultipleLines = true;
364    }
365    return false;
366  }
367
368  bool isCSharpAttributeSpecifier(const FormatToken &Tok) {
369    if (!Style.isCSharp())
370      return false;
371
372    const FormatToken *AttrTok = Tok.Next;
373    if (!AttrTok)
374      return false;
375
376    // Just an empty declaration e.g. string [].
377    if (AttrTok->is(tok::r_square))
378      return false;
379
380    // Move along the tokens inbetween the '[' and ']' e.g. [STAThread].
381    while (AttrTok && AttrTok->isNot(tok::r_square)) {
382      AttrTok = AttrTok->Next;
383    }
384
385    if (!AttrTok)
386      return false;
387
388    // Move past the end of ']'.
389    AttrTok = AttrTok->Next;
390    if (!AttrTok)
391      return false;
392
393    // Limit this to being an access modifier that follows.
394    if (AttrTok->isOneOf(tok::kw_public, tok::kw_private, tok::kw_protected,
395                         tok::kw_class, tok::kw_static, tok::l_square,
396                         Keywords.kw_internal)) {
397      return true;
398    }
399
400    // incase its a [XXX] retval func(....
401    if (AttrTok->Next &&
402        AttrTok->Next->startsSequence(tok::identifier, tok::l_paren))
403      return true;
404
405    return false;
406  }
407
408  bool isCpp11AttributeSpecifier(const FormatToken &Tok) {
409    if (!Style.isCpp() || !Tok.startsSequence(tok::l_square, tok::l_square))
410      return false;
411    // The first square bracket is part of an ObjC array literal
412    if (Tok.Previous && Tok.Previous->is(tok::at)) {
413      return false;
414    }
415    const FormatToken *AttrTok = Tok.Next->Next;
416    if (!AttrTok)
417      return false;
418    // C++17 '[[using ns: foo, bar(baz, blech)]]'
419    // We assume nobody will name an ObjC variable 'using'.
420    if (AttrTok->startsSequence(tok::kw_using, tok::identifier, tok::colon))
421      return true;
422    if (AttrTok->isNot(tok::identifier))
423      return false;
424    while (AttrTok && !AttrTok->startsSequence(tok::r_square, tok::r_square)) {
425      // ObjC message send. We assume nobody will use : in a C++11 attribute
426      // specifier parameter, although this is technically valid:
427      // [[foo(:)]].
428      if (AttrTok->is(tok::colon) ||
429          AttrTok->startsSequence(tok::identifier, tok::identifier) ||
430          AttrTok->startsSequence(tok::r_paren, tok::identifier))
431        return false;
432      if (AttrTok->is(tok::ellipsis))
433        return true;
434      AttrTok = AttrTok->Next;
435    }
436    return AttrTok && AttrTok->startsSequence(tok::r_square, tok::r_square);
437  }
438
439  bool parseSquare() {
440    if (!CurrentToken)
441      return false;
442
443    // A '[' could be an index subscript (after an identifier or after
444    // ')' or ']'), it could be the start of an Objective-C method
445    // expression, it could the start of an Objective-C array literal,
446    // or it could be a C++ attribute specifier [[foo::bar]].
447    FormatToken *Left = CurrentToken->Previous;
448    Left->ParentBracket = Contexts.back().ContextKind;
449    FormatToken *Parent = Left->getPreviousNonComment();
450
451    // Cases where '>' is followed by '['.
452    // In C++, this can happen either in array of templates (foo<int>[10])
453    // or when array is a nested template type (unique_ptr<type1<type2>[]>).
454    bool CppArrayTemplates =
455        Style.isCpp() && Parent && Parent->is(TT_TemplateCloser) &&
456        (Contexts.back().CanBeExpression || Contexts.back().IsExpression ||
457         Contexts.back().InTemplateArgument);
458
459    bool IsCpp11AttributeSpecifier = isCpp11AttributeSpecifier(*Left) ||
460                                     Contexts.back().InCpp11AttributeSpecifier;
461
462    // Treat C# Attributes [STAThread] much like C++ attributes [[...]].
463    bool IsCSharp11AttributeSpecifier =
464        isCSharpAttributeSpecifier(*Left) ||
465        Contexts.back().InCSharpAttributeSpecifier;
466
467    bool InsideInlineASM = Line.startsWith(tok::kw_asm);
468    bool IsCppStructuredBinding = Left->isCppStructuredBinding(Style);
469    bool StartsObjCMethodExpr =
470        !IsCppStructuredBinding && !InsideInlineASM && !CppArrayTemplates &&
471        Style.isCpp() && !IsCpp11AttributeSpecifier &&
472        Contexts.back().CanBeExpression && Left->isNot(TT_LambdaLSquare) &&
473        !CurrentToken->isOneOf(tok::l_brace, tok::r_square) &&
474        (!Parent ||
475         Parent->isOneOf(tok::colon, tok::l_square, tok::l_paren,
476                         tok::kw_return, tok::kw_throw) ||
477         Parent->isUnaryOperator() ||
478         // FIXME(bug 36976): ObjC return types shouldn't use TT_CastRParen.
479         Parent->isOneOf(TT_ObjCForIn, TT_CastRParen) ||
480         (getBinOpPrecedence(Parent->Tok.getKind(), true, true) >
481          prec::Unknown));
482    bool ColonFound = false;
483
484    unsigned BindingIncrease = 1;
485    if (IsCppStructuredBinding) {
486      Left->Type = TT_StructuredBindingLSquare;
487    } else if (Left->is(TT_Unknown)) {
488      if (StartsObjCMethodExpr) {
489        Left->Type = TT_ObjCMethodExpr;
490      } else if (IsCpp11AttributeSpecifier) {
491        Left->Type = TT_AttributeSquare;
492      } else if (Style.Language == FormatStyle::LK_JavaScript && Parent &&
493                 Contexts.back().ContextKind == tok::l_brace &&
494                 Parent->isOneOf(tok::l_brace, tok::comma)) {
495        Left->Type = TT_JsComputedPropertyName;
496      } else if (Style.isCpp() && Contexts.back().ContextKind == tok::l_brace &&
497                 Parent && Parent->isOneOf(tok::l_brace, tok::comma)) {
498        Left->Type = TT_DesignatedInitializerLSquare;
499      } else if (IsCSharp11AttributeSpecifier) {
500        Left->Type = TT_AttributeSquare;
501      } else if (CurrentToken->is(tok::r_square) && Parent &&
502                 Parent->is(TT_TemplateCloser)) {
503        Left->Type = TT_ArraySubscriptLSquare;
504      } else if (Style.Language == FormatStyle::LK_Proto ||
505                 Style.Language == FormatStyle::LK_TextProto) {
506        // Square braces in LK_Proto can either be message field attributes:
507        //
508        // optional Aaa aaa = 1 [
509        //   (aaa) = aaa
510        // ];
511        //
512        // extensions 123 [
513        //   (aaa) = aaa
514        // ];
515        //
516        // or text proto extensions (in options):
517        //
518        // option (Aaa.options) = {
519        //   [type.type/type] {
520        //     key: value
521        //   }
522        // }
523        //
524        // or repeated fields (in options):
525        //
526        // option (Aaa.options) = {
527        //   keys: [ 1, 2, 3 ]
528        // }
529        //
530        // In the first and the third case we want to spread the contents inside
531        // the square braces; in the second we want to keep them inline.
532        Left->Type = TT_ArrayInitializerLSquare;
533        if (!Left->endsSequence(tok::l_square, tok::numeric_constant,
534                                tok::equal) &&
535            !Left->endsSequence(tok::l_square, tok::numeric_constant,
536                                tok::identifier) &&
537            !Left->endsSequence(tok::l_square, tok::colon, TT_SelectorName)) {
538          Left->Type = TT_ProtoExtensionLSquare;
539          BindingIncrease = 10;
540        }
541      } else if (!CppArrayTemplates && Parent &&
542                 Parent->isOneOf(TT_BinaryOperator, TT_TemplateCloser, tok::at,
543                                 tok::comma, tok::l_paren, tok::l_square,
544                                 tok::question, tok::colon, tok::kw_return,
545                                 // Should only be relevant to JavaScript:
546                                 tok::kw_default)) {
547        Left->Type = TT_ArrayInitializerLSquare;
548      } else {
549        BindingIncrease = 10;
550        Left->Type = TT_ArraySubscriptLSquare;
551      }
552    }
553
554    ScopedContextCreator ContextCreator(*this, tok::l_square, BindingIncrease);
555    Contexts.back().IsExpression = true;
556    if (Style.Language == FormatStyle::LK_JavaScript && Parent &&
557        Parent->is(TT_JsTypeColon))
558      Contexts.back().IsExpression = false;
559
560    Contexts.back().ColonIsObjCMethodExpr = StartsObjCMethodExpr;
561    Contexts.back().InCpp11AttributeSpecifier = IsCpp11AttributeSpecifier;
562    Contexts.back().InCSharpAttributeSpecifier = IsCSharp11AttributeSpecifier;
563
564    while (CurrentToken) {
565      if (CurrentToken->is(tok::r_square)) {
566        if (IsCpp11AttributeSpecifier)
567          CurrentToken->Type = TT_AttributeSquare;
568        if (IsCSharp11AttributeSpecifier)
569          CurrentToken->Type = TT_AttributeSquare;
570        else if (((CurrentToken->Next &&
571                   CurrentToken->Next->is(tok::l_paren)) ||
572                  (CurrentToken->Previous &&
573                   CurrentToken->Previous->Previous == Left)) &&
574                 Left->is(TT_ObjCMethodExpr)) {
575          // An ObjC method call is rarely followed by an open parenthesis. It
576          // also can't be composed of just one token, unless it's a macro that
577          // will be expanded to more tokens.
578          // FIXME: Do we incorrectly label ":" with this?
579          StartsObjCMethodExpr = false;
580          Left->Type = TT_Unknown;
581        }
582        if (StartsObjCMethodExpr && CurrentToken->Previous != Left) {
583          CurrentToken->Type = TT_ObjCMethodExpr;
584          // If we haven't seen a colon yet, make sure the last identifier
585          // before the r_square is tagged as a selector name component.
586          if (!ColonFound && CurrentToken->Previous &&
587              CurrentToken->Previous->is(TT_Unknown) &&
588              canBeObjCSelectorComponent(*CurrentToken->Previous))
589            CurrentToken->Previous->Type = TT_SelectorName;
590          // determineStarAmpUsage() thinks that '*' '[' is allocating an
591          // array of pointers, but if '[' starts a selector then '*' is a
592          // binary operator.
593          if (Parent && Parent->is(TT_PointerOrReference))
594            Parent->Type = TT_BinaryOperator;
595        }
596        // An arrow after an ObjC method expression is not a lambda arrow.
597        if (CurrentToken->Type == TT_ObjCMethodExpr && CurrentToken->Next &&
598            CurrentToken->Next->is(TT_LambdaArrow))
599          CurrentToken->Next->Type = TT_Unknown;
600        Left->MatchingParen = CurrentToken;
601        CurrentToken->MatchingParen = Left;
602        // FirstObjCSelectorName is set when a colon is found. This does
603        // not work, however, when the method has no parameters.
604        // Here, we set FirstObjCSelectorName when the end of the method call is
605        // reached, in case it was not set already.
606        if (!Contexts.back().FirstObjCSelectorName) {
607          FormatToken *Previous = CurrentToken->getPreviousNonComment();
608          if (Previous && Previous->is(TT_SelectorName)) {
609            Previous->ObjCSelectorNameParts = 1;
610            Contexts.back().FirstObjCSelectorName = Previous;
611          }
612        } else {
613          Left->ParameterCount =
614              Contexts.back().FirstObjCSelectorName->ObjCSelectorNameParts;
615        }
616        if (Contexts.back().FirstObjCSelectorName) {
617          Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
618              Contexts.back().LongestObjCSelectorName;
619          if (Left->BlockParameterCount > 1)
620            Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName = 0;
621        }
622        next();
623        return true;
624      }
625      if (CurrentToken->isOneOf(tok::r_paren, tok::r_brace))
626        return false;
627      if (CurrentToken->is(tok::colon)) {
628        if (IsCpp11AttributeSpecifier &&
629            CurrentToken->endsSequence(tok::colon, tok::identifier,
630                                       tok::kw_using)) {
631          // Remember that this is a [[using ns: foo]] C++ attribute, so we
632          // don't add a space before the colon (unlike other colons).
633          CurrentToken->Type = TT_AttributeColon;
634        } else if (Left->isOneOf(TT_ArraySubscriptLSquare,
635                                 TT_DesignatedInitializerLSquare)) {
636          Left->Type = TT_ObjCMethodExpr;
637          StartsObjCMethodExpr = true;
638          Contexts.back().ColonIsObjCMethodExpr = true;
639          if (Parent && Parent->is(tok::r_paren))
640            // FIXME(bug 36976): ObjC return types shouldn't use TT_CastRParen.
641            Parent->Type = TT_CastRParen;
642        }
643        ColonFound = true;
644      }
645      if (CurrentToken->is(tok::comma) && Left->is(TT_ObjCMethodExpr) &&
646          !ColonFound)
647        Left->Type = TT_ArrayInitializerLSquare;
648      FormatToken *Tok = CurrentToken;
649      if (!consumeToken())
650        return false;
651      updateParameterCount(Left, Tok);
652    }
653    return false;
654  }
655
656  bool parseBrace() {
657    if (CurrentToken) {
658      FormatToken *Left = CurrentToken->Previous;
659      Left->ParentBracket = Contexts.back().ContextKind;
660
661      if (Contexts.back().CaretFound)
662        Left->Type = TT_ObjCBlockLBrace;
663      Contexts.back().CaretFound = false;
664
665      ScopedContextCreator ContextCreator(*this, tok::l_brace, 1);
666      Contexts.back().ColonIsDictLiteral = true;
667      if (Left->BlockKind == BK_BracedInit)
668        Contexts.back().IsExpression = true;
669      if (Style.Language == FormatStyle::LK_JavaScript && Left->Previous &&
670          Left->Previous->is(TT_JsTypeColon))
671        Contexts.back().IsExpression = false;
672
673      while (CurrentToken) {
674        if (CurrentToken->is(tok::r_brace)) {
675          Left->MatchingParen = CurrentToken;
676          CurrentToken->MatchingParen = Left;
677          next();
678          return true;
679        }
680        if (CurrentToken->isOneOf(tok::r_paren, tok::r_square))
681          return false;
682        updateParameterCount(Left, CurrentToken);
683        if (CurrentToken->isOneOf(tok::colon, tok::l_brace, tok::less)) {
684          FormatToken *Previous = CurrentToken->getPreviousNonComment();
685          if (Previous->is(TT_JsTypeOptionalQuestion))
686            Previous = Previous->getPreviousNonComment();
687          if ((CurrentToken->is(tok::colon) &&
688               (!Contexts.back().ColonIsDictLiteral || !Style.isCpp())) ||
689              Style.Language == FormatStyle::LK_Proto ||
690              Style.Language == FormatStyle::LK_TextProto) {
691            Left->Type = TT_DictLiteral;
692            if (Previous->Tok.getIdentifierInfo() ||
693                Previous->is(tok::string_literal))
694              Previous->Type = TT_SelectorName;
695          }
696          if (CurrentToken->is(tok::colon) ||
697              Style.Language == FormatStyle::LK_JavaScript)
698            Left->Type = TT_DictLiteral;
699        }
700        if (CurrentToken->is(tok::comma) &&
701            Style.Language == FormatStyle::LK_JavaScript)
702          Left->Type = TT_DictLiteral;
703        if (!consumeToken())
704          return false;
705      }
706    }
707    return true;
708  }
709
710  void updateParameterCount(FormatToken *Left, FormatToken *Current) {
711    // For ObjC methods, the number of parameters is calculated differently as
712    // method declarations have a different structure (the parameters are not
713    // inside a bracket scope).
714    if (Current->is(tok::l_brace) && Current->BlockKind == BK_Block)
715      ++Left->BlockParameterCount;
716    if (Current->is(tok::comma)) {
717      ++Left->ParameterCount;
718      if (!Left->Role)
719        Left->Role.reset(new CommaSeparatedList(Style));
720      Left->Role->CommaFound(Current);
721    } else if (Left->ParameterCount == 0 && Current->isNot(tok::comment)) {
722      Left->ParameterCount = 1;
723    }
724  }
725
726  bool parseConditional() {
727    while (CurrentToken) {
728      if (CurrentToken->is(tok::colon)) {
729        CurrentToken->Type = TT_ConditionalExpr;
730        next();
731        return true;
732      }
733      if (!consumeToken())
734        return false;
735    }
736    return false;
737  }
738
739  bool parseTemplateDeclaration() {
740    if (CurrentToken && CurrentToken->is(tok::less)) {
741      CurrentToken->Type = TT_TemplateOpener;
742      next();
743      if (!parseAngle())
744        return false;
745      if (CurrentToken)
746        CurrentToken->Previous->ClosesTemplateDeclaration = true;
747      return true;
748    }
749    return false;
750  }
751
752  bool consumeToken() {
753    FormatToken *Tok = CurrentToken;
754    next();
755    switch (Tok->Tok.getKind()) {
756    case tok::plus:
757    case tok::minus:
758      if (!Tok->Previous && Line.MustBeDeclaration)
759        Tok->Type = TT_ObjCMethodSpecifier;
760      break;
761    case tok::colon:
762      if (!Tok->Previous)
763        return false;
764      // Colons from ?: are handled in parseConditional().
765      if (Style.Language == FormatStyle::LK_JavaScript) {
766        if (Contexts.back().ColonIsForRangeExpr || // colon in for loop
767            (Contexts.size() == 1 &&               // switch/case labels
768             !Line.First->isOneOf(tok::kw_enum, tok::kw_case)) ||
769            Contexts.back().ContextKind == tok::l_paren ||  // function params
770            Contexts.back().ContextKind == tok::l_square || // array type
771            (!Contexts.back().IsExpression &&
772             Contexts.back().ContextKind == tok::l_brace) || // object type
773            (Contexts.size() == 1 &&
774             Line.MustBeDeclaration)) { // method/property declaration
775          Contexts.back().IsExpression = false;
776          Tok->Type = TT_JsTypeColon;
777          break;
778        }
779      }
780      if (Contexts.back().ColonIsDictLiteral ||
781          Style.Language == FormatStyle::LK_Proto ||
782          Style.Language == FormatStyle::LK_TextProto) {
783        Tok->Type = TT_DictLiteral;
784        if (Style.Language == FormatStyle::LK_TextProto) {
785          if (FormatToken *Previous = Tok->getPreviousNonComment())
786            Previous->Type = TT_SelectorName;
787        }
788      } else if (Contexts.back().ColonIsObjCMethodExpr ||
789                 Line.startsWith(TT_ObjCMethodSpecifier)) {
790        Tok->Type = TT_ObjCMethodExpr;
791        const FormatToken *BeforePrevious = Tok->Previous->Previous;
792        // Ensure we tag all identifiers in method declarations as
793        // TT_SelectorName.
794        bool UnknownIdentifierInMethodDeclaration =
795            Line.startsWith(TT_ObjCMethodSpecifier) &&
796            Tok->Previous->is(tok::identifier) && Tok->Previous->is(TT_Unknown);
797        if (!BeforePrevious ||
798            // FIXME(bug 36976): ObjC return types shouldn't use TT_CastRParen.
799            !(BeforePrevious->is(TT_CastRParen) ||
800              (BeforePrevious->is(TT_ObjCMethodExpr) &&
801               BeforePrevious->is(tok::colon))) ||
802            BeforePrevious->is(tok::r_square) ||
803            Contexts.back().LongestObjCSelectorName == 0 ||
804            UnknownIdentifierInMethodDeclaration) {
805          Tok->Previous->Type = TT_SelectorName;
806          if (!Contexts.back().FirstObjCSelectorName)
807            Contexts.back().FirstObjCSelectorName = Tok->Previous;
808          else if (Tok->Previous->ColumnWidth >
809                   Contexts.back().LongestObjCSelectorName)
810            Contexts.back().LongestObjCSelectorName =
811                Tok->Previous->ColumnWidth;
812          Tok->Previous->ParameterIndex =
813              Contexts.back().FirstObjCSelectorName->ObjCSelectorNameParts;
814          ++Contexts.back().FirstObjCSelectorName->ObjCSelectorNameParts;
815        }
816      } else if (Contexts.back().ColonIsForRangeExpr) {
817        Tok->Type = TT_RangeBasedForLoopColon;
818      } else if (CurrentToken && CurrentToken->is(tok::numeric_constant)) {
819        Tok->Type = TT_BitFieldColon;
820      } else if (Contexts.size() == 1 &&
821                 !Line.First->isOneOf(tok::kw_enum, tok::kw_case)) {
822        if (Tok->getPreviousNonComment()->isOneOf(tok::r_paren,
823                                                  tok::kw_noexcept))
824          Tok->Type = TT_CtorInitializerColon;
825        else
826          Tok->Type = TT_InheritanceColon;
827      } else if (canBeObjCSelectorComponent(*Tok->Previous) && Tok->Next &&
828                 (Tok->Next->isOneOf(tok::r_paren, tok::comma) ||
829                  (canBeObjCSelectorComponent(*Tok->Next) && Tok->Next->Next &&
830                   Tok->Next->Next->is(tok::colon)))) {
831        // This handles a special macro in ObjC code where selectors including
832        // the colon are passed as macro arguments.
833        Tok->Type = TT_ObjCMethodExpr;
834      } else if (Contexts.back().ContextKind == tok::l_paren) {
835        Tok->Type = TT_InlineASMColon;
836      }
837      break;
838    case tok::pipe:
839    case tok::amp:
840      // | and & in declarations/type expressions represent union and
841      // intersection types, respectively.
842      if (Style.Language == FormatStyle::LK_JavaScript &&
843          !Contexts.back().IsExpression)
844        Tok->Type = TT_JsTypeOperator;
845      break;
846    case tok::kw_if:
847    case tok::kw_while:
848      if (Tok->is(tok::kw_if) && CurrentToken &&
849          CurrentToken->isOneOf(tok::kw_constexpr, tok::identifier))
850        next();
851      if (CurrentToken && CurrentToken->is(tok::l_paren)) {
852        next();
853        if (!parseParens(/*LookForDecls=*/true))
854          return false;
855      }
856      break;
857    case tok::kw_for:
858      if (Style.Language == FormatStyle::LK_JavaScript) {
859        // x.for and {for: ...}
860        if ((Tok->Previous && Tok->Previous->is(tok::period)) ||
861            (Tok->Next && Tok->Next->is(tok::colon)))
862          break;
863        // JS' for await ( ...
864        if (CurrentToken && CurrentToken->is(Keywords.kw_await))
865          next();
866      }
867      Contexts.back().ColonIsForRangeExpr = true;
868      next();
869      if (!parseParens())
870        return false;
871      break;
872    case tok::l_paren:
873      // When faced with 'operator()()', the kw_operator handler incorrectly
874      // marks the first l_paren as a OverloadedOperatorLParen. Here, we make
875      // the first two parens OverloadedOperators and the second l_paren an
876      // OverloadedOperatorLParen.
877      if (Tok->Previous && Tok->Previous->is(tok::r_paren) &&
878          Tok->Previous->MatchingParen &&
879          Tok->Previous->MatchingParen->is(TT_OverloadedOperatorLParen)) {
880        Tok->Previous->Type = TT_OverloadedOperator;
881        Tok->Previous->MatchingParen->Type = TT_OverloadedOperator;
882        Tok->Type = TT_OverloadedOperatorLParen;
883      }
884
885      if (!parseParens())
886        return false;
887      if (Line.MustBeDeclaration && Contexts.size() == 1 &&
888          !Contexts.back().IsExpression && !Line.startsWith(TT_ObjCProperty) &&
889          (!Tok->Previous ||
890           !Tok->Previous->isOneOf(tok::kw_decltype, tok::kw___attribute,
891                                   TT_LeadingJavaAnnotation)))
892        Line.MightBeFunctionDecl = true;
893      break;
894    case tok::l_square:
895      if (!parseSquare())
896        return false;
897      break;
898    case tok::l_brace:
899      if (Style.Language == FormatStyle::LK_TextProto) {
900        FormatToken *Previous = Tok->getPreviousNonComment();
901        if (Previous && Previous->Type != TT_DictLiteral)
902          Previous->Type = TT_SelectorName;
903      }
904      if (!parseBrace())
905        return false;
906      break;
907    case tok::less:
908      if (parseAngle()) {
909        Tok->Type = TT_TemplateOpener;
910        // In TT_Proto, we must distignuish between:
911        //   map<key, value>
912        //   msg < item: data >
913        //   msg: < item: data >
914        // In TT_TextProto, map<key, value> does not occur.
915        if (Style.Language == FormatStyle::LK_TextProto ||
916            (Style.Language == FormatStyle::LK_Proto && Tok->Previous &&
917             Tok->Previous->isOneOf(TT_SelectorName, TT_DictLiteral))) {
918          Tok->Type = TT_DictLiteral;
919          FormatToken *Previous = Tok->getPreviousNonComment();
920          if (Previous && Previous->Type != TT_DictLiteral)
921            Previous->Type = TT_SelectorName;
922        }
923      } else {
924        Tok->Type = TT_BinaryOperator;
925        NonTemplateLess.insert(Tok);
926        CurrentToken = Tok;
927        next();
928      }
929      break;
930    case tok::r_paren:
931    case tok::r_square:
932      return false;
933    case tok::r_brace:
934      // Lines can start with '}'.
935      if (Tok->Previous)
936        return false;
937      break;
938    case tok::greater:
939      if (Style.Language != FormatStyle::LK_TextProto)
940        Tok->Type = TT_BinaryOperator;
941      if (Tok->Previous && Tok->Previous->is(TT_TemplateCloser))
942        Tok->SpacesRequiredBefore = 1;
943      break;
944    case tok::kw_operator:
945      if (Style.Language == FormatStyle::LK_TextProto ||
946          Style.Language == FormatStyle::LK_Proto)
947        break;
948      while (CurrentToken &&
949             !CurrentToken->isOneOf(tok::l_paren, tok::semi, tok::r_paren)) {
950        if (CurrentToken->isOneOf(tok::star, tok::amp))
951          CurrentToken->Type = TT_PointerOrReference;
952        consumeToken();
953        if (CurrentToken && CurrentToken->Previous->isOneOf(
954                                TT_BinaryOperator, TT_UnaryOperator, tok::comma,
955                                tok::star, tok::arrow, tok::amp, tok::ampamp))
956          CurrentToken->Previous->Type = TT_OverloadedOperator;
957      }
958      if (CurrentToken) {
959        CurrentToken->Type = TT_OverloadedOperatorLParen;
960        if (CurrentToken->Previous->is(TT_BinaryOperator))
961          CurrentToken->Previous->Type = TT_OverloadedOperator;
962      }
963      break;
964    case tok::question:
965      if (Style.Language == FormatStyle::LK_JavaScript && Tok->Next &&
966          Tok->Next->isOneOf(tok::semi, tok::comma, tok::colon, tok::r_paren,
967                             tok::r_brace)) {
968        // Question marks before semicolons, colons, etc. indicate optional
969        // types (fields, parameters), e.g.
970        //   function(x?: string, y?) {...}
971        //   class X { y?; }
972        Tok->Type = TT_JsTypeOptionalQuestion;
973        break;
974      }
975      // Declarations cannot be conditional expressions, this can only be part
976      // of a type declaration.
977      if (Line.MustBeDeclaration && !Contexts.back().IsExpression &&
978          Style.Language == FormatStyle::LK_JavaScript)
979        break;
980      parseConditional();
981      break;
982    case tok::kw_template:
983      parseTemplateDeclaration();
984      break;
985    case tok::comma:
986      if (Contexts.back().InCtorInitializer)
987        Tok->Type = TT_CtorInitializerComma;
988      else if (Contexts.back().InInheritanceList)
989        Tok->Type = TT_InheritanceComma;
990      else if (Contexts.back().FirstStartOfName &&
991               (Contexts.size() == 1 || Line.startsWith(tok::kw_for))) {
992        Contexts.back().FirstStartOfName->PartOfMultiVariableDeclStmt = true;
993        Line.IsMultiVariableDeclStmt = true;
994      }
995      if (Contexts.back().IsForEachMacro)
996        Contexts.back().IsExpression = true;
997      break;
998    case tok::identifier:
999      if (Tok->isOneOf(Keywords.kw___has_include,
1000                       Keywords.kw___has_include_next)) {
1001        parseHasInclude();
1002      }
1003      break;
1004    default:
1005      break;
1006    }
1007    return true;
1008  }
1009
1010  void parseIncludeDirective() {
1011    if (CurrentToken && CurrentToken->is(tok::less)) {
1012      next();
1013      while (CurrentToken) {
1014        // Mark tokens up to the trailing line comments as implicit string
1015        // literals.
1016        if (CurrentToken->isNot(tok::comment) &&
1017            !CurrentToken->TokenText.startswith("//"))
1018          CurrentToken->Type = TT_ImplicitStringLiteral;
1019        next();
1020      }
1021    }
1022  }
1023
1024  void parseWarningOrError() {
1025    next();
1026    // We still want to format the whitespace left of the first token of the
1027    // warning or error.
1028    next();
1029    while (CurrentToken) {
1030      CurrentToken->Type = TT_ImplicitStringLiteral;
1031      next();
1032    }
1033  }
1034
1035  void parsePragma() {
1036    next(); // Consume "pragma".
1037    if (CurrentToken &&
1038        CurrentToken->isOneOf(Keywords.kw_mark, Keywords.kw_option)) {
1039      bool IsMark = CurrentToken->is(Keywords.kw_mark);
1040      next(); // Consume "mark".
1041      next(); // Consume first token (so we fix leading whitespace).
1042      while (CurrentToken) {
1043        if (IsMark || CurrentToken->Previous->is(TT_BinaryOperator))
1044          CurrentToken->Type = TT_ImplicitStringLiteral;
1045        next();
1046      }
1047    }
1048  }
1049
1050  void parseHasInclude() {
1051    if (!CurrentToken || !CurrentToken->is(tok::l_paren))
1052      return;
1053    next(); // '('
1054    parseIncludeDirective();
1055    next(); // ')'
1056  }
1057
1058  LineType parsePreprocessorDirective() {
1059    bool IsFirstToken = CurrentToken->IsFirst;
1060    LineType Type = LT_PreprocessorDirective;
1061    next();
1062    if (!CurrentToken)
1063      return Type;
1064
1065    if (Style.Language == FormatStyle::LK_JavaScript && IsFirstToken) {
1066      // JavaScript files can contain shebang lines of the form:
1067      // #!/usr/bin/env node
1068      // Treat these like C++ #include directives.
1069      while (CurrentToken) {
1070        // Tokens cannot be comments here.
1071        CurrentToken->Type = TT_ImplicitStringLiteral;
1072        next();
1073      }
1074      return LT_ImportStatement;
1075    }
1076
1077    if (CurrentToken->Tok.is(tok::numeric_constant)) {
1078      CurrentToken->SpacesRequiredBefore = 1;
1079      return Type;
1080    }
1081    // Hashes in the middle of a line can lead to any strange token
1082    // sequence.
1083    if (!CurrentToken->Tok.getIdentifierInfo())
1084      return Type;
1085    switch (CurrentToken->Tok.getIdentifierInfo()->getPPKeywordID()) {
1086    case tok::pp_include:
1087    case tok::pp_include_next:
1088    case tok::pp_import:
1089      next();
1090      parseIncludeDirective();
1091      Type = LT_ImportStatement;
1092      break;
1093    case tok::pp_error:
1094    case tok::pp_warning:
1095      parseWarningOrError();
1096      break;
1097    case tok::pp_pragma:
1098      parsePragma();
1099      break;
1100    case tok::pp_if:
1101    case tok::pp_elif:
1102      Contexts.back().IsExpression = true;
1103      next();
1104      parseLine();
1105      break;
1106    default:
1107      break;
1108    }
1109    while (CurrentToken) {
1110      FormatToken *Tok = CurrentToken;
1111      next();
1112      if (Tok->is(tok::l_paren))
1113        parseParens();
1114      else if (Tok->isOneOf(Keywords.kw___has_include,
1115                            Keywords.kw___has_include_next))
1116        parseHasInclude();
1117    }
1118    return Type;
1119  }
1120
1121public:
1122  LineType parseLine() {
1123    if (!CurrentToken)
1124      return LT_Invalid;
1125    NonTemplateLess.clear();
1126    if (CurrentToken->is(tok::hash))
1127      return parsePreprocessorDirective();
1128
1129    // Directly allow to 'import <string-literal>' to support protocol buffer
1130    // definitions (github.com/google/protobuf) or missing "#" (either way we
1131    // should not break the line).
1132    IdentifierInfo *Info = CurrentToken->Tok.getIdentifierInfo();
1133    if ((Style.Language == FormatStyle::LK_Java &&
1134         CurrentToken->is(Keywords.kw_package)) ||
1135        (Info && Info->getPPKeywordID() == tok::pp_import &&
1136         CurrentToken->Next &&
1137         CurrentToken->Next->isOneOf(tok::string_literal, tok::identifier,
1138                                     tok::kw_static))) {
1139      next();
1140      parseIncludeDirective();
1141      return LT_ImportStatement;
1142    }
1143
1144    // If this line starts and ends in '<' and '>', respectively, it is likely
1145    // part of "#define <a/b.h>".
1146    if (CurrentToken->is(tok::less) && Line.Last->is(tok::greater)) {
1147      parseIncludeDirective();
1148      return LT_ImportStatement;
1149    }
1150
1151    // In .proto files, top-level options and package statements are very
1152    // similar to import statements and should not be line-wrapped.
1153    if (Style.Language == FormatStyle::LK_Proto && Line.Level == 0 &&
1154        CurrentToken->isOneOf(Keywords.kw_option, Keywords.kw_package)) {
1155      next();
1156      if (CurrentToken && CurrentToken->is(tok::identifier)) {
1157        while (CurrentToken)
1158          next();
1159        return LT_ImportStatement;
1160      }
1161    }
1162
1163    bool KeywordVirtualFound = false;
1164    bool ImportStatement = false;
1165
1166    // import {...} from '...';
1167    if (Style.Language == FormatStyle::LK_JavaScript &&
1168        CurrentToken->is(Keywords.kw_import))
1169      ImportStatement = true;
1170
1171    while (CurrentToken) {
1172      if (CurrentToken->is(tok::kw_virtual))
1173        KeywordVirtualFound = true;
1174      if (Style.Language == FormatStyle::LK_JavaScript) {
1175        // export {...} from '...';
1176        // An export followed by "from 'some string';" is a re-export from
1177        // another module identified by a URI and is treated as a
1178        // LT_ImportStatement (i.e. prevent wraps on it for long URIs).
1179        // Just "export {...};" or "export class ..." should not be treated as
1180        // an import in this sense.
1181        if (Line.First->is(tok::kw_export) &&
1182            CurrentToken->is(Keywords.kw_from) && CurrentToken->Next &&
1183            CurrentToken->Next->isStringLiteral())
1184          ImportStatement = true;
1185        if (isClosureImportStatement(*CurrentToken))
1186          ImportStatement = true;
1187      }
1188      if (!consumeToken())
1189        return LT_Invalid;
1190    }
1191    if (KeywordVirtualFound)
1192      return LT_VirtualFunctionDecl;
1193    if (ImportStatement)
1194      return LT_ImportStatement;
1195
1196    if (Line.startsWith(TT_ObjCMethodSpecifier)) {
1197      if (Contexts.back().FirstObjCSelectorName)
1198        Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
1199            Contexts.back().LongestObjCSelectorName;
1200      return LT_ObjCMethodDecl;
1201    }
1202
1203    return LT_Other;
1204  }
1205
1206private:
1207  bool isClosureImportStatement(const FormatToken &Tok) {
1208    // FIXME: Closure-library specific stuff should not be hard-coded but be
1209    // configurable.
1210    return Tok.TokenText == "goog" && Tok.Next && Tok.Next->is(tok::period) &&
1211           Tok.Next->Next &&
1212           (Tok.Next->Next->TokenText == "module" ||
1213            Tok.Next->Next->TokenText == "provide" ||
1214            Tok.Next->Next->TokenText == "require" ||
1215            Tok.Next->Next->TokenText == "requireType" ||
1216            Tok.Next->Next->TokenText == "forwardDeclare") &&
1217           Tok.Next->Next->Next && Tok.Next->Next->Next->is(tok::l_paren);
1218  }
1219
1220  void resetTokenMetadata(FormatToken *Token) {
1221    if (!Token)
1222      return;
1223
1224    // Reset token type in case we have already looked at it and then
1225    // recovered from an error (e.g. failure to find the matching >).
1226    if (!CurrentToken->isOneOf(
1227            TT_LambdaLSquare, TT_LambdaLBrace, TT_ForEachMacro,
1228            TT_TypenameMacro, TT_FunctionLBrace, TT_ImplicitStringLiteral,
1229            TT_InlineASMBrace, TT_JsFatArrow, TT_LambdaArrow, TT_NamespaceMacro,
1230            TT_OverloadedOperator, TT_RegexLiteral, TT_TemplateString,
1231            TT_ObjCStringLiteral))
1232      CurrentToken->Type = TT_Unknown;
1233    CurrentToken->Role.reset();
1234    CurrentToken->MatchingParen = nullptr;
1235    CurrentToken->FakeLParens.clear();
1236    CurrentToken->FakeRParens = 0;
1237  }
1238
1239  void next() {
1240    if (CurrentToken) {
1241      CurrentToken->NestingLevel = Contexts.size() - 1;
1242      CurrentToken->BindingStrength = Contexts.back().BindingStrength;
1243      modifyContext(*CurrentToken);
1244      determineTokenType(*CurrentToken);
1245      CurrentToken = CurrentToken->Next;
1246    }
1247
1248    resetTokenMetadata(CurrentToken);
1249  }
1250
1251  /// A struct to hold information valid in a specific context, e.g.
1252  /// a pair of parenthesis.
1253  struct Context {
1254    Context(tok::TokenKind ContextKind, unsigned BindingStrength,
1255            bool IsExpression)
1256        : ContextKind(ContextKind), BindingStrength(BindingStrength),
1257          IsExpression(IsExpression) {}
1258
1259    tok::TokenKind ContextKind;
1260    unsigned BindingStrength;
1261    bool IsExpression;
1262    unsigned LongestObjCSelectorName = 0;
1263    bool ColonIsForRangeExpr = false;
1264    bool ColonIsDictLiteral = false;
1265    bool ColonIsObjCMethodExpr = false;
1266    FormatToken *FirstObjCSelectorName = nullptr;
1267    FormatToken *FirstStartOfName = nullptr;
1268    bool CanBeExpression = true;
1269    bool InTemplateArgument = false;
1270    bool InCtorInitializer = false;
1271    bool InInheritanceList = false;
1272    bool CaretFound = false;
1273    bool IsForEachMacro = false;
1274    bool InCpp11AttributeSpecifier = false;
1275    bool InCSharpAttributeSpecifier = false;
1276  };
1277
1278  /// Puts a new \c Context onto the stack \c Contexts for the lifetime
1279  /// of each instance.
1280  struct ScopedContextCreator {
1281    AnnotatingParser &P;
1282
1283    ScopedContextCreator(AnnotatingParser &P, tok::TokenKind ContextKind,
1284                         unsigned Increase)
1285        : P(P) {
1286      P.Contexts.push_back(Context(ContextKind,
1287                                   P.Contexts.back().BindingStrength + Increase,
1288                                   P.Contexts.back().IsExpression));
1289    }
1290
1291    ~ScopedContextCreator() { P.Contexts.pop_back(); }
1292  };
1293
1294  void modifyContext(const FormatToken &Current) {
1295    if (Current.getPrecedence() == prec::Assignment &&
1296        !Line.First->isOneOf(tok::kw_template, tok::kw_using, tok::kw_return) &&
1297        // Type aliases use `type X = ...;` in TypeScript and can be exported
1298        // using `export type ...`.
1299        !(Style.Language == FormatStyle::LK_JavaScript &&
1300          (Line.startsWith(Keywords.kw_type, tok::identifier) ||
1301           Line.startsWith(tok::kw_export, Keywords.kw_type,
1302                           tok::identifier))) &&
1303        (!Current.Previous || Current.Previous->isNot(tok::kw_operator))) {
1304      Contexts.back().IsExpression = true;
1305      if (!Line.startsWith(TT_UnaryOperator)) {
1306        for (FormatToken *Previous = Current.Previous;
1307             Previous && Previous->Previous &&
1308             !Previous->Previous->isOneOf(tok::comma, tok::semi);
1309             Previous = Previous->Previous) {
1310          if (Previous->isOneOf(tok::r_square, tok::r_paren)) {
1311            Previous = Previous->MatchingParen;
1312            if (!Previous)
1313              break;
1314          }
1315          if (Previous->opensScope())
1316            break;
1317          if (Previous->isOneOf(TT_BinaryOperator, TT_UnaryOperator) &&
1318              Previous->isOneOf(tok::star, tok::amp, tok::ampamp) &&
1319              Previous->Previous && Previous->Previous->isNot(tok::equal))
1320            Previous->Type = TT_PointerOrReference;
1321        }
1322      }
1323    } else if (Current.is(tok::lessless) &&
1324               (!Current.Previous || !Current.Previous->is(tok::kw_operator))) {
1325      Contexts.back().IsExpression = true;
1326    } else if (Current.isOneOf(tok::kw_return, tok::kw_throw)) {
1327      Contexts.back().IsExpression = true;
1328    } else if (Current.is(TT_TrailingReturnArrow)) {
1329      Contexts.back().IsExpression = false;
1330    } else if (Current.is(TT_LambdaArrow) || Current.is(Keywords.kw_assert)) {
1331      Contexts.back().IsExpression = Style.Language == FormatStyle::LK_Java;
1332    } else if (Current.Previous &&
1333               Current.Previous->is(TT_CtorInitializerColon)) {
1334      Contexts.back().IsExpression = true;
1335      Contexts.back().InCtorInitializer = true;
1336    } else if (Current.Previous && Current.Previous->is(TT_InheritanceColon)) {
1337      Contexts.back().InInheritanceList = true;
1338    } else if (Current.isOneOf(tok::r_paren, tok::greater, tok::comma)) {
1339      for (FormatToken *Previous = Current.Previous;
1340           Previous && Previous->isOneOf(tok::star, tok::amp);
1341           Previous = Previous->Previous)
1342        Previous->Type = TT_PointerOrReference;
1343      if (Line.MustBeDeclaration && !Contexts.front().InCtorInitializer)
1344        Contexts.back().IsExpression = false;
1345    } else if (Current.is(tok::kw_new)) {
1346      Contexts.back().CanBeExpression = false;
1347    } else if (Current.is(tok::semi) ||
1348               (Current.is(tok::exclaim) && Current.Previous &&
1349                !Current.Previous->is(tok::kw_operator))) {
1350      // This should be the condition or increment in a for-loop.
1351      // But not operator !() (can't use TT_OverloadedOperator here as its not
1352      // been annotated yet).
1353      Contexts.back().IsExpression = true;
1354    }
1355  }
1356
1357  static FormatToken *untilMatchingParen(FormatToken *Current) {
1358    // Used when `MatchingParen` is not yet established.
1359    int ParenLevel = 0;
1360    while (Current) {
1361      if (Current->is(tok::l_paren))
1362        ParenLevel++;
1363      if (Current->is(tok::r_paren))
1364        ParenLevel--;
1365      if (ParenLevel < 1)
1366        break;
1367      Current = Current->Next;
1368    }
1369    return Current;
1370  }
1371
1372  static bool isDeductionGuide(FormatToken &Current) {
1373    // Look for a deduction guide template<T> A(...) -> A<...>;
1374    if (Current.Previous && Current.Previous->is(tok::r_paren) &&
1375        Current.startsSequence(tok::arrow, tok::identifier, tok::less)) {
1376      // Find the TemplateCloser.
1377      FormatToken *TemplateCloser = Current.Next->Next;
1378      int NestingLevel = 0;
1379      while (TemplateCloser) {
1380        // Skip over an expressions in parens  A<(3 < 2)>;
1381        if (TemplateCloser->is(tok::l_paren)) {
1382          // No Matching Paren yet so skip to matching paren
1383          TemplateCloser = untilMatchingParen(TemplateCloser);
1384        }
1385        if (TemplateCloser->is(tok::less))
1386          NestingLevel++;
1387        if (TemplateCloser->is(tok::greater))
1388          NestingLevel--;
1389        if (NestingLevel < 1)
1390          break;
1391        TemplateCloser = TemplateCloser->Next;
1392      }
1393      // Assuming we have found the end of the template ensure its followed
1394      // with a semi-colon.
1395      if (TemplateCloser && TemplateCloser->Next &&
1396          TemplateCloser->Next->is(tok::semi) &&
1397          Current.Previous->MatchingParen) {
1398        // Determine if the identifier `A` prior to the A<..>; is the same as
1399        // prior to the A(..)
1400        FormatToken *LeadingIdentifier =
1401            Current.Previous->MatchingParen->Previous;
1402
1403        // Differentiate a deduction guide by seeing the
1404        // > of the template prior to the leading identifier.
1405        if (LeadingIdentifier) {
1406          FormatToken *PriorLeadingIdentifier = LeadingIdentifier->Previous;
1407          // Skip back past explicit decoration
1408          if (PriorLeadingIdentifier &&
1409              PriorLeadingIdentifier->is(tok::kw_explicit))
1410            PriorLeadingIdentifier = PriorLeadingIdentifier->Previous;
1411
1412          return (PriorLeadingIdentifier &&
1413                  PriorLeadingIdentifier->is(TT_TemplateCloser) &&
1414                  LeadingIdentifier->TokenText == Current.Next->TokenText);
1415        }
1416      }
1417    }
1418    return false;
1419  }
1420
1421  void determineTokenType(FormatToken &Current) {
1422    if (!Current.is(TT_Unknown))
1423      // The token type is already known.
1424      return;
1425
1426    if (Style.Language == FormatStyle::LK_JavaScript) {
1427      if (Current.is(tok::exclaim)) {
1428        if (Current.Previous &&
1429            (Current.Previous->isOneOf(tok::identifier, tok::kw_namespace,
1430                                       tok::r_paren, tok::r_square,
1431                                       tok::r_brace) ||
1432             Current.Previous->Tok.isLiteral())) {
1433          Current.Type = TT_JsNonNullAssertion;
1434          return;
1435        }
1436        if (Current.Next &&
1437            Current.Next->isOneOf(TT_BinaryOperator, Keywords.kw_as)) {
1438          Current.Type = TT_JsNonNullAssertion;
1439          return;
1440        }
1441      }
1442    }
1443
1444    // Line.MightBeFunctionDecl can only be true after the parentheses of a
1445    // function declaration have been found. In this case, 'Current' is a
1446    // trailing token of this declaration and thus cannot be a name.
1447    if (Current.is(Keywords.kw_instanceof)) {
1448      Current.Type = TT_BinaryOperator;
1449    } else if (isStartOfName(Current) &&
1450               (!Line.MightBeFunctionDecl || Current.NestingLevel != 0)) {
1451      Contexts.back().FirstStartOfName = &Current;
1452      Current.Type = TT_StartOfName;
1453    } else if (Current.is(tok::semi)) {
1454      // Reset FirstStartOfName after finding a semicolon so that a for loop
1455      // with multiple increment statements is not confused with a for loop
1456      // having multiple variable declarations.
1457      Contexts.back().FirstStartOfName = nullptr;
1458    } else if (Current.isOneOf(tok::kw_auto, tok::kw___auto_type)) {
1459      AutoFound = true;
1460    } else if (Current.is(tok::arrow) &&
1461               Style.Language == FormatStyle::LK_Java) {
1462      Current.Type = TT_LambdaArrow;
1463    } else if (Current.is(tok::arrow) && AutoFound && Line.MustBeDeclaration &&
1464               Current.NestingLevel == 0 &&
1465               !Current.Previous->is(tok::kw_operator)) {
1466      // not auto operator->() -> xxx;
1467      Current.Type = TT_TrailingReturnArrow;
1468
1469    } else if (isDeductionGuide(Current)) {
1470      // Deduction guides trailing arrow " A(...) -> A<T>;".
1471      Current.Type = TT_TrailingReturnArrow;
1472    } else if (Current.isOneOf(tok::star, tok::amp, tok::ampamp)) {
1473      Current.Type = determineStarAmpUsage(Current,
1474                                           Contexts.back().CanBeExpression &&
1475                                               Contexts.back().IsExpression,
1476                                           Contexts.back().InTemplateArgument);
1477    } else if (Current.isOneOf(tok::minus, tok::plus, tok::caret)) {
1478      Current.Type = determinePlusMinusCaretUsage(Current);
1479      if (Current.is(TT_UnaryOperator) && Current.is(tok::caret))
1480        Contexts.back().CaretFound = true;
1481    } else if (Current.isOneOf(tok::minusminus, tok::plusplus)) {
1482      Current.Type = determineIncrementUsage(Current);
1483    } else if (Current.isOneOf(tok::exclaim, tok::tilde)) {
1484      Current.Type = TT_UnaryOperator;
1485    } else if (Current.is(tok::question)) {
1486      if (Style.Language == FormatStyle::LK_JavaScript &&
1487          Line.MustBeDeclaration && !Contexts.back().IsExpression) {
1488        // In JavaScript, `interface X { foo?(): bar; }` is an optional method
1489        // on the interface, not a ternary expression.
1490        Current.Type = TT_JsTypeOptionalQuestion;
1491      } else {
1492        Current.Type = TT_ConditionalExpr;
1493      }
1494    } else if (Current.isBinaryOperator() &&
1495               (!Current.Previous || Current.Previous->isNot(tok::l_square)) &&
1496               (!Current.is(tok::greater) &&
1497                Style.Language != FormatStyle::LK_TextProto)) {
1498      Current.Type = TT_BinaryOperator;
1499    } else if (Current.is(tok::comment)) {
1500      if (Current.TokenText.startswith("/*")) {
1501        if (Current.TokenText.endswith("*/"))
1502          Current.Type = TT_BlockComment;
1503        else
1504          // The lexer has for some reason determined a comment here. But we
1505          // cannot really handle it, if it isn't properly terminated.
1506          Current.Tok.setKind(tok::unknown);
1507      } else {
1508        Current.Type = TT_LineComment;
1509      }
1510    } else if (Current.is(tok::r_paren)) {
1511      if (rParenEndsCast(Current))
1512        Current.Type = TT_CastRParen;
1513      if (Current.MatchingParen && Current.Next &&
1514          !Current.Next->isBinaryOperator() &&
1515          !Current.Next->isOneOf(tok::semi, tok::colon, tok::l_brace,
1516                                 tok::comma, tok::period, tok::arrow,
1517                                 tok::coloncolon))
1518        if (FormatToken *AfterParen = Current.MatchingParen->Next) {
1519          // Make sure this isn't the return type of an Obj-C block declaration
1520          if (AfterParen->Tok.isNot(tok::caret)) {
1521            if (FormatToken *BeforeParen = Current.MatchingParen->Previous)
1522              if (BeforeParen->is(tok::identifier) &&
1523                  !BeforeParen->is(TT_TypenameMacro) &&
1524                  BeforeParen->TokenText == BeforeParen->TokenText.upper() &&
1525                  (!BeforeParen->Previous ||
1526                   BeforeParen->Previous->ClosesTemplateDeclaration))
1527                Current.Type = TT_FunctionAnnotationRParen;
1528          }
1529        }
1530    } else if (Current.is(tok::at) && Current.Next &&
1531               Style.Language != FormatStyle::LK_JavaScript &&
1532               Style.Language != FormatStyle::LK_Java) {
1533      // In Java & JavaScript, "@..." is a decorator or annotation. In ObjC, it
1534      // marks declarations and properties that need special formatting.
1535      switch (Current.Next->Tok.getObjCKeywordID()) {
1536      case tok::objc_interface:
1537      case tok::objc_implementation:
1538      case tok::objc_protocol:
1539        Current.Type = TT_ObjCDecl;
1540        break;
1541      case tok::objc_property:
1542        Current.Type = TT_ObjCProperty;
1543        break;
1544      default:
1545        break;
1546      }
1547    } else if (Current.is(tok::period)) {
1548      FormatToken *PreviousNoComment = Current.getPreviousNonComment();
1549      if (PreviousNoComment &&
1550          PreviousNoComment->isOneOf(tok::comma, tok::l_brace))
1551        Current.Type = TT_DesignatedInitializerPeriod;
1552      else if (Style.Language == FormatStyle::LK_Java && Current.Previous &&
1553               Current.Previous->isOneOf(TT_JavaAnnotation,
1554                                         TT_LeadingJavaAnnotation)) {
1555        Current.Type = Current.Previous->Type;
1556      }
1557    } else if (canBeObjCSelectorComponent(Current) &&
1558               // FIXME(bug 36976): ObjC return types shouldn't use
1559               // TT_CastRParen.
1560               Current.Previous && Current.Previous->is(TT_CastRParen) &&
1561               Current.Previous->MatchingParen &&
1562               Current.Previous->MatchingParen->Previous &&
1563               Current.Previous->MatchingParen->Previous->is(
1564                   TT_ObjCMethodSpecifier)) {
1565      // This is the first part of an Objective-C selector name. (If there's no
1566      // colon after this, this is the only place which annotates the identifier
1567      // as a selector.)
1568      Current.Type = TT_SelectorName;
1569    } else if (Current.isOneOf(tok::identifier, tok::kw_const,
1570                               tok::kw_noexcept) &&
1571               Current.Previous &&
1572               !Current.Previous->isOneOf(tok::equal, tok::at) &&
1573               Line.MightBeFunctionDecl && Contexts.size() == 1) {
1574      // Line.MightBeFunctionDecl can only be true after the parentheses of a
1575      // function declaration have been found.
1576      Current.Type = TT_TrailingAnnotation;
1577    } else if ((Style.Language == FormatStyle::LK_Java ||
1578                Style.Language == FormatStyle::LK_JavaScript) &&
1579               Current.Previous) {
1580      if (Current.Previous->is(tok::at) &&
1581          Current.isNot(Keywords.kw_interface)) {
1582        const FormatToken &AtToken = *Current.Previous;
1583        const FormatToken *Previous = AtToken.getPreviousNonComment();
1584        if (!Previous || Previous->is(TT_LeadingJavaAnnotation))
1585          Current.Type = TT_LeadingJavaAnnotation;
1586        else
1587          Current.Type = TT_JavaAnnotation;
1588      } else if (Current.Previous->is(tok::period) &&
1589                 Current.Previous->isOneOf(TT_JavaAnnotation,
1590                                           TT_LeadingJavaAnnotation)) {
1591        Current.Type = Current.Previous->Type;
1592      }
1593    }
1594  }
1595
1596  /// Take a guess at whether \p Tok starts a name of a function or
1597  /// variable declaration.
1598  ///
1599  /// This is a heuristic based on whether \p Tok is an identifier following
1600  /// something that is likely a type.
1601  bool isStartOfName(const FormatToken &Tok) {
1602    if (Tok.isNot(tok::identifier) || !Tok.Previous)
1603      return false;
1604
1605    if (Tok.Previous->isOneOf(TT_LeadingJavaAnnotation, Keywords.kw_instanceof,
1606                              Keywords.kw_as))
1607      return false;
1608    if (Style.Language == FormatStyle::LK_JavaScript &&
1609        Tok.Previous->is(Keywords.kw_in))
1610      return false;
1611
1612    // Skip "const" as it does not have an influence on whether this is a name.
1613    FormatToken *PreviousNotConst = Tok.getPreviousNonComment();
1614    while (PreviousNotConst && PreviousNotConst->is(tok::kw_const))
1615      PreviousNotConst = PreviousNotConst->getPreviousNonComment();
1616
1617    if (!PreviousNotConst)
1618      return false;
1619
1620    bool IsPPKeyword = PreviousNotConst->is(tok::identifier) &&
1621                       PreviousNotConst->Previous &&
1622                       PreviousNotConst->Previous->is(tok::hash);
1623
1624    if (PreviousNotConst->is(TT_TemplateCloser))
1625      return PreviousNotConst && PreviousNotConst->MatchingParen &&
1626             PreviousNotConst->MatchingParen->Previous &&
1627             PreviousNotConst->MatchingParen->Previous->isNot(tok::period) &&
1628             PreviousNotConst->MatchingParen->Previous->isNot(tok::kw_template);
1629
1630    if (PreviousNotConst->is(tok::r_paren) && PreviousNotConst->MatchingParen &&
1631        PreviousNotConst->MatchingParen->Previous &&
1632        PreviousNotConst->MatchingParen->Previous->is(tok::kw_decltype))
1633      return true;
1634
1635    return (!IsPPKeyword &&
1636            PreviousNotConst->isOneOf(tok::identifier, tok::kw_auto)) ||
1637           PreviousNotConst->is(TT_PointerOrReference) ||
1638           PreviousNotConst->isSimpleTypeSpecifier();
1639  }
1640
1641  /// Determine whether ')' is ending a cast.
1642  bool rParenEndsCast(const FormatToken &Tok) {
1643    // C-style casts are only used in C++ and Java.
1644    if (!Style.isCpp() && Style.Language != FormatStyle::LK_Java)
1645      return false;
1646
1647    // Empty parens aren't casts and there are no casts at the end of the line.
1648    if (Tok.Previous == Tok.MatchingParen || !Tok.Next || !Tok.MatchingParen)
1649      return false;
1650
1651    FormatToken *LeftOfParens = Tok.MatchingParen->getPreviousNonComment();
1652    if (LeftOfParens) {
1653      // If there is a closing parenthesis left of the current parentheses,
1654      // look past it as these might be chained casts.
1655      if (LeftOfParens->is(tok::r_paren)) {
1656        if (!LeftOfParens->MatchingParen ||
1657            !LeftOfParens->MatchingParen->Previous)
1658          return false;
1659        LeftOfParens = LeftOfParens->MatchingParen->Previous;
1660      }
1661
1662      // If there is an identifier (or with a few exceptions a keyword) right
1663      // before the parentheses, this is unlikely to be a cast.
1664      if (LeftOfParens->Tok.getIdentifierInfo() &&
1665          !LeftOfParens->isOneOf(Keywords.kw_in, tok::kw_return, tok::kw_case,
1666                                 tok::kw_delete))
1667        return false;
1668
1669      // Certain other tokens right before the parentheses are also signals that
1670      // this cannot be a cast.
1671      if (LeftOfParens->isOneOf(tok::at, tok::r_square, TT_OverloadedOperator,
1672                                TT_TemplateCloser, tok::ellipsis))
1673        return false;
1674    }
1675
1676    if (Tok.Next->is(tok::question))
1677      return false;
1678
1679    // Functions which end with decorations like volatile, noexcept are unlikely
1680    // to be casts.
1681    if (Tok.Next->isOneOf(tok::kw_noexcept, tok::kw_volatile, tok::kw_const,
1682                          tok::kw_throw, tok::arrow, Keywords.kw_override,
1683                          Keywords.kw_final) ||
1684        isCpp11AttributeSpecifier(*Tok.Next))
1685      return false;
1686
1687    // As Java has no function types, a "(" after the ")" likely means that this
1688    // is a cast.
1689    if (Style.Language == FormatStyle::LK_Java && Tok.Next->is(tok::l_paren))
1690      return true;
1691
1692    // If a (non-string) literal follows, this is likely a cast.
1693    if (Tok.Next->isNot(tok::string_literal) &&
1694        (Tok.Next->Tok.isLiteral() ||
1695         Tok.Next->isOneOf(tok::kw_sizeof, tok::kw_alignof)))
1696      return true;
1697
1698    // Heuristically try to determine whether the parentheses contain a type.
1699    bool ParensAreType =
1700        !Tok.Previous ||
1701        Tok.Previous->isOneOf(TT_PointerOrReference, TT_TemplateCloser) ||
1702        Tok.Previous->isSimpleTypeSpecifier();
1703    bool ParensCouldEndDecl =
1704        Tok.Next->isOneOf(tok::equal, tok::semi, tok::l_brace, tok::greater);
1705    if (ParensAreType && !ParensCouldEndDecl)
1706      return true;
1707
1708    // At this point, we heuristically assume that there are no casts at the
1709    // start of the line. We assume that we have found most cases where there
1710    // are by the logic above, e.g. "(void)x;".
1711    if (!LeftOfParens)
1712      return false;
1713
1714    // Certain token types inside the parentheses mean that this can't be a
1715    // cast.
1716    for (const FormatToken *Token = Tok.MatchingParen->Next; Token != &Tok;
1717         Token = Token->Next)
1718      if (Token->is(TT_BinaryOperator))
1719        return false;
1720
1721    // If the following token is an identifier or 'this', this is a cast. All
1722    // cases where this can be something else are handled above.
1723    if (Tok.Next->isOneOf(tok::identifier, tok::kw_this))
1724      return true;
1725
1726    if (!Tok.Next->Next)
1727      return false;
1728
1729    // If the next token after the parenthesis is a unary operator, assume
1730    // that this is cast, unless there are unexpected tokens inside the
1731    // parenthesis.
1732    bool NextIsUnary =
1733        Tok.Next->isUnaryOperator() || Tok.Next->isOneOf(tok::amp, tok::star);
1734    if (!NextIsUnary || Tok.Next->is(tok::plus) ||
1735        !Tok.Next->Next->isOneOf(tok::identifier, tok::numeric_constant))
1736      return false;
1737    // Search for unexpected tokens.
1738    for (FormatToken *Prev = Tok.Previous; Prev != Tok.MatchingParen;
1739         Prev = Prev->Previous) {
1740      if (!Prev->isOneOf(tok::kw_const, tok::identifier, tok::coloncolon))
1741        return false;
1742    }
1743    return true;
1744  }
1745
1746  /// Return the type of the given token assuming it is * or &.
1747  TokenType determineStarAmpUsage(const FormatToken &Tok, bool IsExpression,
1748                                  bool InTemplateArgument) {
1749    if (Style.Language == FormatStyle::LK_JavaScript)
1750      return TT_BinaryOperator;
1751
1752    const FormatToken *PrevToken = Tok.getPreviousNonComment();
1753    if (!PrevToken)
1754      return TT_UnaryOperator;
1755
1756    const FormatToken *NextToken = Tok.getNextNonComment();
1757    if (!NextToken ||
1758        NextToken->isOneOf(tok::arrow, tok::equal, tok::kw_const,
1759                           tok::kw_noexcept) ||
1760        (NextToken->is(tok::l_brace) && !NextToken->getNextNonComment()))
1761      return TT_PointerOrReference;
1762
1763    if (PrevToken->is(tok::coloncolon))
1764      return TT_PointerOrReference;
1765
1766    if (PrevToken->isOneOf(tok::l_paren, tok::l_square, tok::l_brace,
1767                           tok::comma, tok::semi, tok::kw_return, tok::colon,
1768                           tok::equal, tok::kw_delete, tok::kw_sizeof,
1769                           tok::kw_throw) ||
1770        PrevToken->isOneOf(TT_BinaryOperator, TT_ConditionalExpr,
1771                           TT_UnaryOperator, TT_CastRParen))
1772      return TT_UnaryOperator;
1773
1774    if (NextToken->is(tok::l_square) && NextToken->isNot(TT_LambdaLSquare))
1775      return TT_PointerOrReference;
1776    if (NextToken->is(tok::kw_operator) && !IsExpression)
1777      return TT_PointerOrReference;
1778    if (NextToken->isOneOf(tok::comma, tok::semi))
1779      return TT_PointerOrReference;
1780
1781    if (PrevToken->is(tok::r_paren) && PrevToken->MatchingParen) {
1782      FormatToken *TokenBeforeMatchingParen =
1783          PrevToken->MatchingParen->getPreviousNonComment();
1784      if (TokenBeforeMatchingParen &&
1785          TokenBeforeMatchingParen->isOneOf(tok::kw_typeof, tok::kw_decltype,
1786                                            TT_TypenameMacro))
1787        return TT_PointerOrReference;
1788    }
1789
1790    if (PrevToken->Tok.isLiteral() ||
1791        PrevToken->isOneOf(tok::r_paren, tok::r_square, tok::kw_true,
1792                           tok::kw_false, tok::r_brace) ||
1793        NextToken->Tok.isLiteral() ||
1794        NextToken->isOneOf(tok::kw_true, tok::kw_false) ||
1795        NextToken->isUnaryOperator() ||
1796        // If we know we're in a template argument, there are no named
1797        // declarations. Thus, having an identifier on the right-hand side
1798        // indicates a binary operator.
1799        (InTemplateArgument && NextToken->Tok.isAnyIdentifier()))
1800      return TT_BinaryOperator;
1801
1802    // "&&(" is quite unlikely to be two successive unary "&".
1803    if (Tok.is(tok::ampamp) && NextToken && NextToken->is(tok::l_paren))
1804      return TT_BinaryOperator;
1805
1806    // This catches some cases where evaluation order is used as control flow:
1807    //   aaa && aaa->f();
1808    const FormatToken *NextNextToken = NextToken->getNextNonComment();
1809    if (NextNextToken && NextNextToken->is(tok::arrow))
1810      return TT_BinaryOperator;
1811
1812    // It is very unlikely that we are going to find a pointer or reference type
1813    // definition on the RHS of an assignment.
1814    if (IsExpression && !Contexts.back().CaretFound)
1815      return TT_BinaryOperator;
1816
1817    return TT_PointerOrReference;
1818  }
1819
1820  TokenType determinePlusMinusCaretUsage(const FormatToken &Tok) {
1821    const FormatToken *PrevToken = Tok.getPreviousNonComment();
1822    if (!PrevToken)
1823      return TT_UnaryOperator;
1824
1825    if (PrevToken->isOneOf(TT_CastRParen, TT_UnaryOperator))
1826      // This must be a sequence of leading unary operators.
1827      return TT_UnaryOperator;
1828
1829    // Use heuristics to recognize unary operators.
1830    if (PrevToken->isOneOf(tok::equal, tok::l_paren, tok::comma, tok::l_square,
1831                           tok::question, tok::colon, tok::kw_return,
1832                           tok::kw_case, tok::at, tok::l_brace, tok::kw_throw,
1833                           tok::kw_co_return, tok::kw_co_yield))
1834      return TT_UnaryOperator;
1835
1836    // There can't be two consecutive binary operators.
1837    if (PrevToken->is(TT_BinaryOperator))
1838      return TT_UnaryOperator;
1839
1840    // Fall back to marking the token as binary operator.
1841    return TT_BinaryOperator;
1842  }
1843
1844  /// Determine whether ++/-- are pre- or post-increments/-decrements.
1845  TokenType determineIncrementUsage(const FormatToken &Tok) {
1846    const FormatToken *PrevToken = Tok.getPreviousNonComment();
1847    if (!PrevToken || PrevToken->is(TT_CastRParen))
1848      return TT_UnaryOperator;
1849    if (PrevToken->isOneOf(tok::r_paren, tok::r_square, tok::identifier))
1850      return TT_TrailingUnaryOperator;
1851
1852    return TT_UnaryOperator;
1853  }
1854
1855  SmallVector<Context, 8> Contexts;
1856
1857  const FormatStyle &Style;
1858  AnnotatedLine &Line;
1859  FormatToken *CurrentToken;
1860  bool AutoFound;
1861  const AdditionalKeywords &Keywords;
1862
1863  // Set of "<" tokens that do not open a template parameter list. If parseAngle
1864  // determines that a specific token can't be a template opener, it will make
1865  // same decision irrespective of the decisions for tokens leading up to it.
1866  // Store this information to prevent this from causing exponential runtime.
1867  llvm::SmallPtrSet<FormatToken *, 16> NonTemplateLess;
1868};
1869
1870static const int PrecedenceUnaryOperator = prec::PointerToMember + 1;
1871static const int PrecedenceArrowAndPeriod = prec::PointerToMember + 2;
1872
1873/// Parses binary expressions by inserting fake parenthesis based on
1874/// operator precedence.
1875class ExpressionParser {
1876public:
1877  ExpressionParser(const FormatStyle &Style, const AdditionalKeywords &Keywords,
1878                   AnnotatedLine &Line)
1879      : Style(Style), Keywords(Keywords), Current(Line.First) {}
1880
1881  /// Parse expressions with the given operator precedence.
1882  void parse(int Precedence = 0) {
1883    // Skip 'return' and ObjC selector colons as they are not part of a binary
1884    // expression.
1885    while (Current && (Current->is(tok::kw_return) ||
1886                       (Current->is(tok::colon) &&
1887                        Current->isOneOf(TT_ObjCMethodExpr, TT_DictLiteral))))
1888      next();
1889
1890    if (!Current || Precedence > PrecedenceArrowAndPeriod)
1891      return;
1892
1893    // Conditional expressions need to be parsed separately for proper nesting.
1894    if (Precedence == prec::Conditional) {
1895      parseConditionalExpr();
1896      return;
1897    }
1898
1899    // Parse unary operators, which all have a higher precedence than binary
1900    // operators.
1901    if (Precedence == PrecedenceUnaryOperator) {
1902      parseUnaryOperator();
1903      return;
1904    }
1905
1906    FormatToken *Start = Current;
1907    FormatToken *LatestOperator = nullptr;
1908    unsigned OperatorIndex = 0;
1909
1910    while (Current) {
1911      // Consume operators with higher precedence.
1912      parse(Precedence + 1);
1913
1914      int CurrentPrecedence = getCurrentPrecedence();
1915
1916      if (Current && Current->is(TT_SelectorName) &&
1917          Precedence == CurrentPrecedence) {
1918        if (LatestOperator)
1919          addFakeParenthesis(Start, prec::Level(Precedence));
1920        Start = Current;
1921      }
1922
1923      // At the end of the line or when an operator with higher precedence is
1924      // found, insert fake parenthesis and return.
1925      if (!Current ||
1926          (Current->closesScope() &&
1927           (Current->MatchingParen || Current->is(TT_TemplateString))) ||
1928          (CurrentPrecedence != -1 && CurrentPrecedence < Precedence) ||
1929          (CurrentPrecedence == prec::Conditional &&
1930           Precedence == prec::Assignment && Current->is(tok::colon))) {
1931        break;
1932      }
1933
1934      // Consume scopes: (), [], <> and {}
1935      if (Current->opensScope()) {
1936        // In fragment of a JavaScript template string can look like '}..${' and
1937        // thus close a scope and open a new one at the same time.
1938        while (Current && (!Current->closesScope() || Current->opensScope())) {
1939          next();
1940          parse();
1941        }
1942        next();
1943      } else {
1944        // Operator found.
1945        if (CurrentPrecedence == Precedence) {
1946          if (LatestOperator)
1947            LatestOperator->NextOperator = Current;
1948          LatestOperator = Current;
1949          Current->OperatorIndex = OperatorIndex;
1950          ++OperatorIndex;
1951        }
1952        next(/*SkipPastLeadingComments=*/Precedence > 0);
1953      }
1954    }
1955
1956    if (LatestOperator && (Current || Precedence > 0)) {
1957      // LatestOperator->LastOperator = true;
1958      if (Precedence == PrecedenceArrowAndPeriod) {
1959        // Call expressions don't have a binary operator precedence.
1960        addFakeParenthesis(Start, prec::Unknown);
1961      } else {
1962        addFakeParenthesis(Start, prec::Level(Precedence));
1963      }
1964    }
1965  }
1966
1967private:
1968  /// Gets the precedence (+1) of the given token for binary operators
1969  /// and other tokens that we treat like binary operators.
1970  int getCurrentPrecedence() {
1971    if (Current) {
1972      const FormatToken *NextNonComment = Current->getNextNonComment();
1973      if (Current->is(TT_ConditionalExpr))
1974        return prec::Conditional;
1975      if (NextNonComment && Current->is(TT_SelectorName) &&
1976          (NextNonComment->isOneOf(TT_DictLiteral, TT_JsTypeColon) ||
1977           ((Style.Language == FormatStyle::LK_Proto ||
1978             Style.Language == FormatStyle::LK_TextProto) &&
1979            NextNonComment->is(tok::less))))
1980        return prec::Assignment;
1981      if (Current->is(TT_JsComputedPropertyName))
1982        return prec::Assignment;
1983      if (Current->is(TT_LambdaArrow))
1984        return prec::Comma;
1985      if (Current->is(TT_JsFatArrow))
1986        return prec::Assignment;
1987      if (Current->isOneOf(tok::semi, TT_InlineASMColon, TT_SelectorName) ||
1988          (Current->is(tok::comment) && NextNonComment &&
1989           NextNonComment->is(TT_SelectorName)))
1990        return 0;
1991      if (Current->is(TT_RangeBasedForLoopColon))
1992        return prec::Comma;
1993      if ((Style.Language == FormatStyle::LK_Java ||
1994           Style.Language == FormatStyle::LK_JavaScript) &&
1995          Current->is(Keywords.kw_instanceof))
1996        return prec::Relational;
1997      if (Style.Language == FormatStyle::LK_JavaScript &&
1998          Current->isOneOf(Keywords.kw_in, Keywords.kw_as))
1999        return prec::Relational;
2000      if (Current->is(TT_BinaryOperator) || Current->is(tok::comma))
2001        return Current->getPrecedence();
2002      if (Current->isOneOf(tok::period, tok::arrow))
2003        return PrecedenceArrowAndPeriod;
2004      if ((Style.Language == FormatStyle::LK_Java ||
2005           Style.Language == FormatStyle::LK_JavaScript) &&
2006          Current->isOneOf(Keywords.kw_extends, Keywords.kw_implements,
2007                           Keywords.kw_throws))
2008        return 0;
2009    }
2010    return -1;
2011  }
2012
2013  void addFakeParenthesis(FormatToken *Start, prec::Level Precedence) {
2014    Start->FakeLParens.push_back(Precedence);
2015    if (Precedence > prec::Unknown)
2016      Start->StartsBinaryExpression = true;
2017    if (Current) {
2018      FormatToken *Previous = Current->Previous;
2019      while (Previous->is(tok::comment) && Previous->Previous)
2020        Previous = Previous->Previous;
2021      ++Previous->FakeRParens;
2022      if (Precedence > prec::Unknown)
2023        Previous->EndsBinaryExpression = true;
2024    }
2025  }
2026
2027  /// Parse unary operator expressions and surround them with fake
2028  /// parentheses if appropriate.
2029  void parseUnaryOperator() {
2030    llvm::SmallVector<FormatToken *, 2> Tokens;
2031    while (Current && Current->is(TT_UnaryOperator)) {
2032      Tokens.push_back(Current);
2033      next();
2034    }
2035    parse(PrecedenceArrowAndPeriod);
2036    for (FormatToken *Token : llvm::reverse(Tokens))
2037      // The actual precedence doesn't matter.
2038      addFakeParenthesis(Token, prec::Unknown);
2039  }
2040
2041  void parseConditionalExpr() {
2042    while (Current && Current->isTrailingComment()) {
2043      next();
2044    }
2045    FormatToken *Start = Current;
2046    parse(prec::LogicalOr);
2047    if (!Current || !Current->is(tok::question))
2048      return;
2049    next();
2050    parse(prec::Assignment);
2051    if (!Current || Current->isNot(TT_ConditionalExpr))
2052      return;
2053    next();
2054    parse(prec::Assignment);
2055    addFakeParenthesis(Start, prec::Conditional);
2056  }
2057
2058  void next(bool SkipPastLeadingComments = true) {
2059    if (Current)
2060      Current = Current->Next;
2061    while (Current &&
2062           (Current->NewlinesBefore == 0 || SkipPastLeadingComments) &&
2063           Current->isTrailingComment())
2064      Current = Current->Next;
2065  }
2066
2067  const FormatStyle &Style;
2068  const AdditionalKeywords &Keywords;
2069  FormatToken *Current;
2070};
2071
2072} // end anonymous namespace
2073
2074void TokenAnnotator::setCommentLineLevels(
2075    SmallVectorImpl<AnnotatedLine *> &Lines) {
2076  const AnnotatedLine *NextNonCommentLine = nullptr;
2077  for (SmallVectorImpl<AnnotatedLine *>::reverse_iterator I = Lines.rbegin(),
2078                                                          E = Lines.rend();
2079       I != E; ++I) {
2080    bool CommentLine = true;
2081    for (const FormatToken *Tok = (*I)->First; Tok; Tok = Tok->Next) {
2082      if (!Tok->is(tok::comment)) {
2083        CommentLine = false;
2084        break;
2085      }
2086    }
2087
2088    // If the comment is currently aligned with the line immediately following
2089    // it, that's probably intentional and we should keep it.
2090    if (NextNonCommentLine && CommentLine &&
2091        NextNonCommentLine->First->NewlinesBefore <= 1 &&
2092        NextNonCommentLine->First->OriginalColumn ==
2093            (*I)->First->OriginalColumn) {
2094      // Align comments for preprocessor lines with the # in column 0 if
2095      // preprocessor lines are not indented. Otherwise, align with the next
2096      // line.
2097      (*I)->Level =
2098          (Style.IndentPPDirectives != FormatStyle::PPDIS_BeforeHash &&
2099           (NextNonCommentLine->Type == LT_PreprocessorDirective ||
2100            NextNonCommentLine->Type == LT_ImportStatement))
2101              ? 0
2102              : NextNonCommentLine->Level;
2103    } else {
2104      NextNonCommentLine = (*I)->First->isNot(tok::r_brace) ? (*I) : nullptr;
2105    }
2106
2107    setCommentLineLevels((*I)->Children);
2108  }
2109}
2110
2111static unsigned maxNestingDepth(const AnnotatedLine &Line) {
2112  unsigned Result = 0;
2113  for (const auto *Tok = Line.First; Tok != nullptr; Tok = Tok->Next)
2114    Result = std::max(Result, Tok->NestingLevel);
2115  return Result;
2116}
2117
2118void TokenAnnotator::annotate(AnnotatedLine &Line) {
2119  for (SmallVectorImpl<AnnotatedLine *>::iterator I = Line.Children.begin(),
2120                                                  E = Line.Children.end();
2121       I != E; ++I) {
2122    annotate(**I);
2123  }
2124  AnnotatingParser Parser(Style, Line, Keywords);
2125  Line.Type = Parser.parseLine();
2126
2127  // With very deep nesting, ExpressionParser uses lots of stack and the
2128  // formatting algorithm is very slow. We're not going to do a good job here
2129  // anyway - it's probably generated code being formatted by mistake.
2130  // Just skip the whole line.
2131  if (maxNestingDepth(Line) > 50)
2132    Line.Type = LT_Invalid;
2133
2134  if (Line.Type == LT_Invalid)
2135    return;
2136
2137  ExpressionParser ExprParser(Style, Keywords, Line);
2138  ExprParser.parse();
2139
2140  if (Line.startsWith(TT_ObjCMethodSpecifier))
2141    Line.Type = LT_ObjCMethodDecl;
2142  else if (Line.startsWith(TT_ObjCDecl))
2143    Line.Type = LT_ObjCDecl;
2144  else if (Line.startsWith(TT_ObjCProperty))
2145    Line.Type = LT_ObjCProperty;
2146
2147  Line.First->SpacesRequiredBefore = 1;
2148  Line.First->CanBreakBefore = Line.First->MustBreakBefore;
2149}
2150
2151// This function heuristically determines whether 'Current' starts the name of a
2152// function declaration.
2153static bool isFunctionDeclarationName(const FormatToken &Current,
2154                                      const AnnotatedLine &Line) {
2155  auto skipOperatorName = [](const FormatToken *Next) -> const FormatToken * {
2156    for (; Next; Next = Next->Next) {
2157      if (Next->is(TT_OverloadedOperatorLParen))
2158        return Next;
2159      if (Next->is(TT_OverloadedOperator))
2160        continue;
2161      if (Next->isOneOf(tok::kw_new, tok::kw_delete)) {
2162        // For 'new[]' and 'delete[]'.
2163        if (Next->Next &&
2164            Next->Next->startsSequence(tok::l_square, tok::r_square))
2165          Next = Next->Next->Next;
2166        continue;
2167      }
2168      if (Next->startsSequence(tok::l_square, tok::r_square)) {
2169        // For operator[]().
2170        Next = Next->Next;
2171        continue;
2172      }
2173      if ((Next->isSimpleTypeSpecifier() || Next->is(tok::identifier)) &&
2174          Next->Next && Next->Next->isOneOf(tok::star, tok::amp, tok::ampamp)) {
2175        // For operator void*(), operator char*(), operator Foo*().
2176        Next = Next->Next;
2177        continue;
2178      }
2179      if (Next->is(TT_TemplateOpener) && Next->MatchingParen) {
2180        Next = Next->MatchingParen;
2181        continue;
2182      }
2183
2184      break;
2185    }
2186    return nullptr;
2187  };
2188
2189  // Find parentheses of parameter list.
2190  const FormatToken *Next = Current.Next;
2191  if (Current.is(tok::kw_operator)) {
2192    if (Current.Previous && Current.Previous->is(tok::coloncolon))
2193      return false;
2194    Next = skipOperatorName(Next);
2195  } else {
2196    if (!Current.is(TT_StartOfName) || Current.NestingLevel != 0)
2197      return false;
2198    for (; Next; Next = Next->Next) {
2199      if (Next->is(TT_TemplateOpener)) {
2200        Next = Next->MatchingParen;
2201      } else if (Next->is(tok::coloncolon)) {
2202        Next = Next->Next;
2203        if (!Next)
2204          return false;
2205        if (Next->is(tok::kw_operator)) {
2206          Next = skipOperatorName(Next->Next);
2207          break;
2208        }
2209        if (!Next->is(tok::identifier))
2210          return false;
2211      } else if (Next->is(tok::l_paren)) {
2212        break;
2213      } else {
2214        return false;
2215      }
2216    }
2217  }
2218
2219  // Check whether parameter list can belong to a function declaration.
2220  if (!Next || !Next->is(tok::l_paren) || !Next->MatchingParen)
2221    return false;
2222  // If the lines ends with "{", this is likely an function definition.
2223  if (Line.Last->is(tok::l_brace))
2224    return true;
2225  if (Next->Next == Next->MatchingParen)
2226    return true; // Empty parentheses.
2227  // If there is an &/&& after the r_paren, this is likely a function.
2228  if (Next->MatchingParen->Next &&
2229      Next->MatchingParen->Next->is(TT_PointerOrReference))
2230    return true;
2231  for (const FormatToken *Tok = Next->Next; Tok && Tok != Next->MatchingParen;
2232       Tok = Tok->Next) {
2233    if (Tok->isOneOf(tok::l_paren, TT_TemplateOpener) && Tok->MatchingParen) {
2234      Tok = Tok->MatchingParen;
2235      continue;
2236    }
2237    if (Tok->is(tok::kw_const) || Tok->isSimpleTypeSpecifier() ||
2238        Tok->isOneOf(TT_PointerOrReference, TT_StartOfName, tok::ellipsis))
2239      return true;
2240    if (Tok->isOneOf(tok::l_brace, tok::string_literal, TT_ObjCMethodExpr) ||
2241        Tok->Tok.isLiteral())
2242      return false;
2243  }
2244  return false;
2245}
2246
2247bool TokenAnnotator::mustBreakForReturnType(const AnnotatedLine &Line) const {
2248  assert(Line.MightBeFunctionDecl);
2249
2250  if ((Style.AlwaysBreakAfterReturnType == FormatStyle::RTBS_TopLevel ||
2251       Style.AlwaysBreakAfterReturnType ==
2252           FormatStyle::RTBS_TopLevelDefinitions) &&
2253      Line.Level > 0)
2254    return false;
2255
2256  switch (Style.AlwaysBreakAfterReturnType) {
2257  case FormatStyle::RTBS_None:
2258    return false;
2259  case FormatStyle::RTBS_All:
2260  case FormatStyle::RTBS_TopLevel:
2261    return true;
2262  case FormatStyle::RTBS_AllDefinitions:
2263  case FormatStyle::RTBS_TopLevelDefinitions:
2264    return Line.mightBeFunctionDefinition();
2265  }
2266
2267  return false;
2268}
2269
2270void TokenAnnotator::calculateFormattingInformation(AnnotatedLine &Line) {
2271  for (SmallVectorImpl<AnnotatedLine *>::iterator I = Line.Children.begin(),
2272                                                  E = Line.Children.end();
2273       I != E; ++I) {
2274    calculateFormattingInformation(**I);
2275  }
2276
2277  Line.First->TotalLength =
2278      Line.First->IsMultiline ? Style.ColumnLimit
2279                              : Line.FirstStartColumn + Line.First->ColumnWidth;
2280  FormatToken *Current = Line.First->Next;
2281  bool InFunctionDecl = Line.MightBeFunctionDecl;
2282  while (Current) {
2283    if (isFunctionDeclarationName(*Current, Line))
2284      Current->Type = TT_FunctionDeclarationName;
2285    if (Current->is(TT_LineComment)) {
2286      if (Current->Previous->BlockKind == BK_BracedInit &&
2287          Current->Previous->opensScope())
2288        Current->SpacesRequiredBefore =
2289            (Style.Cpp11BracedListStyle && !Style.SpacesInParentheses) ? 0 : 1;
2290      else
2291        Current->SpacesRequiredBefore = Style.SpacesBeforeTrailingComments;
2292
2293      // If we find a trailing comment, iterate backwards to determine whether
2294      // it seems to relate to a specific parameter. If so, break before that
2295      // parameter to avoid changing the comment's meaning. E.g. don't move 'b'
2296      // to the previous line in:
2297      //   SomeFunction(a,
2298      //                b, // comment
2299      //                c);
2300      if (!Current->HasUnescapedNewline) {
2301        for (FormatToken *Parameter = Current->Previous; Parameter;
2302             Parameter = Parameter->Previous) {
2303          if (Parameter->isOneOf(tok::comment, tok::r_brace))
2304            break;
2305          if (Parameter->Previous && Parameter->Previous->is(tok::comma)) {
2306            if (!Parameter->Previous->is(TT_CtorInitializerComma) &&
2307                Parameter->HasUnescapedNewline)
2308              Parameter->MustBreakBefore = true;
2309            break;
2310          }
2311        }
2312      }
2313    } else if (Current->SpacesRequiredBefore == 0 &&
2314               spaceRequiredBefore(Line, *Current)) {
2315      Current->SpacesRequiredBefore = 1;
2316    }
2317
2318    Current->MustBreakBefore =
2319        Current->MustBreakBefore || mustBreakBefore(Line, *Current);
2320
2321    if (!Current->MustBreakBefore && InFunctionDecl &&
2322        Current->is(TT_FunctionDeclarationName))
2323      Current->MustBreakBefore = mustBreakForReturnType(Line);
2324
2325    Current->CanBreakBefore =
2326        Current->MustBreakBefore || canBreakBefore(Line, *Current);
2327    unsigned ChildSize = 0;
2328    if (Current->Previous->Children.size() == 1) {
2329      FormatToken &LastOfChild = *Current->Previous->Children[0]->Last;
2330      ChildSize = LastOfChild.isTrailingComment() ? Style.ColumnLimit
2331                                                  : LastOfChild.TotalLength + 1;
2332    }
2333    const FormatToken *Prev = Current->Previous;
2334    if (Current->MustBreakBefore || Prev->Children.size() > 1 ||
2335        (Prev->Children.size() == 1 &&
2336         Prev->Children[0]->First->MustBreakBefore) ||
2337        Current->IsMultiline)
2338      Current->TotalLength = Prev->TotalLength + Style.ColumnLimit;
2339    else
2340      Current->TotalLength = Prev->TotalLength + Current->ColumnWidth +
2341                             ChildSize + Current->SpacesRequiredBefore;
2342
2343    if (Current->is(TT_CtorInitializerColon))
2344      InFunctionDecl = false;
2345
2346    // FIXME: Only calculate this if CanBreakBefore is true once static
2347    // initializers etc. are sorted out.
2348    // FIXME: Move magic numbers to a better place.
2349
2350    // Reduce penalty for aligning ObjC method arguments using the colon
2351    // alignment as this is the canonical way (still prefer fitting everything
2352    // into one line if possible). Trying to fit a whole expression into one
2353    // line should not force other line breaks (e.g. when ObjC method
2354    // expression is a part of other expression).
2355    Current->SplitPenalty = splitPenalty(Line, *Current, InFunctionDecl);
2356    if (Style.Language == FormatStyle::LK_ObjC &&
2357        Current->is(TT_SelectorName) && Current->ParameterIndex > 0) {
2358      if (Current->ParameterIndex == 1)
2359        Current->SplitPenalty += 5 * Current->BindingStrength;
2360    } else {
2361      Current->SplitPenalty += 20 * Current->BindingStrength;
2362    }
2363
2364    Current = Current->Next;
2365  }
2366
2367  calculateUnbreakableTailLengths(Line);
2368  unsigned IndentLevel = Line.Level;
2369  for (Current = Line.First; Current != nullptr; Current = Current->Next) {
2370    if (Current->Role)
2371      Current->Role->precomputeFormattingInfos(Current);
2372    if (Current->MatchingParen &&
2373        Current->MatchingParen->opensBlockOrBlockTypeList(Style)) {
2374      assert(IndentLevel > 0);
2375      --IndentLevel;
2376    }
2377    Current->IndentLevel = IndentLevel;
2378    if (Current->opensBlockOrBlockTypeList(Style))
2379      ++IndentLevel;
2380  }
2381
2382  LLVM_DEBUG({ printDebugInfo(Line); });
2383}
2384
2385void TokenAnnotator::calculateUnbreakableTailLengths(AnnotatedLine &Line) {
2386  unsigned UnbreakableTailLength = 0;
2387  FormatToken *Current = Line.Last;
2388  while (Current) {
2389    Current->UnbreakableTailLength = UnbreakableTailLength;
2390    if (Current->CanBreakBefore ||
2391        Current->isOneOf(tok::comment, tok::string_literal)) {
2392      UnbreakableTailLength = 0;
2393    } else {
2394      UnbreakableTailLength +=
2395          Current->ColumnWidth + Current->SpacesRequiredBefore;
2396    }
2397    Current = Current->Previous;
2398  }
2399}
2400
2401unsigned TokenAnnotator::splitPenalty(const AnnotatedLine &Line,
2402                                      const FormatToken &Tok,
2403                                      bool InFunctionDecl) {
2404  const FormatToken &Left = *Tok.Previous;
2405  const FormatToken &Right = Tok;
2406
2407  if (Left.is(tok::semi))
2408    return 0;
2409
2410  if (Style.Language == FormatStyle::LK_Java) {
2411    if (Right.isOneOf(Keywords.kw_extends, Keywords.kw_throws))
2412      return 1;
2413    if (Right.is(Keywords.kw_implements))
2414      return 2;
2415    if (Left.is(tok::comma) && Left.NestingLevel == 0)
2416      return 3;
2417  } else if (Style.Language == FormatStyle::LK_JavaScript) {
2418    if (Right.is(Keywords.kw_function) && Left.isNot(tok::comma))
2419      return 100;
2420    if (Left.is(TT_JsTypeColon))
2421      return 35;
2422    if ((Left.is(TT_TemplateString) && Left.TokenText.endswith("${")) ||
2423        (Right.is(TT_TemplateString) && Right.TokenText.startswith("}")))
2424      return 100;
2425    // Prefer breaking call chains (".foo") over empty "{}", "[]" or "()".
2426    if (Left.opensScope() && Right.closesScope())
2427      return 200;
2428  }
2429
2430  if (Right.is(tok::identifier) && Right.Next && Right.Next->is(TT_DictLiteral))
2431    return 1;
2432  if (Right.is(tok::l_square)) {
2433    if (Style.Language == FormatStyle::LK_Proto)
2434      return 1;
2435    if (Left.is(tok::r_square))
2436      return 200;
2437    // Slightly prefer formatting local lambda definitions like functions.
2438    if (Right.is(TT_LambdaLSquare) && Left.is(tok::equal))
2439      return 35;
2440    if (!Right.isOneOf(TT_ObjCMethodExpr, TT_LambdaLSquare,
2441                       TT_ArrayInitializerLSquare,
2442                       TT_DesignatedInitializerLSquare, TT_AttributeSquare))
2443      return 500;
2444  }
2445
2446  if (Left.is(tok::coloncolon) ||
2447      (Right.is(tok::period) && Style.Language == FormatStyle::LK_Proto))
2448    return 500;
2449  if (Right.isOneOf(TT_StartOfName, TT_FunctionDeclarationName) ||
2450      Right.is(tok::kw_operator)) {
2451    if (Line.startsWith(tok::kw_for) && Right.PartOfMultiVariableDeclStmt)
2452      return 3;
2453    if (Left.is(TT_StartOfName))
2454      return 110;
2455    if (InFunctionDecl && Right.NestingLevel == 0)
2456      return Style.PenaltyReturnTypeOnItsOwnLine;
2457    return 200;
2458  }
2459  if (Right.is(TT_PointerOrReference))
2460    return 190;
2461  if (Right.is(TT_LambdaArrow))
2462    return 110;
2463  if (Left.is(tok::equal) && Right.is(tok::l_brace))
2464    return 160;
2465  if (Left.is(TT_CastRParen))
2466    return 100;
2467  if (Left.isOneOf(tok::kw_class, tok::kw_struct))
2468    return 5000;
2469  if (Left.is(tok::comment))
2470    return 1000;
2471
2472  if (Left.isOneOf(TT_RangeBasedForLoopColon, TT_InheritanceColon,
2473                   TT_CtorInitializerColon))
2474    return 2;
2475
2476  if (Right.isMemberAccess()) {
2477    // Breaking before the "./->" of a chained call/member access is reasonably
2478    // cheap, as formatting those with one call per line is generally
2479    // desirable. In particular, it should be cheaper to break before the call
2480    // than it is to break inside a call's parameters, which could lead to weird
2481    // "hanging" indents. The exception is the very last "./->" to support this
2482    // frequent pattern:
2483    //
2484    //   aaaaaaaa.aaaaaaaa.bbbbbbb().ccccccccccccccccccccc(
2485    //       dddddddd);
2486    //
2487    // which might otherwise be blown up onto many lines. Here, clang-format
2488    // won't produce "hanging" indents anyway as there is no other trailing
2489    // call.
2490    //
2491    // Also apply higher penalty is not a call as that might lead to a wrapping
2492    // like:
2493    //
2494    //   aaaaaaa
2495    //       .aaaaaaaaa.bbbbbbbb(cccccccc);
2496    return !Right.NextOperator || !Right.NextOperator->Previous->closesScope()
2497               ? 150
2498               : 35;
2499  }
2500
2501  if (Right.is(TT_TrailingAnnotation) &&
2502      (!Right.Next || Right.Next->isNot(tok::l_paren))) {
2503    // Moving trailing annotations to the next line is fine for ObjC method
2504    // declarations.
2505    if (Line.startsWith(TT_ObjCMethodSpecifier))
2506      return 10;
2507    // Generally, breaking before a trailing annotation is bad unless it is
2508    // function-like. It seems to be especially preferable to keep standard
2509    // annotations (i.e. "const", "final" and "override") on the same line.
2510    // Use a slightly higher penalty after ")" so that annotations like
2511    // "const override" are kept together.
2512    bool is_short_annotation = Right.TokenText.size() < 10;
2513    return (Left.is(tok::r_paren) ? 100 : 120) + (is_short_annotation ? 50 : 0);
2514  }
2515
2516  // In for-loops, prefer breaking at ',' and ';'.
2517  if (Line.startsWith(tok::kw_for) && Left.is(tok::equal))
2518    return 4;
2519
2520  // In Objective-C method expressions, prefer breaking before "param:" over
2521  // breaking after it.
2522  if (Right.is(TT_SelectorName))
2523    return 0;
2524  if (Left.is(tok::colon) && Left.is(TT_ObjCMethodExpr))
2525    return Line.MightBeFunctionDecl ? 50 : 500;
2526
2527  // In Objective-C type declarations, avoid breaking after the category's
2528  // open paren (we'll prefer breaking after the protocol list's opening
2529  // angle bracket, if present).
2530  if (Line.Type == LT_ObjCDecl && Left.is(tok::l_paren) && Left.Previous &&
2531      Left.Previous->isOneOf(tok::identifier, tok::greater))
2532    return 500;
2533
2534  if (Left.is(tok::l_paren) && InFunctionDecl &&
2535      Style.AlignAfterOpenBracket != FormatStyle::BAS_DontAlign)
2536    return 100;
2537  if (Left.is(tok::l_paren) && Left.Previous &&
2538      (Left.Previous->is(tok::kw_for) || Left.Previous->isIf()))
2539    return 1000;
2540  if (Left.is(tok::equal) && InFunctionDecl)
2541    return 110;
2542  if (Right.is(tok::r_brace))
2543    return 1;
2544  if (Left.is(TT_TemplateOpener))
2545    return 100;
2546  if (Left.opensScope()) {
2547    if (Style.AlignAfterOpenBracket == FormatStyle::BAS_DontAlign)
2548      return 0;
2549    if (Left.is(tok::l_brace) && !Style.Cpp11BracedListStyle)
2550      return 19;
2551    return Left.ParameterCount > 1 ? Style.PenaltyBreakBeforeFirstCallParameter
2552                                   : 19;
2553  }
2554  if (Left.is(TT_JavaAnnotation))
2555    return 50;
2556
2557  if (Left.is(TT_UnaryOperator))
2558    return 60;
2559  if (Left.isOneOf(tok::plus, tok::comma) && Left.Previous &&
2560      Left.Previous->isLabelString() &&
2561      (Left.NextOperator || Left.OperatorIndex != 0))
2562    return 50;
2563  if (Right.is(tok::plus) && Left.isLabelString() &&
2564      (Right.NextOperator || Right.OperatorIndex != 0))
2565    return 25;
2566  if (Left.is(tok::comma))
2567    return 1;
2568  if (Right.is(tok::lessless) && Left.isLabelString() &&
2569      (Right.NextOperator || Right.OperatorIndex != 1))
2570    return 25;
2571  if (Right.is(tok::lessless)) {
2572    // Breaking at a << is really cheap.
2573    if (!Left.is(tok::r_paren) || Right.OperatorIndex > 0)
2574      // Slightly prefer to break before the first one in log-like statements.
2575      return 2;
2576    return 1;
2577  }
2578  if (Left.ClosesTemplateDeclaration)
2579    return Style.PenaltyBreakTemplateDeclaration;
2580  if (Left.is(TT_ConditionalExpr))
2581    return prec::Conditional;
2582  prec::Level Level = Left.getPrecedence();
2583  if (Level == prec::Unknown)
2584    Level = Right.getPrecedence();
2585  if (Level == prec::Assignment)
2586    return Style.PenaltyBreakAssignment;
2587  if (Level != prec::Unknown)
2588    return Level;
2589
2590  return 3;
2591}
2592
2593bool TokenAnnotator::spaceRequiredBeforeParens(const FormatToken &Right) const {
2594  return Style.SpaceBeforeParens == FormatStyle::SBPO_Always ||
2595         (Style.SpaceBeforeParens == FormatStyle::SBPO_NonEmptyParentheses &&
2596          Right.ParameterCount > 0);
2597}
2598
2599/// Returns \c true if the token is followed by a boolean condition, \c false
2600/// otherwise.
2601static bool isKeywordWithCondition(const FormatToken &Tok) {
2602  return Tok.isOneOf(tok::kw_if, tok::kw_for, tok::kw_while, tok::kw_switch,
2603                     tok::kw_constexpr, tok::kw_catch);
2604}
2605
2606bool TokenAnnotator::spaceRequiredBetween(const AnnotatedLine &Line,
2607                                          const FormatToken &Left,
2608                                          const FormatToken &Right) {
2609  if (Left.is(tok::kw_return) && Right.isNot(tok::semi))
2610    return true;
2611  if (Left.is(Keywords.kw_assert) && Style.Language == FormatStyle::LK_Java)
2612    return true;
2613  if (Style.ObjCSpaceAfterProperty && Line.Type == LT_ObjCProperty &&
2614      Left.Tok.getObjCKeywordID() == tok::objc_property)
2615    return true;
2616  if (Right.is(tok::hashhash))
2617    return Left.is(tok::hash);
2618  if (Left.isOneOf(tok::hashhash, tok::hash))
2619    return Right.is(tok::hash);
2620  if ((Left.is(tok::l_paren) && Right.is(tok::r_paren)) ||
2621      (Left.is(tok::l_brace) && Left.BlockKind != BK_Block &&
2622       Right.is(tok::r_brace) && Right.BlockKind != BK_Block))
2623    return Style.SpaceInEmptyParentheses;
2624  if (Style.SpacesInConditionalStatement) {
2625    if (Left.is(tok::l_paren) && Left.Previous &&
2626        isKeywordWithCondition(*Left.Previous))
2627      return true;
2628    if (Right.is(tok::r_paren) && Right.MatchingParen &&
2629        Right.MatchingParen->Previous &&
2630        isKeywordWithCondition(*Right.MatchingParen->Previous))
2631      return true;
2632  }
2633  if (Left.is(tok::l_paren) || Right.is(tok::r_paren))
2634    return (Right.is(TT_CastRParen) ||
2635            (Left.MatchingParen && Left.MatchingParen->is(TT_CastRParen)))
2636               ? Style.SpacesInCStyleCastParentheses
2637               : Style.SpacesInParentheses;
2638  if (Right.isOneOf(tok::semi, tok::comma))
2639    return false;
2640  if (Right.is(tok::less) && Line.Type == LT_ObjCDecl) {
2641    bool IsLightweightGeneric = Right.MatchingParen &&
2642                                Right.MatchingParen->Next &&
2643                                Right.MatchingParen->Next->is(tok::colon);
2644    return !IsLightweightGeneric && Style.ObjCSpaceBeforeProtocolList;
2645  }
2646  if (Right.is(tok::less) && Left.is(tok::kw_template))
2647    return Style.SpaceAfterTemplateKeyword;
2648  if (Left.isOneOf(tok::exclaim, tok::tilde))
2649    return false;
2650  if (Left.is(tok::at) &&
2651      Right.isOneOf(tok::identifier, tok::string_literal, tok::char_constant,
2652                    tok::numeric_constant, tok::l_paren, tok::l_brace,
2653                    tok::kw_true, tok::kw_false))
2654    return false;
2655  if (Left.is(tok::colon))
2656    return !Left.is(TT_ObjCMethodExpr);
2657  if (Left.is(tok::coloncolon))
2658    return false;
2659  if (Left.is(tok::less) || Right.isOneOf(tok::greater, tok::less)) {
2660    if (Style.Language == FormatStyle::LK_TextProto ||
2661        (Style.Language == FormatStyle::LK_Proto &&
2662         (Left.is(TT_DictLiteral) || Right.is(TT_DictLiteral)))) {
2663      // Format empty list as `<>`.
2664      if (Left.is(tok::less) && Right.is(tok::greater))
2665        return false;
2666      return !Style.Cpp11BracedListStyle;
2667    }
2668    return false;
2669  }
2670  if (Right.is(tok::ellipsis))
2671    return Left.Tok.isLiteral() || (Left.is(tok::identifier) && Left.Previous &&
2672                                    Left.Previous->is(tok::kw_case));
2673  if (Left.is(tok::l_square) && Right.is(tok::amp))
2674    return Style.SpacesInSquareBrackets;
2675  if (Right.is(TT_PointerOrReference)) {
2676    if (Left.is(tok::r_paren) && Line.MightBeFunctionDecl) {
2677      if (!Left.MatchingParen)
2678        return true;
2679      FormatToken *TokenBeforeMatchingParen =
2680          Left.MatchingParen->getPreviousNonComment();
2681      if (!TokenBeforeMatchingParen ||
2682          !TokenBeforeMatchingParen->isOneOf(tok::kw_typeof, tok::kw_decltype,
2683                                             TT_TypenameMacro))
2684        return true;
2685    }
2686    return (Left.Tok.isLiteral() ||
2687            (!Left.isOneOf(TT_PointerOrReference, tok::l_paren) &&
2688             (Style.PointerAlignment != FormatStyle::PAS_Left ||
2689              (Line.IsMultiVariableDeclStmt &&
2690               (Left.NestingLevel == 0 ||
2691                (Left.NestingLevel == 1 && Line.First->is(tok::kw_for)))))));
2692  }
2693  if (Right.is(TT_FunctionTypeLParen) && Left.isNot(tok::l_paren) &&
2694      (!Left.is(TT_PointerOrReference) ||
2695       (Style.PointerAlignment != FormatStyle::PAS_Right &&
2696        !Line.IsMultiVariableDeclStmt)))
2697    return true;
2698  if (Left.is(TT_PointerOrReference))
2699    return Right.Tok.isLiteral() || Right.is(TT_BlockComment) ||
2700           (Right.isOneOf(Keywords.kw_override, Keywords.kw_final) &&
2701            !Right.is(TT_StartOfName)) ||
2702           (Right.is(tok::l_brace) && Right.BlockKind == BK_Block) ||
2703           (!Right.isOneOf(TT_PointerOrReference, TT_ArraySubscriptLSquare,
2704                           tok::l_paren) &&
2705            (Style.PointerAlignment != FormatStyle::PAS_Right &&
2706             !Line.IsMultiVariableDeclStmt) &&
2707            Left.Previous &&
2708            !Left.Previous->isOneOf(tok::l_paren, tok::coloncolon,
2709                                    tok::l_square));
2710  if (Right.is(tok::star) && Left.is(tok::l_paren))
2711    return false;
2712  if (Right.is(tok::star) && Left.is(tok::star))
2713    return false;
2714  if (Right.isOneOf(tok::star, tok::amp, tok::ampamp)) {
2715    const FormatToken *Previous = &Left;
2716    while (Previous && !Previous->is(tok::kw_operator)) {
2717      if (Previous->is(tok::identifier) || Previous->isSimpleTypeSpecifier()) {
2718        Previous = Previous->getPreviousNonComment();
2719        continue;
2720      }
2721      if (Previous->is(TT_TemplateCloser) && Previous->MatchingParen) {
2722        Previous = Previous->MatchingParen->getPreviousNonComment();
2723        continue;
2724      }
2725      if (Previous->is(tok::coloncolon)) {
2726        Previous = Previous->getPreviousNonComment();
2727        continue;
2728      }
2729      break;
2730    }
2731    // Space between the type and the * in:
2732    //   operator void*()
2733    //   operator char*()
2734    //   operator /*comment*/ const char*()
2735    //   operator volatile /*comment*/ char*()
2736    //   operator Foo*()
2737    //   operator C<T>*()
2738    //   operator std::Foo*()
2739    //   operator C<T>::D<U>*()
2740    // dependent on PointerAlignment style.
2741    if (Previous && (Previous->endsSequence(tok::kw_operator) ||
2742       Previous->endsSequence(tok::kw_const, tok::kw_operator) ||
2743       Previous->endsSequence(tok::kw_volatile, tok::kw_operator)))
2744      return (Style.PointerAlignment != FormatStyle::PAS_Left);
2745  }
2746  const auto SpaceRequiredForArrayInitializerLSquare =
2747      [](const FormatToken &LSquareTok, const FormatStyle &Style) {
2748        return Style.SpacesInContainerLiterals ||
2749               ((Style.Language == FormatStyle::LK_Proto ||
2750                 Style.Language == FormatStyle::LK_TextProto) &&
2751                !Style.Cpp11BracedListStyle &&
2752                LSquareTok.endsSequence(tok::l_square, tok::colon,
2753                                        TT_SelectorName));
2754      };
2755  if (Left.is(tok::l_square))
2756    return (Left.is(TT_ArrayInitializerLSquare) && Right.isNot(tok::r_square) &&
2757            SpaceRequiredForArrayInitializerLSquare(Left, Style)) ||
2758           (Left.isOneOf(TT_ArraySubscriptLSquare, TT_StructuredBindingLSquare,
2759                         TT_LambdaLSquare) &&
2760            Style.SpacesInSquareBrackets && Right.isNot(tok::r_square));
2761  if (Right.is(tok::r_square))
2762    return Right.MatchingParen &&
2763           ((Right.MatchingParen->is(TT_ArrayInitializerLSquare) &&
2764             SpaceRequiredForArrayInitializerLSquare(*Right.MatchingParen,
2765                                                     Style)) ||
2766            (Style.SpacesInSquareBrackets &&
2767             Right.MatchingParen->isOneOf(TT_ArraySubscriptLSquare,
2768                                          TT_StructuredBindingLSquare,
2769                                          TT_LambdaLSquare)) ||
2770            Right.MatchingParen->is(TT_AttributeParen));
2771  if (Right.is(tok::l_square) &&
2772      !Right.isOneOf(TT_ObjCMethodExpr, TT_LambdaLSquare,
2773                     TT_DesignatedInitializerLSquare,
2774                     TT_StructuredBindingLSquare, TT_AttributeSquare) &&
2775      !Left.isOneOf(tok::numeric_constant, TT_DictLiteral) &&
2776      !(!Left.is(tok::r_square) && Style.SpaceBeforeSquareBrackets &&
2777        Right.is(TT_ArraySubscriptLSquare)))
2778    return false;
2779  if (Left.is(tok::l_brace) && Right.is(tok::r_brace))
2780    return !Left.Children.empty(); // No spaces in "{}".
2781  if ((Left.is(tok::l_brace) && Left.BlockKind != BK_Block) ||
2782      (Right.is(tok::r_brace) && Right.MatchingParen &&
2783       Right.MatchingParen->BlockKind != BK_Block))
2784    return Style.Cpp11BracedListStyle ? Style.SpacesInParentheses : true;
2785  if (Left.is(TT_BlockComment))
2786    // No whitespace in x(/*foo=*/1), except for JavaScript.
2787    return Style.Language == FormatStyle::LK_JavaScript ||
2788           !Left.TokenText.endswith("=*/");
2789  if (Right.is(tok::l_paren)) {
2790    if ((Left.is(tok::r_paren) && Left.is(TT_AttributeParen)) ||
2791        (Left.is(tok::r_square) && Left.is(TT_AttributeSquare)))
2792      return true;
2793    return Line.Type == LT_ObjCDecl || Left.is(tok::semi) ||
2794           (Style.SpaceBeforeParens != FormatStyle::SBPO_Never &&
2795            (Left.isOneOf(tok::pp_elif, tok::kw_for, tok::kw_while,
2796                          tok::kw_switch, tok::kw_case, TT_ForEachMacro,
2797                          TT_ObjCForIn) ||
2798             Left.isIf(Line.Type != LT_PreprocessorDirective) ||
2799             (Left.isOneOf(tok::kw_try, Keywords.kw___except, tok::kw_catch,
2800                           tok::kw_new, tok::kw_delete) &&
2801              (!Left.Previous || Left.Previous->isNot(tok::period))))) ||
2802           (spaceRequiredBeforeParens(Right) &&
2803            (Left.is(tok::identifier) || Left.isFunctionLikeKeyword() ||
2804             Left.is(tok::r_paren) || Left.isSimpleTypeSpecifier() ||
2805             (Left.is(tok::r_square) && Left.MatchingParen &&
2806              Left.MatchingParen->is(TT_LambdaLSquare))) &&
2807            Line.Type != LT_PreprocessorDirective);
2808  }
2809  if (Left.is(tok::at) && Right.Tok.getObjCKeywordID() != tok::objc_not_keyword)
2810    return false;
2811  if (Right.is(TT_UnaryOperator))
2812    return !Left.isOneOf(tok::l_paren, tok::l_square, tok::at) &&
2813           (Left.isNot(tok::colon) || Left.isNot(TT_ObjCMethodExpr));
2814  if ((Left.isOneOf(tok::identifier, tok::greater, tok::r_square,
2815                    tok::r_paren) ||
2816       Left.isSimpleTypeSpecifier()) &&
2817      Right.is(tok::l_brace) && Right.getNextNonComment() &&
2818      Right.BlockKind != BK_Block)
2819    return false;
2820  if (Left.is(tok::period) || Right.is(tok::period))
2821    return false;
2822  if (Right.is(tok::hash) && Left.is(tok::identifier) && Left.TokenText == "L")
2823    return false;
2824  if (Left.is(TT_TemplateCloser) && Left.MatchingParen &&
2825      Left.MatchingParen->Previous &&
2826      (Left.MatchingParen->Previous->is(tok::period) ||
2827       Left.MatchingParen->Previous->is(tok::coloncolon)))
2828    // Java call to generic function with explicit type:
2829    // A.<B<C<...>>>DoSomething();
2830    // A::<B<C<...>>>DoSomething();  // With a Java 8 method reference.
2831    return false;
2832  if (Left.is(TT_TemplateCloser) && Right.is(tok::l_square))
2833    return false;
2834  if (Left.is(tok::l_brace) && Left.endsSequence(TT_DictLiteral, tok::at))
2835    // Objective-C dictionary literal -> no space after opening brace.
2836    return false;
2837  if (Right.is(tok::r_brace) && Right.MatchingParen &&
2838      Right.MatchingParen->endsSequence(TT_DictLiteral, tok::at))
2839    // Objective-C dictionary literal -> no space before closing brace.
2840    return false;
2841  if (Right.Type == TT_TrailingAnnotation &&
2842      Right.isOneOf(tok::amp, tok::ampamp) &&
2843      Left.isOneOf(tok::kw_const, tok::kw_volatile) &&
2844      (!Right.Next || Right.Next->is(tok::semi)))
2845    // Match const and volatile ref-qualifiers without any additional
2846    // qualifiers such as
2847    // void Fn() const &;
2848    return Style.PointerAlignment != FormatStyle::PAS_Left;
2849  return true;
2850}
2851
2852bool TokenAnnotator::spaceRequiredBefore(const AnnotatedLine &Line,
2853                                         const FormatToken &Right) {
2854  const FormatToken &Left = *Right.Previous;
2855  if (Right.Tok.getIdentifierInfo() && Left.Tok.getIdentifierInfo())
2856    return true; // Never ever merge two identifiers.
2857  if (Style.isCpp()) {
2858    if (Left.is(tok::kw_operator))
2859      return Right.is(tok::coloncolon);
2860    if (Right.is(tok::l_brace) && Right.BlockKind == BK_BracedInit &&
2861        !Left.opensScope() && Style.SpaceBeforeCpp11BracedList)
2862      return true;
2863  } else if (Style.Language == FormatStyle::LK_Proto ||
2864             Style.Language == FormatStyle::LK_TextProto) {
2865    if (Right.is(tok::period) &&
2866        Left.isOneOf(Keywords.kw_optional, Keywords.kw_required,
2867                     Keywords.kw_repeated, Keywords.kw_extend))
2868      return true;
2869    if (Right.is(tok::l_paren) &&
2870        Left.isOneOf(Keywords.kw_returns, Keywords.kw_option))
2871      return true;
2872    if (Right.isOneOf(tok::l_brace, tok::less) && Left.is(TT_SelectorName))
2873      return true;
2874    // Slashes occur in text protocol extension syntax: [type/type] { ... }.
2875    if (Left.is(tok::slash) || Right.is(tok::slash))
2876      return false;
2877    if (Left.MatchingParen &&
2878        Left.MatchingParen->is(TT_ProtoExtensionLSquare) &&
2879        Right.isOneOf(tok::l_brace, tok::less))
2880      return !Style.Cpp11BracedListStyle;
2881    // A percent is probably part of a formatting specification, such as %lld.
2882    if (Left.is(tok::percent))
2883      return false;
2884    // Preserve the existence of a space before a percent for cases like 0x%04x
2885    // and "%d %d"
2886    if (Left.is(tok::numeric_constant) && Right.is(tok::percent))
2887      return Right.WhitespaceRange.getEnd() != Right.WhitespaceRange.getBegin();
2888  } else if (Style.isCSharp()) {
2889    // space between type and variable e.g. Dictionary<string,string> foo;
2890    if (Left.is(TT_TemplateCloser) && Right.is(TT_StartOfName))
2891      return true;
2892    // space between keywords and paren e.g. "using ("
2893    if (Right.is(tok::l_paren))
2894      if (Left.is(tok::kw_using))
2895        return spaceRequiredBeforeParens(Left);
2896  } else if (Style.Language == FormatStyle::LK_JavaScript) {
2897    if (Left.is(TT_JsFatArrow))
2898      return true;
2899    // for await ( ...
2900    if (Right.is(tok::l_paren) && Left.is(Keywords.kw_await) && Left.Previous &&
2901        Left.Previous->is(tok::kw_for))
2902      return true;
2903    if (Left.is(Keywords.kw_async) && Right.is(tok::l_paren) &&
2904        Right.MatchingParen) {
2905      const FormatToken *Next = Right.MatchingParen->getNextNonComment();
2906      // An async arrow function, for example: `x = async () => foo();`,
2907      // as opposed to calling a function called async: `x = async();`
2908      if (Next && Next->is(TT_JsFatArrow))
2909        return true;
2910    }
2911    if ((Left.is(TT_TemplateString) && Left.TokenText.endswith("${")) ||
2912        (Right.is(TT_TemplateString) && Right.TokenText.startswith("}")))
2913      return false;
2914    // In tagged template literals ("html`bar baz`"), there is no space between
2915    // the tag identifier and the template string. getIdentifierInfo makes sure
2916    // that the identifier is not a pseudo keyword like `yield`, either.
2917    if (Left.is(tok::identifier) && Keywords.IsJavaScriptIdentifier(Left) &&
2918        Right.is(TT_TemplateString))
2919      return false;
2920    if (Right.is(tok::star) &&
2921        Left.isOneOf(Keywords.kw_function, Keywords.kw_yield))
2922      return false;
2923    if (Right.isOneOf(tok::l_brace, tok::l_square) &&
2924        Left.isOneOf(Keywords.kw_function, Keywords.kw_yield,
2925                     Keywords.kw_extends, Keywords.kw_implements))
2926      return true;
2927    if (Right.is(tok::l_paren)) {
2928      // JS methods can use some keywords as names (e.g. `delete()`).
2929      if (Line.MustBeDeclaration && Left.Tok.getIdentifierInfo())
2930        return false;
2931      // Valid JS method names can include keywords, e.g. `foo.delete()` or
2932      // `bar.instanceof()`. Recognize call positions by preceding period.
2933      if (Left.Previous && Left.Previous->is(tok::period) &&
2934          Left.Tok.getIdentifierInfo())
2935        return false;
2936      // Additional unary JavaScript operators that need a space after.
2937      if (Left.isOneOf(tok::kw_throw, Keywords.kw_await, Keywords.kw_typeof,
2938                       tok::kw_void))
2939        return true;
2940    }
2941    // `foo as const;` casts into a const type.
2942    if (Left.endsSequence(tok::kw_const, Keywords.kw_as)) {
2943      return false;
2944    }
2945    if ((Left.isOneOf(Keywords.kw_let, Keywords.kw_var, Keywords.kw_in,
2946                      tok::kw_const) ||
2947         // "of" is only a keyword if it appears after another identifier
2948         // (e.g. as "const x of y" in a for loop), or after a destructuring
2949         // operation (const [x, y] of z, const {a, b} of c).
2950         (Left.is(Keywords.kw_of) && Left.Previous &&
2951          (Left.Previous->Tok.is(tok::identifier) ||
2952           Left.Previous->isOneOf(tok::r_square, tok::r_brace)))) &&
2953        (!Left.Previous || !Left.Previous->is(tok::period)))
2954      return true;
2955    if (Left.isOneOf(tok::kw_for, Keywords.kw_as) && Left.Previous &&
2956        Left.Previous->is(tok::period) && Right.is(tok::l_paren))
2957      return false;
2958    if (Left.is(Keywords.kw_as) &&
2959        Right.isOneOf(tok::l_square, tok::l_brace, tok::l_paren))
2960      return true;
2961    if (Left.is(tok::kw_default) && Left.Previous &&
2962        Left.Previous->is(tok::kw_export))
2963      return true;
2964    if (Left.is(Keywords.kw_is) && Right.is(tok::l_brace))
2965      return true;
2966    if (Right.isOneOf(TT_JsTypeColon, TT_JsTypeOptionalQuestion))
2967      return false;
2968    if (Left.is(TT_JsTypeOperator) || Right.is(TT_JsTypeOperator))
2969      return false;
2970    if ((Left.is(tok::l_brace) || Right.is(tok::r_brace)) &&
2971        Line.First->isOneOf(Keywords.kw_import, tok::kw_export))
2972      return false;
2973    if (Left.is(tok::ellipsis))
2974      return false;
2975    if (Left.is(TT_TemplateCloser) &&
2976        !Right.isOneOf(tok::equal, tok::l_brace, tok::comma, tok::l_square,
2977                       Keywords.kw_implements, Keywords.kw_extends))
2978      // Type assertions ('<type>expr') are not followed by whitespace. Other
2979      // locations that should have whitespace following are identified by the
2980      // above set of follower tokens.
2981      return false;
2982    if (Right.is(TT_JsNonNullAssertion))
2983      return false;
2984    if (Left.is(TT_JsNonNullAssertion) &&
2985        Right.isOneOf(Keywords.kw_as, Keywords.kw_in))
2986      return true; // "x! as string", "x! in y"
2987  } else if (Style.Language == FormatStyle::LK_Java) {
2988    if (Left.is(tok::r_square) && Right.is(tok::l_brace))
2989      return true;
2990    if (Left.is(Keywords.kw_synchronized) && Right.is(tok::l_paren))
2991      return Style.SpaceBeforeParens != FormatStyle::SBPO_Never;
2992    if ((Left.isOneOf(tok::kw_static, tok::kw_public, tok::kw_private,
2993                      tok::kw_protected) ||
2994         Left.isOneOf(Keywords.kw_final, Keywords.kw_abstract,
2995                      Keywords.kw_native)) &&
2996        Right.is(TT_TemplateOpener))
2997      return true;
2998  }
2999  if (Left.is(TT_ImplicitStringLiteral))
3000    return Right.WhitespaceRange.getBegin() != Right.WhitespaceRange.getEnd();
3001  if (Line.Type == LT_ObjCMethodDecl) {
3002    if (Left.is(TT_ObjCMethodSpecifier))
3003      return true;
3004    if (Left.is(tok::r_paren) && canBeObjCSelectorComponent(Right))
3005      // Don't space between ')' and <id> or ')' and 'new'. 'new' is not a
3006      // keyword in Objective-C, and '+ (instancetype)new;' is a standard class
3007      // method declaration.
3008      return false;
3009  }
3010  if (Line.Type == LT_ObjCProperty &&
3011      (Right.is(tok::equal) || Left.is(tok::equal)))
3012    return false;
3013
3014  if (Right.isOneOf(TT_TrailingReturnArrow, TT_LambdaArrow) ||
3015      Left.isOneOf(TT_TrailingReturnArrow, TT_LambdaArrow))
3016    return true;
3017  if (Right.is(TT_OverloadedOperatorLParen))
3018    return spaceRequiredBeforeParens(Right);
3019  if (Left.is(tok::comma))
3020    return true;
3021  if (Right.is(tok::comma))
3022    return false;
3023  if (Right.is(TT_ObjCBlockLParen))
3024    return true;
3025  if (Right.is(TT_CtorInitializerColon))
3026    return Style.SpaceBeforeCtorInitializerColon;
3027  if (Right.is(TT_InheritanceColon) && !Style.SpaceBeforeInheritanceColon)
3028    return false;
3029  if (Right.is(TT_RangeBasedForLoopColon) &&
3030      !Style.SpaceBeforeRangeBasedForLoopColon)
3031    return false;
3032  if (Right.is(tok::colon)) {
3033    if (Line.First->isOneOf(tok::kw_case, tok::kw_default) ||
3034        !Right.getNextNonComment() || Right.getNextNonComment()->is(tok::semi))
3035      return false;
3036    if (Right.is(TT_ObjCMethodExpr))
3037      return false;
3038    if (Left.is(tok::question))
3039      return false;
3040    if (Right.is(TT_InlineASMColon) && Left.is(tok::coloncolon))
3041      return false;
3042    if (Right.is(TT_DictLiteral))
3043      return Style.SpacesInContainerLiterals;
3044    if (Right.is(TT_AttributeColon))
3045      return false;
3046    return true;
3047  }
3048  if (Left.is(TT_UnaryOperator)) {
3049    if (!Right.is(tok::l_paren)) {
3050      // The alternative operators for ~ and ! are "compl" and "not".
3051      // If they are used instead, we do not want to combine them with
3052      // the token to the right, unless that is a left paren.
3053      if (Left.is(tok::exclaim) && Left.TokenText == "not")
3054        return true;
3055      if (Left.is(tok::tilde) && Left.TokenText == "compl")
3056        return true;
3057      // Lambda captures allow for a lone &, so "&]" needs to be properly
3058      // handled.
3059      if (Left.is(tok::amp) && Right.is(tok::r_square))
3060        return Style.SpacesInSquareBrackets;
3061    }
3062    return (Style.SpaceAfterLogicalNot && Left.is(tok::exclaim)) ||
3063           Right.is(TT_BinaryOperator);
3064  }
3065
3066  // If the next token is a binary operator or a selector name, we have
3067  // incorrectly classified the parenthesis as a cast. FIXME: Detect correctly.
3068  if (Left.is(TT_CastRParen))
3069    return Style.SpaceAfterCStyleCast ||
3070           Right.isOneOf(TT_BinaryOperator, TT_SelectorName);
3071
3072  if (Left.is(tok::greater) && Right.is(tok::greater)) {
3073    if (Style.Language == FormatStyle::LK_TextProto ||
3074        (Style.Language == FormatStyle::LK_Proto && Left.is(TT_DictLiteral)))
3075      return !Style.Cpp11BracedListStyle;
3076    return Right.is(TT_TemplateCloser) && Left.is(TT_TemplateCloser) &&
3077           (Style.Standard < FormatStyle::LS_Cpp11 || Style.SpacesInAngles);
3078  }
3079  if (Right.isOneOf(tok::arrow, tok::arrowstar, tok::periodstar) ||
3080      Left.isOneOf(tok::arrow, tok::period, tok::arrowstar, tok::periodstar) ||
3081      (Right.is(tok::period) && Right.isNot(TT_DesignatedInitializerPeriod)))
3082    return false;
3083  if (!Style.SpaceBeforeAssignmentOperators && Left.isNot(TT_TemplateCloser) &&
3084      Right.getPrecedence() == prec::Assignment)
3085    return false;
3086  if (Style.Language == FormatStyle::LK_Java && Right.is(tok::coloncolon) &&
3087      (Left.is(tok::identifier) || Left.is(tok::kw_this)))
3088    return false;
3089  if (Right.is(tok::coloncolon) && Left.is(tok::identifier))
3090    // Generally don't remove existing spaces between an identifier and "::".
3091    // The identifier might actually be a macro name such as ALWAYS_INLINE. If
3092    // this turns out to be too lenient, add analysis of the identifier itself.
3093    return Right.WhitespaceRange.getBegin() != Right.WhitespaceRange.getEnd();
3094  if (Right.is(tok::coloncolon) &&
3095      !Left.isOneOf(tok::l_brace, tok::comment, tok::l_paren))
3096    return (Left.is(TT_TemplateOpener) &&
3097            Style.Standard < FormatStyle::LS_Cpp11) ||
3098           !(Left.isOneOf(tok::l_paren, tok::r_paren, tok::l_square,
3099                          tok::kw___super, TT_TemplateCloser,
3100                          TT_TemplateOpener)) ||
3101           (Left.is(tok ::l_paren) && Style.SpacesInParentheses);
3102  if ((Left.is(TT_TemplateOpener)) != (Right.is(TT_TemplateCloser)))
3103    return Style.SpacesInAngles;
3104  // Space before TT_StructuredBindingLSquare.
3105  if (Right.is(TT_StructuredBindingLSquare))
3106    return !Left.isOneOf(tok::amp, tok::ampamp) ||
3107           Style.PointerAlignment != FormatStyle::PAS_Right;
3108  // Space before & or && following a TT_StructuredBindingLSquare.
3109  if (Right.Next && Right.Next->is(TT_StructuredBindingLSquare) &&
3110      Right.isOneOf(tok::amp, tok::ampamp))
3111    return Style.PointerAlignment != FormatStyle::PAS_Left;
3112  if ((Right.is(TT_BinaryOperator) && !Left.is(tok::l_paren)) ||
3113      (Left.isOneOf(TT_BinaryOperator, TT_ConditionalExpr) &&
3114       !Right.is(tok::r_paren)))
3115    return true;
3116  if (Left.is(TT_TemplateCloser) && Right.is(tok::l_paren) &&
3117      Right.isNot(TT_FunctionTypeLParen))
3118    return spaceRequiredBeforeParens(Right);
3119  if (Right.is(TT_TemplateOpener) && Left.is(tok::r_paren) &&
3120      Left.MatchingParen && Left.MatchingParen->is(TT_OverloadedOperatorLParen))
3121    return false;
3122  if (Right.is(tok::less) && Left.isNot(tok::l_paren) &&
3123      Line.startsWith(tok::hash))
3124    return true;
3125  if (Right.is(TT_TrailingUnaryOperator))
3126    return false;
3127  if (Left.is(TT_RegexLiteral))
3128    return false;
3129  return spaceRequiredBetween(Line, Left, Right);
3130}
3131
3132// Returns 'true' if 'Tok' is a brace we'd want to break before in Allman style.
3133static bool isAllmanBrace(const FormatToken &Tok) {
3134  return Tok.is(tok::l_brace) && Tok.BlockKind == BK_Block &&
3135         !Tok.isOneOf(TT_ObjCBlockLBrace, TT_LambdaLBrace, TT_DictLiteral);
3136}
3137
3138bool TokenAnnotator::mustBreakBefore(const AnnotatedLine &Line,
3139                                     const FormatToken &Right) {
3140  const FormatToken &Left = *Right.Previous;
3141  if (Right.NewlinesBefore > 1 && Style.MaxEmptyLinesToKeep > 0)
3142    return true;
3143
3144  if (Style.Language == FormatStyle::LK_JavaScript) {
3145    // FIXME: This might apply to other languages and token kinds.
3146    if (Right.is(tok::string_literal) && Left.is(tok::plus) && Left.Previous &&
3147        Left.Previous->is(tok::string_literal))
3148      return true;
3149    if (Left.is(TT_DictLiteral) && Left.is(tok::l_brace) && Line.Level == 0 &&
3150        Left.Previous && Left.Previous->is(tok::equal) &&
3151        Line.First->isOneOf(tok::identifier, Keywords.kw_import, tok::kw_export,
3152                            tok::kw_const) &&
3153        // kw_var/kw_let are pseudo-tokens that are tok::identifier, so match
3154        // above.
3155        !Line.First->isOneOf(Keywords.kw_var, Keywords.kw_let))
3156      // Object literals on the top level of a file are treated as "enum-style".
3157      // Each key/value pair is put on a separate line, instead of bin-packing.
3158      return true;
3159    if (Left.is(tok::l_brace) && Line.Level == 0 &&
3160        (Line.startsWith(tok::kw_enum) ||
3161         Line.startsWith(tok::kw_const, tok::kw_enum) ||
3162         Line.startsWith(tok::kw_export, tok::kw_enum) ||
3163         Line.startsWith(tok::kw_export, tok::kw_const, tok::kw_enum)))
3164      // JavaScript top-level enum key/value pairs are put on separate lines
3165      // instead of bin-packing.
3166      return true;
3167    if (Right.is(tok::r_brace) && Left.is(tok::l_brace) &&
3168        !Left.Children.empty())
3169      // Support AllowShortFunctionsOnASingleLine for JavaScript.
3170      return Style.AllowShortFunctionsOnASingleLine == FormatStyle::SFS_None ||
3171             Style.AllowShortFunctionsOnASingleLine == FormatStyle::SFS_Empty ||
3172             (Left.NestingLevel == 0 && Line.Level == 0 &&
3173              Style.AllowShortFunctionsOnASingleLine &
3174                  FormatStyle::SFS_InlineOnly);
3175  } else if (Style.Language == FormatStyle::LK_Java) {
3176    if (Right.is(tok::plus) && Left.is(tok::string_literal) && Right.Next &&
3177        Right.Next->is(tok::string_literal))
3178      return true;
3179  } else if (Style.Language == FormatStyle::LK_Cpp ||
3180             Style.Language == FormatStyle::LK_ObjC ||
3181             Style.Language == FormatStyle::LK_Proto ||
3182             Style.Language == FormatStyle::LK_TableGen ||
3183             Style.Language == FormatStyle::LK_TextProto) {
3184    if (Left.isStringLiteral() && Right.isStringLiteral())
3185      return true;
3186  }
3187
3188  // If the last token before a '}', ']', or ')' is a comma or a trailing
3189  // comment, the intention is to insert a line break after it in order to make
3190  // shuffling around entries easier. Import statements, especially in
3191  // JavaScript, can be an exception to this rule.
3192  if (Style.JavaScriptWrapImports || Line.Type != LT_ImportStatement) {
3193    const FormatToken *BeforeClosingBrace = nullptr;
3194    if ((Left.isOneOf(tok::l_brace, TT_ArrayInitializerLSquare) ||
3195         (Style.Language == FormatStyle::LK_JavaScript &&
3196          Left.is(tok::l_paren))) &&
3197        Left.BlockKind != BK_Block && Left.MatchingParen)
3198      BeforeClosingBrace = Left.MatchingParen->Previous;
3199    else if (Right.MatchingParen &&
3200             (Right.MatchingParen->isOneOf(tok::l_brace,
3201                                           TT_ArrayInitializerLSquare) ||
3202              (Style.Language == FormatStyle::LK_JavaScript &&
3203               Right.MatchingParen->is(tok::l_paren))))
3204      BeforeClosingBrace = &Left;
3205    if (BeforeClosingBrace && (BeforeClosingBrace->is(tok::comma) ||
3206                               BeforeClosingBrace->isTrailingComment()))
3207      return true;
3208  }
3209
3210  if (Right.is(tok::comment))
3211    return Left.BlockKind != BK_BracedInit &&
3212           Left.isNot(TT_CtorInitializerColon) &&
3213           (Right.NewlinesBefore > 0 && Right.HasUnescapedNewline);
3214  if (Left.isTrailingComment())
3215    return true;
3216  if (Right.Previous->IsUnterminatedLiteral)
3217    return true;
3218  if (Right.is(tok::lessless) && Right.Next &&
3219      Right.Previous->is(tok::string_literal) &&
3220      Right.Next->is(tok::string_literal))
3221    return true;
3222  if (Right.Previous->ClosesTemplateDeclaration &&
3223      Right.Previous->MatchingParen &&
3224      Right.Previous->MatchingParen->NestingLevel == 0 &&
3225      Style.AlwaysBreakTemplateDeclarations == FormatStyle::BTDS_Yes)
3226    return true;
3227  if (Right.is(TT_CtorInitializerComma) &&
3228      Style.BreakConstructorInitializers == FormatStyle::BCIS_BeforeComma &&
3229      !Style.ConstructorInitializerAllOnOneLineOrOnePerLine)
3230    return true;
3231  if (Right.is(TT_CtorInitializerColon) &&
3232      Style.BreakConstructorInitializers == FormatStyle::BCIS_BeforeComma &&
3233      !Style.ConstructorInitializerAllOnOneLineOrOnePerLine)
3234    return true;
3235  // Break only if we have multiple inheritance.
3236  if (Style.BreakInheritanceList == FormatStyle::BILS_BeforeComma &&
3237      Right.is(TT_InheritanceComma))
3238    return true;
3239  if (Right.is(tok::string_literal) && Right.TokenText.startswith("R\""))
3240    // Multiline raw string literals are special wrt. line breaks. The author
3241    // has made a deliberate choice and might have aligned the contents of the
3242    // string literal accordingly. Thus, we try keep existing line breaks.
3243    return Right.IsMultiline && Right.NewlinesBefore > 0;
3244  if ((Right.Previous->is(tok::l_brace) ||
3245       (Right.Previous->is(tok::less) && Right.Previous->Previous &&
3246        Right.Previous->Previous->is(tok::equal))) &&
3247      Right.NestingLevel == 1 && Style.Language == FormatStyle::LK_Proto) {
3248    // Don't put enums or option definitions onto single lines in protocol
3249    // buffers.
3250    return true;
3251  }
3252  if (Right.is(TT_InlineASMBrace))
3253    return Right.HasUnescapedNewline;
3254  if (isAllmanBrace(Left) || isAllmanBrace(Right))
3255    return (Line.startsWith(tok::kw_enum) && Style.BraceWrapping.AfterEnum) ||
3256           (Line.startsWith(tok::kw_typedef, tok::kw_enum) &&
3257            Style.BraceWrapping.AfterEnum) ||
3258           (Line.startsWith(tok::kw_class) && Style.BraceWrapping.AfterClass) ||
3259           (Line.startsWith(tok::kw_struct) && Style.BraceWrapping.AfterStruct);
3260  if (Left.is(TT_ObjCBlockLBrace) &&
3261      Style.AllowShortBlocksOnASingleLine == FormatStyle::SBS_Never)
3262    return true;
3263
3264  if (Left.is(TT_LambdaLBrace)) {
3265    if (Left.MatchingParen && Left.MatchingParen->Next &&
3266        Left.MatchingParen->Next->isOneOf(tok::comma, tok::r_paren) &&
3267        Style.AllowShortLambdasOnASingleLine == FormatStyle::SLS_Inline)
3268      return false;
3269
3270    if (Style.AllowShortLambdasOnASingleLine == FormatStyle::SLS_None ||
3271        Style.AllowShortLambdasOnASingleLine == FormatStyle::SLS_Inline ||
3272        (!Left.Children.empty() &&
3273         Style.AllowShortLambdasOnASingleLine == FormatStyle::SLS_Empty))
3274      return true;
3275  }
3276
3277  // Put multiple C# attributes on a new line.
3278  if (Style.isCSharp() &&
3279      ((Left.is(TT_AttributeSquare) && Left.is(tok::r_square)) ||
3280       (Left.is(tok::r_square) && Right.is(TT_AttributeSquare) &&
3281        Right.is(tok::l_square))))
3282    return true;
3283
3284  // Put multiple Java annotation on a new line.
3285  if ((Style.Language == FormatStyle::LK_Java ||
3286       Style.Language == FormatStyle::LK_JavaScript) &&
3287      Left.is(TT_LeadingJavaAnnotation) &&
3288      Right.isNot(TT_LeadingJavaAnnotation) && Right.isNot(tok::l_paren) &&
3289      (Line.Last->is(tok::l_brace) || Style.BreakAfterJavaFieldAnnotations))
3290    return true;
3291
3292  if (Right.is(TT_ProtoExtensionLSquare))
3293    return true;
3294
3295  // In text proto instances if a submessage contains at least 2 entries and at
3296  // least one of them is a submessage, like A { ... B { ... } ... },
3297  // put all of the entries of A on separate lines by forcing the selector of
3298  // the submessage B to be put on a newline.
3299  //
3300  // Example: these can stay on one line:
3301  // a { scalar_1: 1 scalar_2: 2 }
3302  // a { b { key: value } }
3303  //
3304  // and these entries need to be on a new line even if putting them all in one
3305  // line is under the column limit:
3306  // a {
3307  //   scalar: 1
3308  //   b { key: value }
3309  // }
3310  //
3311  // We enforce this by breaking before a submessage field that has previous
3312  // siblings, *and* breaking before a field that follows a submessage field.
3313  //
3314  // Be careful to exclude the case  [proto.ext] { ... } since the `]` is
3315  // the TT_SelectorName there, but we don't want to break inside the brackets.
3316  //
3317  // Another edge case is @submessage { key: value }, which is a common
3318  // substitution placeholder. In this case we want to keep `@` and `submessage`
3319  // together.
3320  //
3321  // We ensure elsewhere that extensions are always on their own line.
3322  if ((Style.Language == FormatStyle::LK_Proto ||
3323       Style.Language == FormatStyle::LK_TextProto) &&
3324      Right.is(TT_SelectorName) && !Right.is(tok::r_square) && Right.Next) {
3325    // Keep `@submessage` together in:
3326    // @submessage { key: value }
3327    if (Right.Previous && Right.Previous->is(tok::at))
3328      return false;
3329    // Look for the scope opener after selector in cases like:
3330    // selector { ...
3331    // selector: { ...
3332    // selector: @base { ...
3333    FormatToken *LBrace = Right.Next;
3334    if (LBrace && LBrace->is(tok::colon)) {
3335      LBrace = LBrace->Next;
3336      if (LBrace && LBrace->is(tok::at)) {
3337        LBrace = LBrace->Next;
3338        if (LBrace)
3339          LBrace = LBrace->Next;
3340      }
3341    }
3342    if (LBrace &&
3343        // The scope opener is one of {, [, <:
3344        // selector { ... }
3345        // selector [ ... ]
3346        // selector < ... >
3347        //
3348        // In case of selector { ... }, the l_brace is TT_DictLiteral.
3349        // In case of an empty selector {}, the l_brace is not TT_DictLiteral,
3350        // so we check for immediately following r_brace.
3351        ((LBrace->is(tok::l_brace) &&
3352          (LBrace->is(TT_DictLiteral) ||
3353           (LBrace->Next && LBrace->Next->is(tok::r_brace)))) ||
3354         LBrace->is(TT_ArrayInitializerLSquare) || LBrace->is(tok::less))) {
3355      // If Left.ParameterCount is 0, then this submessage entry is not the
3356      // first in its parent submessage, and we want to break before this entry.
3357      // If Left.ParameterCount is greater than 0, then its parent submessage
3358      // might contain 1 or more entries and we want to break before this entry
3359      // if it contains at least 2 entries. We deal with this case later by
3360      // detecting and breaking before the next entry in the parent submessage.
3361      if (Left.ParameterCount == 0)
3362        return true;
3363      // However, if this submessage is the first entry in its parent
3364      // submessage, Left.ParameterCount might be 1 in some cases.
3365      // We deal with this case later by detecting an entry
3366      // following a closing paren of this submessage.
3367    }
3368
3369    // If this is an entry immediately following a submessage, it will be
3370    // preceded by a closing paren of that submessage, like in:
3371    //     left---.  .---right
3372    //            v  v
3373    // sub: { ... } key: value
3374    // If there was a comment between `}` an `key` above, then `key` would be
3375    // put on a new line anyways.
3376    if (Left.isOneOf(tok::r_brace, tok::greater, tok::r_square))
3377      return true;
3378  }
3379
3380  // Deal with lambda arguments in C++ - we want consistent line breaks whether
3381  // they happen to be at arg0, arg1 or argN. The selection is a bit nuanced
3382  // as aggressive line breaks are placed when the lambda is not the last arg.
3383  if ((Style.Language == FormatStyle::LK_Cpp ||
3384       Style.Language == FormatStyle::LK_ObjC) &&
3385      Left.is(tok::l_paren) && Left.BlockParameterCount > 0 &&
3386      !Right.isOneOf(tok::l_paren, TT_LambdaLSquare)) {
3387    // Multiple lambdas in the same function call force line breaks.
3388    if (Left.BlockParameterCount > 1)
3389      return true;
3390
3391    // A lambda followed by another arg forces a line break.
3392    if (!Left.Role)
3393      return false;
3394    auto Comma = Left.Role->lastComma();
3395    if (!Comma)
3396      return false;
3397    auto Next = Comma->getNextNonComment();
3398    if (!Next)
3399      return false;
3400    if (!Next->isOneOf(TT_LambdaLSquare, tok::l_brace, tok::caret))
3401      return true;
3402  }
3403
3404  return false;
3405}
3406
3407bool TokenAnnotator::canBreakBefore(const AnnotatedLine &Line,
3408                                    const FormatToken &Right) {
3409  const FormatToken &Left = *Right.Previous;
3410
3411  // Language-specific stuff.
3412  if (Style.Language == FormatStyle::LK_Java) {
3413    if (Left.isOneOf(Keywords.kw_throws, Keywords.kw_extends,
3414                     Keywords.kw_implements))
3415      return false;
3416    if (Right.isOneOf(Keywords.kw_throws, Keywords.kw_extends,
3417                      Keywords.kw_implements))
3418      return true;
3419  } else if (Style.Language == FormatStyle::LK_JavaScript) {
3420    const FormatToken *NonComment = Right.getPreviousNonComment();
3421    if (NonComment &&
3422        NonComment->isOneOf(
3423            tok::kw_return, Keywords.kw_yield, tok::kw_continue, tok::kw_break,
3424            tok::kw_throw, Keywords.kw_interface, Keywords.kw_type,
3425            tok::kw_static, tok::kw_public, tok::kw_private, tok::kw_protected,
3426            Keywords.kw_readonly, Keywords.kw_abstract, Keywords.kw_get,
3427            Keywords.kw_set, Keywords.kw_async, Keywords.kw_await))
3428      return false; // Otherwise automatic semicolon insertion would trigger.
3429    if (Right.NestingLevel == 0 &&
3430        (Left.Tok.getIdentifierInfo() ||
3431         Left.isOneOf(tok::r_square, tok::r_paren)) &&
3432        Right.isOneOf(tok::l_square, tok::l_paren))
3433      return false; // Otherwise automatic semicolon insertion would trigger.
3434    if (Left.is(TT_JsFatArrow) && Right.is(tok::l_brace))
3435      return false;
3436    if (Left.is(TT_JsTypeColon))
3437      return true;
3438    // Don't wrap between ":" and "!" of a strict prop init ("field!: type;").
3439    if (Left.is(tok::exclaim) && Right.is(tok::colon))
3440      return false;
3441    // Look for is type annotations like:
3442    // function f(): a is B { ... }
3443    // Do not break before is in these cases.
3444    if (Right.is(Keywords.kw_is)) {
3445      const FormatToken *Next = Right.getNextNonComment();
3446      // If `is` is followed by a colon, it's likely that it's a dict key, so
3447      // ignore it for this check.
3448      // For example this is common in Polymer:
3449      // Polymer({
3450      //   is: 'name',
3451      //   ...
3452      // });
3453      if (!Next || !Next->is(tok::colon))
3454        return false;
3455    }
3456    if (Left.is(Keywords.kw_in))
3457      return Style.BreakBeforeBinaryOperators == FormatStyle::BOS_None;
3458    if (Right.is(Keywords.kw_in))
3459      return Style.BreakBeforeBinaryOperators != FormatStyle::BOS_None;
3460    if (Right.is(Keywords.kw_as))
3461      return false; // must not break before as in 'x as type' casts
3462    if (Right.isOneOf(Keywords.kw_extends, Keywords.kw_infer)) {
3463      // extends and infer can appear as keywords in conditional types:
3464      //   https://www.typescriptlang.org/docs/handbook/release-notes/typescript-2-8.html#conditional-types
3465      // do not break before them, as the expressions are subject to ASI.
3466      return false;
3467    }
3468    if (Left.is(Keywords.kw_as))
3469      return true;
3470    if (Left.is(TT_JsNonNullAssertion))
3471      return true;
3472    if (Left.is(Keywords.kw_declare) &&
3473        Right.isOneOf(Keywords.kw_module, tok::kw_namespace,
3474                      Keywords.kw_function, tok::kw_class, tok::kw_enum,
3475                      Keywords.kw_interface, Keywords.kw_type, Keywords.kw_var,
3476                      Keywords.kw_let, tok::kw_const))
3477      // See grammar for 'declare' statements at:
3478      // https://github.com/Microsoft/TypeScript/blob/master/doc/spec.md#A.10
3479      return false;
3480    if (Left.isOneOf(Keywords.kw_module, tok::kw_namespace) &&
3481        Right.isOneOf(tok::identifier, tok::string_literal))
3482      return false; // must not break in "module foo { ...}"
3483    if (Right.is(TT_TemplateString) && Right.closesScope())
3484      return false;
3485    // Don't split tagged template literal so there is a break between the tag
3486    // identifier and template string.
3487    if (Left.is(tok::identifier) && Right.is(TT_TemplateString)) {
3488      return false;
3489    }
3490    if (Left.is(TT_TemplateString) && Left.opensScope())
3491      return true;
3492  }
3493
3494  if (Left.is(tok::at))
3495    return false;
3496  if (Left.Tok.getObjCKeywordID() == tok::objc_interface)
3497    return false;
3498  if (Left.isOneOf(TT_JavaAnnotation, TT_LeadingJavaAnnotation))
3499    return !Right.is(tok::l_paren);
3500  if (Right.is(TT_PointerOrReference))
3501    return Line.IsMultiVariableDeclStmt ||
3502           (Style.PointerAlignment == FormatStyle::PAS_Right &&
3503            (!Right.Next || Right.Next->isNot(TT_FunctionDeclarationName)));
3504  if (Right.isOneOf(TT_StartOfName, TT_FunctionDeclarationName) ||
3505      Right.is(tok::kw_operator))
3506    return true;
3507  if (Left.is(TT_PointerOrReference))
3508    return false;
3509  if (Right.isTrailingComment())
3510    // We rely on MustBreakBefore being set correctly here as we should not
3511    // change the "binding" behavior of a comment.
3512    // The first comment in a braced lists is always interpreted as belonging to
3513    // the first list element. Otherwise, it should be placed outside of the
3514    // list.
3515    return Left.BlockKind == BK_BracedInit ||
3516           (Left.is(TT_CtorInitializerColon) &&
3517            Style.BreakConstructorInitializers == FormatStyle::BCIS_AfterColon);
3518  if (Left.is(tok::question) && Right.is(tok::colon))
3519    return false;
3520  if (Right.is(TT_ConditionalExpr) || Right.is(tok::question))
3521    return Style.BreakBeforeTernaryOperators;
3522  if (Left.is(TT_ConditionalExpr) || Left.is(tok::question))
3523    return !Style.BreakBeforeTernaryOperators;
3524  if (Left.is(TT_InheritanceColon))
3525    return Style.BreakInheritanceList == FormatStyle::BILS_AfterColon;
3526  if (Right.is(TT_InheritanceColon))
3527    return Style.BreakInheritanceList != FormatStyle::BILS_AfterColon;
3528  if (Right.is(TT_ObjCMethodExpr) && !Right.is(tok::r_square) &&
3529      Left.isNot(TT_SelectorName))
3530    return true;
3531
3532  if (Right.is(tok::colon) &&
3533      !Right.isOneOf(TT_CtorInitializerColon, TT_InlineASMColon))
3534    return false;
3535  if (Left.is(tok::colon) && Left.isOneOf(TT_DictLiteral, TT_ObjCMethodExpr)) {
3536    if (Style.Language == FormatStyle::LK_Proto ||
3537        Style.Language == FormatStyle::LK_TextProto) {
3538      if (!Style.AlwaysBreakBeforeMultilineStrings && Right.isStringLiteral())
3539        return false;
3540      // Prevent cases like:
3541      //
3542      // submessage:
3543      //     { key: valueeeeeeeeeeee }
3544      //
3545      // when the snippet does not fit into one line.
3546      // Prefer:
3547      //
3548      // submessage: {
3549      //   key: valueeeeeeeeeeee
3550      // }
3551      //
3552      // instead, even if it is longer by one line.
3553      //
3554      // Note that this allows allows the "{" to go over the column limit
3555      // when the column limit is just between ":" and "{", but that does
3556      // not happen too often and alternative formattings in this case are
3557      // not much better.
3558      //
3559      // The code covers the cases:
3560      //
3561      // submessage: { ... }
3562      // submessage: < ... >
3563      // repeated: [ ... ]
3564      if (((Right.is(tok::l_brace) || Right.is(tok::less)) &&
3565           Right.is(TT_DictLiteral)) ||
3566          Right.is(TT_ArrayInitializerLSquare))
3567        return false;
3568    }
3569    return true;
3570  }
3571  if (Right.is(tok::r_square) && Right.MatchingParen &&
3572      Right.MatchingParen->is(TT_ProtoExtensionLSquare))
3573    return false;
3574  if (Right.is(TT_SelectorName) || (Right.is(tok::identifier) && Right.Next &&
3575                                    Right.Next->is(TT_ObjCMethodExpr)))
3576    return Left.isNot(tok::period); // FIXME: Properly parse ObjC calls.
3577  if (Left.is(tok::r_paren) && Line.Type == LT_ObjCProperty)
3578    return true;
3579  if (Left.ClosesTemplateDeclaration || Left.is(TT_FunctionAnnotationRParen))
3580    return true;
3581  if (Right.isOneOf(TT_RangeBasedForLoopColon, TT_OverloadedOperatorLParen,
3582                    TT_OverloadedOperator))
3583    return false;
3584  if (Left.is(TT_RangeBasedForLoopColon))
3585    return true;
3586  if (Right.is(TT_RangeBasedForLoopColon))
3587    return false;
3588  if (Left.is(TT_TemplateCloser) && Right.is(TT_TemplateOpener))
3589    return true;
3590  if (Left.isOneOf(TT_TemplateCloser, TT_UnaryOperator) ||
3591      Left.is(tok::kw_operator))
3592    return false;
3593  if (Left.is(tok::equal) && !Right.isOneOf(tok::kw_default, tok::kw_delete) &&
3594      Line.Type == LT_VirtualFunctionDecl && Left.NestingLevel == 0)
3595    return false;
3596  if (Left.is(tok::equal) && Right.is(tok::l_brace) &&
3597      !Style.Cpp11BracedListStyle)
3598    return false;
3599  if (Left.is(tok::l_paren) && Left.is(TT_AttributeParen))
3600    return false;
3601  if (Left.is(tok::l_paren) && Left.Previous &&
3602      (Left.Previous->isOneOf(TT_BinaryOperator, TT_CastRParen)))
3603    return false;
3604  if (Right.is(TT_ImplicitStringLiteral))
3605    return false;
3606
3607  if (Right.is(tok::r_paren) || Right.is(TT_TemplateCloser))
3608    return false;
3609  if (Right.is(tok::r_square) && Right.MatchingParen &&
3610      Right.MatchingParen->is(TT_LambdaLSquare))
3611    return false;
3612
3613  // We only break before r_brace if there was a corresponding break before
3614  // the l_brace, which is tracked by BreakBeforeClosingBrace.
3615  if (Right.is(tok::r_brace))
3616    return Right.MatchingParen && Right.MatchingParen->BlockKind == BK_Block;
3617
3618  // Allow breaking after a trailing annotation, e.g. after a method
3619  // declaration.
3620  if (Left.is(TT_TrailingAnnotation))
3621    return !Right.isOneOf(tok::l_brace, tok::semi, tok::equal, tok::l_paren,
3622                          tok::less, tok::coloncolon);
3623
3624  if (Right.is(tok::kw___attribute) ||
3625      (Right.is(tok::l_square) && Right.is(TT_AttributeSquare)))
3626    return true;
3627
3628  if (Left.is(tok::identifier) && Right.is(tok::string_literal))
3629    return true;
3630
3631  if (Right.is(tok::identifier) && Right.Next && Right.Next->is(TT_DictLiteral))
3632    return true;
3633
3634  if (Left.is(TT_CtorInitializerColon))
3635    return Style.BreakConstructorInitializers == FormatStyle::BCIS_AfterColon;
3636  if (Right.is(TT_CtorInitializerColon))
3637    return Style.BreakConstructorInitializers != FormatStyle::BCIS_AfterColon;
3638  if (Left.is(TT_CtorInitializerComma) &&
3639      Style.BreakConstructorInitializers == FormatStyle::BCIS_BeforeComma)
3640    return false;
3641  if (Right.is(TT_CtorInitializerComma) &&
3642      Style.BreakConstructorInitializers == FormatStyle::BCIS_BeforeComma)
3643    return true;
3644  if (Left.is(TT_InheritanceComma) &&
3645      Style.BreakInheritanceList == FormatStyle::BILS_BeforeComma)
3646    return false;
3647  if (Right.is(TT_InheritanceComma) &&
3648      Style.BreakInheritanceList == FormatStyle::BILS_BeforeComma)
3649    return true;
3650  if ((Left.is(tok::greater) && Right.is(tok::greater)) ||
3651      (Left.is(tok::less) && Right.is(tok::less)))
3652    return false;
3653  if (Right.is(TT_BinaryOperator) &&
3654      Style.BreakBeforeBinaryOperators != FormatStyle::BOS_None &&
3655      (Style.BreakBeforeBinaryOperators == FormatStyle::BOS_All ||
3656       Right.getPrecedence() != prec::Assignment))
3657    return true;
3658  if (Left.is(TT_ArrayInitializerLSquare))
3659    return true;
3660  if (Right.is(tok::kw_typename) && Left.isNot(tok::kw_const))
3661    return true;
3662  if ((Left.isBinaryOperator() || Left.is(TT_BinaryOperator)) &&
3663      !Left.isOneOf(tok::arrowstar, tok::lessless) &&
3664      Style.BreakBeforeBinaryOperators != FormatStyle::BOS_All &&
3665      (Style.BreakBeforeBinaryOperators == FormatStyle::BOS_None ||
3666       Left.getPrecedence() == prec::Assignment))
3667    return true;
3668  if ((Left.is(TT_AttributeSquare) && Right.is(tok::l_square)) ||
3669      (Left.is(tok::r_square) && Right.is(TT_AttributeSquare)))
3670    return false;
3671  return Left.isOneOf(tok::comma, tok::coloncolon, tok::semi, tok::l_brace,
3672                      tok::kw_class, tok::kw_struct, tok::comment) ||
3673         Right.isMemberAccess() ||
3674         Right.isOneOf(TT_TrailingReturnArrow, TT_LambdaArrow, tok::lessless,
3675                       tok::colon, tok::l_square, tok::at) ||
3676         (Left.is(tok::r_paren) &&
3677          Right.isOneOf(tok::identifier, tok::kw_const)) ||
3678         (Left.is(tok::l_paren) && !Right.is(tok::r_paren)) ||
3679         (Left.is(TT_TemplateOpener) && !Right.is(TT_TemplateCloser));
3680}
3681
3682void TokenAnnotator::printDebugInfo(const AnnotatedLine &Line) {
3683  llvm::errs() << "AnnotatedTokens(L=" << Line.Level << "):\n";
3684  const FormatToken *Tok = Line.First;
3685  while (Tok) {
3686    llvm::errs() << " M=" << Tok->MustBreakBefore
3687                 << " C=" << Tok->CanBreakBefore
3688                 << " T=" << getTokenTypeName(Tok->Type)
3689                 << " S=" << Tok->SpacesRequiredBefore
3690                 << " B=" << Tok->BlockParameterCount
3691                 << " BK=" << Tok->BlockKind << " P=" << Tok->SplitPenalty
3692                 << " Name=" << Tok->Tok.getName() << " L=" << Tok->TotalLength
3693                 << " PPK=" << Tok->PackingKind << " FakeLParens=";
3694    for (unsigned i = 0, e = Tok->FakeLParens.size(); i != e; ++i)
3695      llvm::errs() << Tok->FakeLParens[i] << "/";
3696    llvm::errs() << " FakeRParens=" << Tok->FakeRParens;
3697    llvm::errs() << " II=" << Tok->Tok.getIdentifierInfo();
3698    llvm::errs() << " Text='" << Tok->TokenText << "'\n";
3699    if (!Tok->Next)
3700      assert(Tok == Line.Last);
3701    Tok = Tok->Next;
3702  }
3703  llvm::errs() << "----\n";
3704}
3705
3706} // namespace format
3707} // namespace clang
3708