1 //===--- TokenAnnotator.cpp - Format C++ code -----------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 ///
9 /// \file
10 /// This file implements a token annotator, i.e. creates
11 /// \c AnnotatedTokens out of \c FormatTokens with required extra information.
12 ///
13 //===----------------------------------------------------------------------===//
14 
15 #include "TokenAnnotator.h"
16 #include "FormatToken.h"
17 #include "clang/Basic/SourceManager.h"
18 #include "clang/Basic/TokenKinds.h"
19 #include "llvm/ADT/SmallPtrSet.h"
20 #include "llvm/Support/Debug.h"
21 
22 #define DEBUG_TYPE "format-token-annotator"
23 
24 namespace clang {
25 namespace format {
26 
27 namespace {
28 
29 /// Returns \c true if the token can be used as an identifier in
30 /// an Objective-C \c @selector, \c false otherwise.
31 ///
32 /// Because getFormattingLangOpts() always lexes source code as
33 /// Objective-C++, C++ keywords like \c new and \c delete are
34 /// lexed as tok::kw_*, not tok::identifier, even for Objective-C.
35 ///
36 /// For Objective-C and Objective-C++, both identifiers and keywords
37 /// are valid inside @selector(...) (or a macro which
38 /// invokes @selector(...)). So, we allow treat any identifier or
39 /// keyword as a potential Objective-C selector component.
40 static bool canBeObjCSelectorComponent(const FormatToken &Tok) {
41   return Tok.Tok.getIdentifierInfo() != nullptr;
42 }
43 
44 /// With `Left` being '(', check if we're at either `[...](` or
45 /// `[...]<...>(`, where the [ opens a lambda capture list.
46 static bool isLambdaParameterList(const FormatToken *Left) {
47   // Skip <...> if present.
48   if (Left->Previous && Left->Previous->is(tok::greater) &&
49       Left->Previous->MatchingParen &&
50       Left->Previous->MatchingParen->is(TT_TemplateOpener))
51     Left = Left->Previous->MatchingParen;
52 
53   // Check for `[...]`.
54   return Left->Previous && Left->Previous->is(tok::r_square) &&
55          Left->Previous->MatchingParen &&
56          Left->Previous->MatchingParen->is(TT_LambdaLSquare);
57 }
58 
59 /// A parser that gathers additional information about tokens.
60 ///
61 /// The \c TokenAnnotator tries to match parenthesis and square brakets and
62 /// store a parenthesis levels. It also tries to resolve matching "<" and ">"
63 /// into template parameter lists.
64 class AnnotatingParser {
65 public:
66   AnnotatingParser(const FormatStyle &Style, AnnotatedLine &Line,
67                    const AdditionalKeywords &Keywords)
68       : Style(Style), Line(Line), CurrentToken(Line.First), AutoFound(false),
69         Keywords(Keywords) {
70     Contexts.push_back(Context(tok::unknown, 1, /*IsExpression=*/false));
71     resetTokenMetadata(CurrentToken);
72   }
73 
74 private:
75   bool parseAngle() {
76     if (!CurrentToken || !CurrentToken->Previous)
77       return false;
78     if (NonTemplateLess.count(CurrentToken->Previous))
79       return false;
80 
81     const FormatToken &Previous = *CurrentToken->Previous; // The '<'.
82     if (Previous.Previous) {
83       if (Previous.Previous->Tok.isLiteral())
84         return false;
85       if (Previous.Previous->is(tok::r_paren) && Contexts.size() > 1 &&
86           (!Previous.Previous->MatchingParen ||
87            !Previous.Previous->MatchingParen->is(TT_OverloadedOperatorLParen)))
88         return false;
89     }
90 
91     FormatToken *Left = CurrentToken->Previous;
92     Left->ParentBracket = Contexts.back().ContextKind;
93     ScopedContextCreator ContextCreator(*this, tok::less, 12);
94 
95     // If this angle is in the context of an expression, we need to be more
96     // hesitant to detect it as opening template parameters.
97     bool InExprContext = Contexts.back().IsExpression;
98 
99     Contexts.back().IsExpression = false;
100     // If there's a template keyword before the opening angle bracket, this is a
101     // template parameter, not an argument.
102     Contexts.back().InTemplateArgument =
103         Left->Previous && Left->Previous->Tok.isNot(tok::kw_template);
104 
105     if (Style.Language == FormatStyle::LK_Java &&
106         CurrentToken->is(tok::question))
107       next();
108 
109     while (CurrentToken) {
110       if (CurrentToken->is(tok::greater)) {
111         Left->MatchingParen = CurrentToken;
112         CurrentToken->MatchingParen = Left;
113         // In TT_Proto, we must distignuish between:
114         //   map<key, value>
115         //   msg < item: data >
116         //   msg: < item: data >
117         // In TT_TextProto, map<key, value> does not occur.
118         if (Style.Language == FormatStyle::LK_TextProto ||
119             (Style.Language == FormatStyle::LK_Proto && Left->Previous &&
120              Left->Previous->isOneOf(TT_SelectorName, TT_DictLiteral)))
121           CurrentToken->setType(TT_DictLiteral);
122         else
123           CurrentToken->setType(TT_TemplateCloser);
124         next();
125         return true;
126       }
127       if (CurrentToken->is(tok::question) &&
128           Style.Language == FormatStyle::LK_Java) {
129         next();
130         continue;
131       }
132       if (CurrentToken->isOneOf(tok::r_paren, tok::r_square, tok::r_brace) ||
133           (CurrentToken->isOneOf(tok::colon, tok::question) && InExprContext &&
134            !Style.isCSharp() && Style.Language != FormatStyle::LK_Proto &&
135            Style.Language != FormatStyle::LK_TextProto))
136         return false;
137       // If a && or || is found and interpreted as a binary operator, this set
138       // of angles is likely part of something like "a < b && c > d". If the
139       // angles are inside an expression, the ||/&& might also be a binary
140       // operator that was misinterpreted because we are parsing template
141       // parameters.
142       // FIXME: This is getting out of hand, write a decent parser.
143       if (CurrentToken->Previous->isOneOf(tok::pipepipe, tok::ampamp) &&
144           CurrentToken->Previous->is(TT_BinaryOperator) &&
145           Contexts[Contexts.size() - 2].IsExpression &&
146           !Line.startsWith(tok::kw_template))
147         return false;
148       updateParameterCount(Left, CurrentToken);
149       if (Style.Language == FormatStyle::LK_Proto) {
150         if (FormatToken *Previous = CurrentToken->getPreviousNonComment()) {
151           if (CurrentToken->is(tok::colon) ||
152               (CurrentToken->isOneOf(tok::l_brace, tok::less) &&
153                Previous->isNot(tok::colon)))
154             Previous->setType(TT_SelectorName);
155         }
156       }
157       if (!consumeToken())
158         return false;
159     }
160     return false;
161   }
162 
163   bool parseParens(bool LookForDecls = false) {
164     if (!CurrentToken)
165       return false;
166     FormatToken *Left = CurrentToken->Previous;
167     Left->ParentBracket = Contexts.back().ContextKind;
168     ScopedContextCreator ContextCreator(*this, tok::l_paren, 1);
169 
170     // FIXME: This is a bit of a hack. Do better.
171     Contexts.back().ColonIsForRangeExpr =
172         Contexts.size() == 2 && Contexts[0].ColonIsForRangeExpr;
173 
174     bool StartsObjCMethodExpr = false;
175     if (FormatToken *MaybeSel = Left->Previous) {
176       // @selector( starts a selector.
177       if (MaybeSel->isObjCAtKeyword(tok::objc_selector) && MaybeSel->Previous &&
178           MaybeSel->Previous->is(tok::at)) {
179         StartsObjCMethodExpr = true;
180       }
181     }
182 
183     if (Left->is(TT_OverloadedOperatorLParen)) {
184       Contexts.back().IsExpression = false;
185     } else if (Style.Language == FormatStyle::LK_JavaScript &&
186                (Line.startsWith(Keywords.kw_type, tok::identifier) ||
187                 Line.startsWith(tok::kw_export, Keywords.kw_type,
188                                 tok::identifier))) {
189       // type X = (...);
190       // export type X = (...);
191       Contexts.back().IsExpression = false;
192     } else if (Left->Previous &&
193                (Left->Previous->isOneOf(tok::kw_static_assert, tok::kw_decltype,
194                                         tok::kw_while, tok::l_paren,
195                                         tok::comma) ||
196                 Left->Previous->isIf() ||
197                 Left->Previous->is(TT_BinaryOperator))) {
198       // static_assert, if and while usually contain expressions.
199       Contexts.back().IsExpression = true;
200     } else if (Style.Language == FormatStyle::LK_JavaScript && Left->Previous &&
201                (Left->Previous->is(Keywords.kw_function) ||
202                 (Left->Previous->endsSequence(tok::identifier,
203                                               Keywords.kw_function)))) {
204       // function(...) or function f(...)
205       Contexts.back().IsExpression = false;
206     } else if (Style.Language == FormatStyle::LK_JavaScript && Left->Previous &&
207                Left->Previous->is(TT_JsTypeColon)) {
208       // let x: (SomeType);
209       Contexts.back().IsExpression = false;
210     } else if (isLambdaParameterList(Left)) {
211       // This is a parameter list of a lambda expression.
212       Contexts.back().IsExpression = false;
213     } else if (Line.InPPDirective &&
214                (!Left->Previous || !Left->Previous->is(tok::identifier))) {
215       Contexts.back().IsExpression = true;
216     } else if (Contexts[Contexts.size() - 2].CaretFound) {
217       // This is the parameter list of an ObjC block.
218       Contexts.back().IsExpression = false;
219     } else if (Left->Previous && Left->Previous->is(tok::kw___attribute)) {
220       Left->setType(TT_AttributeParen);
221     } else if (Left->Previous && Left->Previous->is(TT_ForEachMacro)) {
222       // The first argument to a foreach macro is a declaration.
223       Contexts.back().IsForEachMacro = true;
224       Contexts.back().IsExpression = false;
225     } else if (Left->Previous && Left->Previous->MatchingParen &&
226                Left->Previous->MatchingParen->is(TT_ObjCBlockLParen)) {
227       Contexts.back().IsExpression = false;
228     } else if (!Line.MustBeDeclaration && !Line.InPPDirective) {
229       bool IsForOrCatch =
230           Left->Previous && Left->Previous->isOneOf(tok::kw_for, tok::kw_catch);
231       Contexts.back().IsExpression = !IsForOrCatch;
232     }
233 
234     if (StartsObjCMethodExpr) {
235       Contexts.back().ColonIsObjCMethodExpr = true;
236       Left->setType(TT_ObjCMethodExpr);
237     }
238 
239     // MightBeFunctionType and ProbablyFunctionType are used for
240     // function pointer and reference types as well as Objective-C
241     // block types:
242     //
243     // void (*FunctionPointer)(void);
244     // void (&FunctionReference)(void);
245     // void (^ObjCBlock)(void);
246     bool MightBeFunctionType = !Contexts[Contexts.size() - 2].IsExpression;
247     bool ProbablyFunctionType =
248         CurrentToken->isOneOf(tok::star, tok::amp, tok::caret);
249     bool HasMultipleLines = false;
250     bool HasMultipleParametersOnALine = false;
251     bool MightBeObjCForRangeLoop =
252         Left->Previous && Left->Previous->is(tok::kw_for);
253     FormatToken *PossibleObjCForInToken = nullptr;
254     while (CurrentToken) {
255       // LookForDecls is set when "if (" has been seen. Check for
256       // 'identifier' '*' 'identifier' followed by not '=' -- this
257       // '*' has to be a binary operator but determineStarAmpUsage() will
258       // categorize it as an unary operator, so set the right type here.
259       if (LookForDecls && CurrentToken->Next) {
260         FormatToken *Prev = CurrentToken->getPreviousNonComment();
261         if (Prev) {
262           FormatToken *PrevPrev = Prev->getPreviousNonComment();
263           FormatToken *Next = CurrentToken->Next;
264           if (PrevPrev && PrevPrev->is(tok::identifier) &&
265               Prev->isOneOf(tok::star, tok::amp, tok::ampamp) &&
266               CurrentToken->is(tok::identifier) && Next->isNot(tok::equal)) {
267             Prev->setType(TT_BinaryOperator);
268             LookForDecls = false;
269           }
270         }
271       }
272 
273       if (CurrentToken->Previous->is(TT_PointerOrReference) &&
274           CurrentToken->Previous->Previous->isOneOf(tok::l_paren,
275                                                     tok::coloncolon))
276         ProbablyFunctionType = true;
277       if (CurrentToken->is(tok::comma))
278         MightBeFunctionType = false;
279       if (CurrentToken->Previous->is(TT_BinaryOperator))
280         Contexts.back().IsExpression = true;
281       if (CurrentToken->is(tok::r_paren)) {
282         if (MightBeFunctionType && ProbablyFunctionType && CurrentToken->Next &&
283             (CurrentToken->Next->is(tok::l_paren) ||
284              (CurrentToken->Next->is(tok::l_square) && Line.MustBeDeclaration)))
285           Left->setType(Left->Next->is(tok::caret) ? TT_ObjCBlockLParen
286                                                    : TT_FunctionTypeLParen);
287         Left->MatchingParen = CurrentToken;
288         CurrentToken->MatchingParen = Left;
289 
290         if (CurrentToken->Next && CurrentToken->Next->is(tok::l_brace) &&
291             Left->Previous && Left->Previous->is(tok::l_paren)) {
292           // Detect the case where macros are used to generate lambdas or
293           // function bodies, e.g.:
294           //   auto my_lambda = MARCO((Type *type, int i) { .. body .. });
295           for (FormatToken *Tok = Left; Tok != CurrentToken; Tok = Tok->Next) {
296             if (Tok->is(TT_BinaryOperator) &&
297                 Tok->isOneOf(tok::star, tok::amp, tok::ampamp))
298               Tok->setType(TT_PointerOrReference);
299           }
300         }
301 
302         if (StartsObjCMethodExpr) {
303           CurrentToken->setType(TT_ObjCMethodExpr);
304           if (Contexts.back().FirstObjCSelectorName) {
305             Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
306                 Contexts.back().LongestObjCSelectorName;
307           }
308         }
309 
310         if (Left->is(TT_AttributeParen))
311           CurrentToken->setType(TT_AttributeParen);
312         if (Left->Previous && Left->Previous->is(TT_JavaAnnotation))
313           CurrentToken->setType(TT_JavaAnnotation);
314         if (Left->Previous && Left->Previous->is(TT_LeadingJavaAnnotation))
315           CurrentToken->setType(TT_LeadingJavaAnnotation);
316         if (Left->Previous && Left->Previous->is(TT_AttributeSquare))
317           CurrentToken->setType(TT_AttributeSquare);
318 
319         if (!HasMultipleLines)
320           Left->PackingKind = PPK_Inconclusive;
321         else if (HasMultipleParametersOnALine)
322           Left->PackingKind = PPK_BinPacked;
323         else
324           Left->PackingKind = PPK_OnePerLine;
325 
326         next();
327         return true;
328       }
329       if (CurrentToken->isOneOf(tok::r_square, tok::r_brace))
330         return false;
331 
332       if (CurrentToken->is(tok::l_brace))
333         Left->setType(TT_Unknown); // Not TT_ObjCBlockLParen
334       if (CurrentToken->is(tok::comma) && CurrentToken->Next &&
335           !CurrentToken->Next->HasUnescapedNewline &&
336           !CurrentToken->Next->isTrailingComment())
337         HasMultipleParametersOnALine = true;
338       if ((CurrentToken->Previous->isOneOf(tok::kw_const, tok::kw_auto) ||
339            CurrentToken->Previous->isSimpleTypeSpecifier()) &&
340           !CurrentToken->is(tok::l_brace))
341         Contexts.back().IsExpression = false;
342       if (CurrentToken->isOneOf(tok::semi, tok::colon)) {
343         MightBeObjCForRangeLoop = false;
344         if (PossibleObjCForInToken) {
345           PossibleObjCForInToken->setType(TT_Unknown);
346           PossibleObjCForInToken = nullptr;
347         }
348       }
349       if (MightBeObjCForRangeLoop && CurrentToken->is(Keywords.kw_in)) {
350         PossibleObjCForInToken = CurrentToken;
351         PossibleObjCForInToken->setType(TT_ObjCForIn);
352       }
353       // When we discover a 'new', we set CanBeExpression to 'false' in order to
354       // parse the type correctly. Reset that after a comma.
355       if (CurrentToken->is(tok::comma))
356         Contexts.back().CanBeExpression = true;
357 
358       FormatToken *Tok = CurrentToken;
359       if (!consumeToken())
360         return false;
361       updateParameterCount(Left, Tok);
362       if (CurrentToken && CurrentToken->HasUnescapedNewline)
363         HasMultipleLines = true;
364     }
365     return false;
366   }
367 
368   bool isCSharpAttributeSpecifier(const FormatToken &Tok) {
369     if (!Style.isCSharp())
370       return false;
371 
372     // `identifier[i]` is not an attribute.
373     if (Tok.Previous && Tok.Previous->is(tok::identifier))
374       return false;
375 
376     // Chains of [] in `identifier[i][j][k]` are not attributes.
377     if (Tok.Previous && Tok.Previous->is(tok::r_square)) {
378       auto *MatchingParen = Tok.Previous->MatchingParen;
379       if (!MatchingParen || MatchingParen->is(TT_ArraySubscriptLSquare))
380         return false;
381     }
382 
383     const FormatToken *AttrTok = Tok.Next;
384     if (!AttrTok)
385       return false;
386 
387     // Just an empty declaration e.g. string [].
388     if (AttrTok->is(tok::r_square))
389       return false;
390 
391     // Move along the tokens inbetween the '[' and ']' e.g. [STAThread].
392     while (AttrTok && AttrTok->isNot(tok::r_square)) {
393       AttrTok = AttrTok->Next;
394     }
395 
396     if (!AttrTok)
397       return false;
398 
399     // Allow an attribute to be the only content of a file.
400     AttrTok = AttrTok->Next;
401     if (!AttrTok)
402       return true;
403 
404     // Limit this to being an access modifier that follows.
405     if (AttrTok->isOneOf(tok::kw_public, tok::kw_private, tok::kw_protected,
406                          tok::comment, tok::kw_class, tok::kw_static,
407                          tok::l_square, Keywords.kw_internal)) {
408       return true;
409     }
410 
411     // incase its a [XXX] retval func(....
412     if (AttrTok->Next &&
413         AttrTok->Next->startsSequence(tok::identifier, tok::l_paren))
414       return true;
415 
416     return false;
417   }
418 
419   bool isCpp11AttributeSpecifier(const FormatToken &Tok) {
420     if (!Style.isCpp() || !Tok.startsSequence(tok::l_square, tok::l_square))
421       return false;
422     // The first square bracket is part of an ObjC array literal
423     if (Tok.Previous && Tok.Previous->is(tok::at)) {
424       return false;
425     }
426     const FormatToken *AttrTok = Tok.Next->Next;
427     if (!AttrTok)
428       return false;
429     // C++17 '[[using ns: foo, bar(baz, blech)]]'
430     // We assume nobody will name an ObjC variable 'using'.
431     if (AttrTok->startsSequence(tok::kw_using, tok::identifier, tok::colon))
432       return true;
433     if (AttrTok->isNot(tok::identifier))
434       return false;
435     while (AttrTok && !AttrTok->startsSequence(tok::r_square, tok::r_square)) {
436       // ObjC message send. We assume nobody will use : in a C++11 attribute
437       // specifier parameter, although this is technically valid:
438       // [[foo(:)]].
439       if (AttrTok->is(tok::colon) ||
440           AttrTok->startsSequence(tok::identifier, tok::identifier) ||
441           AttrTok->startsSequence(tok::r_paren, tok::identifier))
442         return false;
443       if (AttrTok->is(tok::ellipsis))
444         return true;
445       AttrTok = AttrTok->Next;
446     }
447     return AttrTok && AttrTok->startsSequence(tok::r_square, tok::r_square);
448   }
449 
450   bool parseSquare() {
451     if (!CurrentToken)
452       return false;
453 
454     // A '[' could be an index subscript (after an identifier or after
455     // ')' or ']'), it could be the start of an Objective-C method
456     // expression, it could the start of an Objective-C array literal,
457     // or it could be a C++ attribute specifier [[foo::bar]].
458     FormatToken *Left = CurrentToken->Previous;
459     Left->ParentBracket = Contexts.back().ContextKind;
460     FormatToken *Parent = Left->getPreviousNonComment();
461 
462     // Cases where '>' is followed by '['.
463     // In C++, this can happen either in array of templates (foo<int>[10])
464     // or when array is a nested template type (unique_ptr<type1<type2>[]>).
465     bool CppArrayTemplates =
466         Style.isCpp() && Parent && Parent->is(TT_TemplateCloser) &&
467         (Contexts.back().CanBeExpression || Contexts.back().IsExpression ||
468          Contexts.back().InTemplateArgument);
469 
470     bool IsCpp11AttributeSpecifier = isCpp11AttributeSpecifier(*Left) ||
471                                      Contexts.back().InCpp11AttributeSpecifier;
472 
473     // Treat C# Attributes [STAThread] much like C++ attributes [[...]].
474     bool IsCSharpAttributeSpecifier =
475         isCSharpAttributeSpecifier(*Left) ||
476         Contexts.back().InCSharpAttributeSpecifier;
477 
478     bool InsideInlineASM = Line.startsWith(tok::kw_asm);
479     bool IsCppStructuredBinding = Left->isCppStructuredBinding(Style);
480     bool StartsObjCMethodExpr =
481         !IsCppStructuredBinding && !InsideInlineASM && !CppArrayTemplates &&
482         Style.isCpp() && !IsCpp11AttributeSpecifier &&
483         !IsCSharpAttributeSpecifier && Contexts.back().CanBeExpression &&
484         Left->isNot(TT_LambdaLSquare) &&
485         !CurrentToken->isOneOf(tok::l_brace, tok::r_square) &&
486         (!Parent ||
487          Parent->isOneOf(tok::colon, tok::l_square, tok::l_paren,
488                          tok::kw_return, tok::kw_throw) ||
489          Parent->isUnaryOperator() ||
490          // FIXME(bug 36976): ObjC return types shouldn't use TT_CastRParen.
491          Parent->isOneOf(TT_ObjCForIn, TT_CastRParen) ||
492          (getBinOpPrecedence(Parent->Tok.getKind(), true, true) >
493           prec::Unknown));
494     bool ColonFound = false;
495 
496     unsigned BindingIncrease = 1;
497     if (IsCppStructuredBinding) {
498       Left->setType(TT_StructuredBindingLSquare);
499     } else if (Left->is(TT_Unknown)) {
500       if (StartsObjCMethodExpr) {
501         Left->setType(TT_ObjCMethodExpr);
502       } else if (InsideInlineASM) {
503         Left->setType(TT_InlineASMSymbolicNameLSquare);
504       } else if (IsCpp11AttributeSpecifier) {
505         Left->setType(TT_AttributeSquare);
506       } else if (Style.Language == FormatStyle::LK_JavaScript && Parent &&
507                  Contexts.back().ContextKind == tok::l_brace &&
508                  Parent->isOneOf(tok::l_brace, tok::comma)) {
509         Left->setType(TT_JsComputedPropertyName);
510       } else if (Style.isCpp() && Contexts.back().ContextKind == tok::l_brace &&
511                  Parent && Parent->isOneOf(tok::l_brace, tok::comma)) {
512         Left->setType(TT_DesignatedInitializerLSquare);
513       } else if (IsCSharpAttributeSpecifier) {
514         Left->setType(TT_AttributeSquare);
515       } else if (CurrentToken->is(tok::r_square) && Parent &&
516                  Parent->is(TT_TemplateCloser)) {
517         Left->setType(TT_ArraySubscriptLSquare);
518       } else if (Style.Language == FormatStyle::LK_Proto ||
519                  Style.Language == FormatStyle::LK_TextProto) {
520         // Square braces in LK_Proto can either be message field attributes:
521         //
522         // optional Aaa aaa = 1 [
523         //   (aaa) = aaa
524         // ];
525         //
526         // extensions 123 [
527         //   (aaa) = aaa
528         // ];
529         //
530         // or text proto extensions (in options):
531         //
532         // option (Aaa.options) = {
533         //   [type.type/type] {
534         //     key: value
535         //   }
536         // }
537         //
538         // or repeated fields (in options):
539         //
540         // option (Aaa.options) = {
541         //   keys: [ 1, 2, 3 ]
542         // }
543         //
544         // In the first and the third case we want to spread the contents inside
545         // the square braces; in the second we want to keep them inline.
546         Left->setType(TT_ArrayInitializerLSquare);
547         if (!Left->endsSequence(tok::l_square, tok::numeric_constant,
548                                 tok::equal) &&
549             !Left->endsSequence(tok::l_square, tok::numeric_constant,
550                                 tok::identifier) &&
551             !Left->endsSequence(tok::l_square, tok::colon, TT_SelectorName)) {
552           Left->setType(TT_ProtoExtensionLSquare);
553           BindingIncrease = 10;
554         }
555       } else if (!CppArrayTemplates && Parent &&
556                  Parent->isOneOf(TT_BinaryOperator, TT_TemplateCloser, tok::at,
557                                  tok::comma, tok::l_paren, tok::l_square,
558                                  tok::question, tok::colon, tok::kw_return,
559                                  // Should only be relevant to JavaScript:
560                                  tok::kw_default)) {
561         Left->setType(TT_ArrayInitializerLSquare);
562       } else {
563         BindingIncrease = 10;
564         Left->setType(TT_ArraySubscriptLSquare);
565       }
566     }
567 
568     ScopedContextCreator ContextCreator(*this, tok::l_square, BindingIncrease);
569     Contexts.back().IsExpression = true;
570     if (Style.Language == FormatStyle::LK_JavaScript && Parent &&
571         Parent->is(TT_JsTypeColon))
572       Contexts.back().IsExpression = false;
573 
574     Contexts.back().ColonIsObjCMethodExpr = StartsObjCMethodExpr;
575     Contexts.back().InCpp11AttributeSpecifier = IsCpp11AttributeSpecifier;
576     Contexts.back().InCSharpAttributeSpecifier = IsCSharpAttributeSpecifier;
577 
578     while (CurrentToken) {
579       if (CurrentToken->is(tok::r_square)) {
580         if (IsCpp11AttributeSpecifier)
581           CurrentToken->setType(TT_AttributeSquare);
582         if (IsCSharpAttributeSpecifier)
583           CurrentToken->setType(TT_AttributeSquare);
584         else if (((CurrentToken->Next &&
585                    CurrentToken->Next->is(tok::l_paren)) ||
586                   (CurrentToken->Previous &&
587                    CurrentToken->Previous->Previous == Left)) &&
588                  Left->is(TT_ObjCMethodExpr)) {
589           // An ObjC method call is rarely followed by an open parenthesis. It
590           // also can't be composed of just one token, unless it's a macro that
591           // will be expanded to more tokens.
592           // FIXME: Do we incorrectly label ":" with this?
593           StartsObjCMethodExpr = false;
594           Left->setType(TT_Unknown);
595         }
596         if (StartsObjCMethodExpr && CurrentToken->Previous != Left) {
597           CurrentToken->setType(TT_ObjCMethodExpr);
598           // If we haven't seen a colon yet, make sure the last identifier
599           // before the r_square is tagged as a selector name component.
600           if (!ColonFound && CurrentToken->Previous &&
601               CurrentToken->Previous->is(TT_Unknown) &&
602               canBeObjCSelectorComponent(*CurrentToken->Previous))
603             CurrentToken->Previous->setType(TT_SelectorName);
604           // determineStarAmpUsage() thinks that '*' '[' is allocating an
605           // array of pointers, but if '[' starts a selector then '*' is a
606           // binary operator.
607           if (Parent && Parent->is(TT_PointerOrReference))
608             Parent->setType(TT_BinaryOperator);
609         }
610         // An arrow after an ObjC method expression is not a lambda arrow.
611         if (CurrentToken->getType() == TT_ObjCMethodExpr &&
612             CurrentToken->Next && CurrentToken->Next->is(TT_LambdaArrow))
613           CurrentToken->Next->setType(TT_Unknown);
614         Left->MatchingParen = CurrentToken;
615         CurrentToken->MatchingParen = Left;
616         // FirstObjCSelectorName is set when a colon is found. This does
617         // not work, however, when the method has no parameters.
618         // Here, we set FirstObjCSelectorName when the end of the method call is
619         // reached, in case it was not set already.
620         if (!Contexts.back().FirstObjCSelectorName) {
621           FormatToken *Previous = CurrentToken->getPreviousNonComment();
622           if (Previous && Previous->is(TT_SelectorName)) {
623             Previous->ObjCSelectorNameParts = 1;
624             Contexts.back().FirstObjCSelectorName = Previous;
625           }
626         } else {
627           Left->ParameterCount =
628               Contexts.back().FirstObjCSelectorName->ObjCSelectorNameParts;
629         }
630         if (Contexts.back().FirstObjCSelectorName) {
631           Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
632               Contexts.back().LongestObjCSelectorName;
633           if (Left->BlockParameterCount > 1)
634             Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName = 0;
635         }
636         next();
637         return true;
638       }
639       if (CurrentToken->isOneOf(tok::r_paren, tok::r_brace))
640         return false;
641       if (CurrentToken->is(tok::colon)) {
642         if (IsCpp11AttributeSpecifier &&
643             CurrentToken->endsSequence(tok::colon, tok::identifier,
644                                        tok::kw_using)) {
645           // Remember that this is a [[using ns: foo]] C++ attribute, so we
646           // don't add a space before the colon (unlike other colons).
647           CurrentToken->setType(TT_AttributeColon);
648         } else if (Left->isOneOf(TT_ArraySubscriptLSquare,
649                                  TT_DesignatedInitializerLSquare)) {
650           Left->setType(TT_ObjCMethodExpr);
651           StartsObjCMethodExpr = true;
652           Contexts.back().ColonIsObjCMethodExpr = true;
653           if (Parent && Parent->is(tok::r_paren))
654             // FIXME(bug 36976): ObjC return types shouldn't use TT_CastRParen.
655             Parent->setType(TT_CastRParen);
656         }
657         ColonFound = true;
658       }
659       if (CurrentToken->is(tok::comma) && Left->is(TT_ObjCMethodExpr) &&
660           !ColonFound)
661         Left->setType(TT_ArrayInitializerLSquare);
662       FormatToken *Tok = CurrentToken;
663       if (!consumeToken())
664         return false;
665       updateParameterCount(Left, Tok);
666     }
667     return false;
668   }
669 
670   bool parseBrace() {
671     if (CurrentToken) {
672       FormatToken *Left = CurrentToken->Previous;
673       Left->ParentBracket = Contexts.back().ContextKind;
674 
675       if (Contexts.back().CaretFound)
676         Left->setType(TT_ObjCBlockLBrace);
677       Contexts.back().CaretFound = false;
678 
679       ScopedContextCreator ContextCreator(*this, tok::l_brace, 1);
680       Contexts.back().ColonIsDictLiteral = true;
681       if (Left->BlockKind == BK_BracedInit)
682         Contexts.back().IsExpression = true;
683       if (Style.Language == FormatStyle::LK_JavaScript && Left->Previous &&
684           Left->Previous->is(TT_JsTypeColon))
685         Contexts.back().IsExpression = false;
686 
687       while (CurrentToken) {
688         if (CurrentToken->is(tok::r_brace)) {
689           Left->MatchingParen = CurrentToken;
690           CurrentToken->MatchingParen = Left;
691           next();
692           return true;
693         }
694         if (CurrentToken->isOneOf(tok::r_paren, tok::r_square))
695           return false;
696         updateParameterCount(Left, CurrentToken);
697         if (CurrentToken->isOneOf(tok::colon, tok::l_brace, tok::less)) {
698           FormatToken *Previous = CurrentToken->getPreviousNonComment();
699           if (Previous->is(TT_JsTypeOptionalQuestion))
700             Previous = Previous->getPreviousNonComment();
701           if ((CurrentToken->is(tok::colon) &&
702                (!Contexts.back().ColonIsDictLiteral || !Style.isCpp())) ||
703               Style.Language == FormatStyle::LK_Proto ||
704               Style.Language == FormatStyle::LK_TextProto) {
705             Left->setType(TT_DictLiteral);
706             if (Previous->Tok.getIdentifierInfo() ||
707                 Previous->is(tok::string_literal))
708               Previous->setType(TT_SelectorName);
709           }
710           if (CurrentToken->is(tok::colon) ||
711               Style.Language == FormatStyle::LK_JavaScript)
712             Left->setType(TT_DictLiteral);
713         }
714         if (CurrentToken->is(tok::comma) &&
715             Style.Language == FormatStyle::LK_JavaScript)
716           Left->setType(TT_DictLiteral);
717         if (!consumeToken())
718           return false;
719       }
720     }
721     return true;
722   }
723 
724   void updateParameterCount(FormatToken *Left, FormatToken *Current) {
725     // For ObjC methods, the number of parameters is calculated differently as
726     // method declarations have a different structure (the parameters are not
727     // inside a bracket scope).
728     if (Current->is(tok::l_brace) && Current->BlockKind == BK_Block)
729       ++Left->BlockParameterCount;
730     if (Current->is(tok::comma)) {
731       ++Left->ParameterCount;
732       if (!Left->Role)
733         Left->Role.reset(new CommaSeparatedList(Style));
734       Left->Role->CommaFound(Current);
735     } else if (Left->ParameterCount == 0 && Current->isNot(tok::comment)) {
736       Left->ParameterCount = 1;
737     }
738   }
739 
740   bool parseConditional() {
741     while (CurrentToken) {
742       if (CurrentToken->is(tok::colon)) {
743         CurrentToken->setType(TT_ConditionalExpr);
744         next();
745         return true;
746       }
747       if (!consumeToken())
748         return false;
749     }
750     return false;
751   }
752 
753   bool parseTemplateDeclaration() {
754     if (CurrentToken && CurrentToken->is(tok::less)) {
755       CurrentToken->setType(TT_TemplateOpener);
756       next();
757       if (!parseAngle())
758         return false;
759       if (CurrentToken)
760         CurrentToken->Previous->ClosesTemplateDeclaration = true;
761       return true;
762     }
763     return false;
764   }
765 
766   bool consumeToken() {
767     FormatToken *Tok = CurrentToken;
768     next();
769     switch (Tok->Tok.getKind()) {
770     case tok::plus:
771     case tok::minus:
772       if (!Tok->Previous && Line.MustBeDeclaration)
773         Tok->setType(TT_ObjCMethodSpecifier);
774       break;
775     case tok::colon:
776       if (!Tok->Previous)
777         return false;
778       // Colons from ?: are handled in parseConditional().
779       if (Style.Language == FormatStyle::LK_JavaScript) {
780         if (Contexts.back().ColonIsForRangeExpr || // colon in for loop
781             (Contexts.size() == 1 &&               // switch/case labels
782              !Line.First->isOneOf(tok::kw_enum, tok::kw_case)) ||
783             Contexts.back().ContextKind == tok::l_paren ||  // function params
784             Contexts.back().ContextKind == tok::l_square || // array type
785             (!Contexts.back().IsExpression &&
786              Contexts.back().ContextKind == tok::l_brace) || // object type
787             (Contexts.size() == 1 &&
788              Line.MustBeDeclaration)) { // method/property declaration
789           Contexts.back().IsExpression = false;
790           Tok->setType(TT_JsTypeColon);
791           break;
792         }
793       } else if (Style.isCSharp()) {
794         if (Contexts.back().InCSharpAttributeSpecifier) {
795           Tok->setType(TT_AttributeColon);
796           break;
797         }
798         if (Contexts.back().ContextKind == tok::l_paren) {
799           Tok->setType(TT_CSharpNamedArgumentColon);
800           break;
801         }
802       }
803       if (Contexts.back().ColonIsDictLiteral ||
804           Style.Language == FormatStyle::LK_Proto ||
805           Style.Language == FormatStyle::LK_TextProto) {
806         Tok->setType(TT_DictLiteral);
807         if (Style.Language == FormatStyle::LK_TextProto) {
808           if (FormatToken *Previous = Tok->getPreviousNonComment())
809             Previous->setType(TT_SelectorName);
810         }
811       } else if (Contexts.back().ColonIsObjCMethodExpr ||
812                  Line.startsWith(TT_ObjCMethodSpecifier)) {
813         Tok->setType(TT_ObjCMethodExpr);
814         const FormatToken *BeforePrevious = Tok->Previous->Previous;
815         // Ensure we tag all identifiers in method declarations as
816         // TT_SelectorName.
817         bool UnknownIdentifierInMethodDeclaration =
818             Line.startsWith(TT_ObjCMethodSpecifier) &&
819             Tok->Previous->is(tok::identifier) && Tok->Previous->is(TT_Unknown);
820         if (!BeforePrevious ||
821             // FIXME(bug 36976): ObjC return types shouldn't use TT_CastRParen.
822             !(BeforePrevious->is(TT_CastRParen) ||
823               (BeforePrevious->is(TT_ObjCMethodExpr) &&
824                BeforePrevious->is(tok::colon))) ||
825             BeforePrevious->is(tok::r_square) ||
826             Contexts.back().LongestObjCSelectorName == 0 ||
827             UnknownIdentifierInMethodDeclaration) {
828           Tok->Previous->setType(TT_SelectorName);
829           if (!Contexts.back().FirstObjCSelectorName)
830             Contexts.back().FirstObjCSelectorName = Tok->Previous;
831           else if (Tok->Previous->ColumnWidth >
832                    Contexts.back().LongestObjCSelectorName)
833             Contexts.back().LongestObjCSelectorName =
834                 Tok->Previous->ColumnWidth;
835           Tok->Previous->ParameterIndex =
836               Contexts.back().FirstObjCSelectorName->ObjCSelectorNameParts;
837           ++Contexts.back().FirstObjCSelectorName->ObjCSelectorNameParts;
838         }
839       } else if (Contexts.back().ColonIsForRangeExpr) {
840         Tok->setType(TT_RangeBasedForLoopColon);
841       } else if (CurrentToken && CurrentToken->is(tok::numeric_constant)) {
842         Tok->setType(TT_BitFieldColon);
843       } else if (Contexts.size() == 1 &&
844                  !Line.First->isOneOf(tok::kw_enum, tok::kw_case)) {
845         FormatToken *Prev = Tok->getPreviousNonComment();
846         if (Prev->isOneOf(tok::r_paren, tok::kw_noexcept))
847           Tok->setType(TT_CtorInitializerColon);
848         else if (Prev->is(tok::kw_try)) {
849           // Member initializer list within function try block.
850           FormatToken *PrevPrev = Prev->getPreviousNonComment();
851           if (PrevPrev && PrevPrev->isOneOf(tok::r_paren, tok::kw_noexcept))
852             Tok->setType(TT_CtorInitializerColon);
853         } else
854           Tok->setType(TT_InheritanceColon);
855       } else if (canBeObjCSelectorComponent(*Tok->Previous) && Tok->Next &&
856                  (Tok->Next->isOneOf(tok::r_paren, tok::comma) ||
857                   (canBeObjCSelectorComponent(*Tok->Next) && Tok->Next->Next &&
858                    Tok->Next->Next->is(tok::colon)))) {
859         // This handles a special macro in ObjC code where selectors including
860         // the colon are passed as macro arguments.
861         Tok->setType(TT_ObjCMethodExpr);
862       } else if (Contexts.back().ContextKind == tok::l_paren) {
863         Tok->setType(TT_InlineASMColon);
864       }
865       break;
866     case tok::pipe:
867     case tok::amp:
868       // | and & in declarations/type expressions represent union and
869       // intersection types, respectively.
870       if (Style.Language == FormatStyle::LK_JavaScript &&
871           !Contexts.back().IsExpression)
872         Tok->setType(TT_JsTypeOperator);
873       break;
874     case tok::kw_if:
875     case tok::kw_while:
876       if (Tok->is(tok::kw_if) && CurrentToken &&
877           CurrentToken->isOneOf(tok::kw_constexpr, tok::identifier))
878         next();
879       if (CurrentToken && CurrentToken->is(tok::l_paren)) {
880         next();
881         if (!parseParens(/*LookForDecls=*/true))
882           return false;
883       }
884       break;
885     case tok::kw_for:
886       if (Style.Language == FormatStyle::LK_JavaScript) {
887         // x.for and {for: ...}
888         if ((Tok->Previous && Tok->Previous->is(tok::period)) ||
889             (Tok->Next && Tok->Next->is(tok::colon)))
890           break;
891         // JS' for await ( ...
892         if (CurrentToken && CurrentToken->is(Keywords.kw_await))
893           next();
894       }
895       Contexts.back().ColonIsForRangeExpr = true;
896       next();
897       if (!parseParens())
898         return false;
899       break;
900     case tok::l_paren:
901       // When faced with 'operator()()', the kw_operator handler incorrectly
902       // marks the first l_paren as a OverloadedOperatorLParen. Here, we make
903       // the first two parens OverloadedOperators and the second l_paren an
904       // OverloadedOperatorLParen.
905       if (Tok->Previous && Tok->Previous->is(tok::r_paren) &&
906           Tok->Previous->MatchingParen &&
907           Tok->Previous->MatchingParen->is(TT_OverloadedOperatorLParen)) {
908         Tok->Previous->setType(TT_OverloadedOperator);
909         Tok->Previous->MatchingParen->setType(TT_OverloadedOperator);
910         Tok->setType(TT_OverloadedOperatorLParen);
911       }
912 
913       if (!parseParens())
914         return false;
915       if (Line.MustBeDeclaration && Contexts.size() == 1 &&
916           !Contexts.back().IsExpression && !Line.startsWith(TT_ObjCProperty) &&
917           (!Tok->Previous ||
918            !Tok->Previous->isOneOf(tok::kw_decltype, tok::kw___attribute,
919                                    TT_LeadingJavaAnnotation)))
920         Line.MightBeFunctionDecl = true;
921       break;
922     case tok::l_square:
923       if (!parseSquare())
924         return false;
925       break;
926     case tok::l_brace:
927       if (Style.Language == FormatStyle::LK_TextProto) {
928         FormatToken *Previous = Tok->getPreviousNonComment();
929         if (Previous && Previous->getType() != TT_DictLiteral)
930           Previous->setType(TT_SelectorName);
931       }
932       if (!parseBrace())
933         return false;
934       break;
935     case tok::less:
936       if (parseAngle()) {
937         Tok->setType(TT_TemplateOpener);
938         // In TT_Proto, we must distignuish between:
939         //   map<key, value>
940         //   msg < item: data >
941         //   msg: < item: data >
942         // In TT_TextProto, map<key, value> does not occur.
943         if (Style.Language == FormatStyle::LK_TextProto ||
944             (Style.Language == FormatStyle::LK_Proto && Tok->Previous &&
945              Tok->Previous->isOneOf(TT_SelectorName, TT_DictLiteral))) {
946           Tok->setType(TT_DictLiteral);
947           FormatToken *Previous = Tok->getPreviousNonComment();
948           if (Previous && Previous->getType() != TT_DictLiteral)
949             Previous->setType(TT_SelectorName);
950         }
951       } else {
952         Tok->setType(TT_BinaryOperator);
953         NonTemplateLess.insert(Tok);
954         CurrentToken = Tok;
955         next();
956       }
957       break;
958     case tok::r_paren:
959     case tok::r_square:
960       return false;
961     case tok::r_brace:
962       // Lines can start with '}'.
963       if (Tok->Previous)
964         return false;
965       break;
966     case tok::greater:
967       if (Style.Language != FormatStyle::LK_TextProto)
968         Tok->setType(TT_BinaryOperator);
969       if (Tok->Previous && Tok->Previous->is(TT_TemplateCloser))
970         Tok->SpacesRequiredBefore = 1;
971       break;
972     case tok::kw_operator:
973       if (Style.Language == FormatStyle::LK_TextProto ||
974           Style.Language == FormatStyle::LK_Proto)
975         break;
976       while (CurrentToken &&
977              !CurrentToken->isOneOf(tok::l_paren, tok::semi, tok::r_paren)) {
978         if (CurrentToken->isOneOf(tok::star, tok::amp))
979           CurrentToken->setType(TT_PointerOrReference);
980         consumeToken();
981         if (CurrentToken && CurrentToken->Previous->isOneOf(
982                                 TT_BinaryOperator, TT_UnaryOperator, tok::comma,
983                                 tok::star, tok::arrow, tok::amp, tok::ampamp))
984           CurrentToken->Previous->setType(TT_OverloadedOperator);
985       }
986       if (CurrentToken) {
987         CurrentToken->setType(TT_OverloadedOperatorLParen);
988         if (CurrentToken->Previous->is(TT_BinaryOperator))
989           CurrentToken->Previous->setType(TT_OverloadedOperator);
990       }
991       break;
992     case tok::question:
993       if (Tok->is(TT_CSharpNullConditionalLSquare)) {
994         if (!parseSquare())
995           return false;
996         break;
997       }
998       if (Tok->isOneOf(TT_CSharpNullConditional, TT_CSharpNullCoalescing))
999         break;
1000       if (Style.Language == FormatStyle::LK_JavaScript && Tok->Next &&
1001           Tok->Next->isOneOf(tok::semi, tok::comma, tok::colon, tok::r_paren,
1002                              tok::r_brace)) {
1003         // Question marks before semicolons, colons, etc. indicate optional
1004         // types (fields, parameters), e.g.
1005         //   function(x?: string, y?) {...}
1006         //   class X { y?; }
1007         Tok->setType(TT_JsTypeOptionalQuestion);
1008         break;
1009       }
1010       // Declarations cannot be conditional expressions, this can only be part
1011       // of a type declaration.
1012       if (Line.MustBeDeclaration && !Contexts.back().IsExpression &&
1013           Style.Language == FormatStyle::LK_JavaScript)
1014         break;
1015       if (Style.isCSharp()) {
1016         // `Type?)`, `Type?>`, `Type? name;` and `Type? name =` can only be
1017         // nullable types.
1018         // Line.MustBeDeclaration will be true for `Type? name;`.
1019         if ((!Contexts.back().IsExpression && Line.MustBeDeclaration) ||
1020             (Tok->Next && Tok->Next->isOneOf(tok::r_paren, tok::greater)) ||
1021             (Tok->Next && Tok->Next->is(tok::identifier) && Tok->Next->Next &&
1022              Tok->Next->Next->is(tok::equal))) {
1023           Tok->setType(TT_CSharpNullable);
1024           break;
1025         }
1026       }
1027       parseConditional();
1028       break;
1029     case tok::kw_template:
1030       parseTemplateDeclaration();
1031       break;
1032     case tok::comma:
1033       if (Contexts.back().InCtorInitializer)
1034         Tok->setType(TT_CtorInitializerComma);
1035       else if (Contexts.back().InInheritanceList)
1036         Tok->setType(TT_InheritanceComma);
1037       else if (Contexts.back().FirstStartOfName &&
1038                (Contexts.size() == 1 || Line.startsWith(tok::kw_for))) {
1039         Contexts.back().FirstStartOfName->PartOfMultiVariableDeclStmt = true;
1040         Line.IsMultiVariableDeclStmt = true;
1041       }
1042       if (Contexts.back().IsForEachMacro)
1043         Contexts.back().IsExpression = true;
1044       break;
1045     case tok::identifier:
1046       if (Tok->isOneOf(Keywords.kw___has_include,
1047                        Keywords.kw___has_include_next)) {
1048         parseHasInclude();
1049       }
1050       if (Style.isCSharp() && Tok->is(Keywords.kw_where) && Tok->Next &&
1051           Tok->Next->isNot(tok::l_paren)) {
1052         Tok->setType(TT_CSharpGenericTypeConstraint);
1053         parseCSharpGenericTypeConstraint();
1054       }
1055       break;
1056     default:
1057       break;
1058     }
1059     return true;
1060   }
1061 
1062   void parseCSharpGenericTypeConstraint() {
1063     int OpenAngleBracketsCount = 0;
1064     while (CurrentToken) {
1065       if (CurrentToken->is(tok::less)) {
1066         // parseAngle is too greedy and will consume the whole line.
1067         CurrentToken->setType(TT_TemplateOpener);
1068         ++OpenAngleBracketsCount;
1069         next();
1070       } else if (CurrentToken->is(tok::greater)) {
1071         CurrentToken->setType(TT_TemplateCloser);
1072         --OpenAngleBracketsCount;
1073         next();
1074       } else if (CurrentToken->is(tok::comma) && OpenAngleBracketsCount == 0) {
1075         // We allow line breaks after GenericTypeConstraintComma's
1076         // so do not flag commas in Generics as GenericTypeConstraintComma's.
1077         CurrentToken->setType(TT_CSharpGenericTypeConstraintComma);
1078         next();
1079       } else if (CurrentToken->is(Keywords.kw_where)) {
1080         CurrentToken->setType(TT_CSharpGenericTypeConstraint);
1081         next();
1082       } else if (CurrentToken->is(tok::colon)) {
1083         CurrentToken->setType(TT_CSharpGenericTypeConstraintColon);
1084         next();
1085       } else {
1086         next();
1087       }
1088     }
1089   }
1090 
1091   void parseIncludeDirective() {
1092     if (CurrentToken && CurrentToken->is(tok::less)) {
1093       next();
1094       while (CurrentToken) {
1095         // Mark tokens up to the trailing line comments as implicit string
1096         // literals.
1097         if (CurrentToken->isNot(tok::comment) &&
1098             !CurrentToken->TokenText.startswith("//"))
1099           CurrentToken->setType(TT_ImplicitStringLiteral);
1100         next();
1101       }
1102     }
1103   }
1104 
1105   void parseWarningOrError() {
1106     next();
1107     // We still want to format the whitespace left of the first token of the
1108     // warning or error.
1109     next();
1110     while (CurrentToken) {
1111       CurrentToken->setType(TT_ImplicitStringLiteral);
1112       next();
1113     }
1114   }
1115 
1116   void parsePragma() {
1117     next(); // Consume "pragma".
1118     if (CurrentToken &&
1119         CurrentToken->isOneOf(Keywords.kw_mark, Keywords.kw_option)) {
1120       bool IsMark = CurrentToken->is(Keywords.kw_mark);
1121       next(); // Consume "mark".
1122       next(); // Consume first token (so we fix leading whitespace).
1123       while (CurrentToken) {
1124         if (IsMark || CurrentToken->Previous->is(TT_BinaryOperator))
1125           CurrentToken->setType(TT_ImplicitStringLiteral);
1126         next();
1127       }
1128     }
1129   }
1130 
1131   void parseHasInclude() {
1132     if (!CurrentToken || !CurrentToken->is(tok::l_paren))
1133       return;
1134     next(); // '('
1135     parseIncludeDirective();
1136     next(); // ')'
1137   }
1138 
1139   LineType parsePreprocessorDirective() {
1140     bool IsFirstToken = CurrentToken->IsFirst;
1141     LineType Type = LT_PreprocessorDirective;
1142     next();
1143     if (!CurrentToken)
1144       return Type;
1145 
1146     if (Style.Language == FormatStyle::LK_JavaScript && IsFirstToken) {
1147       // JavaScript files can contain shebang lines of the form:
1148       // #!/usr/bin/env node
1149       // Treat these like C++ #include directives.
1150       while (CurrentToken) {
1151         // Tokens cannot be comments here.
1152         CurrentToken->setType(TT_ImplicitStringLiteral);
1153         next();
1154       }
1155       return LT_ImportStatement;
1156     }
1157 
1158     if (CurrentToken->Tok.is(tok::numeric_constant)) {
1159       CurrentToken->SpacesRequiredBefore = 1;
1160       return Type;
1161     }
1162     // Hashes in the middle of a line can lead to any strange token
1163     // sequence.
1164     if (!CurrentToken->Tok.getIdentifierInfo())
1165       return Type;
1166     switch (CurrentToken->Tok.getIdentifierInfo()->getPPKeywordID()) {
1167     case tok::pp_include:
1168     case tok::pp_include_next:
1169     case tok::pp_import:
1170       next();
1171       parseIncludeDirective();
1172       Type = LT_ImportStatement;
1173       break;
1174     case tok::pp_error:
1175     case tok::pp_warning:
1176       parseWarningOrError();
1177       break;
1178     case tok::pp_pragma:
1179       parsePragma();
1180       break;
1181     case tok::pp_if:
1182     case tok::pp_elif:
1183       Contexts.back().IsExpression = true;
1184       next();
1185       parseLine();
1186       break;
1187     default:
1188       break;
1189     }
1190     while (CurrentToken) {
1191       FormatToken *Tok = CurrentToken;
1192       next();
1193       if (Tok->is(tok::l_paren))
1194         parseParens();
1195       else if (Tok->isOneOf(Keywords.kw___has_include,
1196                             Keywords.kw___has_include_next))
1197         parseHasInclude();
1198     }
1199     return Type;
1200   }
1201 
1202 public:
1203   LineType parseLine() {
1204     if (!CurrentToken)
1205       return LT_Invalid;
1206     NonTemplateLess.clear();
1207     if (CurrentToken->is(tok::hash))
1208       return parsePreprocessorDirective();
1209 
1210     // Directly allow to 'import <string-literal>' to support protocol buffer
1211     // definitions (github.com/google/protobuf) or missing "#" (either way we
1212     // should not break the line).
1213     IdentifierInfo *Info = CurrentToken->Tok.getIdentifierInfo();
1214     if ((Style.Language == FormatStyle::LK_Java &&
1215          CurrentToken->is(Keywords.kw_package)) ||
1216         (Info && Info->getPPKeywordID() == tok::pp_import &&
1217          CurrentToken->Next &&
1218          CurrentToken->Next->isOneOf(tok::string_literal, tok::identifier,
1219                                      tok::kw_static))) {
1220       next();
1221       parseIncludeDirective();
1222       return LT_ImportStatement;
1223     }
1224 
1225     // If this line starts and ends in '<' and '>', respectively, it is likely
1226     // part of "#define <a/b.h>".
1227     if (CurrentToken->is(tok::less) && Line.Last->is(tok::greater)) {
1228       parseIncludeDirective();
1229       return LT_ImportStatement;
1230     }
1231 
1232     // In .proto files, top-level options and package statements are very
1233     // similar to import statements and should not be line-wrapped.
1234     if (Style.Language == FormatStyle::LK_Proto && Line.Level == 0 &&
1235         CurrentToken->isOneOf(Keywords.kw_option, Keywords.kw_package)) {
1236       next();
1237       if (CurrentToken && CurrentToken->is(tok::identifier)) {
1238         while (CurrentToken)
1239           next();
1240         return LT_ImportStatement;
1241       }
1242     }
1243 
1244     bool KeywordVirtualFound = false;
1245     bool ImportStatement = false;
1246 
1247     // import {...} from '...';
1248     if (Style.Language == FormatStyle::LK_JavaScript &&
1249         CurrentToken->is(Keywords.kw_import))
1250       ImportStatement = true;
1251 
1252     while (CurrentToken) {
1253       if (CurrentToken->is(tok::kw_virtual))
1254         KeywordVirtualFound = true;
1255       if (Style.Language == FormatStyle::LK_JavaScript) {
1256         // export {...} from '...';
1257         // An export followed by "from 'some string';" is a re-export from
1258         // another module identified by a URI and is treated as a
1259         // LT_ImportStatement (i.e. prevent wraps on it for long URIs).
1260         // Just "export {...};" or "export class ..." should not be treated as
1261         // an import in this sense.
1262         if (Line.First->is(tok::kw_export) &&
1263             CurrentToken->is(Keywords.kw_from) && CurrentToken->Next &&
1264             CurrentToken->Next->isStringLiteral())
1265           ImportStatement = true;
1266         if (isClosureImportStatement(*CurrentToken))
1267           ImportStatement = true;
1268       }
1269       if (!consumeToken())
1270         return LT_Invalid;
1271     }
1272     if (KeywordVirtualFound)
1273       return LT_VirtualFunctionDecl;
1274     if (ImportStatement)
1275       return LT_ImportStatement;
1276 
1277     if (Line.startsWith(TT_ObjCMethodSpecifier)) {
1278       if (Contexts.back().FirstObjCSelectorName)
1279         Contexts.back().FirstObjCSelectorName->LongestObjCSelectorName =
1280             Contexts.back().LongestObjCSelectorName;
1281       return LT_ObjCMethodDecl;
1282     }
1283 
1284     return LT_Other;
1285   }
1286 
1287 private:
1288   bool isClosureImportStatement(const FormatToken &Tok) {
1289     // FIXME: Closure-library specific stuff should not be hard-coded but be
1290     // configurable.
1291     return Tok.TokenText == "goog" && Tok.Next && Tok.Next->is(tok::period) &&
1292            Tok.Next->Next &&
1293            (Tok.Next->Next->TokenText == "module" ||
1294             Tok.Next->Next->TokenText == "provide" ||
1295             Tok.Next->Next->TokenText == "require" ||
1296             Tok.Next->Next->TokenText == "requireType" ||
1297             Tok.Next->Next->TokenText == "forwardDeclare") &&
1298            Tok.Next->Next->Next && Tok.Next->Next->Next->is(tok::l_paren);
1299   }
1300 
1301   void resetTokenMetadata(FormatToken *Token) {
1302     if (!Token)
1303       return;
1304 
1305     // Reset token type in case we have already looked at it and then
1306     // recovered from an error (e.g. failure to find the matching >).
1307     if (!CurrentToken->isOneOf(
1308             TT_LambdaLSquare, TT_LambdaLBrace, TT_ForEachMacro,
1309             TT_TypenameMacro, TT_FunctionLBrace, TT_ImplicitStringLiteral,
1310             TT_InlineASMBrace, TT_JsFatArrow, TT_LambdaArrow, TT_NamespaceMacro,
1311             TT_OverloadedOperator, TT_RegexLiteral, TT_TemplateString,
1312             TT_ObjCStringLiteral))
1313       CurrentToken->setType(TT_Unknown);
1314     CurrentToken->Role.reset();
1315     CurrentToken->MatchingParen = nullptr;
1316     CurrentToken->FakeLParens.clear();
1317     CurrentToken->FakeRParens = 0;
1318   }
1319 
1320   void next() {
1321     if (CurrentToken) {
1322       CurrentToken->NestingLevel = Contexts.size() - 1;
1323       CurrentToken->BindingStrength = Contexts.back().BindingStrength;
1324       modifyContext(*CurrentToken);
1325       determineTokenType(*CurrentToken);
1326       CurrentToken = CurrentToken->Next;
1327     }
1328 
1329     resetTokenMetadata(CurrentToken);
1330   }
1331 
1332   /// A struct to hold information valid in a specific context, e.g.
1333   /// a pair of parenthesis.
1334   struct Context {
1335     Context(tok::TokenKind ContextKind, unsigned BindingStrength,
1336             bool IsExpression)
1337         : ContextKind(ContextKind), BindingStrength(BindingStrength),
1338           IsExpression(IsExpression) {}
1339 
1340     tok::TokenKind ContextKind;
1341     unsigned BindingStrength;
1342     bool IsExpression;
1343     unsigned LongestObjCSelectorName = 0;
1344     bool ColonIsForRangeExpr = false;
1345     bool ColonIsDictLiteral = false;
1346     bool ColonIsObjCMethodExpr = false;
1347     FormatToken *FirstObjCSelectorName = nullptr;
1348     FormatToken *FirstStartOfName = nullptr;
1349     bool CanBeExpression = true;
1350     bool InTemplateArgument = false;
1351     bool InCtorInitializer = false;
1352     bool InInheritanceList = false;
1353     bool CaretFound = false;
1354     bool IsForEachMacro = false;
1355     bool InCpp11AttributeSpecifier = false;
1356     bool InCSharpAttributeSpecifier = false;
1357   };
1358 
1359   /// Puts a new \c Context onto the stack \c Contexts for the lifetime
1360   /// of each instance.
1361   struct ScopedContextCreator {
1362     AnnotatingParser &P;
1363 
1364     ScopedContextCreator(AnnotatingParser &P, tok::TokenKind ContextKind,
1365                          unsigned Increase)
1366         : P(P) {
1367       P.Contexts.push_back(Context(ContextKind,
1368                                    P.Contexts.back().BindingStrength + Increase,
1369                                    P.Contexts.back().IsExpression));
1370     }
1371 
1372     ~ScopedContextCreator() { P.Contexts.pop_back(); }
1373   };
1374 
1375   void modifyContext(const FormatToken &Current) {
1376     if (Current.getPrecedence() == prec::Assignment &&
1377         !Line.First->isOneOf(tok::kw_template, tok::kw_using, tok::kw_return) &&
1378         // Type aliases use `type X = ...;` in TypeScript and can be exported
1379         // using `export type ...`.
1380         !(Style.Language == FormatStyle::LK_JavaScript &&
1381           (Line.startsWith(Keywords.kw_type, tok::identifier) ||
1382            Line.startsWith(tok::kw_export, Keywords.kw_type,
1383                            tok::identifier))) &&
1384         (!Current.Previous || Current.Previous->isNot(tok::kw_operator))) {
1385       Contexts.back().IsExpression = true;
1386       if (!Line.startsWith(TT_UnaryOperator)) {
1387         for (FormatToken *Previous = Current.Previous;
1388              Previous && Previous->Previous &&
1389              !Previous->Previous->isOneOf(tok::comma, tok::semi);
1390              Previous = Previous->Previous) {
1391           if (Previous->isOneOf(tok::r_square, tok::r_paren)) {
1392             Previous = Previous->MatchingParen;
1393             if (!Previous)
1394               break;
1395           }
1396           if (Previous->opensScope())
1397             break;
1398           if (Previous->isOneOf(TT_BinaryOperator, TT_UnaryOperator) &&
1399               Previous->isOneOf(tok::star, tok::amp, tok::ampamp) &&
1400               Previous->Previous && Previous->Previous->isNot(tok::equal))
1401             Previous->setType(TT_PointerOrReference);
1402         }
1403       }
1404     } else if (Current.is(tok::lessless) &&
1405                (!Current.Previous || !Current.Previous->is(tok::kw_operator))) {
1406       Contexts.back().IsExpression = true;
1407     } else if (Current.isOneOf(tok::kw_return, tok::kw_throw)) {
1408       Contexts.back().IsExpression = true;
1409     } else if (Current.is(TT_TrailingReturnArrow)) {
1410       Contexts.back().IsExpression = false;
1411     } else if (Current.is(TT_LambdaArrow) || Current.is(Keywords.kw_assert)) {
1412       Contexts.back().IsExpression = Style.Language == FormatStyle::LK_Java;
1413     } else if (Current.Previous &&
1414                Current.Previous->is(TT_CtorInitializerColon)) {
1415       Contexts.back().IsExpression = true;
1416       Contexts.back().InCtorInitializer = true;
1417     } else if (Current.Previous && Current.Previous->is(TT_InheritanceColon)) {
1418       Contexts.back().InInheritanceList = true;
1419     } else if (Current.isOneOf(tok::r_paren, tok::greater, tok::comma)) {
1420       for (FormatToken *Previous = Current.Previous;
1421            Previous && Previous->isOneOf(tok::star, tok::amp);
1422            Previous = Previous->Previous)
1423         Previous->setType(TT_PointerOrReference);
1424       if (Line.MustBeDeclaration && !Contexts.front().InCtorInitializer)
1425         Contexts.back().IsExpression = false;
1426     } else if (Current.is(tok::kw_new)) {
1427       Contexts.back().CanBeExpression = false;
1428     } else if (Current.is(tok::semi) ||
1429                (Current.is(tok::exclaim) && Current.Previous &&
1430                 !Current.Previous->is(tok::kw_operator))) {
1431       // This should be the condition or increment in a for-loop.
1432       // But not operator !() (can't use TT_OverloadedOperator here as its not
1433       // been annotated yet).
1434       Contexts.back().IsExpression = true;
1435     }
1436   }
1437 
1438   static FormatToken *untilMatchingParen(FormatToken *Current) {
1439     // Used when `MatchingParen` is not yet established.
1440     int ParenLevel = 0;
1441     while (Current) {
1442       if (Current->is(tok::l_paren))
1443         ParenLevel++;
1444       if (Current->is(tok::r_paren))
1445         ParenLevel--;
1446       if (ParenLevel < 1)
1447         break;
1448       Current = Current->Next;
1449     }
1450     return Current;
1451   }
1452 
1453   static bool isDeductionGuide(FormatToken &Current) {
1454     // Look for a deduction guide template<T> A(...) -> A<...>;
1455     if (Current.Previous && Current.Previous->is(tok::r_paren) &&
1456         Current.startsSequence(tok::arrow, tok::identifier, tok::less)) {
1457       // Find the TemplateCloser.
1458       FormatToken *TemplateCloser = Current.Next->Next;
1459       int NestingLevel = 0;
1460       while (TemplateCloser) {
1461         // Skip over an expressions in parens  A<(3 < 2)>;
1462         if (TemplateCloser->is(tok::l_paren)) {
1463           // No Matching Paren yet so skip to matching paren
1464           TemplateCloser = untilMatchingParen(TemplateCloser);
1465         }
1466         if (TemplateCloser->is(tok::less))
1467           NestingLevel++;
1468         if (TemplateCloser->is(tok::greater))
1469           NestingLevel--;
1470         if (NestingLevel < 1)
1471           break;
1472         TemplateCloser = TemplateCloser->Next;
1473       }
1474       // Assuming we have found the end of the template ensure its followed
1475       // with a semi-colon.
1476       if (TemplateCloser && TemplateCloser->Next &&
1477           TemplateCloser->Next->is(tok::semi) &&
1478           Current.Previous->MatchingParen) {
1479         // Determine if the identifier `A` prior to the A<..>; is the same as
1480         // prior to the A(..)
1481         FormatToken *LeadingIdentifier =
1482             Current.Previous->MatchingParen->Previous;
1483 
1484         // Differentiate a deduction guide by seeing the
1485         // > of the template prior to the leading identifier.
1486         if (LeadingIdentifier) {
1487           FormatToken *PriorLeadingIdentifier = LeadingIdentifier->Previous;
1488           // Skip back past explicit decoration
1489           if (PriorLeadingIdentifier &&
1490               PriorLeadingIdentifier->is(tok::kw_explicit))
1491             PriorLeadingIdentifier = PriorLeadingIdentifier->Previous;
1492 
1493           return (PriorLeadingIdentifier &&
1494                   PriorLeadingIdentifier->is(TT_TemplateCloser) &&
1495                   LeadingIdentifier->TokenText == Current.Next->TokenText);
1496         }
1497       }
1498     }
1499     return false;
1500   }
1501 
1502   void determineTokenType(FormatToken &Current) {
1503     if (!Current.is(TT_Unknown))
1504       // The token type is already known.
1505       return;
1506 
1507     if (Style.isCSharp() && CurrentToken->is(tok::question)) {
1508       if (CurrentToken->TokenText == "??") {
1509         Current.setType(TT_CSharpNullCoalescing);
1510         return;
1511       }
1512       if (CurrentToken->TokenText == "?.") {
1513         Current.setType(TT_CSharpNullConditional);
1514         return;
1515       }
1516       if (CurrentToken->TokenText == "?[") {
1517         Current.setType(TT_CSharpNullConditionalLSquare);
1518         return;
1519       }
1520     }
1521 
1522     if (Style.Language == FormatStyle::LK_JavaScript) {
1523       if (Current.is(tok::exclaim)) {
1524         if (Current.Previous &&
1525             (Keywords.IsJavaScriptIdentifier(
1526                  *Current.Previous, /* AcceptIdentifierName= */ true) ||
1527              Current.Previous->isOneOf(
1528                  tok::kw_namespace, tok::r_paren, tok::r_square, tok::r_brace,
1529                  Keywords.kw_type, Keywords.kw_get, Keywords.kw_set) ||
1530              Current.Previous->Tok.isLiteral())) {
1531           Current.setType(TT_JsNonNullAssertion);
1532           return;
1533         }
1534         if (Current.Next &&
1535             Current.Next->isOneOf(TT_BinaryOperator, Keywords.kw_as)) {
1536           Current.setType(TT_JsNonNullAssertion);
1537           return;
1538         }
1539       }
1540     }
1541 
1542     // Line.MightBeFunctionDecl can only be true after the parentheses of a
1543     // function declaration have been found. In this case, 'Current' is a
1544     // trailing token of this declaration and thus cannot be a name.
1545     if (Current.is(Keywords.kw_instanceof)) {
1546       Current.setType(TT_BinaryOperator);
1547     } else if (isStartOfName(Current) &&
1548                (!Line.MightBeFunctionDecl || Current.NestingLevel != 0)) {
1549       Contexts.back().FirstStartOfName = &Current;
1550       Current.setType(TT_StartOfName);
1551     } else if (Current.is(tok::semi)) {
1552       // Reset FirstStartOfName after finding a semicolon so that a for loop
1553       // with multiple increment statements is not confused with a for loop
1554       // having multiple variable declarations.
1555       Contexts.back().FirstStartOfName = nullptr;
1556     } else if (Current.isOneOf(tok::kw_auto, tok::kw___auto_type)) {
1557       AutoFound = true;
1558     } else if (Current.is(tok::arrow) &&
1559                Style.Language == FormatStyle::LK_Java) {
1560       Current.setType(TT_LambdaArrow);
1561     } else if (Current.is(tok::arrow) && AutoFound && Line.MustBeDeclaration &&
1562                Current.NestingLevel == 0 &&
1563                !Current.Previous->is(tok::kw_operator)) {
1564       // not auto operator->() -> xxx;
1565       Current.setType(TT_TrailingReturnArrow);
1566 
1567     } else if (isDeductionGuide(Current)) {
1568       // Deduction guides trailing arrow " A(...) -> A<T>;".
1569       Current.setType(TT_TrailingReturnArrow);
1570     } else if (Current.isOneOf(tok::star, tok::amp, tok::ampamp)) {
1571       Current.setType(determineStarAmpUsage(
1572           Current,
1573           Contexts.back().CanBeExpression && Contexts.back().IsExpression,
1574           Contexts.back().InTemplateArgument));
1575     } else if (Current.isOneOf(tok::minus, tok::plus, tok::caret)) {
1576       Current.setType(determinePlusMinusCaretUsage(Current));
1577       if (Current.is(TT_UnaryOperator) && Current.is(tok::caret))
1578         Contexts.back().CaretFound = true;
1579     } else if (Current.isOneOf(tok::minusminus, tok::plusplus)) {
1580       Current.setType(determineIncrementUsage(Current));
1581     } else if (Current.isOneOf(tok::exclaim, tok::tilde)) {
1582       Current.setType(TT_UnaryOperator);
1583     } else if (Current.is(tok::question)) {
1584       if (Style.Language == FormatStyle::LK_JavaScript &&
1585           Line.MustBeDeclaration && !Contexts.back().IsExpression) {
1586         // In JavaScript, `interface X { foo?(): bar; }` is an optional method
1587         // on the interface, not a ternary expression.
1588         Current.setType(TT_JsTypeOptionalQuestion);
1589       } else {
1590         Current.setType(TT_ConditionalExpr);
1591       }
1592     } else if (Current.isBinaryOperator() &&
1593                (!Current.Previous || Current.Previous->isNot(tok::l_square)) &&
1594                (!Current.is(tok::greater) &&
1595                 Style.Language != FormatStyle::LK_TextProto)) {
1596       Current.setType(TT_BinaryOperator);
1597     } else if (Current.is(tok::comment)) {
1598       if (Current.TokenText.startswith("/*")) {
1599         if (Current.TokenText.endswith("*/"))
1600           Current.setType(TT_BlockComment);
1601         else
1602           // The lexer has for some reason determined a comment here. But we
1603           // cannot really handle it, if it isn't properly terminated.
1604           Current.Tok.setKind(tok::unknown);
1605       } else {
1606         Current.setType(TT_LineComment);
1607       }
1608     } else if (Current.is(tok::r_paren)) {
1609       if (rParenEndsCast(Current))
1610         Current.setType(TT_CastRParen);
1611       if (Current.MatchingParen && Current.Next &&
1612           !Current.Next->isBinaryOperator() &&
1613           !Current.Next->isOneOf(tok::semi, tok::colon, tok::l_brace,
1614                                  tok::comma, tok::period, tok::arrow,
1615                                  tok::coloncolon))
1616         if (FormatToken *AfterParen = Current.MatchingParen->Next) {
1617           // Make sure this isn't the return type of an Obj-C block declaration
1618           if (AfterParen->Tok.isNot(tok::caret)) {
1619             if (FormatToken *BeforeParen = Current.MatchingParen->Previous)
1620               if (BeforeParen->is(tok::identifier) &&
1621                   !BeforeParen->is(TT_TypenameMacro) &&
1622                   BeforeParen->TokenText == BeforeParen->TokenText.upper() &&
1623                   (!BeforeParen->Previous ||
1624                    BeforeParen->Previous->ClosesTemplateDeclaration))
1625                 Current.setType(TT_FunctionAnnotationRParen);
1626           }
1627         }
1628     } else if (Current.is(tok::at) && Current.Next &&
1629                Style.Language != FormatStyle::LK_JavaScript &&
1630                Style.Language != FormatStyle::LK_Java) {
1631       // In Java & JavaScript, "@..." is a decorator or annotation. In ObjC, it
1632       // marks declarations and properties that need special formatting.
1633       switch (Current.Next->Tok.getObjCKeywordID()) {
1634       case tok::objc_interface:
1635       case tok::objc_implementation:
1636       case tok::objc_protocol:
1637         Current.setType(TT_ObjCDecl);
1638         break;
1639       case tok::objc_property:
1640         Current.setType(TT_ObjCProperty);
1641         break;
1642       default:
1643         break;
1644       }
1645     } else if (Current.is(tok::period)) {
1646       FormatToken *PreviousNoComment = Current.getPreviousNonComment();
1647       if (PreviousNoComment &&
1648           PreviousNoComment->isOneOf(tok::comma, tok::l_brace))
1649         Current.setType(TT_DesignatedInitializerPeriod);
1650       else if (Style.Language == FormatStyle::LK_Java && Current.Previous &&
1651                Current.Previous->isOneOf(TT_JavaAnnotation,
1652                                          TT_LeadingJavaAnnotation)) {
1653         Current.setType(Current.Previous->getType());
1654       }
1655     } else if (canBeObjCSelectorComponent(Current) &&
1656                // FIXME(bug 36976): ObjC return types shouldn't use
1657                // TT_CastRParen.
1658                Current.Previous && Current.Previous->is(TT_CastRParen) &&
1659                Current.Previous->MatchingParen &&
1660                Current.Previous->MatchingParen->Previous &&
1661                Current.Previous->MatchingParen->Previous->is(
1662                    TT_ObjCMethodSpecifier)) {
1663       // This is the first part of an Objective-C selector name. (If there's no
1664       // colon after this, this is the only place which annotates the identifier
1665       // as a selector.)
1666       Current.setType(TT_SelectorName);
1667     } else if (Current.isOneOf(tok::identifier, tok::kw_const,
1668                                tok::kw_noexcept) &&
1669                Current.Previous &&
1670                !Current.Previous->isOneOf(tok::equal, tok::at) &&
1671                Line.MightBeFunctionDecl && Contexts.size() == 1) {
1672       // Line.MightBeFunctionDecl can only be true after the parentheses of a
1673       // function declaration have been found.
1674       Current.setType(TT_TrailingAnnotation);
1675     } else if ((Style.Language == FormatStyle::LK_Java ||
1676                 Style.Language == FormatStyle::LK_JavaScript) &&
1677                Current.Previous) {
1678       if (Current.Previous->is(tok::at) &&
1679           Current.isNot(Keywords.kw_interface)) {
1680         const FormatToken &AtToken = *Current.Previous;
1681         const FormatToken *Previous = AtToken.getPreviousNonComment();
1682         if (!Previous || Previous->is(TT_LeadingJavaAnnotation))
1683           Current.setType(TT_LeadingJavaAnnotation);
1684         else
1685           Current.setType(TT_JavaAnnotation);
1686       } else if (Current.Previous->is(tok::period) &&
1687                  Current.Previous->isOneOf(TT_JavaAnnotation,
1688                                            TT_LeadingJavaAnnotation)) {
1689         Current.setType(Current.Previous->getType());
1690       }
1691     }
1692   }
1693 
1694   /// Take a guess at whether \p Tok starts a name of a function or
1695   /// variable declaration.
1696   ///
1697   /// This is a heuristic based on whether \p Tok is an identifier following
1698   /// something that is likely a type.
1699   bool isStartOfName(const FormatToken &Tok) {
1700     if (Tok.isNot(tok::identifier) || !Tok.Previous)
1701       return false;
1702 
1703     if (Tok.Previous->isOneOf(TT_LeadingJavaAnnotation, Keywords.kw_instanceof,
1704                               Keywords.kw_as))
1705       return false;
1706     if (Style.Language == FormatStyle::LK_JavaScript &&
1707         Tok.Previous->is(Keywords.kw_in))
1708       return false;
1709 
1710     // Skip "const" as it does not have an influence on whether this is a name.
1711     FormatToken *PreviousNotConst = Tok.getPreviousNonComment();
1712     while (PreviousNotConst && PreviousNotConst->is(tok::kw_const))
1713       PreviousNotConst = PreviousNotConst->getPreviousNonComment();
1714 
1715     if (!PreviousNotConst)
1716       return false;
1717 
1718     bool IsPPKeyword = PreviousNotConst->is(tok::identifier) &&
1719                        PreviousNotConst->Previous &&
1720                        PreviousNotConst->Previous->is(tok::hash);
1721 
1722     if (PreviousNotConst->is(TT_TemplateCloser))
1723       return PreviousNotConst && PreviousNotConst->MatchingParen &&
1724              PreviousNotConst->MatchingParen->Previous &&
1725              PreviousNotConst->MatchingParen->Previous->isNot(tok::period) &&
1726              PreviousNotConst->MatchingParen->Previous->isNot(tok::kw_template);
1727 
1728     if (PreviousNotConst->is(tok::r_paren) && PreviousNotConst->MatchingParen &&
1729         PreviousNotConst->MatchingParen->Previous &&
1730         PreviousNotConst->MatchingParen->Previous->is(tok::kw_decltype))
1731       return true;
1732 
1733     return (!IsPPKeyword &&
1734             PreviousNotConst->isOneOf(tok::identifier, tok::kw_auto)) ||
1735            PreviousNotConst->is(TT_PointerOrReference) ||
1736            PreviousNotConst->isSimpleTypeSpecifier();
1737   }
1738 
1739   /// Determine whether ')' is ending a cast.
1740   bool rParenEndsCast(const FormatToken &Tok) {
1741     // C-style casts are only used in C++, C# and Java.
1742     if (!Style.isCSharp() && !Style.isCpp() &&
1743         Style.Language != FormatStyle::LK_Java)
1744       return false;
1745 
1746     // Empty parens aren't casts and there are no casts at the end of the line.
1747     if (Tok.Previous == Tok.MatchingParen || !Tok.Next || !Tok.MatchingParen)
1748       return false;
1749 
1750     FormatToken *LeftOfParens = Tok.MatchingParen->getPreviousNonComment();
1751     if (LeftOfParens) {
1752       // If there is a closing parenthesis left of the current parentheses,
1753       // look past it as these might be chained casts.
1754       if (LeftOfParens->is(tok::r_paren)) {
1755         if (!LeftOfParens->MatchingParen ||
1756             !LeftOfParens->MatchingParen->Previous)
1757           return false;
1758         LeftOfParens = LeftOfParens->MatchingParen->Previous;
1759       }
1760 
1761       // If there is an identifier (or with a few exceptions a keyword) right
1762       // before the parentheses, this is unlikely to be a cast.
1763       if (LeftOfParens->Tok.getIdentifierInfo() &&
1764           !LeftOfParens->isOneOf(Keywords.kw_in, tok::kw_return, tok::kw_case,
1765                                  tok::kw_delete))
1766         return false;
1767 
1768       // Certain other tokens right before the parentheses are also signals that
1769       // this cannot be a cast.
1770       if (LeftOfParens->isOneOf(tok::at, tok::r_square, TT_OverloadedOperator,
1771                                 TT_TemplateCloser, tok::ellipsis))
1772         return false;
1773     }
1774 
1775     if (Tok.Next->is(tok::question))
1776       return false;
1777 
1778     // `foreach((A a, B b) in someList)` should not be seen as a cast.
1779     if (Tok.Next->is(Keywords.kw_in) && Style.isCSharp())
1780       return false;
1781 
1782     // Functions which end with decorations like volatile, noexcept are unlikely
1783     // to be casts.
1784     if (Tok.Next->isOneOf(tok::kw_noexcept, tok::kw_volatile, tok::kw_const,
1785                           tok::kw_throw, tok::arrow, Keywords.kw_override,
1786                           Keywords.kw_final) ||
1787         isCpp11AttributeSpecifier(*Tok.Next))
1788       return false;
1789 
1790     // As Java has no function types, a "(" after the ")" likely means that this
1791     // is a cast.
1792     if (Style.Language == FormatStyle::LK_Java && Tok.Next->is(tok::l_paren))
1793       return true;
1794 
1795     // If a (non-string) literal follows, this is likely a cast.
1796     if (Tok.Next->isNot(tok::string_literal) &&
1797         (Tok.Next->Tok.isLiteral() ||
1798          Tok.Next->isOneOf(tok::kw_sizeof, tok::kw_alignof)))
1799       return true;
1800 
1801     // Heuristically try to determine whether the parentheses contain a type.
1802     bool ParensAreType =
1803         !Tok.Previous ||
1804         Tok.Previous->isOneOf(TT_PointerOrReference, TT_TemplateCloser) ||
1805         Tok.Previous->isSimpleTypeSpecifier();
1806     bool ParensCouldEndDecl =
1807         Tok.Next->isOneOf(tok::equal, tok::semi, tok::l_brace, tok::greater);
1808     if (ParensAreType && !ParensCouldEndDecl)
1809       return true;
1810 
1811     // At this point, we heuristically assume that there are no casts at the
1812     // start of the line. We assume that we have found most cases where there
1813     // are by the logic above, e.g. "(void)x;".
1814     if (!LeftOfParens)
1815       return false;
1816 
1817     // Certain token types inside the parentheses mean that this can't be a
1818     // cast.
1819     for (const FormatToken *Token = Tok.MatchingParen->Next; Token != &Tok;
1820          Token = Token->Next)
1821       if (Token->is(TT_BinaryOperator))
1822         return false;
1823 
1824     // If the following token is an identifier or 'this', this is a cast. All
1825     // cases where this can be something else are handled above.
1826     if (Tok.Next->isOneOf(tok::identifier, tok::kw_this))
1827       return true;
1828 
1829     if (!Tok.Next->Next)
1830       return false;
1831 
1832     // If the next token after the parenthesis is a unary operator, assume
1833     // that this is cast, unless there are unexpected tokens inside the
1834     // parenthesis.
1835     bool NextIsUnary =
1836         Tok.Next->isUnaryOperator() || Tok.Next->isOneOf(tok::amp, tok::star);
1837     if (!NextIsUnary || Tok.Next->is(tok::plus) ||
1838         !Tok.Next->Next->isOneOf(tok::identifier, tok::numeric_constant))
1839       return false;
1840     // Search for unexpected tokens.
1841     for (FormatToken *Prev = Tok.Previous; Prev != Tok.MatchingParen;
1842          Prev = Prev->Previous) {
1843       if (!Prev->isOneOf(tok::kw_const, tok::identifier, tok::coloncolon))
1844         return false;
1845     }
1846     return true;
1847   }
1848 
1849   /// Return the type of the given token assuming it is * or &.
1850   TokenType determineStarAmpUsage(const FormatToken &Tok, bool IsExpression,
1851                                   bool InTemplateArgument) {
1852     if (Style.Language == FormatStyle::LK_JavaScript)
1853       return TT_BinaryOperator;
1854 
1855     // && in C# must be a binary operator.
1856     if (Style.isCSharp() && Tok.is(tok::ampamp))
1857       return TT_BinaryOperator;
1858 
1859     const FormatToken *PrevToken = Tok.getPreviousNonComment();
1860     if (!PrevToken)
1861       return TT_UnaryOperator;
1862 
1863     const FormatToken *NextToken = Tok.getNextNonComment();
1864     if (!NextToken ||
1865         NextToken->isOneOf(tok::arrow, tok::equal, tok::kw_const,
1866                            tok::kw_noexcept) ||
1867         (NextToken->is(tok::l_brace) && !NextToken->getNextNonComment()))
1868       return TT_PointerOrReference;
1869 
1870     if (PrevToken->is(tok::coloncolon))
1871       return TT_PointerOrReference;
1872 
1873     if (PrevToken->isOneOf(tok::l_paren, tok::l_square, tok::l_brace,
1874                            tok::comma, tok::semi, tok::kw_return, tok::colon,
1875                            tok::equal, tok::kw_delete, tok::kw_sizeof,
1876                            tok::kw_throw) ||
1877         PrevToken->isOneOf(TT_BinaryOperator, TT_ConditionalExpr,
1878                            TT_UnaryOperator, TT_CastRParen))
1879       return TT_UnaryOperator;
1880 
1881     if (NextToken->is(tok::l_square) && NextToken->isNot(TT_LambdaLSquare))
1882       return TT_PointerOrReference;
1883     if (NextToken->is(tok::kw_operator) && !IsExpression)
1884       return TT_PointerOrReference;
1885     if (NextToken->isOneOf(tok::comma, tok::semi))
1886       return TT_PointerOrReference;
1887 
1888     if (PrevToken->is(tok::r_paren) && PrevToken->MatchingParen) {
1889       FormatToken *TokenBeforeMatchingParen =
1890           PrevToken->MatchingParen->getPreviousNonComment();
1891       if (TokenBeforeMatchingParen &&
1892           TokenBeforeMatchingParen->isOneOf(tok::kw_typeof, tok::kw_decltype,
1893                                             TT_TypenameMacro))
1894         return TT_PointerOrReference;
1895     }
1896 
1897     if (PrevToken->Tok.isLiteral() ||
1898         PrevToken->isOneOf(tok::r_paren, tok::r_square, tok::kw_true,
1899                            tok::kw_false, tok::r_brace) ||
1900         NextToken->Tok.isLiteral() ||
1901         NextToken->isOneOf(tok::kw_true, tok::kw_false) ||
1902         NextToken->isUnaryOperator() ||
1903         // If we know we're in a template argument, there are no named
1904         // declarations. Thus, having an identifier on the right-hand side
1905         // indicates a binary operator.
1906         (InTemplateArgument && NextToken->Tok.isAnyIdentifier()))
1907       return TT_BinaryOperator;
1908 
1909     // "&&(" is quite unlikely to be two successive unary "&".
1910     if (Tok.is(tok::ampamp) && NextToken->is(tok::l_paren))
1911       return TT_BinaryOperator;
1912 
1913     // This catches some cases where evaluation order is used as control flow:
1914     //   aaa && aaa->f();
1915     if (NextToken->Tok.isAnyIdentifier()) {
1916       const FormatToken *NextNextToken = NextToken->getNextNonComment();
1917       if (NextNextToken && NextNextToken->is(tok::arrow))
1918         return TT_BinaryOperator;
1919     }
1920 
1921     // It is very unlikely that we are going to find a pointer or reference type
1922     // definition on the RHS of an assignment.
1923     if (IsExpression && !Contexts.back().CaretFound)
1924       return TT_BinaryOperator;
1925 
1926     return TT_PointerOrReference;
1927   }
1928 
1929   TokenType determinePlusMinusCaretUsage(const FormatToken &Tok) {
1930     const FormatToken *PrevToken = Tok.getPreviousNonComment();
1931     if (!PrevToken)
1932       return TT_UnaryOperator;
1933 
1934     if (PrevToken->isOneOf(TT_CastRParen, TT_UnaryOperator))
1935       // This must be a sequence of leading unary operators.
1936       return TT_UnaryOperator;
1937 
1938     // Use heuristics to recognize unary operators.
1939     if (PrevToken->isOneOf(tok::equal, tok::l_paren, tok::comma, tok::l_square,
1940                            tok::question, tok::colon, tok::kw_return,
1941                            tok::kw_case, tok::at, tok::l_brace, tok::kw_throw,
1942                            tok::kw_co_return, tok::kw_co_yield))
1943       return TT_UnaryOperator;
1944 
1945     // There can't be two consecutive binary operators.
1946     if (PrevToken->is(TT_BinaryOperator))
1947       return TT_UnaryOperator;
1948 
1949     // Fall back to marking the token as binary operator.
1950     return TT_BinaryOperator;
1951   }
1952 
1953   /// Determine whether ++/-- are pre- or post-increments/-decrements.
1954   TokenType determineIncrementUsage(const FormatToken &Tok) {
1955     const FormatToken *PrevToken = Tok.getPreviousNonComment();
1956     if (!PrevToken || PrevToken->is(TT_CastRParen))
1957       return TT_UnaryOperator;
1958     if (PrevToken->isOneOf(tok::r_paren, tok::r_square, tok::identifier))
1959       return TT_TrailingUnaryOperator;
1960 
1961     return TT_UnaryOperator;
1962   }
1963 
1964   SmallVector<Context, 8> Contexts;
1965 
1966   const FormatStyle &Style;
1967   AnnotatedLine &Line;
1968   FormatToken *CurrentToken;
1969   bool AutoFound;
1970   const AdditionalKeywords &Keywords;
1971 
1972   // Set of "<" tokens that do not open a template parameter list. If parseAngle
1973   // determines that a specific token can't be a template opener, it will make
1974   // same decision irrespective of the decisions for tokens leading up to it.
1975   // Store this information to prevent this from causing exponential runtime.
1976   llvm::SmallPtrSet<FormatToken *, 16> NonTemplateLess;
1977 };
1978 
1979 static const int PrecedenceUnaryOperator = prec::PointerToMember + 1;
1980 static const int PrecedenceArrowAndPeriod = prec::PointerToMember + 2;
1981 
1982 /// Parses binary expressions by inserting fake parenthesis based on
1983 /// operator precedence.
1984 class ExpressionParser {
1985 public:
1986   ExpressionParser(const FormatStyle &Style, const AdditionalKeywords &Keywords,
1987                    AnnotatedLine &Line)
1988       : Style(Style), Keywords(Keywords), Current(Line.First) {}
1989 
1990   /// Parse expressions with the given operator precedence.
1991   void parse(int Precedence = 0) {
1992     // Skip 'return' and ObjC selector colons as they are not part of a binary
1993     // expression.
1994     while (Current && (Current->is(tok::kw_return) ||
1995                        (Current->is(tok::colon) &&
1996                         Current->isOneOf(TT_ObjCMethodExpr, TT_DictLiteral))))
1997       next();
1998 
1999     if (!Current || Precedence > PrecedenceArrowAndPeriod)
2000       return;
2001 
2002     // Conditional expressions need to be parsed separately for proper nesting.
2003     if (Precedence == prec::Conditional) {
2004       parseConditionalExpr();
2005       return;
2006     }
2007 
2008     // Parse unary operators, which all have a higher precedence than binary
2009     // operators.
2010     if (Precedence == PrecedenceUnaryOperator) {
2011       parseUnaryOperator();
2012       return;
2013     }
2014 
2015     FormatToken *Start = Current;
2016     FormatToken *LatestOperator = nullptr;
2017     unsigned OperatorIndex = 0;
2018 
2019     while (Current) {
2020       // Consume operators with higher precedence.
2021       parse(Precedence + 1);
2022 
2023       int CurrentPrecedence = getCurrentPrecedence();
2024 
2025       if (Current && Current->is(TT_SelectorName) &&
2026           Precedence == CurrentPrecedence) {
2027         if (LatestOperator)
2028           addFakeParenthesis(Start, prec::Level(Precedence));
2029         Start = Current;
2030       }
2031 
2032       // At the end of the line or when an operator with higher precedence is
2033       // found, insert fake parenthesis and return.
2034       if (!Current ||
2035           (Current->closesScope() &&
2036            (Current->MatchingParen || Current->is(TT_TemplateString))) ||
2037           (CurrentPrecedence != -1 && CurrentPrecedence < Precedence) ||
2038           (CurrentPrecedence == prec::Conditional &&
2039            Precedence == prec::Assignment && Current->is(tok::colon))) {
2040         break;
2041       }
2042 
2043       // Consume scopes: (), [], <> and {}
2044       if (Current->opensScope()) {
2045         // In fragment of a JavaScript template string can look like '}..${' and
2046         // thus close a scope and open a new one at the same time.
2047         while (Current && (!Current->closesScope() || Current->opensScope())) {
2048           next();
2049           parse();
2050         }
2051         next();
2052       } else {
2053         // Operator found.
2054         if (CurrentPrecedence == Precedence) {
2055           if (LatestOperator)
2056             LatestOperator->NextOperator = Current;
2057           LatestOperator = Current;
2058           Current->OperatorIndex = OperatorIndex;
2059           ++OperatorIndex;
2060         }
2061         next(/*SkipPastLeadingComments=*/Precedence > 0);
2062       }
2063     }
2064 
2065     if (LatestOperator && (Current || Precedence > 0)) {
2066       // LatestOperator->LastOperator = true;
2067       if (Precedence == PrecedenceArrowAndPeriod) {
2068         // Call expressions don't have a binary operator precedence.
2069         addFakeParenthesis(Start, prec::Unknown);
2070       } else {
2071         addFakeParenthesis(Start, prec::Level(Precedence));
2072       }
2073     }
2074   }
2075 
2076 private:
2077   /// Gets the precedence (+1) of the given token for binary operators
2078   /// and other tokens that we treat like binary operators.
2079   int getCurrentPrecedence() {
2080     if (Current) {
2081       const FormatToken *NextNonComment = Current->getNextNonComment();
2082       if (Current->is(TT_ConditionalExpr))
2083         return prec::Conditional;
2084       if (NextNonComment && Current->is(TT_SelectorName) &&
2085           (NextNonComment->isOneOf(TT_DictLiteral, TT_JsTypeColon) ||
2086            ((Style.Language == FormatStyle::LK_Proto ||
2087              Style.Language == FormatStyle::LK_TextProto) &&
2088             NextNonComment->is(tok::less))))
2089         return prec::Assignment;
2090       if (Current->is(TT_JsComputedPropertyName))
2091         return prec::Assignment;
2092       if (Current->is(TT_LambdaArrow))
2093         return prec::Comma;
2094       if (Current->is(TT_JsFatArrow))
2095         return prec::Assignment;
2096       if (Current->isOneOf(tok::semi, TT_InlineASMColon, TT_SelectorName) ||
2097           (Current->is(tok::comment) && NextNonComment &&
2098            NextNonComment->is(TT_SelectorName)))
2099         return 0;
2100       if (Current->is(TT_RangeBasedForLoopColon))
2101         return prec::Comma;
2102       if ((Style.Language == FormatStyle::LK_Java ||
2103            Style.Language == FormatStyle::LK_JavaScript) &&
2104           Current->is(Keywords.kw_instanceof))
2105         return prec::Relational;
2106       if (Style.Language == FormatStyle::LK_JavaScript &&
2107           Current->isOneOf(Keywords.kw_in, Keywords.kw_as))
2108         return prec::Relational;
2109       if (Current->is(TT_BinaryOperator) || Current->is(tok::comma))
2110         return Current->getPrecedence();
2111       if (Current->isOneOf(tok::period, tok::arrow))
2112         return PrecedenceArrowAndPeriod;
2113       if ((Style.Language == FormatStyle::LK_Java ||
2114            Style.Language == FormatStyle::LK_JavaScript) &&
2115           Current->isOneOf(Keywords.kw_extends, Keywords.kw_implements,
2116                            Keywords.kw_throws))
2117         return 0;
2118     }
2119     return -1;
2120   }
2121 
2122   void addFakeParenthesis(FormatToken *Start, prec::Level Precedence) {
2123     Start->FakeLParens.push_back(Precedence);
2124     if (Precedence > prec::Unknown)
2125       Start->StartsBinaryExpression = true;
2126     if (Current) {
2127       FormatToken *Previous = Current->Previous;
2128       while (Previous->is(tok::comment) && Previous->Previous)
2129         Previous = Previous->Previous;
2130       ++Previous->FakeRParens;
2131       if (Precedence > prec::Unknown)
2132         Previous->EndsBinaryExpression = true;
2133     }
2134   }
2135 
2136   /// Parse unary operator expressions and surround them with fake
2137   /// parentheses if appropriate.
2138   void parseUnaryOperator() {
2139     llvm::SmallVector<FormatToken *, 2> Tokens;
2140     while (Current && Current->is(TT_UnaryOperator)) {
2141       Tokens.push_back(Current);
2142       next();
2143     }
2144     parse(PrecedenceArrowAndPeriod);
2145     for (FormatToken *Token : llvm::reverse(Tokens))
2146       // The actual precedence doesn't matter.
2147       addFakeParenthesis(Token, prec::Unknown);
2148   }
2149 
2150   void parseConditionalExpr() {
2151     while (Current && Current->isTrailingComment()) {
2152       next();
2153     }
2154     FormatToken *Start = Current;
2155     parse(prec::LogicalOr);
2156     if (!Current || !Current->is(tok::question))
2157       return;
2158     next();
2159     parse(prec::Assignment);
2160     if (!Current || Current->isNot(TT_ConditionalExpr))
2161       return;
2162     next();
2163     parse(prec::Assignment);
2164     addFakeParenthesis(Start, prec::Conditional);
2165   }
2166 
2167   void next(bool SkipPastLeadingComments = true) {
2168     if (Current)
2169       Current = Current->Next;
2170     while (Current &&
2171            (Current->NewlinesBefore == 0 || SkipPastLeadingComments) &&
2172            Current->isTrailingComment())
2173       Current = Current->Next;
2174   }
2175 
2176   const FormatStyle &Style;
2177   const AdditionalKeywords &Keywords;
2178   FormatToken *Current;
2179 };
2180 
2181 } // end anonymous namespace
2182 
2183 void TokenAnnotator::setCommentLineLevels(
2184     SmallVectorImpl<AnnotatedLine *> &Lines) {
2185   const AnnotatedLine *NextNonCommentLine = nullptr;
2186   for (SmallVectorImpl<AnnotatedLine *>::reverse_iterator I = Lines.rbegin(),
2187                                                           E = Lines.rend();
2188        I != E; ++I) {
2189     bool CommentLine = true;
2190     for (const FormatToken *Tok = (*I)->First; Tok; Tok = Tok->Next) {
2191       if (!Tok->is(tok::comment)) {
2192         CommentLine = false;
2193         break;
2194       }
2195     }
2196 
2197     // If the comment is currently aligned with the line immediately following
2198     // it, that's probably intentional and we should keep it.
2199     if (NextNonCommentLine && CommentLine &&
2200         NextNonCommentLine->First->NewlinesBefore <= 1 &&
2201         NextNonCommentLine->First->OriginalColumn ==
2202             (*I)->First->OriginalColumn) {
2203       // Align comments for preprocessor lines with the # in column 0 if
2204       // preprocessor lines are not indented. Otherwise, align with the next
2205       // line.
2206       (*I)->Level =
2207           (Style.IndentPPDirectives != FormatStyle::PPDIS_BeforeHash &&
2208            (NextNonCommentLine->Type == LT_PreprocessorDirective ||
2209             NextNonCommentLine->Type == LT_ImportStatement))
2210               ? 0
2211               : NextNonCommentLine->Level;
2212     } else {
2213       NextNonCommentLine = (*I)->First->isNot(tok::r_brace) ? (*I) : nullptr;
2214     }
2215 
2216     setCommentLineLevels((*I)->Children);
2217   }
2218 }
2219 
2220 static unsigned maxNestingDepth(const AnnotatedLine &Line) {
2221   unsigned Result = 0;
2222   for (const auto *Tok = Line.First; Tok != nullptr; Tok = Tok->Next)
2223     Result = std::max(Result, Tok->NestingLevel);
2224   return Result;
2225 }
2226 
2227 void TokenAnnotator::annotate(AnnotatedLine &Line) {
2228   for (SmallVectorImpl<AnnotatedLine *>::iterator I = Line.Children.begin(),
2229                                                   E = Line.Children.end();
2230        I != E; ++I) {
2231     annotate(**I);
2232   }
2233   AnnotatingParser Parser(Style, Line, Keywords);
2234   Line.Type = Parser.parseLine();
2235 
2236   // With very deep nesting, ExpressionParser uses lots of stack and the
2237   // formatting algorithm is very slow. We're not going to do a good job here
2238   // anyway - it's probably generated code being formatted by mistake.
2239   // Just skip the whole line.
2240   if (maxNestingDepth(Line) > 50)
2241     Line.Type = LT_Invalid;
2242 
2243   if (Line.Type == LT_Invalid)
2244     return;
2245 
2246   ExpressionParser ExprParser(Style, Keywords, Line);
2247   ExprParser.parse();
2248 
2249   if (Line.startsWith(TT_ObjCMethodSpecifier))
2250     Line.Type = LT_ObjCMethodDecl;
2251   else if (Line.startsWith(TT_ObjCDecl))
2252     Line.Type = LT_ObjCDecl;
2253   else if (Line.startsWith(TT_ObjCProperty))
2254     Line.Type = LT_ObjCProperty;
2255 
2256   Line.First->SpacesRequiredBefore = 1;
2257   Line.First->CanBreakBefore = Line.First->MustBreakBefore;
2258 }
2259 
2260 // This function heuristically determines whether 'Current' starts the name of a
2261 // function declaration.
2262 static bool isFunctionDeclarationName(const FormatToken &Current,
2263                                       const AnnotatedLine &Line) {
2264   auto skipOperatorName = [](const FormatToken *Next) -> const FormatToken * {
2265     for (; Next; Next = Next->Next) {
2266       if (Next->is(TT_OverloadedOperatorLParen))
2267         return Next;
2268       if (Next->is(TT_OverloadedOperator))
2269         continue;
2270       if (Next->isOneOf(tok::kw_new, tok::kw_delete)) {
2271         // For 'new[]' and 'delete[]'.
2272         if (Next->Next &&
2273             Next->Next->startsSequence(tok::l_square, tok::r_square))
2274           Next = Next->Next->Next;
2275         continue;
2276       }
2277       if (Next->startsSequence(tok::l_square, tok::r_square)) {
2278         // For operator[]().
2279         Next = Next->Next;
2280         continue;
2281       }
2282       if ((Next->isSimpleTypeSpecifier() || Next->is(tok::identifier)) &&
2283           Next->Next && Next->Next->isOneOf(tok::star, tok::amp, tok::ampamp)) {
2284         // For operator void*(), operator char*(), operator Foo*().
2285         Next = Next->Next;
2286         continue;
2287       }
2288       if (Next->is(TT_TemplateOpener) && Next->MatchingParen) {
2289         Next = Next->MatchingParen;
2290         continue;
2291       }
2292 
2293       break;
2294     }
2295     return nullptr;
2296   };
2297 
2298   // Find parentheses of parameter list.
2299   const FormatToken *Next = Current.Next;
2300   if (Current.is(tok::kw_operator)) {
2301     if (Current.Previous && Current.Previous->is(tok::coloncolon))
2302       return false;
2303     Next = skipOperatorName(Next);
2304   } else {
2305     if (!Current.is(TT_StartOfName) || Current.NestingLevel != 0)
2306       return false;
2307     for (; Next; Next = Next->Next) {
2308       if (Next->is(TT_TemplateOpener)) {
2309         Next = Next->MatchingParen;
2310       } else if (Next->is(tok::coloncolon)) {
2311         Next = Next->Next;
2312         if (!Next)
2313           return false;
2314         if (Next->is(tok::kw_operator)) {
2315           Next = skipOperatorName(Next->Next);
2316           break;
2317         }
2318         if (!Next->is(tok::identifier))
2319           return false;
2320       } else if (Next->is(tok::l_paren)) {
2321         break;
2322       } else {
2323         return false;
2324       }
2325     }
2326   }
2327 
2328   // Check whether parameter list can belong to a function declaration.
2329   if (!Next || !Next->is(tok::l_paren) || !Next->MatchingParen)
2330     return false;
2331   // If the lines ends with "{", this is likely an function definition.
2332   if (Line.Last->is(tok::l_brace))
2333     return true;
2334   if (Next->Next == Next->MatchingParen)
2335     return true; // Empty parentheses.
2336   // If there is an &/&& after the r_paren, this is likely a function.
2337   if (Next->MatchingParen->Next &&
2338       Next->MatchingParen->Next->is(TT_PointerOrReference))
2339     return true;
2340   for (const FormatToken *Tok = Next->Next; Tok && Tok != Next->MatchingParen;
2341        Tok = Tok->Next) {
2342     if (Tok->isOneOf(tok::l_paren, TT_TemplateOpener) && Tok->MatchingParen) {
2343       Tok = Tok->MatchingParen;
2344       continue;
2345     }
2346     if (Tok->is(tok::kw_const) || Tok->isSimpleTypeSpecifier() ||
2347         Tok->isOneOf(TT_PointerOrReference, TT_StartOfName, tok::ellipsis))
2348       return true;
2349     if (Tok->isOneOf(tok::l_brace, tok::string_literal, TT_ObjCMethodExpr) ||
2350         Tok->Tok.isLiteral())
2351       return false;
2352   }
2353   return false;
2354 }
2355 
2356 bool TokenAnnotator::mustBreakForReturnType(const AnnotatedLine &Line) const {
2357   assert(Line.MightBeFunctionDecl);
2358 
2359   if ((Style.AlwaysBreakAfterReturnType == FormatStyle::RTBS_TopLevel ||
2360        Style.AlwaysBreakAfterReturnType ==
2361            FormatStyle::RTBS_TopLevelDefinitions) &&
2362       Line.Level > 0)
2363     return false;
2364 
2365   switch (Style.AlwaysBreakAfterReturnType) {
2366   case FormatStyle::RTBS_None:
2367     return false;
2368   case FormatStyle::RTBS_All:
2369   case FormatStyle::RTBS_TopLevel:
2370     return true;
2371   case FormatStyle::RTBS_AllDefinitions:
2372   case FormatStyle::RTBS_TopLevelDefinitions:
2373     return Line.mightBeFunctionDefinition();
2374   }
2375 
2376   return false;
2377 }
2378 
2379 void TokenAnnotator::calculateFormattingInformation(AnnotatedLine &Line) {
2380   for (SmallVectorImpl<AnnotatedLine *>::iterator I = Line.Children.begin(),
2381                                                   E = Line.Children.end();
2382        I != E; ++I) {
2383     calculateFormattingInformation(**I);
2384   }
2385 
2386   Line.First->TotalLength =
2387       Line.First->IsMultiline ? Style.ColumnLimit
2388                               : Line.FirstStartColumn + Line.First->ColumnWidth;
2389   FormatToken *Current = Line.First->Next;
2390   bool InFunctionDecl = Line.MightBeFunctionDecl;
2391   while (Current) {
2392     if (isFunctionDeclarationName(*Current, Line))
2393       Current->setType(TT_FunctionDeclarationName);
2394     if (Current->is(TT_LineComment)) {
2395       if (Current->Previous->BlockKind == BK_BracedInit &&
2396           Current->Previous->opensScope())
2397         Current->SpacesRequiredBefore =
2398             (Style.Cpp11BracedListStyle && !Style.SpacesInParentheses) ? 0 : 1;
2399       else
2400         Current->SpacesRequiredBefore = Style.SpacesBeforeTrailingComments;
2401 
2402       // If we find a trailing comment, iterate backwards to determine whether
2403       // it seems to relate to a specific parameter. If so, break before that
2404       // parameter to avoid changing the comment's meaning. E.g. don't move 'b'
2405       // to the previous line in:
2406       //   SomeFunction(a,
2407       //                b, // comment
2408       //                c);
2409       if (!Current->HasUnescapedNewline) {
2410         for (FormatToken *Parameter = Current->Previous; Parameter;
2411              Parameter = Parameter->Previous) {
2412           if (Parameter->isOneOf(tok::comment, tok::r_brace))
2413             break;
2414           if (Parameter->Previous && Parameter->Previous->is(tok::comma)) {
2415             if (!Parameter->Previous->is(TT_CtorInitializerComma) &&
2416                 Parameter->HasUnescapedNewline)
2417               Parameter->MustBreakBefore = true;
2418             break;
2419           }
2420         }
2421       }
2422     } else if (Current->SpacesRequiredBefore == 0 &&
2423                spaceRequiredBefore(Line, *Current)) {
2424       Current->SpacesRequiredBefore = 1;
2425     }
2426 
2427     Current->MustBreakBefore =
2428         Current->MustBreakBefore || mustBreakBefore(Line, *Current);
2429 
2430     if (!Current->MustBreakBefore && InFunctionDecl &&
2431         Current->is(TT_FunctionDeclarationName))
2432       Current->MustBreakBefore = mustBreakForReturnType(Line);
2433 
2434     Current->CanBreakBefore =
2435         Current->MustBreakBefore || canBreakBefore(Line, *Current);
2436     unsigned ChildSize = 0;
2437     if (Current->Previous->Children.size() == 1) {
2438       FormatToken &LastOfChild = *Current->Previous->Children[0]->Last;
2439       ChildSize = LastOfChild.isTrailingComment() ? Style.ColumnLimit
2440                                                   : LastOfChild.TotalLength + 1;
2441     }
2442     const FormatToken *Prev = Current->Previous;
2443     if (Current->MustBreakBefore || Prev->Children.size() > 1 ||
2444         (Prev->Children.size() == 1 &&
2445          Prev->Children[0]->First->MustBreakBefore) ||
2446         Current->IsMultiline)
2447       Current->TotalLength = Prev->TotalLength + Style.ColumnLimit;
2448     else
2449       Current->TotalLength = Prev->TotalLength + Current->ColumnWidth +
2450                              ChildSize + Current->SpacesRequiredBefore;
2451 
2452     if (Current->is(TT_CtorInitializerColon))
2453       InFunctionDecl = false;
2454 
2455     // FIXME: Only calculate this if CanBreakBefore is true once static
2456     // initializers etc. are sorted out.
2457     // FIXME: Move magic numbers to a better place.
2458 
2459     // Reduce penalty for aligning ObjC method arguments using the colon
2460     // alignment as this is the canonical way (still prefer fitting everything
2461     // into one line if possible). Trying to fit a whole expression into one
2462     // line should not force other line breaks (e.g. when ObjC method
2463     // expression is a part of other expression).
2464     Current->SplitPenalty = splitPenalty(Line, *Current, InFunctionDecl);
2465     if (Style.Language == FormatStyle::LK_ObjC &&
2466         Current->is(TT_SelectorName) && Current->ParameterIndex > 0) {
2467       if (Current->ParameterIndex == 1)
2468         Current->SplitPenalty += 5 * Current->BindingStrength;
2469     } else {
2470       Current->SplitPenalty += 20 * Current->BindingStrength;
2471     }
2472 
2473     Current = Current->Next;
2474   }
2475 
2476   calculateUnbreakableTailLengths(Line);
2477   unsigned IndentLevel = Line.Level;
2478   for (Current = Line.First; Current != nullptr; Current = Current->Next) {
2479     if (Current->Role)
2480       Current->Role->precomputeFormattingInfos(Current);
2481     if (Current->MatchingParen &&
2482         Current->MatchingParen->opensBlockOrBlockTypeList(Style)) {
2483       assert(IndentLevel > 0);
2484       --IndentLevel;
2485     }
2486     Current->IndentLevel = IndentLevel;
2487     if (Current->opensBlockOrBlockTypeList(Style))
2488       ++IndentLevel;
2489   }
2490 
2491   LLVM_DEBUG({ printDebugInfo(Line); });
2492 }
2493 
2494 void TokenAnnotator::calculateUnbreakableTailLengths(AnnotatedLine &Line) {
2495   unsigned UnbreakableTailLength = 0;
2496   FormatToken *Current = Line.Last;
2497   while (Current) {
2498     Current->UnbreakableTailLength = UnbreakableTailLength;
2499     if (Current->CanBreakBefore ||
2500         Current->isOneOf(tok::comment, tok::string_literal)) {
2501       UnbreakableTailLength = 0;
2502     } else {
2503       UnbreakableTailLength +=
2504           Current->ColumnWidth + Current->SpacesRequiredBefore;
2505     }
2506     Current = Current->Previous;
2507   }
2508 }
2509 
2510 unsigned TokenAnnotator::splitPenalty(const AnnotatedLine &Line,
2511                                       const FormatToken &Tok,
2512                                       bool InFunctionDecl) {
2513   const FormatToken &Left = *Tok.Previous;
2514   const FormatToken &Right = Tok;
2515 
2516   if (Left.is(tok::semi))
2517     return 0;
2518 
2519   if (Style.Language == FormatStyle::LK_Java) {
2520     if (Right.isOneOf(Keywords.kw_extends, Keywords.kw_throws))
2521       return 1;
2522     if (Right.is(Keywords.kw_implements))
2523       return 2;
2524     if (Left.is(tok::comma) && Left.NestingLevel == 0)
2525       return 3;
2526   } else if (Style.Language == FormatStyle::LK_JavaScript) {
2527     if (Right.is(Keywords.kw_function) && Left.isNot(tok::comma))
2528       return 100;
2529     if (Left.is(TT_JsTypeColon))
2530       return 35;
2531     if ((Left.is(TT_TemplateString) && Left.TokenText.endswith("${")) ||
2532         (Right.is(TT_TemplateString) && Right.TokenText.startswith("}")))
2533       return 100;
2534     // Prefer breaking call chains (".foo") over empty "{}", "[]" or "()".
2535     if (Left.opensScope() && Right.closesScope())
2536       return 200;
2537   }
2538 
2539   if (Right.is(tok::identifier) && Right.Next && Right.Next->is(TT_DictLiteral))
2540     return 1;
2541   if (Right.is(tok::l_square)) {
2542     if (Style.Language == FormatStyle::LK_Proto)
2543       return 1;
2544     if (Left.is(tok::r_square))
2545       return 200;
2546     // Slightly prefer formatting local lambda definitions like functions.
2547     if (Right.is(TT_LambdaLSquare) && Left.is(tok::equal))
2548       return 35;
2549     if (!Right.isOneOf(TT_ObjCMethodExpr, TT_LambdaLSquare,
2550                        TT_ArrayInitializerLSquare,
2551                        TT_DesignatedInitializerLSquare, TT_AttributeSquare))
2552       return 500;
2553   }
2554 
2555   if (Left.is(tok::coloncolon) ||
2556       (Right.is(tok::period) && Style.Language == FormatStyle::LK_Proto))
2557     return 500;
2558   if (Right.isOneOf(TT_StartOfName, TT_FunctionDeclarationName) ||
2559       Right.is(tok::kw_operator)) {
2560     if (Line.startsWith(tok::kw_for) && Right.PartOfMultiVariableDeclStmt)
2561       return 3;
2562     if (Left.is(TT_StartOfName))
2563       return 110;
2564     if (InFunctionDecl && Right.NestingLevel == 0)
2565       return Style.PenaltyReturnTypeOnItsOwnLine;
2566     return 200;
2567   }
2568   if (Right.is(TT_PointerOrReference))
2569     return 190;
2570   if (Right.is(TT_LambdaArrow))
2571     return 110;
2572   if (Left.is(tok::equal) && Right.is(tok::l_brace))
2573     return 160;
2574   if (Left.is(TT_CastRParen))
2575     return 100;
2576   if (Left.isOneOf(tok::kw_class, tok::kw_struct))
2577     return 5000;
2578   if (Left.is(tok::comment))
2579     return 1000;
2580 
2581   if (Left.isOneOf(TT_RangeBasedForLoopColon, TT_InheritanceColon,
2582                    TT_CtorInitializerColon))
2583     return 2;
2584 
2585   if (Right.isMemberAccess()) {
2586     // Breaking before the "./->" of a chained call/member access is reasonably
2587     // cheap, as formatting those with one call per line is generally
2588     // desirable. In particular, it should be cheaper to break before the call
2589     // than it is to break inside a call's parameters, which could lead to weird
2590     // "hanging" indents. The exception is the very last "./->" to support this
2591     // frequent pattern:
2592     //
2593     //   aaaaaaaa.aaaaaaaa.bbbbbbb().ccccccccccccccccccccc(
2594     //       dddddddd);
2595     //
2596     // which might otherwise be blown up onto many lines. Here, clang-format
2597     // won't produce "hanging" indents anyway as there is no other trailing
2598     // call.
2599     //
2600     // Also apply higher penalty is not a call as that might lead to a wrapping
2601     // like:
2602     //
2603     //   aaaaaaa
2604     //       .aaaaaaaaa.bbbbbbbb(cccccccc);
2605     return !Right.NextOperator || !Right.NextOperator->Previous->closesScope()
2606                ? 150
2607                : 35;
2608   }
2609 
2610   if (Right.is(TT_TrailingAnnotation) &&
2611       (!Right.Next || Right.Next->isNot(tok::l_paren))) {
2612     // Moving trailing annotations to the next line is fine for ObjC method
2613     // declarations.
2614     if (Line.startsWith(TT_ObjCMethodSpecifier))
2615       return 10;
2616     // Generally, breaking before a trailing annotation is bad unless it is
2617     // function-like. It seems to be especially preferable to keep standard
2618     // annotations (i.e. "const", "final" and "override") on the same line.
2619     // Use a slightly higher penalty after ")" so that annotations like
2620     // "const override" are kept together.
2621     bool is_short_annotation = Right.TokenText.size() < 10;
2622     return (Left.is(tok::r_paren) ? 100 : 120) + (is_short_annotation ? 50 : 0);
2623   }
2624 
2625   // In for-loops, prefer breaking at ',' and ';'.
2626   if (Line.startsWith(tok::kw_for) && Left.is(tok::equal))
2627     return 4;
2628 
2629   // In Objective-C method expressions, prefer breaking before "param:" over
2630   // breaking after it.
2631   if (Right.is(TT_SelectorName))
2632     return 0;
2633   if (Left.is(tok::colon) && Left.is(TT_ObjCMethodExpr))
2634     return Line.MightBeFunctionDecl ? 50 : 500;
2635 
2636   // In Objective-C type declarations, avoid breaking after the category's
2637   // open paren (we'll prefer breaking after the protocol list's opening
2638   // angle bracket, if present).
2639   if (Line.Type == LT_ObjCDecl && Left.is(tok::l_paren) && Left.Previous &&
2640       Left.Previous->isOneOf(tok::identifier, tok::greater))
2641     return 500;
2642 
2643   if (Left.is(tok::l_paren) && InFunctionDecl &&
2644       Style.AlignAfterOpenBracket != FormatStyle::BAS_DontAlign)
2645     return 100;
2646   if (Left.is(tok::l_paren) && Left.Previous &&
2647       (Left.Previous->is(tok::kw_for) || Left.Previous->isIf()))
2648     return 1000;
2649   if (Left.is(tok::equal) && InFunctionDecl)
2650     return 110;
2651   if (Right.is(tok::r_brace))
2652     return 1;
2653   if (Left.is(TT_TemplateOpener))
2654     return 100;
2655   if (Left.opensScope()) {
2656     if (Style.AlignAfterOpenBracket == FormatStyle::BAS_DontAlign)
2657       return 0;
2658     if (Left.is(tok::l_brace) && !Style.Cpp11BracedListStyle)
2659       return 19;
2660     return Left.ParameterCount > 1 ? Style.PenaltyBreakBeforeFirstCallParameter
2661                                    : 19;
2662   }
2663   if (Left.is(TT_JavaAnnotation))
2664     return 50;
2665 
2666   if (Left.is(TT_UnaryOperator))
2667     return 60;
2668   if (Left.isOneOf(tok::plus, tok::comma) && Left.Previous &&
2669       Left.Previous->isLabelString() &&
2670       (Left.NextOperator || Left.OperatorIndex != 0))
2671     return 50;
2672   if (Right.is(tok::plus) && Left.isLabelString() &&
2673       (Right.NextOperator || Right.OperatorIndex != 0))
2674     return 25;
2675   if (Left.is(tok::comma))
2676     return 1;
2677   if (Right.is(tok::lessless) && Left.isLabelString() &&
2678       (Right.NextOperator || Right.OperatorIndex != 1))
2679     return 25;
2680   if (Right.is(tok::lessless)) {
2681     // Breaking at a << is really cheap.
2682     if (!Left.is(tok::r_paren) || Right.OperatorIndex > 0)
2683       // Slightly prefer to break before the first one in log-like statements.
2684       return 2;
2685     return 1;
2686   }
2687   if (Left.ClosesTemplateDeclaration)
2688     return Style.PenaltyBreakTemplateDeclaration;
2689   if (Left.is(TT_ConditionalExpr))
2690     return prec::Conditional;
2691   prec::Level Level = Left.getPrecedence();
2692   if (Level == prec::Unknown)
2693     Level = Right.getPrecedence();
2694   if (Level == prec::Assignment)
2695     return Style.PenaltyBreakAssignment;
2696   if (Level != prec::Unknown)
2697     return Level;
2698 
2699   return 3;
2700 }
2701 
2702 bool TokenAnnotator::spaceRequiredBeforeParens(const FormatToken &Right) const {
2703   return Style.SpaceBeforeParens == FormatStyle::SBPO_Always ||
2704          (Style.SpaceBeforeParens == FormatStyle::SBPO_NonEmptyParentheses &&
2705           Right.ParameterCount > 0);
2706 }
2707 
2708 /// Returns \c true if the token is followed by a boolean condition, \c false
2709 /// otherwise.
2710 static bool isKeywordWithCondition(const FormatToken &Tok) {
2711   return Tok.isOneOf(tok::kw_if, tok::kw_for, tok::kw_while, tok::kw_switch,
2712                      tok::kw_constexpr, tok::kw_catch);
2713 }
2714 
2715 bool TokenAnnotator::spaceRequiredBetween(const AnnotatedLine &Line,
2716                                           const FormatToken &Left,
2717                                           const FormatToken &Right) {
2718   if (Left.is(tok::kw_return) && Right.isNot(tok::semi))
2719     return true;
2720   if (Left.is(Keywords.kw_assert) && Style.Language == FormatStyle::LK_Java)
2721     return true;
2722   if (Style.ObjCSpaceAfterProperty && Line.Type == LT_ObjCProperty &&
2723       Left.Tok.getObjCKeywordID() == tok::objc_property)
2724     return true;
2725   if (Right.is(tok::hashhash))
2726     return Left.is(tok::hash);
2727   if (Left.isOneOf(tok::hashhash, tok::hash))
2728     return Right.is(tok::hash);
2729   if ((Left.is(tok::l_paren) && Right.is(tok::r_paren)) ||
2730       (Left.is(tok::l_brace) && Left.BlockKind != BK_Block &&
2731        Right.is(tok::r_brace) && Right.BlockKind != BK_Block))
2732     return Style.SpaceInEmptyParentheses;
2733   if (Style.SpacesInConditionalStatement) {
2734     if (Left.is(tok::l_paren) && Left.Previous &&
2735         isKeywordWithCondition(*Left.Previous))
2736       return true;
2737     if (Right.is(tok::r_paren) && Right.MatchingParen &&
2738         Right.MatchingParen->Previous &&
2739         isKeywordWithCondition(*Right.MatchingParen->Previous))
2740       return true;
2741   }
2742   if (Left.is(tok::l_paren) || Right.is(tok::r_paren))
2743     return (Right.is(TT_CastRParen) ||
2744             (Left.MatchingParen && Left.MatchingParen->is(TT_CastRParen)))
2745                ? Style.SpacesInCStyleCastParentheses
2746                : Style.SpacesInParentheses;
2747   if (Right.isOneOf(tok::semi, tok::comma))
2748     return false;
2749   if (Right.is(tok::less) && Line.Type == LT_ObjCDecl) {
2750     bool IsLightweightGeneric = Right.MatchingParen &&
2751                                 Right.MatchingParen->Next &&
2752                                 Right.MatchingParen->Next->is(tok::colon);
2753     return !IsLightweightGeneric && Style.ObjCSpaceBeforeProtocolList;
2754   }
2755   if (Right.is(tok::less) && Left.is(tok::kw_template))
2756     return Style.SpaceAfterTemplateKeyword;
2757   if (Left.isOneOf(tok::exclaim, tok::tilde))
2758     return false;
2759   if (Left.is(tok::at) &&
2760       Right.isOneOf(tok::identifier, tok::string_literal, tok::char_constant,
2761                     tok::numeric_constant, tok::l_paren, tok::l_brace,
2762                     tok::kw_true, tok::kw_false))
2763     return false;
2764   if (Left.is(tok::colon))
2765     return !Left.is(TT_ObjCMethodExpr);
2766   if (Left.is(tok::coloncolon))
2767     return false;
2768   if (Left.is(tok::less) || Right.isOneOf(tok::greater, tok::less)) {
2769     if (Style.Language == FormatStyle::LK_TextProto ||
2770         (Style.Language == FormatStyle::LK_Proto &&
2771          (Left.is(TT_DictLiteral) || Right.is(TT_DictLiteral)))) {
2772       // Format empty list as `<>`.
2773       if (Left.is(tok::less) && Right.is(tok::greater))
2774         return false;
2775       return !Style.Cpp11BracedListStyle;
2776     }
2777     return false;
2778   }
2779   if (Right.is(tok::ellipsis))
2780     return Left.Tok.isLiteral() || (Left.is(tok::identifier) && Left.Previous &&
2781                                     Left.Previous->is(tok::kw_case));
2782   if (Left.is(tok::l_square) && Right.is(tok::amp))
2783     return Style.SpacesInSquareBrackets;
2784   if (Right.is(TT_PointerOrReference)) {
2785     if (Left.is(tok::r_paren) && Line.MightBeFunctionDecl) {
2786       if (!Left.MatchingParen)
2787         return true;
2788       FormatToken *TokenBeforeMatchingParen =
2789           Left.MatchingParen->getPreviousNonComment();
2790       if (!TokenBeforeMatchingParen ||
2791           !TokenBeforeMatchingParen->isOneOf(tok::kw_typeof, tok::kw_decltype,
2792                                              TT_TypenameMacro))
2793         return true;
2794     }
2795     return (Left.Tok.isLiteral() ||
2796             (!Left.isOneOf(TT_PointerOrReference, tok::l_paren) &&
2797              (Style.PointerAlignment != FormatStyle::PAS_Left ||
2798               (Line.IsMultiVariableDeclStmt &&
2799                (Left.NestingLevel == 0 ||
2800                 (Left.NestingLevel == 1 && Line.First->is(tok::kw_for)))))));
2801   }
2802   if (Right.is(TT_FunctionTypeLParen) && Left.isNot(tok::l_paren) &&
2803       (!Left.is(TT_PointerOrReference) ||
2804        (Style.PointerAlignment != FormatStyle::PAS_Right &&
2805         !Line.IsMultiVariableDeclStmt)))
2806     return true;
2807   if (Left.is(TT_PointerOrReference))
2808     return Right.Tok.isLiteral() || Right.is(TT_BlockComment) ||
2809            (Right.isOneOf(Keywords.kw_override, Keywords.kw_final) &&
2810             !Right.is(TT_StartOfName)) ||
2811            (Right.is(tok::l_brace) && Right.BlockKind == BK_Block) ||
2812            (!Right.isOneOf(TT_PointerOrReference, TT_ArraySubscriptLSquare,
2813                            tok::l_paren) &&
2814             (Style.PointerAlignment != FormatStyle::PAS_Right &&
2815              !Line.IsMultiVariableDeclStmt) &&
2816             Left.Previous &&
2817             !Left.Previous->isOneOf(tok::l_paren, tok::coloncolon,
2818                                     tok::l_square));
2819   if (Right.is(tok::star) && Left.is(tok::l_paren))
2820     return false;
2821   if (Left.is(tok::star) && Right.isOneOf(tok::star, tok::amp, tok::ampamp))
2822     return false;
2823   if (Right.isOneOf(tok::star, tok::amp, tok::ampamp)) {
2824     const FormatToken *Previous = &Left;
2825     while (Previous && !Previous->is(tok::kw_operator)) {
2826       if (Previous->is(tok::identifier) || Previous->isSimpleTypeSpecifier()) {
2827         Previous = Previous->getPreviousNonComment();
2828         continue;
2829       }
2830       if (Previous->is(TT_TemplateCloser) && Previous->MatchingParen) {
2831         Previous = Previous->MatchingParen->getPreviousNonComment();
2832         continue;
2833       }
2834       if (Previous->is(tok::coloncolon)) {
2835         Previous = Previous->getPreviousNonComment();
2836         continue;
2837       }
2838       break;
2839     }
2840     // Space between the type and the * in:
2841     //   operator void*()
2842     //   operator char*()
2843     //   operator /*comment*/ const char*()
2844     //   operator volatile /*comment*/ char*()
2845     //   operator Foo*()
2846     //   operator C<T>*()
2847     //   operator std::Foo*()
2848     //   operator C<T>::D<U>*()
2849     // dependent on PointerAlignment style.
2850     if (Previous &&
2851         (Previous->endsSequence(tok::kw_operator) ||
2852          Previous->endsSequence(tok::kw_const, tok::kw_operator) ||
2853          Previous->endsSequence(tok::kw_volatile, tok::kw_operator)))
2854       return (Style.PointerAlignment != FormatStyle::PAS_Left);
2855   }
2856   const auto SpaceRequiredForArrayInitializerLSquare =
2857       [](const FormatToken &LSquareTok, const FormatStyle &Style) {
2858         return Style.SpacesInContainerLiterals ||
2859                ((Style.Language == FormatStyle::LK_Proto ||
2860                  Style.Language == FormatStyle::LK_TextProto) &&
2861                 !Style.Cpp11BracedListStyle &&
2862                 LSquareTok.endsSequence(tok::l_square, tok::colon,
2863                                         TT_SelectorName));
2864       };
2865   if (Left.is(tok::l_square))
2866     return (Left.is(TT_ArrayInitializerLSquare) && Right.isNot(tok::r_square) &&
2867             SpaceRequiredForArrayInitializerLSquare(Left, Style)) ||
2868            (Left.isOneOf(TT_ArraySubscriptLSquare, TT_StructuredBindingLSquare,
2869                          TT_LambdaLSquare) &&
2870             Style.SpacesInSquareBrackets && Right.isNot(tok::r_square));
2871   if (Right.is(tok::r_square))
2872     return Right.MatchingParen &&
2873            ((Right.MatchingParen->is(TT_ArrayInitializerLSquare) &&
2874              SpaceRequiredForArrayInitializerLSquare(*Right.MatchingParen,
2875                                                      Style)) ||
2876             (Style.SpacesInSquareBrackets &&
2877              Right.MatchingParen->isOneOf(TT_ArraySubscriptLSquare,
2878                                           TT_StructuredBindingLSquare,
2879                                           TT_LambdaLSquare)) ||
2880             Right.MatchingParen->is(TT_AttributeParen));
2881   if (Right.is(tok::l_square) &&
2882       !Right.isOneOf(TT_ObjCMethodExpr, TT_LambdaLSquare,
2883                      TT_DesignatedInitializerLSquare,
2884                      TT_StructuredBindingLSquare, TT_AttributeSquare) &&
2885       !Left.isOneOf(tok::numeric_constant, TT_DictLiteral) &&
2886       !(!Left.is(tok::r_square) && Style.SpaceBeforeSquareBrackets &&
2887         Right.is(TT_ArraySubscriptLSquare)))
2888     return false;
2889   if (Left.is(tok::l_brace) && Right.is(tok::r_brace))
2890     return !Left.Children.empty(); // No spaces in "{}".
2891   if ((Left.is(tok::l_brace) && Left.BlockKind != BK_Block) ||
2892       (Right.is(tok::r_brace) && Right.MatchingParen &&
2893        Right.MatchingParen->BlockKind != BK_Block))
2894     return Style.Cpp11BracedListStyle ? Style.SpacesInParentheses : true;
2895   if (Left.is(TT_BlockComment))
2896     // No whitespace in x(/*foo=*/1), except for JavaScript.
2897     return Style.Language == FormatStyle::LK_JavaScript ||
2898            !Left.TokenText.endswith("=*/");
2899 
2900   // Space between template and attribute.
2901   // e.g. template <typename T> [[nodiscard]] ...
2902   if (Left.is(TT_TemplateCloser) && Right.is(TT_AttributeSquare))
2903     return true;
2904   if (Right.is(tok::l_paren)) {
2905     if ((Left.is(tok::r_paren) && Left.is(TT_AttributeParen)) ||
2906         (Left.is(tok::r_square) && Left.is(TT_AttributeSquare)))
2907       return true;
2908     if (Style.SpaceBeforeParens ==
2909             FormatStyle::SBPO_ControlStatementsExceptForEachMacros &&
2910         Left.is(TT_ForEachMacro))
2911       return false;
2912     return Line.Type == LT_ObjCDecl || Left.is(tok::semi) ||
2913            (Style.SpaceBeforeParens != FormatStyle::SBPO_Never &&
2914             (Left.isOneOf(tok::pp_elif, tok::kw_for, tok::kw_while,
2915                           tok::kw_switch, tok::kw_case, TT_ForEachMacro,
2916                           TT_ObjCForIn) ||
2917              Left.isIf(Line.Type != LT_PreprocessorDirective) ||
2918              (Left.isOneOf(tok::kw_try, Keywords.kw___except, tok::kw_catch,
2919                            tok::kw_new, tok::kw_delete) &&
2920               (!Left.Previous || Left.Previous->isNot(tok::period))))) ||
2921            (spaceRequiredBeforeParens(Right) &&
2922             (Left.is(tok::identifier) || Left.isFunctionLikeKeyword() ||
2923              Left.is(tok::r_paren) || Left.isSimpleTypeSpecifier() ||
2924              (Left.is(tok::r_square) && Left.MatchingParen &&
2925               Left.MatchingParen->is(TT_LambdaLSquare))) &&
2926             Line.Type != LT_PreprocessorDirective);
2927   }
2928   if (Left.is(tok::at) && Right.Tok.getObjCKeywordID() != tok::objc_not_keyword)
2929     return false;
2930   if (Right.is(TT_UnaryOperator))
2931     return !Left.isOneOf(tok::l_paren, tok::l_square, tok::at) &&
2932            (Left.isNot(tok::colon) || Left.isNot(TT_ObjCMethodExpr));
2933   if ((Left.isOneOf(tok::identifier, tok::greater, tok::r_square,
2934                     tok::r_paren) ||
2935        Left.isSimpleTypeSpecifier()) &&
2936       Right.is(tok::l_brace) && Right.getNextNonComment() &&
2937       Right.BlockKind != BK_Block)
2938     return false;
2939   if (Left.is(tok::period) || Right.is(tok::period))
2940     return false;
2941   if (Right.is(tok::hash) && Left.is(tok::identifier) && Left.TokenText == "L")
2942     return false;
2943   if (Left.is(TT_TemplateCloser) && Left.MatchingParen &&
2944       Left.MatchingParen->Previous &&
2945       (Left.MatchingParen->Previous->is(tok::period) ||
2946        Left.MatchingParen->Previous->is(tok::coloncolon)))
2947     // Java call to generic function with explicit type:
2948     // A.<B<C<...>>>DoSomething();
2949     // A::<B<C<...>>>DoSomething();  // With a Java 8 method reference.
2950     return false;
2951   if (Left.is(TT_TemplateCloser) && Right.is(tok::l_square))
2952     return false;
2953   if (Left.is(tok::l_brace) && Left.endsSequence(TT_DictLiteral, tok::at))
2954     // Objective-C dictionary literal -> no space after opening brace.
2955     return false;
2956   if (Right.is(tok::r_brace) && Right.MatchingParen &&
2957       Right.MatchingParen->endsSequence(TT_DictLiteral, tok::at))
2958     // Objective-C dictionary literal -> no space before closing brace.
2959     return false;
2960   if (Right.getType() == TT_TrailingAnnotation &&
2961       Right.isOneOf(tok::amp, tok::ampamp) &&
2962       Left.isOneOf(tok::kw_const, tok::kw_volatile) &&
2963       (!Right.Next || Right.Next->is(tok::semi)))
2964     // Match const and volatile ref-qualifiers without any additional
2965     // qualifiers such as
2966     // void Fn() const &;
2967     return Style.PointerAlignment != FormatStyle::PAS_Left;
2968   return true;
2969 }
2970 
2971 bool TokenAnnotator::spaceRequiredBefore(const AnnotatedLine &Line,
2972                                          const FormatToken &Right) {
2973   const FormatToken &Left = *Right.Previous;
2974   if (Right.Tok.getIdentifierInfo() && Left.Tok.getIdentifierInfo())
2975     return true; // Never ever merge two identifiers.
2976   if (Style.isCpp()) {
2977     if (Left.is(tok::kw_operator))
2978       return Right.is(tok::coloncolon);
2979     if (Right.is(tok::l_brace) && Right.BlockKind == BK_BracedInit &&
2980         !Left.opensScope() && Style.SpaceBeforeCpp11BracedList)
2981       return true;
2982   } else if (Style.Language == FormatStyle::LK_Proto ||
2983              Style.Language == FormatStyle::LK_TextProto) {
2984     if (Right.is(tok::period) &&
2985         Left.isOneOf(Keywords.kw_optional, Keywords.kw_required,
2986                      Keywords.kw_repeated, Keywords.kw_extend))
2987       return true;
2988     if (Right.is(tok::l_paren) &&
2989         Left.isOneOf(Keywords.kw_returns, Keywords.kw_option))
2990       return true;
2991     if (Right.isOneOf(tok::l_brace, tok::less) && Left.is(TT_SelectorName))
2992       return true;
2993     // Slashes occur in text protocol extension syntax: [type/type] { ... }.
2994     if (Left.is(tok::slash) || Right.is(tok::slash))
2995       return false;
2996     if (Left.MatchingParen &&
2997         Left.MatchingParen->is(TT_ProtoExtensionLSquare) &&
2998         Right.isOneOf(tok::l_brace, tok::less))
2999       return !Style.Cpp11BracedListStyle;
3000     // A percent is probably part of a formatting specification, such as %lld.
3001     if (Left.is(tok::percent))
3002       return false;
3003     // Preserve the existence of a space before a percent for cases like 0x%04x
3004     // and "%d %d"
3005     if (Left.is(tok::numeric_constant) && Right.is(tok::percent))
3006       return Right.WhitespaceRange.getEnd() != Right.WhitespaceRange.getBegin();
3007   } else if (Style.isCSharp()) {
3008     // Require spaces around '{' and  before '}' unless they appear in
3009     // interpolated strings. Interpolated strings are merged into a single token
3010     // so cannot have spaces inserted by this function.
3011 
3012     // No space between 'this' and '['
3013     if (Left.is(tok::kw_this) && Right.is(tok::l_square))
3014       return false;
3015 
3016     // No space between 'new' and '('
3017     if (Left.is(tok::kw_new) && Right.is(tok::l_paren))
3018       return false;
3019 
3020     // Space before { (including space within '{ {').
3021     if (Right.is(tok::l_brace))
3022       return true;
3023 
3024     // Spaces inside braces.
3025     if (Left.is(tok::l_brace) && Right.isNot(tok::r_brace))
3026       return true;
3027 
3028     if (Left.isNot(tok::l_brace) && Right.is(tok::r_brace))
3029       return true;
3030 
3031     // Spaces around '=>'.
3032     if (Left.is(TT_JsFatArrow) || Right.is(TT_JsFatArrow))
3033       return true;
3034 
3035     // No spaces around attribute target colons
3036     if (Left.is(TT_AttributeColon) || Right.is(TT_AttributeColon))
3037       return false;
3038 
3039     // space between type and variable e.g. Dictionary<string,string> foo;
3040     if (Left.is(TT_TemplateCloser) && Right.is(TT_StartOfName))
3041       return true;
3042 
3043     // spaces inside square brackets.
3044     if (Left.is(tok::l_square) || Right.is(tok::r_square))
3045       return Style.SpacesInSquareBrackets;
3046 
3047     // No space before ? in nullable types.
3048     if (Right.is(TT_CSharpNullable))
3049       return false;
3050 
3051     // Require space after ? in nullable types except in generics and casts.
3052     if (Left.is(TT_CSharpNullable))
3053       return !Right.isOneOf(TT_TemplateCloser, tok::r_paren);
3054 
3055     // No space before or after '?.'.
3056     if (Left.is(TT_CSharpNullConditional) || Right.is(TT_CSharpNullConditional))
3057       return false;
3058 
3059     // Space before and after '??'.
3060     if (Left.is(TT_CSharpNullCoalescing) || Right.is(TT_CSharpNullCoalescing))
3061       return true;
3062 
3063     // No space before '?['.
3064     if (Right.is(TT_CSharpNullConditionalLSquare))
3065       return false;
3066 
3067     // No space between consecutive commas '[,,]'.
3068     if (Left.is(tok::comma) && Right.is(tok::comma))
3069       return false;
3070 
3071     // Possible space inside `?[ 0 ]`.
3072     if (Left.is(TT_CSharpNullConditionalLSquare))
3073       return Style.SpacesInSquareBrackets;
3074 
3075     // space after var in `var (key, value)`
3076     if (Left.is(Keywords.kw_var) && Right.is(tok::l_paren))
3077       return true;
3078 
3079     // space between keywords and paren e.g. "using ("
3080     if (Right.is(tok::l_paren))
3081       if (Left.isOneOf(tok::kw_using, Keywords.kw_async, Keywords.kw_when))
3082         return Style.SpaceBeforeParens == FormatStyle::SBPO_ControlStatements ||
3083                spaceRequiredBeforeParens(Right);
3084   } else if (Style.Language == FormatStyle::LK_JavaScript) {
3085     if (Left.is(TT_JsFatArrow))
3086       return true;
3087     // for await ( ...
3088     if (Right.is(tok::l_paren) && Left.is(Keywords.kw_await) && Left.Previous &&
3089         Left.Previous->is(tok::kw_for))
3090       return true;
3091     if (Left.is(Keywords.kw_async) && Right.is(tok::l_paren) &&
3092         Right.MatchingParen) {
3093       const FormatToken *Next = Right.MatchingParen->getNextNonComment();
3094       // An async arrow function, for example: `x = async () => foo();`,
3095       // as opposed to calling a function called async: `x = async();`
3096       if (Next && Next->is(TT_JsFatArrow))
3097         return true;
3098     }
3099     if ((Left.is(TT_TemplateString) && Left.TokenText.endswith("${")) ||
3100         (Right.is(TT_TemplateString) && Right.TokenText.startswith("}")))
3101       return false;
3102     // In tagged template literals ("html`bar baz`"), there is no space between
3103     // the tag identifier and the template string.
3104     if (Keywords.IsJavaScriptIdentifier(Left,
3105                                         /* AcceptIdentifierName= */ false) &&
3106         Right.is(TT_TemplateString))
3107       return false;
3108     if (Right.is(tok::star) &&
3109         Left.isOneOf(Keywords.kw_function, Keywords.kw_yield))
3110       return false;
3111     if (Right.isOneOf(tok::l_brace, tok::l_square) &&
3112         Left.isOneOf(Keywords.kw_function, Keywords.kw_yield,
3113                      Keywords.kw_extends, Keywords.kw_implements))
3114       return true;
3115     if (Right.is(tok::l_paren)) {
3116       // JS methods can use some keywords as names (e.g. `delete()`).
3117       if (Line.MustBeDeclaration && Left.Tok.getIdentifierInfo())
3118         return false;
3119       // Valid JS method names can include keywords, e.g. `foo.delete()` or
3120       // `bar.instanceof()`. Recognize call positions by preceding period.
3121       if (Left.Previous && Left.Previous->is(tok::period) &&
3122           Left.Tok.getIdentifierInfo())
3123         return false;
3124       // Additional unary JavaScript operators that need a space after.
3125       if (Left.isOneOf(tok::kw_throw, Keywords.kw_await, Keywords.kw_typeof,
3126                        tok::kw_void))
3127         return true;
3128     }
3129     // `foo as const;` casts into a const type.
3130     if (Left.endsSequence(tok::kw_const, Keywords.kw_as)) {
3131       return false;
3132     }
3133     if ((Left.isOneOf(Keywords.kw_let, Keywords.kw_var, Keywords.kw_in,
3134                       tok::kw_const) ||
3135          // "of" is only a keyword if it appears after another identifier
3136          // (e.g. as "const x of y" in a for loop), or after a destructuring
3137          // operation (const [x, y] of z, const {a, b} of c).
3138          (Left.is(Keywords.kw_of) && Left.Previous &&
3139           (Left.Previous->Tok.is(tok::identifier) ||
3140            Left.Previous->isOneOf(tok::r_square, tok::r_brace)))) &&
3141         (!Left.Previous || !Left.Previous->is(tok::period)))
3142       return true;
3143     if (Left.isOneOf(tok::kw_for, Keywords.kw_as) && Left.Previous &&
3144         Left.Previous->is(tok::period) && Right.is(tok::l_paren))
3145       return false;
3146     if (Left.is(Keywords.kw_as) &&
3147         Right.isOneOf(tok::l_square, tok::l_brace, tok::l_paren))
3148       return true;
3149     if (Left.is(tok::kw_default) && Left.Previous &&
3150         Left.Previous->is(tok::kw_export))
3151       return true;
3152     if (Left.is(Keywords.kw_is) && Right.is(tok::l_brace))
3153       return true;
3154     if (Right.isOneOf(TT_JsTypeColon, TT_JsTypeOptionalQuestion))
3155       return false;
3156     if (Left.is(TT_JsTypeOperator) || Right.is(TT_JsTypeOperator))
3157       return false;
3158     if ((Left.is(tok::l_brace) || Right.is(tok::r_brace)) &&
3159         Line.First->isOneOf(Keywords.kw_import, tok::kw_export))
3160       return false;
3161     if (Left.is(tok::ellipsis))
3162       return false;
3163     if (Left.is(TT_TemplateCloser) &&
3164         !Right.isOneOf(tok::equal, tok::l_brace, tok::comma, tok::l_square,
3165                        Keywords.kw_implements, Keywords.kw_extends))
3166       // Type assertions ('<type>expr') are not followed by whitespace. Other
3167       // locations that should have whitespace following are identified by the
3168       // above set of follower tokens.
3169       return false;
3170     if (Right.is(TT_JsNonNullAssertion))
3171       return false;
3172     if (Left.is(TT_JsNonNullAssertion) &&
3173         Right.isOneOf(Keywords.kw_as, Keywords.kw_in))
3174       return true; // "x! as string", "x! in y"
3175   } else if (Style.Language == FormatStyle::LK_Java) {
3176     if (Left.is(tok::r_square) && Right.is(tok::l_brace))
3177       return true;
3178     if (Left.is(Keywords.kw_synchronized) && Right.is(tok::l_paren))
3179       return Style.SpaceBeforeParens != FormatStyle::SBPO_Never;
3180     if ((Left.isOneOf(tok::kw_static, tok::kw_public, tok::kw_private,
3181                       tok::kw_protected) ||
3182          Left.isOneOf(Keywords.kw_final, Keywords.kw_abstract,
3183                       Keywords.kw_native)) &&
3184         Right.is(TT_TemplateOpener))
3185       return true;
3186   }
3187   if (Left.is(TT_ImplicitStringLiteral))
3188     return Right.WhitespaceRange.getBegin() != Right.WhitespaceRange.getEnd();
3189   if (Line.Type == LT_ObjCMethodDecl) {
3190     if (Left.is(TT_ObjCMethodSpecifier))
3191       return true;
3192     if (Left.is(tok::r_paren) && canBeObjCSelectorComponent(Right))
3193       // Don't space between ')' and <id> or ')' and 'new'. 'new' is not a
3194       // keyword in Objective-C, and '+ (instancetype)new;' is a standard class
3195       // method declaration.
3196       return false;
3197   }
3198   if (Line.Type == LT_ObjCProperty &&
3199       (Right.is(tok::equal) || Left.is(tok::equal)))
3200     return false;
3201 
3202   if (Right.isOneOf(TT_TrailingReturnArrow, TT_LambdaArrow) ||
3203       Left.isOneOf(TT_TrailingReturnArrow, TT_LambdaArrow))
3204     return true;
3205   if (Right.is(TT_OverloadedOperatorLParen))
3206     return spaceRequiredBeforeParens(Right);
3207   if (Left.is(tok::comma))
3208     return true;
3209   if (Right.is(tok::comma))
3210     return false;
3211   if (Right.is(TT_ObjCBlockLParen))
3212     return true;
3213   if (Right.is(TT_CtorInitializerColon))
3214     return Style.SpaceBeforeCtorInitializerColon;
3215   if (Right.is(TT_InheritanceColon) && !Style.SpaceBeforeInheritanceColon)
3216     return false;
3217   if (Right.is(TT_RangeBasedForLoopColon) &&
3218       !Style.SpaceBeforeRangeBasedForLoopColon)
3219     return false;
3220   if (Right.is(tok::colon)) {
3221     if (Line.First->isOneOf(tok::kw_case, tok::kw_default) ||
3222         !Right.getNextNonComment() || Right.getNextNonComment()->is(tok::semi))
3223       return false;
3224     if (Right.is(TT_ObjCMethodExpr))
3225       return false;
3226     if (Left.is(tok::question))
3227       return false;
3228     if (Right.is(TT_InlineASMColon) && Left.is(tok::coloncolon))
3229       return false;
3230     if (Right.is(TT_DictLiteral))
3231       return Style.SpacesInContainerLiterals;
3232     if (Right.is(TT_AttributeColon))
3233       return false;
3234     if (Right.is(TT_CSharpNamedArgumentColon))
3235       return false;
3236     return true;
3237   }
3238   if (Left.is(TT_UnaryOperator)) {
3239     if (!Right.is(tok::l_paren)) {
3240       // The alternative operators for ~ and ! are "compl" and "not".
3241       // If they are used instead, we do not want to combine them with
3242       // the token to the right, unless that is a left paren.
3243       if (Left.is(tok::exclaim) && Left.TokenText == "not")
3244         return true;
3245       if (Left.is(tok::tilde) && Left.TokenText == "compl")
3246         return true;
3247       // Lambda captures allow for a lone &, so "&]" needs to be properly
3248       // handled.
3249       if (Left.is(tok::amp) && Right.is(tok::r_square))
3250         return Style.SpacesInSquareBrackets;
3251     }
3252     return (Style.SpaceAfterLogicalNot && Left.is(tok::exclaim)) ||
3253            Right.is(TT_BinaryOperator);
3254   }
3255 
3256   // If the next token is a binary operator or a selector name, we have
3257   // incorrectly classified the parenthesis as a cast. FIXME: Detect correctly.
3258   if (Left.is(TT_CastRParen))
3259     return Style.SpaceAfterCStyleCast ||
3260            Right.isOneOf(TT_BinaryOperator, TT_SelectorName);
3261 
3262   if (Left.is(tok::greater) && Right.is(tok::greater)) {
3263     if (Style.Language == FormatStyle::LK_TextProto ||
3264         (Style.Language == FormatStyle::LK_Proto && Left.is(TT_DictLiteral)))
3265       return !Style.Cpp11BracedListStyle;
3266     return Right.is(TT_TemplateCloser) && Left.is(TT_TemplateCloser) &&
3267            (Style.Standard < FormatStyle::LS_Cpp11 || Style.SpacesInAngles);
3268   }
3269   if (Right.isOneOf(tok::arrow, tok::arrowstar, tok::periodstar) ||
3270       Left.isOneOf(tok::arrow, tok::period, tok::arrowstar, tok::periodstar) ||
3271       (Right.is(tok::period) && Right.isNot(TT_DesignatedInitializerPeriod)))
3272     return false;
3273   if (!Style.SpaceBeforeAssignmentOperators && Left.isNot(TT_TemplateCloser) &&
3274       Right.getPrecedence() == prec::Assignment)
3275     return false;
3276   if (Style.Language == FormatStyle::LK_Java && Right.is(tok::coloncolon) &&
3277       (Left.is(tok::identifier) || Left.is(tok::kw_this)))
3278     return false;
3279   if (Right.is(tok::coloncolon) && Left.is(tok::identifier))
3280     // Generally don't remove existing spaces between an identifier and "::".
3281     // The identifier might actually be a macro name such as ALWAYS_INLINE. If
3282     // this turns out to be too lenient, add analysis of the identifier itself.
3283     return Right.WhitespaceRange.getBegin() != Right.WhitespaceRange.getEnd();
3284   if (Right.is(tok::coloncolon) &&
3285       !Left.isOneOf(tok::l_brace, tok::comment, tok::l_paren))
3286     // Put a space between < and :: in vector< ::std::string >
3287     return (Left.is(TT_TemplateOpener) &&
3288             (Style.Standard < FormatStyle::LS_Cpp11 || Style.SpacesInAngles)) ||
3289            !(Left.isOneOf(tok::l_paren, tok::r_paren, tok::l_square,
3290                           tok::kw___super, TT_TemplateOpener,
3291                           TT_TemplateCloser)) ||
3292            (Left.is(tok::l_paren) && Style.SpacesInParentheses);
3293   if ((Left.is(TT_TemplateOpener)) != (Right.is(TT_TemplateCloser)))
3294     return Style.SpacesInAngles;
3295   // Space before TT_StructuredBindingLSquare.
3296   if (Right.is(TT_StructuredBindingLSquare))
3297     return !Left.isOneOf(tok::amp, tok::ampamp) ||
3298            Style.PointerAlignment != FormatStyle::PAS_Right;
3299   // Space before & or && following a TT_StructuredBindingLSquare.
3300   if (Right.Next && Right.Next->is(TT_StructuredBindingLSquare) &&
3301       Right.isOneOf(tok::amp, tok::ampamp))
3302     return Style.PointerAlignment != FormatStyle::PAS_Left;
3303   if ((Right.is(TT_BinaryOperator) && !Left.is(tok::l_paren)) ||
3304       (Left.isOneOf(TT_BinaryOperator, TT_ConditionalExpr) &&
3305        !Right.is(tok::r_paren)))
3306     return true;
3307   if (Left.is(TT_TemplateCloser) && Right.is(tok::l_paren) &&
3308       Right.isNot(TT_FunctionTypeLParen))
3309     return spaceRequiredBeforeParens(Right);
3310   if (Right.is(TT_TemplateOpener) && Left.is(tok::r_paren) &&
3311       Left.MatchingParen && Left.MatchingParen->is(TT_OverloadedOperatorLParen))
3312     return false;
3313   if (Right.is(tok::less) && Left.isNot(tok::l_paren) &&
3314       Line.startsWith(tok::hash))
3315     return true;
3316   if (Right.is(TT_TrailingUnaryOperator))
3317     return false;
3318   if (Left.is(TT_RegexLiteral))
3319     return false;
3320   return spaceRequiredBetween(Line, Left, Right);
3321 }
3322 
3323 // Returns 'true' if 'Tok' is a brace we'd want to break before in Allman style.
3324 static bool isAllmanBrace(const FormatToken &Tok) {
3325   return Tok.is(tok::l_brace) && Tok.BlockKind == BK_Block &&
3326          !Tok.isOneOf(TT_ObjCBlockLBrace, TT_LambdaLBrace, TT_DictLiteral);
3327 }
3328 
3329 // Returns 'true' if 'Tok' is an function argument.
3330 static bool IsFunctionArgument(const FormatToken &Tok) {
3331   return Tok.MatchingParen && Tok.MatchingParen->Next &&
3332          Tok.MatchingParen->Next->isOneOf(tok::comma, tok::r_paren);
3333 }
3334 
3335 static bool
3336 isItAnEmptyLambdaAllowed(const FormatToken &Tok,
3337                          FormatStyle::ShortLambdaStyle ShortLambdaOption) {
3338   return Tok.Children.empty() && ShortLambdaOption != FormatStyle::SLS_None;
3339 }
3340 
3341 static bool
3342 isItAInlineLambdaAllowed(const FormatToken &Tok,
3343                          FormatStyle::ShortLambdaStyle ShortLambdaOption) {
3344   return (ShortLambdaOption == FormatStyle::SLS_Inline &&
3345           IsFunctionArgument(Tok)) ||
3346          (ShortLambdaOption == FormatStyle::SLS_All);
3347 }
3348 
3349 static bool isOneChildWithoutMustBreakBefore(const FormatToken &Tok) {
3350   if (Tok.Children.size() != 1)
3351     return false;
3352   FormatToken *curElt = Tok.Children[0]->First;
3353   while (curElt) {
3354     if (curElt->MustBreakBefore)
3355       return false;
3356     curElt = curElt->Next;
3357   }
3358   return true;
3359 }
3360 static bool isAllmanLambdaBrace(const FormatToken &Tok) {
3361   return (Tok.is(tok::l_brace) && Tok.BlockKind == BK_Block &&
3362           !Tok.isOneOf(TT_ObjCBlockLBrace, TT_DictLiteral));
3363 }
3364 
3365 static bool isAllmanBraceIncludedBreakableLambda(
3366     const FormatToken &Tok, FormatStyle::ShortLambdaStyle ShortLambdaOption) {
3367   if (!isAllmanLambdaBrace(Tok))
3368     return false;
3369 
3370   if (isItAnEmptyLambdaAllowed(Tok, ShortLambdaOption))
3371     return false;
3372 
3373   return !isItAInlineLambdaAllowed(Tok, ShortLambdaOption) ||
3374          !isOneChildWithoutMustBreakBefore(Tok);
3375 }
3376 
3377 bool TokenAnnotator::mustBreakBefore(const AnnotatedLine &Line,
3378                                      const FormatToken &Right) {
3379   const FormatToken &Left = *Right.Previous;
3380   if (Right.NewlinesBefore > 1 && Style.MaxEmptyLinesToKeep > 0)
3381     return true;
3382 
3383   if (Style.isCSharp()) {
3384     if (Right.is(TT_CSharpNamedArgumentColon) ||
3385         Left.is(TT_CSharpNamedArgumentColon))
3386       return false;
3387     if (Right.is(TT_CSharpGenericTypeConstraint))
3388       return true;
3389   } else if (Style.Language == FormatStyle::LK_JavaScript) {
3390     // FIXME: This might apply to other languages and token kinds.
3391     if (Right.is(tok::string_literal) && Left.is(tok::plus) && Left.Previous &&
3392         Left.Previous->is(tok::string_literal))
3393       return true;
3394     if (Left.is(TT_DictLiteral) && Left.is(tok::l_brace) && Line.Level == 0 &&
3395         Left.Previous && Left.Previous->is(tok::equal) &&
3396         Line.First->isOneOf(tok::identifier, Keywords.kw_import, tok::kw_export,
3397                             tok::kw_const) &&
3398         // kw_var/kw_let are pseudo-tokens that are tok::identifier, so match
3399         // above.
3400         !Line.First->isOneOf(Keywords.kw_var, Keywords.kw_let))
3401       // Object literals on the top level of a file are treated as "enum-style".
3402       // Each key/value pair is put on a separate line, instead of bin-packing.
3403       return true;
3404     if (Left.is(tok::l_brace) && Line.Level == 0 &&
3405         (Line.startsWith(tok::kw_enum) ||
3406          Line.startsWith(tok::kw_const, tok::kw_enum) ||
3407          Line.startsWith(tok::kw_export, tok::kw_enum) ||
3408          Line.startsWith(tok::kw_export, tok::kw_const, tok::kw_enum)))
3409       // JavaScript top-level enum key/value pairs are put on separate lines
3410       // instead of bin-packing.
3411       return true;
3412     if (Right.is(tok::r_brace) && Left.is(tok::l_brace) && Left.Previous &&
3413         Left.Previous->is(TT_JsFatArrow)) {
3414       // JS arrow function (=> {...}).
3415       switch (Style.AllowShortLambdasOnASingleLine) {
3416       case FormatStyle::SLS_All:
3417         return false;
3418       case FormatStyle::SLS_None:
3419         return true;
3420       case FormatStyle::SLS_Empty:
3421         return !Left.Children.empty();
3422       case FormatStyle::SLS_Inline:
3423         // allow one-lining inline (e.g. in function call args) and empty arrow
3424         // functions.
3425         return (Left.NestingLevel == 0 && Line.Level == 0) &&
3426                !Left.Children.empty();
3427       }
3428       llvm_unreachable("Unknown FormatStyle::ShortLambdaStyle enum");
3429     }
3430 
3431     if (Right.is(tok::r_brace) && Left.is(tok::l_brace) &&
3432         !Left.Children.empty())
3433       // Support AllowShortFunctionsOnASingleLine for JavaScript.
3434       return Style.AllowShortFunctionsOnASingleLine == FormatStyle::SFS_None ||
3435              Style.AllowShortFunctionsOnASingleLine == FormatStyle::SFS_Empty ||
3436              (Left.NestingLevel == 0 && Line.Level == 0 &&
3437               Style.AllowShortFunctionsOnASingleLine &
3438                   FormatStyle::SFS_InlineOnly);
3439   } else if (Style.Language == FormatStyle::LK_Java) {
3440     if (Right.is(tok::plus) && Left.is(tok::string_literal) && Right.Next &&
3441         Right.Next->is(tok::string_literal))
3442       return true;
3443   } else if (Style.Language == FormatStyle::LK_Cpp ||
3444              Style.Language == FormatStyle::LK_ObjC ||
3445              Style.Language == FormatStyle::LK_Proto ||
3446              Style.Language == FormatStyle::LK_TableGen ||
3447              Style.Language == FormatStyle::LK_TextProto) {
3448     if (Left.isStringLiteral() && Right.isStringLiteral())
3449       return true;
3450   }
3451 
3452   // If the last token before a '}', ']', or ')' is a comma or a trailing
3453   // comment, the intention is to insert a line break after it in order to make
3454   // shuffling around entries easier. Import statements, especially in
3455   // JavaScript, can be an exception to this rule.
3456   if (Style.JavaScriptWrapImports || Line.Type != LT_ImportStatement) {
3457     const FormatToken *BeforeClosingBrace = nullptr;
3458     if ((Left.isOneOf(tok::l_brace, TT_ArrayInitializerLSquare) ||
3459          (Style.Language == FormatStyle::LK_JavaScript &&
3460           Left.is(tok::l_paren))) &&
3461         Left.BlockKind != BK_Block && Left.MatchingParen)
3462       BeforeClosingBrace = Left.MatchingParen->Previous;
3463     else if (Right.MatchingParen &&
3464              (Right.MatchingParen->isOneOf(tok::l_brace,
3465                                            TT_ArrayInitializerLSquare) ||
3466               (Style.Language == FormatStyle::LK_JavaScript &&
3467                Right.MatchingParen->is(tok::l_paren))))
3468       BeforeClosingBrace = &Left;
3469     if (BeforeClosingBrace && (BeforeClosingBrace->is(tok::comma) ||
3470                                BeforeClosingBrace->isTrailingComment()))
3471       return true;
3472   }
3473 
3474   if (Right.is(tok::comment))
3475     return Left.BlockKind != BK_BracedInit &&
3476            Left.isNot(TT_CtorInitializerColon) &&
3477            (Right.NewlinesBefore > 0 && Right.HasUnescapedNewline);
3478   if (Left.isTrailingComment())
3479     return true;
3480   if (Right.Previous->IsUnterminatedLiteral)
3481     return true;
3482   if (Right.is(tok::lessless) && Right.Next &&
3483       Right.Previous->is(tok::string_literal) &&
3484       Right.Next->is(tok::string_literal))
3485     return true;
3486   if (Right.Previous->ClosesTemplateDeclaration &&
3487       Right.Previous->MatchingParen &&
3488       Right.Previous->MatchingParen->NestingLevel == 0 &&
3489       Style.AlwaysBreakTemplateDeclarations == FormatStyle::BTDS_Yes)
3490     return true;
3491   if (Right.is(TT_CtorInitializerComma) &&
3492       Style.BreakConstructorInitializers == FormatStyle::BCIS_BeforeComma &&
3493       !Style.ConstructorInitializerAllOnOneLineOrOnePerLine)
3494     return true;
3495   if (Right.is(TT_CtorInitializerColon) &&
3496       Style.BreakConstructorInitializers == FormatStyle::BCIS_BeforeComma &&
3497       !Style.ConstructorInitializerAllOnOneLineOrOnePerLine)
3498     return true;
3499   // Break only if we have multiple inheritance.
3500   if (Style.BreakInheritanceList == FormatStyle::BILS_BeforeComma &&
3501       Right.is(TT_InheritanceComma))
3502     return true;
3503   if (Right.is(tok::string_literal) && Right.TokenText.startswith("R\""))
3504     // Multiline raw string literals are special wrt. line breaks. The author
3505     // has made a deliberate choice and might have aligned the contents of the
3506     // string literal accordingly. Thus, we try keep existing line breaks.
3507     return Right.IsMultiline && Right.NewlinesBefore > 0;
3508   if ((Right.Previous->is(tok::l_brace) ||
3509        (Right.Previous->is(tok::less) && Right.Previous->Previous &&
3510         Right.Previous->Previous->is(tok::equal))) &&
3511       Right.NestingLevel == 1 && Style.Language == FormatStyle::LK_Proto) {
3512     // Don't put enums or option definitions onto single lines in protocol
3513     // buffers.
3514     return true;
3515   }
3516   if (Right.is(TT_InlineASMBrace))
3517     return Right.HasUnescapedNewline;
3518 
3519   auto ShortLambdaOption = Style.AllowShortLambdasOnASingleLine;
3520   if (Style.BraceWrapping.BeforeLambdaBody &&
3521       (isAllmanBraceIncludedBreakableLambda(Left, ShortLambdaOption) ||
3522        isAllmanBraceIncludedBreakableLambda(Right, ShortLambdaOption))) {
3523     return true;
3524   }
3525 
3526   if (isAllmanBrace(Left) || isAllmanBrace(Right))
3527     return (Line.startsWith(tok::kw_enum) && Style.BraceWrapping.AfterEnum) ||
3528            (Line.startsWith(tok::kw_typedef, tok::kw_enum) &&
3529             Style.BraceWrapping.AfterEnum) ||
3530            (Line.startsWith(tok::kw_class) && Style.BraceWrapping.AfterClass) ||
3531            (Line.startsWith(tok::kw_struct) && Style.BraceWrapping.AfterStruct);
3532   if (Left.is(TT_ObjCBlockLBrace) &&
3533       Style.AllowShortBlocksOnASingleLine == FormatStyle::SBS_Never)
3534     return true;
3535 
3536   if (Left.is(TT_LambdaLBrace)) {
3537     if (IsFunctionArgument(Left) &&
3538         Style.AllowShortLambdasOnASingleLine == FormatStyle::SLS_Inline)
3539       return false;
3540 
3541     if (Style.AllowShortLambdasOnASingleLine == FormatStyle::SLS_None ||
3542         Style.AllowShortLambdasOnASingleLine == FormatStyle::SLS_Inline ||
3543         (!Left.Children.empty() &&
3544          Style.AllowShortLambdasOnASingleLine == FormatStyle::SLS_Empty))
3545       return true;
3546   }
3547 
3548   // Put multiple Java annotation on a new line.
3549   if ((Style.Language == FormatStyle::LK_Java ||
3550        Style.Language == FormatStyle::LK_JavaScript) &&
3551       Left.is(TT_LeadingJavaAnnotation) &&
3552       Right.isNot(TT_LeadingJavaAnnotation) && Right.isNot(tok::l_paren) &&
3553       (Line.Last->is(tok::l_brace) || Style.BreakAfterJavaFieldAnnotations))
3554     return true;
3555 
3556   if (Right.is(TT_ProtoExtensionLSquare))
3557     return true;
3558 
3559   // In text proto instances if a submessage contains at least 2 entries and at
3560   // least one of them is a submessage, like A { ... B { ... } ... },
3561   // put all of the entries of A on separate lines by forcing the selector of
3562   // the submessage B to be put on a newline.
3563   //
3564   // Example: these can stay on one line:
3565   // a { scalar_1: 1 scalar_2: 2 }
3566   // a { b { key: value } }
3567   //
3568   // and these entries need to be on a new line even if putting them all in one
3569   // line is under the column limit:
3570   // a {
3571   //   scalar: 1
3572   //   b { key: value }
3573   // }
3574   //
3575   // We enforce this by breaking before a submessage field that has previous
3576   // siblings, *and* breaking before a field that follows a submessage field.
3577   //
3578   // Be careful to exclude the case  [proto.ext] { ... } since the `]` is
3579   // the TT_SelectorName there, but we don't want to break inside the brackets.
3580   //
3581   // Another edge case is @submessage { key: value }, which is a common
3582   // substitution placeholder. In this case we want to keep `@` and `submessage`
3583   // together.
3584   //
3585   // We ensure elsewhere that extensions are always on their own line.
3586   if ((Style.Language == FormatStyle::LK_Proto ||
3587        Style.Language == FormatStyle::LK_TextProto) &&
3588       Right.is(TT_SelectorName) && !Right.is(tok::r_square) && Right.Next) {
3589     // Keep `@submessage` together in:
3590     // @submessage { key: value }
3591     if (Right.Previous && Right.Previous->is(tok::at))
3592       return false;
3593     // Look for the scope opener after selector in cases like:
3594     // selector { ...
3595     // selector: { ...
3596     // selector: @base { ...
3597     FormatToken *LBrace = Right.Next;
3598     if (LBrace && LBrace->is(tok::colon)) {
3599       LBrace = LBrace->Next;
3600       if (LBrace && LBrace->is(tok::at)) {
3601         LBrace = LBrace->Next;
3602         if (LBrace)
3603           LBrace = LBrace->Next;
3604       }
3605     }
3606     if (LBrace &&
3607         // The scope opener is one of {, [, <:
3608         // selector { ... }
3609         // selector [ ... ]
3610         // selector < ... >
3611         //
3612         // In case of selector { ... }, the l_brace is TT_DictLiteral.
3613         // In case of an empty selector {}, the l_brace is not TT_DictLiteral,
3614         // so we check for immediately following r_brace.
3615         ((LBrace->is(tok::l_brace) &&
3616           (LBrace->is(TT_DictLiteral) ||
3617            (LBrace->Next && LBrace->Next->is(tok::r_brace)))) ||
3618          LBrace->is(TT_ArrayInitializerLSquare) || LBrace->is(tok::less))) {
3619       // If Left.ParameterCount is 0, then this submessage entry is not the
3620       // first in its parent submessage, and we want to break before this entry.
3621       // If Left.ParameterCount is greater than 0, then its parent submessage
3622       // might contain 1 or more entries and we want to break before this entry
3623       // if it contains at least 2 entries. We deal with this case later by
3624       // detecting and breaking before the next entry in the parent submessage.
3625       if (Left.ParameterCount == 0)
3626         return true;
3627       // However, if this submessage is the first entry in its parent
3628       // submessage, Left.ParameterCount might be 1 in some cases.
3629       // We deal with this case later by detecting an entry
3630       // following a closing paren of this submessage.
3631     }
3632 
3633     // If this is an entry immediately following a submessage, it will be
3634     // preceded by a closing paren of that submessage, like in:
3635     //     left---.  .---right
3636     //            v  v
3637     // sub: { ... } key: value
3638     // If there was a comment between `}` an `key` above, then `key` would be
3639     // put on a new line anyways.
3640     if (Left.isOneOf(tok::r_brace, tok::greater, tok::r_square))
3641       return true;
3642   }
3643 
3644   // Deal with lambda arguments in C++ - we want consistent line breaks whether
3645   // they happen to be at arg0, arg1 or argN. The selection is a bit nuanced
3646   // as aggressive line breaks are placed when the lambda is not the last arg.
3647   if ((Style.Language == FormatStyle::LK_Cpp ||
3648        Style.Language == FormatStyle::LK_ObjC) &&
3649       Left.is(tok::l_paren) && Left.BlockParameterCount > 0 &&
3650       !Right.isOneOf(tok::l_paren, TT_LambdaLSquare)) {
3651     // Multiple lambdas in the same function call force line breaks.
3652     if (Left.BlockParameterCount > 1)
3653       return true;
3654 
3655     // A lambda followed by another arg forces a line break.
3656     if (!Left.Role)
3657       return false;
3658     auto Comma = Left.Role->lastComma();
3659     if (!Comma)
3660       return false;
3661     auto Next = Comma->getNextNonComment();
3662     if (!Next)
3663       return false;
3664     if (!Next->isOneOf(TT_LambdaLSquare, tok::l_brace, tok::caret))
3665       return true;
3666   }
3667 
3668   return false;
3669 }
3670 
3671 bool TokenAnnotator::canBreakBefore(const AnnotatedLine &Line,
3672                                     const FormatToken &Right) {
3673   const FormatToken &Left = *Right.Previous;
3674   // Language-specific stuff.
3675   if (Style.isCSharp()) {
3676     if (Left.isOneOf(TT_CSharpNamedArgumentColon, TT_AttributeColon) ||
3677         Right.isOneOf(TT_CSharpNamedArgumentColon, TT_AttributeColon))
3678       return false;
3679     // Only break after commas for generic type constraints.
3680     if (Line.First->is(TT_CSharpGenericTypeConstraint))
3681       return Left.is(TT_CSharpGenericTypeConstraintComma);
3682   } else if (Style.Language == FormatStyle::LK_Java) {
3683     if (Left.isOneOf(Keywords.kw_throws, Keywords.kw_extends,
3684                      Keywords.kw_implements))
3685       return false;
3686     if (Right.isOneOf(Keywords.kw_throws, Keywords.kw_extends,
3687                       Keywords.kw_implements))
3688       return true;
3689   } else if (Style.Language == FormatStyle::LK_JavaScript) {
3690     const FormatToken *NonComment = Right.getPreviousNonComment();
3691     if (NonComment &&
3692         NonComment->isOneOf(
3693             tok::kw_return, Keywords.kw_yield, tok::kw_continue, tok::kw_break,
3694             tok::kw_throw, Keywords.kw_interface, Keywords.kw_type,
3695             tok::kw_static, tok::kw_public, tok::kw_private, tok::kw_protected,
3696             Keywords.kw_readonly, Keywords.kw_abstract, Keywords.kw_get,
3697             Keywords.kw_set, Keywords.kw_async, Keywords.kw_await))
3698       return false; // Otherwise automatic semicolon insertion would trigger.
3699     if (Right.NestingLevel == 0 &&
3700         (Left.Tok.getIdentifierInfo() ||
3701          Left.isOneOf(tok::r_square, tok::r_paren)) &&
3702         Right.isOneOf(tok::l_square, tok::l_paren))
3703       return false; // Otherwise automatic semicolon insertion would trigger.
3704     if (Left.is(TT_JsFatArrow) && Right.is(tok::l_brace))
3705       return false;
3706     if (Left.is(TT_JsTypeColon))
3707       return true;
3708     // Don't wrap between ":" and "!" of a strict prop init ("field!: type;").
3709     if (Left.is(tok::exclaim) && Right.is(tok::colon))
3710       return false;
3711     // Look for is type annotations like:
3712     // function f(): a is B { ... }
3713     // Do not break before is in these cases.
3714     if (Right.is(Keywords.kw_is)) {
3715       const FormatToken *Next = Right.getNextNonComment();
3716       // If `is` is followed by a colon, it's likely that it's a dict key, so
3717       // ignore it for this check.
3718       // For example this is common in Polymer:
3719       // Polymer({
3720       //   is: 'name',
3721       //   ...
3722       // });
3723       if (!Next || !Next->is(tok::colon))
3724         return false;
3725     }
3726     if (Left.is(Keywords.kw_in))
3727       return Style.BreakBeforeBinaryOperators == FormatStyle::BOS_None;
3728     if (Right.is(Keywords.kw_in))
3729       return Style.BreakBeforeBinaryOperators != FormatStyle::BOS_None;
3730     if (Right.is(Keywords.kw_as))
3731       return false; // must not break before as in 'x as type' casts
3732     if (Right.isOneOf(Keywords.kw_extends, Keywords.kw_infer)) {
3733       // extends and infer can appear as keywords in conditional types:
3734       //   https://www.typescriptlang.org/docs/handbook/release-notes/typescript-2-8.html#conditional-types
3735       // do not break before them, as the expressions are subject to ASI.
3736       return false;
3737     }
3738     if (Left.is(Keywords.kw_as))
3739       return true;
3740     if (Left.is(TT_JsNonNullAssertion))
3741       return true;
3742     if (Left.is(Keywords.kw_declare) &&
3743         Right.isOneOf(Keywords.kw_module, tok::kw_namespace,
3744                       Keywords.kw_function, tok::kw_class, tok::kw_enum,
3745                       Keywords.kw_interface, Keywords.kw_type, Keywords.kw_var,
3746                       Keywords.kw_let, tok::kw_const))
3747       // See grammar for 'declare' statements at:
3748       // https://github.com/Microsoft/TypeScript/blob/master/doc/spec.md#A.10
3749       return false;
3750     if (Left.isOneOf(Keywords.kw_module, tok::kw_namespace) &&
3751         Right.isOneOf(tok::identifier, tok::string_literal))
3752       return false; // must not break in "module foo { ...}"
3753     if (Right.is(TT_TemplateString) && Right.closesScope())
3754       return false;
3755     // Don't split tagged template literal so there is a break between the tag
3756     // identifier and template string.
3757     if (Left.is(tok::identifier) && Right.is(TT_TemplateString)) {
3758       return false;
3759     }
3760     if (Left.is(TT_TemplateString) && Left.opensScope())
3761       return true;
3762   }
3763 
3764   if (Left.is(tok::at))
3765     return false;
3766   if (Left.Tok.getObjCKeywordID() == tok::objc_interface)
3767     return false;
3768   if (Left.isOneOf(TT_JavaAnnotation, TT_LeadingJavaAnnotation))
3769     return !Right.is(tok::l_paren);
3770   if (Right.is(TT_PointerOrReference))
3771     return Line.IsMultiVariableDeclStmt ||
3772            (Style.PointerAlignment == FormatStyle::PAS_Right &&
3773             (!Right.Next || Right.Next->isNot(TT_FunctionDeclarationName)));
3774   if (Right.isOneOf(TT_StartOfName, TT_FunctionDeclarationName) ||
3775       Right.is(tok::kw_operator))
3776     return true;
3777   if (Left.is(TT_PointerOrReference))
3778     return false;
3779   if (Right.isTrailingComment())
3780     // We rely on MustBreakBefore being set correctly here as we should not
3781     // change the "binding" behavior of a comment.
3782     // The first comment in a braced lists is always interpreted as belonging to
3783     // the first list element. Otherwise, it should be placed outside of the
3784     // list.
3785     return Left.BlockKind == BK_BracedInit ||
3786            (Left.is(TT_CtorInitializerColon) &&
3787             Style.BreakConstructorInitializers == FormatStyle::BCIS_AfterColon);
3788   if (Left.is(tok::question) && Right.is(tok::colon))
3789     return false;
3790   if (Right.is(TT_ConditionalExpr) || Right.is(tok::question))
3791     return Style.BreakBeforeTernaryOperators;
3792   if (Left.is(TT_ConditionalExpr) || Left.is(tok::question))
3793     return !Style.BreakBeforeTernaryOperators;
3794   if (Left.is(TT_InheritanceColon))
3795     return Style.BreakInheritanceList == FormatStyle::BILS_AfterColon;
3796   if (Right.is(TT_InheritanceColon))
3797     return Style.BreakInheritanceList != FormatStyle::BILS_AfterColon;
3798   if (Right.is(TT_ObjCMethodExpr) && !Right.is(tok::r_square) &&
3799       Left.isNot(TT_SelectorName))
3800     return true;
3801 
3802   if (Right.is(tok::colon) &&
3803       !Right.isOneOf(TT_CtorInitializerColon, TT_InlineASMColon))
3804     return false;
3805   if (Left.is(tok::colon) && Left.isOneOf(TT_DictLiteral, TT_ObjCMethodExpr)) {
3806     if (Style.Language == FormatStyle::LK_Proto ||
3807         Style.Language == FormatStyle::LK_TextProto) {
3808       if (!Style.AlwaysBreakBeforeMultilineStrings && Right.isStringLiteral())
3809         return false;
3810       // Prevent cases like:
3811       //
3812       // submessage:
3813       //     { key: valueeeeeeeeeeee }
3814       //
3815       // when the snippet does not fit into one line.
3816       // Prefer:
3817       //
3818       // submessage: {
3819       //   key: valueeeeeeeeeeee
3820       // }
3821       //
3822       // instead, even if it is longer by one line.
3823       //
3824       // Note that this allows allows the "{" to go over the column limit
3825       // when the column limit is just between ":" and "{", but that does
3826       // not happen too often and alternative formattings in this case are
3827       // not much better.
3828       //
3829       // The code covers the cases:
3830       //
3831       // submessage: { ... }
3832       // submessage: < ... >
3833       // repeated: [ ... ]
3834       if (((Right.is(tok::l_brace) || Right.is(tok::less)) &&
3835            Right.is(TT_DictLiteral)) ||
3836           Right.is(TT_ArrayInitializerLSquare))
3837         return false;
3838     }
3839     return true;
3840   }
3841   if (Right.is(tok::r_square) && Right.MatchingParen &&
3842       Right.MatchingParen->is(TT_ProtoExtensionLSquare))
3843     return false;
3844   if (Right.is(TT_SelectorName) || (Right.is(tok::identifier) && Right.Next &&
3845                                     Right.Next->is(TT_ObjCMethodExpr)))
3846     return Left.isNot(tok::period); // FIXME: Properly parse ObjC calls.
3847   if (Left.is(tok::r_paren) && Line.Type == LT_ObjCProperty)
3848     return true;
3849   if (Left.ClosesTemplateDeclaration || Left.is(TT_FunctionAnnotationRParen))
3850     return true;
3851   if (Right.isOneOf(TT_RangeBasedForLoopColon, TT_OverloadedOperatorLParen,
3852                     TT_OverloadedOperator))
3853     return false;
3854   if (Left.is(TT_RangeBasedForLoopColon))
3855     return true;
3856   if (Right.is(TT_RangeBasedForLoopColon))
3857     return false;
3858   if (Left.is(TT_TemplateCloser) && Right.is(TT_TemplateOpener))
3859     return true;
3860   if (Left.isOneOf(TT_TemplateCloser, TT_UnaryOperator) ||
3861       Left.is(tok::kw_operator))
3862     return false;
3863   if (Left.is(tok::equal) && !Right.isOneOf(tok::kw_default, tok::kw_delete) &&
3864       Line.Type == LT_VirtualFunctionDecl && Left.NestingLevel == 0)
3865     return false;
3866   if (Left.is(tok::equal) && Right.is(tok::l_brace) &&
3867       !Style.Cpp11BracedListStyle)
3868     return false;
3869   if (Left.is(tok::l_paren) && Left.is(TT_AttributeParen))
3870     return false;
3871   if (Left.is(tok::l_paren) && Left.Previous &&
3872       (Left.Previous->isOneOf(TT_BinaryOperator, TT_CastRParen)))
3873     return false;
3874   if (Right.is(TT_ImplicitStringLiteral))
3875     return false;
3876 
3877   if (Right.is(tok::r_paren) || Right.is(TT_TemplateCloser))
3878     return false;
3879   if (Right.is(tok::r_square) && Right.MatchingParen &&
3880       Right.MatchingParen->is(TT_LambdaLSquare))
3881     return false;
3882 
3883   // We only break before r_brace if there was a corresponding break before
3884   // the l_brace, which is tracked by BreakBeforeClosingBrace.
3885   if (Right.is(tok::r_brace))
3886     return Right.MatchingParen && Right.MatchingParen->BlockKind == BK_Block;
3887 
3888   // Allow breaking after a trailing annotation, e.g. after a method
3889   // declaration.
3890   if (Left.is(TT_TrailingAnnotation))
3891     return !Right.isOneOf(tok::l_brace, tok::semi, tok::equal, tok::l_paren,
3892                           tok::less, tok::coloncolon);
3893 
3894   if (Right.is(tok::kw___attribute) ||
3895       (Right.is(tok::l_square) && Right.is(TT_AttributeSquare)))
3896     return !Left.is(TT_AttributeSquare);
3897 
3898   if (Left.is(tok::identifier) && Right.is(tok::string_literal))
3899     return true;
3900 
3901   if (Right.is(tok::identifier) && Right.Next && Right.Next->is(TT_DictLiteral))
3902     return true;
3903 
3904   if (Left.is(TT_CtorInitializerColon))
3905     return Style.BreakConstructorInitializers == FormatStyle::BCIS_AfterColon;
3906   if (Right.is(TT_CtorInitializerColon))
3907     return Style.BreakConstructorInitializers != FormatStyle::BCIS_AfterColon;
3908   if (Left.is(TT_CtorInitializerComma) &&
3909       Style.BreakConstructorInitializers == FormatStyle::BCIS_BeforeComma)
3910     return false;
3911   if (Right.is(TT_CtorInitializerComma) &&
3912       Style.BreakConstructorInitializers == FormatStyle::BCIS_BeforeComma)
3913     return true;
3914   if (Left.is(TT_InheritanceComma) &&
3915       Style.BreakInheritanceList == FormatStyle::BILS_BeforeComma)
3916     return false;
3917   if (Right.is(TT_InheritanceComma) &&
3918       Style.BreakInheritanceList == FormatStyle::BILS_BeforeComma)
3919     return true;
3920   if ((Left.is(tok::greater) && Right.is(tok::greater)) ||
3921       (Left.is(tok::less) && Right.is(tok::less)))
3922     return false;
3923   if (Right.is(TT_BinaryOperator) &&
3924       Style.BreakBeforeBinaryOperators != FormatStyle::BOS_None &&
3925       (Style.BreakBeforeBinaryOperators == FormatStyle::BOS_All ||
3926        Right.getPrecedence() != prec::Assignment))
3927     return true;
3928   if (Left.is(TT_ArrayInitializerLSquare))
3929     return true;
3930   if (Right.is(tok::kw_typename) && Left.isNot(tok::kw_const))
3931     return true;
3932   if ((Left.isBinaryOperator() || Left.is(TT_BinaryOperator)) &&
3933       !Left.isOneOf(tok::arrowstar, tok::lessless) &&
3934       Style.BreakBeforeBinaryOperators != FormatStyle::BOS_All &&
3935       (Style.BreakBeforeBinaryOperators == FormatStyle::BOS_None ||
3936        Left.getPrecedence() == prec::Assignment))
3937     return true;
3938   if ((Left.is(TT_AttributeSquare) && Right.is(tok::l_square)) ||
3939       (Left.is(tok::r_square) && Right.is(TT_AttributeSquare)))
3940     return false;
3941 
3942   auto ShortLambdaOption = Style.AllowShortLambdasOnASingleLine;
3943   if (Style.BraceWrapping.BeforeLambdaBody) {
3944     if (isAllmanLambdaBrace(Left))
3945       return !isItAnEmptyLambdaAllowed(Left, ShortLambdaOption);
3946     if (isAllmanLambdaBrace(Right))
3947       return !isItAnEmptyLambdaAllowed(Right, ShortLambdaOption);
3948   }
3949 
3950   return Left.isOneOf(tok::comma, tok::coloncolon, tok::semi, tok::l_brace,
3951                       tok::kw_class, tok::kw_struct, tok::comment) ||
3952          Right.isMemberAccess() ||
3953          Right.isOneOf(TT_TrailingReturnArrow, TT_LambdaArrow, tok::lessless,
3954                        tok::colon, tok::l_square, tok::at) ||
3955          (Style.BraceWrapping.BeforeLambdaBody && Right.is(TT_LambdaLBrace)) ||
3956          (Left.is(tok::r_paren) &&
3957           Right.isOneOf(tok::identifier, tok::kw_const)) ||
3958          (Left.is(tok::l_paren) && !Right.is(tok::r_paren)) ||
3959          (Left.is(TT_TemplateOpener) && !Right.is(TT_TemplateCloser));
3960 }
3961 
3962 void TokenAnnotator::printDebugInfo(const AnnotatedLine &Line) {
3963   llvm::errs() << "AnnotatedTokens(L=" << Line.Level << "):\n";
3964   const FormatToken *Tok = Line.First;
3965   while (Tok) {
3966     llvm::errs() << " M=" << Tok->MustBreakBefore
3967                  << " C=" << Tok->CanBreakBefore
3968                  << " T=" << getTokenTypeName(Tok->getType())
3969                  << " S=" << Tok->SpacesRequiredBefore
3970                  << " B=" << Tok->BlockParameterCount
3971                  << " BK=" << Tok->BlockKind << " P=" << Tok->SplitPenalty
3972                  << " Name=" << Tok->Tok.getName() << " L=" << Tok->TotalLength
3973                  << " PPK=" << Tok->PackingKind << " FakeLParens=";
3974     for (unsigned i = 0, e = Tok->FakeLParens.size(); i != e; ++i)
3975       llvm::errs() << Tok->FakeLParens[i] << "/";
3976     llvm::errs() << " FakeRParens=" << Tok->FakeRParens;
3977     llvm::errs() << " II=" << Tok->Tok.getIdentifierInfo();
3978     llvm::errs() << " Text='" << Tok->TokenText << "'\n";
3979     if (!Tok->Next)
3980       assert(Tok == Line.Last);
3981     Tok = Tok->Next;
3982   }
3983   llvm::errs() << "----\n";
3984 }
3985 
3986 } // namespace format
3987 } // namespace clang
3988