1 //===--- ContinuationIndenter.cpp - Format C++ code -----------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 ///
10 /// \file
11 /// \brief This file implements the continuation indenter.
12 ///
13 //===----------------------------------------------------------------------===//
14 
15 #include "BreakableToken.h"
16 #include "ContinuationIndenter.h"
17 #include "WhitespaceManager.h"
18 #include "clang/Basic/OperatorPrecedence.h"
19 #include "clang/Basic/SourceManager.h"
20 #include "clang/Format/Format.h"
21 #include "llvm/Support/Debug.h"
22 #include <string>
23 
24 #define DEBUG_TYPE "format-formatter"
25 
26 namespace clang {
27 namespace format {
28 
29 // Returns the length of everything up to the first possible line break after
30 // the ), ], } or > matching \c Tok.
31 static unsigned getLengthToMatchingParen(const FormatToken &Tok) {
32   if (!Tok.MatchingParen)
33     return 0;
34   FormatToken *End = Tok.MatchingParen;
35   while (End->Next && !End->Next->CanBreakBefore) {
36     End = End->Next;
37   }
38   return End->TotalLength - Tok.TotalLength + 1;
39 }
40 
41 static unsigned getLengthToNextOperator(const FormatToken &Tok) {
42   if (!Tok.NextOperator)
43     return 0;
44   return Tok.NextOperator->TotalLength - Tok.TotalLength;
45 }
46 
47 // Returns \c true if \c Tok is the "." or "->" of a call and starts the next
48 // segment of a builder type call.
49 static bool startsSegmentOfBuilderTypeCall(const FormatToken &Tok) {
50   return Tok.isMemberAccess() && Tok.Previous && Tok.Previous->closesScope();
51 }
52 
53 // Returns \c true if \c Current starts a new parameter.
54 static bool startsNextParameter(const FormatToken &Current,
55                                 const FormatStyle &Style) {
56   const FormatToken &Previous = *Current.Previous;
57   if (Current.is(TT_CtorInitializerComma) &&
58       Style.BreakConstructorInitializersBeforeComma)
59     return true;
60   return Previous.is(tok::comma) && !Current.isTrailingComment() &&
61          (Previous.isNot(TT_CtorInitializerComma) ||
62           !Style.BreakConstructorInitializersBeforeComma);
63 }
64 
// Constructs a ContinuationIndenter by storing every argument in the member of
// the same name. In addition, \c CommentPragmasRegex is built from
// \c Style.CommentPragmas. The constructor body itself does no work.
ContinuationIndenter::ContinuationIndenter(const FormatStyle &Style,
                                           const AdditionalKeywords &Keywords,
                                           const SourceManager &SourceMgr,
                                           WhitespaceManager &Whitespaces,
                                           encoding::Encoding Encoding,
                                           bool BinPackInconclusiveFunctions)
    : Style(Style), Keywords(Keywords), SourceMgr(SourceMgr),
      Whitespaces(Whitespaces), Encoding(Encoding),
      BinPackInconclusiveFunctions(BinPackInconclusiveFunctions),
      CommentPragmasRegex(Style.CommentPragmas) {}
75 
76 LineState ContinuationIndenter::getInitialState(unsigned FirstIndent,
77                                                 const AnnotatedLine *Line,
78                                                 bool DryRun) {
79   LineState State;
80   State.FirstIndent = FirstIndent;
81   State.Column = FirstIndent;
82   State.Line = Line;
83   State.NextToken = Line->First;
84   State.Stack.push_back(ParenState(FirstIndent, Line->Level, FirstIndent,
85                                    /*AvoidBinPacking=*/false,
86                                    /*NoLineBreak=*/false));
87   State.LineContainsContinuedForLoopSection = false;
88   State.StartOfStringLiteral = 0;
89   State.StartOfLineLevel = 0;
90   State.LowestLevelOnLine = 0;
91   State.IgnoreStackForComparison = false;
92 
93   // The first token has already been indented and thus consumed.
94   moveStateToNextToken(State, DryRun, /*Newline=*/false);
95   return State;
96 }
97 
98 bool ContinuationIndenter::canBreak(const LineState &State) {
99   const FormatToken &Current = *State.NextToken;
100   const FormatToken &Previous = *Current.Previous;
101   assert(&Previous == Current.Previous);
102   if (!Current.CanBreakBefore &&
103       !(State.Stack.back().BreakBeforeClosingBrace &&
104         Current.closesBlockOrBlockTypeList(Style)))
105     return false;
106   // The opening "{" of a braced list has to be on the same line as the first
107   // element if it is nested in another braced init list or function call.
108   if (!Current.MustBreakBefore && Previous.is(tok::l_brace) &&
109       Previous.isNot(TT_DictLiteral) && Previous.BlockKind == BK_BracedInit &&
110       Previous.Previous &&
111       Previous.Previous->isOneOf(tok::l_brace, tok::l_paren, tok::comma))
112     return false;
113   // This prevents breaks like:
114   //   ...
115   //   SomeParameter, OtherParameter).DoSomething(
116   //   ...
117   // As they hide "DoSomething" and are generally bad for readability.
118   if (Previous.opensScope() && Previous.isNot(tok::l_brace) &&
119       State.LowestLevelOnLine < State.StartOfLineLevel &&
120       State.LowestLevelOnLine < Current.NestingLevel)
121     return false;
122   if (Current.isMemberAccess() && State.Stack.back().ContainsUnwrappedBuilder)
123     return false;
124 
125   // Don't create a 'hanging' indent if there are multiple blocks in a single
126   // statement.
127   if (Previous.is(tok::l_brace) && State.Stack.size() > 1 &&
128       State.Stack[State.Stack.size() - 2].NestedBlockInlined &&
129       State.Stack[State.Stack.size() - 2].HasMultipleNestedBlocks)
130     return false;
131 
132   // Don't break after very short return types (e.g. "void") as that is often
133   // unexpected.
134   if (Current.is(TT_FunctionDeclarationName) && State.Column < 6) {
135     if (Style.AlwaysBreakAfterReturnType == FormatStyle::RTBS_None)
136       return false;
137   }
138 
139   return !State.Stack.back().NoLineBreak;
140 }
141 
// Returns \c true if \c State.NextToken has to be placed on a new line.
//
// The rules are checked in order and the first matching one returns \c true;
// if none matches, the result is \c false. \c State.NextToken and its
// \c Previous token are dereferenced unconditionally.
bool ContinuationIndenter::mustBreak(const LineState &State) {
  const FormatToken &Current = *State.NextToken;
  const FormatToken &Previous = *Current.Previous;
  // Breaks requested by the token itself and inline asm colons are
  // unconditional.
  if (Current.MustBreakBefore || Current.is(TT_InlineASMColon))
    return true;
  // The closer of a block or block-type list starts a new line if
  // BreakBeforeClosingBrace is set on this level.
  if (State.Stack.back().BreakBeforeClosingBrace &&
      Current.closesBlockOrBlockTypeList(Style))
    return true;
  if (Previous.is(tok::semi) && State.LineContainsContinuedForLoopSection)
    return true;
  // If BreakBeforeParameter is set on this level, break at each of the
  // positions listed in the first operand (start of the next parameter, after
  // ';', between a template closer and a name in C++, and at the ternary
  // operator positions selected by BreakBeforeTernaryOperators), but never
  // before a trailing comment, ')' or '}'.
  if ((startsNextParameter(Current, Style) || Previous.is(tok::semi) ||
       (Previous.is(TT_TemplateCloser) && Current.is(TT_StartOfName) &&
        Style.Language == FormatStyle::LK_Cpp &&
        // FIXME: This is a temporary workaround for the case where clang-format
        // sets BreakBeforeParameter to avoid bin packing and this creates a
        // completely unnecessary line break after a template type that isn't
        // line-wrapped.
        (Previous.NestingLevel == 1 || Style.BinPackParameters)) ||
       (Style.BreakBeforeTernaryOperators && Current.is(TT_ConditionalExpr) &&
        Previous.isNot(tok::question)) ||
       (!Style.BreakBeforeTernaryOperators &&
        Previous.is(TT_ConditionalExpr))) &&
      State.Stack.back().BreakBeforeParameter && !Current.isTrailingComment() &&
      !Current.isOneOf(tok::r_paren, tok::r_brace))
    return true;
  // Break after the '{' of a dict literal or the '[' of an array initializer
  // with more than one parameter if, with a column limit in effect, the
  // content up to the matching closer would exceed that limit.
  if (((Previous.is(TT_DictLiteral) && Previous.is(tok::l_brace)) ||
       (Previous.is(TT_ArrayInitializerLSquare) &&
        Previous.ParameterCount > 1)) &&
      Style.ColumnLimit > 0 &&
      getLengthToMatchingParen(Previous) + State.Column - 1 >
          getColumnLimit(State))
    return true;
  // Break before a constructor initializer colon if the rest of the line would
  // exceed the column limit or BreakBeforeParameter is set, provided one of the
  // style conditions in the last operand holds.
  if (Current.is(TT_CtorInitializerColon) &&
      (State.Column + State.Line->Last->TotalLength - Current.TotalLength + 2 >
           getColumnLimit(State) ||
       State.Stack.back().BreakBeforeParameter) &&
      ((Style.AllowShortFunctionsOnASingleLine != FormatStyle::SFS_All) ||
       Style.BreakConstructorInitializersBeforeComma || Style.ColumnLimit != 0))
    return true;
  // Break before every selector name after the first one if
  // BreakBeforeParameter is set.
  if (Current.is(TT_SelectorName) && State.Stack.back().ObjCSelectorNameFound &&
      State.Stack.back().BreakBeforeParameter)
    return true;

  // Break before a member access if the text up to the next operator would
  // exceed the column limit and either the break moves the token to a smaller
  // column or the token is nested less deeply than the start of the line.
  unsigned NewLineColumn = getNewLineColumn(State);
  if (Current.isMemberAccess() && Style.ColumnLimit != 0 &&
      State.Column + getLengthToNextOperator(Current) > Style.ColumnLimit &&
      (State.Column > NewLineColumn ||
       Current.NestingLevel < State.StartOfLineLevel))
    return true;

  // None of the remaining rules applies unless a break would place the token
  // at a smaller column than continuing on the current line.
  if (State.Column <= NewLineColumn)
    return false;

  if (Style.AlwaysBreakBeforeMultilineStrings &&
      (NewLineColumn == State.FirstIndent + Style.ContinuationIndentWidth ||
       Previous.is(tok::comma) || Current.NestingLevel < 2) &&
      !Previous.isOneOf(tok::kw_return, tok::lessless, tok::at) &&
      !Previous.isOneOf(TT_InlineASMColon, TT_ConditionalExpr) &&
      nextIsMultilineString(State))
    return true;

  // Using CanBreakBefore here and below takes care of the decision whether the
  // current style uses wrapping before or after operators for the given
  // operator.
  if (Previous.is(TT_BinaryOperator) && Current.CanBreakBefore) {
    // If we need to break somewhere inside the LHS of a binary expression, we
    // should also break after the operator. Otherwise, the formatting would
    // hide the operator precedence, e.g. in:
    //   if (aaaaaaaaaaaaaa ==
    //           bbbbbbbbbbbbbb && c) {..
    // For comparisons, we only apply this rule, if the LHS is a binary
    // expression itself as otherwise, the line breaks seem superfluous.
    // We need special cases for ">>" which we have split into two ">" while
    // lexing in order to make template parsing easier.
    bool IsComparison = (Previous.getPrecedence() == prec::Relational ||
                         Previous.getPrecedence() == prec::Equality) &&
                        Previous.Previous &&
                        Previous.Previous->isNot(TT_BinaryOperator); // For >>.
    bool LHSIsBinaryExpr =
        Previous.Previous && Previous.Previous->EndsBinaryExpression;
    if ((!IsComparison || LHSIsBinaryExpr) && !Current.isTrailingComment() &&
        Previous.getPrecedence() != prec::Assignment &&
        State.Stack.back().BreakBeforeParameter)
      return true;
  } else if (Current.is(TT_BinaryOperator) && Current.CanBreakBefore &&
             State.Stack.back().BreakBeforeParameter) {
    return true;
  }

  // Same as above, but for the first "<<" operator.
  if (Current.is(tok::lessless) && Current.isNot(TT_OverloadedOperator) &&
      State.Stack.back().BreakBeforeParameter &&
      State.Stack.back().FirstLessLess == 0)
    return true;

  if (Current.NestingLevel == 0 && !Current.isTrailingComment()) {
    // Always break after "template <...>" and leading annotations. This is only
    // for cases where the entire line does not fit on a single line as a
    // different LineFormatter would be used otherwise.
    if (Previous.ClosesTemplateDeclaration)
      return true;
    if (Previous.is(TT_FunctionAnnotationRParen))
      return true;
    if (Previous.is(TT_LeadingJavaAnnotation) && Current.isNot(tok::l_paren) &&
        Current.isNot(TT_LeadingJavaAnnotation))
      return true;
  }

  // If the return type spans multiple lines, wrap before the function name.
  if ((Current.is(TT_FunctionDeclarationName) ||
       (Current.is(tok::kw_operator) && !Previous.is(tok::coloncolon))) &&
      !Previous.is(tok::kw_template) && State.Stack.back().BreakBeforeParameter)
    return true;

  // Break before the next segment of a builder type call if an earlier member
  // access on this level was already wrapped (CallContinuation is set) or
  // BreakBeforeParameter is set.
  if (startsSegmentOfBuilderTypeCall(Current) &&
      (State.Stack.back().CallContinuation != 0 ||
       State.Stack.back().BreakBeforeParameter))
    return true;

  // The following could be precomputed as they do not depend on the state.
  // However, as they should take effect only if the UnwrappedLine does not fit
  // into the ColumnLimit, they are checked here in the ContinuationIndenter.
  if (Style.ColumnLimit != 0 && Previous.BlockKind == BK_Block &&
      Previous.is(tok::l_brace) && !Current.isOneOf(tok::r_brace, tok::comment))
    return true;

  // Break before a "<<" that follows "endl", a literal ending in an escaped
  // newline followed by a double quote, or the character literal '\n'.
  if (Current.is(tok::lessless) &&
      ((Previous.is(tok::identifier) && Previous.TokenText == "endl") ||
       (Previous.Tok.isLiteral() && (Previous.TokenText.endswith("\\n\"") ||
                                     Previous.TokenText == "\'\\n\'"))))
    return true;

  return false;
}
276 
277 unsigned ContinuationIndenter::addTokenToState(LineState &State, bool Newline,
278                                                bool DryRun,
279                                                unsigned ExtraSpaces) {
280   const FormatToken &Current = *State.NextToken;
281 
282   assert(!State.Stack.empty());
283   if ((Current.is(TT_ImplicitStringLiteral) &&
284        (Current.Previous->Tok.getIdentifierInfo() == nullptr ||
285         Current.Previous->Tok.getIdentifierInfo()->getPPKeywordID() ==
286             tok::pp_not_keyword))) {
287     unsigned EndColumn =
288         SourceMgr.getSpellingColumnNumber(Current.WhitespaceRange.getEnd());
289     if (Current.LastNewlineOffset != 0) {
290       // If there is a newline within this token, the final column will solely
291       // determined by the current end column.
292       State.Column = EndColumn;
293     } else {
294       unsigned StartColumn =
295           SourceMgr.getSpellingColumnNumber(Current.WhitespaceRange.getBegin());
296       assert(EndColumn >= StartColumn);
297       State.Column += EndColumn - StartColumn;
298     }
299     moveStateToNextToken(State, DryRun, /*Newline=*/false);
300     return 0;
301   }
302 
303   unsigned Penalty = 0;
304   if (Newline)
305     Penalty = addTokenOnNewLine(State, DryRun);
306   else
307     addTokenOnCurrentLine(State, DryRun, ExtraSpaces);
308 
309   return moveStateToNextToken(State, DryRun, Newline) + Penalty;
310 }
311 
// Appends \c State.NextToken to the current line, i.e. without a line break.
//
// The token is preceded by \c SpacesRequiredBefore + \c ExtraSpaces spaces.
// The whitespace is handed to the WhitespaceManager only if \c DryRun is
// false; \c State.Column and the innermost ParenState are updated in either
// case. \c State.NextToken itself is not advanced here.
void ContinuationIndenter::addTokenOnCurrentLine(LineState &State, bool DryRun,
                                                 unsigned ExtraSpaces) {
  FormatToken &Current = *State.NextToken;
  const FormatToken &Previous = *State.NextToken->Previous;
  // On the first '=' at nesting level 0 (or at any level if the line starts
  // with 'for'), record in VariablePos the column at which the tokens bound to
  // the variable name begin.
  if (Current.is(tok::equal) &&
      (State.Line->First->is(tok::kw_for) || Current.NestingLevel == 0) &&
      State.Stack.back().VariablePos == 0) {
    State.Stack.back().VariablePos = State.Column;
    // Move over * and & if they are bound to the variable name.
    const FormatToken *Tok = &Previous;
    while (Tok && State.Stack.back().VariablePos >= Tok->ColumnWidth) {
      State.Stack.back().VariablePos -= Tok->ColumnWidth;
      if (Tok->SpacesRequiredBefore != 0)
        break;
      Tok = Tok->Previous;
    }
    if (Previous.PartOfMultiVariableDeclStmt)
      State.Stack.back().LastSpace = State.Stack.back().VariablePos;
  }

  unsigned Spaces = Current.SpacesRequiredBefore + ExtraSpaces;

  if (!DryRun)
    Whitespaces.replaceWhitespace(Current, /*Newlines=*/0, /*IndentLevel=*/0,
                                  Spaces, State.Column + Spaces);

  // For the first selector name on this level, determine the column of the
  // colons (or disable colon alignment if no longest selector name is known).
  if (Current.is(TT_SelectorName) &&
      !State.Stack.back().ObjCSelectorNameFound) {
    unsigned MinIndent =
        std::max(State.FirstIndent + Style.ContinuationIndentWidth,
                 State.Stack.back().Indent);
    unsigned FirstColonPos = State.Column + Spaces + Current.ColumnWidth;
    if (Current.LongestObjCSelectorName == 0)
      State.Stack.back().AlignColons = false;
    else if (MinIndent + Current.LongestObjCSelectorName > FirstColonPos)
      State.Stack.back().ColonPos = MinIndent + Current.LongestObjCSelectorName;
    else
      State.Stack.back().ColonPos = FirstColonPos;
  }

  // In "AlwaysBreak" mode, enforce wrapping directly after the parenthesis by
  // disallowing any further line breaks if there is no line break after the
  // opening parenthesis. Don't break if it doesn't conserve columns.
  if (Style.AlignAfterOpenBracket == FormatStyle::BAS_AlwaysBreak &&
      Previous.isOneOf(tok::l_paren, TT_TemplateOpener, tok::l_square) &&
      State.Column > getNewLineColumn(State) &&
      (!Previous.Previous ||
       !Previous.Previous->isOneOf(tok::kw_for, tok::kw_while,
                                   tok::kw_switch)) &&
      // Don't do this for simple (no expressions) one-argument function calls
      // as that feels like needlessly wasting whitespace, e.g.:
      //
      //   caaaaaaaaaaaall(
      //       caaaaaaaaaaaall(
      //           caaaaaaaaaaaall(
      //               caaaaaaaaaaaaaaaaaaaaaaall(aaaaaaaaaaaaaa, aaaaaaaaa))));
      Current.FakeLParens.size() > 0 &&
      Current.FakeLParens.back() > prec::Unknown)
    State.Stack.back().NoLineBreak = true;

  // Unless alignment after open brackets is disabled, indent this level to the
  // column of the first token after the opening bracket. Line comments only
  // count as that first token inside braced init lists.
  if (Style.AlignAfterOpenBracket != FormatStyle::BAS_DontAlign &&
      Previous.opensScope() && Previous.isNot(TT_ObjCMethodExpr) &&
      (Current.isNot(TT_LineComment) || Previous.BlockKind == BK_BracedInit))
    State.Stack.back().Indent = State.Column + Spaces;
  // If bin packing is to be avoided, a parameter that stays on the current
  // line forbids any further line break on this level.
  if (State.Stack.back().AvoidBinPacking && startsNextParameter(Current, Style))
    State.Stack.back().NoLineBreak = true;
  // Remember that a builder-type call segment was left unwrapped although a
  // break would have moved it to a smaller column.
  if (startsSegmentOfBuilderTypeCall(Current) &&
      State.Column > getNewLineColumn(State))
    State.Stack.back().ContainsUnwrappedBuilder = true;

  if (Current.is(TT_LambdaArrow) && Style.Language == FormatStyle::LK_Java)
    State.Stack.back().NoLineBreak = true;
  if (Current.isMemberAccess() && Previous.is(tok::r_paren) &&
      (Previous.MatchingParen &&
       (Previous.TotalLength - Previous.MatchingParen->TotalLength > 10))) {
    // If there is a function call with long parameters, break before trailing
    // calls. This prevents things like:
    //   EXPECT_CALL(SomeLongParameter).Times(
    //       2);
    // We don't want to do this for short parameters as they can just be
    // indexes.
    State.Stack.back().NoLineBreak = true;
  }

  // From here on, State.Column is the column at which Current starts.
  State.Column += Spaces;
  if (Current.isNot(tok::comment) && Previous.is(tok::l_paren) &&
      Previous.Previous &&
      Previous.Previous->isOneOf(tok::kw_if, tok::kw_for)) {
    // Treat the condition inside an if as if it was a second function
    // parameter, i.e. let nested calls have a continuation indent.
    State.Stack.back().LastSpace = State.Column;
    State.Stack.back().NestedBlockIndent = State.Column;
  } else if (!Current.isOneOf(tok::comment, tok::caret) &&
             ((Previous.is(tok::comma) &&
               !Previous.is(TT_OverloadedOperator)) ||
              (Previous.is(tok::colon) && Previous.is(TT_ObjCMethodExpr)))) {
    State.Stack.back().LastSpace = State.Column;
  } else if ((Previous.isOneOf(TT_BinaryOperator, TT_ConditionalExpr,
                               TT_CtorInitializerColon)) &&
             ((Previous.getPrecedence() != prec::Assignment &&
               (Previous.isNot(tok::lessless) || Previous.OperatorIndex != 0 ||
                Previous.NextOperator)) ||
              Current.StartsBinaryExpression)) {
    // Indent relative to the RHS of the expression unless this is a simple
    // assignment without binary expression on the RHS. Also indent relative to
    // unary operators and the colons of constructor initializers.
    State.Stack.back().LastSpace = State.Column;
  } else if (Previous.is(TT_InheritanceColon)) {
    State.Stack.back().Indent = State.Column;
    State.Stack.back().LastSpace = State.Column;
  } else if (Previous.opensScope()) {
    // If a function has a trailing call, indent all parameters from the
    // opening parenthesis. This avoids confusing indents like:
    //   OuterFunction(InnerFunctionCall( // break
    //       ParameterToInnerFunction))   // break
    //       .SecondInnerFunctionCall();
    bool HasTrailingCall = false;
    if (Previous.MatchingParen) {
      const FormatToken *Next = Previous.MatchingParen->getNextNonComment();
      HasTrailingCall = Next && Next->isMemberAccess();
    }
    if (HasTrailingCall && State.Stack.size() > 1 &&
        State.Stack[State.Stack.size() - 2].CallContinuation == 0)
      State.Stack.back().LastSpace = State.Column;
  }
}
438 
// Places \c State.NextToken on a new line.
//
// The token is positioned at the column computed by \c getNewLineColumn, and
// the ParenState stack is updated to reflect the break. The whitespace is
// handed to the WhitespaceManager only if \c DryRun is false.
// \c State.NextToken itself is not advanced here.
//
// Returns the penalty attributed to this line break.
unsigned ContinuationIndenter::addTokenOnNewLine(LineState &State,
                                                 bool DryRun) {
  FormatToken &Current = *State.NextToken;
  const FormatToken &Previous = *State.NextToken->Previous;

  // Extra penalty that needs to be added because of the way certain line
  // breaks are chosen.
  unsigned Penalty = 0;

  const FormatToken *PreviousNonComment = Current.getPreviousNonComment();
  const FormatToken *NextNonComment = Previous.getNextNonComment();
  if (!NextNonComment)
    NextNonComment = &Current;
  // The first line break on any NestingLevel causes an extra penalty in order
  // to prefer similar line breaks.
  if (!State.Stack.back().ContainsLineBreak)
    Penalty += 15;
  State.Stack.back().ContainsLineBreak = true;

  Penalty += State.NextToken->SplitPenalty;

  // Breaking before the first "<<" is generally not desirable if the LHS is
  // short. Also always add the penalty if the LHS is split over multiple lines
  // to avoid unnecessary line breaks that just work around this penalty.
  if (NextNonComment->is(tok::lessless) &&
      State.Stack.back().FirstLessLess == 0 &&
      (State.Column <= Style.ColumnLimit / 3 ||
       State.Stack.back().BreakBeforeParameter))
    Penalty += Style.PenaltyBreakFirstLessLess;

  // From here on, State.Column is the column at which Current starts on the
  // new line.
  State.Column = getNewLineColumn(State);

  // Indent nested blocks relative to this column, unless in a very specific
  // JavaScript special case where:
  //
  //   var loooooong_name =
  //       function() {
  //     // code
  //   }
  //
  // is common and should be formatted like a free-standing function.
  if (Style.Language != FormatStyle::LK_JavaScript ||
      Current.NestingLevel != 0 || !PreviousNonComment ||
      !PreviousNonComment->is(tok::equal) ||
      !Current.isOneOf(Keywords.kw_async, Keywords.kw_function))
    State.Stack.back().NestedBlockIndent = State.Column;

  if (NextNonComment->isMemberAccess()) {
    // Remember the column of the first wrapped member access on this level.
    if (State.Stack.back().CallContinuation == 0)
      State.Stack.back().CallContinuation = State.Column;
  } else if (NextNonComment->is(TT_SelectorName)) {
    if (!State.Stack.back().ObjCSelectorNameFound) {
      if (NextNonComment->LongestObjCSelectorName == 0) {
        State.Stack.back().AlignColons = false;
      } else {
        State.Stack.back().ColonPos =
            (Style.IndentWrappedFunctionNames
                 ? std::max(State.Stack.back().Indent,
                            State.FirstIndent + Style.ContinuationIndentWidth)
                 : State.Stack.back().Indent) +
            NextNonComment->LongestObjCSelectorName;
      }
    } else if (State.Stack.back().AlignColons &&
               State.Stack.back().ColonPos <= NextNonComment->ColumnWidth) {
      State.Stack.back().ColonPos = State.Column + NextNonComment->ColumnWidth;
    }
  } else if (PreviousNonComment && PreviousNonComment->is(tok::colon) &&
             PreviousNonComment->isOneOf(TT_ObjCMethodExpr, TT_DictLiteral)) {
    // FIXME: This is hacky, find a better way. The problem is that in an ObjC
    // method expression, the block should be aligned to the line starting it,
    // e.g.:
    //   [aaaaaaaaaaaaaaa aaaaaaaaa: \\ break for some reason
    //                        ^(int *i) {
    //                            // ...
    //                        }];
    // Thus, we set LastSpace of the next higher NestingLevel, to which we move
    // when we consume all of the "}"'s FakeRParens at the "{".
    if (State.Stack.size() > 1)
      State.Stack[State.Stack.size() - 2].LastSpace =
          std::max(State.Stack.back().LastSpace, State.Stack.back().Indent) +
          Style.ContinuationIndentWidth;
  }

  // The statements below adjust BreakBeforeParameter of the innermost level in
  // sequence; later statements can override earlier ones.
  if ((Previous.isOneOf(tok::comma, tok::semi) &&
       !State.Stack.back().AvoidBinPacking) ||
      Previous.is(TT_BinaryOperator))
    State.Stack.back().BreakBeforeParameter = false;
  if (Previous.isOneOf(TT_TemplateCloser, TT_JavaAnnotation) &&
      Current.NestingLevel == 0)
    State.Stack.back().BreakBeforeParameter = false;
  if (NextNonComment->is(tok::question) ||
      (PreviousNonComment && PreviousNonComment->is(tok::question)))
    State.Stack.back().BreakBeforeParameter = true;
  if (Current.is(TT_BinaryOperator) && Current.CanBreakBefore)
    State.Stack.back().BreakBeforeParameter = false;

  if (!DryRun) {
    // Emit at least one newline, and at most MaxEmptyLinesToKeep + 1 of the
    // newlines that preceded the token originally.
    unsigned Newlines = std::max(
        1u, std::min(Current.NewlinesBefore, Style.MaxEmptyLinesToKeep + 1));
    Whitespaces.replaceWhitespace(Current, Newlines,
                                  State.Stack.back().IndentLevel, State.Column,
                                  State.Column, State.Line->InPPDirective);
  }

  if (!Current.isTrailingComment())
    State.Stack.back().LastSpace = State.Column;
  if (Current.is(tok::lessless))
    // If we are breaking before a "<<", we always want to indent relative to
    // RHS. This is necessary only for "<<", as we special-case it and don't
    // always indent relative to the RHS.
    State.Stack.back().LastSpace += 3; // 3 -> width of "<< ".

  State.StartOfLineLevel = Current.NestingLevel;
  State.LowestLevelOnLine = Current.NestingLevel;

  // Any break on this level means that the parent level has been broken
  // and we need to avoid bin packing there.
  bool NestedBlockSpecialCase =
      Style.Language != FormatStyle::LK_Cpp &&
      Current.is(tok::r_brace) && State.Stack.size() > 1 &&
      State.Stack[State.Stack.size() - 2].NestedBlockInlined;
  if (!NestedBlockSpecialCase)
    // Covers every stack entry except the innermost one.
    for (unsigned i = 0, e = State.Stack.size() - 1; i != e; ++i)
      State.Stack[i].BreakBeforeParameter = true;

  if (PreviousNonComment &&
      !PreviousNonComment->isOneOf(tok::comma, tok::semi) &&
      (PreviousNonComment->isNot(TT_TemplateCloser) ||
       Current.NestingLevel != 0) &&
      !PreviousNonComment->isOneOf(
          TT_BinaryOperator, TT_FunctionAnnotationRParen, TT_JavaAnnotation,
          TT_LeadingJavaAnnotation) &&
      Current.isNot(TT_BinaryOperator) && !PreviousNonComment->opensScope())
    State.Stack.back().BreakBeforeParameter = true;

  // If we break after { or the [ of an array initializer, we should also break
  // before the corresponding } or ].
  if (PreviousNonComment &&
      (PreviousNonComment->isOneOf(tok::l_brace, TT_ArrayInitializerLSquare)))
    State.Stack.back().BreakBeforeClosingBrace = true;

  if (State.Stack.back().AvoidBinPacking) {
    // If we are breaking after '(', '{', '<', this is not bin packing
    // unless AllowAllParametersOfDeclarationOnNextLine is false or this is a
    // dict/object literal.
    if (!Previous.isOneOf(tok::l_paren, tok::l_brace, TT_BinaryOperator) ||
        (!Style.AllowAllParametersOfDeclarationOnNextLine &&
         State.Line->MustBeDeclaration) ||
        Previous.is(TT_DictLiteral))
      State.Stack.back().BreakBeforeParameter = true;
  }

  return Penalty;
}
593 
594 unsigned ContinuationIndenter::getNewLineColumn(const LineState &State) {
595   if (!State.NextToken || !State.NextToken->Previous)
596     return 0;
597   FormatToken &Current = *State.NextToken;
598   const FormatToken &Previous = *Current.Previous;
599   // If we are continuing an expression, we want to use the continuation indent.
600   unsigned ContinuationIndent =
601       std::max(State.Stack.back().LastSpace, State.Stack.back().Indent) +
602       Style.ContinuationIndentWidth;
603   const FormatToken *PreviousNonComment = Current.getPreviousNonComment();
604   const FormatToken *NextNonComment = Previous.getNextNonComment();
605   if (!NextNonComment)
606     NextNonComment = &Current;
607 
608   // Java specific bits.
609   if (Style.Language == FormatStyle::LK_Java &&
610       Current.isOneOf(Keywords.kw_implements, Keywords.kw_extends))
611     return std::max(State.Stack.back().LastSpace,
612                     State.Stack.back().Indent + Style.ContinuationIndentWidth);
613 
614   if (NextNonComment->is(tok::l_brace) && NextNonComment->BlockKind == BK_Block)
615     return Current.NestingLevel == 0 ? State.FirstIndent
616                                      : State.Stack.back().Indent;
617   if (Current.isOneOf(tok::r_brace, tok::r_square) && State.Stack.size() > 1) {
618     if (Current.closesBlockOrBlockTypeList(Style))
619       return State.Stack[State.Stack.size() - 2].NestedBlockIndent;
620     if (Current.MatchingParen &&
621         Current.MatchingParen->BlockKind == BK_BracedInit)
622       return State.Stack[State.Stack.size() - 2].LastSpace;
623     return State.FirstIndent;
624   }
625   if (Current.is(tok::identifier) && Current.Next &&
626       Current.Next->is(TT_DictLiteral))
627     return State.Stack.back().Indent;
628   if (NextNonComment->isStringLiteral() && State.StartOfStringLiteral != 0)
629     return State.StartOfStringLiteral;
630   if (NextNonComment->is(TT_ObjCStringLiteral) &&
631       State.StartOfStringLiteral != 0)
632     return State.StartOfStringLiteral - 1;
633   if (NextNonComment->is(tok::lessless) &&
634       State.Stack.back().FirstLessLess != 0)
635     return State.Stack.back().FirstLessLess;
636   if (NextNonComment->isMemberAccess()) {
637     if (State.Stack.back().CallContinuation == 0)
638       return ContinuationIndent;
639     return State.Stack.back().CallContinuation;
640   }
641   if (State.Stack.back().QuestionColumn != 0 &&
642       ((NextNonComment->is(tok::colon) &&
643         NextNonComment->is(TT_ConditionalExpr)) ||
644        Previous.is(TT_ConditionalExpr)))
645     return State.Stack.back().QuestionColumn;
646   if (Previous.is(tok::comma) && State.Stack.back().VariablePos != 0)
647     return State.Stack.back().VariablePos;
648   if ((PreviousNonComment &&
649        (PreviousNonComment->ClosesTemplateDeclaration ||
650         PreviousNonComment->isOneOf(
651             TT_AttributeParen, TT_FunctionAnnotationRParen, TT_JavaAnnotation,
652             TT_LeadingJavaAnnotation))) ||
653       (!Style.IndentWrappedFunctionNames &&
654        NextNonComment->isOneOf(tok::kw_operator, TT_FunctionDeclarationName)))
655     return std::max(State.Stack.back().LastSpace, State.Stack.back().Indent);
656   if (NextNonComment->is(TT_SelectorName)) {
657     if (!State.Stack.back().ObjCSelectorNameFound) {
658       if (NextNonComment->LongestObjCSelectorName == 0)
659         return State.Stack.back().Indent;
660       return (Style.IndentWrappedFunctionNames
661                   ? std::max(State.Stack.back().Indent,
662                              State.FirstIndent + Style.ContinuationIndentWidth)
663                   : State.Stack.back().Indent) +
664              NextNonComment->LongestObjCSelectorName -
665              NextNonComment->ColumnWidth;
666     }
667     if (!State.Stack.back().AlignColons)
668       return State.Stack.back().Indent;
669     if (State.Stack.back().ColonPos > NextNonComment->ColumnWidth)
670       return State.Stack.back().ColonPos - NextNonComment->ColumnWidth;
671     return State.Stack.back().Indent;
672   }
673   if (NextNonComment->is(TT_ArraySubscriptLSquare)) {
674     if (State.Stack.back().StartOfArraySubscripts != 0)
675       return State.Stack.back().StartOfArraySubscripts;
676     return ContinuationIndent;
677   }
678 
679   // This ensure that we correctly format ObjC methods calls without inputs,
680   // i.e. where the last element isn't selector like: [callee method];
681   if (NextNonComment->is(tok::identifier) && NextNonComment->FakeRParens == 0 &&
682       NextNonComment->Next && NextNonComment->Next->is(TT_ObjCMethodExpr))
683     return State.Stack.back().Indent;
684 
685   if (NextNonComment->isOneOf(TT_StartOfName, TT_PointerOrReference) ||
686       Previous.isOneOf(tok::coloncolon, tok::equal, TT_JsTypeColon))
687     return ContinuationIndent;
688   if (PreviousNonComment && PreviousNonComment->is(tok::colon) &&
689       PreviousNonComment->isOneOf(TT_ObjCMethodExpr, TT_DictLiteral))
690     return ContinuationIndent;
691   if (NextNonComment->is(TT_CtorInitializerColon))
692     return State.FirstIndent + Style.ConstructorInitializerIndentWidth;
693   if (NextNonComment->is(TT_CtorInitializerComma))
694     return State.Stack.back().Indent;
695   if (Previous.is(tok::r_paren) && !Current.isBinaryOperator() &&
696       !Current.isOneOf(tok::colon, tok::comment))
697     return ContinuationIndent;
698   if (State.Stack.back().Indent == State.FirstIndent && PreviousNonComment &&
699       PreviousNonComment->isNot(tok::r_brace))
700     // Ensure that we fall back to the continuation indent width instead of
701     // just flushing continuations left.
702     return State.Stack.back().Indent + Style.ContinuationIndentWidth;
703   return State.Stack.back().Indent;
704 }
705 
706 unsigned ContinuationIndenter::moveStateToNextToken(LineState &State,
707                                                     bool DryRun, bool Newline) {
708   assert(State.Stack.size());
709   const FormatToken &Current = *State.NextToken;
710 
711   if (Current.is(TT_InheritanceColon))
712     State.Stack.back().AvoidBinPacking = true;
713   if (Current.is(tok::lessless) && Current.isNot(TT_OverloadedOperator)) {
714     if (State.Stack.back().FirstLessLess == 0)
715       State.Stack.back().FirstLessLess = State.Column;
716     else
717       State.Stack.back().LastOperatorWrapped = Newline;
718   }
719   if ((Current.is(TT_BinaryOperator) && Current.isNot(tok::lessless)) ||
720       Current.is(TT_ConditionalExpr))
721     State.Stack.back().LastOperatorWrapped = Newline;
722   if (Current.is(TT_ArraySubscriptLSquare) &&
723       State.Stack.back().StartOfArraySubscripts == 0)
724     State.Stack.back().StartOfArraySubscripts = State.Column;
725   if (Style.BreakBeforeTernaryOperators && Current.is(tok::question))
726     State.Stack.back().QuestionColumn = State.Column;
727   if (!Style.BreakBeforeTernaryOperators && Current.isNot(tok::colon)) {
728     const FormatToken *Previous = Current.Previous;
729     while (Previous && Previous->isTrailingComment())
730       Previous = Previous->Previous;
731     if (Previous && Previous->is(tok::question))
732       State.Stack.back().QuestionColumn = State.Column;
733   }
734   if (!Current.opensScope() && !Current.closesScope())
735     State.LowestLevelOnLine =
736         std::min(State.LowestLevelOnLine, Current.NestingLevel);
737   if (Current.isMemberAccess())
738     State.Stack.back().StartOfFunctionCall =
739         !Current.NextOperator ? 0 : State.Column;
740   if (Current.is(TT_SelectorName)) {
741     State.Stack.back().ObjCSelectorNameFound = true;
742     if (Style.IndentWrappedFunctionNames) {
743       State.Stack.back().Indent =
744           State.FirstIndent + Style.ContinuationIndentWidth;
745     }
746   }
747   if (Current.is(TT_CtorInitializerColon)) {
748     // Indent 2 from the column, so:
749     // SomeClass::SomeClass()
750     //     : First(...), ...
751     //       Next(...)
752     //       ^ line up here.
753     State.Stack.back().Indent =
754         State.Column + (Style.BreakConstructorInitializersBeforeComma ? 0 : 2);
755     State.Stack.back().NestedBlockIndent = State.Stack.back().Indent;
756     if (Style.ConstructorInitializerAllOnOneLineOrOnePerLine)
757       State.Stack.back().AvoidBinPacking = true;
758     State.Stack.back().BreakBeforeParameter = false;
759   }
760   if (Current.isOneOf(TT_BinaryOperator, TT_ConditionalExpr) && Newline)
761     State.Stack.back().NestedBlockIndent =
762         State.Column + Current.ColumnWidth + 1;
763 
764   // Insert scopes created by fake parenthesis.
765   const FormatToken *Previous = Current.getPreviousNonComment();
766 
767   // Add special behavior to support a format commonly used for JavaScript
768   // closures:
769   //   SomeFunction(function() {
770   //     foo();
771   //     bar();
772   //   }, a, b, c);
773   if (Current.isNot(tok::comment) && Previous &&
774       Previous->isOneOf(tok::l_brace, TT_ArrayInitializerLSquare) &&
775       !Previous->is(TT_DictLiteral) && State.Stack.size() > 1) {
776     if (State.Stack[State.Stack.size() - 2].NestedBlockInlined && Newline)
777       for (unsigned i = 0, e = State.Stack.size() - 1; i != e; ++i)
778         State.Stack[i].NoLineBreak = true;
779     State.Stack[State.Stack.size() - 2].NestedBlockInlined = false;
780   }
781   if (Previous && (Previous->isOneOf(tok::l_paren, tok::comma, tok::colon) ||
782                    Previous->isOneOf(TT_BinaryOperator, TT_ConditionalExpr)) &&
783       !Previous->isOneOf(TT_DictLiteral, TT_ObjCMethodExpr)) {
784     State.Stack.back().NestedBlockInlined =
785         !Newline &&
786         (Previous->isNot(tok::l_paren) || Previous->ParameterCount > 1);
787   }
788 
789   moveStatePastFakeLParens(State, Newline);
790   moveStatePastScopeOpener(State, Newline);
791   moveStatePastScopeCloser(State);
792   moveStatePastFakeRParens(State);
793 
794   if (Current.isStringLiteral() && State.StartOfStringLiteral == 0)
795     State.StartOfStringLiteral = State.Column;
796   if (Current.is(TT_ObjCStringLiteral) && State.StartOfStringLiteral == 0)
797     State.StartOfStringLiteral = State.Column + 1;
798   else if (!Current.isOneOf(tok::comment, tok::identifier, tok::hash) &&
799            !Current.isStringLiteral())
800     State.StartOfStringLiteral = 0;
801 
802   State.Column += Current.ColumnWidth;
803   State.NextToken = State.NextToken->Next;
804   unsigned Penalty = breakProtrudingToken(Current, State, DryRun);
805   if (State.Column > getColumnLimit(State)) {
806     unsigned ExcessCharacters = State.Column - getColumnLimit(State);
807     Penalty += Style.PenaltyExcessCharacter * ExcessCharacters;
808   }
809 
810   if (Current.Role)
811     Current.Role->formatFromToken(State, this, DryRun);
812   // If the previous has a special role, let it consume tokens as appropriate.
813   // It is necessary to start at the previous token for the only implemented
814   // role (comma separated list). That way, the decision whether or not to break
815   // after the "{" is already done and both options are tried and evaluated.
816   // FIXME: This is ugly, find a better way.
817   if (Previous && Previous->Role)
818     Penalty += Previous->Role->formatAfterToken(State, this, DryRun);
819 
820   return Penalty;
821 }
822 
823 void ContinuationIndenter::moveStatePastFakeLParens(LineState &State,
824                                                     bool Newline) {
825   const FormatToken &Current = *State.NextToken;
826   const FormatToken *Previous = Current.getPreviousNonComment();
827 
828   // Don't add extra indentation for the first fake parenthesis after
829   // 'return', assignments or opening <({[. The indentation for these cases
830   // is special cased.
831   bool SkipFirstExtraIndent =
832       (Previous && (Previous->opensScope() ||
833                     Previous->isOneOf(tok::semi, tok::kw_return) ||
834                     (Previous->getPrecedence() == prec::Assignment &&
835                      Style.AlignOperands) ||
836                     Previous->is(TT_ObjCMethodExpr)));
837   for (SmallVectorImpl<prec::Level>::const_reverse_iterator
838            I = Current.FakeLParens.rbegin(),
839            E = Current.FakeLParens.rend();
840        I != E; ++I) {
841     ParenState NewParenState = State.Stack.back();
842     NewParenState.ContainsLineBreak = false;
843 
844     // Indent from 'LastSpace' unless these are fake parentheses encapsulating
845     // a builder type call after 'return' or, if the alignment after opening
846     // brackets is disabled.
847     if (!Current.isTrailingComment() &&
848         (Style.AlignOperands || *I < prec::Assignment) &&
849         (!Previous || Previous->isNot(tok::kw_return) ||
850          (Style.Language != FormatStyle::LK_Java && *I > 0)) &&
851         (Style.AlignAfterOpenBracket != FormatStyle::BAS_DontAlign ||
852          *I != prec::Comma || Current.NestingLevel == 0))
853       NewParenState.Indent =
854           std::max(std::max(State.Column, NewParenState.Indent),
855                    State.Stack.back().LastSpace);
856 
857     // Don't allow the RHS of an operator to be split over multiple lines unless
858     // there is a line-break right after the operator.
859     // Exclude relational operators, as there, it is always more desirable to
860     // have the LHS 'left' of the RHS.
861     if (Previous && Previous->getPrecedence() != prec::Assignment &&
862         Previous->isOneOf(TT_BinaryOperator, TT_ConditionalExpr) &&
863         Previous->getPrecedence() != prec::Relational) {
864       bool BreakBeforeOperator =
865           Previous->is(tok::lessless) ||
866           (Previous->is(TT_BinaryOperator) &&
867            Style.BreakBeforeBinaryOperators != FormatStyle::BOS_None) ||
868           (Previous->is(TT_ConditionalExpr) &&
869            Style.BreakBeforeTernaryOperators);
870       if ((!Newline && !BreakBeforeOperator) ||
871           (!State.Stack.back().LastOperatorWrapped && BreakBeforeOperator))
872         NewParenState.NoLineBreak = true;
873     }
874 
875     // Do not indent relative to the fake parentheses inserted for "." or "->".
876     // This is a special case to make the following to statements consistent:
877     //   OuterFunction(InnerFunctionCall( // break
878     //       ParameterToInnerFunction));
879     //   OuterFunction(SomeObject.InnerFunctionCall( // break
880     //       ParameterToInnerFunction));
881     if (*I > prec::Unknown)
882       NewParenState.LastSpace = std::max(NewParenState.LastSpace, State.Column);
883     if (*I != prec::Conditional && !Current.is(TT_UnaryOperator) &&
884         Style.AlignAfterOpenBracket != FormatStyle::BAS_DontAlign)
885       NewParenState.StartOfFunctionCall = State.Column;
886 
887     // Always indent conditional expressions. Never indent expression where
888     // the 'operator' is ',', ';' or an assignment (i.e. *I <=
889     // prec::Assignment) as those have different indentation rules. Indent
890     // other expression, unless the indentation needs to be skipped.
891     if (*I == prec::Conditional ||
892         (!SkipFirstExtraIndent && *I > prec::Assignment &&
893          !Current.isTrailingComment()))
894       NewParenState.Indent += Style.ContinuationIndentWidth;
895     if ((Previous && !Previous->opensScope()) || *I != prec::Comma)
896       NewParenState.BreakBeforeParameter = false;
897     State.Stack.push_back(NewParenState);
898     SkipFirstExtraIndent = false;
899   }
900 }
901 
902 void ContinuationIndenter::moveStatePastFakeRParens(LineState &State) {
903   for (unsigned i = 0, e = State.NextToken->FakeRParens; i != e; ++i) {
904     unsigned VariablePos = State.Stack.back().VariablePos;
905     if (State.Stack.size() == 1) {
906       // Do not pop the last element.
907       break;
908     }
909     State.Stack.pop_back();
910     State.Stack.back().VariablePos = VariablePos;
911   }
912 }
913 
914 void ContinuationIndenter::moveStatePastScopeOpener(LineState &State,
915                                                     bool Newline) {
916   const FormatToken &Current = *State.NextToken;
917   if (!Current.opensScope())
918     return;
919 
920   if (Current.MatchingParen && Current.BlockKind == BK_Block) {
921     moveStateToNewBlock(State);
922     return;
923   }
924 
925   unsigned NewIndent;
926   unsigned NewIndentLevel = State.Stack.back().IndentLevel;
927   unsigned LastSpace = State.Stack.back().LastSpace;
928   bool AvoidBinPacking;
929   bool BreakBeforeParameter = false;
930   unsigned NestedBlockIndent = std::max(State.Stack.back().StartOfFunctionCall,
931                                         State.Stack.back().NestedBlockIndent);
932   if (Current.isOneOf(tok::l_brace, TT_ArrayInitializerLSquare)) {
933     if (Current.opensBlockOrBlockTypeList(Style)) {
934       NewIndent = State.Stack.back().NestedBlockIndent + Style.IndentWidth;
935       NewIndent = std::min(State.Column + 2, NewIndent);
936       ++NewIndentLevel;
937     } else {
938       NewIndent = State.Stack.back().LastSpace + Style.ContinuationIndentWidth;
939     }
940     const FormatToken *NextNoComment = Current.getNextNonComment();
941     bool EndsInComma = Current.MatchingParen &&
942                        Current.MatchingParen->Previous &&
943                        Current.MatchingParen->Previous->is(tok::comma);
944     AvoidBinPacking =
945         (Current.is(TT_ArrayInitializerLSquare) && EndsInComma) ||
946         Current.is(TT_DictLiteral) ||
947         Style.Language == FormatStyle::LK_Proto || !Style.BinPackArguments ||
948         (NextNoComment && NextNoComment->is(TT_DesignatedInitializerPeriod));
949     if (Current.ParameterCount > 1)
950       NestedBlockIndent = std::max(NestedBlockIndent, State.Column + 1);
951   } else {
952     NewIndent = Style.ContinuationIndentWidth +
953                 std::max(State.Stack.back().LastSpace,
954                          State.Stack.back().StartOfFunctionCall);
955 
956     // Ensure that different different brackets force relative alignment, e.g.:
957     // void SomeFunction(vector<  // break
958     //                       int> v);
959     // FIXME: We likely want to do this for more combinations of brackets.
960     // Verify that it is wanted for ObjC, too.
961     if (Current.Tok.getKind() == tok::less &&
962         Current.ParentBracket == tok::l_paren) {
963       NewIndent = std::max(NewIndent, State.Stack.back().Indent);
964       LastSpace = std::max(LastSpace, State.Stack.back().Indent);
965     }
966 
967     AvoidBinPacking =
968         (State.Line->MustBeDeclaration && !Style.BinPackParameters) ||
969         (!State.Line->MustBeDeclaration && !Style.BinPackArguments) ||
970         (Style.ExperimentalAutoDetectBinPacking &&
971          (Current.PackingKind == PPK_OnePerLine ||
972           (!BinPackInconclusiveFunctions &&
973            Current.PackingKind == PPK_Inconclusive)));
974     if (Current.is(TT_ObjCMethodExpr) && Current.MatchingParen) {
975       if (Style.ColumnLimit) {
976         // If this '[' opens an ObjC call, determine whether all parameters fit
977         // into one line and put one per line if they don't.
978         if (getLengthToMatchingParen(Current) + State.Column >
979             getColumnLimit(State))
980           BreakBeforeParameter = true;
981       } else {
982         // For ColumnLimit = 0, we have to figure out whether there is or has to
983         // be a line break within this call.
984         for (const FormatToken *Tok = &Current;
985              Tok && Tok != Current.MatchingParen; Tok = Tok->Next) {
986           if (Tok->MustBreakBefore ||
987               (Tok->CanBreakBefore && Tok->NewlinesBefore > 0)) {
988             BreakBeforeParameter = true;
989             break;
990           }
991         }
992       }
993     }
994   }
995   // Generally inherit NoLineBreak from the current scope to nested scope.
996   // However, don't do this for non-empty nested blocks, dict literals and
997   // array literals as these follow different indentation rules.
998   bool NoLineBreak =
999       Current.Children.empty() &&
1000       !Current.isOneOf(TT_DictLiteral, TT_ArrayInitializerLSquare) &&
1001       (State.Stack.back().NoLineBreak ||
1002        (Current.is(TT_TemplateOpener) &&
1003         State.Stack.back().ContainsUnwrappedBuilder));
1004   State.Stack.push_back(ParenState(NewIndent, NewIndentLevel, LastSpace,
1005                                    AvoidBinPacking, NoLineBreak));
1006   State.Stack.back().NestedBlockIndent = NestedBlockIndent;
1007   State.Stack.back().BreakBeforeParameter = BreakBeforeParameter;
1008   State.Stack.back().HasMultipleNestedBlocks = Current.BlockParameterCount > 1;
1009 }
1010 
1011 void ContinuationIndenter::moveStatePastScopeCloser(LineState &State) {
1012   const FormatToken &Current = *State.NextToken;
1013   if (!Current.closesScope())
1014     return;
1015 
1016   // If we encounter a closing ), ], } or >, we can remove a level from our
1017   // stacks.
1018   if (State.Stack.size() > 1 &&
1019       (Current.isOneOf(tok::r_paren, tok::r_square) ||
1020        (Current.is(tok::r_brace) && State.NextToken != State.Line->First) ||
1021        State.NextToken->is(TT_TemplateCloser)))
1022     State.Stack.pop_back();
1023 
1024   if (Current.is(tok::r_square)) {
1025     // If this ends the array subscript expr, reset the corresponding value.
1026     const FormatToken *NextNonComment = Current.getNextNonComment();
1027     if (NextNonComment && NextNonComment->isNot(tok::l_square))
1028       State.Stack.back().StartOfArraySubscripts = 0;
1029   }
1030 }
1031 
1032 void ContinuationIndenter::moveStateToNewBlock(LineState &State) {
1033   unsigned NestedBlockIndent = State.Stack.back().NestedBlockIndent;
1034   // ObjC block sometimes follow special indentation rules.
1035   unsigned NewIndent =
1036       NestedBlockIndent + (State.NextToken->is(TT_ObjCBlockLBrace)
1037                                ? Style.ObjCBlockIndentWidth
1038                                : Style.IndentWidth);
1039   State.Stack.push_back(ParenState(
1040       NewIndent, /*NewIndentLevel=*/State.Stack.back().IndentLevel + 1,
1041       State.Stack.back().LastSpace, /*AvoidBinPacking=*/true,
1042       /*NoLineBreak=*/false));
1043   State.Stack.back().NestedBlockIndent = NestedBlockIndent;
1044   State.Stack.back().BreakBeforeParameter = true;
1045 }
1046 
1047 unsigned ContinuationIndenter::addMultilineToken(const FormatToken &Current,
1048                                                  LineState &State) {
1049   // Break before further function parameters on all levels.
1050   for (unsigned i = 0, e = State.Stack.size(); i != e; ++i)
1051     State.Stack[i].BreakBeforeParameter = true;
1052 
1053   unsigned ColumnsUsed = State.Column;
1054   // We can only affect layout of the first and the last line, so the penalty
1055   // for all other lines is constant, and we ignore it.
1056   State.Column = Current.LastLineColumnWidth;
1057 
1058   if (ColumnsUsed > getColumnLimit(State))
1059     return Style.PenaltyExcessCharacter * (ColumnsUsed - getColumnLimit(State));
1060   return 0;
1061 }
1062 
1063 unsigned ContinuationIndenter::breakProtrudingToken(const FormatToken &Current,
1064                                                     LineState &State,
1065                                                     bool DryRun) {
1066   // Don't break multi-line tokens other than block comments. Instead, just
1067   // update the state.
1068   if (Current.isNot(TT_BlockComment) && Current.IsMultiline)
1069     return addMultilineToken(Current, State);
1070 
1071   // Don't break implicit string literals or import statements.
1072   if (Current.is(TT_ImplicitStringLiteral) ||
1073       State.Line->Type == LT_ImportStatement)
1074     return 0;
1075 
1076   if (!Current.isStringLiteral() && !Current.is(tok::comment))
1077     return 0;
1078 
1079   std::unique_ptr<BreakableToken> Token;
1080   unsigned StartColumn = State.Column - Current.ColumnWidth;
1081   unsigned ColumnLimit = getColumnLimit(State);
1082 
1083   if (Current.isStringLiteral()) {
1084     // FIXME: String literal breaking is currently disabled for Java and JS, as
1085     // it requires strings to be merged using "+" which we don't support.
1086     if (Style.Language == FormatStyle::LK_Java ||
1087         Style.Language == FormatStyle::LK_JavaScript ||
1088         !Style.BreakStringLiterals)
1089       return 0;
1090 
1091     // Don't break string literals inside preprocessor directives (except for
1092     // #define directives, as their contents are stored in separate lines and
1093     // are not affected by this check).
1094     // This way we avoid breaking code with line directives and unknown
1095     // preprocessor directives that contain long string literals.
1096     if (State.Line->Type == LT_PreprocessorDirective)
1097       return 0;
1098     // Exempts unterminated string literals from line breaking. The user will
1099     // likely want to terminate the string before any line breaking is done.
1100     if (Current.IsUnterminatedLiteral)
1101       return 0;
1102 
1103     StringRef Text = Current.TokenText;
1104     StringRef Prefix;
1105     StringRef Postfix;
1106     bool IsNSStringLiteral = false;
1107     // FIXME: Handle whitespace between '_T', '(', '"..."', and ')'.
1108     // FIXME: Store Prefix and Suffix (or PrefixLength and SuffixLength to
1109     // reduce the overhead) for each FormatToken, which is a string, so that we
1110     // don't run multiple checks here on the hot path.
1111     if (Text.startswith("\"") && Current.Previous &&
1112         Current.Previous->is(tok::at)) {
1113       IsNSStringLiteral = true;
1114       Prefix = "@\"";
1115     }
1116     if ((Text.endswith(Postfix = "\"") &&
1117          (IsNSStringLiteral || Text.startswith(Prefix = "\"") ||
1118           Text.startswith(Prefix = "u\"") || Text.startswith(Prefix = "U\"") ||
1119           Text.startswith(Prefix = "u8\"") ||
1120           Text.startswith(Prefix = "L\""))) ||
1121         (Text.startswith(Prefix = "_T(\"") && Text.endswith(Postfix = "\")"))) {
1122       Token.reset(new BreakableStringLiteral(
1123           Current, State.Line->Level, StartColumn, Prefix, Postfix,
1124           State.Line->InPPDirective, Encoding, Style));
1125     } else {
1126       return 0;
1127     }
1128   } else if (Current.is(TT_BlockComment) && Current.isTrailingComment()) {
1129     if (!Style.ReflowComments ||
1130         CommentPragmasRegex.match(Current.TokenText.substr(2)))
1131       return 0;
1132     Token.reset(new BreakableBlockComment(
1133         Current, State.Line->Level, StartColumn, Current.OriginalColumn,
1134         !Current.Previous, State.Line->InPPDirective, Encoding, Style));
1135   } else if (Current.is(TT_LineComment) &&
1136              (Current.Previous == nullptr ||
1137               Current.Previous->isNot(TT_ImplicitStringLiteral))) {
1138     if (!Style.ReflowComments ||
1139         CommentPragmasRegex.match(Current.TokenText.substr(2)))
1140       return 0;
1141     Token.reset(new BreakableLineComment(Current, State.Line->Level,
1142                                          StartColumn, /*InPPDirective=*/false,
1143                                          Encoding, Style));
1144     // We don't insert backslashes when breaking line comments.
1145     ColumnLimit = Style.ColumnLimit;
1146   } else {
1147     return 0;
1148   }
1149   if (Current.UnbreakableTailLength >= ColumnLimit)
1150     return 0;
1151 
1152   unsigned RemainingSpace = ColumnLimit - Current.UnbreakableTailLength;
1153   bool BreakInserted = false;
1154   unsigned Penalty = 0;
1155   unsigned RemainingTokenColumns = 0;
1156   for (unsigned LineIndex = 0, EndIndex = Token->getLineCount();
1157        LineIndex != EndIndex; ++LineIndex) {
1158     if (!DryRun)
1159       Token->replaceWhitespaceBefore(LineIndex, Whitespaces);
1160     unsigned TailOffset = 0;
1161     RemainingTokenColumns =
1162         Token->getLineLengthAfterSplit(LineIndex, TailOffset, StringRef::npos);
1163     while (RemainingTokenColumns > RemainingSpace) {
1164       BreakableToken::Split Split =
1165           Token->getSplit(LineIndex, TailOffset, ColumnLimit);
1166       if (Split.first == StringRef::npos) {
1167         // The last line's penalty is handled in addNextStateToQueue().
1168         if (LineIndex < EndIndex - 1)
1169           Penalty += Style.PenaltyExcessCharacter *
1170                      (RemainingTokenColumns - RemainingSpace);
1171         break;
1172       }
1173       assert(Split.first != 0);
1174       unsigned NewRemainingTokenColumns = Token->getLineLengthAfterSplit(
1175           LineIndex, TailOffset + Split.first + Split.second, StringRef::npos);
1176 
1177       // We can remove extra whitespace instead of breaking the line.
1178       if (RemainingTokenColumns + 1 - Split.second <= RemainingSpace) {
1179         RemainingTokenColumns = 0;
1180         if (!DryRun)
1181           Token->replaceWhitespace(LineIndex, TailOffset, Split, Whitespaces);
1182         break;
1183       }
1184 
1185       // When breaking before a tab character, it may be moved by a few columns,
1186       // but will still be expanded to the next tab stop, so we don't save any
1187       // columns.
1188       if (NewRemainingTokenColumns == RemainingTokenColumns)
1189         break;
1190 
1191       assert(NewRemainingTokenColumns < RemainingTokenColumns);
1192       if (!DryRun)
1193         Token->insertBreak(LineIndex, TailOffset, Split, Whitespaces);
1194       Penalty += Current.SplitPenalty;
1195       unsigned ColumnsUsed =
1196           Token->getLineLengthAfterSplit(LineIndex, TailOffset, Split.first);
1197       if (ColumnsUsed > ColumnLimit) {
1198         Penalty += Style.PenaltyExcessCharacter * (ColumnsUsed - ColumnLimit);
1199       }
1200       TailOffset += Split.first + Split.second;
1201       RemainingTokenColumns = NewRemainingTokenColumns;
1202       BreakInserted = true;
1203     }
1204   }
1205 
1206   State.Column = RemainingTokenColumns;
1207 
1208   if (BreakInserted) {
1209     // If we break the token inside a parameter list, we need to break before
1210     // the next parameter on all levels, so that the next parameter is clearly
1211     // visible. Line comments already introduce a break.
1212     if (Current.isNot(TT_LineComment)) {
1213       for (unsigned i = 0, e = State.Stack.size(); i != e; ++i)
1214         State.Stack[i].BreakBeforeParameter = true;
1215     }
1216 
1217     Penalty += Current.isStringLiteral() ? Style.PenaltyBreakString
1218                                          : Style.PenaltyBreakComment;
1219 
1220     State.Stack.back().LastSpace = StartColumn;
1221   }
1222   return Penalty;
1223 }
1224 
1225 unsigned ContinuationIndenter::getColumnLimit(const LineState &State) const {
1226   // In preprocessor directives reserve two chars for trailing " \"
1227   return Style.ColumnLimit - (State.Line->InPPDirective ? 2 : 0);
1228 }
1229 
1230 bool ContinuationIndenter::nextIsMultilineString(const LineState &State) {
1231   const FormatToken &Current = *State.NextToken;
1232   if (!Current.isStringLiteral() || Current.is(TT_ImplicitStringLiteral))
1233     return false;
1234   // We never consider raw string literals "multiline" for the purpose of
1235   // AlwaysBreakBeforeMultilineStrings implementation as they are special-cased
1236   // (see TokenAnnotator::mustBreakBefore().
1237   if (Current.TokenText.startswith("R\""))
1238     return false;
1239   if (Current.IsMultiline)
1240     return true;
1241   if (Current.getNextNonComment() &&
1242       Current.getNextNonComment()->isStringLiteral())
1243     return true; // Implicit concatenation.
1244   if (Style.ColumnLimit != 0 &&
1245       State.Column + Current.ColumnWidth + Current.UnbreakableTailLength >
1246           Style.ColumnLimit)
1247     return true; // String will be split.
1248   return false;
1249 }
1250 
1251 } // namespace format
1252 } // namespace clang
1253