1 //===--- Format.cpp - Format C++ code -------------------------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 ///
10 /// \file
11 /// \brief This file implements functions declared in Format.h. This will be
12 /// split into separate files as we go.
13 ///
14 //===----------------------------------------------------------------------===//
15 
16 #include "clang/Format/Format.h"
17 #include "AffectedRangeManager.h"
18 #include "ContinuationIndenter.h"
19 #include "FormatTokenLexer.h"
20 #include "NamespaceEndCommentsFixer.h"
21 #include "SortJavaScriptImports.h"
22 #include "TokenAnalyzer.h"
23 #include "TokenAnnotator.h"
24 #include "UnwrappedLineFormatter.h"
25 #include "UnwrappedLineParser.h"
26 #include "WhitespaceManager.h"
27 #include "clang/Basic/Diagnostic.h"
28 #include "clang/Basic/DiagnosticOptions.h"
29 #include "clang/Basic/SourceManager.h"
30 #include "clang/Basic/VirtualFileSystem.h"
31 #include "clang/Lex/Lexer.h"
32 #include "llvm/ADT/STLExtras.h"
33 #include "llvm/Support/Allocator.h"
34 #include "llvm/Support/Debug.h"
35 #include "llvm/Support/Path.h"
36 #include "llvm/Support/Regex.h"
37 #include "llvm/Support/YAMLTraits.h"
38 #include <algorithm>
39 #include <memory>
40 #include <string>
41 
42 #define DEBUG_TYPE "format-formatter"
43 
44 using clang::format::FormatStyle;
45 
46 LLVM_YAML_IS_FLOW_SEQUENCE_VECTOR(std::string)
47 LLVM_YAML_IS_SEQUENCE_VECTOR(clang::format::FormatStyle::IncludeCategory)
48 
49 namespace llvm {
50 namespace yaml {
51 template <> struct ScalarEnumerationTraits<FormatStyle::LanguageKind> {
52   static void enumeration(IO &IO, FormatStyle::LanguageKind &Value) {
53     IO.enumCase(Value, "Cpp", FormatStyle::LK_Cpp);
54     IO.enumCase(Value, "Java", FormatStyle::LK_Java);
55     IO.enumCase(Value, "JavaScript", FormatStyle::LK_JavaScript);
56     IO.enumCase(Value, "ObjC", FormatStyle::LK_ObjC);
57     IO.enumCase(Value, "Proto", FormatStyle::LK_Proto);
58     IO.enumCase(Value, "TableGen", FormatStyle::LK_TableGen);
59   }
60 };
61 
62 template <> struct ScalarEnumerationTraits<FormatStyle::LanguageStandard> {
63   static void enumeration(IO &IO, FormatStyle::LanguageStandard &Value) {
64     IO.enumCase(Value, "Cpp03", FormatStyle::LS_Cpp03);
65     IO.enumCase(Value, "C++03", FormatStyle::LS_Cpp03);
66     IO.enumCase(Value, "Cpp11", FormatStyle::LS_Cpp11);
67     IO.enumCase(Value, "C++11", FormatStyle::LS_Cpp11);
68     IO.enumCase(Value, "Auto", FormatStyle::LS_Auto);
69   }
70 };
71 
72 template <> struct ScalarEnumerationTraits<FormatStyle::UseTabStyle> {
73   static void enumeration(IO &IO, FormatStyle::UseTabStyle &Value) {
74     IO.enumCase(Value, "Never", FormatStyle::UT_Never);
75     IO.enumCase(Value, "false", FormatStyle::UT_Never);
76     IO.enumCase(Value, "Always", FormatStyle::UT_Always);
77     IO.enumCase(Value, "true", FormatStyle::UT_Always);
78     IO.enumCase(Value, "ForIndentation", FormatStyle::UT_ForIndentation);
79     IO.enumCase(Value, "ForContinuationAndIndentation",
80                 FormatStyle::UT_ForContinuationAndIndentation);
81   }
82 };
83 
84 template <> struct ScalarEnumerationTraits<FormatStyle::JavaScriptQuoteStyle> {
85   static void enumeration(IO &IO, FormatStyle::JavaScriptQuoteStyle &Value) {
86     IO.enumCase(Value, "Leave", FormatStyle::JSQS_Leave);
87     IO.enumCase(Value, "Single", FormatStyle::JSQS_Single);
88     IO.enumCase(Value, "Double", FormatStyle::JSQS_Double);
89   }
90 };
91 
92 template <> struct ScalarEnumerationTraits<FormatStyle::ShortFunctionStyle> {
93   static void enumeration(IO &IO, FormatStyle::ShortFunctionStyle &Value) {
94     IO.enumCase(Value, "None", FormatStyle::SFS_None);
95     IO.enumCase(Value, "false", FormatStyle::SFS_None);
96     IO.enumCase(Value, "All", FormatStyle::SFS_All);
97     IO.enumCase(Value, "true", FormatStyle::SFS_All);
98     IO.enumCase(Value, "Inline", FormatStyle::SFS_Inline);
99     IO.enumCase(Value, "Empty", FormatStyle::SFS_Empty);
100   }
101 };
102 
103 template <> struct ScalarEnumerationTraits<FormatStyle::BinaryOperatorStyle> {
104   static void enumeration(IO &IO, FormatStyle::BinaryOperatorStyle &Value) {
105     IO.enumCase(Value, "All", FormatStyle::BOS_All);
106     IO.enumCase(Value, "true", FormatStyle::BOS_All);
107     IO.enumCase(Value, "None", FormatStyle::BOS_None);
108     IO.enumCase(Value, "false", FormatStyle::BOS_None);
109     IO.enumCase(Value, "NonAssignment", FormatStyle::BOS_NonAssignment);
110   }
111 };
112 
113 template <> struct ScalarEnumerationTraits<FormatStyle::BraceBreakingStyle> {
114   static void enumeration(IO &IO, FormatStyle::BraceBreakingStyle &Value) {
115     IO.enumCase(Value, "Attach", FormatStyle::BS_Attach);
116     IO.enumCase(Value, "Linux", FormatStyle::BS_Linux);
117     IO.enumCase(Value, "Mozilla", FormatStyle::BS_Mozilla);
118     IO.enumCase(Value, "Stroustrup", FormatStyle::BS_Stroustrup);
119     IO.enumCase(Value, "Allman", FormatStyle::BS_Allman);
120     IO.enumCase(Value, "GNU", FormatStyle::BS_GNU);
121     IO.enumCase(Value, "WebKit", FormatStyle::BS_WebKit);
122     IO.enumCase(Value, "Custom", FormatStyle::BS_Custom);
123   }
124 };
125 
126 template <>
127 struct ScalarEnumerationTraits<FormatStyle::ReturnTypeBreakingStyle> {
128   static void enumeration(IO &IO, FormatStyle::ReturnTypeBreakingStyle &Value) {
129     IO.enumCase(Value, "None", FormatStyle::RTBS_None);
130     IO.enumCase(Value, "All", FormatStyle::RTBS_All);
131     IO.enumCase(Value, "TopLevel", FormatStyle::RTBS_TopLevel);
132     IO.enumCase(Value, "TopLevelDefinitions",
133                 FormatStyle::RTBS_TopLevelDefinitions);
134     IO.enumCase(Value, "AllDefinitions", FormatStyle::RTBS_AllDefinitions);
135   }
136 };
137 
138 template <>
139 struct ScalarEnumerationTraits<FormatStyle::DefinitionReturnTypeBreakingStyle> {
140   static void
141   enumeration(IO &IO, FormatStyle::DefinitionReturnTypeBreakingStyle &Value) {
142     IO.enumCase(Value, "None", FormatStyle::DRTBS_None);
143     IO.enumCase(Value, "All", FormatStyle::DRTBS_All);
144     IO.enumCase(Value, "TopLevel", FormatStyle::DRTBS_TopLevel);
145 
146     // For backward compatibility.
147     IO.enumCase(Value, "false", FormatStyle::DRTBS_None);
148     IO.enumCase(Value, "true", FormatStyle::DRTBS_All);
149   }
150 };
151 
152 template <>
153 struct ScalarEnumerationTraits<FormatStyle::NamespaceIndentationKind> {
154   static void enumeration(IO &IO,
155                           FormatStyle::NamespaceIndentationKind &Value) {
156     IO.enumCase(Value, "None", FormatStyle::NI_None);
157     IO.enumCase(Value, "Inner", FormatStyle::NI_Inner);
158     IO.enumCase(Value, "All", FormatStyle::NI_All);
159   }
160 };
161 
162 template <> struct ScalarEnumerationTraits<FormatStyle::BracketAlignmentStyle> {
163   static void enumeration(IO &IO, FormatStyle::BracketAlignmentStyle &Value) {
164     IO.enumCase(Value, "Align", FormatStyle::BAS_Align);
165     IO.enumCase(Value, "DontAlign", FormatStyle::BAS_DontAlign);
166     IO.enumCase(Value, "AlwaysBreak", FormatStyle::BAS_AlwaysBreak);
167 
168     // For backward compatibility.
169     IO.enumCase(Value, "true", FormatStyle::BAS_Align);
170     IO.enumCase(Value, "false", FormatStyle::BAS_DontAlign);
171   }
172 };
173 
174 template <> struct ScalarEnumerationTraits<FormatStyle::EscapedNewlineAlignmentStyle> {
175   static void enumeration(IO &IO, FormatStyle::EscapedNewlineAlignmentStyle &Value) {
176     IO.enumCase(Value, "DontAlign", FormatStyle::ENAS_DontAlign);
177     IO.enumCase(Value, "Left", FormatStyle::ENAS_Left);
178     IO.enumCase(Value, "Right", FormatStyle::ENAS_Right);
179 
180     // For backward compatibility.
181     IO.enumCase(Value, "true", FormatStyle::ENAS_Left);
182     IO.enumCase(Value, "false", FormatStyle::ENAS_Right);
183   }
184 };
185 
186 template <> struct ScalarEnumerationTraits<FormatStyle::PointerAlignmentStyle> {
187   static void enumeration(IO &IO, FormatStyle::PointerAlignmentStyle &Value) {
188     IO.enumCase(Value, "Middle", FormatStyle::PAS_Middle);
189     IO.enumCase(Value, "Left", FormatStyle::PAS_Left);
190     IO.enumCase(Value, "Right", FormatStyle::PAS_Right);
191 
192     // For backward compatibility.
193     IO.enumCase(Value, "true", FormatStyle::PAS_Left);
194     IO.enumCase(Value, "false", FormatStyle::PAS_Right);
195   }
196 };
197 
198 template <>
199 struct ScalarEnumerationTraits<FormatStyle::SpaceBeforeParensOptions> {
200   static void enumeration(IO &IO,
201                           FormatStyle::SpaceBeforeParensOptions &Value) {
202     IO.enumCase(Value, "Never", FormatStyle::SBPO_Never);
203     IO.enumCase(Value, "ControlStatements",
204                 FormatStyle::SBPO_ControlStatements);
205     IO.enumCase(Value, "Always", FormatStyle::SBPO_Always);
206 
207     // For backward compatibility.
208     IO.enumCase(Value, "false", FormatStyle::SBPO_Never);
209     IO.enumCase(Value, "true", FormatStyle::SBPO_ControlStatements);
210   }
211 };
212 
213 template <> struct MappingTraits<FormatStyle> {
214   static void mapping(IO &IO, FormatStyle &Style) {
215     // When reading, read the language first, we need it for getPredefinedStyle.
216     IO.mapOptional("Language", Style.Language);
217 
218     if (IO.outputting()) {
219       StringRef StylesArray[] = {"LLVM",    "Google", "Chromium",
220                                  "Mozilla", "WebKit", "GNU"};
221       ArrayRef<StringRef> Styles(StylesArray);
222       for (size_t i = 0, e = Styles.size(); i < e; ++i) {
223         StringRef StyleName(Styles[i]);
224         FormatStyle PredefinedStyle;
225         if (getPredefinedStyle(StyleName, Style.Language, &PredefinedStyle) &&
226             Style == PredefinedStyle) {
227           IO.mapOptional("# BasedOnStyle", StyleName);
228           break;
229         }
230       }
231     } else {
232       StringRef BasedOnStyle;
233       IO.mapOptional("BasedOnStyle", BasedOnStyle);
234       if (!BasedOnStyle.empty()) {
235         FormatStyle::LanguageKind OldLanguage = Style.Language;
236         FormatStyle::LanguageKind Language =
237             ((FormatStyle *)IO.getContext())->Language;
238         if (!getPredefinedStyle(BasedOnStyle, Language, &Style)) {
239           IO.setError(Twine("Unknown value for BasedOnStyle: ", BasedOnStyle));
240           return;
241         }
242         Style.Language = OldLanguage;
243       }
244     }
245 
246     // For backward compatibility.
247     if (!IO.outputting()) {
248       IO.mapOptional("AlignEscapedNewlinesLeft", Style.AlignEscapedNewlines);
249       IO.mapOptional("DerivePointerBinding", Style.DerivePointerAlignment);
250       IO.mapOptional("IndentFunctionDeclarationAfterType",
251                      Style.IndentWrappedFunctionNames);
252       IO.mapOptional("PointerBindsToType", Style.PointerAlignment);
253       IO.mapOptional("SpaceAfterControlStatementKeyword",
254                      Style.SpaceBeforeParens);
255     }
256 
257     IO.mapOptional("AccessModifierOffset", Style.AccessModifierOffset);
258     IO.mapOptional("AlignAfterOpenBracket", Style.AlignAfterOpenBracket);
259     IO.mapOptional("AlignConsecutiveAssignments",
260                    Style.AlignConsecutiveAssignments);
261     IO.mapOptional("AlignConsecutiveDeclarations",
262                    Style.AlignConsecutiveDeclarations);
263     IO.mapOptional("AlignEscapedNewlines", Style.AlignEscapedNewlines);
264     IO.mapOptional("AlignOperands", Style.AlignOperands);
265     IO.mapOptional("AlignTrailingComments", Style.AlignTrailingComments);
266     IO.mapOptional("AllowAllParametersOfDeclarationOnNextLine",
267                    Style.AllowAllParametersOfDeclarationOnNextLine);
268     IO.mapOptional("AllowShortBlocksOnASingleLine",
269                    Style.AllowShortBlocksOnASingleLine);
270     IO.mapOptional("AllowShortCaseLabelsOnASingleLine",
271                    Style.AllowShortCaseLabelsOnASingleLine);
272     IO.mapOptional("AllowShortFunctionsOnASingleLine",
273                    Style.AllowShortFunctionsOnASingleLine);
274     IO.mapOptional("AllowShortIfStatementsOnASingleLine",
275                    Style.AllowShortIfStatementsOnASingleLine);
276     IO.mapOptional("AllowShortLoopsOnASingleLine",
277                    Style.AllowShortLoopsOnASingleLine);
278     IO.mapOptional("AlwaysBreakAfterDefinitionReturnType",
279                    Style.AlwaysBreakAfterDefinitionReturnType);
280     IO.mapOptional("AlwaysBreakAfterReturnType",
281                    Style.AlwaysBreakAfterReturnType);
282     // If AlwaysBreakAfterDefinitionReturnType was specified but
283     // AlwaysBreakAfterReturnType was not, initialize the latter from the
284     // former for backwards compatibility.
285     if (Style.AlwaysBreakAfterDefinitionReturnType != FormatStyle::DRTBS_None &&
286         Style.AlwaysBreakAfterReturnType == FormatStyle::RTBS_None) {
287       if (Style.AlwaysBreakAfterDefinitionReturnType == FormatStyle::DRTBS_All)
288         Style.AlwaysBreakAfterReturnType = FormatStyle::RTBS_AllDefinitions;
289       else if (Style.AlwaysBreakAfterDefinitionReturnType ==
290                FormatStyle::DRTBS_TopLevel)
291         Style.AlwaysBreakAfterReturnType =
292             FormatStyle::RTBS_TopLevelDefinitions;
293     }
294 
295     IO.mapOptional("AlwaysBreakBeforeMultilineStrings",
296                    Style.AlwaysBreakBeforeMultilineStrings);
297     IO.mapOptional("AlwaysBreakTemplateDeclarations",
298                    Style.AlwaysBreakTemplateDeclarations);
299     IO.mapOptional("BinPackArguments", Style.BinPackArguments);
300     IO.mapOptional("BinPackParameters", Style.BinPackParameters);
301     IO.mapOptional("BraceWrapping", Style.BraceWrapping);
302     IO.mapOptional("BreakBeforeBinaryOperators",
303                    Style.BreakBeforeBinaryOperators);
304     IO.mapOptional("BreakBeforeBraces", Style.BreakBeforeBraces);
305     IO.mapOptional("BreakBeforeTernaryOperators",
306                    Style.BreakBeforeTernaryOperators);
307     IO.mapOptional("BreakConstructorInitializersBeforeComma",
308                    Style.BreakConstructorInitializersBeforeComma);
309     IO.mapOptional("BreakAfterJavaFieldAnnotations",
310                    Style.BreakAfterJavaFieldAnnotations);
311     IO.mapOptional("BreakStringLiterals", Style.BreakStringLiterals);
312     IO.mapOptional("ColumnLimit", Style.ColumnLimit);
313     IO.mapOptional("CommentPragmas", Style.CommentPragmas);
314     IO.mapOptional("BreakBeforeInheritanceComma",
315                    Style.BreakBeforeInheritanceComma);
316     IO.mapOptional("ConstructorInitializerAllOnOneLineOrOnePerLine",
317                    Style.ConstructorInitializerAllOnOneLineOrOnePerLine);
318     IO.mapOptional("ConstructorInitializerIndentWidth",
319                    Style.ConstructorInitializerIndentWidth);
320     IO.mapOptional("ContinuationIndentWidth", Style.ContinuationIndentWidth);
321     IO.mapOptional("Cpp11BracedListStyle", Style.Cpp11BracedListStyle);
322     IO.mapOptional("DerivePointerAlignment", Style.DerivePointerAlignment);
323     IO.mapOptional("DisableFormat", Style.DisableFormat);
324     IO.mapOptional("ExperimentalAutoDetectBinPacking",
325                    Style.ExperimentalAutoDetectBinPacking);
326     IO.mapOptional("FixNamespaceComments", Style.FixNamespaceComments);
327     IO.mapOptional("ForEachMacros", Style.ForEachMacros);
328     IO.mapOptional("IncludeCategories", Style.IncludeCategories);
329     IO.mapOptional("IncludeIsMainRegex", Style.IncludeIsMainRegex);
330     IO.mapOptional("IndentCaseLabels", Style.IndentCaseLabels);
331     IO.mapOptional("IndentWidth", Style.IndentWidth);
332     IO.mapOptional("IndentWrappedFunctionNames",
333                    Style.IndentWrappedFunctionNames);
334     IO.mapOptional("JavaScriptQuotes", Style.JavaScriptQuotes);
335     IO.mapOptional("JavaScriptWrapImports", Style.JavaScriptWrapImports);
336     IO.mapOptional("KeepEmptyLinesAtTheStartOfBlocks",
337                    Style.KeepEmptyLinesAtTheStartOfBlocks);
338     IO.mapOptional("MacroBlockBegin", Style.MacroBlockBegin);
339     IO.mapOptional("MacroBlockEnd", Style.MacroBlockEnd);
340     IO.mapOptional("MaxEmptyLinesToKeep", Style.MaxEmptyLinesToKeep);
341     IO.mapOptional("NamespaceIndentation", Style.NamespaceIndentation);
342     IO.mapOptional("ObjCBlockIndentWidth", Style.ObjCBlockIndentWidth);
343     IO.mapOptional("ObjCSpaceAfterProperty", Style.ObjCSpaceAfterProperty);
344     IO.mapOptional("ObjCSpaceBeforeProtocolList",
345                    Style.ObjCSpaceBeforeProtocolList);
346     IO.mapOptional("PenaltyBreakBeforeFirstCallParameter",
347                    Style.PenaltyBreakBeforeFirstCallParameter);
348     IO.mapOptional("PenaltyBreakComment", Style.PenaltyBreakComment);
349     IO.mapOptional("PenaltyBreakFirstLessLess",
350                    Style.PenaltyBreakFirstLessLess);
351     IO.mapOptional("PenaltyBreakString", Style.PenaltyBreakString);
352     IO.mapOptional("PenaltyExcessCharacter", Style.PenaltyExcessCharacter);
353     IO.mapOptional("PenaltyReturnTypeOnItsOwnLine",
354                    Style.PenaltyReturnTypeOnItsOwnLine);
355     IO.mapOptional("PointerAlignment", Style.PointerAlignment);
356     IO.mapOptional("ReflowComments", Style.ReflowComments);
357     IO.mapOptional("SortIncludes", Style.SortIncludes);
358     IO.mapOptional("SpaceAfterCStyleCast", Style.SpaceAfterCStyleCast);
359     IO.mapOptional("SpaceAfterTemplateKeyword", Style.SpaceAfterTemplateKeyword);
360     IO.mapOptional("SpaceBeforeAssignmentOperators",
361                    Style.SpaceBeforeAssignmentOperators);
362     IO.mapOptional("SpaceBeforeParens", Style.SpaceBeforeParens);
363     IO.mapOptional("SpaceInEmptyParentheses", Style.SpaceInEmptyParentheses);
364     IO.mapOptional("SpacesBeforeTrailingComments",
365                    Style.SpacesBeforeTrailingComments);
366     IO.mapOptional("SpacesInAngles", Style.SpacesInAngles);
367     IO.mapOptional("SpacesInContainerLiterals",
368                    Style.SpacesInContainerLiterals);
369     IO.mapOptional("SpacesInCStyleCastParentheses",
370                    Style.SpacesInCStyleCastParentheses);
371     IO.mapOptional("SpacesInParentheses", Style.SpacesInParentheses);
372     IO.mapOptional("SpacesInSquareBrackets", Style.SpacesInSquareBrackets);
373     IO.mapOptional("Standard", Style.Standard);
374     IO.mapOptional("TabWidth", Style.TabWidth);
375     IO.mapOptional("UseTab", Style.UseTab);
376   }
377 };
378 
379 template <> struct MappingTraits<FormatStyle::BraceWrappingFlags> {
380   static void mapping(IO &IO, FormatStyle::BraceWrappingFlags &Wrapping) {
381     IO.mapOptional("AfterClass", Wrapping.AfterClass);
382     IO.mapOptional("AfterControlStatement", Wrapping.AfterControlStatement);
383     IO.mapOptional("AfterEnum", Wrapping.AfterEnum);
384     IO.mapOptional("AfterFunction", Wrapping.AfterFunction);
385     IO.mapOptional("AfterNamespace", Wrapping.AfterNamespace);
386     IO.mapOptional("AfterObjCDeclaration", Wrapping.AfterObjCDeclaration);
387     IO.mapOptional("AfterStruct", Wrapping.AfterStruct);
388     IO.mapOptional("AfterUnion", Wrapping.AfterUnion);
389     IO.mapOptional("BeforeCatch", Wrapping.BeforeCatch);
390     IO.mapOptional("BeforeElse", Wrapping.BeforeElse);
391     IO.mapOptional("IndentBraces", Wrapping.IndentBraces);
392   }
393 };
394 
395 template <> struct MappingTraits<FormatStyle::IncludeCategory> {
396   static void mapping(IO &IO, FormatStyle::IncludeCategory &Category) {
397     IO.mapOptional("Regex", Category.Regex);
398     IO.mapOptional("Priority", Category.Priority);
399   }
400 };
401 
402 // Allows to read vector<FormatStyle> while keeping default values.
403 // IO.getContext() should contain a pointer to the FormatStyle structure, that
404 // will be used to get default values for missing keys.
405 // If the first element has no Language specified, it will be treated as the
406 // default one for the following elements.
407 template <> struct DocumentListTraits<std::vector<FormatStyle>> {
408   static size_t size(IO &IO, std::vector<FormatStyle> &Seq) {
409     return Seq.size();
410   }
411   static FormatStyle &element(IO &IO, std::vector<FormatStyle> &Seq,
412                               size_t Index) {
413     if (Index >= Seq.size()) {
414       assert(Index == Seq.size());
415       FormatStyle Template;
416       if (Seq.size() > 0 && Seq[0].Language == FormatStyle::LK_None) {
417         Template = Seq[0];
418       } else {
419         Template = *((const FormatStyle *)IO.getContext());
420         Template.Language = FormatStyle::LK_None;
421       }
422       Seq.resize(Index + 1, Template);
423     }
424     return Seq[Index];
425   }
426 };
427 } // namespace yaml
428 } // namespace llvm
429 
430 namespace clang {
431 namespace format {
432 
433 const std::error_category &getParseCategory() {
434   static ParseErrorCategory C;
435   return C;
436 }
437 std::error_code make_error_code(ParseError e) {
438   return std::error_code(static_cast<int>(e), getParseCategory());
439 }
440 
441 inline llvm::Error make_string_error(const llvm::Twine &Message) {
442   return llvm::make_error<llvm::StringError>(Message,
443                                              llvm::inconvertibleErrorCode());
444 }
445 
446 const char *ParseErrorCategory::name() const noexcept {
447   return "clang-format.parse_error";
448 }
449 
450 std::string ParseErrorCategory::message(int EV) const {
451   switch (static_cast<ParseError>(EV)) {
452   case ParseError::Success:
453     return "Success";
454   case ParseError::Error:
455     return "Invalid argument";
456   case ParseError::Unsuitable:
457     return "Unsuitable";
458   }
459   llvm_unreachable("unexpected parse error");
460 }
461 
462 static FormatStyle expandPresets(const FormatStyle &Style) {
463   if (Style.BreakBeforeBraces == FormatStyle::BS_Custom)
464     return Style;
465   FormatStyle Expanded = Style;
466   Expanded.BraceWrapping = {false, false, false, false, false, false,
467                             false, false, false, false, false};
468   switch (Style.BreakBeforeBraces) {
469   case FormatStyle::BS_Linux:
470     Expanded.BraceWrapping.AfterClass = true;
471     Expanded.BraceWrapping.AfterFunction = true;
472     Expanded.BraceWrapping.AfterNamespace = true;
473     break;
474   case FormatStyle::BS_Mozilla:
475     Expanded.BraceWrapping.AfterClass = true;
476     Expanded.BraceWrapping.AfterEnum = true;
477     Expanded.BraceWrapping.AfterFunction = true;
478     Expanded.BraceWrapping.AfterStruct = true;
479     Expanded.BraceWrapping.AfterUnion = true;
480     break;
481   case FormatStyle::BS_Stroustrup:
482     Expanded.BraceWrapping.AfterFunction = true;
483     Expanded.BraceWrapping.BeforeCatch = true;
484     Expanded.BraceWrapping.BeforeElse = true;
485     break;
486   case FormatStyle::BS_Allman:
487     Expanded.BraceWrapping.AfterClass = true;
488     Expanded.BraceWrapping.AfterControlStatement = true;
489     Expanded.BraceWrapping.AfterEnum = true;
490     Expanded.BraceWrapping.AfterFunction = true;
491     Expanded.BraceWrapping.AfterNamespace = true;
492     Expanded.BraceWrapping.AfterObjCDeclaration = true;
493     Expanded.BraceWrapping.AfterStruct = true;
494     Expanded.BraceWrapping.BeforeCatch = true;
495     Expanded.BraceWrapping.BeforeElse = true;
496     break;
497   case FormatStyle::BS_GNU:
498     Expanded.BraceWrapping = {true, true, true, true, true, true,
499                               true, true, true, true, true};
500     break;
501   case FormatStyle::BS_WebKit:
502     Expanded.BraceWrapping.AfterFunction = true;
503     break;
504   default:
505     break;
506   }
507   return Expanded;
508 }
509 
510 FormatStyle getLLVMStyle() {
511   FormatStyle LLVMStyle;
512   LLVMStyle.Language = FormatStyle::LK_Cpp;
513   LLVMStyle.AccessModifierOffset = -2;
514   LLVMStyle.AlignEscapedNewlines = FormatStyle::ENAS_Right;
515   LLVMStyle.AlignAfterOpenBracket = FormatStyle::BAS_Align;
516   LLVMStyle.AlignOperands = true;
517   LLVMStyle.AlignTrailingComments = true;
518   LLVMStyle.AlignConsecutiveAssignments = false;
519   LLVMStyle.AlignConsecutiveDeclarations = false;
520   LLVMStyle.AllowAllParametersOfDeclarationOnNextLine = true;
521   LLVMStyle.AllowShortFunctionsOnASingleLine = FormatStyle::SFS_All;
522   LLVMStyle.AllowShortBlocksOnASingleLine = false;
523   LLVMStyle.AllowShortCaseLabelsOnASingleLine = false;
524   LLVMStyle.AllowShortIfStatementsOnASingleLine = false;
525   LLVMStyle.AllowShortLoopsOnASingleLine = false;
526   LLVMStyle.AlwaysBreakAfterReturnType = FormatStyle::RTBS_None;
527   LLVMStyle.AlwaysBreakAfterDefinitionReturnType = FormatStyle::DRTBS_None;
528   LLVMStyle.AlwaysBreakBeforeMultilineStrings = false;
529   LLVMStyle.AlwaysBreakTemplateDeclarations = false;
530   LLVMStyle.BinPackParameters = true;
531   LLVMStyle.BinPackArguments = true;
532   LLVMStyle.BreakBeforeBinaryOperators = FormatStyle::BOS_None;
533   LLVMStyle.BreakBeforeTernaryOperators = true;
534   LLVMStyle.BreakBeforeBraces = FormatStyle::BS_Attach;
535   LLVMStyle.BraceWrapping = {false, false, false, false, false, false,
536                              false, false, false, false, false};
537   LLVMStyle.BreakAfterJavaFieldAnnotations = false;
538   LLVMStyle.BreakConstructorInitializersBeforeComma = false;
539   LLVMStyle.BreakBeforeInheritanceComma = false;
540   LLVMStyle.BreakStringLiterals = true;
541   LLVMStyle.ColumnLimit = 80;
542   LLVMStyle.CommentPragmas = "^ IWYU pragma:";
543   LLVMStyle.ConstructorInitializerAllOnOneLineOrOnePerLine = false;
544   LLVMStyle.ConstructorInitializerIndentWidth = 4;
545   LLVMStyle.ContinuationIndentWidth = 4;
546   LLVMStyle.Cpp11BracedListStyle = true;
547   LLVMStyle.DerivePointerAlignment = false;
548   LLVMStyle.ExperimentalAutoDetectBinPacking = false;
549   LLVMStyle.FixNamespaceComments = true;
550   LLVMStyle.ForEachMacros.push_back("foreach");
551   LLVMStyle.ForEachMacros.push_back("Q_FOREACH");
552   LLVMStyle.ForEachMacros.push_back("BOOST_FOREACH");
553   LLVMStyle.IncludeCategories = {{"^\"(llvm|llvm-c|clang|clang-c)/", 2},
554                                  {"^(<|\"(gtest|isl|json)/)", 3},
555                                  {".*", 1}};
556   LLVMStyle.IncludeIsMainRegex = "$";
557   LLVMStyle.IndentCaseLabels = false;
558   LLVMStyle.IndentWrappedFunctionNames = false;
559   LLVMStyle.IndentWidth = 2;
560   LLVMStyle.JavaScriptQuotes = FormatStyle::JSQS_Leave;
561   LLVMStyle.JavaScriptWrapImports = true;
562   LLVMStyle.TabWidth = 8;
563   LLVMStyle.MaxEmptyLinesToKeep = 1;
564   LLVMStyle.KeepEmptyLinesAtTheStartOfBlocks = true;
565   LLVMStyle.NamespaceIndentation = FormatStyle::NI_None;
566   LLVMStyle.ObjCBlockIndentWidth = 2;
567   LLVMStyle.ObjCSpaceAfterProperty = false;
568   LLVMStyle.ObjCSpaceBeforeProtocolList = true;
569   LLVMStyle.PointerAlignment = FormatStyle::PAS_Right;
570   LLVMStyle.SpacesBeforeTrailingComments = 1;
571   LLVMStyle.Standard = FormatStyle::LS_Cpp11;
572   LLVMStyle.UseTab = FormatStyle::UT_Never;
573   LLVMStyle.ReflowComments = true;
574   LLVMStyle.SpacesInParentheses = false;
575   LLVMStyle.SpacesInSquareBrackets = false;
576   LLVMStyle.SpaceInEmptyParentheses = false;
577   LLVMStyle.SpacesInContainerLiterals = true;
578   LLVMStyle.SpacesInCStyleCastParentheses = false;
579   LLVMStyle.SpaceAfterCStyleCast = false;
580   LLVMStyle.SpaceAfterTemplateKeyword = true;
581   LLVMStyle.SpaceBeforeParens = FormatStyle::SBPO_ControlStatements;
582   LLVMStyle.SpaceBeforeAssignmentOperators = true;
583   LLVMStyle.SpacesInAngles = false;
584 
585   LLVMStyle.PenaltyBreakComment = 300;
586   LLVMStyle.PenaltyBreakFirstLessLess = 120;
587   LLVMStyle.PenaltyBreakString = 1000;
588   LLVMStyle.PenaltyExcessCharacter = 1000000;
589   LLVMStyle.PenaltyReturnTypeOnItsOwnLine = 60;
590   LLVMStyle.PenaltyBreakBeforeFirstCallParameter = 19;
591 
592   LLVMStyle.DisableFormat = false;
593   LLVMStyle.SortIncludes = true;
594 
595   return LLVMStyle;
596 }
597 
598 FormatStyle getGoogleStyle(FormatStyle::LanguageKind Language) {
599   FormatStyle GoogleStyle = getLLVMStyle();
600   GoogleStyle.Language = Language;
601 
602   GoogleStyle.AccessModifierOffset = -1;
603   GoogleStyle.AlignEscapedNewlines = FormatStyle::ENAS_Left;
604   GoogleStyle.AllowShortIfStatementsOnASingleLine = true;
605   GoogleStyle.AllowShortLoopsOnASingleLine = true;
606   GoogleStyle.AlwaysBreakBeforeMultilineStrings = true;
607   GoogleStyle.AlwaysBreakTemplateDeclarations = true;
608   GoogleStyle.ConstructorInitializerAllOnOneLineOrOnePerLine = true;
609   GoogleStyle.DerivePointerAlignment = true;
610   GoogleStyle.IncludeCategories = {{"^<.*\\.h>", 1}, {"^<.*", 2}, {".*", 3}};
611   GoogleStyle.IncludeIsMainRegex = "([-_](test|unittest))?$";
612   GoogleStyle.IndentCaseLabels = true;
613   GoogleStyle.KeepEmptyLinesAtTheStartOfBlocks = false;
614   GoogleStyle.ObjCSpaceAfterProperty = false;
615   GoogleStyle.ObjCSpaceBeforeProtocolList = false;
616   GoogleStyle.PointerAlignment = FormatStyle::PAS_Left;
617   GoogleStyle.SpacesBeforeTrailingComments = 2;
618   GoogleStyle.Standard = FormatStyle::LS_Auto;
619 
620   GoogleStyle.PenaltyReturnTypeOnItsOwnLine = 200;
621   GoogleStyle.PenaltyBreakBeforeFirstCallParameter = 1;
622 
623   if (Language == FormatStyle::LK_Java) {
624     GoogleStyle.AlignAfterOpenBracket = FormatStyle::BAS_DontAlign;
625     GoogleStyle.AlignOperands = false;
626     GoogleStyle.AlignTrailingComments = false;
627     GoogleStyle.AllowShortFunctionsOnASingleLine = FormatStyle::SFS_Empty;
628     GoogleStyle.AllowShortIfStatementsOnASingleLine = false;
629     GoogleStyle.AlwaysBreakBeforeMultilineStrings = false;
630     GoogleStyle.BreakBeforeBinaryOperators = FormatStyle::BOS_NonAssignment;
631     GoogleStyle.ColumnLimit = 100;
632     GoogleStyle.SpaceAfterCStyleCast = true;
633     GoogleStyle.SpacesBeforeTrailingComments = 1;
634   } else if (Language == FormatStyle::LK_JavaScript) {
635     GoogleStyle.AlignAfterOpenBracket = FormatStyle::BAS_AlwaysBreak;
636     GoogleStyle.AlignOperands = false;
637     GoogleStyle.AllowShortFunctionsOnASingleLine = FormatStyle::SFS_Empty;
638     GoogleStyle.AlwaysBreakBeforeMultilineStrings = false;
639     GoogleStyle.BreakBeforeTernaryOperators = false;
640     // taze:, triple slash directives (`/// <...`), @tag followed by { for a lot
641     // of JSDoc tags, and @see, which is commonly followed by overlong URLs.
642     GoogleStyle.CommentPragmas =
643         "(taze:|^/[ \t]*<|(@[A-Za-z_0-9-]+[ \\t]*{)|@see)";
644     GoogleStyle.MaxEmptyLinesToKeep = 3;
645     GoogleStyle.NamespaceIndentation = FormatStyle::NI_All;
646     GoogleStyle.SpacesInContainerLiterals = false;
647     GoogleStyle.JavaScriptQuotes = FormatStyle::JSQS_Single;
648     GoogleStyle.JavaScriptWrapImports = false;
649   } else if (Language == FormatStyle::LK_Proto) {
650     GoogleStyle.AllowShortFunctionsOnASingleLine = FormatStyle::SFS_None;
651     GoogleStyle.SpacesInContainerLiterals = false;
652   } else if (Language == FormatStyle::LK_ObjC) {
653     GoogleStyle.ColumnLimit = 100;
654   }
655 
656   return GoogleStyle;
657 }
658 
659 FormatStyle getChromiumStyle(FormatStyle::LanguageKind Language) {
660   FormatStyle ChromiumStyle = getGoogleStyle(Language);
661   if (Language == FormatStyle::LK_Java) {
662     ChromiumStyle.AllowShortIfStatementsOnASingleLine = true;
663     ChromiumStyle.BreakAfterJavaFieldAnnotations = true;
664     ChromiumStyle.ContinuationIndentWidth = 8;
665     ChromiumStyle.IndentWidth = 4;
666   } else if (Language == FormatStyle::LK_JavaScript) {
667     ChromiumStyle.AllowShortIfStatementsOnASingleLine = false;
668     ChromiumStyle.AllowShortLoopsOnASingleLine = false;
669   } else {
670     ChromiumStyle.AllowAllParametersOfDeclarationOnNextLine = false;
671     ChromiumStyle.AllowShortFunctionsOnASingleLine = FormatStyle::SFS_Inline;
672     ChromiumStyle.AllowShortIfStatementsOnASingleLine = false;
673     ChromiumStyle.AllowShortLoopsOnASingleLine = false;
674     ChromiumStyle.BinPackParameters = false;
675     ChromiumStyle.DerivePointerAlignment = false;
676     if (Language == FormatStyle::LK_ObjC)
677       ChromiumStyle.ColumnLimit = 80;
678   }
679   return ChromiumStyle;
680 }
681 
682 FormatStyle getMozillaStyle() {
683   FormatStyle MozillaStyle = getLLVMStyle();
684   MozillaStyle.AllowAllParametersOfDeclarationOnNextLine = false;
685   MozillaStyle.AllowShortFunctionsOnASingleLine = FormatStyle::SFS_Inline;
686   MozillaStyle.AlwaysBreakAfterReturnType =
687       FormatStyle::RTBS_TopLevel;
688   MozillaStyle.AlwaysBreakAfterDefinitionReturnType =
689       FormatStyle::DRTBS_TopLevel;
690   MozillaStyle.AlwaysBreakTemplateDeclarations = true;
691   MozillaStyle.BinPackParameters = false;
692   MozillaStyle.BinPackArguments = false;
693   MozillaStyle.BreakBeforeBraces = FormatStyle::BS_Mozilla;
694   MozillaStyle.BreakConstructorInitializersBeforeComma = true;
695   MozillaStyle.BreakBeforeInheritanceComma = true;
696   MozillaStyle.ConstructorInitializerIndentWidth = 2;
697   MozillaStyle.ContinuationIndentWidth = 2;
698   MozillaStyle.Cpp11BracedListStyle = false;
699   MozillaStyle.FixNamespaceComments = false;
700   MozillaStyle.IndentCaseLabels = true;
701   MozillaStyle.ObjCSpaceAfterProperty = true;
702   MozillaStyle.ObjCSpaceBeforeProtocolList = false;
703   MozillaStyle.PenaltyReturnTypeOnItsOwnLine = 200;
704   MozillaStyle.PointerAlignment = FormatStyle::PAS_Left;
705   MozillaStyle.SpaceAfterTemplateKeyword = false;
706   return MozillaStyle;
707 }
708 
709 FormatStyle getWebKitStyle() {
710   FormatStyle Style = getLLVMStyle();
711   Style.AccessModifierOffset = -4;
712   Style.AlignAfterOpenBracket = FormatStyle::BAS_DontAlign;
713   Style.AlignOperands = false;
714   Style.AlignTrailingComments = false;
715   Style.BreakBeforeBinaryOperators = FormatStyle::BOS_All;
716   Style.BreakBeforeBraces = FormatStyle::BS_WebKit;
717   Style.BreakConstructorInitializersBeforeComma = true;
718   Style.Cpp11BracedListStyle = false;
719   Style.ColumnLimit = 0;
720   Style.FixNamespaceComments = false;
721   Style.IndentWidth = 4;
722   Style.NamespaceIndentation = FormatStyle::NI_Inner;
723   Style.ObjCBlockIndentWidth = 4;
724   Style.ObjCSpaceAfterProperty = true;
725   Style.PointerAlignment = FormatStyle::PAS_Left;
726   return Style;
727 }
728 
729 FormatStyle getGNUStyle() {
730   FormatStyle Style = getLLVMStyle();
731   Style.AlwaysBreakAfterDefinitionReturnType = FormatStyle::DRTBS_All;
732   Style.AlwaysBreakAfterReturnType = FormatStyle::RTBS_AllDefinitions;
733   Style.BreakBeforeBinaryOperators = FormatStyle::BOS_All;
734   Style.BreakBeforeBraces = FormatStyle::BS_GNU;
735   Style.BreakBeforeTernaryOperators = true;
736   Style.Cpp11BracedListStyle = false;
737   Style.ColumnLimit = 79;
738   Style.FixNamespaceComments = false;
739   Style.SpaceBeforeParens = FormatStyle::SBPO_Always;
740   Style.Standard = FormatStyle::LS_Cpp03;
741   return Style;
742 }
743 
744 FormatStyle getNoStyle() {
745   FormatStyle NoStyle = getLLVMStyle();
746   NoStyle.DisableFormat = true;
747   NoStyle.SortIncludes = false;
748   return NoStyle;
749 }
750 
751 bool getPredefinedStyle(StringRef Name, FormatStyle::LanguageKind Language,
752                         FormatStyle *Style) {
753   if (Name.equals_lower("llvm")) {
754     *Style = getLLVMStyle();
755   } else if (Name.equals_lower("chromium")) {
756     *Style = getChromiumStyle(Language);
757   } else if (Name.equals_lower("mozilla")) {
758     *Style = getMozillaStyle();
759   } else if (Name.equals_lower("google")) {
760     *Style = getGoogleStyle(Language);
761   } else if (Name.equals_lower("webkit")) {
762     *Style = getWebKitStyle();
763   } else if (Name.equals_lower("gnu")) {
764     *Style = getGNUStyle();
765   } else if (Name.equals_lower("none")) {
766     *Style = getNoStyle();
767   } else {
768     return false;
769   }
770 
771   Style->Language = Language;
772   return true;
773 }
774 
775 std::error_code parseConfiguration(StringRef Text, FormatStyle *Style) {
776   assert(Style);
777   FormatStyle::LanguageKind Language = Style->Language;
778   assert(Language != FormatStyle::LK_None);
779   if (Text.trim().empty())
780     return make_error_code(ParseError::Error);
781 
782   std::vector<FormatStyle> Styles;
783   llvm::yaml::Input Input(Text);
784   // DocumentListTraits<vector<FormatStyle>> uses the context to get default
785   // values for the fields, keys for which are missing from the configuration.
786   // Mapping also uses the context to get the language to find the correct
787   // base style.
788   Input.setContext(Style);
789   Input >> Styles;
790   if (Input.error())
791     return Input.error();
792 
793   for (unsigned i = 0; i < Styles.size(); ++i) {
794     // Ensures that only the first configuration can skip the Language option.
795     if (Styles[i].Language == FormatStyle::LK_None && i != 0)
796       return make_error_code(ParseError::Error);
797     // Ensure that each language is configured at most once.
798     for (unsigned j = 0; j < i; ++j) {
799       if (Styles[i].Language == Styles[j].Language) {
800         DEBUG(llvm::dbgs()
801               << "Duplicate languages in the config file on positions " << j
802               << " and " << i << "\n");
803         return make_error_code(ParseError::Error);
804       }
805     }
806   }
807   // Look for a suitable configuration starting from the end, so we can
808   // find the configuration for the specific language first, and the default
809   // configuration (which can only be at slot 0) after it.
810   for (int i = Styles.size() - 1; i >= 0; --i) {
811     if (Styles[i].Language == Language ||
812         Styles[i].Language == FormatStyle::LK_None) {
813       *Style = Styles[i];
814       Style->Language = Language;
815       return make_error_code(ParseError::Success);
816     }
817   }
818   return make_error_code(ParseError::Unsuitable);
819 }
820 
821 std::string configurationAsText(const FormatStyle &Style) {
822   std::string Text;
823   llvm::raw_string_ostream Stream(Text);
824   llvm::yaml::Output Output(Stream);
825   // We use the same mapping method for input and output, so we need a non-const
826   // reference here.
827   FormatStyle NonConstStyle = expandPresets(Style);
828   Output << NonConstStyle;
829   return Stream.str();
830 }
831 
832 namespace {
833 
834 class JavaScriptRequoter : public TokenAnalyzer {
835 public:
836   JavaScriptRequoter(const Environment &Env, const FormatStyle &Style)
837       : TokenAnalyzer(Env, Style) {}
838 
839   tooling::Replacements
840   analyze(TokenAnnotator &Annotator,
841           SmallVectorImpl<AnnotatedLine *> &AnnotatedLines,
842           FormatTokenLexer &Tokens) override {
843     AffectedRangeMgr.computeAffectedLines(AnnotatedLines.begin(),
844                                           AnnotatedLines.end());
845     tooling::Replacements Result;
846     requoteJSStringLiteral(AnnotatedLines, Result);
847     return Result;
848   }
849 
850 private:
851   // Replaces double/single-quoted string literal as appropriate, re-escaping
852   // the contents in the process.
853   void requoteJSStringLiteral(SmallVectorImpl<AnnotatedLine *> &Lines,
854                               tooling::Replacements &Result) {
855     for (AnnotatedLine *Line : Lines) {
856       requoteJSStringLiteral(Line->Children, Result);
857       if (!Line->Affected)
858         continue;
859       for (FormatToken *FormatTok = Line->First; FormatTok;
860            FormatTok = FormatTok->Next) {
861         StringRef Input = FormatTok->TokenText;
862         if (FormatTok->Finalized || !FormatTok->isStringLiteral() ||
863             // NB: testing for not starting with a double quote to avoid
864             // breaking `template strings`.
865             (Style.JavaScriptQuotes == FormatStyle::JSQS_Single &&
866              !Input.startswith("\"")) ||
867             (Style.JavaScriptQuotes == FormatStyle::JSQS_Double &&
868              !Input.startswith("\'")))
869           continue;
870 
871         // Change start and end quote.
872         bool IsSingle = Style.JavaScriptQuotes == FormatStyle::JSQS_Single;
873         SourceLocation Start = FormatTok->Tok.getLocation();
874         auto Replace = [&](SourceLocation Start, unsigned Length,
875                            StringRef ReplacementText) {
876           auto Err = Result.add(tooling::Replacement(
877               Env.getSourceManager(), Start, Length, ReplacementText));
878           // FIXME: handle error. For now, print error message and skip the
879           // replacement for release version.
880           if (Err) {
881             llvm::errs() << llvm::toString(std::move(Err)) << "\n";
882             assert(false);
883           }
884         };
885         Replace(Start, 1, IsSingle ? "'" : "\"");
886         Replace(FormatTok->Tok.getEndLoc().getLocWithOffset(-1), 1,
887                 IsSingle ? "'" : "\"");
888 
889         // Escape internal quotes.
890         bool Escaped = false;
891         for (size_t i = 1; i < Input.size() - 1; i++) {
892           switch (Input[i]) {
893           case '\\':
894             if (!Escaped && i + 1 < Input.size() &&
895                 ((IsSingle && Input[i + 1] == '"') ||
896                  (!IsSingle && Input[i + 1] == '\''))) {
897               // Remove this \, it's escaping a " or ' that no longer needs
898               // escaping
899               Replace(Start.getLocWithOffset(i), 1, "");
900               continue;
901             }
902             Escaped = !Escaped;
903             break;
904           case '\"':
905           case '\'':
906             if (!Escaped && IsSingle == (Input[i] == '\'')) {
907               // Escape the quote.
908               Replace(Start.getLocWithOffset(i), 0, "\\");
909             }
910             Escaped = false;
911             break;
912           default:
913             Escaped = false;
914             break;
915           }
916         }
917       }
918     }
919   }
920 };
921 
922 class Formatter : public TokenAnalyzer {
923 public:
924   Formatter(const Environment &Env, const FormatStyle &Style,
925             FormattingAttemptStatus *Status)
926       : TokenAnalyzer(Env, Style), Status(Status) {}
927 
928   tooling::Replacements
929   analyze(TokenAnnotator &Annotator,
930           SmallVectorImpl<AnnotatedLine *> &AnnotatedLines,
931           FormatTokenLexer &Tokens) override {
932     tooling::Replacements Result;
933     deriveLocalStyle(AnnotatedLines);
934     AffectedRangeMgr.computeAffectedLines(AnnotatedLines.begin(),
935                                           AnnotatedLines.end());
936     for (unsigned i = 0, e = AnnotatedLines.size(); i != e; ++i) {
937       Annotator.calculateFormattingInformation(*AnnotatedLines[i]);
938     }
939     Annotator.setCommentLineLevels(AnnotatedLines);
940 
941     WhitespaceManager Whitespaces(
942         Env.getSourceManager(), Style,
943         inputUsesCRLF(Env.getSourceManager().getBufferData(Env.getFileID())));
944     ContinuationIndenter Indenter(Style, Tokens.getKeywords(),
945                                   Env.getSourceManager(), Whitespaces, Encoding,
946                                   BinPackInconclusiveFunctions);
947     UnwrappedLineFormatter(&Indenter, &Whitespaces, Style, Tokens.getKeywords(),
948                            Env.getSourceManager(), Status)
949         .format(AnnotatedLines);
950     for (const auto &R : Whitespaces.generateReplacements())
951       if (Result.add(R))
952         return Result;
953     return Result;
954   }
955 
956 private:
957 
958   static bool inputUsesCRLF(StringRef Text) {
959     return Text.count('\r') * 2 > Text.count('\n');
960   }
961 
962   bool
963   hasCpp03IncompatibleFormat(const SmallVectorImpl<AnnotatedLine *> &Lines) {
964     for (const AnnotatedLine *Line : Lines) {
965       if (hasCpp03IncompatibleFormat(Line->Children))
966         return true;
967       for (FormatToken *Tok = Line->First->Next; Tok; Tok = Tok->Next) {
968         if (Tok->WhitespaceRange.getBegin() == Tok->WhitespaceRange.getEnd()) {
969           if (Tok->is(tok::coloncolon) && Tok->Previous->is(TT_TemplateOpener))
970             return true;
971           if (Tok->is(TT_TemplateCloser) &&
972               Tok->Previous->is(TT_TemplateCloser))
973             return true;
974         }
975       }
976     }
977     return false;
978   }
979 
980   int countVariableAlignments(const SmallVectorImpl<AnnotatedLine *> &Lines) {
981     int AlignmentDiff = 0;
982     for (const AnnotatedLine *Line : Lines) {
983       AlignmentDiff += countVariableAlignments(Line->Children);
984       for (FormatToken *Tok = Line->First; Tok && Tok->Next; Tok = Tok->Next) {
985         if (!Tok->is(TT_PointerOrReference))
986           continue;
987         bool SpaceBefore =
988             Tok->WhitespaceRange.getBegin() != Tok->WhitespaceRange.getEnd();
989         bool SpaceAfter = Tok->Next->WhitespaceRange.getBegin() !=
990                           Tok->Next->WhitespaceRange.getEnd();
991         if (SpaceBefore && !SpaceAfter)
992           ++AlignmentDiff;
993         if (!SpaceBefore && SpaceAfter)
994           --AlignmentDiff;
995       }
996     }
997     return AlignmentDiff;
998   }
999 
1000   void
1001   deriveLocalStyle(const SmallVectorImpl<AnnotatedLine *> &AnnotatedLines) {
1002     bool HasBinPackedFunction = false;
1003     bool HasOnePerLineFunction = false;
1004     for (unsigned i = 0, e = AnnotatedLines.size(); i != e; ++i) {
1005       if (!AnnotatedLines[i]->First->Next)
1006         continue;
1007       FormatToken *Tok = AnnotatedLines[i]->First->Next;
1008       while (Tok->Next) {
1009         if (Tok->PackingKind == PPK_BinPacked)
1010           HasBinPackedFunction = true;
1011         if (Tok->PackingKind == PPK_OnePerLine)
1012           HasOnePerLineFunction = true;
1013 
1014         Tok = Tok->Next;
1015       }
1016     }
1017     if (Style.DerivePointerAlignment)
1018       Style.PointerAlignment = countVariableAlignments(AnnotatedLines) <= 0
1019                                    ? FormatStyle::PAS_Left
1020                                    : FormatStyle::PAS_Right;
1021     if (Style.Standard == FormatStyle::LS_Auto)
1022       Style.Standard = hasCpp03IncompatibleFormat(AnnotatedLines)
1023                            ? FormatStyle::LS_Cpp11
1024                            : FormatStyle::LS_Cpp03;
1025     BinPackInconclusiveFunctions =
1026         HasBinPackedFunction || !HasOnePerLineFunction;
1027   }
1028 
1029   bool BinPackInconclusiveFunctions;
1030   FormattingAttemptStatus *Status;
1031 };
1032 
// This class cleans up the erroneous/redundant code around the given ranges
// in the file: it removes empty namespaces and redundant tokens (such as a
// doubled comma) by collecting tokens to delete and turning them into
// replacements.
class Cleaner : public TokenAnalyzer {
public:
  Cleaner(const Environment &Env, const FormatStyle &Style)
      : TokenAnalyzer(Env, Style),
        DeletedTokens(FormatTokenLess(Env.getSourceManager())) {}

  // Collects the tokens to delete and returns the replacements removing them.
  // FIXME: eliminate unused parameters.
  tooling::Replacements
  analyze(TokenAnnotator &Annotator,
          SmallVectorImpl<AnnotatedLine *> &AnnotatedLines,
          FormatTokenLexer &Tokens) override {
    // FIXME: in the current implementation the granularity of affected range
    // is an annotated line. However, this is not sufficient. Furthermore,
    // redundant code introduced by replacements does not necessarily
    // intercept with ranges of replacements that result in the redundancy.
    // To determine if some redundant code is actually introduced by
    // replacements(e.g. deletions), we need to come up with a more
    // sophisticated way of computing affected ranges.
    AffectedRangeMgr.computeAffectedLines(AnnotatedLines.begin(),
                                          AnnotatedLines.end());

    checkEmptyNamespace(AnnotatedLines);

    // On every affected line, drop the redundant token of each listed pair:
    // cleanupRight deletes the right token, cleanupLeft the left one.
    for (auto &Line : AnnotatedLines) {
      if (Line->Affected) {
        cleanupRight(Line->First, tok::comma, tok::comma);
        cleanupRight(Line->First, TT_CtorInitializerColon, tok::comma);
        cleanupRight(Line->First, tok::l_paren, tok::comma);
        cleanupLeft(Line->First, tok::comma, tok::r_paren);
        cleanupLeft(Line->First, TT_CtorInitializerComma, tok::l_brace);
        cleanupLeft(Line->First, TT_CtorInitializerColon, tok::l_brace);
        cleanupLeft(Line->First, TT_CtorInitializerColon, tok::equal);
      }
    }

    return generateFixes();
  }

private:
  // Returns true if every token of \p Line is a comment (this includes a line
  // without any tokens).
  bool containsOnlyComments(const AnnotatedLine &Line) {
    for (FormatToken *Tok = Line.First; Tok != nullptr; Tok = Tok->Next) {
      if (Tok->isNot(tok::comment))
        return false;
    }
    return true;
  }

  // Iterate through all lines and remove any empty (nested) namespaces.
  void checkEmptyNamespace(SmallVectorImpl<AnnotatedLine *> &AnnotatedLines) {
    std::set<unsigned> DeletedLines;
    for (unsigned i = 0, e = AnnotatedLines.size(); i != e; ++i) {
      auto &Line = *AnnotatedLines[i];
      if (Line.startsWith(tok::kw_namespace) ||
          Line.startsWith(tok::kw_inline, tok::kw_namespace)) {
        // `i` is passed both by value (the start line) and by reference (as
        // NewLine), so the call moves the loop index to the last line checked.
        checkEmptyNamespace(AnnotatedLines, i, i, DeletedLines);
      }
    }

    // Mark every token on the lines of empty namespaces for deletion.
    for (auto Line : DeletedLines) {
      FormatToken *Tok = AnnotatedLines[Line]->First;
      while (Tok) {
        deleteToken(Tok);
        Tok = Tok->Next;
      }
    }
  }

  // The function checks if the namespace, which starts from \p CurrentLine, and
  // its nested namespaces are empty and delete them if they are empty. It also
  // sets \p NewLine to the last line checked.
  // Returns true if the current namespace is empty.
  bool checkEmptyNamespace(SmallVectorImpl<AnnotatedLine *> &AnnotatedLines,
                           unsigned CurrentLine, unsigned &NewLine,
                           std::set<unsigned> &DeletedLines) {
    unsigned InitLine = CurrentLine, End = AnnotatedLines.size();
    if (Style.BraceWrapping.AfterNamespace) {
      // If the left brace is in a new line, we should consume it first so that
      // it does not make the namespace non-empty.
      // FIXME: error handling if there is no left brace.
      if (!AnnotatedLines[++CurrentLine]->startsWith(tok::l_brace)) {
        NewLine = CurrentLine;
        return false;
      }
    } else if (!AnnotatedLines[CurrentLine]->endsWith(tok::l_brace)) {
      return false;
    }
    // Scan the namespace body until the line starting with the closing brace.
    while (++CurrentLine < End) {
      if (AnnotatedLines[CurrentLine]->startsWith(tok::r_brace))
        break;

      if (AnnotatedLines[CurrentLine]->startsWith(tok::kw_namespace) ||
          AnnotatedLines[CurrentLine]->startsWith(tok::kw_inline,
                                                  tok::kw_namespace)) {
        // A nested namespace keeps this one empty only if it is empty itself.
        if (!checkEmptyNamespace(AnnotatedLines, CurrentLine, NewLine,
                                 DeletedLines))
          return false;
        CurrentLine = NewLine;
        continue;
      }

      if (containsOnlyComments(*AnnotatedLines[CurrentLine]))
        continue;

      // If there is anything other than comments or nested namespaces in the
      // current namespace, the namespace cannot be empty.
      NewLine = CurrentLine;
      return false;
    }

    NewLine = CurrentLine;
    // Ran off the end of the lines without finding the closing brace.
    if (CurrentLine >= End)
      return false;

    // Check if the empty namespace is actually affected by changed ranges.
    if (!AffectedRangeMgr.affectsCharSourceRange(CharSourceRange::getCharRange(
            AnnotatedLines[InitLine]->First->Tok.getLocation(),
            AnnotatedLines[CurrentLine]->Last->Tok.getEndLoc())))
      return false;

    for (unsigned i = InitLine; i <= CurrentLine; ++i) {
      DeletedLines.insert(i);
    }

    return true;
  }

  // Checks pairs {start, start->next},..., {end->previous, end} and deletes one
  // of the token in the pair if the left token has \p LK token kind and the
  // right token has \p RK token kind. If \p DeleteLeft is true, the left token
  // is deleted on match; otherwise, the right token is deleted.
  // Comments and already deleted tokens are skipped when looking for the right
  // token of a pair; on a match, the tokens strictly between the two are
  // deleted as well.
  template <typename LeftKind, typename RightKind>
  void cleanupPair(FormatToken *Start, LeftKind LK, RightKind RK,
                   bool DeleteLeft) {
    // Returns the first token after \p Tok that is neither a comment nor
    // already marked as deleted, or nullptr if there is none.
    auto NextNotDeleted = [this](const FormatToken &Tok) -> FormatToken * {
      for (auto *Res = Tok.Next; Res; Res = Res->Next)
        if (!Res->is(tok::comment) &&
            DeletedTokens.find(Res) == DeletedTokens.end())
          return Res;
      return nullptr;
    };
    for (auto *Left = Start; Left;) {
      auto *Right = NextNotDeleted(*Left);
      if (!Right)
        break;
      if (Left->is(LK) && Right->is(RK)) {
        deleteToken(DeleteLeft ? Left : Right);
        for (auto *Tok = Left->Next; Tok && Tok != Right; Tok = Tok->Next)
          deleteToken(Tok);
        // If the right token is deleted, we should keep the left token
        // unchanged and pair it with the new right token.
        if (!DeleteLeft)
          continue;
      }
      Left = Right;
    }
  }

  // Deletes the left token of every matching (LK, RK) pair; see cleanupPair.
  template <typename LeftKind, typename RightKind>
  void cleanupLeft(FormatToken *Start, LeftKind LK, RightKind RK) {
    cleanupPair(Start, LK, RK, /*DeleteLeft=*/true);
  }

  // Deletes the right token of every matching (LK, RK) pair; see cleanupPair.
  template <typename LeftKind, typename RightKind>
  void cleanupRight(FormatToken *Start, LeftKind LK, RightKind RK) {
    cleanupPair(Start, LK, RK, /*DeleteLeft=*/false);
  }

  // Delete the given token. A null \p Tok is ignored; the token is only
  // recorded in DeletedTokens here, the replacement itself is created by
  // generateFixes().
  inline void deleteToken(FormatToken *Tok) {
    if (Tok)
      DeletedTokens.insert(Tok);
  }

  // Turns the recorded token deletions into replacements with empty text.
  tooling::Replacements generateFixes() {
    tooling::Replacements Fixes;
    std::vector<FormatToken *> Tokens;
    std::copy(DeletedTokens.begin(), DeletedTokens.end(),
              std::back_inserter(Tokens));

    // Merge multiple continuous token deletions into one big deletion so that
    // the number of replacements can be reduced. This makes computing affected
    // ranges more efficient when we run reformat on the changed code.
    unsigned Idx = 0;
    while (Idx < Tokens.size()) {
      // [St, End] is a run of deleted tokens that directly follow each other
      // in the token list.
      unsigned St = Idx, End = Idx;
      while ((End + 1) < Tokens.size() &&
             Tokens[End]->Next == Tokens[End + 1]) {
        End++;
      }
      auto SR = CharSourceRange::getCharRange(Tokens[St]->Tok.getLocation(),
                                              Tokens[End]->Tok.getEndLoc());
      auto Err =
          Fixes.add(tooling::Replacement(Env.getSourceManager(), SR, ""));
      // FIXME: better error handling. for now just print error message and skip
      // for the release version.
      if (Err) {
        llvm::errs() << llvm::toString(std::move(Err)) << "\n";
        assert(false && "Fixes must not conflict!");
      }
      Idx = End + 1;
    }

    return Fixes;
  }

  // Class for less-than inequality comparison for the set `DeletedTokens`.
  // We store tokens in the order they appear in the translation unit so that
  // we do not need to sort them in `generateFixes()`.
  struct FormatTokenLess {
    FormatTokenLess(const SourceManager &SM) : SM(SM) {}

    bool operator()(const FormatToken *LHS, const FormatToken *RHS) const {
      return SM.isBeforeInTranslationUnit(LHS->Tok.getLocation(),
                                          RHS->Tok.getLocation());
    }
    const SourceManager &SM;
  };

  // Tokens to be deleted.
  std::set<FormatToken *, FormatTokenLess> DeletedTokens;
};
1256 
// One #include directive of a block that is sorted by sortCppIncludes().
struct IncludeDirective {
  // Secondary sort key (after Category) when ordering a block of includes.
  StringRef Filename;
  // Text emitted for this directive in the sorted block; directives with
  // equal Text are treated as duplicates.
  StringRef Text;
  // Start offset of the directive; Offset + Text.size() is used as its end.
  unsigned Offset;
  // Primary sort key when ordering a block of includes.
  int Category;
};
1263 
1264 } // end anonymous namespace
1265 
1266 // Determines whether 'Ranges' intersects with ('Start', 'End').
1267 static bool affectsRange(ArrayRef<tooling::Range> Ranges, unsigned Start,
1268                          unsigned End) {
1269   for (auto Range : Ranges) {
1270     if (Range.getOffset() < End &&
1271         Range.getOffset() + Range.getLength() > Start)
1272       return true;
1273   }
1274   return false;
1275 }
1276 
1277 // Returns a pair (Index, OffsetToEOL) describing the position of the cursor
1278 // before sorting/deduplicating. Index is the index of the include under the
1279 // cursor in the original set of includes. If this include has duplicates, it is
1280 // the index of the first of the duplicates as the others are going to be
1281 // removed. OffsetToEOL describes the cursor's position relative to the end of
1282 // its current line.
1283 // If `Cursor` is not on any #include, `Index` will be UINT_MAX.
1284 static std::pair<unsigned, unsigned>
1285 FindCursorIndex(const SmallVectorImpl<IncludeDirective> &Includes,
1286                 const SmallVectorImpl<unsigned> &Indices, unsigned Cursor) {
1287   unsigned CursorIndex = UINT_MAX;
1288   unsigned OffsetToEOL = 0;
1289   for (int i = 0, e = Includes.size(); i != e; ++i) {
1290     unsigned Start = Includes[Indices[i]].Offset;
1291     unsigned End = Start + Includes[Indices[i]].Text.size();
1292     if (!(Cursor >= Start && Cursor < End))
1293       continue;
1294     CursorIndex = Indices[i];
1295     OffsetToEOL = End - Cursor;
1296     // Put the cursor on the only remaining #include among the duplicate
1297     // #includes.
1298     while (--i >= 0 && Includes[CursorIndex].Text == Includes[Indices[i]].Text)
1299       CursorIndex = i;
1300     break;
1301   }
1302   return std::make_pair(CursorIndex, OffsetToEOL);
1303 }
1304 
1305 // Sorts and deduplicate a block of includes given by 'Includes' alphabetically
1306 // adding the necessary replacement to 'Replaces'. 'Includes' must be in strict
1307 // source order.
1308 // #include directives with the same text will be deduplicated, and only the
1309 // first #include in the duplicate #includes remains. If the `Cursor` is
1310 // provided and put on a deleted #include, it will be moved to the remaining
1311 // #include in the duplicate #includes.
1312 static void sortCppIncludes(const FormatStyle &Style,
1313                             const SmallVectorImpl<IncludeDirective> &Includes,
1314                             ArrayRef<tooling::Range> Ranges, StringRef FileName,
1315                             tooling::Replacements &Replaces, unsigned *Cursor) {
1316   unsigned IncludesBeginOffset = Includes.front().Offset;
1317   unsigned IncludesEndOffset =
1318       Includes.back().Offset + Includes.back().Text.size();
1319   unsigned IncludesBlockSize = IncludesEndOffset - IncludesBeginOffset;
1320   if (!affectsRange(Ranges, IncludesBeginOffset, IncludesEndOffset))
1321     return;
1322   SmallVector<unsigned, 16> Indices;
1323   for (unsigned i = 0, e = Includes.size(); i != e; ++i)
1324     Indices.push_back(i);
1325   std::stable_sort(
1326       Indices.begin(), Indices.end(), [&](unsigned LHSI, unsigned RHSI) {
1327         return std::tie(Includes[LHSI].Category, Includes[LHSI].Filename) <
1328                std::tie(Includes[RHSI].Category, Includes[RHSI].Filename);
1329       });
1330   // The index of the include on which the cursor will be put after
1331   // sorting/deduplicating.
1332   unsigned CursorIndex;
1333   // The offset from cursor to the end of line.
1334   unsigned CursorToEOLOffset;
1335   if (Cursor)
1336     std::tie(CursorIndex, CursorToEOLOffset) =
1337         FindCursorIndex(Includes, Indices, *Cursor);
1338 
1339   // Deduplicate #includes.
1340   Indices.erase(std::unique(Indices.begin(), Indices.end(),
1341                             [&](unsigned LHSI, unsigned RHSI) {
1342                               return Includes[LHSI].Text == Includes[RHSI].Text;
1343                             }),
1344                 Indices.end());
1345 
1346   // If the #includes are out of order, we generate a single replacement fixing
1347   // the entire block. Otherwise, no replacement is generated.
1348   if (Indices.size() == Includes.size() &&
1349       std::is_sorted(Indices.begin(), Indices.end()))
1350     return;
1351 
1352   std::string result;
1353   for (unsigned Index : Indices) {
1354     if (!result.empty())
1355       result += "\n";
1356     result += Includes[Index].Text;
1357     if (Cursor && CursorIndex == Index)
1358       *Cursor = IncludesBeginOffset + result.size() - CursorToEOLOffset;
1359   }
1360 
1361   auto Err = Replaces.add(tooling::Replacement(
1362       FileName, Includes.front().Offset, IncludesBlockSize, result));
1363   // FIXME: better error handling. For now, just skip the replacement for the
1364   // release version.
1365   if (Err) {
1366     llvm::errs() << llvm::toString(std::move(Err)) << "\n";
1367     assert(false);
1368   }
1369 }
1370 
1371 namespace {
1372 
1373 // This class manages priorities of #include categories and calculates
1374 // priorities for headers.
1375 class IncludeCategoryManager {
1376 public:
1377   IncludeCategoryManager(const FormatStyle &Style, StringRef FileName)
1378       : Style(Style), FileName(FileName) {
1379     FileStem = llvm::sys::path::stem(FileName);
1380     for (const auto &Category : Style.IncludeCategories)
1381       CategoryRegexs.emplace_back(Category.Regex);
1382     IsMainFile = FileName.endswith(".c") || FileName.endswith(".cc") ||
1383                  FileName.endswith(".cpp") || FileName.endswith(".c++") ||
1384                  FileName.endswith(".cxx") || FileName.endswith(".m") ||
1385                  FileName.endswith(".mm");
1386   }
1387 
1388   // Returns the priority of the category which \p IncludeName belongs to.
1389   // If \p CheckMainHeader is true and \p IncludeName is a main header, returns
1390   // 0. Otherwise, returns the priority of the matching category or INT_MAX.
1391   int getIncludePriority(StringRef IncludeName, bool CheckMainHeader) {
1392     int Ret = INT_MAX;
1393     for (unsigned i = 0, e = CategoryRegexs.size(); i != e; ++i)
1394       if (CategoryRegexs[i].match(IncludeName)) {
1395         Ret = Style.IncludeCategories[i].Priority;
1396         break;
1397       }
1398     if (CheckMainHeader && IsMainFile && Ret > 0 && isMainHeader(IncludeName))
1399       Ret = 0;
1400     return Ret;
1401   }
1402 
1403 private:
1404   bool isMainHeader(StringRef IncludeName) const {
1405     if (!IncludeName.startswith("\""))
1406       return false;
1407     StringRef HeaderStem =
1408         llvm::sys::path::stem(IncludeName.drop_front(1).drop_back(1));
1409     if (FileStem.startswith(HeaderStem)) {
1410       llvm::Regex MainIncludeRegex(
1411           (HeaderStem + Style.IncludeIsMainRegex).str());
1412       if (MainIncludeRegex.match(FileStem))
1413         return true;
1414     }
1415     return false;
1416   }
1417 
1418   const FormatStyle &Style;
1419   bool IsMainFile;
1420   StringRef FileName;
1421   StringRef FileStem;
1422   SmallVector<llvm::Regex, 4> CategoryRegexs;
1423 };
1424 
// Pattern matching a single #include / #import line. Capture group 1 is the
// directive keyword ("import" or "include"); capture group 2 is the header
// name together with its surrounding quotes or angle brackets.
const char IncludeRegexPattern[] =
    R"(^[\t\ ]*#[\t\ ]*(import|include)[^"<]*(["<][^">]*[">]))";
1427 
1428 } // anonymous namespace
1429 
1430 tooling::Replacements sortCppIncludes(const FormatStyle &Style, StringRef Code,
1431                                       ArrayRef<tooling::Range> Ranges,
1432                                       StringRef FileName,
1433                                       tooling::Replacements &Replaces,
1434                                       unsigned *Cursor) {
1435   unsigned Prev = 0;
1436   unsigned SearchFrom = 0;
1437   llvm::Regex IncludeRegex(IncludeRegexPattern);
1438   SmallVector<StringRef, 4> Matches;
1439   SmallVector<IncludeDirective, 16> IncludesInBlock;
1440 
1441   // In compiled files, consider the first #include to be the main #include of
1442   // the file if it is not a system #include. This ensures that the header
1443   // doesn't have hidden dependencies
1444   // (http://llvm.org/docs/CodingStandards.html#include-style).
1445   //
1446   // FIXME: Do some sanity checking, e.g. edit distance of the base name, to fix
1447   // cases where the first #include is unlikely to be the main header.
1448   IncludeCategoryManager Categories(Style, FileName);
1449   bool FirstIncludeBlock = true;
1450   bool MainIncludeFound = false;
1451   bool FormattingOff = false;
1452 
1453   for (;;) {
1454     auto Pos = Code.find('\n', SearchFrom);
1455     StringRef Line =
1456         Code.substr(Prev, (Pos != StringRef::npos ? Pos : Code.size()) - Prev);
1457 
1458     StringRef Trimmed = Line.trim();
1459     if (Trimmed == "// clang-format off")
1460       FormattingOff = true;
1461     else if (Trimmed == "// clang-format on")
1462       FormattingOff = false;
1463 
1464     if (!FormattingOff && !Line.endswith("\\")) {
1465       if (IncludeRegex.match(Line, &Matches)) {
1466         StringRef IncludeName = Matches[2];
1467         int Category = Categories.getIncludePriority(
1468             IncludeName,
1469             /*CheckMainHeader=*/!MainIncludeFound && FirstIncludeBlock);
1470         if (Category == 0)
1471           MainIncludeFound = true;
1472         IncludesInBlock.push_back({IncludeName, Line, Prev, Category});
1473       } else if (!IncludesInBlock.empty()) {
1474         sortCppIncludes(Style, IncludesInBlock, Ranges, FileName, Replaces,
1475                         Cursor);
1476         IncludesInBlock.clear();
1477         FirstIncludeBlock = false;
1478       }
1479       Prev = Pos + 1;
1480     }
1481     if (Pos == StringRef::npos || Pos + 1 == Code.size())
1482       break;
1483     SearchFrom = Pos + 1;
1484   }
1485   if (!IncludesInBlock.empty())
1486     sortCppIncludes(Style, IncludesInBlock, Ranges, FileName, Replaces, Cursor);
1487   return Replaces;
1488 }
1489 
1490 bool isMpegTS(StringRef Code) {
1491   // MPEG transport streams use the ".ts" file extension. clang-format should
1492   // not attempt to format those. MPEG TS' frame format starts with 0x47 every
1493   // 189 bytes - detect that and return.
1494   return Code.size() > 188 && Code[0] == 0x47 && Code[188] == 0x47;
1495 }
1496 
1497 tooling::Replacements sortIncludes(const FormatStyle &Style, StringRef Code,
1498                                    ArrayRef<tooling::Range> Ranges,
1499                                    StringRef FileName, unsigned *Cursor) {
1500   tooling::Replacements Replaces;
1501   if (!Style.SortIncludes)
1502     return Replaces;
1503   if (Style.Language == FormatStyle::LanguageKind::LK_JavaScript &&
1504       isMpegTS(Code))
1505     return Replaces;
1506   if (Style.Language == FormatStyle::LanguageKind::LK_JavaScript)
1507     return sortJavaScriptImports(Style, Code, Ranges, FileName);
1508   sortCppIncludes(Style, Code, Ranges, FileName, Replaces, Cursor);
1509   return Replaces;
1510 }
1511 
1512 template <typename T>
1513 static llvm::Expected<tooling::Replacements>
1514 processReplacements(T ProcessFunc, StringRef Code,
1515                     const tooling::Replacements &Replaces,
1516                     const FormatStyle &Style) {
1517   if (Replaces.empty())
1518     return tooling::Replacements();
1519 
1520   auto NewCode = applyAllReplacements(Code, Replaces);
1521   if (!NewCode)
1522     return NewCode.takeError();
1523   std::vector<tooling::Range> ChangedRanges = Replaces.getAffectedRanges();
1524   StringRef FileName = Replaces.begin()->getFilePath();
1525 
1526   tooling::Replacements FormatReplaces =
1527       ProcessFunc(Style, *NewCode, ChangedRanges, FileName);
1528 
1529   return Replaces.merge(FormatReplaces);
1530 }
1531 
1532 llvm::Expected<tooling::Replacements>
1533 formatReplacements(StringRef Code, const tooling::Replacements &Replaces,
1534                    const FormatStyle &Style) {
1535   // We need to use lambda function here since there are two versions of
1536   // `sortIncludes`.
1537   auto SortIncludes = [](const FormatStyle &Style, StringRef Code,
1538                          std::vector<tooling::Range> Ranges,
1539                          StringRef FileName) -> tooling::Replacements {
1540     return sortIncludes(Style, Code, Ranges, FileName);
1541   };
1542   auto SortedReplaces =
1543       processReplacements(SortIncludes, Code, Replaces, Style);
1544   if (!SortedReplaces)
1545     return SortedReplaces.takeError();
1546 
1547   // We need to use lambda function here since there are two versions of
1548   // `reformat`.
1549   auto Reformat = [](const FormatStyle &Style, StringRef Code,
1550                      std::vector<tooling::Range> Ranges,
1551                      StringRef FileName) -> tooling::Replacements {
1552     return reformat(Style, Code, Ranges, FileName);
1553   };
1554   return processReplacements(Reformat, Code, *SortedReplaces, Style);
1555 }
1556 
1557 namespace {
1558 
1559 inline bool isHeaderInsertion(const tooling::Replacement &Replace) {
1560   return Replace.getOffset() == UINT_MAX && Replace.getLength() == 0 &&
1561          llvm::Regex(IncludeRegexPattern).match(Replace.getReplacementText());
1562 }
1563 
1564 inline bool isHeaderDeletion(const tooling::Replacement &Replace) {
1565   return Replace.getOffset() == UINT_MAX && Replace.getLength() == 1;
1566 }
1567 
1568 // Returns the offset after skipping a sequence of tokens, matched by \p
1569 // GetOffsetAfterSequence, from the start of the code.
1570 // \p GetOffsetAfterSequence should be a function that matches a sequence of
1571 // tokens and returns an offset after the sequence.
1572 unsigned getOffsetAfterTokenSequence(
1573     StringRef FileName, StringRef Code, const FormatStyle &Style,
1574     llvm::function_ref<unsigned(const SourceManager &, Lexer &, Token &)>
1575         GetOffsetAfterSequence) {
1576   std::unique_ptr<Environment> Env =
1577       Environment::CreateVirtualEnvironment(Code, FileName, /*Ranges=*/{});
1578   const SourceManager &SourceMgr = Env->getSourceManager();
1579   Lexer Lex(Env->getFileID(), SourceMgr.getBuffer(Env->getFileID()), SourceMgr,
1580             getFormattingLangOpts(Style));
1581   Token Tok;
1582   // Get the first token.
1583   Lex.LexFromRawLexer(Tok);
1584   return GetOffsetAfterSequence(SourceMgr, Lex, Tok);
1585 }
1586 
1587 // Check if a sequence of tokens is like "#<Name> <raw_identifier>". If it is,
1588 // \p Tok will be the token after this directive; otherwise, it can be any token
1589 // after the given \p Tok (including \p Tok).
1590 bool checkAndConsumeDirectiveWithName(Lexer &Lex, StringRef Name, Token &Tok) {
1591   bool Matched = Tok.is(tok::hash) && !Lex.LexFromRawLexer(Tok) &&
1592                  Tok.is(tok::raw_identifier) &&
1593                  Tok.getRawIdentifier() == Name && !Lex.LexFromRawLexer(Tok) &&
1594                  Tok.is(tok::raw_identifier);
1595   if (Matched)
1596     Lex.LexFromRawLexer(Tok);
1597   return Matched;
1598 }
1599 
1600 void skipComments(Lexer &Lex, Token &Tok) {
1601   while (Tok.is(tok::comment))
1602     if (Lex.LexFromRawLexer(Tok))
1603       return;
1604 }
1605 
1606 // Returns the offset after header guard directives and any comments
1607 // before/after header guards. If no header guard presents in the code, this
1608 // will returns the offset after skipping all comments from the start of the
1609 // code.
1610 unsigned getOffsetAfterHeaderGuardsAndComments(StringRef FileName,
1611                                                StringRef Code,
1612                                                const FormatStyle &Style) {
1613   return getOffsetAfterTokenSequence(
1614       FileName, Code, Style,
1615       [](const SourceManager &SM, Lexer &Lex, Token Tok) {
1616         skipComments(Lex, Tok);
1617         unsigned InitialOffset = SM.getFileOffset(Tok.getLocation());
1618         if (checkAndConsumeDirectiveWithName(Lex, "ifndef", Tok)) {
1619           skipComments(Lex, Tok);
1620           if (checkAndConsumeDirectiveWithName(Lex, "define", Tok))
1621             return SM.getFileOffset(Tok.getLocation());
1622         }
1623         return InitialOffset;
1624       });
1625 }
1626 
1627 // Check if a sequence of tokens is like
1628 //    "#include ("header.h" | <header.h>)".
1629 // If it is, \p Tok will be the token after this directive; otherwise, it can be
1630 // any token after the given \p Tok (including \p Tok).
1631 bool checkAndConsumeInclusiveDirective(Lexer &Lex, Token &Tok) {
1632   auto Matched = [&]() {
1633     Lex.LexFromRawLexer(Tok);
1634     return true;
1635   };
1636   if (Tok.is(tok::hash) && !Lex.LexFromRawLexer(Tok) &&
1637       Tok.is(tok::raw_identifier) && Tok.getRawIdentifier() == "include") {
1638     if (Lex.LexFromRawLexer(Tok))
1639       return false;
1640     if (Tok.is(tok::string_literal))
1641       return Matched();
1642     if (Tok.is(tok::less)) {
1643       while (!Lex.LexFromRawLexer(Tok) && Tok.isNot(tok::greater)) {
1644       }
1645       if (Tok.is(tok::greater))
1646         return Matched();
1647     }
1648   }
1649   return false;
1650 }
1651 
1652 // Returns the offset of the last #include directive after which a new
1653 // #include can be inserted. This ignores #include's after the #include block(s)
1654 // in the beginning of a file to avoid inserting headers into code sections
1655 // where new #include's should not be added by default.
1656 // These code sections include:
1657 //      - raw string literals (containing #include).
1658 //      - #if blocks.
1659 //      - Special #include's among declarations (e.g. functions).
1660 //
1661 // If no #include after which a new #include can be inserted, this returns the
1662 // offset after skipping all comments from the start of the code.
1663 // Inserting after an #include is not allowed if it comes after code that is not
1664 // #include (e.g. pre-processing directive that is not #include, declarations).
1665 unsigned getMaxHeaderInsertionOffset(StringRef FileName, StringRef Code,
1666                                      const FormatStyle &Style) {
1667   return getOffsetAfterTokenSequence(
1668       FileName, Code, Style,
1669       [](const SourceManager &SM, Lexer &Lex, Token Tok) {
1670         skipComments(Lex, Tok);
1671         unsigned MaxOffset = SM.getFileOffset(Tok.getLocation());
1672         while (checkAndConsumeInclusiveDirective(Lex, Tok))
1673           MaxOffset = SM.getFileOffset(Tok.getLocation());
1674         return MaxOffset;
1675       });
1676 }
1677 
1678 bool isDeletedHeader(llvm::StringRef HeaderName,
1679                      const std::set<llvm::StringRef> &HeadersToDelete) {
1680   return HeadersToDelete.count(HeaderName) ||
1681          HeadersToDelete.count(HeaderName.trim("\"<>"));
1682 }
1683 
1684 // FIXME: insert empty lines between newly created blocks.
1685 tooling::Replacements
1686 fixCppIncludeInsertions(StringRef Code, const tooling::Replacements &Replaces,
1687                         const FormatStyle &Style) {
1688   if (!Style.isCpp())
1689     return Replaces;
1690 
1691   tooling::Replacements HeaderInsertions;
1692   std::set<llvm::StringRef> HeadersToDelete;
1693   tooling::Replacements Result;
1694   for (const auto &R : Replaces) {
1695     if (isHeaderInsertion(R)) {
1696       // Replacements from \p Replaces must be conflict-free already, so we can
1697       // simply consume the error.
1698       llvm::consumeError(HeaderInsertions.add(R));
1699     } else if (isHeaderDeletion(R)) {
1700       HeadersToDelete.insert(R.getReplacementText());
1701     } else if (R.getOffset() == UINT_MAX) {
1702       llvm::errs() << "Insertions other than header #include insertion are "
1703                       "not supported! "
1704                    << R.getReplacementText() << "\n";
1705     } else {
1706       llvm::consumeError(Result.add(R));
1707     }
1708   }
1709   if (HeaderInsertions.empty() && HeadersToDelete.empty())
1710     return Replaces;
1711 
1712   llvm::Regex IncludeRegex(IncludeRegexPattern);
1713   llvm::Regex DefineRegex(R"(^[\t\ ]*#[\t\ ]*define[\t\ ]*[^\\]*$)");
1714   SmallVector<StringRef, 4> Matches;
1715 
1716   StringRef FileName = Replaces.begin()->getFilePath();
1717   IncludeCategoryManager Categories(Style, FileName);
1718 
1719   // Record the offset of the end of the last include in each category.
1720   std::map<int, int> CategoryEndOffsets;
1721   // All possible priorities.
1722   // Add 0 for main header and INT_MAX for headers that are not in any category.
1723   std::set<int> Priorities = {0, INT_MAX};
1724   for (const auto &Category : Style.IncludeCategories)
1725     Priorities.insert(Category.Priority);
1726   int FirstIncludeOffset = -1;
1727   // All new headers should be inserted after this offset.
1728   unsigned MinInsertOffset =
1729       getOffsetAfterHeaderGuardsAndComments(FileName, Code, Style);
1730   StringRef TrimmedCode = Code.drop_front(MinInsertOffset);
1731   // Max insertion offset in the original code.
1732   unsigned MaxInsertOffset =
1733       MinInsertOffset +
1734       getMaxHeaderInsertionOffset(FileName, TrimmedCode, Style);
1735   SmallVector<StringRef, 32> Lines;
1736   TrimmedCode.split(Lines, '\n');
1737   unsigned Offset = MinInsertOffset;
1738   unsigned NextLineOffset;
1739   std::set<StringRef> ExistingIncludes;
1740   for (auto Line : Lines) {
1741     NextLineOffset = std::min(Code.size(), Offset + Line.size() + 1);
1742     if (IncludeRegex.match(Line, &Matches)) {
1743       // The header name with quotes or angle brackets.
1744       StringRef IncludeName = Matches[2];
1745       ExistingIncludes.insert(IncludeName);
1746       // Only record the offset of current #include if we can insert after it.
1747       if (Offset <= MaxInsertOffset) {
1748         int Category = Categories.getIncludePriority(
1749             IncludeName, /*CheckMainHeader=*/FirstIncludeOffset < 0);
1750         CategoryEndOffsets[Category] = NextLineOffset;
1751         if (FirstIncludeOffset < 0)
1752           FirstIncludeOffset = Offset;
1753       }
1754       if (isDeletedHeader(IncludeName, HeadersToDelete)) {
1755         // If this is the last line without trailing newline, we need to make
1756         // sure we don't delete across the file boundary.
1757         unsigned Length = std::min(Line.size() + 1, Code.size() - Offset);
1758         llvm::Error Err =
1759             Result.add(tooling::Replacement(FileName, Offset, Length, ""));
1760         if (Err) {
1761           // Ignore the deletion on conflict.
1762           llvm::errs() << "Failed to add header deletion replacement for "
1763                        << IncludeName << ": " << llvm::toString(std::move(Err))
1764                        << "\n";
1765         }
1766       }
1767     }
1768     Offset = NextLineOffset;
1769   }
1770 
1771   // Populate CategoryEndOfssets:
1772   // - Ensure that CategoryEndOffset[Highest] is always populated.
1773   // - If CategoryEndOffset[Priority] isn't set, use the next higher value that
1774   //   is set, up to CategoryEndOffset[Highest].
1775   auto Highest = Priorities.begin();
1776   if (CategoryEndOffsets.find(*Highest) == CategoryEndOffsets.end()) {
1777     if (FirstIncludeOffset >= 0)
1778       CategoryEndOffsets[*Highest] = FirstIncludeOffset;
1779     else
1780       CategoryEndOffsets[*Highest] = MinInsertOffset;
1781   }
1782   // By this point, CategoryEndOffset[Highest] is always set appropriately:
1783   //  - to an appropriate location before/after existing #includes, or
1784   //  - to right after the header guard, or
1785   //  - to the beginning of the file.
1786   for (auto I = ++Priorities.begin(), E = Priorities.end(); I != E; ++I)
1787     if (CategoryEndOffsets.find(*I) == CategoryEndOffsets.end())
1788       CategoryEndOffsets[*I] = CategoryEndOffsets[*std::prev(I)];
1789 
1790   bool NeedNewLineAtEnd = !Code.empty() && Code.back() != '\n';
1791   for (const auto &R : HeaderInsertions) {
1792     auto IncludeDirective = R.getReplacementText();
1793     bool Matched = IncludeRegex.match(IncludeDirective, &Matches);
1794     assert(Matched && "Header insertion replacement must have replacement text "
1795                       "'#include ...'");
1796     (void)Matched;
1797     auto IncludeName = Matches[2];
1798     if (ExistingIncludes.find(IncludeName) != ExistingIncludes.end()) {
1799       DEBUG(llvm::dbgs() << "Skip adding existing include : " << IncludeName
1800                          << "\n");
1801       continue;
1802     }
1803     int Category =
1804         Categories.getIncludePriority(IncludeName, /*CheckMainHeader=*/true);
1805     Offset = CategoryEndOffsets[Category];
1806     std::string NewInclude = !IncludeDirective.endswith("\n")
1807                                  ? (IncludeDirective + "\n").str()
1808                                  : IncludeDirective.str();
1809     // When inserting headers at end of the code, also append '\n' to the code
1810     // if it does not end with '\n'.
1811     if (NeedNewLineAtEnd && Offset == Code.size()) {
1812       NewInclude = "\n" + NewInclude;
1813       NeedNewLineAtEnd = false;
1814     }
1815     auto NewReplace = tooling::Replacement(FileName, Offset, 0, NewInclude);
1816     auto Err = Result.add(NewReplace);
1817     if (Err) {
1818       llvm::consumeError(std::move(Err));
1819       unsigned NewOffset = Result.getShiftedCodePosition(Offset);
1820       NewReplace = tooling::Replacement(FileName, NewOffset, 0, NewInclude);
1821       Result = Result.merge(tooling::Replacements(NewReplace));
1822     }
1823   }
1824   return Result;
1825 }
1826 
1827 } // anonymous namespace
1828 
1829 llvm::Expected<tooling::Replacements>
1830 cleanupAroundReplacements(StringRef Code, const tooling::Replacements &Replaces,
1831                           const FormatStyle &Style) {
1832   // We need to use lambda function here since there are two versions of
1833   // `cleanup`.
1834   auto Cleanup = [](const FormatStyle &Style, StringRef Code,
1835                     std::vector<tooling::Range> Ranges,
1836                     StringRef FileName) -> tooling::Replacements {
1837     return cleanup(Style, Code, Ranges, FileName);
1838   };
1839   // Make header insertion replacements insert new headers into correct blocks.
1840   tooling::Replacements NewReplaces =
1841       fixCppIncludeInsertions(Code, Replaces, Style);
1842   return processReplacements(Cleanup, Code, NewReplaces, Style);
1843 }
1844 
1845 tooling::Replacements reformat(const FormatStyle &Style, StringRef Code,
1846                                ArrayRef<tooling::Range> Ranges,
1847                                StringRef FileName,
1848                                FormattingAttemptStatus *Status) {
1849   FormatStyle Expanded = expandPresets(Style);
1850   if (Expanded.DisableFormat)
1851     return tooling::Replacements();
1852   if (Expanded.Language == FormatStyle::LK_JavaScript && isMpegTS(Code))
1853     return tooling::Replacements();
1854   auto Env = Environment::CreateVirtualEnvironment(Code, FileName, Ranges);
1855 
1856   auto reformatAfterApplying = [&] (TokenAnalyzer& Fixer) {
1857     tooling::Replacements Fixes = Fixer.process();
1858     if (!Fixes.empty()) {
1859       auto NewCode = applyAllReplacements(Code, Fixes);
1860       if (NewCode) {
1861         auto NewEnv = Environment::CreateVirtualEnvironment(
1862             *NewCode, FileName,
1863             tooling::calculateRangesAfterReplacements(Fixes, Ranges));
1864         Formatter Format(*NewEnv, Expanded, Status);
1865         return Fixes.merge(Format.process());
1866       }
1867     }
1868     Formatter Format(*Env, Expanded, Status);
1869     return Format.process();
1870   };
1871 
1872   if (Style.Language == FormatStyle::LK_Cpp &&
1873       Style.FixNamespaceComments) {
1874     NamespaceEndCommentsFixer CommentsFixer(*Env, Expanded);
1875     return reformatAfterApplying(CommentsFixer);
1876   }
1877 
1878   if (Style.Language == FormatStyle::LK_JavaScript &&
1879       Style.JavaScriptQuotes != FormatStyle::JSQS_Leave) {
1880     JavaScriptRequoter Requoter(*Env, Expanded);
1881     return reformatAfterApplying(Requoter);
1882   }
1883 
1884   Formatter Format(*Env, Expanded, Status);
1885   return Format.process();
1886 }
1887 
1888 tooling::Replacements cleanup(const FormatStyle &Style, StringRef Code,
1889                               ArrayRef<tooling::Range> Ranges,
1890                               StringRef FileName) {
1891   std::unique_ptr<Environment> Env =
1892       Environment::CreateVirtualEnvironment(Code, FileName, Ranges);
1893   Cleaner Clean(*Env, Style);
1894   return Clean.process();
1895 }
1896 
1897 tooling::Replacements reformat(const FormatStyle &Style, StringRef Code,
1898                                ArrayRef<tooling::Range> Ranges,
1899                                StringRef FileName, bool *IncompleteFormat) {
1900   FormattingAttemptStatus Status;
1901   auto Result = reformat(Style, Code, Ranges, FileName, &Status);
1902   if (!Status.FormatComplete)
1903     *IncompleteFormat = true;
1904   return Result;
1905 }
1906 
1907 tooling::Replacements fixNamespaceEndComments(const FormatStyle &Style,
1908                                               StringRef Code,
1909                                               ArrayRef<tooling::Range> Ranges,
1910                                               StringRef FileName) {
1911   std::unique_ptr<Environment> Env =
1912       Environment::CreateVirtualEnvironment(Code, FileName, Ranges);
1913   NamespaceEndCommentsFixer Fix(*Env, Style);
1914   return Fix.process();
1915 }
1916 
1917 LangOptions getFormattingLangOpts(const FormatStyle &Style) {
1918   LangOptions LangOpts;
1919   LangOpts.CPlusPlus = 1;
1920   LangOpts.CPlusPlus11 = Style.Standard == FormatStyle::LS_Cpp03 ? 0 : 1;
1921   LangOpts.CPlusPlus14 = Style.Standard == FormatStyle::LS_Cpp03 ? 0 : 1;
1922   LangOpts.CPlusPlus1z = Style.Standard == FormatStyle::LS_Cpp03 ? 0 : 1;
1923   LangOpts.LineComment = 1;
1924   bool AlternativeOperators = Style.isCpp();
1925   LangOpts.CXXOperatorNames = AlternativeOperators ? 1 : 0;
1926   LangOpts.Bool = 1;
1927   LangOpts.ObjC1 = 1;
1928   LangOpts.ObjC2 = 1;
1929   LangOpts.MicrosoftExt = 1;    // To get kw___try, kw___finally.
1930   LangOpts.DeclSpecKeyword = 1; // To get __declspec.
1931   return LangOpts;
1932 }
1933 
// Help text describing the values accepted by the -style option: a predefined
// style name, "file" (look up a .clang-format file in the parent directories
// of the source file), or an inline "{key: value, ...}" configuration.
const char *StyleOptionHelpDescription =
    "Coding style, currently supports:\n"
    "  LLVM, Google, Chromium, Mozilla, WebKit.\n"
    "Use -style=file to load style configuration from\n"
    ".clang-format file located in one of the parent\n"
    "directories of the source file (or current\n"
    "directory for stdin).\n"
    "Use -style=\"{key: value, ...}\" to set specific\n"
    "parameters, e.g.:\n"
    "  -style=\"{BasedOnStyle: llvm, IndentWidth: 8}\"";
1944 
1945 static FormatStyle::LanguageKind getLanguageByFileName(StringRef FileName) {
1946   if (FileName.endswith(".java"))
1947     return FormatStyle::LK_Java;
1948   if (FileName.endswith_lower(".js") || FileName.endswith_lower(".ts"))
1949     return FormatStyle::LK_JavaScript; // JavaScript or TypeScript.
1950   if (FileName.endswith(".m") || FileName.endswith(".mm"))
1951     return FormatStyle::LK_ObjC;
1952   if (FileName.endswith_lower(".proto") ||
1953       FileName.endswith_lower(".protodevel"))
1954     return FormatStyle::LK_Proto;
1955   if (FileName.endswith_lower(".td"))
1956     return FormatStyle::LK_TableGen;
1957   return FormatStyle::LK_Cpp;
1958 }
1959 
1960 llvm::Expected<FormatStyle> getStyle(StringRef StyleName, StringRef FileName,
1961                                      StringRef FallbackStyleName,
1962                                      StringRef Code, vfs::FileSystem *FS) {
1963   if (!FS) {
1964     FS = vfs::getRealFileSystem().get();
1965   }
1966   FormatStyle Style = getLLVMStyle();
1967   Style.Language = getLanguageByFileName(FileName);
1968 
1969   // This is a very crude detection of whether a header contains ObjC code that
1970   // should be improved over time and probably be done on tokens, not one the
1971   // bare content of the file.
1972   if (Style.Language == FormatStyle::LK_Cpp && FileName.endswith(".h") &&
1973       (Code.contains("\n- (") || Code.contains("\n+ (")))
1974     Style.Language = FormatStyle::LK_ObjC;
1975 
1976   FormatStyle FallbackStyle = getNoStyle();
1977   if (!getPredefinedStyle(FallbackStyleName, Style.Language, &FallbackStyle))
1978     return make_string_error("Invalid fallback style \"" + FallbackStyleName);
1979 
1980   if (StyleName.startswith("{")) {
1981     // Parse YAML/JSON style from the command line.
1982     if (std::error_code ec = parseConfiguration(StyleName, &Style))
1983       return make_string_error("Error parsing -style: " + ec.message());
1984     return Style;
1985   }
1986 
1987   if (!StyleName.equals_lower("file")) {
1988     if (!getPredefinedStyle(StyleName, Style.Language, &Style))
1989       return make_string_error("Invalid value for -style");
1990     return Style;
1991   }
1992 
1993   // Look for .clang-format/_clang-format file in the file's parent directories.
1994   SmallString<128> UnsuitableConfigFiles;
1995   SmallString<128> Path(FileName);
1996   if (std::error_code EC = FS->makeAbsolute(Path))
1997     return make_string_error(EC.message());
1998 
1999   for (StringRef Directory = Path; !Directory.empty();
2000        Directory = llvm::sys::path::parent_path(Directory)) {
2001 
2002     auto Status = FS->status(Directory);
2003     if (!Status ||
2004         Status->getType() != llvm::sys::fs::file_type::directory_file) {
2005       continue;
2006     }
2007 
2008     SmallString<128> ConfigFile(Directory);
2009 
2010     llvm::sys::path::append(ConfigFile, ".clang-format");
2011     DEBUG(llvm::dbgs() << "Trying " << ConfigFile << "...\n");
2012 
2013     Status = FS->status(ConfigFile.str());
2014     bool FoundConfigFile =
2015         Status && (Status->getType() == llvm::sys::fs::file_type::regular_file);
2016     if (!FoundConfigFile) {
2017       // Try _clang-format too, since dotfiles are not commonly used on Windows.
2018       ConfigFile = Directory;
2019       llvm::sys::path::append(ConfigFile, "_clang-format");
2020       DEBUG(llvm::dbgs() << "Trying " << ConfigFile << "...\n");
2021       Status = FS->status(ConfigFile.str());
2022       FoundConfigFile = Status && (Status->getType() ==
2023                                    llvm::sys::fs::file_type::regular_file);
2024     }
2025 
2026     if (FoundConfigFile) {
2027       llvm::ErrorOr<std::unique_ptr<llvm::MemoryBuffer>> Text =
2028           FS->getBufferForFile(ConfigFile.str());
2029       if (std::error_code EC = Text.getError())
2030         return make_string_error(EC.message());
2031       if (std::error_code ec =
2032               parseConfiguration(Text.get()->getBuffer(), &Style)) {
2033         if (ec == ParseError::Unsuitable) {
2034           if (!UnsuitableConfigFiles.empty())
2035             UnsuitableConfigFiles.append(", ");
2036           UnsuitableConfigFiles.append(ConfigFile);
2037           continue;
2038         }
2039         return make_string_error("Error reading " + ConfigFile + ": " +
2040                                  ec.message());
2041       }
2042       DEBUG(llvm::dbgs() << "Using configuration file " << ConfigFile << "\n");
2043       return Style;
2044     }
2045   }
2046   if (!UnsuitableConfigFiles.empty())
2047     return make_string_error("Configuration file(s) do(es) not support " +
2048                              getLanguageName(Style.Language) + ": " +
2049                              UnsuitableConfigFiles);
2050   return FallbackStyle;
2051 }
2052 
2053 } // namespace format
2054 } // namespace clang
2055