1 //===--- CodeComplete.cpp ----------------------------------------*- C++-*-===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // Code completion has several moving parts:
10 //  - AST-based completions are provided using the completion hooks in Sema.
11 //  - external completions are retrieved from the index (using hints from Sema)
12 //  - the two sources overlap, and must be merged and overloads bundled
13 //  - results must be scored and ranked (see Quality.h) before rendering
14 //
15 // Signature help works in a similar way as code completion, but it is simpler:
16 // it's purely AST-based, and there are few candidates.
17 //
18 //===----------------------------------------------------------------------===//
19 
20 #include "CodeComplete.h"
21 #include "AST.h"
22 #include "ClangdUnit.h"
23 #include "CodeCompletionStrings.h"
24 #include "Compiler.h"
25 #include "Diagnostics.h"
26 #include "ExpectedTypes.h"
27 #include "FileDistance.h"
28 #include "FuzzyMatch.h"
29 #include "Headers.h"
30 #include "Logger.h"
31 #include "Protocol.h"
32 #include "Quality.h"
33 #include "SourceCode.h"
34 #include "TUScheduler.h"
35 #include "Trace.h"
36 #include "URI.h"
37 #include "index/Index.h"
38 #include "index/Symbol.h"
39 #include "index/SymbolOrigin.h"
40 #include "clang/AST/Decl.h"
41 #include "clang/AST/DeclBase.h"
42 #include "clang/Basic/CharInfo.h"
43 #include "clang/Basic/LangOptions.h"
44 #include "clang/Basic/SourceLocation.h"
45 #include "clang/Format/Format.h"
46 #include "clang/Frontend/CompilerInstance.h"
47 #include "clang/Frontend/FrontendActions.h"
48 #include "clang/Lex/ExternalPreprocessorSource.h"
49 #include "clang/Lex/Preprocessor.h"
50 #include "clang/Lex/PreprocessorOptions.h"
51 #include "clang/Sema/CodeCompleteConsumer.h"
52 #include "clang/Sema/DeclSpec.h"
53 #include "clang/Sema/Sema.h"
54 #include "llvm/ADT/ArrayRef.h"
55 #include "llvm/ADT/None.h"
56 #include "llvm/ADT/Optional.h"
57 #include "llvm/ADT/SmallVector.h"
58 #include "llvm/ADT/StringExtras.h"
59 #include "llvm/ADT/StringRef.h"
60 #include "llvm/Support/Compiler.h"
61 #include "llvm/Support/Debug.h"
62 #include "llvm/Support/Error.h"
63 #include "llvm/Support/Format.h"
64 #include "llvm/Support/FormatVariadic.h"
65 #include "llvm/Support/ScopedPrinter.h"
66 #include <algorithm>
67 #include <iterator>
68 
69 // We log detailed candidate here if you run with -debug-only=codecomplete.
70 #define DEBUG_TYPE "CodeComplete"
71 
72 namespace clang {
73 namespace clangd {
74 namespace {
75 
76 CompletionItemKind toCompletionItemKind(index::SymbolKind Kind) {
77   using SK = index::SymbolKind;
78   switch (Kind) {
79   case SK::Unknown:
80     return CompletionItemKind::Missing;
81   case SK::Module:
82   case SK::Namespace:
83   case SK::NamespaceAlias:
84     return CompletionItemKind::Module;
85   case SK::Macro:
86     return CompletionItemKind::Text;
87   case SK::Enum:
88     return CompletionItemKind::Enum;
89   // FIXME(ioeric): use LSP struct instead of class when it is suppoted in the
90   // protocol.
91   case SK::Struct:
92   case SK::Class:
93   case SK::Protocol:
94   case SK::Extension:
95   case SK::Union:
96     return CompletionItemKind::Class;
97   case SK::TypeAlias:
98     // We use the same kind as the VSCode C++ extension.
99     // FIXME: pick a better option when we have one.
100     return CompletionItemKind::Interface;
101   case SK::Using:
102     return CompletionItemKind::Reference;
103   case SK::Function:
104   // FIXME(ioeric): this should probably be an operator. This should be fixed
105   // when `Operator` is support type in the protocol.
106   case SK::ConversionFunction:
107     return CompletionItemKind::Function;
108   case SK::Variable:
109   case SK::Parameter:
110     return CompletionItemKind::Variable;
111   case SK::Field:
112     return CompletionItemKind::Field;
113   // FIXME(ioeric): use LSP enum constant when it is supported in the protocol.
114   case SK::EnumConstant:
115     return CompletionItemKind::Value;
116   case SK::InstanceMethod:
117   case SK::ClassMethod:
118   case SK::StaticMethod:
119   case SK::Destructor:
120     return CompletionItemKind::Method;
121   case SK::InstanceProperty:
122   case SK::ClassProperty:
123   case SK::StaticProperty:
124     return CompletionItemKind::Property;
125   case SK::Constructor:
126     return CompletionItemKind::Constructor;
127   }
128   llvm_unreachable("Unhandled clang::index::SymbolKind.");
129 }
130 
131 CompletionItemKind
132 toCompletionItemKind(CodeCompletionResult::ResultKind ResKind,
133                      const NamedDecl *Decl,
134                      CodeCompletionContext::Kind CtxKind) {
135   if (Decl)
136     return toCompletionItemKind(index::getSymbolInfo(Decl).Kind);
137   if (CtxKind == CodeCompletionContext::CCC_IncludedFile)
138     return CompletionItemKind::File;
139   switch (ResKind) {
140   case CodeCompletionResult::RK_Declaration:
141     llvm_unreachable("RK_Declaration without Decl");
142   case CodeCompletionResult::RK_Keyword:
143     return CompletionItemKind::Keyword;
144   case CodeCompletionResult::RK_Macro:
145     return CompletionItemKind::Text; // unfortunately, there's no 'Macro'
146                                      // completion items in LSP.
147   case CodeCompletionResult::RK_Pattern:
148     return CompletionItemKind::Snippet;
149   }
150   llvm_unreachable("Unhandled CodeCompletionResult::ResultKind.");
151 }
152 
153 // Identifier code completion result.
154 struct RawIdentifier {
155   llvm::StringRef Name;
156   unsigned References; // # of usages in file.
157 };
158 
159 /// A code completion result, in clang-native form.
160 /// It may be promoted to a CompletionItem if it's among the top-ranked results.
161 struct CompletionCandidate {
162   llvm::StringRef Name; // Used for filtering and sorting.
163   // We may have a result from Sema, from the index, or both.
164   const CodeCompletionResult *SemaResult = nullptr;
165   const Symbol *IndexResult = nullptr;
166   const RawIdentifier *IdentifierResult = nullptr;
167   llvm::SmallVector<llvm::StringRef, 1> RankedIncludeHeaders;
168 
169   // Returns a token identifying the overload set this is part of.
170   // 0 indicates it's not part of any overload set.
171   size_t overloadSet(const CodeCompleteOptions &Opts) const {
172     if (!Opts.BundleOverloads.getValueOr(false))
173       return 0;
174     llvm::SmallString<256> Scratch;
175     if (IndexResult) {
176       switch (IndexResult->SymInfo.Kind) {
177       case index::SymbolKind::ClassMethod:
178       case index::SymbolKind::InstanceMethod:
179       case index::SymbolKind::StaticMethod:
180 #ifndef NDEBUG
181         llvm_unreachable("Don't expect members from index in code completion");
182 #else
183         LLVM_FALLTHROUGH;
184 #endif
185       case index::SymbolKind::Function:
186         // We can't group overloads together that need different #includes.
187         // This could break #include insertion.
188         return llvm::hash_combine(
189             (IndexResult->Scope + IndexResult->Name).toStringRef(Scratch),
190             headerToInsertIfAllowed(Opts).getValueOr(""));
191       default:
192         return 0;
193       }
194     }
195     if (SemaResult) {
196       // We need to make sure we're consistent with the IndexResult case!
197       const NamedDecl *D = SemaResult->Declaration;
198       if (!D || !D->isFunctionOrFunctionTemplate())
199         return 0;
200       {
201         llvm::raw_svector_ostream OS(Scratch);
202         D->printQualifiedName(OS);
203       }
204       return llvm::hash_combine(Scratch,
205                                 headerToInsertIfAllowed(Opts).getValueOr(""));
206     }
207     assert(IdentifierResult);
208     return 0;
209   }
210 
211   // The best header to include if include insertion is allowed.
212   llvm::Optional<llvm::StringRef>
213   headerToInsertIfAllowed(const CodeCompleteOptions &Opts) const {
214     if (Opts.InsertIncludes == CodeCompleteOptions::NeverInsert ||
215         RankedIncludeHeaders.empty())
216       return None;
217     if (SemaResult && SemaResult->Declaration) {
218       // Avoid inserting new #include if the declaration is found in the current
219       // file e.g. the symbol is forward declared.
220       auto &SM = SemaResult->Declaration->getASTContext().getSourceManager();
221       for (const Decl *RD : SemaResult->Declaration->redecls())
222         if (SM.isInMainFile(SM.getExpansionLoc(RD->getBeginLoc())))
223           return None;
224     }
225     return RankedIncludeHeaders[0];
226   }
227 
228   using Bundle = llvm::SmallVector<CompletionCandidate, 4>;
229 };
230 using ScoredBundle =
231     std::pair<CompletionCandidate::Bundle, CodeCompletion::Scores>;
232 struct ScoredBundleGreater {
233   bool operator()(const ScoredBundle &L, const ScoredBundle &R) {
234     if (L.second.Total != R.second.Total)
235       return L.second.Total > R.second.Total;
236     return L.first.front().Name <
237            R.first.front().Name; // Earlier name is better.
238   }
239 };
240 
241 // Assembles a code completion out of a bundle of >=1 completion candidates.
242 // Many of the expensive strings are only computed at this point, once we know
243 // the candidate bundle is going to be returned.
244 //
245 // Many fields are the same for all candidates in a bundle (e.g. name), and are
246 // computed from the first candidate, in the constructor.
247 // Others vary per candidate, so add() must be called for remaining candidates.
248 struct CodeCompletionBuilder {
249   CodeCompletionBuilder(ASTContext *ASTCtx, const CompletionCandidate &C,
250                         CodeCompletionString *SemaCCS,
251                         llvm::ArrayRef<std::string> QueryScopes,
252                         const IncludeInserter &Includes,
253                         llvm::StringRef FileName,
254                         CodeCompletionContext::Kind ContextKind,
255                         const CodeCompleteOptions &Opts)
256       : ASTCtx(ASTCtx), ExtractDocumentation(Opts.IncludeComments),
257         EnableFunctionArgSnippets(Opts.EnableFunctionArgSnippets) {
258     add(C, SemaCCS);
259     if (C.SemaResult) {
260       assert(ASTCtx);
261       Completion.Origin |= SymbolOrigin::AST;
262       Completion.Name = llvm::StringRef(SemaCCS->getTypedText());
263       if (Completion.Scope.empty()) {
264         if ((C.SemaResult->Kind == CodeCompletionResult::RK_Declaration) ||
265             (C.SemaResult->Kind == CodeCompletionResult::RK_Pattern))
266           if (const auto *D = C.SemaResult->getDeclaration())
267             if (const auto *ND = dyn_cast<NamedDecl>(D))
268               Completion.Scope =
269                   splitQualifiedName(printQualifiedName(*ND)).first;
270       }
271       Completion.Kind = toCompletionItemKind(
272           C.SemaResult->Kind, C.SemaResult->Declaration, ContextKind);
273       // Sema could provide more info on whether the completion was a file or
274       // folder.
275       if (Completion.Kind == CompletionItemKind::File &&
276           Completion.Name.back() == '/')
277         Completion.Kind = CompletionItemKind::Folder;
278       for (const auto &FixIt : C.SemaResult->FixIts) {
279         Completion.FixIts.push_back(toTextEdit(
280             FixIt, ASTCtx->getSourceManager(), ASTCtx->getLangOpts()));
281       }
282       llvm::sort(Completion.FixIts, [](const TextEdit &X, const TextEdit &Y) {
283         return std::tie(X.range.start.line, X.range.start.character) <
284                std::tie(Y.range.start.line, Y.range.start.character);
285       });
286       Completion.Deprecated |=
287           (C.SemaResult->Availability == CXAvailability_Deprecated);
288     }
289     if (C.IndexResult) {
290       Completion.Origin |= C.IndexResult->Origin;
291       if (Completion.Scope.empty())
292         Completion.Scope = C.IndexResult->Scope;
293       if (Completion.Kind == CompletionItemKind::Missing)
294         Completion.Kind = toCompletionItemKind(C.IndexResult->SymInfo.Kind);
295       if (Completion.Name.empty())
296         Completion.Name = C.IndexResult->Name;
297       // If the completion was visible to Sema, no qualifier is needed. This
298       // avoids unneeded qualifiers in cases like with `using ns::X`.
299       if (Completion.RequiredQualifier.empty() && !C.SemaResult) {
300         llvm::StringRef ShortestQualifier = C.IndexResult->Scope;
301         for (llvm::StringRef Scope : QueryScopes) {
302           llvm::StringRef Qualifier = C.IndexResult->Scope;
303           if (Qualifier.consume_front(Scope) &&
304               Qualifier.size() < ShortestQualifier.size())
305             ShortestQualifier = Qualifier;
306         }
307         Completion.RequiredQualifier = ShortestQualifier;
308       }
309       Completion.Deprecated |= (C.IndexResult->Flags & Symbol::Deprecated);
310     }
311     if (C.IdentifierResult) {
312       Completion.Origin |= SymbolOrigin::Identifier;
313       Completion.Kind = CompletionItemKind::Text;
314       Completion.Name = C.IdentifierResult->Name;
315     }
316 
317     // Turn absolute path into a literal string that can be #included.
318     auto Inserted = [&](llvm::StringRef Header)
319         -> llvm::Expected<std::pair<std::string, bool>> {
320       auto DeclaringURI =
321           URI::parse(C.IndexResult->CanonicalDeclaration.FileURI);
322       if (!DeclaringURI)
323         return DeclaringURI.takeError();
324       auto ResolvedDeclaring = URI::resolve(*DeclaringURI, FileName);
325       if (!ResolvedDeclaring)
326         return ResolvedDeclaring.takeError();
327       auto ResolvedInserted = toHeaderFile(Header, FileName);
328       if (!ResolvedInserted)
329         return ResolvedInserted.takeError();
330       auto Spelled = Includes.calculateIncludePath(*ResolvedInserted, FileName);
331       if (!Spelled)
332         return llvm::createStringError(llvm::inconvertibleErrorCode(),
333                                        "Header not on include path");
334       return std::make_pair(
335           std::move(*Spelled),
336           Includes.shouldInsertInclude(*ResolvedDeclaring, *ResolvedInserted));
337     };
338     bool ShouldInsert = C.headerToInsertIfAllowed(Opts).hasValue();
339     // Calculate include paths and edits for all possible headers.
340     for (const auto &Inc : C.RankedIncludeHeaders) {
341       if (auto ToInclude = Inserted(Inc)) {
342         CodeCompletion::IncludeCandidate Include;
343         Include.Header = ToInclude->first;
344         if (ToInclude->second && ShouldInsert)
345           Include.Insertion = Includes.insert(ToInclude->first);
346         Completion.Includes.push_back(std::move(Include));
347       } else
348         log("Failed to generate include insertion edits for adding header "
349             "(FileURI='{0}', IncludeHeader='{1}') into {2}: {3}",
350             C.IndexResult->CanonicalDeclaration.FileURI, Inc, FileName,
351             ToInclude.takeError());
352     }
353     // Prefer includes that do not need edits (i.e. already exist).
354     std::stable_partition(Completion.Includes.begin(),
355                           Completion.Includes.end(),
356                           [](const CodeCompletion::IncludeCandidate &I) {
357                             return !I.Insertion.hasValue();
358                           });
359   }
360 
361   void add(const CompletionCandidate &C, CodeCompletionString *SemaCCS) {
362     assert(bool(C.SemaResult) == bool(SemaCCS));
363     Bundled.emplace_back();
364     BundledEntry &S = Bundled.back();
365     if (C.SemaResult) {
366       bool IsPattern = C.SemaResult->Kind == CodeCompletionResult::RK_Pattern;
367       getSignature(*SemaCCS, &S.Signature, &S.SnippetSuffix,
368                    &Completion.RequiredQualifier, IsPattern);
369       S.ReturnType = getReturnType(*SemaCCS);
370     } else if (C.IndexResult) {
371       S.Signature = C.IndexResult->Signature;
372       S.SnippetSuffix = C.IndexResult->CompletionSnippetSuffix;
373       S.ReturnType = C.IndexResult->ReturnType;
374     }
375     if (ExtractDocumentation && Completion.Documentation.empty()) {
376       if (C.IndexResult)
377         Completion.Documentation = C.IndexResult->Documentation;
378       else if (C.SemaResult)
379         Completion.Documentation = getDocComment(*ASTCtx, *C.SemaResult,
380                                                  /*CommentsFromHeader=*/false);
381     }
382   }
383 
384   CodeCompletion build() {
385     Completion.ReturnType = summarizeReturnType();
386     Completion.Signature = summarizeSignature();
387     Completion.SnippetSuffix = summarizeSnippet();
388     Completion.BundleSize = Bundled.size();
389     return std::move(Completion);
390   }
391 
392 private:
393   struct BundledEntry {
394     std::string SnippetSuffix;
395     std::string Signature;
396     std::string ReturnType;
397   };
398 
399   // If all BundledEntrys have the same value for a property, return it.
400   template <std::string BundledEntry::*Member>
401   const std::string *onlyValue() const {
402     auto B = Bundled.begin(), E = Bundled.end();
403     for (auto I = B + 1; I != E; ++I)
404       if (I->*Member != B->*Member)
405         return nullptr;
406     return &(B->*Member);
407   }
408 
409   template <bool BundledEntry::*Member> const bool *onlyValue() const {
410     auto B = Bundled.begin(), E = Bundled.end();
411     for (auto I = B + 1; I != E; ++I)
412       if (I->*Member != B->*Member)
413         return nullptr;
414     return &(B->*Member);
415   }
416 
417   std::string summarizeReturnType() const {
418     if (auto *RT = onlyValue<&BundledEntry::ReturnType>())
419       return *RT;
420     return "";
421   }
422 
423   std::string summarizeSnippet() const {
424     auto *Snippet = onlyValue<&BundledEntry::SnippetSuffix>();
425     if (!Snippet)
426       // All bundles are function calls.
427       // FIXME(ibiryukov): sometimes add template arguments to a snippet, e.g.
428       // we need to complete 'forward<$1>($0)'.
429       return "($0)";
430     if (EnableFunctionArgSnippets)
431       return *Snippet;
432 
433     // Replace argument snippets with a simplified pattern.
434     if (Snippet->empty())
435       return "";
436     if (Completion.Kind == CompletionItemKind::Function ||
437         Completion.Kind == CompletionItemKind::Method) {
438       // Functions snippets can be of 2 types:
439       // - containing only function arguments, e.g.
440       //   foo(${1:int p1}, ${2:int p2});
441       //   We transform this pattern to '($0)' or '()'.
442       // - template arguments and function arguments, e.g.
443       //   foo<${1:class}>(${2:int p1}).
444       //   We transform this pattern to '<$1>()$0' or '<$0>()'.
445 
446       bool EmptyArgs = llvm::StringRef(*Snippet).endswith("()");
447       if (Snippet->front() == '<')
448         return EmptyArgs ? "<$1>()$0" : "<$1>($0)";
449       if (Snippet->front() == '(')
450         return EmptyArgs ? "()" : "($0)";
451       return *Snippet; // Not an arg snippet?
452     }
453     // 'CompletionItemKind::Interface' matches template type aliases.
454     if (Completion.Kind == CompletionItemKind::Interface ||
455         Completion.Kind == CompletionItemKind::Class) {
456       if (Snippet->front() != '<')
457         return *Snippet; // Not an arg snippet?
458 
459       // Classes and template using aliases can only have template arguments,
460       // e.g. Foo<${1:class}>.
461       if (llvm::StringRef(*Snippet).endswith("<>"))
462         return "<>"; // can happen with defaulted template arguments.
463       return "<$0>";
464     }
465     return *Snippet;
466   }
467 
468   std::string summarizeSignature() const {
469     if (auto *Signature = onlyValue<&BundledEntry::Signature>())
470       return *Signature;
471     // All bundles are function calls.
472     return "(…)";
473   }
474 
475   // ASTCtx can be nullptr if not run with sema.
476   ASTContext *ASTCtx;
477   CodeCompletion Completion;
478   llvm::SmallVector<BundledEntry, 1> Bundled;
479   bool ExtractDocumentation;
480   bool EnableFunctionArgSnippets;
481 };
482 
483 // Determine the symbol ID for a Sema code completion result, if possible.
484 llvm::Optional<SymbolID> getSymbolID(const CodeCompletionResult &R,
485                                      const SourceManager &SM) {
486   switch (R.Kind) {
487   case CodeCompletionResult::RK_Declaration:
488   case CodeCompletionResult::RK_Pattern: {
489     return clang::clangd::getSymbolID(R.Declaration);
490   }
491   case CodeCompletionResult::RK_Macro:
492     return clang::clangd::getSymbolID(*R.Macro, R.MacroDefInfo, SM);
493   case CodeCompletionResult::RK_Keyword:
494     return None;
495   }
496   llvm_unreachable("unknown CodeCompletionResult kind");
497 }
498 
499 // Scopes of the paritial identifier we're trying to complete.
500 // It is used when we query the index for more completion results.
501 struct SpecifiedScope {
502   // The scopes we should look in, determined by Sema.
503   //
504   // If the qualifier was fully resolved, we look for completions in these
505   // scopes; if there is an unresolved part of the qualifier, it should be
506   // resolved within these scopes.
507   //
508   // Examples of qualified completion:
509   //
510   //   "::vec"                                      => {""}
511   //   "using namespace std; ::vec^"                => {"", "std::"}
512   //   "namespace ns {using namespace std;} ns::^"  => {"ns::", "std::"}
513   //   "std::vec^"                                  => {""}  // "std" unresolved
514   //
515   // Examples of unqualified completion:
516   //
517   //   "vec^"                                       => {""}
518   //   "using namespace std; vec^"                  => {"", "std::"}
519   //   "using namespace std; namespace ns { vec^ }" => {"ns::", "std::", ""}
520   //
521   // "" for global namespace, "ns::" for normal namespace.
522   std::vector<std::string> AccessibleScopes;
523   // The full scope qualifier as typed by the user (without the leading "::").
524   // Set if the qualifier is not fully resolved by Sema.
525   llvm::Optional<std::string> UnresolvedQualifier;
526 
527   // Construct scopes being queried in indexes. The results are deduplicated.
528   // This method format the scopes to match the index request representation.
529   std::vector<std::string> scopesForIndexQuery() {
530     std::set<std::string> Results;
531     for (llvm::StringRef AS : AccessibleScopes)
532       Results.insert(
533           (AS + (UnresolvedQualifier ? *UnresolvedQualifier : "")).str());
534     return {Results.begin(), Results.end()};
535   }
536 };
537 
538 // Get all scopes that will be queried in indexes and whether symbols from
539 // any scope is allowed. The first scope in the list is the preferred scope
540 // (e.g. enclosing namespace).
541 std::pair<std::vector<std::string>, bool>
542 getQueryScopes(CodeCompletionContext &CCContext, const Sema &CCSema,
543                const CompletionPrefix &HeuristicPrefix,
544                const CodeCompleteOptions &Opts) {
545   SpecifiedScope Scopes;
546   for (auto *Context : CCContext.getVisitedContexts()) {
547     if (isa<TranslationUnitDecl>(Context))
548       Scopes.AccessibleScopes.push_back(""); // global namespace
549     else if (isa<NamespaceDecl>(Context))
550       Scopes.AccessibleScopes.push_back(printNamespaceScope(*Context));
551   }
552 
553   const CXXScopeSpec *SemaSpecifier =
554       CCContext.getCXXScopeSpecifier().getValueOr(nullptr);
555   // Case 1: unqualified completion.
556   if (!SemaSpecifier) {
557     // Case 2 (exception): sema saw no qualifier, but there appears to be one!
558     // This can happen e.g. in incomplete macro expansions. Use heuristics.
559     if (!HeuristicPrefix.Qualifier.empty()) {
560       vlog("Sema said no scope specifier, but we saw {0} in the source code",
561            HeuristicPrefix.Qualifier);
562       StringRef SpelledSpecifier = HeuristicPrefix.Qualifier;
563       if (SpelledSpecifier.consume_front("::"))
564         Scopes.AccessibleScopes = {""};
565       Scopes.UnresolvedQualifier = SpelledSpecifier;
566       return {Scopes.scopesForIndexQuery(), false};
567     }
568     // The enclosing namespace must be first, it gets a quality boost.
569     std::vector<std::string> EnclosingAtFront;
570     std::string EnclosingScope = printNamespaceScope(*CCSema.CurContext);
571     EnclosingAtFront.push_back(EnclosingScope);
572     for (auto &S : Scopes.scopesForIndexQuery()) {
573       if (EnclosingScope != S)
574         EnclosingAtFront.push_back(std::move(S));
575     }
576     // Allow AllScopes completion as there is no explicit scope qualifier.
577     return {EnclosingAtFront, Opts.AllScopes};
578   }
579   // Case 3: sema saw and resolved a scope qualifier.
580   if (SemaSpecifier && SemaSpecifier->isValid())
581     return {Scopes.scopesForIndexQuery(), false};
582 
583   // Case 4: There was a qualifier, and Sema didn't resolve it.
584   Scopes.AccessibleScopes.push_back(""); // Make sure global scope is included.
585   llvm::StringRef SpelledSpecifier = Lexer::getSourceText(
586       CharSourceRange::getCharRange(SemaSpecifier->getRange()),
587       CCSema.SourceMgr, clang::LangOptions());
588   if (SpelledSpecifier.consume_front("::"))
589     Scopes.AccessibleScopes = {""};
590   Scopes.UnresolvedQualifier = SpelledSpecifier;
591   // Sema excludes the trailing "::".
592   if (!Scopes.UnresolvedQualifier->empty())
593     *Scopes.UnresolvedQualifier += "::";
594 
595   return {Scopes.scopesForIndexQuery(), false};
596 }
597 
598 // Should we perform index-based completion in a context of the specified kind?
599 // FIXME: consider allowing completion, but restricting the result types.
600 bool contextAllowsIndex(enum CodeCompletionContext::Kind K) {
601   switch (K) {
602   case CodeCompletionContext::CCC_TopLevel:
603   case CodeCompletionContext::CCC_ObjCInterface:
604   case CodeCompletionContext::CCC_ObjCImplementation:
605   case CodeCompletionContext::CCC_ObjCIvarList:
606   case CodeCompletionContext::CCC_ClassStructUnion:
607   case CodeCompletionContext::CCC_Statement:
608   case CodeCompletionContext::CCC_Expression:
609   case CodeCompletionContext::CCC_ObjCMessageReceiver:
610   case CodeCompletionContext::CCC_EnumTag:
611   case CodeCompletionContext::CCC_UnionTag:
612   case CodeCompletionContext::CCC_ClassOrStructTag:
613   case CodeCompletionContext::CCC_ObjCProtocolName:
614   case CodeCompletionContext::CCC_Namespace:
615   case CodeCompletionContext::CCC_Type:
616   case CodeCompletionContext::CCC_ParenthesizedExpression:
617   case CodeCompletionContext::CCC_ObjCInterfaceName:
618   case CodeCompletionContext::CCC_ObjCCategoryName:
619   case CodeCompletionContext::CCC_Symbol:
620   case CodeCompletionContext::CCC_SymbolOrNewName:
621     return true;
622   case CodeCompletionContext::CCC_OtherWithMacros:
623   case CodeCompletionContext::CCC_DotMemberAccess:
624   case CodeCompletionContext::CCC_ArrowMemberAccess:
625   case CodeCompletionContext::CCC_ObjCPropertyAccess:
626   case CodeCompletionContext::CCC_MacroName:
627   case CodeCompletionContext::CCC_MacroNameUse:
628   case CodeCompletionContext::CCC_PreprocessorExpression:
629   case CodeCompletionContext::CCC_PreprocessorDirective:
630   case CodeCompletionContext::CCC_SelectorName:
631   case CodeCompletionContext::CCC_TypeQualifiers:
632   case CodeCompletionContext::CCC_ObjCInstanceMessage:
633   case CodeCompletionContext::CCC_ObjCClassMessage:
634   case CodeCompletionContext::CCC_IncludedFile:
635   // FIXME: Provide identifier based completions for the following contexts:
636   case CodeCompletionContext::CCC_Other: // Be conservative.
637   case CodeCompletionContext::CCC_NaturalLanguage:
638   case CodeCompletionContext::CCC_Recovery:
639   case CodeCompletionContext::CCC_NewName:
640     return false;
641   }
642   llvm_unreachable("unknown code completion context");
643 }
644 
645 static bool isInjectedClass(const NamedDecl &D) {
646   if (auto *R = dyn_cast_or_null<RecordDecl>(&D))
647     if (R->isInjectedClassName())
648       return true;
649   return false;
650 }
651 
652 // Some member calls are blacklisted because they're so rarely useful.
653 static bool isBlacklistedMember(const NamedDecl &D) {
654   // Destructor completion is rarely useful, and works inconsistently.
655   // (s.^ completes ~string, but s.~st^ is an error).
656   if (D.getKind() == Decl::CXXDestructor)
657     return true;
658   // Injected name may be useful for A::foo(), but who writes A::A::foo()?
659   if (isInjectedClass(D))
660     return true;
661   // Explicit calls to operators are also rare.
662   auto NameKind = D.getDeclName().getNameKind();
663   if (NameKind == DeclarationName::CXXOperatorName ||
664       NameKind == DeclarationName::CXXLiteralOperatorName ||
665       NameKind == DeclarationName::CXXConversionFunctionName)
666     return true;
667   return false;
668 }
669 
670 // The CompletionRecorder captures Sema code-complete output, including context.
671 // It filters out ignored results (but doesn't apply fuzzy-filtering yet).
672 // It doesn't do scoring or conversion to CompletionItem yet, as we want to
673 // merge with index results first.
674 // Generally the fields and methods of this object should only be used from
675 // within the callback.
676 struct CompletionRecorder : public CodeCompleteConsumer {
677   CompletionRecorder(const CodeCompleteOptions &Opts,
678                      llvm::unique_function<void()> ResultsCallback)
679       : CodeCompleteConsumer(Opts.getClangCompleteOpts()),
680         CCContext(CodeCompletionContext::CCC_Other), Opts(Opts),
681         CCAllocator(std::make_shared<GlobalCodeCompletionAllocator>()),
682         CCTUInfo(CCAllocator), ResultsCallback(std::move(ResultsCallback)) {
683     assert(this->ResultsCallback);
684   }
685 
686   std::vector<CodeCompletionResult> Results;
687   CodeCompletionContext CCContext;
688   Sema *CCSema = nullptr; // Sema that created the results.
689   // FIXME: Sema is scary. Can we store ASTContext and Preprocessor, instead?
690 
691   void ProcessCodeCompleteResults(class Sema &S, CodeCompletionContext Context,
692                                   CodeCompletionResult *InResults,
693                                   unsigned NumResults) override final {
694     // Results from recovery mode are generally useless, and the callback after
695     // recovery (if any) is usually more interesting. To make sure we handle the
696     // future callback from sema, we just ignore all callbacks in recovery mode,
697     // as taking only results from recovery mode results in poor completion
698     // results.
699     // FIXME: in case there is no future sema completion callback after the
700     // recovery mode, we might still want to provide some results (e.g. trivial
701     // identifier-based completion).
702     if (Context.getKind() == CodeCompletionContext::CCC_Recovery) {
703       log("Code complete: Ignoring sema code complete callback with Recovery "
704           "context.");
705       return;
706     }
707     // If a callback is called without any sema result and the context does not
708     // support index-based completion, we simply skip it to give way to
709     // potential future callbacks with results.
710     if (NumResults == 0 && !contextAllowsIndex(Context.getKind()))
711       return;
712     if (CCSema) {
713       log("Multiple code complete callbacks (parser backtracked?). "
714           "Dropping results from context {0}, keeping results from {1}.",
715           getCompletionKindString(Context.getKind()),
716           getCompletionKindString(this->CCContext.getKind()));
717       return;
718     }
719     // Record the completion context.
720     CCSema = &S;
721     CCContext = Context;
722 
723     // Retain the results we might want.
724     for (unsigned I = 0; I < NumResults; ++I) {
725       auto &Result = InResults[I];
726       // Class members that are shadowed by subclasses are usually noise.
727       if (Result.Hidden && Result.Declaration &&
728           Result.Declaration->isCXXClassMember())
729         continue;
730       if (!Opts.IncludeIneligibleResults &&
731           (Result.Availability == CXAvailability_NotAvailable ||
732            Result.Availability == CXAvailability_NotAccessible))
733         continue;
734       if (Result.Declaration &&
735           !Context.getBaseType().isNull() // is this a member-access context?
736           && isBlacklistedMember(*Result.Declaration))
737         continue;
738       // Skip injected class name when no class scope is not explicitly set.
739       // E.g. show injected A::A in `using A::A^` but not in "A^".
740       if (Result.Declaration && !Context.getCXXScopeSpecifier().hasValue() &&
741           isInjectedClass(*Result.Declaration))
742         continue;
743       // We choose to never append '::' to completion results in clangd.
744       Result.StartsNestedNameSpecifier = false;
745       Results.push_back(Result);
746     }
747     ResultsCallback();
748   }
749 
750   CodeCompletionAllocator &getAllocator() override { return *CCAllocator; }
751   CodeCompletionTUInfo &getCodeCompletionTUInfo() override { return CCTUInfo; }
752 
753   // Returns the filtering/sorting name for Result, which must be from Results.
754   // Returned string is owned by this recorder (or the AST).
755   llvm::StringRef getName(const CodeCompletionResult &Result) {
756     switch (Result.Kind) {
757     case CodeCompletionResult::RK_Declaration:
758       if (auto *ID = Result.Declaration->getIdentifier())
759         return ID->getName();
760       break;
761     case CodeCompletionResult::RK_Keyword:
762       return Result.Keyword;
763     case CodeCompletionResult::RK_Macro:
764       return Result.Macro->getName();
765     case CodeCompletionResult::RK_Pattern:
766       return Result.Pattern->getTypedText();
767     }
768     auto *CCS = codeCompletionString(Result);
769     return CCS->getTypedText();
770   }
771 
772   // Build a CodeCompletion string for R, which must be from Results.
773   // The CCS will be owned by this recorder.
774   CodeCompletionString *codeCompletionString(const CodeCompletionResult &R) {
775     // CodeCompletionResult doesn't seem to be const-correct. We own it, anyway.
776     return const_cast<CodeCompletionResult &>(R).CreateCodeCompletionString(
777         *CCSema, CCContext, *CCAllocator, CCTUInfo,
778         /*IncludeBriefComments=*/false);
779   }
780 
781 private:
782   CodeCompleteOptions Opts;
783   std::shared_ptr<GlobalCodeCompletionAllocator> CCAllocator;
784   CodeCompletionTUInfo CCTUInfo;
785   llvm::unique_function<void()> ResultsCallback;
786 };
787 
788 struct ScoredSignature {
789   // When set, requires documentation to be requested from the index with this
790   // ID.
791   llvm::Optional<SymbolID> IDForDoc;
792   SignatureInformation Signature;
793   SignatureQualitySignals Quality;
794 };
795 
796 class SignatureHelpCollector final : public CodeCompleteConsumer {
797 public:
798   SignatureHelpCollector(const clang::CodeCompleteOptions &CodeCompleteOpts,
799                          const SymbolIndex *Index, SignatureHelp &SigHelp)
800       : CodeCompleteConsumer(CodeCompleteOpts), SigHelp(SigHelp),
801         Allocator(std::make_shared<clang::GlobalCodeCompletionAllocator>()),
802         CCTUInfo(Allocator), Index(Index) {}
803 
804   void ProcessOverloadCandidates(Sema &S, unsigned CurrentArg,
805                                  OverloadCandidate *Candidates,
806                                  unsigned NumCandidates,
807                                  SourceLocation OpenParLoc) override {
808     assert(!OpenParLoc.isInvalid());
809     SourceManager &SrcMgr = S.getSourceManager();
810     OpenParLoc = SrcMgr.getFileLoc(OpenParLoc);
811     if (SrcMgr.isInMainFile(OpenParLoc))
812       SigHelp.argListStart = sourceLocToPosition(SrcMgr, OpenParLoc);
813     else
814       elog("Location oustide main file in signature help: {0}",
815            OpenParLoc.printToString(SrcMgr));
816 
817     std::vector<ScoredSignature> ScoredSignatures;
818     SigHelp.signatures.reserve(NumCandidates);
819     ScoredSignatures.reserve(NumCandidates);
820     // FIXME(rwols): How can we determine the "active overload candidate"?
821     // Right now the overloaded candidates seem to be provided in a "best fit"
822     // order, so I'm not too worried about this.
823     SigHelp.activeSignature = 0;
824     assert(CurrentArg <= (unsigned)std::numeric_limits<int>::max() &&
825            "too many arguments");
826     SigHelp.activeParameter = static_cast<int>(CurrentArg);
827     for (unsigned I = 0; I < NumCandidates; ++I) {
828       OverloadCandidate Candidate = Candidates[I];
829       // We want to avoid showing instantiated signatures, because they may be
830       // long in some cases (e.g. when 'T' is substituted with 'std::string', we
831       // would get 'std::basic_string<char>').
832       if (auto *Func = Candidate.getFunction()) {
833         if (auto *Pattern = Func->getTemplateInstantiationPattern())
834           Candidate = OverloadCandidate(Pattern);
835       }
836 
837       const auto *CCS = Candidate.CreateSignatureString(
838           CurrentArg, S, *Allocator, CCTUInfo, true);
839       assert(CCS && "Expected the CodeCompletionString to be non-null");
840       ScoredSignatures.push_back(processOverloadCandidate(
841           Candidate, *CCS,
842           Candidate.getFunction()
843               ? getDeclComment(S.getASTContext(), *Candidate.getFunction())
844               : ""));
845     }
846 
847     // Sema does not load the docs from the preamble, so we need to fetch extra
848     // docs from the index instead.
849     llvm::DenseMap<SymbolID, std::string> FetchedDocs;
850     if (Index) {
851       LookupRequest IndexRequest;
852       for (const auto &S : ScoredSignatures) {
853         if (!S.IDForDoc)
854           continue;
855         IndexRequest.IDs.insert(*S.IDForDoc);
856       }
857       Index->lookup(IndexRequest, [&](const Symbol &S) {
858         if (!S.Documentation.empty())
859           FetchedDocs[S.ID] = S.Documentation;
860       });
861       log("SigHelp: requested docs for {0} symbols from the index, got {1} "
862           "symbols with non-empty docs in the response",
863           IndexRequest.IDs.size(), FetchedDocs.size());
864     }
865 
866     llvm::sort(ScoredSignatures, [](const ScoredSignature &L,
867                                     const ScoredSignature &R) {
868       // Ordering follows:
869       // - Less number of parameters is better.
870       // - Function is better than FunctionType which is better than
871       // Function Template.
872       // - High score is better.
873       // - Shorter signature is better.
874       // - Alphebatically smaller is better.
875       if (L.Quality.NumberOfParameters != R.Quality.NumberOfParameters)
876         return L.Quality.NumberOfParameters < R.Quality.NumberOfParameters;
877       if (L.Quality.NumberOfOptionalParameters !=
878           R.Quality.NumberOfOptionalParameters)
879         return L.Quality.NumberOfOptionalParameters <
880                R.Quality.NumberOfOptionalParameters;
881       if (L.Quality.Kind != R.Quality.Kind) {
882         using OC = CodeCompleteConsumer::OverloadCandidate;
883         switch (L.Quality.Kind) {
884         case OC::CK_Function:
885           return true;
886         case OC::CK_FunctionType:
887           return R.Quality.Kind != OC::CK_Function;
888         case OC::CK_FunctionTemplate:
889           return false;
890         }
891         llvm_unreachable("Unknown overload candidate type.");
892       }
893       if (L.Signature.label.size() != R.Signature.label.size())
894         return L.Signature.label.size() < R.Signature.label.size();
895       return L.Signature.label < R.Signature.label;
896     });
897 
898     for (auto &SS : ScoredSignatures) {
899       auto IndexDocIt =
900           SS.IDForDoc ? FetchedDocs.find(*SS.IDForDoc) : FetchedDocs.end();
901       if (IndexDocIt != FetchedDocs.end())
902         SS.Signature.documentation = IndexDocIt->second;
903 
904       SigHelp.signatures.push_back(std::move(SS.Signature));
905     }
906   }
907 
908   GlobalCodeCompletionAllocator &getAllocator() override { return *Allocator; }
909 
910   CodeCompletionTUInfo &getCodeCompletionTUInfo() override { return CCTUInfo; }
911 
912 private:
913   void processParameterChunk(llvm::StringRef ChunkText,
914                              SignatureInformation &Signature) const {
915     // (!) this is O(n), should still be fast compared to building ASTs.
916     unsigned ParamStartOffset = lspLength(Signature.label);
917     unsigned ParamEndOffset = ParamStartOffset + lspLength(ChunkText);
918     // A piece of text that describes the parameter that corresponds to
919     // the code-completion location within a function call, message send,
920     // macro invocation, etc.
921     Signature.label += ChunkText;
922     ParameterInformation Info;
923     Info.labelOffsets.emplace(ParamStartOffset, ParamEndOffset);
924     // FIXME: only set 'labelOffsets' when all clients migrate out of it.
925     Info.labelString = ChunkText;
926 
927     Signature.parameters.push_back(std::move(Info));
928   }
929 
930   void processOptionalChunk(const CodeCompletionString &CCS,
931                             SignatureInformation &Signature,
932                             SignatureQualitySignals &Signal) const {
933     for (const auto &Chunk : CCS) {
934       switch (Chunk.Kind) {
935       case CodeCompletionString::CK_Optional:
936         assert(Chunk.Optional &&
937                "Expected the optional code completion string to be non-null.");
938         processOptionalChunk(*Chunk.Optional, Signature, Signal);
939         break;
940       case CodeCompletionString::CK_VerticalSpace:
941         break;
942       case CodeCompletionString::CK_CurrentParameter:
943       case CodeCompletionString::CK_Placeholder:
944         processParameterChunk(Chunk.Text, Signature);
945         Signal.NumberOfOptionalParameters++;
946         break;
947       default:
948         Signature.label += Chunk.Text;
949         break;
950       }
951     }
952   }
953 
954   // FIXME(ioeric): consider moving CodeCompletionString logic here to
955   // CompletionString.h.
956   ScoredSignature processOverloadCandidate(const OverloadCandidate &Candidate,
957                                            const CodeCompletionString &CCS,
958                                            llvm::StringRef DocComment) const {
959     SignatureInformation Signature;
960     SignatureQualitySignals Signal;
961     const char *ReturnType = nullptr;
962 
963     Signature.documentation = formatDocumentation(CCS, DocComment);
964     Signal.Kind = Candidate.getKind();
965 
966     for (const auto &Chunk : CCS) {
967       switch (Chunk.Kind) {
968       case CodeCompletionString::CK_ResultType:
969         // A piece of text that describes the type of an entity or,
970         // for functions and methods, the return type.
971         assert(!ReturnType && "Unexpected CK_ResultType");
972         ReturnType = Chunk.Text;
973         break;
974       case CodeCompletionString::CK_CurrentParameter:
975       case CodeCompletionString::CK_Placeholder:
976         processParameterChunk(Chunk.Text, Signature);
977         Signal.NumberOfParameters++;
978         break;
979       case CodeCompletionString::CK_Optional: {
980         // The rest of the parameters are defaulted/optional.
981         assert(Chunk.Optional &&
982                "Expected the optional code completion string to be non-null.");
983         processOptionalChunk(*Chunk.Optional, Signature, Signal);
984         break;
985       }
986       case CodeCompletionString::CK_VerticalSpace:
987         break;
988       default:
989         Signature.label += Chunk.Text;
990         break;
991       }
992     }
993     if (ReturnType) {
994       Signature.label += " -> ";
995       Signature.label += ReturnType;
996     }
997     dlog("Signal for {0}: {1}", Signature, Signal);
998     ScoredSignature Result;
999     Result.Signature = std::move(Signature);
1000     Result.Quality = Signal;
1001     Result.IDForDoc =
1002         Result.Signature.documentation.empty() && Candidate.getFunction()
1003             ? clangd::getSymbolID(Candidate.getFunction())
1004             : None;
1005     return Result;
1006   }
1007 
1008   SignatureHelp &SigHelp;
1009   std::shared_ptr<clang::GlobalCodeCompletionAllocator> Allocator;
1010   CodeCompletionTUInfo CCTUInfo;
1011   const SymbolIndex *Index;
1012 }; // SignatureHelpCollector
1013 
1014 struct SemaCompleteInput {
1015   PathRef FileName;
1016   const tooling::CompileCommand &Command;
1017   const PreambleData *Preamble;
1018   llvm::StringRef Contents;
1019   size_t Offset;
1020   llvm::IntrusiveRefCntPtr<llvm::vfs::FileSystem> VFS;
1021 };
1022 
1023 void loadMainFilePreambleMacros(const Preprocessor &PP,
1024                                 const PreambleData &Preamble) {
1025   // The ExternalPreprocessorSource has our macros, if we know where to look.
1026   // We can read all the macros using PreambleMacros->ReadDefinedMacros(),
1027   // but this includes transitively included files, so may deserialize a lot.
1028   ExternalPreprocessorSource *PreambleMacros = PP.getExternalSource();
1029   // As we have the names of the macros, we can look up their IdentifierInfo
1030   // and then use this to load just the macros we want.
1031   IdentifierInfoLookup *PreambleIdentifiers =
1032       PP.getIdentifierTable().getExternalIdentifierLookup();
1033   if (!PreambleIdentifiers || !PreambleMacros)
1034     return;
1035   for (const auto &MacroName : Preamble.MainFileMacros)
1036     if (auto *II = PreambleIdentifiers->get(MacroName))
1037       if (II->isOutOfDate())
1038         PreambleMacros->updateOutOfDateIdentifier(*II);
1039 }
1040 
1041 // Invokes Sema code completion on a file.
1042 // If \p Includes is set, it will be updated based on the compiler invocation.
1043 bool semaCodeComplete(std::unique_ptr<CodeCompleteConsumer> Consumer,
1044                       const clang::CodeCompleteOptions &Options,
1045                       const SemaCompleteInput &Input,
1046                       IncludeStructure *Includes = nullptr) {
1047   trace::Span Tracer("Sema completion");
1048   llvm::IntrusiveRefCntPtr<llvm::vfs::FileSystem> VFS = Input.VFS;
1049   if (Input.Preamble && Input.Preamble->StatCache)
1050     VFS = Input.Preamble->StatCache->getConsumingFS(std::move(VFS));
1051   ParseInputs ParseInput;
1052   ParseInput.CompileCommand = Input.Command;
1053   ParseInput.FS = VFS;
1054   ParseInput.Contents = Input.Contents;
1055   ParseInput.Opts = ParseOptions();
1056 
1057   IgnoreDiagnostics IgnoreDiags;
1058   auto CI = buildCompilerInvocation(ParseInput, IgnoreDiags);
1059   if (!CI) {
1060     elog("Couldn't create CompilerInvocation");
1061     return false;
1062   }
1063   auto &FrontendOpts = CI->getFrontendOpts();
1064   FrontendOpts.SkipFunctionBodies = true;
1065   // Disable typo correction in Sema.
1066   CI->getLangOpts()->SpellChecking = false;
1067   // Setup code completion.
1068   FrontendOpts.CodeCompleteOpts = Options;
1069   FrontendOpts.CodeCompletionAt.FileName = Input.FileName;
1070   std::tie(FrontendOpts.CodeCompletionAt.Line,
1071            FrontendOpts.CodeCompletionAt.Column) =
1072       offsetToClangLineColumn(Input.Contents, Input.Offset);
1073 
1074   std::unique_ptr<llvm::MemoryBuffer> ContentsBuffer =
1075       llvm::MemoryBuffer::getMemBufferCopy(Input.Contents, Input.FileName);
1076   // The diagnostic options must be set before creating a CompilerInstance.
1077   CI->getDiagnosticOpts().IgnoreWarnings = true;
1078   // We reuse the preamble whether it's valid or not. This is a
1079   // correctness/performance tradeoff: building without a preamble is slow, and
1080   // completion is latency-sensitive.
1081   // However, if we're completing *inside* the preamble section of the draft,
1082   // overriding the preamble will break sema completion. Fortunately we can just
1083   // skip all includes in this case; these completions are really simple.
1084   PreambleBounds PreambleRegion =
1085       ComputePreambleBounds(*CI->getLangOpts(), ContentsBuffer.get(), 0);
1086   bool CompletingInPreamble = PreambleRegion.Size > Input.Offset;
1087   // NOTE: we must call BeginSourceFile after prepareCompilerInstance. Otherwise
1088   // the remapped buffers do not get freed.
1089   auto Clang = prepareCompilerInstance(
1090       std::move(CI),
1091       (Input.Preamble && !CompletingInPreamble) ? &Input.Preamble->Preamble
1092                                                 : nullptr,
1093       std::move(ContentsBuffer), std::move(VFS), IgnoreDiags);
1094   Clang->getPreprocessorOpts().SingleFileParseMode = CompletingInPreamble;
1095   Clang->setCodeCompletionConsumer(Consumer.release());
1096 
1097   SyntaxOnlyAction Action;
1098   if (!Action.BeginSourceFile(*Clang, Clang->getFrontendOpts().Inputs[0])) {
1099     log("BeginSourceFile() failed when running codeComplete for {0}",
1100         Input.FileName);
1101     return false;
1102   }
1103   // Macros can be defined within the preamble region of the main file.
1104   // They don't fall nicely into our index/Sema dichotomy:
1105   //  - they're not indexed for completion (they're not available across files)
1106   //  - but Sema code complete won't see them: as part of the preamble, they're
1107   //    deserialized only when mentioned.
1108   // Force them to be deserialized so SemaCodeComplete sees them.
1109   if (Input.Preamble)
1110     loadMainFilePreambleMacros(Clang->getPreprocessor(), *Input.Preamble);
1111   if (Includes)
1112     Clang->getPreprocessor().addPPCallbacks(
1113         collectIncludeStructureCallback(Clang->getSourceManager(), Includes));
1114   if (llvm::Error Err = Action.Execute()) {
1115     log("Execute() failed when running codeComplete for {0}: {1}",
1116         Input.FileName, toString(std::move(Err)));
1117     return false;
1118   }
1119   Action.EndSourceFile();
1120 
1121   return true;
1122 }
1123 
1124 // Should we allow index completions in the specified context?
1125 bool allowIndex(CodeCompletionContext &CC) {
1126   if (!contextAllowsIndex(CC.getKind()))
1127     return false;
1128   // We also avoid ClassName::bar (but allow namespace::bar).
1129   auto Scope = CC.getCXXScopeSpecifier();
1130   if (!Scope)
1131     return true;
1132   NestedNameSpecifier *NameSpec = (*Scope)->getScopeRep();
1133   if (!NameSpec)
1134     return true;
1135   // We only query the index when qualifier is a namespace.
1136   // If it's a class, we rely solely on sema completions.
1137   switch (NameSpec->getKind()) {
1138   case NestedNameSpecifier::Global:
1139   case NestedNameSpecifier::Namespace:
1140   case NestedNameSpecifier::NamespaceAlias:
1141     return true;
1142   case NestedNameSpecifier::Super:
1143   case NestedNameSpecifier::TypeSpec:
1144   case NestedNameSpecifier::TypeSpecWithTemplate:
1145   // Unresolved inside a template.
1146   case NestedNameSpecifier::Identifier:
1147     return false;
1148   }
1149   llvm_unreachable("invalid NestedNameSpecifier kind");
1150 }
1151 
1152 std::future<SymbolSlab> startAsyncFuzzyFind(const SymbolIndex &Index,
1153                                             const FuzzyFindRequest &Req) {
1154   return runAsync<SymbolSlab>([&Index, Req]() {
1155     trace::Span Tracer("Async fuzzyFind");
1156     SymbolSlab::Builder Syms;
1157     Index.fuzzyFind(Req, [&Syms](const Symbol &Sym) { Syms.insert(Sym); });
1158     return std::move(Syms).build();
1159   });
1160 }
1161 
1162 // Creates a `FuzzyFindRequest` based on the cached index request from the
1163 // last completion, if any, and the speculated completion filter text in the
1164 // source code.
1165 FuzzyFindRequest speculativeFuzzyFindRequestForCompletion(
1166     FuzzyFindRequest CachedReq, const CompletionPrefix &HeuristicPrefix) {
1167   CachedReq.Query = HeuristicPrefix.Name;
1168   return CachedReq;
1169 }
1170 
1171 // Runs Sema-based (AST) and Index-based completion, returns merged results.
1172 //
1173 // There are a few tricky considerations:
1174 //   - the AST provides information needed for the index query (e.g. which
1175 //     namespaces to search in). So Sema must start first.
1176 //   - we only want to return the top results (Opts.Limit).
1177 //     Building CompletionItems for everything else is wasteful, so we want to
1178 //     preserve the "native" format until we're done with scoring.
1179 //   - the data underlying Sema completion items is owned by the AST and various
1180 //     other arenas, which must stay alive for us to build CompletionItems.
1181 //   - we may get duplicate results from Sema and the Index, we need to merge.
1182 //
1183 // So we start Sema completion first, and do all our work in its callback.
1184 // We use the Sema context information to query the index.
1185 // Then we merge the two result sets, producing items that are Sema/Index/Both.
1186 // These items are scored, and the top N are synthesized into the LSP response.
1187 // Finally, we can clean up the data structures created by Sema completion.
1188 //
1189 // Main collaborators are:
1190 //   - semaCodeComplete sets up the compiler machinery to run code completion.
1191 //   - CompletionRecorder captures Sema completion results, including context.
1192 //   - SymbolIndex (Opts.Index) provides index completion results as Symbols
1193 //   - CompletionCandidates are the result of merging Sema and Index results.
1194 //     Each candidate points to an underlying CodeCompletionResult (Sema), a
1195 //     Symbol (Index), or both. It computes the result quality score.
1196 //     CompletionCandidate also does conversion to CompletionItem (at the end).
1197 //   - FuzzyMatcher scores how the candidate matches the partial identifier.
1198 //     This score is combined with the result quality score for the final score.
1199 //   - TopN determines the results with the best score.
1200 class CodeCompleteFlow {
1201   PathRef FileName;
1202   IncludeStructure Includes;           // Complete once the compiler runs.
1203   SpeculativeFuzzyFind *SpecFuzzyFind; // Can be nullptr.
1204   const CodeCompleteOptions &Opts;
1205 
1206   // Sema takes ownership of Recorder. Recorder is valid until Sema cleanup.
1207   CompletionRecorder *Recorder = nullptr;
1208   CodeCompletionContext::Kind CCContextKind = CodeCompletionContext::CCC_Other;
1209   // Counters for logging.
1210   int NSema = 0, NIndex = 0, NSemaAndIndex = 0, NIdent = 0;
1211   bool Incomplete = false; // Would more be available with a higher limit?
1212   CompletionPrefix HeuristicPrefix;
1213   llvm::Optional<FuzzyMatcher> Filter; // Initialized once Sema runs.
1214   Range ReplacedRange;
1215   std::vector<std::string> QueryScopes; // Initialized once Sema runs.
1216   // Initialized once QueryScopes is initialized, if there are scopes.
1217   llvm::Optional<ScopeDistance> ScopeProximity;
1218   llvm::Optional<OpaqueType> PreferredType; // Initialized once Sema runs.
1219   // Whether to query symbols from any scope. Initialized once Sema runs.
1220   bool AllScopes = false;
1221   llvm::StringSet<> ContextWords;
1222   // Include-insertion and proximity scoring rely on the include structure.
1223   // This is available after Sema has run.
1224   llvm::Optional<IncludeInserter> Inserter;  // Available during runWithSema.
1225   llvm::Optional<URIDistance> FileProximity; // Initialized once Sema runs.
1226   /// Speculative request based on the cached request and the filter text before
1227   /// the cursor.
1228   /// Initialized right before sema run. This is only set if `SpecFuzzyFind` is
1229   /// set and contains a cached request.
1230   llvm::Optional<FuzzyFindRequest> SpecReq;
1231 
1232 public:
1233   // A CodeCompleteFlow object is only useful for calling run() exactly once.
1234   CodeCompleteFlow(PathRef FileName, const IncludeStructure &Includes,
1235                    SpeculativeFuzzyFind *SpecFuzzyFind,
1236                    const CodeCompleteOptions &Opts)
1237       : FileName(FileName), Includes(Includes), SpecFuzzyFind(SpecFuzzyFind),
1238         Opts(Opts) {}
1239 
1240   CodeCompleteResult run(const SemaCompleteInput &SemaCCInput) && {
1241     trace::Span Tracer("CodeCompleteFlow");
1242     HeuristicPrefix =
1243         guessCompletionPrefix(SemaCCInput.Contents, SemaCCInput.Offset);
1244     populateContextWords(SemaCCInput.Contents);
1245     if (Opts.Index && SpecFuzzyFind && SpecFuzzyFind->CachedReq.hasValue()) {
1246       assert(!SpecFuzzyFind->Result.valid());
1247       SpecReq = speculativeFuzzyFindRequestForCompletion(
1248           *SpecFuzzyFind->CachedReq, HeuristicPrefix);
1249       SpecFuzzyFind->Result = startAsyncFuzzyFind(*Opts.Index, *SpecReq);
1250     }
1251 
1252     // We run Sema code completion first. It builds an AST and calculates:
1253     //   - completion results based on the AST.
1254     //   - partial identifier and context. We need these for the index query.
1255     CodeCompleteResult Output;
1256     auto RecorderOwner = std::make_unique<CompletionRecorder>(Opts, [&]() {
1257       assert(Recorder && "Recorder is not set");
1258       CCContextKind = Recorder->CCContext.getKind();
1259       auto Style = getFormatStyleForFile(
1260           SemaCCInput.FileName, SemaCCInput.Contents, SemaCCInput.VFS.get());
1261       // If preprocessor was run, inclusions from preprocessor callback should
1262       // already be added to Includes.
1263       Inserter.emplace(
1264           SemaCCInput.FileName, SemaCCInput.Contents, Style,
1265           SemaCCInput.Command.Directory,
1266           &Recorder->CCSema->getPreprocessor().getHeaderSearchInfo());
1267       for (const auto &Inc : Includes.MainFileIncludes)
1268         Inserter->addExisting(Inc);
1269 
1270       // Most of the cost of file proximity is in initializing the FileDistance
1271       // structures based on the observed includes, once per query. Conceptually
1272       // that happens here (though the per-URI-scheme initialization is lazy).
1273       // The per-result proximity scoring is (amortized) very cheap.
1274       FileDistanceOptions ProxOpts{}; // Use defaults.
1275       const auto &SM = Recorder->CCSema->getSourceManager();
1276       llvm::StringMap<SourceParams> ProxSources;
1277       for (auto &Entry : Includes.includeDepth(
1278                SM.getFileEntryForID(SM.getMainFileID())->getName())) {
1279         auto &Source = ProxSources[Entry.getKey()];
1280         Source.Cost = Entry.getValue() * ProxOpts.IncludeCost;
1281         // Symbols near our transitive includes are good, but only consider
1282         // things in the same directory or below it. Otherwise there can be
1283         // many false positives.
1284         if (Entry.getValue() > 0)
1285           Source.MaxUpTraversals = 1;
1286       }
1287       FileProximity.emplace(ProxSources, ProxOpts);
1288 
1289       Output = runWithSema();
1290       Inserter.reset(); // Make sure this doesn't out-live Clang.
1291       SPAN_ATTACH(Tracer, "sema_completion_kind",
1292                   getCompletionKindString(CCContextKind));
1293       log("Code complete: sema context {0}, query scopes [{1}] (AnyScope={2}), "
1294           "expected type {3}",
1295           getCompletionKindString(CCContextKind),
1296           llvm::join(QueryScopes.begin(), QueryScopes.end(), ","), AllScopes,
1297           PreferredType ? Recorder->CCContext.getPreferredType().getAsString()
1298                         : "<none>");
1299     });
1300 
1301     Recorder = RecorderOwner.get();
1302 
1303     semaCodeComplete(std::move(RecorderOwner), Opts.getClangCompleteOpts(),
1304                      SemaCCInput, &Includes);
1305     logResults(Output, Tracer);
1306     return Output;
1307   }
1308 
1309   void logResults(const CodeCompleteResult &Output, const trace::Span &Tracer) {
1310     SPAN_ATTACH(Tracer, "sema_results", NSema);
1311     SPAN_ATTACH(Tracer, "index_results", NIndex);
1312     SPAN_ATTACH(Tracer, "merged_results", NSemaAndIndex);
1313     SPAN_ATTACH(Tracer, "identifier_results", NIdent);
1314     SPAN_ATTACH(Tracer, "returned_results", int64_t(Output.Completions.size()));
1315     SPAN_ATTACH(Tracer, "incomplete", Output.HasMore);
1316     log("Code complete: {0} results from Sema, {1} from Index, "
1317         "{2} matched, {3} from identifiers, {4} returned{5}.",
1318         NSema, NIndex, NSemaAndIndex, NIdent, Output.Completions.size(),
1319         Output.HasMore ? " (incomplete)" : "");
1320     assert(!Opts.Limit || Output.Completions.size() <= Opts.Limit);
1321     // We don't assert that isIncomplete means we hit a limit.
1322     // Indexes may choose to impose their own limits even if we don't have one.
1323   }
1324 
1325   CodeCompleteResult
1326   runWithoutSema(llvm::StringRef Content, size_t Offset,
1327                  llvm::IntrusiveRefCntPtr<llvm::vfs::FileSystem> VFS) && {
1328     trace::Span Tracer("CodeCompleteWithoutSema");
1329     // Fill in fields normally set by runWithSema()
1330     HeuristicPrefix = guessCompletionPrefix(Content, Offset);
1331     populateContextWords(Content);
1332     CCContextKind = CodeCompletionContext::CCC_Recovery;
1333     Filter = FuzzyMatcher(HeuristicPrefix.Name);
1334     auto Pos = offsetToPosition(Content, Offset);
1335     ReplacedRange.start = ReplacedRange.end = Pos;
1336     ReplacedRange.start.character -= HeuristicPrefix.Name.size();
1337 
1338     llvm::StringMap<SourceParams> ProxSources;
1339     ProxSources[FileName].Cost = 0;
1340     FileProximity.emplace(ProxSources);
1341 
1342     auto Style = getFormatStyleForFile(FileName, Content, VFS.get());
1343     // This will only insert verbatim headers.
1344     Inserter.emplace(FileName, Content, Style,
1345                      /*BuildDir=*/"", /*HeaderSearchInfo=*/nullptr);
1346 
1347     auto Identifiers = collectIdentifiers(Content, Style);
1348     std::vector<RawIdentifier> IdentifierResults;
1349     for (const auto &IDAndCount : Identifiers) {
1350       RawIdentifier ID;
1351       ID.Name = IDAndCount.first();
1352       ID.References = IDAndCount.second;
1353       // Avoid treating typed filter as an identifier.
1354       if (ID.Name == HeuristicPrefix.Name)
1355         --ID.References;
1356       if (ID.References > 0)
1357         IdentifierResults.push_back(std::move(ID));
1358     }
1359 
1360     // Simplified version of getQueryScopes():
1361     //  - accessible scopes are determined heuristically.
1362     //  - all-scopes query if no qualifier was typed (and it's allowed).
1363     SpecifiedScope Scopes;
1364     Scopes.AccessibleScopes =
1365         visibleNamespaces(Content.take_front(Offset), Style);
1366     for (std::string &S : Scopes.AccessibleScopes)
1367       if (!S.empty())
1368         S.append("::"); // visibleNamespaces doesn't include trailing ::.
1369     if (HeuristicPrefix.Qualifier.empty())
1370       AllScopes = Opts.AllScopes;
1371     else if (HeuristicPrefix.Qualifier.startswith("::")) {
1372       Scopes.AccessibleScopes = {""};
1373       Scopes.UnresolvedQualifier = HeuristicPrefix.Qualifier.drop_front(2);
1374     } else
1375       Scopes.UnresolvedQualifier = HeuristicPrefix.Qualifier;
1376     // First scope is the (modified) enclosing scope.
1377     QueryScopes = Scopes.scopesForIndexQuery();
1378     ScopeProximity.emplace(QueryScopes);
1379 
1380     SymbolSlab IndexResults = Opts.Index ? queryIndex() : SymbolSlab();
1381 
1382     CodeCompleteResult Output = toCodeCompleteResult(mergeResults(
1383         /*SemaResults=*/{}, IndexResults, IdentifierResults));
1384     Output.RanParser = false;
1385     logResults(Output, Tracer);
1386     return Output;
1387   }
1388 
1389 private:
1390   void populateContextWords(llvm::StringRef Content) {
1391     // Take last 3 lines before the completion point.
1392     unsigned RangeEnd = HeuristicPrefix.Qualifier.begin() - Content.data(),
1393              RangeBegin = RangeEnd;
1394     for (size_t I = 0; I < 3 && RangeBegin > 0; ++I) {
1395       auto PrevNL = Content.rfind('\n', RangeBegin);
1396       if (PrevNL == StringRef::npos) {
1397         RangeBegin = 0;
1398         break;
1399       }
1400       RangeBegin = PrevNL;
1401     }
1402 
1403     ContextWords = collectWords(Content.slice(RangeBegin, RangeEnd));
1404     dlog("Completion context words: {0}",
1405          llvm::join(ContextWords.keys(), ", "));
1406   }
1407 
1408   // This is called by run() once Sema code completion is done, but before the
1409   // Sema data structures are torn down. It does all the real work.
1410   CodeCompleteResult runWithSema() {
1411     const auto &CodeCompletionRange = CharSourceRange::getCharRange(
1412         Recorder->CCSema->getPreprocessor().getCodeCompletionTokenRange());
1413     // When we are getting completions with an empty identifier, for example
1414     //    std::vector<int> asdf;
1415     //    asdf.^;
1416     // Then the range will be invalid and we will be doing insertion, use
1417     // current cursor position in such cases as range.
1418     if (CodeCompletionRange.isValid()) {
1419       ReplacedRange = halfOpenToRange(Recorder->CCSema->getSourceManager(),
1420                                       CodeCompletionRange);
1421     } else {
1422       const auto &Pos = sourceLocToPosition(
1423           Recorder->CCSema->getSourceManager(),
1424           Recorder->CCSema->getPreprocessor().getCodeCompletionLoc());
1425       ReplacedRange.start = ReplacedRange.end = Pos;
1426     }
1427     Filter = FuzzyMatcher(
1428         Recorder->CCSema->getPreprocessor().getCodeCompletionFilter());
1429     std::tie(QueryScopes, AllScopes) = getQueryScopes(
1430         Recorder->CCContext, *Recorder->CCSema, HeuristicPrefix, Opts);
1431     if (!QueryScopes.empty())
1432       ScopeProximity.emplace(QueryScopes);
1433     PreferredType =
1434         OpaqueType::fromType(Recorder->CCSema->getASTContext(),
1435                              Recorder->CCContext.getPreferredType());
1436     // Sema provides the needed context to query the index.
1437     // FIXME: in addition to querying for extra/overlapping symbols, we should
1438     //        explicitly request symbols corresponding to Sema results.
1439     //        We can use their signals even if the index can't suggest them.
1440     // We must copy index results to preserve them, but there are at most Limit.
1441     auto IndexResults = (Opts.Index && allowIndex(Recorder->CCContext))
1442                             ? queryIndex()
1443                             : SymbolSlab();
1444     trace::Span Tracer("Populate CodeCompleteResult");
1445     // Merge Sema and Index results, score them, and pick the winners.
1446     auto Top =
1447         mergeResults(Recorder->Results, IndexResults, /*Identifiers*/ {});
1448     return toCodeCompleteResult(Top);
1449   }
1450 
1451   CodeCompleteResult
1452   toCodeCompleteResult(const std::vector<ScoredBundle> &Scored) {
1453     CodeCompleteResult Output;
1454 
1455     // Convert the results to final form, assembling the expensive strings.
1456     for (auto &C : Scored) {
1457       Output.Completions.push_back(toCodeCompletion(C.first));
1458       Output.Completions.back().Score = C.second;
1459       Output.Completions.back().CompletionTokenRange = ReplacedRange;
1460     }
1461     Output.HasMore = Incomplete;
1462     Output.Context = CCContextKind;
1463     return Output;
1464   }
1465 
1466   SymbolSlab queryIndex() {
1467     trace::Span Tracer("Query index");
1468     SPAN_ATTACH(Tracer, "limit", int64_t(Opts.Limit));
1469 
1470     // Build the query.
1471     FuzzyFindRequest Req;
1472     if (Opts.Limit)
1473       Req.Limit = Opts.Limit;
1474     Req.Query = Filter->pattern();
1475     Req.RestrictForCodeCompletion = true;
1476     Req.Scopes = QueryScopes;
1477     Req.AnyScope = AllScopes;
1478     // FIXME: we should send multiple weighted paths here.
1479     Req.ProximityPaths.push_back(FileName);
1480     if (PreferredType)
1481       Req.PreferredTypes.push_back(PreferredType->raw());
1482     vlog("Code complete: fuzzyFind({0:2})", toJSON(Req));
1483 
1484     if (SpecFuzzyFind)
1485       SpecFuzzyFind->NewReq = Req;
1486     if (SpecFuzzyFind && SpecFuzzyFind->Result.valid() && (*SpecReq == Req)) {
1487       vlog("Code complete: speculative fuzzy request matches the actual index "
1488            "request. Waiting for the speculative index results.");
1489       SPAN_ATTACH(Tracer, "Speculative results", true);
1490 
1491       trace::Span WaitSpec("Wait speculative results");
1492       return SpecFuzzyFind->Result.get();
1493     }
1494 
1495     SPAN_ATTACH(Tracer, "Speculative results", false);
1496 
1497     // Run the query against the index.
1498     SymbolSlab::Builder ResultsBuilder;
1499     if (Opts.Index->fuzzyFind(
1500             Req, [&](const Symbol &Sym) { ResultsBuilder.insert(Sym); }))
1501       Incomplete = true;
1502     return std::move(ResultsBuilder).build();
1503   }
1504 
1505   // Merges Sema and Index results where possible, to form CompletionCandidates.
1506   // \p Identifiers is raw idenfiers that can also be completion condidates.
1507   // Identifiers are not merged with results from index or sema.
1508   // Groups overloads if desired, to form CompletionCandidate::Bundles. The
1509   // bundles are scored and top results are returned, best to worst.
1510   std::vector<ScoredBundle>
1511   mergeResults(const std::vector<CodeCompletionResult> &SemaResults,
1512                const SymbolSlab &IndexResults,
1513                const std::vector<RawIdentifier> &IdentifierResults) {
1514     trace::Span Tracer("Merge and score results");
1515     std::vector<CompletionCandidate::Bundle> Bundles;
1516     llvm::DenseMap<size_t, size_t> BundleLookup;
1517     auto AddToBundles = [&](const CodeCompletionResult *SemaResult,
1518                             const Symbol *IndexResult,
1519                             const RawIdentifier *IdentifierResult) {
1520       CompletionCandidate C;
1521       C.SemaResult = SemaResult;
1522       C.IndexResult = IndexResult;
1523       C.IdentifierResult = IdentifierResult;
1524       if (C.IndexResult) {
1525         C.Name = IndexResult->Name;
1526         C.RankedIncludeHeaders = getRankedIncludes(*C.IndexResult);
1527       } else if (C.SemaResult) {
1528         C.Name = Recorder->getName(*SemaResult);
1529       } else {
1530         assert(IdentifierResult);
1531         C.Name = IdentifierResult->Name;
1532       }
1533       if (auto OverloadSet = C.overloadSet(Opts)) {
1534         auto Ret = BundleLookup.try_emplace(OverloadSet, Bundles.size());
1535         if (Ret.second)
1536           Bundles.emplace_back();
1537         Bundles[Ret.first->second].push_back(std::move(C));
1538       } else {
1539         Bundles.emplace_back();
1540         Bundles.back().push_back(std::move(C));
1541       }
1542     };
1543     llvm::DenseSet<const Symbol *> UsedIndexResults;
1544     auto CorrespondingIndexResult =
1545         [&](const CodeCompletionResult &SemaResult) -> const Symbol * {
1546       if (auto SymID =
1547               getSymbolID(SemaResult, Recorder->CCSema->getSourceManager())) {
1548         auto I = IndexResults.find(*SymID);
1549         if (I != IndexResults.end()) {
1550           UsedIndexResults.insert(&*I);
1551           return &*I;
1552         }
1553       }
1554       return nullptr;
1555     };
1556     // Emit all Sema results, merging them with Index results if possible.
1557     for (auto &SemaResult : SemaResults)
1558       AddToBundles(&SemaResult, CorrespondingIndexResult(SemaResult), nullptr);
1559     // Now emit any Index-only results.
1560     for (const auto &IndexResult : IndexResults) {
1561       if (UsedIndexResults.count(&IndexResult))
1562         continue;
1563       AddToBundles(/*SemaResult=*/nullptr, &IndexResult, nullptr);
1564     }
1565     // Emit identifier results.
1566     for (const auto &Ident : IdentifierResults)
1567       AddToBundles(/*SemaResult=*/nullptr, /*IndexResult=*/nullptr, &Ident);
1568     // We only keep the best N results at any time, in "native" format.
1569     TopN<ScoredBundle, ScoredBundleGreater> Top(
1570         Opts.Limit == 0 ? std::numeric_limits<size_t>::max() : Opts.Limit);
1571     for (auto &Bundle : Bundles)
1572       addCandidate(Top, std::move(Bundle));
1573     return std::move(Top).items();
1574   }
1575 
1576   llvm::Optional<float> fuzzyScore(const CompletionCandidate &C) {
1577     // Macros can be very spammy, so we only support prefix completion.
1578     // We won't end up with underfull index results, as macros are sema-only.
1579     if (C.SemaResult && C.SemaResult->Kind == CodeCompletionResult::RK_Macro &&
1580         !C.Name.startswith_lower(Filter->pattern()))
1581       return None;
1582     return Filter->match(C.Name);
1583   }
1584 
1585   // Scores a candidate and adds it to the TopN structure.
1586   void addCandidate(TopN<ScoredBundle, ScoredBundleGreater> &Candidates,
1587                     CompletionCandidate::Bundle Bundle) {
1588     SymbolQualitySignals Quality;
1589     SymbolRelevanceSignals Relevance;
1590     Relevance.Context = CCContextKind;
1591     Relevance.Name = Bundle.front().Name;
1592     Relevance.Query = SymbolRelevanceSignals::CodeComplete;
1593     Relevance.FileProximityMatch = FileProximity.getPointer();
1594     if (ScopeProximity)
1595       Relevance.ScopeProximityMatch = ScopeProximity.getPointer();
1596     if (PreferredType)
1597       Relevance.HadContextType = true;
1598     Relevance.ContextWords = &ContextWords;
1599 
1600     auto &First = Bundle.front();
1601     if (auto FuzzyScore = fuzzyScore(First))
1602       Relevance.NameMatch = *FuzzyScore;
1603     else
1604       return;
1605     SymbolOrigin Origin = SymbolOrigin::Unknown;
1606     bool FromIndex = false;
1607     for (const auto &Candidate : Bundle) {
1608       if (Candidate.IndexResult) {
1609         Quality.merge(*Candidate.IndexResult);
1610         Relevance.merge(*Candidate.IndexResult);
1611         Origin |= Candidate.IndexResult->Origin;
1612         FromIndex = true;
1613         if (!Candidate.IndexResult->Type.empty())
1614           Relevance.HadSymbolType |= true;
1615         if (PreferredType &&
1616             PreferredType->raw() == Candidate.IndexResult->Type) {
1617           Relevance.TypeMatchesPreferred = true;
1618         }
1619       }
1620       if (Candidate.SemaResult) {
1621         Quality.merge(*Candidate.SemaResult);
1622         Relevance.merge(*Candidate.SemaResult);
1623         if (PreferredType) {
1624           if (auto CompletionType = OpaqueType::fromCompletionResult(
1625                   Recorder->CCSema->getASTContext(), *Candidate.SemaResult)) {
1626             Relevance.HadSymbolType |= true;
1627             if (PreferredType == CompletionType)
1628               Relevance.TypeMatchesPreferred = true;
1629           }
1630         }
1631         Origin |= SymbolOrigin::AST;
1632       }
1633       if (Candidate.IdentifierResult) {
1634         Quality.References = Candidate.IdentifierResult->References;
1635         Relevance.Scope = SymbolRelevanceSignals::FileScope;
1636         Origin |= SymbolOrigin::Identifier;
1637       }
1638     }
1639 
1640     CodeCompletion::Scores Scores;
1641     Scores.Quality = Quality.evaluate();
1642     Scores.Relevance = Relevance.evaluate();
1643     Scores.Total = evaluateSymbolAndRelevance(Scores.Quality, Scores.Relevance);
1644     // NameMatch is in fact a multiplier on total score, so rescoring is sound.
1645     Scores.ExcludingName = Relevance.NameMatch
1646                                ? Scores.Total / Relevance.NameMatch
1647                                : Scores.Quality;
1648 
1649     dlog("CodeComplete: {0} ({1}) = {2}\n{3}{4}\n", First.Name,
1650          llvm::to_string(Origin), Scores.Total, llvm::to_string(Quality),
1651          llvm::to_string(Relevance));
1652 
1653     NSema += bool(Origin & SymbolOrigin::AST);
1654     NIndex += FromIndex;
1655     NSemaAndIndex += bool(Origin & SymbolOrigin::AST) && FromIndex;
1656     NIdent += bool(Origin & SymbolOrigin::Identifier);
1657     if (Candidates.push({std::move(Bundle), Scores}))
1658       Incomplete = true;
1659   }
1660 
1661   CodeCompletion toCodeCompletion(const CompletionCandidate::Bundle &Bundle) {
1662     llvm::Optional<CodeCompletionBuilder> Builder;
1663     for (const auto &Item : Bundle) {
1664       CodeCompletionString *SemaCCS =
1665           Item.SemaResult ? Recorder->codeCompletionString(*Item.SemaResult)
1666                           : nullptr;
1667       if (!Builder)
1668         Builder.emplace(Recorder ? &Recorder->CCSema->getASTContext() : nullptr,
1669                         Item, SemaCCS, QueryScopes, *Inserter, FileName,
1670                         CCContextKind, Opts);
1671       else
1672         Builder->add(Item, SemaCCS);
1673     }
1674     return Builder->build();
1675   }
1676 };
1677 
1678 } // namespace
1679 
1680 clang::CodeCompleteOptions CodeCompleteOptions::getClangCompleteOpts() const {
1681   clang::CodeCompleteOptions Result;
1682   Result.IncludeCodePatterns = EnableSnippets && IncludeCodePatterns;
1683   Result.IncludeMacros = IncludeMacros;
1684   Result.IncludeGlobals = true;
1685   // We choose to include full comments and not do doxygen parsing in
1686   // completion.
1687   // FIXME: ideally, we should support doxygen in some form, e.g. do markdown
1688   // formatting of the comments.
1689   Result.IncludeBriefComments = false;
1690 
1691   // When an is used, Sema is responsible for completing the main file,
1692   // the index can provide results from the preamble.
1693   // Tell Sema not to deserialize the preamble to look for results.
1694   Result.LoadExternal = !Index;
1695   Result.IncludeFixIts = IncludeFixIts;
1696 
1697   return Result;
1698 }
1699 
1700 CompletionPrefix guessCompletionPrefix(llvm::StringRef Content,
1701                                        unsigned Offset) {
1702   assert(Offset <= Content.size());
1703   StringRef Rest = Content.take_front(Offset);
1704   CompletionPrefix Result;
1705 
1706   // Consume the unqualified name. We only handle ASCII characters.
1707   // isIdentifierBody will let us match "0invalid", but we don't mind.
1708   while (!Rest.empty() && isIdentifierBody(Rest.back()))
1709     Rest = Rest.drop_back();
1710   Result.Name = Content.slice(Rest.size(), Offset);
1711 
1712   // Consume qualifiers.
1713   while (Rest.consume_back("::") && !Rest.endswith(":")) // reject ::::
1714     while (!Rest.empty() && isIdentifierBody(Rest.back()))
1715       Rest = Rest.drop_back();
1716   Result.Qualifier =
1717       Content.slice(Rest.size(), Result.Name.begin() - Content.begin());
1718 
1719   return Result;
1720 }
1721 
1722 CodeCompleteResult
1723 codeComplete(PathRef FileName, const tooling::CompileCommand &Command,
1724              const PreambleData *Preamble, llvm::StringRef Contents,
1725              Position Pos, llvm::IntrusiveRefCntPtr<llvm::vfs::FileSystem> VFS,
1726              CodeCompleteOptions Opts, SpeculativeFuzzyFind *SpecFuzzyFind) {
1727   auto Offset = positionToOffset(Contents, Pos);
1728   if (!Offset) {
1729     elog("Code completion position was invalid {0}", Offset.takeError());
1730     return CodeCompleteResult();
1731   }
1732   auto Flow = CodeCompleteFlow(
1733       FileName, Preamble ? Preamble->Includes : IncludeStructure(),
1734       SpecFuzzyFind, Opts);
1735   return (!Preamble || Opts.RunParser == CodeCompleteOptions::NeverParse)
1736              ? std::move(Flow).runWithoutSema(Contents, *Offset, VFS)
1737              : std::move(Flow).run(
1738                    {FileName, Command, Preamble, Contents, *Offset, VFS});
1739 }
1740 
1741 SignatureHelp signatureHelp(PathRef FileName,
1742                             const tooling::CompileCommand &Command,
1743                             const PreambleData *Preamble,
1744                             llvm::StringRef Contents, Position Pos,
1745                             llvm::IntrusiveRefCntPtr<llvm::vfs::FileSystem> VFS,
1746                             const SymbolIndex *Index) {
1747   auto Offset = positionToOffset(Contents, Pos);
1748   if (!Offset) {
1749     elog("Code completion position was invalid {0}", Offset.takeError());
1750     return SignatureHelp();
1751   }
1752   SignatureHelp Result;
1753   clang::CodeCompleteOptions Options;
1754   Options.IncludeGlobals = false;
1755   Options.IncludeMacros = false;
1756   Options.IncludeCodePatterns = false;
1757   Options.IncludeBriefComments = false;
1758   IncludeStructure PreambleInclusions; // Unused for signatureHelp
1759   semaCodeComplete(
1760       std::make_unique<SignatureHelpCollector>(Options, Index, Result),
1761       Options,
1762       {FileName, Command, Preamble, Contents, *Offset, std::move(VFS)});
1763   return Result;
1764 }
1765 
1766 bool isIndexedForCodeCompletion(const NamedDecl &ND, ASTContext &ASTCtx) {
1767   auto InTopLevelScope = [](const NamedDecl &ND) {
1768     switch (ND.getDeclContext()->getDeclKind()) {
1769     case Decl::TranslationUnit:
1770     case Decl::Namespace:
1771     case Decl::LinkageSpec:
1772       return true;
1773     default:
1774       break;
1775     };
1776     return false;
1777   };
1778   // We only complete symbol's name, which is the same as the name of the
1779   // *primary* template in case of template specializations.
1780   if (isExplicitTemplateSpecialization(&ND))
1781     return false;
1782 
1783   if (InTopLevelScope(ND))
1784     return true;
1785 
1786   if (const auto *EnumDecl = dyn_cast<clang::EnumDecl>(ND.getDeclContext()))
1787     return InTopLevelScope(*EnumDecl) && !EnumDecl->isScoped();
1788 
1789   return false;
1790 }
1791 
1792 CompletionItem CodeCompletion::render(const CodeCompleteOptions &Opts) const {
1793   CompletionItem LSP;
1794   const auto *InsertInclude = Includes.empty() ? nullptr : &Includes[0];
1795   LSP.label = ((InsertInclude && InsertInclude->Insertion)
1796                    ? Opts.IncludeIndicator.Insert
1797                    : Opts.IncludeIndicator.NoInsert) +
1798               (Opts.ShowOrigins ? "[" + llvm::to_string(Origin) + "]" : "") +
1799               RequiredQualifier + Name + Signature;
1800 
1801   LSP.kind = Kind;
1802   LSP.detail = BundleSize > 1 ? llvm::formatv("[{0} overloads]", BundleSize)
1803                               : ReturnType;
1804   LSP.deprecated = Deprecated;
1805   if (InsertInclude)
1806     LSP.detail += "\n" + InsertInclude->Header;
1807   LSP.documentation = Documentation;
1808   LSP.sortText = sortText(Score.Total, Name);
1809   LSP.filterText = Name;
1810   LSP.textEdit = {CompletionTokenRange, RequiredQualifier + Name};
1811   // Merge continuous additionalTextEdits into main edit. The main motivation
1812   // behind this is to help LSP clients, it seems most of them are confused when
1813   // they are provided with additionalTextEdits that are consecutive to main
1814   // edit.
1815   // Note that we store additional text edits from back to front in a line. That
1816   // is mainly to help LSP clients again, so that changes do not effect each
1817   // other.
1818   for (const auto &FixIt : FixIts) {
1819     if (isRangeConsecutive(FixIt.range, LSP.textEdit->range)) {
1820       LSP.textEdit->newText = FixIt.newText + LSP.textEdit->newText;
1821       LSP.textEdit->range.start = FixIt.range.start;
1822     } else {
1823       LSP.additionalTextEdits.push_back(FixIt);
1824     }
1825   }
1826   if (Opts.EnableSnippets)
1827     LSP.textEdit->newText += SnippetSuffix;
1828 
1829   // FIXME(kadircet): Do not even fill insertText after making sure textEdit is
1830   // compatible with most of the editors.
1831   LSP.insertText = LSP.textEdit->newText;
1832   LSP.insertTextFormat = Opts.EnableSnippets ? InsertTextFormat::Snippet
1833                                              : InsertTextFormat::PlainText;
1834   if (InsertInclude && InsertInclude->Insertion)
1835     LSP.additionalTextEdits.push_back(*InsertInclude->Insertion);
1836 
1837   return LSP;
1838 }
1839 
1840 llvm::raw_ostream &operator<<(llvm::raw_ostream &OS, const CodeCompletion &C) {
1841   // For now just lean on CompletionItem.
1842   return OS << C.render(CodeCompleteOptions());
1843 }
1844 
1845 llvm::raw_ostream &operator<<(llvm::raw_ostream &OS,
1846                               const CodeCompleteResult &R) {
1847   OS << "CodeCompleteResult: " << R.Completions.size() << (R.HasMore ? "+" : "")
1848      << " (" << getCompletionKindString(R.Context) << ")"
1849      << " items:\n";
1850   for (const auto &C : R.Completions)
1851     OS << C << "\n";
1852   return OS;
1853 }
1854 
1855 } // namespace clangd
1856 } // namespace clang
1857