1 //===--- CodeComplete.cpp ----------------------------------------*- C++-*-===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // Code completion has several moving parts:
10 //  - AST-based completions are provided using the completion hooks in Sema.
11 //  - external completions are retrieved from the index (using hints from Sema)
12 //  - the two sources overlap, and must be merged and overloads bundled
13 //  - results must be scored and ranked (see Quality.h) before rendering
14 //
15 // Signature help works in a similar way as code completion, but it is simpler:
16 // it's purely AST-based, and there are few candidates.
17 //
18 //===----------------------------------------------------------------------===//
19 
20 #include "CodeComplete.h"
21 #include "AST.h"
22 #include "CodeCompletionStrings.h"
23 #include "Compiler.h"
24 #include "Diagnostics.h"
25 #include "ExpectedTypes.h"
26 #include "FileDistance.h"
27 #include "FuzzyMatch.h"
28 #include "Headers.h"
29 #include "Hover.h"
30 #include "Preamble.h"
31 #include "Protocol.h"
32 #include "Quality.h"
33 #include "SourceCode.h"
34 #include "TUScheduler.h"
35 #include "URI.h"
36 #include "index/Index.h"
37 #include "index/Symbol.h"
38 #include "index/SymbolOrigin.h"
39 #include "support/Logger.h"
40 #include "support/Threading.h"
41 #include "support/ThreadsafeFS.h"
42 #include "support/Trace.h"
43 #include "clang/AST/Decl.h"
44 #include "clang/AST/DeclBase.h"
45 #include "clang/Basic/CharInfo.h"
46 #include "clang/Basic/LangOptions.h"
47 #include "clang/Basic/SourceLocation.h"
48 #include "clang/Basic/TokenKinds.h"
49 #include "clang/Format/Format.h"
50 #include "clang/Frontend/CompilerInstance.h"
51 #include "clang/Frontend/FrontendActions.h"
52 #include "clang/Lex/ExternalPreprocessorSource.h"
53 #include "clang/Lex/Lexer.h"
54 #include "clang/Lex/Preprocessor.h"
55 #include "clang/Lex/PreprocessorOptions.h"
56 #include "clang/Sema/CodeCompleteConsumer.h"
57 #include "clang/Sema/DeclSpec.h"
58 #include "clang/Sema/Sema.h"
59 #include "llvm/ADT/ArrayRef.h"
60 #include "llvm/ADT/None.h"
61 #include "llvm/ADT/Optional.h"
62 #include "llvm/ADT/SmallVector.h"
63 #include "llvm/ADT/StringExtras.h"
64 #include "llvm/ADT/StringRef.h"
65 #include "llvm/Support/Casting.h"
66 #include "llvm/Support/Compiler.h"
67 #include "llvm/Support/Debug.h"
68 #include "llvm/Support/Error.h"
69 #include "llvm/Support/Format.h"
70 #include "llvm/Support/FormatVariadic.h"
71 #include "llvm/Support/ScopedPrinter.h"
72 #include <algorithm>
73 #include <iterator>
74 #include <limits>
75 
76 // We log detailed candidate here if you run with -debug-only=codecomplete.
77 #define DEBUG_TYPE "CodeComplete"
78 
79 namespace clang {
80 namespace clangd {
81 namespace {
82 
83 CompletionItemKind toCompletionItemKind(index::SymbolKind Kind) {
84   using SK = index::SymbolKind;
85   switch (Kind) {
86   case SK::Unknown:
87     return CompletionItemKind::Missing;
88   case SK::Module:
89   case SK::Namespace:
90   case SK::NamespaceAlias:
91     return CompletionItemKind::Module;
92   case SK::Macro:
93     return CompletionItemKind::Text;
94   case SK::Enum:
95     return CompletionItemKind::Enum;
96   case SK::Struct:
97     return CompletionItemKind::Struct;
98   case SK::Class:
99   case SK::Protocol:
100   case SK::Extension:
101   case SK::Union:
102     return CompletionItemKind::Class;
103   case SK::TypeAlias:
104     // We use the same kind as the VSCode C++ extension.
105     // FIXME: pick a better option when we have one.
106     return CompletionItemKind::Interface;
107   case SK::Using:
108     return CompletionItemKind::Reference;
109   case SK::Function:
110   case SK::ConversionFunction:
111     return CompletionItemKind::Function;
112   case SK::Variable:
113   case SK::Parameter:
114   case SK::NonTypeTemplateParm:
115     return CompletionItemKind::Variable;
116   case SK::Field:
117     return CompletionItemKind::Field;
118   case SK::EnumConstant:
119     return CompletionItemKind::EnumMember;
120   case SK::InstanceMethod:
121   case SK::ClassMethod:
122   case SK::StaticMethod:
123   case SK::Destructor:
124     return CompletionItemKind::Method;
125   case SK::InstanceProperty:
126   case SK::ClassProperty:
127   case SK::StaticProperty:
128     return CompletionItemKind::Property;
129   case SK::Constructor:
130     return CompletionItemKind::Constructor;
131   case SK::TemplateTypeParm:
132   case SK::TemplateTemplateParm:
133     return CompletionItemKind::TypeParameter;
134   }
135   llvm_unreachable("Unhandled clang::index::SymbolKind.");
136 }
137 
138 CompletionItemKind
139 toCompletionItemKind(CodeCompletionResult::ResultKind ResKind,
140                      const NamedDecl *Decl,
141                      CodeCompletionContext::Kind CtxKind) {
142   if (Decl)
143     return toCompletionItemKind(index::getSymbolInfo(Decl).Kind);
144   if (CtxKind == CodeCompletionContext::CCC_IncludedFile)
145     return CompletionItemKind::File;
146   switch (ResKind) {
147   case CodeCompletionResult::RK_Declaration:
148     llvm_unreachable("RK_Declaration without Decl");
149   case CodeCompletionResult::RK_Keyword:
150     return CompletionItemKind::Keyword;
151   case CodeCompletionResult::RK_Macro:
152     return CompletionItemKind::Text; // unfortunately, there's no 'Macro'
153                                      // completion items in LSP.
154   case CodeCompletionResult::RK_Pattern:
155     return CompletionItemKind::Snippet;
156   }
157   llvm_unreachable("Unhandled CodeCompletionResult::ResultKind.");
158 }
159 
160 // Identifier code completion result.
161 struct RawIdentifier {
162   llvm::StringRef Name;
163   unsigned References; // # of usages in file.
164 };
165 
166 /// A code completion result, in clang-native form.
167 /// It may be promoted to a CompletionItem if it's among the top-ranked results.
168 struct CompletionCandidate {
169   llvm::StringRef Name; // Used for filtering and sorting.
170   // We may have a result from Sema, from the index, or both.
171   const CodeCompletionResult *SemaResult = nullptr;
172   const Symbol *IndexResult = nullptr;
173   const RawIdentifier *IdentifierResult = nullptr;
174   llvm::SmallVector<llvm::StringRef, 1> RankedIncludeHeaders;
175 
176   // Returns a token identifying the overload set this is part of.
177   // 0 indicates it's not part of any overload set.
178   size_t overloadSet(const CodeCompleteOptions &Opts, llvm::StringRef FileName,
179                      IncludeInserter *Inserter) const {
180     if (!Opts.BundleOverloads.getValueOr(false))
181       return 0;
182 
183     // Depending on the index implementation, we can see different header
184     // strings (literal or URI) mapping to the same file. We still want to
185     // bundle those, so we must resolve the header to be included here.
186     std::string HeaderForHash;
187     if (Inserter) {
188       if (auto Header = headerToInsertIfAllowed(Opts)) {
189         if (auto HeaderFile = toHeaderFile(*Header, FileName)) {
190           if (auto Spelled =
191                   Inserter->calculateIncludePath(*HeaderFile, FileName))
192             HeaderForHash = *Spelled;
193         } else {
194           vlog("Code completion header path manipulation failed {0}",
195                HeaderFile.takeError());
196         }
197       }
198     }
199 
200     llvm::SmallString<256> Scratch;
201     if (IndexResult) {
202       switch (IndexResult->SymInfo.Kind) {
203       case index::SymbolKind::ClassMethod:
204       case index::SymbolKind::InstanceMethod:
205       case index::SymbolKind::StaticMethod:
206 #ifndef NDEBUG
207         llvm_unreachable("Don't expect members from index in code completion");
208 #else
209         LLVM_FALLTHROUGH;
210 #endif
211       case index::SymbolKind::Function:
212         // We can't group overloads together that need different #includes.
213         // This could break #include insertion.
214         return llvm::hash_combine(
215             (IndexResult->Scope + IndexResult->Name).toStringRef(Scratch),
216             HeaderForHash);
217       default:
218         return 0;
219       }
220     }
221     if (SemaResult) {
222       // We need to make sure we're consistent with the IndexResult case!
223       const NamedDecl *D = SemaResult->Declaration;
224       if (!D || !D->isFunctionOrFunctionTemplate())
225         return 0;
226       {
227         llvm::raw_svector_ostream OS(Scratch);
228         D->printQualifiedName(OS);
229       }
230       return llvm::hash_combine(Scratch, HeaderForHash);
231     }
232     assert(IdentifierResult);
233     return 0;
234   }
235 
236   // The best header to include if include insertion is allowed.
237   llvm::Optional<llvm::StringRef>
238   headerToInsertIfAllowed(const CodeCompleteOptions &Opts) const {
239     if (Opts.InsertIncludes == CodeCompleteOptions::NeverInsert ||
240         RankedIncludeHeaders.empty())
241       return None;
242     if (SemaResult && SemaResult->Declaration) {
243       // Avoid inserting new #include if the declaration is found in the current
244       // file e.g. the symbol is forward declared.
245       auto &SM = SemaResult->Declaration->getASTContext().getSourceManager();
246       for (const Decl *RD : SemaResult->Declaration->redecls())
247         if (SM.isInMainFile(SM.getExpansionLoc(RD->getBeginLoc())))
248           return None;
249     }
250     return RankedIncludeHeaders[0];
251   }
252 
253   using Bundle = llvm::SmallVector<CompletionCandidate, 4>;
254 };
255 using ScoredBundle =
256     std::pair<CompletionCandidate::Bundle, CodeCompletion::Scores>;
257 struct ScoredBundleGreater {
258   bool operator()(const ScoredBundle &L, const ScoredBundle &R) {
259     if (L.second.Total != R.second.Total)
260       return L.second.Total > R.second.Total;
261     return L.first.front().Name <
262            R.first.front().Name; // Earlier name is better.
263   }
264 };
265 
266 // Assembles a code completion out of a bundle of >=1 completion candidates.
267 // Many of the expensive strings are only computed at this point, once we know
268 // the candidate bundle is going to be returned.
269 //
270 // Many fields are the same for all candidates in a bundle (e.g. name), and are
271 // computed from the first candidate, in the constructor.
272 // Others vary per candidate, so add() must be called for remaining candidates.
273 struct CodeCompletionBuilder {
274   CodeCompletionBuilder(ASTContext *ASTCtx, const CompletionCandidate &C,
275                         CodeCompletionString *SemaCCS,
276                         llvm::ArrayRef<std::string> QueryScopes,
277                         const IncludeInserter &Includes,
278                         llvm::StringRef FileName,
279                         CodeCompletionContext::Kind ContextKind,
280                         const CodeCompleteOptions &Opts,
281                         bool IsUsingDeclaration, tok::TokenKind NextTokenKind)
282       : ASTCtx(ASTCtx),
283         EnableFunctionArgSnippets(Opts.EnableFunctionArgSnippets),
284         IsUsingDeclaration(IsUsingDeclaration), NextTokenKind(NextTokenKind) {
285     Completion.Deprecated = true; // cleared by any non-deprecated overload.
286     add(C, SemaCCS);
287     if (C.SemaResult) {
288       assert(ASTCtx);
289       Completion.Origin |= SymbolOrigin::AST;
290       Completion.Name = std::string(llvm::StringRef(SemaCCS->getTypedText()));
291       if (Completion.Scope.empty()) {
292         if ((C.SemaResult->Kind == CodeCompletionResult::RK_Declaration) ||
293             (C.SemaResult->Kind == CodeCompletionResult::RK_Pattern))
294           if (const auto *D = C.SemaResult->getDeclaration())
295             if (const auto *ND = dyn_cast<NamedDecl>(D))
296               Completion.Scope = std::string(
297                   splitQualifiedName(printQualifiedName(*ND)).first);
298       }
299       Completion.Kind = toCompletionItemKind(
300           C.SemaResult->Kind, C.SemaResult->Declaration, ContextKind);
301       // Sema could provide more info on whether the completion was a file or
302       // folder.
303       if (Completion.Kind == CompletionItemKind::File &&
304           Completion.Name.back() == '/')
305         Completion.Kind = CompletionItemKind::Folder;
306       for (const auto &FixIt : C.SemaResult->FixIts) {
307         Completion.FixIts.push_back(toTextEdit(
308             FixIt, ASTCtx->getSourceManager(), ASTCtx->getLangOpts()));
309       }
310       llvm::sort(Completion.FixIts, [](const TextEdit &X, const TextEdit &Y) {
311         return std::tie(X.range.start.line, X.range.start.character) <
312                std::tie(Y.range.start.line, Y.range.start.character);
313       });
314     }
315     if (C.IndexResult) {
316       Completion.Origin |= C.IndexResult->Origin;
317       if (Completion.Scope.empty())
318         Completion.Scope = std::string(C.IndexResult->Scope);
319       if (Completion.Kind == CompletionItemKind::Missing)
320         Completion.Kind = toCompletionItemKind(C.IndexResult->SymInfo.Kind);
321       if (Completion.Name.empty())
322         Completion.Name = std::string(C.IndexResult->Name);
323       // If the completion was visible to Sema, no qualifier is needed. This
324       // avoids unneeded qualifiers in cases like with `using ns::X`.
325       if (Completion.RequiredQualifier.empty() && !C.SemaResult) {
326         llvm::StringRef ShortestQualifier = C.IndexResult->Scope;
327         for (llvm::StringRef Scope : QueryScopes) {
328           llvm::StringRef Qualifier = C.IndexResult->Scope;
329           if (Qualifier.consume_front(Scope) &&
330               Qualifier.size() < ShortestQualifier.size())
331             ShortestQualifier = Qualifier;
332         }
333         Completion.RequiredQualifier = std::string(ShortestQualifier);
334       }
335     }
336     if (C.IdentifierResult) {
337       Completion.Origin |= SymbolOrigin::Identifier;
338       Completion.Kind = CompletionItemKind::Text;
339       Completion.Name = std::string(C.IdentifierResult->Name);
340     }
341 
342     // Turn absolute path into a literal string that can be #included.
343     auto Inserted = [&](llvm::StringRef Header)
344         -> llvm::Expected<std::pair<std::string, bool>> {
345       auto ResolvedDeclaring =
346           URI::resolve(C.IndexResult->CanonicalDeclaration.FileURI, FileName);
347       if (!ResolvedDeclaring)
348         return ResolvedDeclaring.takeError();
349       auto ResolvedInserted = toHeaderFile(Header, FileName);
350       if (!ResolvedInserted)
351         return ResolvedInserted.takeError();
352       auto Spelled = Includes.calculateIncludePath(*ResolvedInserted, FileName);
353       if (!Spelled)
354         return error("Header not on include path");
355       return std::make_pair(
356           std::move(*Spelled),
357           Includes.shouldInsertInclude(*ResolvedDeclaring, *ResolvedInserted));
358     };
359     bool ShouldInsert = C.headerToInsertIfAllowed(Opts).hasValue();
360     // Calculate include paths and edits for all possible headers.
361     for (const auto &Inc : C.RankedIncludeHeaders) {
362       if (auto ToInclude = Inserted(Inc)) {
363         CodeCompletion::IncludeCandidate Include;
364         Include.Header = ToInclude->first;
365         if (ToInclude->second && ShouldInsert)
366           Include.Insertion = Includes.insert(ToInclude->first);
367         Completion.Includes.push_back(std::move(Include));
368       } else
369         log("Failed to generate include insertion edits for adding header "
370             "(FileURI='{0}', IncludeHeader='{1}') into {2}: {3}",
371             C.IndexResult->CanonicalDeclaration.FileURI, Inc, FileName,
372             ToInclude.takeError());
373     }
374     // Prefer includes that do not need edits (i.e. already exist).
375     std::stable_partition(Completion.Includes.begin(),
376                           Completion.Includes.end(),
377                           [](const CodeCompletion::IncludeCandidate &I) {
378                             return !I.Insertion.hasValue();
379                           });
380   }
381 
382   void add(const CompletionCandidate &C, CodeCompletionString *SemaCCS) {
383     assert(bool(C.SemaResult) == bool(SemaCCS));
384     Bundled.emplace_back();
385     BundledEntry &S = Bundled.back();
386     if (C.SemaResult) {
387       bool IsPattern = C.SemaResult->Kind == CodeCompletionResult::RK_Pattern;
388       getSignature(*SemaCCS, &S.Signature, &S.SnippetSuffix,
389                    &Completion.RequiredQualifier, IsPattern);
390       S.ReturnType = getReturnType(*SemaCCS);
391     } else if (C.IndexResult) {
392       S.Signature = std::string(C.IndexResult->Signature);
393       S.SnippetSuffix = std::string(C.IndexResult->CompletionSnippetSuffix);
394       S.ReturnType = std::string(C.IndexResult->ReturnType);
395     }
396     if (!Completion.Documentation) {
397       auto SetDoc = [&](llvm::StringRef Doc) {
398         if (!Doc.empty()) {
399           Completion.Documentation.emplace();
400           parseDocumentation(Doc, *Completion.Documentation);
401         }
402       };
403       if (C.IndexResult) {
404         SetDoc(C.IndexResult->Documentation);
405       } else if (C.SemaResult) {
406         const auto DocComment = getDocComment(*ASTCtx, *C.SemaResult,
407                                               /*CommentsFromHeader=*/false);
408         SetDoc(formatDocumentation(*SemaCCS, DocComment));
409       }
410     }
411     if (Completion.Deprecated) {
412       if (C.SemaResult)
413         Completion.Deprecated &=
414             C.SemaResult->Availability == CXAvailability_Deprecated;
415       if (C.IndexResult)
416         Completion.Deprecated &=
417             bool(C.IndexResult->Flags & Symbol::Deprecated);
418     }
419   }
420 
421   CodeCompletion build() {
422     Completion.ReturnType = summarizeReturnType();
423     Completion.Signature = summarizeSignature();
424     Completion.SnippetSuffix = summarizeSnippet();
425     Completion.BundleSize = Bundled.size();
426     return std::move(Completion);
427   }
428 
429 private:
430   struct BundledEntry {
431     std::string SnippetSuffix;
432     std::string Signature;
433     std::string ReturnType;
434   };
435 
436   // If all BundledEntries have the same value for a property, return it.
437   template <std::string BundledEntry::*Member>
438   const std::string *onlyValue() const {
439     auto B = Bundled.begin(), E = Bundled.end();
440     for (auto I = B + 1; I != E; ++I)
441       if (I->*Member != B->*Member)
442         return nullptr;
443     return &(B->*Member);
444   }
445 
446   template <bool BundledEntry::*Member> const bool *onlyValue() const {
447     auto B = Bundled.begin(), E = Bundled.end();
448     for (auto I = B + 1; I != E; ++I)
449       if (I->*Member != B->*Member)
450         return nullptr;
451     return &(B->*Member);
452   }
453 
454   std::string summarizeReturnType() const {
455     if (auto *RT = onlyValue<&BundledEntry::ReturnType>())
456       return *RT;
457     return "";
458   }
459 
460   std::string summarizeSnippet() const {
461     if (IsUsingDeclaration)
462       return "";
463     auto *Snippet = onlyValue<&BundledEntry::SnippetSuffix>();
464     if (!Snippet)
465       // All bundles are function calls.
466       // FIXME(ibiryukov): sometimes add template arguments to a snippet, e.g.
467       // we need to complete 'forward<$1>($0)'.
468       return "($0)";
469 
470     bool MayHaveArgList = Completion.Kind == CompletionItemKind::Function ||
471                           Completion.Kind == CompletionItemKind::Method ||
472                           Completion.Kind == CompletionItemKind::Constructor ||
473                           Completion.Kind == CompletionItemKind::Text /*Macro*/;
474     // If likely arg list already exists, don't add new parens & placeholders.
475     //   Snippet: function(int x, int y)
476     //   func^(1,2) -> function(1, 2)
477     //             NOT function(int x, int y)(1, 2)
478     if (MayHaveArgList) {
479       // Check for a template argument list in the code.
480       //   Snippet: function<class T>(int x)
481       //   fu^<int>(1) -> function<int>(1)
482       if (NextTokenKind == tok::less && Snippet->front() == '<')
483         return "";
484       // Potentially followed by regular argument list.
485       if (NextTokenKind == tok::l_paren) {
486         //   Snippet: function<class T>(int x)
487         //   fu^(1,2) -> function<class T>(1, 2)
488         if (Snippet->front() == '<') {
489           // Find matching '>', handling nested brackets.
490           int Balance = 0;
491           size_t I = 0;
492           do {
493             if (Snippet->at(I) == '>')
494               --Balance;
495             else if (Snippet->at(I) == '<')
496               ++Balance;
497             ++I;
498           } while (Balance > 0);
499           return Snippet->substr(0, I);
500         }
501         return "";
502       }
503     }
504     if (EnableFunctionArgSnippets)
505       return *Snippet;
506 
507     // Replace argument snippets with a simplified pattern.
508     if (Snippet->empty())
509       return "";
510     if (MayHaveArgList) {
511       // Functions snippets can be of 2 types:
512       // - containing only function arguments, e.g.
513       //   foo(${1:int p1}, ${2:int p2});
514       //   We transform this pattern to '($0)' or '()'.
515       // - template arguments and function arguments, e.g.
516       //   foo<${1:class}>(${2:int p1}).
517       //   We transform this pattern to '<$1>()$0' or '<$0>()'.
518 
519       bool EmptyArgs = llvm::StringRef(*Snippet).endswith("()");
520       if (Snippet->front() == '<')
521         return EmptyArgs ? "<$1>()$0" : "<$1>($0)";
522       if (Snippet->front() == '(')
523         return EmptyArgs ? "()" : "($0)";
524       return *Snippet; // Not an arg snippet?
525     }
526     // 'CompletionItemKind::Interface' matches template type aliases.
527     if (Completion.Kind == CompletionItemKind::Interface ||
528         Completion.Kind == CompletionItemKind::Class) {
529       if (Snippet->front() != '<')
530         return *Snippet; // Not an arg snippet?
531 
532       // Classes and template using aliases can only have template arguments,
533       // e.g. Foo<${1:class}>.
534       if (llvm::StringRef(*Snippet).endswith("<>"))
535         return "<>"; // can happen with defaulted template arguments.
536       return "<$0>";
537     }
538     return *Snippet;
539   }
540 
541   std::string summarizeSignature() const {
542     if (auto *Signature = onlyValue<&BundledEntry::Signature>())
543       return *Signature;
544     // All bundles are function calls.
545     return "(…)";
546   }
547 
548   // ASTCtx can be nullptr if not run with sema.
549   ASTContext *ASTCtx;
550   CodeCompletion Completion;
551   llvm::SmallVector<BundledEntry, 1> Bundled;
552   bool EnableFunctionArgSnippets;
553   // No snippets will be generated for using declarations and when the function
554   // arguments are already present.
555   bool IsUsingDeclaration;
556   tok::TokenKind NextTokenKind;
557 };
558 
559 // Determine the symbol ID for a Sema code completion result, if possible.
560 SymbolID getSymbolID(const CodeCompletionResult &R, const SourceManager &SM) {
561   switch (R.Kind) {
562   case CodeCompletionResult::RK_Declaration:
563   case CodeCompletionResult::RK_Pattern: {
564     // Computing USR caches linkage, which may change after code completion.
565     if (hasUnstableLinkage(R.Declaration))
566       return {};
567     return clang::clangd::getSymbolID(R.Declaration);
568   }
569   case CodeCompletionResult::RK_Macro:
570     return clang::clangd::getSymbolID(R.Macro->getName(), R.MacroDefInfo, SM);
571   case CodeCompletionResult::RK_Keyword:
572     return {};
573   }
574   llvm_unreachable("unknown CodeCompletionResult kind");
575 }
576 
577 // Scopes of the partial identifier we're trying to complete.
578 // It is used when we query the index for more completion results.
579 struct SpecifiedScope {
580   // The scopes we should look in, determined by Sema.
581   //
582   // If the qualifier was fully resolved, we look for completions in these
583   // scopes; if there is an unresolved part of the qualifier, it should be
584   // resolved within these scopes.
585   //
586   // Examples of qualified completion:
587   //
588   //   "::vec"                                      => {""}
589   //   "using namespace std; ::vec^"                => {"", "std::"}
590   //   "namespace ns {using namespace std;} ns::^"  => {"ns::", "std::"}
591   //   "std::vec^"                                  => {""}  // "std" unresolved
592   //
593   // Examples of unqualified completion:
594   //
595   //   "vec^"                                       => {""}
596   //   "using namespace std; vec^"                  => {"", "std::"}
597   //   "using namespace std; namespace ns { vec^ }" => {"ns::", "std::", ""}
598   //
599   // "" for global namespace, "ns::" for normal namespace.
600   std::vector<std::string> AccessibleScopes;
601   // The full scope qualifier as typed by the user (without the leading "::").
602   // Set if the qualifier is not fully resolved by Sema.
603   llvm::Optional<std::string> UnresolvedQualifier;
604 
605   // Construct scopes being queried in indexes. The results are deduplicated.
606   // This method format the scopes to match the index request representation.
607   std::vector<std::string> scopesForIndexQuery() {
608     std::set<std::string> Results;
609     for (llvm::StringRef AS : AccessibleScopes)
610       Results.insert(
611           (AS + (UnresolvedQualifier ? *UnresolvedQualifier : "")).str());
612     return {Results.begin(), Results.end()};
613   }
614 };
615 
616 // Get all scopes that will be queried in indexes and whether symbols from
617 // any scope is allowed. The first scope in the list is the preferred scope
618 // (e.g. enclosing namespace).
619 std::pair<std::vector<std::string>, bool>
620 getQueryScopes(CodeCompletionContext &CCContext, const Sema &CCSema,
621                const CompletionPrefix &HeuristicPrefix,
622                const CodeCompleteOptions &Opts) {
623   SpecifiedScope Scopes;
624   for (auto *Context : CCContext.getVisitedContexts()) {
625     if (isa<TranslationUnitDecl>(Context))
626       Scopes.AccessibleScopes.push_back(""); // global namespace
627     else if (isa<NamespaceDecl>(Context))
628       Scopes.AccessibleScopes.push_back(printNamespaceScope(*Context));
629   }
630 
631   const CXXScopeSpec *SemaSpecifier =
632       CCContext.getCXXScopeSpecifier().getValueOr(nullptr);
633   // Case 1: unqualified completion.
634   if (!SemaSpecifier) {
635     // Case 2 (exception): sema saw no qualifier, but there appears to be one!
636     // This can happen e.g. in incomplete macro expansions. Use heuristics.
637     if (!HeuristicPrefix.Qualifier.empty()) {
638       vlog("Sema said no scope specifier, but we saw {0} in the source code",
639            HeuristicPrefix.Qualifier);
640       StringRef SpelledSpecifier = HeuristicPrefix.Qualifier;
641       if (SpelledSpecifier.consume_front("::"))
642         Scopes.AccessibleScopes = {""};
643       Scopes.UnresolvedQualifier = std::string(SpelledSpecifier);
644       return {Scopes.scopesForIndexQuery(), false};
645     }
646     // The enclosing namespace must be first, it gets a quality boost.
647     std::vector<std::string> EnclosingAtFront;
648     std::string EnclosingScope = printNamespaceScope(*CCSema.CurContext);
649     EnclosingAtFront.push_back(EnclosingScope);
650     for (auto &S : Scopes.scopesForIndexQuery()) {
651       if (EnclosingScope != S)
652         EnclosingAtFront.push_back(std::move(S));
653     }
654     // Allow AllScopes completion as there is no explicit scope qualifier.
655     return {EnclosingAtFront, Opts.AllScopes};
656   }
657   // Case 3: sema saw and resolved a scope qualifier.
658   if (SemaSpecifier && SemaSpecifier->isValid())
659     return {Scopes.scopesForIndexQuery(), false};
660 
661   // Case 4: There was a qualifier, and Sema didn't resolve it.
662   Scopes.AccessibleScopes.push_back(""); // Make sure global scope is included.
663   llvm::StringRef SpelledSpecifier = Lexer::getSourceText(
664       CharSourceRange::getCharRange(SemaSpecifier->getRange()),
665       CCSema.SourceMgr, clang::LangOptions());
666   if (SpelledSpecifier.consume_front("::"))
667     Scopes.AccessibleScopes = {""};
668   Scopes.UnresolvedQualifier = std::string(SpelledSpecifier);
669   // Sema excludes the trailing "::".
670   if (!Scopes.UnresolvedQualifier->empty())
671     *Scopes.UnresolvedQualifier += "::";
672 
673   return {Scopes.scopesForIndexQuery(), false};
674 }
675 
676 // Should we perform index-based completion in a context of the specified kind?
677 // FIXME: consider allowing completion, but restricting the result types.
678 bool contextAllowsIndex(enum CodeCompletionContext::Kind K) {
679   switch (K) {
680   case CodeCompletionContext::CCC_TopLevel:
681   case CodeCompletionContext::CCC_ObjCInterface:
682   case CodeCompletionContext::CCC_ObjCImplementation:
683   case CodeCompletionContext::CCC_ObjCIvarList:
684   case CodeCompletionContext::CCC_ClassStructUnion:
685   case CodeCompletionContext::CCC_Statement:
686   case CodeCompletionContext::CCC_Expression:
687   case CodeCompletionContext::CCC_ObjCMessageReceiver:
688   case CodeCompletionContext::CCC_EnumTag:
689   case CodeCompletionContext::CCC_UnionTag:
690   case CodeCompletionContext::CCC_ClassOrStructTag:
691   case CodeCompletionContext::CCC_ObjCProtocolName:
692   case CodeCompletionContext::CCC_Namespace:
693   case CodeCompletionContext::CCC_Type:
694   case CodeCompletionContext::CCC_ParenthesizedExpression:
695   case CodeCompletionContext::CCC_ObjCInterfaceName:
696   case CodeCompletionContext::CCC_ObjCCategoryName:
697   case CodeCompletionContext::CCC_Symbol:
698   case CodeCompletionContext::CCC_SymbolOrNewName:
699     return true;
700   case CodeCompletionContext::CCC_OtherWithMacros:
701   case CodeCompletionContext::CCC_DotMemberAccess:
702   case CodeCompletionContext::CCC_ArrowMemberAccess:
703   case CodeCompletionContext::CCC_ObjCPropertyAccess:
704   case CodeCompletionContext::CCC_MacroName:
705   case CodeCompletionContext::CCC_MacroNameUse:
706   case CodeCompletionContext::CCC_PreprocessorExpression:
707   case CodeCompletionContext::CCC_PreprocessorDirective:
708   case CodeCompletionContext::CCC_SelectorName:
709   case CodeCompletionContext::CCC_TypeQualifiers:
710   case CodeCompletionContext::CCC_ObjCInstanceMessage:
711   case CodeCompletionContext::CCC_ObjCClassMessage:
712   case CodeCompletionContext::CCC_IncludedFile:
713   case CodeCompletionContext::CCC_Attribute:
714   // FIXME: Provide identifier based completions for the following contexts:
715   case CodeCompletionContext::CCC_Other: // Be conservative.
716   case CodeCompletionContext::CCC_NaturalLanguage:
717   case CodeCompletionContext::CCC_Recovery:
718   case CodeCompletionContext::CCC_NewName:
719     return false;
720   }
721   llvm_unreachable("unknown code completion context");
722 }
723 
724 static bool isInjectedClass(const NamedDecl &D) {
725   if (auto *R = dyn_cast_or_null<RecordDecl>(&D))
726     if (R->isInjectedClassName())
727       return true;
728   return false;
729 }
730 
731 // Some member calls are excluded because they're so rarely useful.
732 static bool isExcludedMember(const NamedDecl &D) {
733   // Destructor completion is rarely useful, and works inconsistently.
734   // (s.^ completes ~string, but s.~st^ is an error).
735   if (D.getKind() == Decl::CXXDestructor)
736     return true;
737   // Injected name may be useful for A::foo(), but who writes A::A::foo()?
738   if (isInjectedClass(D))
739     return true;
740   // Explicit calls to operators are also rare.
741   auto NameKind = D.getDeclName().getNameKind();
742   if (NameKind == DeclarationName::CXXOperatorName ||
743       NameKind == DeclarationName::CXXLiteralOperatorName ||
744       NameKind == DeclarationName::CXXConversionFunctionName)
745     return true;
746   return false;
747 }
748 
749 // The CompletionRecorder captures Sema code-complete output, including context.
750 // It filters out ignored results (but doesn't apply fuzzy-filtering yet).
751 // It doesn't do scoring or conversion to CompletionItem yet, as we want to
752 // merge with index results first.
753 // Generally the fields and methods of this object should only be used from
754 // within the callback.
755 struct CompletionRecorder : public CodeCompleteConsumer {
756   CompletionRecorder(const CodeCompleteOptions &Opts,
757                      llvm::unique_function<void()> ResultsCallback)
758       : CodeCompleteConsumer(Opts.getClangCompleteOpts()),
759         CCContext(CodeCompletionContext::CCC_Other), Opts(Opts),
760         CCAllocator(std::make_shared<GlobalCodeCompletionAllocator>()),
761         CCTUInfo(CCAllocator), ResultsCallback(std::move(ResultsCallback)) {
762     assert(this->ResultsCallback);
763   }
764 
765   std::vector<CodeCompletionResult> Results;
766   CodeCompletionContext CCContext;
767   Sema *CCSema = nullptr; // Sema that created the results.
768   // FIXME: Sema is scary. Can we store ASTContext and Preprocessor, instead?
769 
770   void ProcessCodeCompleteResults(class Sema &S, CodeCompletionContext Context,
771                                   CodeCompletionResult *InResults,
772                                   unsigned NumResults) override final {
773     // Results from recovery mode are generally useless, and the callback after
774     // recovery (if any) is usually more interesting. To make sure we handle the
775     // future callback from sema, we just ignore all callbacks in recovery mode,
776     // as taking only results from recovery mode results in poor completion
777     // results.
778     // FIXME: in case there is no future sema completion callback after the
779     // recovery mode, we might still want to provide some results (e.g. trivial
780     // identifier-based completion).
781     if (Context.getKind() == CodeCompletionContext::CCC_Recovery) {
782       log("Code complete: Ignoring sema code complete callback with Recovery "
783           "context.");
784       return;
785     }
786     // If a callback is called without any sema result and the context does not
787     // support index-based completion, we simply skip it to give way to
788     // potential future callbacks with results.
789     if (NumResults == 0 && !contextAllowsIndex(Context.getKind()))
790       return;
791     if (CCSema) {
792       log("Multiple code complete callbacks (parser backtracked?). "
793           "Dropping results from context {0}, keeping results from {1}.",
794           getCompletionKindString(Context.getKind()),
795           getCompletionKindString(this->CCContext.getKind()));
796       return;
797     }
798     // Record the completion context.
799     CCSema = &S;
800     CCContext = Context;
801 
802     // Retain the results we might want.
803     for (unsigned I = 0; I < NumResults; ++I) {
804       auto &Result = InResults[I];
805       // Class members that are shadowed by subclasses are usually noise.
806       if (Result.Hidden && Result.Declaration &&
807           Result.Declaration->isCXXClassMember())
808         continue;
809       if (!Opts.IncludeIneligibleResults &&
810           (Result.Availability == CXAvailability_NotAvailable ||
811            Result.Availability == CXAvailability_NotAccessible))
812         continue;
813       if (Result.Declaration &&
814           !Context.getBaseType().isNull() // is this a member-access context?
815           && isExcludedMember(*Result.Declaration))
816         continue;
817       // Skip injected class name when no class scope is not explicitly set.
818       // E.g. show injected A::A in `using A::A^` but not in "A^".
819       if (Result.Declaration && !Context.getCXXScopeSpecifier().hasValue() &&
820           isInjectedClass(*Result.Declaration))
821         continue;
822       // We choose to never append '::' to completion results in clangd.
823       Result.StartsNestedNameSpecifier = false;
824       Results.push_back(Result);
825     }
826     ResultsCallback();
827   }
828 
829   CodeCompletionAllocator &getAllocator() override { return *CCAllocator; }
830   CodeCompletionTUInfo &getCodeCompletionTUInfo() override { return CCTUInfo; }
831 
832   // Returns the filtering/sorting name for Result, which must be from Results.
833   // Returned string is owned by this recorder (or the AST).
834   llvm::StringRef getName(const CodeCompletionResult &Result) {
835     switch (Result.Kind) {
836     case CodeCompletionResult::RK_Declaration:
837       if (auto *ID = Result.Declaration->getIdentifier())
838         return ID->getName();
839       break;
840     case CodeCompletionResult::RK_Keyword:
841       return Result.Keyword;
842     case CodeCompletionResult::RK_Macro:
843       return Result.Macro->getName();
844     case CodeCompletionResult::RK_Pattern:
845       return Result.Pattern->getTypedText();
846     }
847     auto *CCS = codeCompletionString(Result);
848     return CCS->getTypedText();
849   }
850 
851   // Build a CodeCompletion string for R, which must be from Results.
852   // The CCS will be owned by this recorder.
853   CodeCompletionString *codeCompletionString(const CodeCompletionResult &R) {
854     // CodeCompletionResult doesn't seem to be const-correct. We own it, anyway.
855     return const_cast<CodeCompletionResult &>(R).CreateCodeCompletionString(
856         *CCSema, CCContext, *CCAllocator, CCTUInfo,
857         /*IncludeBriefComments=*/false);
858   }
859 
860 private:
861   CodeCompleteOptions Opts;
862   std::shared_ptr<GlobalCodeCompletionAllocator> CCAllocator;
863   CodeCompletionTUInfo CCTUInfo;
864   llvm::unique_function<void()> ResultsCallback;
865 };
866 
867 struct ScoredSignature {
868   // When not null, requires documentation to be requested from the index with
869   // this ID.
870   SymbolID IDForDoc;
871   SignatureInformation Signature;
872   SignatureQualitySignals Quality;
873 };
874 
875 class SignatureHelpCollector final : public CodeCompleteConsumer {
876 public:
877   SignatureHelpCollector(const clang::CodeCompleteOptions &CodeCompleteOpts,
878                          const SymbolIndex *Index, SignatureHelp &SigHelp)
879       : CodeCompleteConsumer(CodeCompleteOpts), SigHelp(SigHelp),
880         Allocator(std::make_shared<clang::GlobalCodeCompletionAllocator>()),
881         CCTUInfo(Allocator), Index(Index) {}
882 
883   void ProcessOverloadCandidates(Sema &S, unsigned CurrentArg,
884                                  OverloadCandidate *Candidates,
885                                  unsigned NumCandidates,
886                                  SourceLocation OpenParLoc) override {
887     assert(!OpenParLoc.isInvalid());
888     SourceManager &SrcMgr = S.getSourceManager();
889     OpenParLoc = SrcMgr.getFileLoc(OpenParLoc);
890     if (SrcMgr.isInMainFile(OpenParLoc))
891       SigHelp.argListStart = sourceLocToPosition(SrcMgr, OpenParLoc);
892     else
893       elog("Location oustide main file in signature help: {0}",
894            OpenParLoc.printToString(SrcMgr));
895 
896     std::vector<ScoredSignature> ScoredSignatures;
897     SigHelp.signatures.reserve(NumCandidates);
898     ScoredSignatures.reserve(NumCandidates);
899     // FIXME(rwols): How can we determine the "active overload candidate"?
900     // Right now the overloaded candidates seem to be provided in a "best fit"
901     // order, so I'm not too worried about this.
902     SigHelp.activeSignature = 0;
903     assert(CurrentArg <= (unsigned)std::numeric_limits<int>::max() &&
904            "too many arguments");
905     SigHelp.activeParameter = static_cast<int>(CurrentArg);
906     for (unsigned I = 0; I < NumCandidates; ++I) {
907       OverloadCandidate Candidate = Candidates[I];
908       // We want to avoid showing instantiated signatures, because they may be
909       // long in some cases (e.g. when 'T' is substituted with 'std::string', we
910       // would get 'std::basic_string<char>').
911       if (auto *Func = Candidate.getFunction()) {
912         if (auto *Pattern = Func->getTemplateInstantiationPattern())
913           Candidate = OverloadCandidate(Pattern);
914       }
915 
916       const auto *CCS = Candidate.CreateSignatureString(
917           CurrentArg, S, *Allocator, CCTUInfo, true);
918       assert(CCS && "Expected the CodeCompletionString to be non-null");
919       ScoredSignatures.push_back(processOverloadCandidate(
920           Candidate, *CCS,
921           Candidate.getFunction()
922               ? getDeclComment(S.getASTContext(), *Candidate.getFunction())
923               : ""));
924     }
925 
926     // Sema does not load the docs from the preamble, so we need to fetch extra
927     // docs from the index instead.
928     llvm::DenseMap<SymbolID, std::string> FetchedDocs;
929     if (Index) {
930       LookupRequest IndexRequest;
931       for (const auto &S : ScoredSignatures) {
932         if (!S.IDForDoc)
933           continue;
934         IndexRequest.IDs.insert(S.IDForDoc);
935       }
936       Index->lookup(IndexRequest, [&](const Symbol &S) {
937         if (!S.Documentation.empty())
938           FetchedDocs[S.ID] = std::string(S.Documentation);
939       });
940       log("SigHelp: requested docs for {0} symbols from the index, got {1} "
941           "symbols with non-empty docs in the response",
942           IndexRequest.IDs.size(), FetchedDocs.size());
943     }
944 
945     llvm::sort(ScoredSignatures, [](const ScoredSignature &L,
946                                     const ScoredSignature &R) {
947       // Ordering follows:
948       // - Less number of parameters is better.
949       // - Function is better than FunctionType which is better than
950       // Function Template.
951       // - High score is better.
952       // - Shorter signature is better.
953       // - Alphabetically smaller is better.
954       if (L.Quality.NumberOfParameters != R.Quality.NumberOfParameters)
955         return L.Quality.NumberOfParameters < R.Quality.NumberOfParameters;
956       if (L.Quality.NumberOfOptionalParameters !=
957           R.Quality.NumberOfOptionalParameters)
958         return L.Quality.NumberOfOptionalParameters <
959                R.Quality.NumberOfOptionalParameters;
960       if (L.Quality.Kind != R.Quality.Kind) {
961         using OC = CodeCompleteConsumer::OverloadCandidate;
962         switch (L.Quality.Kind) {
963         case OC::CK_Function:
964           return true;
965         case OC::CK_FunctionType:
966           return R.Quality.Kind != OC::CK_Function;
967         case OC::CK_FunctionTemplate:
968           return false;
969         }
970         llvm_unreachable("Unknown overload candidate type.");
971       }
972       if (L.Signature.label.size() != R.Signature.label.size())
973         return L.Signature.label.size() < R.Signature.label.size();
974       return L.Signature.label < R.Signature.label;
975     });
976 
977     for (auto &SS : ScoredSignatures) {
978       auto IndexDocIt =
979           SS.IDForDoc ? FetchedDocs.find(SS.IDForDoc) : FetchedDocs.end();
980       if (IndexDocIt != FetchedDocs.end())
981         SS.Signature.documentation = IndexDocIt->second;
982 
983       SigHelp.signatures.push_back(std::move(SS.Signature));
984     }
985   }
986 
987   GlobalCodeCompletionAllocator &getAllocator() override { return *Allocator; }
988 
989   CodeCompletionTUInfo &getCodeCompletionTUInfo() override { return CCTUInfo; }
990 
991 private:
992   void processParameterChunk(llvm::StringRef ChunkText,
993                              SignatureInformation &Signature) const {
994     // (!) this is O(n), should still be fast compared to building ASTs.
995     unsigned ParamStartOffset = lspLength(Signature.label);
996     unsigned ParamEndOffset = ParamStartOffset + lspLength(ChunkText);
997     // A piece of text that describes the parameter that corresponds to
998     // the code-completion location within a function call, message send,
999     // macro invocation, etc.
1000     Signature.label += ChunkText;
1001     ParameterInformation Info;
1002     Info.labelOffsets.emplace(ParamStartOffset, ParamEndOffset);
1003     // FIXME: only set 'labelOffsets' when all clients migrate out of it.
1004     Info.labelString = std::string(ChunkText);
1005 
1006     Signature.parameters.push_back(std::move(Info));
1007   }
1008 
1009   void processOptionalChunk(const CodeCompletionString &CCS,
1010                             SignatureInformation &Signature,
1011                             SignatureQualitySignals &Signal) const {
1012     for (const auto &Chunk : CCS) {
1013       switch (Chunk.Kind) {
1014       case CodeCompletionString::CK_Optional:
1015         assert(Chunk.Optional &&
1016                "Expected the optional code completion string to be non-null.");
1017         processOptionalChunk(*Chunk.Optional, Signature, Signal);
1018         break;
1019       case CodeCompletionString::CK_VerticalSpace:
1020         break;
1021       case CodeCompletionString::CK_CurrentParameter:
1022       case CodeCompletionString::CK_Placeholder:
1023         processParameterChunk(Chunk.Text, Signature);
1024         Signal.NumberOfOptionalParameters++;
1025         break;
1026       default:
1027         Signature.label += Chunk.Text;
1028         break;
1029       }
1030     }
1031   }
1032 
1033   // FIXME(ioeric): consider moving CodeCompletionString logic here to
1034   // CompletionString.h.
1035   ScoredSignature processOverloadCandidate(const OverloadCandidate &Candidate,
1036                                            const CodeCompletionString &CCS,
1037                                            llvm::StringRef DocComment) const {
1038     SignatureInformation Signature;
1039     SignatureQualitySignals Signal;
1040     const char *ReturnType = nullptr;
1041 
1042     Signature.documentation = formatDocumentation(CCS, DocComment);
1043     Signal.Kind = Candidate.getKind();
1044 
1045     for (const auto &Chunk : CCS) {
1046       switch (Chunk.Kind) {
1047       case CodeCompletionString::CK_ResultType:
1048         // A piece of text that describes the type of an entity or,
1049         // for functions and methods, the return type.
1050         assert(!ReturnType && "Unexpected CK_ResultType");
1051         ReturnType = Chunk.Text;
1052         break;
1053       case CodeCompletionString::CK_CurrentParameter:
1054       case CodeCompletionString::CK_Placeholder:
1055         processParameterChunk(Chunk.Text, Signature);
1056         Signal.NumberOfParameters++;
1057         break;
1058       case CodeCompletionString::CK_Optional: {
1059         // The rest of the parameters are defaulted/optional.
1060         assert(Chunk.Optional &&
1061                "Expected the optional code completion string to be non-null.");
1062         processOptionalChunk(*Chunk.Optional, Signature, Signal);
1063         break;
1064       }
1065       case CodeCompletionString::CK_VerticalSpace:
1066         break;
1067       default:
1068         Signature.label += Chunk.Text;
1069         break;
1070       }
1071     }
1072     if (ReturnType) {
1073       Signature.label += " -> ";
1074       Signature.label += ReturnType;
1075     }
1076     dlog("Signal for {0}: {1}", Signature, Signal);
1077     ScoredSignature Result;
1078     Result.Signature = std::move(Signature);
1079     Result.Quality = Signal;
1080     const FunctionDecl *Func = Candidate.getFunction();
1081     if (Func && Result.Signature.documentation.empty()) {
1082       // Computing USR caches linkage, which may change after code completion.
1083       if (!hasUnstableLinkage(Func))
1084         Result.IDForDoc = clangd::getSymbolID(Func);
1085     }
1086     return Result;
1087   }
1088 
1089   SignatureHelp &SigHelp;
1090   std::shared_ptr<clang::GlobalCodeCompletionAllocator> Allocator;
1091   CodeCompletionTUInfo CCTUInfo;
1092   const SymbolIndex *Index;
1093 }; // SignatureHelpCollector
1094 
1095 // Used only for completion of C-style comments in function call (i.e.
1096 // /*foo=*/7). Similar to SignatureHelpCollector, but needs to do less work.
1097 class ParamNameCollector final : public CodeCompleteConsumer {
1098 public:
1099   ParamNameCollector(const clang::CodeCompleteOptions &CodeCompleteOpts,
1100                      std::set<std::string> &ParamNames)
1101       : CodeCompleteConsumer(CodeCompleteOpts),
1102         Allocator(std::make_shared<clang::GlobalCodeCompletionAllocator>()),
1103         CCTUInfo(Allocator), ParamNames(ParamNames) {}
1104 
1105   void ProcessOverloadCandidates(Sema &S, unsigned CurrentArg,
1106                                  OverloadCandidate *Candidates,
1107                                  unsigned NumCandidates,
1108                                  SourceLocation OpenParLoc) override {
1109     assert(CurrentArg <= (unsigned)std::numeric_limits<int>::max() &&
1110            "too many arguments");
1111 
1112     for (unsigned I = 0; I < NumCandidates; ++I) {
1113       OverloadCandidate Candidate = Candidates[I];
1114       auto *Func = Candidate.getFunction();
1115       if (!Func || Func->getNumParams() <= CurrentArg)
1116         continue;
1117       auto *PVD = Func->getParamDecl(CurrentArg);
1118       if (!PVD)
1119         continue;
1120       auto *Ident = PVD->getIdentifier();
1121       if (!Ident)
1122         continue;
1123       auto Name = Ident->getName();
1124       if (!Name.empty())
1125         ParamNames.insert(Name.str());
1126     }
1127   }
1128 
1129 private:
1130   GlobalCodeCompletionAllocator &getAllocator() override { return *Allocator; }
1131 
1132   CodeCompletionTUInfo &getCodeCompletionTUInfo() override { return CCTUInfo; }
1133 
1134   std::shared_ptr<clang::GlobalCodeCompletionAllocator> Allocator;
1135   CodeCompletionTUInfo CCTUInfo;
1136   std::set<std::string> &ParamNames;
1137 };
1138 
1139 struct SemaCompleteInput {
1140   PathRef FileName;
1141   size_t Offset;
1142   const PreambleData &Preamble;
1143   const llvm::Optional<PreamblePatch> Patch;
1144   const ParseInputs &ParseInput;
1145 };
1146 
1147 void loadMainFilePreambleMacros(const Preprocessor &PP,
1148                                 const PreambleData &Preamble) {
1149   // The ExternalPreprocessorSource has our macros, if we know where to look.
1150   // We can read all the macros using PreambleMacros->ReadDefinedMacros(),
1151   // but this includes transitively included files, so may deserialize a lot.
1152   ExternalPreprocessorSource *PreambleMacros = PP.getExternalSource();
1153   // As we have the names of the macros, we can look up their IdentifierInfo
1154   // and then use this to load just the macros we want.
1155   const auto &ITable = PP.getIdentifierTable();
1156   IdentifierInfoLookup *PreambleIdentifiers =
1157       ITable.getExternalIdentifierLookup();
1158 
1159   if (!PreambleIdentifiers || !PreambleMacros)
1160     return;
1161   for (const auto &MacroName : Preamble.Macros.Names) {
1162     if (ITable.find(MacroName.getKey()) != ITable.end())
1163       continue;
1164     if (auto *II = PreambleIdentifiers->get(MacroName.getKey()))
1165       if (II->isOutOfDate())
1166         PreambleMacros->updateOutOfDateIdentifier(*II);
1167   }
1168 }
1169 
1170 // Invokes Sema code completion on a file.
1171 // If \p Includes is set, it will be updated based on the compiler invocation.
1172 bool semaCodeComplete(std::unique_ptr<CodeCompleteConsumer> Consumer,
1173                       const clang::CodeCompleteOptions &Options,
1174                       const SemaCompleteInput &Input,
1175                       IncludeStructure *Includes = nullptr) {
1176   trace::Span Tracer("Sema completion");
1177 
1178   IgnoreDiagnostics IgnoreDiags;
1179   auto CI = buildCompilerInvocation(Input.ParseInput, IgnoreDiags);
1180   if (!CI) {
1181     elog("Couldn't create CompilerInvocation");
1182     return false;
1183   }
1184   auto &FrontendOpts = CI->getFrontendOpts();
1185   FrontendOpts.SkipFunctionBodies = true;
1186   // Disable typo correction in Sema.
1187   CI->getLangOpts()->SpellChecking = false;
1188   // Code completion won't trigger in delayed template bodies.
1189   // This is on-by-default in windows to allow parsing SDK headers; we're only
1190   // disabling it for the main-file (not preamble).
1191   CI->getLangOpts()->DelayedTemplateParsing = false;
1192   // Setup code completion.
1193   FrontendOpts.CodeCompleteOpts = Options;
1194   FrontendOpts.CodeCompletionAt.FileName = std::string(Input.FileName);
1195   std::tie(FrontendOpts.CodeCompletionAt.Line,
1196            FrontendOpts.CodeCompletionAt.Column) =
1197       offsetToClangLineColumn(Input.ParseInput.Contents, Input.Offset);
1198 
1199   std::unique_ptr<llvm::MemoryBuffer> ContentsBuffer =
1200       llvm::MemoryBuffer::getMemBuffer(Input.ParseInput.Contents,
1201                                        Input.FileName);
1202   // The diagnostic options must be set before creating a CompilerInstance.
1203   CI->getDiagnosticOpts().IgnoreWarnings = true;
1204   // We reuse the preamble whether it's valid or not. This is a
1205   // correctness/performance tradeoff: building without a preamble is slow, and
1206   // completion is latency-sensitive.
1207   // However, if we're completing *inside* the preamble section of the draft,
1208   // overriding the preamble will break sema completion. Fortunately we can just
1209   // skip all includes in this case; these completions are really simple.
1210   PreambleBounds PreambleRegion =
1211       ComputePreambleBounds(*CI->getLangOpts(), *ContentsBuffer, 0);
1212   bool CompletingInPreamble = Input.Offset < PreambleRegion.Size ||
1213                               (!PreambleRegion.PreambleEndsAtStartOfLine &&
1214                                Input.Offset == PreambleRegion.Size);
1215   if (Input.Patch)
1216     Input.Patch->apply(*CI);
1217   // NOTE: we must call BeginSourceFile after prepareCompilerInstance. Otherwise
1218   // the remapped buffers do not get freed.
1219   llvm::IntrusiveRefCntPtr<llvm::vfs::FileSystem> VFS =
1220       Input.ParseInput.TFS->view(Input.ParseInput.CompileCommand.Directory);
1221   if (Input.Preamble.StatCache)
1222     VFS = Input.Preamble.StatCache->getConsumingFS(std::move(VFS));
1223   auto Clang = prepareCompilerInstance(
1224       std::move(CI), !CompletingInPreamble ? &Input.Preamble.Preamble : nullptr,
1225       std::move(ContentsBuffer), std::move(VFS), IgnoreDiags);
1226   Clang->getPreprocessorOpts().SingleFileParseMode = CompletingInPreamble;
1227   Clang->setCodeCompletionConsumer(Consumer.release());
1228 
1229   SyntaxOnlyAction Action;
1230   if (!Action.BeginSourceFile(*Clang, Clang->getFrontendOpts().Inputs[0])) {
1231     log("BeginSourceFile() failed when running codeComplete for {0}",
1232         Input.FileName);
1233     return false;
1234   }
1235   // Macros can be defined within the preamble region of the main file.
1236   // They don't fall nicely into our index/Sema dichotomy:
1237   //  - they're not indexed for completion (they're not available across files)
1238   //  - but Sema code complete won't see them: as part of the preamble, they're
1239   //    deserialized only when mentioned.
1240   // Force them to be deserialized so SemaCodeComplete sees them.
1241   loadMainFilePreambleMacros(Clang->getPreprocessor(), Input.Preamble);
1242   if (Includes)
1243     Clang->getPreprocessor().addPPCallbacks(
1244         Includes->collect(Clang->getSourceManager()));
1245   if (llvm::Error Err = Action.Execute()) {
1246     log("Execute() failed when running codeComplete for {0}: {1}",
1247         Input.FileName, toString(std::move(Err)));
1248     return false;
1249   }
1250   Action.EndSourceFile();
1251 
1252   return true;
1253 }
1254 
1255 // Should we allow index completions in the specified context?
1256 bool allowIndex(CodeCompletionContext &CC) {
1257   if (!contextAllowsIndex(CC.getKind()))
1258     return false;
1259   // We also avoid ClassName::bar (but allow namespace::bar).
1260   auto Scope = CC.getCXXScopeSpecifier();
1261   if (!Scope)
1262     return true;
1263   NestedNameSpecifier *NameSpec = (*Scope)->getScopeRep();
1264   if (!NameSpec)
1265     return true;
1266   // We only query the index when qualifier is a namespace.
1267   // If it's a class, we rely solely on sema completions.
1268   switch (NameSpec->getKind()) {
1269   case NestedNameSpecifier::Global:
1270   case NestedNameSpecifier::Namespace:
1271   case NestedNameSpecifier::NamespaceAlias:
1272     return true;
1273   case NestedNameSpecifier::Super:
1274   case NestedNameSpecifier::TypeSpec:
1275   case NestedNameSpecifier::TypeSpecWithTemplate:
1276   // Unresolved inside a template.
1277   case NestedNameSpecifier::Identifier:
1278     return false;
1279   }
1280   llvm_unreachable("invalid NestedNameSpecifier kind");
1281 }
1282 
1283 std::future<SymbolSlab> startAsyncFuzzyFind(const SymbolIndex &Index,
1284                                             const FuzzyFindRequest &Req) {
1285   return runAsync<SymbolSlab>([&Index, Req]() {
1286     trace::Span Tracer("Async fuzzyFind");
1287     SymbolSlab::Builder Syms;
1288     Index.fuzzyFind(Req, [&Syms](const Symbol &Sym) { Syms.insert(Sym); });
1289     return std::move(Syms).build();
1290   });
1291 }
1292 
1293 // Creates a `FuzzyFindRequest` based on the cached index request from the
1294 // last completion, if any, and the speculated completion filter text in the
1295 // source code.
1296 FuzzyFindRequest speculativeFuzzyFindRequestForCompletion(
1297     FuzzyFindRequest CachedReq, const CompletionPrefix &HeuristicPrefix) {
1298   CachedReq.Query = std::string(HeuristicPrefix.Name);
1299   return CachedReq;
1300 }
1301 
1302 // Runs Sema-based (AST) and Index-based completion, returns merged results.
1303 //
1304 // There are a few tricky considerations:
1305 //   - the AST provides information needed for the index query (e.g. which
1306 //     namespaces to search in). So Sema must start first.
1307 //   - we only want to return the top results (Opts.Limit).
1308 //     Building CompletionItems for everything else is wasteful, so we want to
1309 //     preserve the "native" format until we're done with scoring.
1310 //   - the data underlying Sema completion items is owned by the AST and various
1311 //     other arenas, which must stay alive for us to build CompletionItems.
1312 //   - we may get duplicate results from Sema and the Index, we need to merge.
1313 //
1314 // So we start Sema completion first, and do all our work in its callback.
1315 // We use the Sema context information to query the index.
1316 // Then we merge the two result sets, producing items that are Sema/Index/Both.
1317 // These items are scored, and the top N are synthesized into the LSP response.
1318 // Finally, we can clean up the data structures created by Sema completion.
1319 //
1320 // Main collaborators are:
1321 //   - semaCodeComplete sets up the compiler machinery to run code completion.
1322 //   - CompletionRecorder captures Sema completion results, including context.
1323 //   - SymbolIndex (Opts.Index) provides index completion results as Symbols
1324 //   - CompletionCandidates are the result of merging Sema and Index results.
1325 //     Each candidate points to an underlying CodeCompletionResult (Sema), a
1326 //     Symbol (Index), or both. It computes the result quality score.
1327 //     CompletionCandidate also does conversion to CompletionItem (at the end).
1328 //   - FuzzyMatcher scores how the candidate matches the partial identifier.
1329 //     This score is combined with the result quality score for the final score.
1330 //   - TopN determines the results with the best score.
1331 class CodeCompleteFlow {
1332   PathRef FileName;
1333   IncludeStructure Includes;           // Complete once the compiler runs.
1334   SpeculativeFuzzyFind *SpecFuzzyFind; // Can be nullptr.
1335   const CodeCompleteOptions &Opts;
1336 
1337   // Sema takes ownership of Recorder. Recorder is valid until Sema cleanup.
1338   CompletionRecorder *Recorder = nullptr;
1339   CodeCompletionContext::Kind CCContextKind = CodeCompletionContext::CCC_Other;
1340   bool IsUsingDeclaration = false;
1341   // The snippets will not be generated if the token following completion
1342   // location is an opening parenthesis (tok::l_paren) because this would add
1343   // extra parenthesis.
1344   tok::TokenKind NextTokenKind = tok::eof;
1345   // Counters for logging.
1346   int NSema = 0, NIndex = 0, NSemaAndIndex = 0, NIdent = 0;
1347   bool Incomplete = false; // Would more be available with a higher limit?
1348   CompletionPrefix HeuristicPrefix;
1349   llvm::Optional<FuzzyMatcher> Filter; // Initialized once Sema runs.
1350   Range ReplacedRange;
1351   std::vector<std::string> QueryScopes; // Initialized once Sema runs.
1352   // Initialized once QueryScopes is initialized, if there are scopes.
1353   llvm::Optional<ScopeDistance> ScopeProximity;
1354   llvm::Optional<OpaqueType> PreferredType; // Initialized once Sema runs.
1355   // Whether to query symbols from any scope. Initialized once Sema runs.
1356   bool AllScopes = false;
1357   llvm::StringSet<> ContextWords;
1358   // Include-insertion and proximity scoring rely on the include structure.
1359   // This is available after Sema has run.
1360   llvm::Optional<IncludeInserter> Inserter;  // Available during runWithSema.
1361   llvm::Optional<URIDistance> FileProximity; // Initialized once Sema runs.
1362   /// Speculative request based on the cached request and the filter text before
1363   /// the cursor.
1364   /// Initialized right before sema run. This is only set if `SpecFuzzyFind` is
1365   /// set and contains a cached request.
1366   llvm::Optional<FuzzyFindRequest> SpecReq;
1367 
1368 public:
1369   // A CodeCompleteFlow object is only useful for calling run() exactly once.
1370   CodeCompleteFlow(PathRef FileName, const IncludeStructure &Includes,
1371                    SpeculativeFuzzyFind *SpecFuzzyFind,
1372                    const CodeCompleteOptions &Opts)
1373       : FileName(FileName), Includes(Includes), SpecFuzzyFind(SpecFuzzyFind),
1374         Opts(Opts) {}
1375 
1376   CodeCompleteResult run(const SemaCompleteInput &SemaCCInput) && {
1377     trace::Span Tracer("CodeCompleteFlow");
1378     HeuristicPrefix = guessCompletionPrefix(SemaCCInput.ParseInput.Contents,
1379                                             SemaCCInput.Offset);
1380     populateContextWords(SemaCCInput.ParseInput.Contents);
1381     if (Opts.Index && SpecFuzzyFind && SpecFuzzyFind->CachedReq.hasValue()) {
1382       assert(!SpecFuzzyFind->Result.valid());
1383       SpecReq = speculativeFuzzyFindRequestForCompletion(
1384           *SpecFuzzyFind->CachedReq, HeuristicPrefix);
1385       SpecFuzzyFind->Result = startAsyncFuzzyFind(*Opts.Index, *SpecReq);
1386     }
1387 
1388     // We run Sema code completion first. It builds an AST and calculates:
1389     //   - completion results based on the AST.
1390     //   - partial identifier and context. We need these for the index query.
1391     CodeCompleteResult Output;
1392     auto RecorderOwner = std::make_unique<CompletionRecorder>(Opts, [&]() {
1393       assert(Recorder && "Recorder is not set");
1394       CCContextKind = Recorder->CCContext.getKind();
1395       IsUsingDeclaration = Recorder->CCContext.isUsingDeclaration();
1396       auto Style = getFormatStyleForFile(SemaCCInput.FileName,
1397                                          SemaCCInput.ParseInput.Contents,
1398                                          *SemaCCInput.ParseInput.TFS);
1399       const auto NextToken = Lexer::findNextToken(
1400           Recorder->CCSema->getPreprocessor().getCodeCompletionLoc(),
1401           Recorder->CCSema->getSourceManager(), Recorder->CCSema->LangOpts);
1402       if (NextToken)
1403         NextTokenKind = NextToken->getKind();
1404       // If preprocessor was run, inclusions from preprocessor callback should
1405       // already be added to Includes.
1406       Inserter.emplace(
1407           SemaCCInput.FileName, SemaCCInput.ParseInput.Contents, Style,
1408           SemaCCInput.ParseInput.CompileCommand.Directory,
1409           &Recorder->CCSema->getPreprocessor().getHeaderSearchInfo());
1410       for (const auto &Inc : Includes.MainFileIncludes)
1411         Inserter->addExisting(Inc);
1412 
1413       // Most of the cost of file proximity is in initializing the FileDistance
1414       // structures based on the observed includes, once per query. Conceptually
1415       // that happens here (though the per-URI-scheme initialization is lazy).
1416       // The per-result proximity scoring is (amortized) very cheap.
1417       FileDistanceOptions ProxOpts{}; // Use defaults.
1418       const auto &SM = Recorder->CCSema->getSourceManager();
1419       llvm::StringMap<SourceParams> ProxSources;
1420       auto MainFileID =
1421           Includes.getID(SM.getFileEntryForID(SM.getMainFileID()));
1422       assert(MainFileID);
1423       for (auto &HeaderIDAndDepth : Includes.includeDepth(*MainFileID)) {
1424         auto &Source =
1425             ProxSources[Includes.getRealPath(HeaderIDAndDepth.getFirst())];
1426         Source.Cost = HeaderIDAndDepth.getSecond() * ProxOpts.IncludeCost;
1427         // Symbols near our transitive includes are good, but only consider
1428         // things in the same directory or below it. Otherwise there can be
1429         // many false positives.
1430         if (HeaderIDAndDepth.getSecond() > 0)
1431           Source.MaxUpTraversals = 1;
1432       }
1433       FileProximity.emplace(ProxSources, ProxOpts);
1434 
1435       Output = runWithSema();
1436       Inserter.reset(); // Make sure this doesn't out-live Clang.
1437       SPAN_ATTACH(Tracer, "sema_completion_kind",
1438                   getCompletionKindString(CCContextKind));
1439       log("Code complete: sema context {0}, query scopes [{1}] (AnyScope={2}), "
1440           "expected type {3}{4}",
1441           getCompletionKindString(CCContextKind),
1442           llvm::join(QueryScopes.begin(), QueryScopes.end(), ","), AllScopes,
1443           PreferredType ? Recorder->CCContext.getPreferredType().getAsString()
1444                         : "<none>",
1445           IsUsingDeclaration ? ", inside using declaration" : "");
1446     });
1447 
1448     Recorder = RecorderOwner.get();
1449 
1450     semaCodeComplete(std::move(RecorderOwner), Opts.getClangCompleteOpts(),
1451                      SemaCCInput, &Includes);
1452     logResults(Output, Tracer);
1453     return Output;
1454   }
1455 
1456   void logResults(const CodeCompleteResult &Output, const trace::Span &Tracer) {
1457     SPAN_ATTACH(Tracer, "sema_results", NSema);
1458     SPAN_ATTACH(Tracer, "index_results", NIndex);
1459     SPAN_ATTACH(Tracer, "merged_results", NSemaAndIndex);
1460     SPAN_ATTACH(Tracer, "identifier_results", NIdent);
1461     SPAN_ATTACH(Tracer, "returned_results", int64_t(Output.Completions.size()));
1462     SPAN_ATTACH(Tracer, "incomplete", Output.HasMore);
1463     log("Code complete: {0} results from Sema, {1} from Index, "
1464         "{2} matched, {3} from identifiers, {4} returned{5}.",
1465         NSema, NIndex, NSemaAndIndex, NIdent, Output.Completions.size(),
1466         Output.HasMore ? " (incomplete)" : "");
1467     assert(!Opts.Limit || Output.Completions.size() <= Opts.Limit);
1468     // We don't assert that isIncomplete means we hit a limit.
1469     // Indexes may choose to impose their own limits even if we don't have one.
1470   }
1471 
1472   CodeCompleteResult runWithoutSema(llvm::StringRef Content, size_t Offset,
1473                                     const ThreadsafeFS &TFS) && {
1474     trace::Span Tracer("CodeCompleteWithoutSema");
1475     // Fill in fields normally set by runWithSema()
1476     HeuristicPrefix = guessCompletionPrefix(Content, Offset);
1477     populateContextWords(Content);
1478     CCContextKind = CodeCompletionContext::CCC_Recovery;
1479     IsUsingDeclaration = false;
1480     Filter = FuzzyMatcher(HeuristicPrefix.Name);
1481     auto Pos = offsetToPosition(Content, Offset);
1482     ReplacedRange.start = ReplacedRange.end = Pos;
1483     ReplacedRange.start.character -= HeuristicPrefix.Name.size();
1484 
1485     llvm::StringMap<SourceParams> ProxSources;
1486     ProxSources[FileName].Cost = 0;
1487     FileProximity.emplace(ProxSources);
1488 
1489     auto Style = getFormatStyleForFile(FileName, Content, TFS);
1490     // This will only insert verbatim headers.
1491     Inserter.emplace(FileName, Content, Style,
1492                      /*BuildDir=*/"", /*HeaderSearchInfo=*/nullptr);
1493 
1494     auto Identifiers = collectIdentifiers(Content, Style);
1495     std::vector<RawIdentifier> IdentifierResults;
1496     for (const auto &IDAndCount : Identifiers) {
1497       RawIdentifier ID;
1498       ID.Name = IDAndCount.first();
1499       ID.References = IDAndCount.second;
1500       // Avoid treating typed filter as an identifier.
1501       if (ID.Name == HeuristicPrefix.Name)
1502         --ID.References;
1503       if (ID.References > 0)
1504         IdentifierResults.push_back(std::move(ID));
1505     }
1506 
1507     // Simplified version of getQueryScopes():
1508     //  - accessible scopes are determined heuristically.
1509     //  - all-scopes query if no qualifier was typed (and it's allowed).
1510     SpecifiedScope Scopes;
1511     Scopes.AccessibleScopes = visibleNamespaces(
1512         Content.take_front(Offset), format::getFormattingLangOpts(Style));
1513     for (std::string &S : Scopes.AccessibleScopes)
1514       if (!S.empty())
1515         S.append("::"); // visibleNamespaces doesn't include trailing ::.
1516     if (HeuristicPrefix.Qualifier.empty())
1517       AllScopes = Opts.AllScopes;
1518     else if (HeuristicPrefix.Qualifier.startswith("::")) {
1519       Scopes.AccessibleScopes = {""};
1520       Scopes.UnresolvedQualifier =
1521           std::string(HeuristicPrefix.Qualifier.drop_front(2));
1522     } else
1523       Scopes.UnresolvedQualifier = std::string(HeuristicPrefix.Qualifier);
1524     // First scope is the (modified) enclosing scope.
1525     QueryScopes = Scopes.scopesForIndexQuery();
1526     ScopeProximity.emplace(QueryScopes);
1527 
1528     SymbolSlab IndexResults = Opts.Index ? queryIndex() : SymbolSlab();
1529 
1530     CodeCompleteResult Output = toCodeCompleteResult(mergeResults(
1531         /*SemaResults=*/{}, IndexResults, IdentifierResults));
1532     Output.RanParser = false;
1533     logResults(Output, Tracer);
1534     return Output;
1535   }
1536 
1537 private:
1538   void populateContextWords(llvm::StringRef Content) {
1539     // Take last 3 lines before the completion point.
1540     unsigned RangeEnd = HeuristicPrefix.Qualifier.begin() - Content.data(),
1541              RangeBegin = RangeEnd;
1542     for (size_t I = 0; I < 3 && RangeBegin > 0; ++I) {
1543       auto PrevNL = Content.rfind('\n', RangeBegin);
1544       if (PrevNL == StringRef::npos) {
1545         RangeBegin = 0;
1546         break;
1547       }
1548       RangeBegin = PrevNL;
1549     }
1550 
1551     ContextWords = collectWords(Content.slice(RangeBegin, RangeEnd));
1552     dlog("Completion context words: {0}",
1553          llvm::join(ContextWords.keys(), ", "));
1554   }
1555 
1556   // This is called by run() once Sema code completion is done, but before the
1557   // Sema data structures are torn down. It does all the real work.
1558   CodeCompleteResult runWithSema() {
1559     const auto &CodeCompletionRange = CharSourceRange::getCharRange(
1560         Recorder->CCSema->getPreprocessor().getCodeCompletionTokenRange());
1561     // When we are getting completions with an empty identifier, for example
1562     //    std::vector<int> asdf;
1563     //    asdf.^;
1564     // Then the range will be invalid and we will be doing insertion, use
1565     // current cursor position in such cases as range.
1566     if (CodeCompletionRange.isValid()) {
1567       ReplacedRange = halfOpenToRange(Recorder->CCSema->getSourceManager(),
1568                                       CodeCompletionRange);
1569     } else {
1570       const auto &Pos = sourceLocToPosition(
1571           Recorder->CCSema->getSourceManager(),
1572           Recorder->CCSema->getPreprocessor().getCodeCompletionLoc());
1573       ReplacedRange.start = ReplacedRange.end = Pos;
1574     }
1575     Filter = FuzzyMatcher(
1576         Recorder->CCSema->getPreprocessor().getCodeCompletionFilter());
1577     std::tie(QueryScopes, AllScopes) = getQueryScopes(
1578         Recorder->CCContext, *Recorder->CCSema, HeuristicPrefix, Opts);
1579     if (!QueryScopes.empty())
1580       ScopeProximity.emplace(QueryScopes);
1581     PreferredType =
1582         OpaqueType::fromType(Recorder->CCSema->getASTContext(),
1583                              Recorder->CCContext.getPreferredType());
1584     // Sema provides the needed context to query the index.
1585     // FIXME: in addition to querying for extra/overlapping symbols, we should
1586     //        explicitly request symbols corresponding to Sema results.
1587     //        We can use their signals even if the index can't suggest them.
1588     // We must copy index results to preserve them, but there are at most Limit.
1589     auto IndexResults = (Opts.Index && allowIndex(Recorder->CCContext))
1590                             ? queryIndex()
1591                             : SymbolSlab();
1592     trace::Span Tracer("Populate CodeCompleteResult");
1593     // Merge Sema and Index results, score them, and pick the winners.
1594     auto Top =
1595         mergeResults(Recorder->Results, IndexResults, /*Identifiers*/ {});
1596     return toCodeCompleteResult(Top);
1597   }
1598 
1599   CodeCompleteResult
1600   toCodeCompleteResult(const std::vector<ScoredBundle> &Scored) {
1601     CodeCompleteResult Output;
1602 
1603     // Convert the results to final form, assembling the expensive strings.
1604     for (auto &C : Scored) {
1605       Output.Completions.push_back(toCodeCompletion(C.first));
1606       Output.Completions.back().Score = C.second;
1607       Output.Completions.back().CompletionTokenRange = ReplacedRange;
1608     }
1609     Output.HasMore = Incomplete;
1610     Output.Context = CCContextKind;
1611     Output.CompletionRange = ReplacedRange;
1612     return Output;
1613   }
1614 
1615   SymbolSlab queryIndex() {
1616     trace::Span Tracer("Query index");
1617     SPAN_ATTACH(Tracer, "limit", int64_t(Opts.Limit));
1618 
1619     // Build the query.
1620     FuzzyFindRequest Req;
1621     if (Opts.Limit)
1622       Req.Limit = Opts.Limit;
1623     Req.Query = std::string(Filter->pattern());
1624     Req.RestrictForCodeCompletion = true;
1625     Req.Scopes = QueryScopes;
1626     Req.AnyScope = AllScopes;
1627     // FIXME: we should send multiple weighted paths here.
1628     Req.ProximityPaths.push_back(std::string(FileName));
1629     if (PreferredType)
1630       Req.PreferredTypes.push_back(std::string(PreferredType->raw()));
1631     vlog("Code complete: fuzzyFind({0:2})", toJSON(Req));
1632 
1633     if (SpecFuzzyFind)
1634       SpecFuzzyFind->NewReq = Req;
1635     if (SpecFuzzyFind && SpecFuzzyFind->Result.valid() && (*SpecReq == Req)) {
1636       vlog("Code complete: speculative fuzzy request matches the actual index "
1637            "request. Waiting for the speculative index results.");
1638       SPAN_ATTACH(Tracer, "Speculative results", true);
1639 
1640       trace::Span WaitSpec("Wait speculative results");
1641       return SpecFuzzyFind->Result.get();
1642     }
1643 
1644     SPAN_ATTACH(Tracer, "Speculative results", false);
1645 
1646     // Run the query against the index.
1647     SymbolSlab::Builder ResultsBuilder;
1648     if (Opts.Index->fuzzyFind(
1649             Req, [&](const Symbol &Sym) { ResultsBuilder.insert(Sym); }))
1650       Incomplete = true;
1651     return std::move(ResultsBuilder).build();
1652   }
1653 
1654   // Merges Sema and Index results where possible, to form CompletionCandidates.
1655   // \p Identifiers is raw identifiers that can also be completion candidates.
1656   // Identifiers are not merged with results from index or sema.
1657   // Groups overloads if desired, to form CompletionCandidate::Bundles. The
1658   // bundles are scored and top results are returned, best to worst.
1659   std::vector<ScoredBundle>
1660   mergeResults(const std::vector<CodeCompletionResult> &SemaResults,
1661                const SymbolSlab &IndexResults,
1662                const std::vector<RawIdentifier> &IdentifierResults) {
1663     trace::Span Tracer("Merge and score results");
1664     std::vector<CompletionCandidate::Bundle> Bundles;
1665     llvm::DenseMap<size_t, size_t> BundleLookup;
1666     auto AddToBundles = [&](const CodeCompletionResult *SemaResult,
1667                             const Symbol *IndexResult,
1668                             const RawIdentifier *IdentifierResult) {
1669       CompletionCandidate C;
1670       C.SemaResult = SemaResult;
1671       C.IndexResult = IndexResult;
1672       C.IdentifierResult = IdentifierResult;
1673       if (C.IndexResult) {
1674         C.Name = IndexResult->Name;
1675         C.RankedIncludeHeaders = getRankedIncludes(*C.IndexResult);
1676       } else if (C.SemaResult) {
1677         C.Name = Recorder->getName(*SemaResult);
1678       } else {
1679         assert(IdentifierResult);
1680         C.Name = IdentifierResult->Name;
1681       }
1682       if (auto OverloadSet = C.overloadSet(
1683               Opts, FileName, Inserter ? Inserter.getPointer() : nullptr)) {
1684         auto Ret = BundleLookup.try_emplace(OverloadSet, Bundles.size());
1685         if (Ret.second)
1686           Bundles.emplace_back();
1687         Bundles[Ret.first->second].push_back(std::move(C));
1688       } else {
1689         Bundles.emplace_back();
1690         Bundles.back().push_back(std::move(C));
1691       }
1692     };
1693     llvm::DenseSet<const Symbol *> UsedIndexResults;
1694     auto CorrespondingIndexResult =
1695         [&](const CodeCompletionResult &SemaResult) -> const Symbol * {
1696       if (auto SymID =
1697               getSymbolID(SemaResult, Recorder->CCSema->getSourceManager())) {
1698         auto I = IndexResults.find(SymID);
1699         if (I != IndexResults.end()) {
1700           UsedIndexResults.insert(&*I);
1701           return &*I;
1702         }
1703       }
1704       return nullptr;
1705     };
1706     // Emit all Sema results, merging them with Index results if possible.
1707     for (auto &SemaResult : SemaResults)
1708       AddToBundles(&SemaResult, CorrespondingIndexResult(SemaResult), nullptr);
1709     // Now emit any Index-only results.
1710     for (const auto &IndexResult : IndexResults) {
1711       if (UsedIndexResults.count(&IndexResult))
1712         continue;
1713       AddToBundles(/*SemaResult=*/nullptr, &IndexResult, nullptr);
1714     }
1715     // Emit identifier results.
1716     for (const auto &Ident : IdentifierResults)
1717       AddToBundles(/*SemaResult=*/nullptr, /*IndexResult=*/nullptr, &Ident);
1718     // We only keep the best N results at any time, in "native" format.
1719     TopN<ScoredBundle, ScoredBundleGreater> Top(
1720         Opts.Limit == 0 ? std::numeric_limits<size_t>::max() : Opts.Limit);
1721     for (auto &Bundle : Bundles)
1722       addCandidate(Top, std::move(Bundle));
1723     return std::move(Top).items();
1724   }
1725 
1726   llvm::Optional<float> fuzzyScore(const CompletionCandidate &C) {
1727     // Macros can be very spammy, so we only support prefix completion.
1728     if (((C.SemaResult &&
1729           C.SemaResult->Kind == CodeCompletionResult::RK_Macro) ||
1730          (C.IndexResult &&
1731           C.IndexResult->SymInfo.Kind == index::SymbolKind::Macro)) &&
1732         !C.Name.startswith_insensitive(Filter->pattern()))
1733       return None;
1734     return Filter->match(C.Name);
1735   }
1736 
1737   CodeCompletion::Scores
1738   evaluateCompletion(const SymbolQualitySignals &Quality,
1739                      const SymbolRelevanceSignals &Relevance) {
1740     using RM = CodeCompleteOptions::CodeCompletionRankingModel;
1741     CodeCompletion::Scores Scores;
1742     switch (Opts.RankingModel) {
1743     case RM::Heuristics:
1744       Scores.Quality = Quality.evaluateHeuristics();
1745       Scores.Relevance = Relevance.evaluateHeuristics();
1746       Scores.Total =
1747           evaluateSymbolAndRelevance(Scores.Quality, Scores.Relevance);
1748       // NameMatch is in fact a multiplier on total score, so rescoring is
1749       // sound.
1750       Scores.ExcludingName =
1751           Relevance.NameMatch > std::numeric_limits<float>::epsilon()
1752               ? Scores.Total / Relevance.NameMatch
1753               : Scores.Quality;
1754       return Scores;
1755 
1756     case RM::DecisionForest:
1757       DecisionForestScores DFScores = Opts.DecisionForestScorer(
1758           Quality, Relevance, Opts.DecisionForestBase);
1759       Scores.ExcludingName = DFScores.ExcludingName;
1760       Scores.Total = DFScores.Total;
1761       return Scores;
1762     }
1763     llvm_unreachable("Unhandled CodeCompletion ranking model.");
1764   }
1765 
1766   // Scores a candidate and adds it to the TopN structure.
1767   void addCandidate(TopN<ScoredBundle, ScoredBundleGreater> &Candidates,
1768                     CompletionCandidate::Bundle Bundle) {
1769     SymbolQualitySignals Quality;
1770     SymbolRelevanceSignals Relevance;
1771     Relevance.Context = CCContextKind;
1772     Relevance.Name = Bundle.front().Name;
1773     Relevance.FilterLength = HeuristicPrefix.Name.size();
1774     Relevance.Query = SymbolRelevanceSignals::CodeComplete;
1775     Relevance.FileProximityMatch = FileProximity.getPointer();
1776     if (ScopeProximity)
1777       Relevance.ScopeProximityMatch = ScopeProximity.getPointer();
1778     if (PreferredType)
1779       Relevance.HadContextType = true;
1780     Relevance.ContextWords = &ContextWords;
1781     Relevance.MainFileSignals = Opts.MainFileSignals;
1782 
1783     auto &First = Bundle.front();
1784     if (auto FuzzyScore = fuzzyScore(First))
1785       Relevance.NameMatch = *FuzzyScore;
1786     else
1787       return;
1788     SymbolOrigin Origin = SymbolOrigin::Unknown;
1789     bool FromIndex = false;
1790     for (const auto &Candidate : Bundle) {
1791       if (Candidate.IndexResult) {
1792         Quality.merge(*Candidate.IndexResult);
1793         Relevance.merge(*Candidate.IndexResult);
1794         Origin |= Candidate.IndexResult->Origin;
1795         FromIndex = true;
1796         if (!Candidate.IndexResult->Type.empty())
1797           Relevance.HadSymbolType |= true;
1798         if (PreferredType &&
1799             PreferredType->raw() == Candidate.IndexResult->Type) {
1800           Relevance.TypeMatchesPreferred = true;
1801         }
1802       }
1803       if (Candidate.SemaResult) {
1804         Quality.merge(*Candidate.SemaResult);
1805         Relevance.merge(*Candidate.SemaResult);
1806         if (PreferredType) {
1807           if (auto CompletionType = OpaqueType::fromCompletionResult(
1808                   Recorder->CCSema->getASTContext(), *Candidate.SemaResult)) {
1809             Relevance.HadSymbolType |= true;
1810             if (PreferredType == CompletionType)
1811               Relevance.TypeMatchesPreferred = true;
1812           }
1813         }
1814         Origin |= SymbolOrigin::AST;
1815       }
1816       if (Candidate.IdentifierResult) {
1817         Quality.References = Candidate.IdentifierResult->References;
1818         Relevance.Scope = SymbolRelevanceSignals::FileScope;
1819         Origin |= SymbolOrigin::Identifier;
1820       }
1821     }
1822 
1823     CodeCompletion::Scores Scores = evaluateCompletion(Quality, Relevance);
1824     if (Opts.RecordCCResult)
1825       Opts.RecordCCResult(toCodeCompletion(Bundle), Quality, Relevance,
1826                           Scores.Total);
1827 
1828     dlog("CodeComplete: {0} ({1}) = {2}\n{3}{4}\n", First.Name,
1829          llvm::to_string(Origin), Scores.Total, llvm::to_string(Quality),
1830          llvm::to_string(Relevance));
1831 
1832     NSema += bool(Origin & SymbolOrigin::AST);
1833     NIndex += FromIndex;
1834     NSemaAndIndex += bool(Origin & SymbolOrigin::AST) && FromIndex;
1835     NIdent += bool(Origin & SymbolOrigin::Identifier);
1836     if (Candidates.push({std::move(Bundle), Scores}))
1837       Incomplete = true;
1838   }
1839 
1840   CodeCompletion toCodeCompletion(const CompletionCandidate::Bundle &Bundle) {
1841     llvm::Optional<CodeCompletionBuilder> Builder;
1842     for (const auto &Item : Bundle) {
1843       CodeCompletionString *SemaCCS =
1844           Item.SemaResult ? Recorder->codeCompletionString(*Item.SemaResult)
1845                           : nullptr;
1846       if (!Builder)
1847         Builder.emplace(Recorder ? &Recorder->CCSema->getASTContext() : nullptr,
1848                         Item, SemaCCS, QueryScopes, *Inserter, FileName,
1849                         CCContextKind, Opts, IsUsingDeclaration, NextTokenKind);
1850       else
1851         Builder->add(Item, SemaCCS);
1852     }
1853     return Builder->build();
1854   }
1855 };
1856 
1857 } // namespace
1858 
1859 clang::CodeCompleteOptions CodeCompleteOptions::getClangCompleteOpts() const {
1860   clang::CodeCompleteOptions Result;
1861   Result.IncludeCodePatterns = EnableSnippets;
1862   Result.IncludeMacros = true;
1863   Result.IncludeGlobals = true;
1864   // We choose to include full comments and not do doxygen parsing in
1865   // completion.
1866   // FIXME: ideally, we should support doxygen in some form, e.g. do markdown
1867   // formatting of the comments.
1868   Result.IncludeBriefComments = false;
1869 
1870   // When an is used, Sema is responsible for completing the main file,
1871   // the index can provide results from the preamble.
1872   // Tell Sema not to deserialize the preamble to look for results.
1873   Result.LoadExternal = !Index;
1874   Result.IncludeFixIts = IncludeFixIts;
1875 
1876   return Result;
1877 }
1878 
1879 CompletionPrefix guessCompletionPrefix(llvm::StringRef Content,
1880                                        unsigned Offset) {
1881   assert(Offset <= Content.size());
1882   StringRef Rest = Content.take_front(Offset);
1883   CompletionPrefix Result;
1884 
1885   // Consume the unqualified name. We only handle ASCII characters.
1886   // isAsciiIdentifierContinue will let us match "0invalid", but we don't mind.
1887   while (!Rest.empty() && isAsciiIdentifierContinue(Rest.back()))
1888     Rest = Rest.drop_back();
1889   Result.Name = Content.slice(Rest.size(), Offset);
1890 
1891   // Consume qualifiers.
1892   while (Rest.consume_back("::") && !Rest.endswith(":")) // reject ::::
1893     while (!Rest.empty() && isAsciiIdentifierContinue(Rest.back()))
1894       Rest = Rest.drop_back();
1895   Result.Qualifier =
1896       Content.slice(Rest.size(), Result.Name.begin() - Content.begin());
1897 
1898   return Result;
1899 }
1900 
1901 // Code complete the argument name on "/*" inside function call.
1902 // Offset should be pointing to the start of the comment, i.e.:
1903 // foo(^/*, rather than foo(/*^) where the cursor probably is.
1904 CodeCompleteResult codeCompleteComment(PathRef FileName, unsigned Offset,
1905                                        llvm::StringRef Prefix,
1906                                        const PreambleData *Preamble,
1907                                        const ParseInputs &ParseInput) {
1908   if (Preamble == nullptr) // Can't run without Sema.
1909     return CodeCompleteResult();
1910 
1911   clang::CodeCompleteOptions Options;
1912   Options.IncludeGlobals = false;
1913   Options.IncludeMacros = false;
1914   Options.IncludeCodePatterns = false;
1915   Options.IncludeBriefComments = false;
1916   std::set<std::string> ParamNames;
1917   // We want to see signatures coming from newly introduced includes, hence a
1918   // full patch.
1919   semaCodeComplete(
1920       std::make_unique<ParamNameCollector>(Options, ParamNames), Options,
1921       {FileName, Offset, *Preamble,
1922        PreamblePatch::createFullPatch(FileName, ParseInput, *Preamble),
1923        ParseInput});
1924   if (ParamNames.empty())
1925     return CodeCompleteResult();
1926 
1927   CodeCompleteResult Result;
1928   Result.Context = CodeCompletionContext::CCC_NaturalLanguage;
1929   for (llvm::StringRef Name : ParamNames) {
1930     if (!Name.startswith(Prefix))
1931       continue;
1932     CodeCompletion Item;
1933     Item.Name = Name.str() + "=";
1934     Item.Kind = CompletionItemKind::Text;
1935     Result.Completions.push_back(Item);
1936   }
1937 
1938   return Result;
1939 }
1940 
1941 // If Offset is inside what looks like argument comment (e.g.
1942 // "/*^" or "/* foo^"), returns new offset pointing to the start of the /*
1943 // (place where semaCodeComplete should run).
1944 llvm::Optional<unsigned>
1945 maybeFunctionArgumentCommentStart(llvm::StringRef Content) {
1946   while (!Content.empty() && isAsciiIdentifierContinue(Content.back()))
1947     Content = Content.drop_back();
1948   Content = Content.rtrim();
1949   if (Content.endswith("/*"))
1950     return Content.size() - 2;
1951   return None;
1952 }
1953 
1954 CodeCompleteResult codeComplete(PathRef FileName, Position Pos,
1955                                 const PreambleData *Preamble,
1956                                 const ParseInputs &ParseInput,
1957                                 CodeCompleteOptions Opts,
1958                                 SpeculativeFuzzyFind *SpecFuzzyFind) {
1959   auto Offset = positionToOffset(ParseInput.Contents, Pos);
1960   if (!Offset) {
1961     elog("Code completion position was invalid {0}", Offset.takeError());
1962     return CodeCompleteResult();
1963   }
1964 
1965   auto Content = llvm::StringRef(ParseInput.Contents).take_front(*Offset);
1966   if (auto OffsetBeforeComment = maybeFunctionArgumentCommentStart(Content)) {
1967     // We are doing code completion of a comment, where we currently only
1968     // support completing param names in function calls. To do this, we
1969     // require information from Sema, but Sema's comment completion stops at
1970     // parsing, so we must move back the position before running it, extract
1971     // information we need and construct completion items ourselves.
1972     auto CommentPrefix = Content.substr(*OffsetBeforeComment + 2).trim();
1973     return codeCompleteComment(FileName, *OffsetBeforeComment, CommentPrefix,
1974                                Preamble, ParseInput);
1975   }
1976 
1977   auto Flow = CodeCompleteFlow(
1978       FileName, Preamble ? Preamble->Includes : IncludeStructure(),
1979       SpecFuzzyFind, Opts);
1980   return (!Preamble || Opts.RunParser == CodeCompleteOptions::NeverParse)
1981              ? std::move(Flow).runWithoutSema(ParseInput.Contents, *Offset,
1982                                               *ParseInput.TFS)
1983              : std::move(Flow).run({FileName, *Offset, *Preamble,
1984                                     /*PreamblePatch=*/
1985                                     PreamblePatch::createMacroPatch(
1986                                         FileName, ParseInput, *Preamble),
1987                                     ParseInput});
1988 }
1989 
1990 SignatureHelp signatureHelp(PathRef FileName, Position Pos,
1991                             const PreambleData &Preamble,
1992                             const ParseInputs &ParseInput) {
1993   auto Offset = positionToOffset(ParseInput.Contents, Pos);
1994   if (!Offset) {
1995     elog("Signature help position was invalid {0}", Offset.takeError());
1996     return SignatureHelp();
1997   }
1998   SignatureHelp Result;
1999   clang::CodeCompleteOptions Options;
2000   Options.IncludeGlobals = false;
2001   Options.IncludeMacros = false;
2002   Options.IncludeCodePatterns = false;
2003   Options.IncludeBriefComments = false;
2004   semaCodeComplete(
2005       std::make_unique<SignatureHelpCollector>(Options, ParseInput.Index,
2006                                                Result),
2007       Options,
2008       {FileName, *Offset, Preamble,
2009        PreamblePatch::createFullPatch(FileName, ParseInput, Preamble),
2010        ParseInput});
2011   return Result;
2012 }
2013 
2014 bool isIndexedForCodeCompletion(const NamedDecl &ND, ASTContext &ASTCtx) {
2015   auto InTopLevelScope = [](const NamedDecl &ND) {
2016     switch (ND.getDeclContext()->getDeclKind()) {
2017     case Decl::TranslationUnit:
2018     case Decl::Namespace:
2019     case Decl::LinkageSpec:
2020       return true;
2021     default:
2022       break;
2023     };
2024     return false;
2025   };
2026   // We only complete symbol's name, which is the same as the name of the
2027   // *primary* template in case of template specializations.
2028   if (isExplicitTemplateSpecialization(&ND))
2029     return false;
2030 
2031   // Category decls are not useful on their own outside the interface or
2032   // implementation blocks. Moreover, sema already provides completion for
2033   // these, even if it requires preamble deserialization. So by excluding them
2034   // from the index, we reduce the noise in all the other completion scopes.
2035   if (llvm::isa<ObjCCategoryDecl>(&ND) || llvm::isa<ObjCCategoryImplDecl>(&ND))
2036     return false;
2037 
2038   if (InTopLevelScope(ND))
2039     return true;
2040 
2041   if (const auto *EnumDecl = dyn_cast<clang::EnumDecl>(ND.getDeclContext()))
2042     return InTopLevelScope(*EnumDecl) && !EnumDecl->isScoped();
2043 
2044   return false;
2045 }
2046 
2047 // FIXME: find a home for this (that can depend on both markup and Protocol).
2048 static MarkupContent renderDoc(const markup::Document &Doc, MarkupKind Kind) {
2049   MarkupContent Result;
2050   Result.kind = Kind;
2051   switch (Kind) {
2052   case MarkupKind::PlainText:
2053     Result.value.append(Doc.asPlainText());
2054     break;
2055   case MarkupKind::Markdown:
2056     Result.value.append(Doc.asMarkdown());
2057     break;
2058   }
2059   return Result;
2060 }
2061 
2062 CompletionItem CodeCompletion::render(const CodeCompleteOptions &Opts) const {
2063   CompletionItem LSP;
2064   const auto *InsertInclude = Includes.empty() ? nullptr : &Includes[0];
2065   LSP.label = ((InsertInclude && InsertInclude->Insertion)
2066                    ? Opts.IncludeIndicator.Insert
2067                    : Opts.IncludeIndicator.NoInsert) +
2068               (Opts.ShowOrigins ? "[" + llvm::to_string(Origin) + "]" : "") +
2069               RequiredQualifier + Name + Signature;
2070 
2071   LSP.kind = Kind;
2072   LSP.detail = BundleSize > 1
2073                    ? std::string(llvm::formatv("[{0} overloads]", BundleSize))
2074                    : ReturnType;
2075   LSP.deprecated = Deprecated;
2076   // Combine header information and documentation in LSP `documentation` field.
2077   // This is not quite right semantically, but tends to display well in editors.
2078   if (InsertInclude || Documentation) {
2079     markup::Document Doc;
2080     if (InsertInclude)
2081       Doc.addParagraph().appendText("From ").appendCode(InsertInclude->Header);
2082     if (Documentation)
2083       Doc.append(*Documentation);
2084     LSP.documentation = renderDoc(Doc, Opts.DocumentationFormat);
2085   }
2086   LSP.sortText = sortText(Score.Total, Name);
2087   LSP.filterText = Name;
2088   LSP.textEdit = {CompletionTokenRange, RequiredQualifier + Name};
2089   // Merge continuous additionalTextEdits into main edit. The main motivation
2090   // behind this is to help LSP clients, it seems most of them are confused when
2091   // they are provided with additionalTextEdits that are consecutive to main
2092   // edit.
2093   // Note that we store additional text edits from back to front in a line. That
2094   // is mainly to help LSP clients again, so that changes do not effect each
2095   // other.
2096   for (const auto &FixIt : FixIts) {
2097     if (FixIt.range.end == LSP.textEdit->range.start) {
2098       LSP.textEdit->newText = FixIt.newText + LSP.textEdit->newText;
2099       LSP.textEdit->range.start = FixIt.range.start;
2100     } else {
2101       LSP.additionalTextEdits.push_back(FixIt);
2102     }
2103   }
2104   if (Opts.EnableSnippets)
2105     LSP.textEdit->newText += SnippetSuffix;
2106 
2107   // FIXME(kadircet): Do not even fill insertText after making sure textEdit is
2108   // compatible with most of the editors.
2109   LSP.insertText = LSP.textEdit->newText;
2110   // Some clients support snippets but work better with plaintext.
2111   // So if the snippet is trivial, let the client know.
2112   // https://github.com/clangd/clangd/issues/922
2113   LSP.insertTextFormat = (Opts.EnableSnippets && !SnippetSuffix.empty())
2114                              ? InsertTextFormat::Snippet
2115                              : InsertTextFormat::PlainText;
2116   if (InsertInclude && InsertInclude->Insertion)
2117     LSP.additionalTextEdits.push_back(*InsertInclude->Insertion);
2118 
2119   LSP.score = Score.ExcludingName;
2120 
2121   return LSP;
2122 }
2123 
2124 llvm::raw_ostream &operator<<(llvm::raw_ostream &OS, const CodeCompletion &C) {
2125   // For now just lean on CompletionItem.
2126   return OS << C.render(CodeCompleteOptions());
2127 }
2128 
2129 llvm::raw_ostream &operator<<(llvm::raw_ostream &OS,
2130                               const CodeCompleteResult &R) {
2131   OS << "CodeCompleteResult: " << R.Completions.size() << (R.HasMore ? "+" : "")
2132      << " (" << getCompletionKindString(R.Context) << ")"
2133      << " items:\n";
2134   for (const auto &C : R.Completions)
2135     OS << C << "\n";
2136   return OS;
2137 }
2138 
2139 // Heuristically detect whether the `Line` is an unterminated include filename.
2140 bool isIncludeFile(llvm::StringRef Line) {
2141   Line = Line.ltrim();
2142   if (!Line.consume_front("#"))
2143     return false;
2144   Line = Line.ltrim();
2145   if (!(Line.consume_front("include_next") || Line.consume_front("include") ||
2146         Line.consume_front("import")))
2147     return false;
2148   Line = Line.ltrim();
2149   if (Line.consume_front("<"))
2150     return Line.count('>') == 0;
2151   if (Line.consume_front("\""))
2152     return Line.count('"') == 0;
2153   return false;
2154 }
2155 
2156 bool allowImplicitCompletion(llvm::StringRef Content, unsigned Offset) {
2157   // Look at last line before completion point only.
2158   Content = Content.take_front(Offset);
2159   auto Pos = Content.rfind('\n');
2160   if (Pos != llvm::StringRef::npos)
2161     Content = Content.substr(Pos + 1);
2162 
2163   // Complete after scope operators.
2164   if (Content.endswith(".") || Content.endswith("->") ||
2165       Content.endswith("::") || Content.endswith("/*"))
2166     return true;
2167   // Complete after `#include <` and #include `<foo/`.
2168   if ((Content.endswith("<") || Content.endswith("\"") ||
2169        Content.endswith("/")) &&
2170       isIncludeFile(Content))
2171     return true;
2172 
2173   // Complete words. Give non-ascii characters the benefit of the doubt.
2174   return !Content.empty() && (isAsciiIdentifierContinue(Content.back()) ||
2175                               !llvm::isASCII(Content.back()));
2176 }
2177 
2178 } // namespace clangd
2179 } // namespace clang
2180