Diff 130607

clangd/CodeComplete.cpp

Show All 16 Lines
#include "CodeComplete.h"		#include "CodeComplete.h"
#include "CodeCompletionStrings.h"		#include "CodeCompletionStrings.h"
#include "Compiler.h"		#include "Compiler.h"
#include "FuzzyMatch.h"		#include "FuzzyMatch.h"
#include "Logger.h"		#include "Logger.h"
#include "index/Index.h"		#include "index/Index.h"
#include "clang/Frontend/CompilerInstance.h"		#include "clang/Frontend/CompilerInstance.h"
#include "clang/Frontend/FrontendActions.h"		#include "clang/Frontend/FrontendActions.h"
		#include "clang/Index/USRGeneration.h"
#include "clang/Sema/CodeCompleteConsumer.h"		#include "clang/Sema/CodeCompleteConsumer.h"
#include "clang/Sema/Sema.h"		#include "clang/Sema/Sema.h"
#include "llvm/Support/Format.h"		#include "llvm/Support/Format.h"
#include <queue>		#include <queue>

namespace clang {		namespace clang {
namespace clangd {		namespace clangd {
namespace {		namespace {
▲ Show 20 Lines • Show All 147 Lines • ▼ Show 20 Lines	for (const auto &Chunk : CCS) {
default:		default:
Result += Chunk.Text;		Result += Chunk.Text;
break;		break;
}		}
}		}
return Result;		return Result;
}		}

/// A scored code completion result.		// Produces an integer that sorts in the same order as F.
/// It may be promoted to a CompletionItem if it's among the top-ranked results.		// That is: a < b <==> encodeFloat(a) < encodeFloat(b).
///		uint32_t encodeFloat(float F) {
/// We score candidates by multiplying the symbolScore ("quality" of the result)		static_assert(std::numeric_limits<float>::is_iec559, "");
/// with the filterScore (how well it matched the query).		static_assert(sizeof(float) == sizeof(uint32_t), "");
/// This is sensitive to the distribution of both component scores!		constexpr uint32_t TopBit = ~(~uint32_t{0} >> 1);
struct CompletionCandidate {
CompletionCandidate(CodeCompletionResult &Result, float FilterScore)
: Result(&Result) {
Scores.symbolScore = score(Result); // Higher is better.
Scores.filterScore = FilterScore; // 0-1, higher is better.
Scores.finalScore = Scores.symbolScore * Scores.filterScore;
}

CodeCompletionResult *Result;
CompletionItemScores Scores;

// Comparison reflects rank: better candidates are smaller.		// Get the bits of the float. Endianness is the same as for integers.
bool operator<(const CompletionCandidate &C) const {		uint32_t U;
if (Scores.finalScore != C.Scores.finalScore)		memcpy(&U, &F, sizeof(float));
return Scores.finalScore > C.Scores.finalScore;		// IEEE 754 floats compare like sign-magnitude integers.
return Result < C.Result;		if (U & TopBit) // Negative float.
		return 0 - U; // Map onto the low half of integers, order reversed.
		return U + TopBit; // Positive floats map onto the high half of integers.
}		}

// Returns a string that sorts in the same order as operator<, for LSP.		// Returns a string that sorts in the same order as (-Score, Name), for LSP.
// Conceptually, this is [-Score, Name]. We convert -Score to an integer, and		std::string sortText(float Score, llvm::StringRef Name) {
// hex-encode it for readability. Example: [0.5, "foo"] -> "41000000foo"		// We convert -Score to an integer, and hex-encode for readability.
std::string sortText() const {		// Example: [0.5, "foo"] -> "41000000foo"
std::string S, NameStorage;		std::string S;
llvm::raw_string_ostream OS(S);		llvm::raw_string_ostream OS(S);
write_hex(OS, encodeFloat(-Scores.finalScore), llvm::HexPrintStyle::Lower,		write_hex(OS, encodeFloat(-Score), llvm::HexPrintStyle::Lower,
/Width=/2 * sizeof(Scores.finalScore));		/Width=/2 * sizeof(Score));
OS << Result->getOrderedName(NameStorage);		OS << Name;
return OS.str();		OS.flush();
		return S;
}		}

private:		/// A code completion result, in clang-native form.
static float score(const CodeCompletionResult &Result) {		/// It may be promoted to a CompletionItem if it's among the top-ranked results.
		struct CompletionCandidate {
		llvm::StringRef Name; // Used for filtering and sorting.
		// We may have a result from Sema, from the index, or both.
		const CodeCompletionResult *SemaResult = nullptr;
		const Symbol *IndexResult = nullptr;

		// Computes the "symbol quality" score for this completion. Higher is better.
		float score() const {
		// For now we just use the Sema priority, mapping it onto a 0-1 interval.
		if (!SemaResult) // FIXME(sammccall): better scoring for index results.
		return 0.3; // fixed mediocre score for index-only results.

// Priority 80 is a really bad score.		// Priority 80 is a really bad score.
float Score = 1 - std::min<float>(80, Result.Priority) / 80;		float Score = 1 - std::min<float>(80, SemaResult->Priority) / 80;

switch (static_cast<CXAvailabilityKind>(Result.Availability)) {		switch (static_cast<CXAvailabilityKind>(SemaResult->Availability)) {
case CXAvailability_Available:		case CXAvailability_Available:
// No penalty.		// No penalty.
break;		break;
case CXAvailability_Deprecated:		case CXAvailability_Deprecated:
Score *= 0.1f;		Score *= 0.1f;
break;		break;
case CXAvailability_NotAccessible:		case CXAvailability_NotAccessible:
case CXAvailability_NotAvailable:		case CXAvailability_NotAvailable:
Score = 0;		Score = 0;
break;		break;
}		}
return Score;		return Score;
}		}

// Produces an integer that sorts in the same order as F.		// Builds an LSP completion item.
// That is: a < b <==> encodeFloat(a) < encodeFloat(b).		CompletionItem build(const CompletionItemScores &Scores,
static uint32_t encodeFloat(float F) {		const CodeCompleteOptions &Opts,
static_assert(std::numeric_limits<float>::is_iec559, "");		CodeCompletionString *SemaCCS) const {
static_assert(sizeof(float) == sizeof(uint32_t), "");		assert(bool(SemaResult) == bool(SemaCCS));
constexpr uint32_t TopBit = ~(~uint32_t{0} >> 1);		CompletionItem I;
		if (SemaResult) {
		I.kind = toCompletionItemKind(SemaResult->Kind, SemaResult->CursorKind);
		getLabelAndInsertText(*SemaCCS, &I.label, &I.insertText,
		Opts.EnableSnippets);
		I.filterText = getFilterText(*SemaCCS);
		I.documentation = getDocumentation(*SemaCCS);
		I.detail = getDetail(*SemaCCS);
		}
		if (IndexResult) {
		if (I.kind == CompletionItemKind::Missing)
		I.kind = toCompletionItemKind(IndexResult->SymInfo.Kind);
		// FIXME: reintroduce a way to show the index source for debugging.
		if (I.label.empty())
		I.label = IndexResult->CompletionLabel;
		if (I.filterText.empty())
		I.filterText = IndexResult->Name;

// Get the bits of the float. Endianness is the same as for integers.		// FIXME(ioeric): support inserting/replacing scope qualifiers.
uint32_t U;		if (I.insertText.empty())
memcpy(&U, &F, sizeof(float));		I.insertText = Opts.EnableSnippets
// IEEE 754 floats compare like sign-magnitude integers.		? IndexResult->CompletionSnippetInsertText
if (U & TopBit) // Negative float.		: IndexResult->CompletionPlainInsertText;
return 0 - U; // Map onto the low half of integers, order reversed.
return U + TopBit; // Positive floats map onto the high half of integers.		if (auto *D = IndexResult->Detail) {
		if (I.documentation.empty())
		I.documentation = D->Documentation;
		if (I.detail.empty())
		I.detail = D->CompletionDetail;
		}
		}
		I.scoreInfo = Scores;
		I.sortText = sortText(Scores.finalScore, Name);
		I.insertTextFormat = Opts.EnableSnippets ? InsertTextFormat::Snippet
		: InsertTextFormat::PlainText;
		return I;
}		}
};		};

		// Determine the symbol ID for a Sema code completion result, if possible.
		// Declaration and pattern results are identified through the USR generated
		// for R.Declaration; macro and keyword results yield None.
		llvm::Optional<SymbolID> getSymbolID(const CodeCompletionResult &R) {
		switch (R.Kind) {
		case CodeCompletionResult::RK_Declaration:
		case CodeCompletionResult::RK_Pattern: {
		// Scratch buffer that generateUSRForDecl fills with the USR text.
		llvm::SmallString<128> USR;
		// A true result means no ID is produced here.
		// NOTE(review): the argument-comment residue suggests true means "ignore
		// this declaration" - confirm against the USRGeneration API.
		if (/Ignore=/clang::index::generateUSRForDecl(R.Declaration, USR))
		return None;
		return SymbolID(USR);
		}
		case CodeCompletionResult::RK_Macro:
		// FIXME: Macros do have USRs, but the CCR doesn't contain enough info.
		// Macro results share the keyword path below.
		case CodeCompletionResult::RK_Keyword:
		return None;
		}
		hokeinUnsubmitted Done Reply Inline Actions add `return None` to make compiler happier? I think it might trigger -Wreturn-type warning. hokein: add `return None` to make compiler happier? I think it might trigger -Wreturn-type warning.
		sammccallAuthorUnsubmitted Not Done Reply Inline Actions added llvm_unreachable. sammccall: added llvm_unreachable.
		// Every case of the switch returns, so control only gets here for a kind
		// the switch does not list.
		llvm_unreachable("unknown CodeCompletionResult kind");
		}

/// \brief Information about the scope specifier in the qualified-id code		/// \brief Information about the scope specifier in the qualified-id code
/// completion (e.g. "ns::ab?").		/// completion (e.g. "ns::ab?").
struct SpecifiedScope {		struct SpecifiedScope {
/// The scope specifier as written. For example, for completion "ns::ab?", the		/// The scope specifier as written. For example, for completion "ns::ab?", the
/// written scope specifier is "ns".		/// written scope specifier is "ns".
std::string Written;		std::string Written;
// If this scope specifier is recognized in Sema (e.g. as a namespace		// If this scope specifier is recognized in Sema (e.g. as a namespace
// context), this will be set to the fully qualified name of the corresponding		// context), this will be set to the fully qualified name of the corresponding
// context.		// context.
std::string Resolved;		std::string Resolved;
};

/// \brief Information from Sema about (partial) symbol names to be completed.		llvm::StringRef forIndex() {
/// For example, for completion "ns::ab^", this stores the scope specifier		llvm::StringRef Chosen = Resolved.empty() ? Written : Resolved;
/// "ns::" and the completion filter text "ab".		return Chosen.trim(':');
struct NameToComplete {		}
// The partial identifier being completed, without qualifier.
std::string Filter;

/// This is set if the completion is for qualified IDs, e.g. "abc::x^".
llvm::Optional<SpecifiedScope> SSInfo;
};		};

SpecifiedScope extraCompletionScope(Sema &S, const CXXScopeSpec &SS);		// The CompletionRecorder captures Sema code-complete output, including context.
		// It filters out ignored results (but doesn't apply fuzzy-filtering yet).
		ioericUnsubmitted Done Reply Inline Actions Does the recorder still do fuzzy-matching? ioeric: Does the recorder still do fuzzy-matching?
class CompletionItemsCollector : public CodeCompleteConsumer {		// It doesn't do scoring or conversion to CompletionItem yet, as we want to
public:		// merge with index results first.
CompletionItemsCollector(const CodeCompleteOptions &CodeCompleteOpts,		struct CompletionRecorder : public CodeCompleteConsumer {
CompletionList &Items, NameToComplete &CompletedName)		CompletionRecorder(const CodeCompleteOptions &Opts)
: CodeCompleteConsumer(CodeCompleteOpts.getClangCompleteOpts(),		: CodeCompleteConsumer(Opts.getClangCompleteOpts(),
/OutputIsBinary=/false),		/OutputIsBinary=/false),
ClangdOpts(CodeCompleteOpts), Items(Items),		CCContext(CodeCompletionContext::CCC_Other), Opts(Opts),
Allocator(std::make_shared<clang::GlobalCodeCompletionAllocator>()),		CCAllocator(std::make_shared<GlobalCodeCompletionAllocator>()),
CCTUInfo(Allocator), CompletedName(CompletedName),		CCTUInfo(CCAllocator) {}
EnableSnippets(CodeCompleteOpts.EnableSnippets) {}		std::vector<CodeCompletionResult> Results;
		CodeCompletionContext CCContext;
		Sema *CCSema = nullptr; // Sema that created the results.
		// FIXME: Sema is scary. Can we store ASTContext and Preprocessor, instead?

void ProcessCodeCompleteResults(Sema &S, CodeCompletionContext Context,		void ProcessCodeCompleteResults(class Sema &S, CodeCompletionContext Context,
CodeCompletionResult *Results,		CodeCompletionResult *InResults,
unsigned NumResults) override final {		unsigned NumResults) override final {
FuzzyMatcher Filter(S.getPreprocessor().getCodeCompletionFilter());		// Record the completion context.
if (auto SS = Context.getCXXScopeSpecifier())		assert(!CCSema && "ProcessCodeCompleteResults called multiple times!");
CompletedName.SSInfo = extraCompletionScope(S, **SS);		CCSema = &S;
		ioericUnsubmitted Done Reply Inline Actions It seems that `CCContext` can change during `ProcessCodeCompleteResults`. It's unclear what the implication is for `codeCompletionString` at the end. ioeric: It seems that `CCContext` can change during `ProcessCodeCompleteResults`. It's unclear what…
		sammccallAuthorUnsubmitted Not Done Reply Inline Actions This function is only ever called once, but this isn't documented anywhere :-\ Added an assert. sammccall: This function is only ever called once, but this isn't documented anywhere :-\ Added an assert.
		hokeinUnsubmitted Done Reply Inline Actions I'd suggesting rename the variable `Sema` to another name, since `Sema` is already a class name (although naming is hard). hokein: I'd suggesting rename the variable `Sema` to another name, since `Sema` is already a class name…
		CCContext = Context;

CompletedName.Filter = S.getPreprocessor().getCodeCompletionFilter();		// Retain the results we might want.
std::priority_queue<CompletionCandidate> Candidates;
for (unsigned I = 0; I < NumResults; ++I) {		for (unsigned I = 0; I < NumResults; ++I) {
auto &Result = Results[I];		auto &Result = InResults[I];
// We drop hidden items, as they cannot be found by the lookup after		// Drop hidden items which cannot be found by lookup after completion.
// inserting the corresponding completion item and only produce noise and		// Exception: some items can be named by using a qualifier.
// duplicates in the completion list. However, there is one exception. If
// Result has a Qualifier which is non-informative, we can refer to an
// item by adding that qualifier, so we don't filter out this item.
if (Result.Hidden && (!Result.Qualifier \|\| Result.QualifierIsInformative))		if (Result.Hidden && (!Result.Qualifier \|\| Result.QualifierIsInformative))
continue;		continue;
if (!ClangdOpts.IncludeIneligibleResults &&		if (!Opts.IncludeIneligibleResults &&
(Result.Availability == CXAvailability_NotAvailable \|\|		(Result.Availability == CXAvailability_NotAvailable \|\|
Result.Availability == CXAvailability_NotAccessible))		Result.Availability == CXAvailability_NotAccessible))
continue;		continue;
auto FilterScore = fuzzyMatch(S, Context, Filter, Result);		Results.push_back(Result);
if (!FilterScore)
continue;
Candidates.emplace(Result, *FilterScore);
if (ClangdOpts.Limit && Candidates.size() > ClangdOpts.Limit) {
Candidates.pop();
Items.isIncomplete = true;
}		}
}		}
while (!Candidates.empty()) {
auto &Candidate = Candidates.top();
const auto *CCS = Candidate.Result->CreateCodeCompletionString(
S, Context, *Allocator, CCTUInfo,
CodeCompleteOpts.IncludeBriefComments);
assert(CCS && "Expected the CodeCompletionString to be non-null");
Items.items.push_back(ProcessCodeCompleteResult(Candidate, *CCS));
Candidates.pop();
}
std::reverse(Items.items.begin(), Items.items.end());
}

GlobalCodeCompletionAllocator &getAllocator() override { return *Allocator; }

		CodeCompletionAllocator &getAllocator() override { return *CCAllocator; }
CodeCompletionTUInfo &getCodeCompletionTUInfo() override { return CCTUInfo; }		CodeCompletionTUInfo &getCodeCompletionTUInfo() override { return CCTUInfo; }

private:		// Returns the filtering/sorting name for Result, which must be from Results.
llvm::Optional<float> fuzzyMatch(Sema &S, const CodeCompletionContext &CCCtx,		// Returned string is owned by this recorder (or the AST).
FuzzyMatcher &Filter,		llvm::StringRef getName(const CodeCompletionResult &Result) {
CodeCompletionResult Result) {
switch (Result.Kind) {		switch (Result.Kind) {
case CodeCompletionResult::RK_Declaration:		case CodeCompletionResult::RK_Declaration:
if (auto *ID = Result.Declaration->getIdentifier())		if (auto *ID = Result.Declaration->getIdentifier())
return Filter.match(ID->getName());		return ID->getName();
break;		break;
case CodeCompletionResult::RK_Keyword:		case CodeCompletionResult::RK_Keyword:
return Filter.match(Result.Keyword);		return Result.Keyword;
case CodeCompletionResult::RK_Macro:		case CodeCompletionResult::RK_Macro:
return Filter.match(Result.Macro->getName());		return Result.Macro->getName();
case CodeCompletionResult::RK_Pattern:		case CodeCompletionResult::RK_Pattern:
return Filter.match(Result.Pattern->getTypedText());		return Result.Pattern->getTypedText();
}		}
auto *CCS = Result.CreateCodeCompletionString(		auto CCS = codeCompletionString(Result, /IncludeBriefComments=*/false);
S, CCCtx, Allocator, CCTUInfo, /IncludeBriefComments=*/false);		return CCS->getTypedText();
return Filter.match(CCS->getTypedText());
}		}

CompletionItem		// Build a CodeCompletion string for R, which must be from Results.
ProcessCodeCompleteResult(const CompletionCandidate &Candidate,		// The CCS will be owned by this recorder.
const CodeCompletionString &CCS) const {		CodeCompletionString *codeCompletionString(const CodeCompletionResult &R,
		bool IncludeBriefComments) {
		// CodeCompletionResult doesn't seem to be const-correct. We own it, anyway.
		return const_cast<CodeCompletionResult &>(R).CreateCodeCompletionString(
		CCSema, CCContext, CCAllocator, CCTUInfo, IncludeBriefComments);
		}

// Adjust this to InsertTextFormat::Snippet iff we encounter a		private:
// CK_Placeholder chunk in SnippetCompletionItemsCollector.		CodeCompleteOptions Opts;
CompletionItem Item;		std::shared_ptr<GlobalCodeCompletionAllocator> CCAllocator;
		CodeCompletionTUInfo CCTUInfo;
Item.documentation = getDocumentation(CCS);		};
Item.sortText = Candidate.sortText();
Item.scoreInfo = Candidate.Scores;

Item.detail = getDetail(CCS);
Item.filterText = getFilterText(CCS);
getLabelAndInsertText(CCS, &Item.label, &Item.insertText, EnableSnippets);

Item.insertTextFormat = EnableSnippets ? InsertTextFormat::Snippet		// Tracks a bounded number of candidates with the best scores.
: InsertTextFormat::PlainText;		class TopN {
		public:
		using value_type = std::pair<CompletionCandidate, CompletionItemScores>;
		static constexpr size_t Unbounded = std::numeric_limits<size_t>::max();

		TopN(size_t N) : N(N) {}

// Fill in the kind field of the CompletionItem.		// Adds a candidate to the set.
Item.kind = toCompletionItemKind(Candidate.Result->Kind,		// Returns true if a candidate was dropped to get back under N.
Candidate.Result->CursorKind);		bool push(value_type &&V) {
		bool Dropped = false;
		if (Heap.size() >= N) {
		Dropped = true;
		if (N > 0 && greater(V, Heap.front())) {
		std::pop_heap(Heap.begin(), Heap.end(), greater);
		Heap.back() = std::move(V);
		std::push_heap(Heap.begin(), Heap.end(), greater);
		}
		} else {
		Heap.push_back(std::move(V));
		std::push_heap(Heap.begin(), Heap.end(), greater);
		}
		assert(Heap.size() <= N);
		assert(std::is_heap(Heap.begin(), Heap.end(), greater));
		return Dropped;
		}

return Item;		// Returns candidates from best to worst.
		std::vector<value_type> items() && {
		ioericUnsubmitted Done Reply Inline Actions Maybe `dropped()`? ioeric: Maybe `dropped()`?
		std::sort_heap(Heap.begin(), Heap.end(), greater);
		assert(Heap.size() <= N);
		return std::move(Heap);
}		}

CodeCompleteOptions ClangdOpts;		private:
CompletionList &Items;		static bool greater(const value_type &L, const value_type &R) {
std::shared_ptr<clang::GlobalCodeCompletionAllocator> Allocator;		if (L.second.finalScore != R.second.finalScore)
CodeCompletionTUInfo CCTUInfo;		return L.second.finalScore > R.second.finalScore;
NameToComplete &CompletedName;		return L.first.Name < R.first.Name; // Earlier name is better.
bool EnableSnippets;		}
}; // CompletionItemsCollector
		const size_t N;
		std::vector<value_type> Heap; // Min-heap, comparator is greater().
		};

class SignatureHelpCollector final : public CodeCompleteConsumer {		class SignatureHelpCollector final : public CodeCompleteConsumer {

public:		public:
SignatureHelpCollector(const clang::CodeCompleteOptions &CodeCompleteOpts,		SignatureHelpCollector(const clang::CodeCompleteOptions &CodeCompleteOpts,
SignatureHelp &SigHelp)		SignatureHelp &SigHelp)
: CodeCompleteConsumer(CodeCompleteOpts, /OutputIsBinary=/false),		: CodeCompleteConsumer(CodeCompleteOpts, /OutputIsBinary=/false),
SigHelp(SigHelp),		SigHelp(SigHelp),
▲ Show 20 Lines • Show All 80 Lines • ▼ Show 20 Lines	private:
}		}

SignatureHelp &SigHelp;		SignatureHelp &SigHelp;
std::shared_ptr<clang::GlobalCodeCompletionAllocator> Allocator;		std::shared_ptr<clang::GlobalCodeCompletionAllocator> Allocator;
CodeCompletionTUInfo CCTUInfo;		CodeCompletionTUInfo CCTUInfo;

}; // SignatureHelpCollector		}; // SignatureHelpCollector

bool invokeCodeComplete(const Context &Ctx,		struct SemaCompleteInput {
		PathRef FileName;
		const tooling::CompileCommand &Command;
		PrecompiledPreamble const *Preamble;
		StringRef Contents;
		Position Pos;
		IntrusiveRefCntPtr<vfs::FileSystem> VFS;
		std::shared_ptr<PCHContainerOperations> PCHs;
		};

		// Invokes Sema code completion on a file.
		// Callback will be invoked once completion is done, but before cleaning up.
		bool semaCodeComplete(const Context &Ctx,
std::unique_ptr<CodeCompleteConsumer> Consumer,		std::unique_ptr<CodeCompleteConsumer> Consumer,
const clang::CodeCompleteOptions &Options,		const clang::CodeCompleteOptions &Options,
PathRef FileName,		const SemaCompleteInput &Input,
const tooling::CompileCommand &Command,		llvm::function_ref<void()> Callback = nullptr) {
PrecompiledPreamble const *Preamble, StringRef Contents,
Position Pos, IntrusiveRefCntPtr<vfs::FileSystem> VFS,
std::shared_ptr<PCHContainerOperations> PCHs) {
std::vector<const char *> ArgStrs;		std::vector<const char *> ArgStrs;
for (const auto &S : Command.CommandLine)		for (const auto &S : Input.Command.CommandLine)
ArgStrs.push_back(S.c_str());		ArgStrs.push_back(S.c_str());

VFS->setCurrentWorkingDirectory(Command.Directory);		Input.VFS->setCurrentWorkingDirectory(Input.Command.Directory);

IgnoreDiagnostics DummyDiagsConsumer;		IgnoreDiagnostics DummyDiagsConsumer;
auto CI = createInvocationFromCommandLine(		auto CI = createInvocationFromCommandLine(
ArgStrs,		ArgStrs,
CompilerInstance::createDiagnostics(new DiagnosticOptions,		CompilerInstance::createDiagnostics(new DiagnosticOptions,
&DummyDiagsConsumer, false),		&DummyDiagsConsumer, false),
VFS);		Input.VFS);
assert(CI && "Couldn't create CompilerInvocation");		assert(CI && "Couldn't create CompilerInvocation");
CI->getFrontendOpts().DisableFree = false;		CI->getFrontendOpts().DisableFree = false;

std::unique_ptr<llvm::MemoryBuffer> ContentsBuffer =		std::unique_ptr<llvm::MemoryBuffer> ContentsBuffer =
llvm::MemoryBuffer::getMemBufferCopy(Contents, FileName);		llvm::MemoryBuffer::getMemBufferCopy(Input.Contents, Input.FileName);

// We reuse the preamble whether it's valid or not. This is a		// We reuse the preamble whether it's valid or not. This is a
// correctness/performance tradeoff: building without a preamble is slow, and		// correctness/performance tradeoff: building without a preamble is slow, and
// completion is latency-sensitive.		// completion is latency-sensitive.
if (Preamble) {		if (Input.Preamble) {
auto Bounds =		auto Bounds =
ComputePreambleBounds(*CI->getLangOpts(), ContentsBuffer.get(), 0);		ComputePreambleBounds(*CI->getLangOpts(), ContentsBuffer.get(), 0);
// FIXME(ibiryukov): Remove this call to CanReuse() after we'll fix		// FIXME(ibiryukov): Remove this call to CanReuse() after we'll fix
// clients relying on getting stats for preamble files during code		// clients relying on getting stats for preamble files during code
// completion.		// completion.
// Note that results of CanReuse() are ignored, see the comment above.		// Note that results of CanReuse() are ignored, see the comment above.
Preamble->CanReuse(*CI, ContentsBuffer.get(), Bounds, VFS.get());		Input.Preamble->CanReuse(*CI, ContentsBuffer.get(), Bounds,
		Input.VFS.get());
}		}
auto Clang = prepareCompilerInstance(		auto Clang = prepareCompilerInstance(
std::move(CI), Preamble, std::move(ContentsBuffer), std::move(PCHs),		std::move(CI), Input.Preamble, std::move(ContentsBuffer),
std::move(VFS), DummyDiagsConsumer);		std::move(Input.PCHs), std::move(Input.VFS), DummyDiagsConsumer);
auto &DiagOpts = Clang->getDiagnosticOpts();		auto &DiagOpts = Clang->getDiagnosticOpts();
DiagOpts.IgnoreWarnings = true;		DiagOpts.IgnoreWarnings = true;

auto &FrontendOpts = Clang->getFrontendOpts();		auto &FrontendOpts = Clang->getFrontendOpts();
FrontendOpts.SkipFunctionBodies = true;		FrontendOpts.SkipFunctionBodies = true;
FrontendOpts.CodeCompleteOpts = Options;		FrontendOpts.CodeCompleteOpts = Options;
FrontendOpts.CodeCompletionAt.FileName = FileName;		FrontendOpts.CodeCompletionAt.FileName = Input.FileName;
FrontendOpts.CodeCompletionAt.Line = Pos.line + 1;		FrontendOpts.CodeCompletionAt.Line = Input.Pos.line + 1;
FrontendOpts.CodeCompletionAt.Column = Pos.character + 1;		FrontendOpts.CodeCompletionAt.Column = Input.Pos.character + 1;

Clang->setCodeCompletionConsumer(Consumer.release());		Clang->setCodeCompletionConsumer(Consumer.release());

SyntaxOnlyAction Action;		SyntaxOnlyAction Action;
if (!Action.BeginSourceFile(*Clang, Clang->getFrontendOpts().Inputs[0])) {		if (!Action.BeginSourceFile(*Clang, Clang->getFrontendOpts().Inputs[0])) {
log(Ctx,		log(Ctx, "BeginSourceFile() failed when running codeComplete for " +
"BeginSourceFile() failed when running codeComplete for " + FileName);		Input.FileName);
return false;		return false;
}		}
if (!Action.Execute()) {		if (!Action.Execute()) {
log(Ctx, "Execute() failed when running codeComplete for " + FileName);		log(Ctx,
		"Execute() failed when running codeComplete for " + Input.FileName);
return false;		return false;
}		}

		if (Callback)
		Callback();
Action.EndSourceFile();		Action.EndSourceFile();

return true;		return true;
}		}

CompletionItem indexCompletionItem(const Symbol &Sym, llvm::StringRef Filter,		SpecifiedScope getSpecifiedScope(Sema &S, const CXXScopeSpec &SS) {
const SpecifiedScope &SSInfo,
llvm::StringRef DebuggingLabel = "") {
CompletionItem Item;
Item.kind = toCompletionItemKind(Sym.SymInfo.Kind);
// Add DebuggingLabel to the completion results if DebuggingLabel is not
// empty.
//
// For symbols from static index, there are prefix "[G]" in the
// results (which is used for debugging purpose).
// So completion list will be like:
// clang::symbol_from_dynamic_index
// [G]clang::symbol_from_static_index
//
// FIXME: Find out a better way to show the index source.
if (!DebuggingLabel.empty()) {
llvm::raw_string_ostream Label(Item.label);
Label << llvm::format("[%s]%s", DebuggingLabel.str().c_str(),
Sym.Name.str().c_str());
} else {
Item.label = Sym.Name;
}
// FIXME(ioeric): support inserting/replacing scope qualifiers.

// FIXME(ioeric): support snippets.
Item.insertText = Sym.CompletionPlainInsertText;
Item.insertTextFormat = InsertTextFormat::PlainText;
Item.filterText = Sym.Name;

// FIXME(ioeric): sort symbols appropriately.
Item.sortText = "";

if (Sym.Detail) {
Item.documentation = Sym.Detail->Documentation;
Item.detail = Sym.Detail->CompletionDetail;
}

return Item;
}

void completeWithIndex(const Context &Ctx, const SymbolIndex &Index,
llvm::StringRef Code, const SpecifiedScope &SSInfo,
llvm::StringRef Filter, CompletionList *Items,
llvm::StringRef DebuggingLabel = "") {
FuzzyFindRequest Req;
Req.Query = Filter;
// FIXME(ioeric): add more possible scopes based on using namespaces and
// containing namespaces.
StringRef Scope = SSInfo.Resolved.empty() ? SSInfo.Written : SSInfo.Resolved;
Req.Scopes = {Scope.trim(':').str()};

Items->isIncomplete \|= !Index.fuzzyFind(Ctx, Req, [&](const Symbol &Sym) {
Items->items.push_back(
indexCompletionItem(Sym, Filter, SSInfo, DebuggingLabel));
});
}

SpecifiedScope extraCompletionScope(Sema &S, const CXXScopeSpec &SS) {
SpecifiedScope Info;		SpecifiedScope Info;
auto &SM = S.getSourceManager();		auto &SM = S.getSourceManager();
auto SpecifierRange = SS.getRange();		auto SpecifierRange = SS.getRange();
Info.Written = Lexer::getSourceText(		Info.Written = Lexer::getSourceText(
CharSourceRange::getCharRange(SpecifierRange), SM, clang::LangOptions());		CharSourceRange::getCharRange(SpecifierRange), SM, clang::LangOptions());
if (SS.isValid()) {		if (SS.isValid()) {
DeclContext *DC = S.computeDeclContext(SS);		DeclContext *DC = S.computeDeclContext(SS);
if (auto *NS = llvm::dyn_cast<NamespaceDecl>(DC)) {		if (auto *NS = llvm::dyn_cast<NamespaceDecl>(DC)) {
Info.Resolved = NS->getQualifiedNameAsString();		Info.Resolved = NS->getQualifiedNameAsString();
} else if (llvm::dyn_cast<TranslationUnitDecl>(DC) != nullptr) {		} else if (llvm::dyn_cast<TranslationUnitDecl>(DC) != nullptr) {
Info.Resolved = "::";		Info.Resolved = "::";
// Sema does not include the suffix "::" in the range of SS, so we add		// Sema does not include the suffix "::" in the range of SS, so we add
// it back here.		// it back here.
Info.Written = "::";		Info.Written = "::";
}		}
}		}
return Info;		return Info;
}		}

		// Decides, from the Sema completion context kind alone, whether index-based
		// completion should be performed.
		// FIXME: consider allowing completion, but restricting the result types.
		bool allowIndex(enum CodeCompletionContext::Kind K) {
		  switch (K) {
		  // Kinds for which the index is not consulted.
		  case CodeCompletionContext::CCC_Other: // Be conservative.
		  case CodeCompletionContext::CCC_OtherWithMacros:
		  case CodeCompletionContext::CCC_Recovery:
		  case CodeCompletionContext::CCC_NaturalLanguage:
		  case CodeCompletionContext::CCC_DotMemberAccess:
		  case CodeCompletionContext::CCC_ArrowMemberAccess:
		  case CodeCompletionContext::CCC_ObjCPropertyAccess:
		  case CodeCompletionContext::CCC_ObjCInstanceMessage:
		  case CodeCompletionContext::CCC_ObjCClassMessage:
		  case CodeCompletionContext::CCC_SelectorName:
		  case CodeCompletionContext::CCC_TypeQualifiers:
		  case CodeCompletionContext::CCC_MacroName:
		  case CodeCompletionContext::CCC_MacroNameUse:
		  case CodeCompletionContext::CCC_PreprocessorExpression:
		  case CodeCompletionContext::CCC_PreprocessorDirective:
		    return false;

		  // Kinds for which index results are merged in.
		  case CodeCompletionContext::CCC_TopLevel:
		  case CodeCompletionContext::CCC_Statement:
		  case CodeCompletionContext::CCC_Expression:
		  case CodeCompletionContext::CCC_ParenthesizedExpression:
		  case CodeCompletionContext::CCC_Type:
		  case CodeCompletionContext::CCC_Namespace:
		  case CodeCompletionContext::CCC_Name: // FIXME: why does ns::^ give this?
		  case CodeCompletionContext::CCC_PotentiallyQualifiedName:
		  case CodeCompletionContext::CCC_ClassStructUnion:
		  case CodeCompletionContext::CCC_EnumTag:
		  case CodeCompletionContext::CCC_UnionTag:
		  case CodeCompletionContext::CCC_ClassOrStructTag:
		  case CodeCompletionContext::CCC_ObjCInterface:
		  case CodeCompletionContext::CCC_ObjCImplementation:
		  case CodeCompletionContext::CCC_ObjCIvarList:
		  case CodeCompletionContext::CCC_ObjCMessageReceiver:
		  case CodeCompletionContext::CCC_ObjCProtocolName:
		  case CodeCompletionContext::CCC_ObjCInterfaceName:
		  case CodeCompletionContext::CCC_ObjCCategoryName:
		    return true;
		  }
		  // Reached only for a kind that neither group above lists.
		  llvm_unreachable("unknown code completion context");
		}

} // namespace		} // namespace

clang::CodeCompleteOptions CodeCompleteOptions::getClangCompleteOpts() const {		clang::CodeCompleteOptions CodeCompleteOptions::getClangCompleteOpts() const {
clang::CodeCompleteOptions Result;		clang::CodeCompleteOptions Result;
Result.IncludeCodePatterns = EnableSnippets && IncludeCodePatterns;		Result.IncludeCodePatterns = EnableSnippets && IncludeCodePatterns;
Result.IncludeMacros = IncludeMacros;		Result.IncludeMacros = IncludeMacros;
Result.IncludeGlobals = true;		Result.IncludeGlobals = true;
Result.IncludeBriefComments = IncludeBriefComments;		Result.IncludeBriefComments = IncludeBriefComments;

// When an index is used, Sema is responsible for completing the main file,		// When an index is used, Sema is responsible for completing the main file,
// the index can provide results from the preamble.		// the index can provide results from the preamble.
// Tell Sema not to deserialize the preamble to look for results.		// Tell Sema not to deserialize the preamble to look for results.
Result.LoadExternal = !Index;		Result.LoadExternal = !Index;

return Result;		return Result;
}		}

		// Runs Sema-based (AST) and Index-based completion, returns merged results.
		//
		// There are a few tricky considerations:
		// - the AST provides information needed for the index query (e.g. which
		// namespaces to search in). So Sema must start first.
		// - we only want to return the top results (Opts.Limit).
		// Building CompletionItems for everything else is wasteful, so we want to
		// preserve the "native" format until we're done with scoring.
		// - the data underlying Sema completion items is owned by the AST and various
		// other arenas, which must stay alive for us to build CompletionItems.
		// - we may get duplicate results from Sema and the Index, we need to merge.
		//
		// So we start Sema completion first, but defer its cleanup until we're done.
		// We use the Sema context information to query the index.
		// Then we merge the two result sets, producing items that are Sema/Index/Both.
		// These items are scored, and the top N are synthesized into the LSP response.
		// Finally, we can clean up the data structures created by Sema completion.
		//
		// Main collaborators are:
		// - semaCodeComplete sets up the compiler machinery to run code completion.
		// - CompletionRecorder captures Sema completion results, including context.
		// - SymbolIndex (Opts.Index) provides index completion results as Symbols
		// - CompletionCandidates are the result of merging Sema and Index results.
		// Each candidate points to an underlying CodeCompletionResult (Sema), a
		// Symbol (Index), or both. It computes the result quality score.
		// CompletionCandidate also does conversion to CompletionItem (at the end).
		// - FuzzyMatcher scores how the candidate matches the partial identifier.
		// This score is combined with the result quality score for the final score.
		// - TopN determines the results with the best score.
		class CodeCompleteFlow {
		const Context &Ctx;
		const CodeCompleteOptions &Opts;
		// Sema takes ownership of Recorder. Recorder is valid until Sema cleanup.
		std::unique_ptr<CompletionRecorder> RecorderOwner;
		CompletionRecorder &Recorder;
		int NSema = 0, NIndex = 0, NBoth = 0; // Counters for logging.
		bool Incomplete = false; // Would more be available with a higher limit?
		ioericUnsubmitted Not Done Reply Inline Actions `InComplete` can probably be output variable of `queryIndex` and `addCandidate` instead of a state? ioeric: `InComplete` can probably be output variable of `queryIndex` and `addCandidate` instead of a…
		sammccallAuthorUnsubmitted Not Done Reply Inline Actions Certainly it can (it needs to be an out-param, because these functions already have primary return values). Just as these could all be free functions :-) I tried it out - I find the out-params are a bit messy/hard to read, and they'd need to be added to `mergeResults`, `queryIndex` and `addCandidate`. It adds quite a lot of noise, and I'm not sure on balance emphasizing the flow of IsIncomplete is worth obscuring the flow of the results themselves. If you disagree, let me know (or just change it!) sammccall: Certainly it can (it needs to be an out-param, because these functions already have primary…
		llvm::Optional<FuzzyMatcher> Filter; // Initialized once Sema runs.

		public:
		// A CodeCompleteFlow object is only useful for calling run() exactly once.
		// Recorder is bound to the object held by RecorderOwner; run() keeps using
		// that reference after it moves RecorderOwner into semaCodeComplete.
		CodeCompleteFlow(const Context &Ctx, const CodeCompleteOptions &Opts)
		: Ctx(Ctx), Opts(Opts), RecorderOwner(new CompletionRecorder(Opts)),
		Recorder(*RecorderOwner) {}

		// Runs Sema code completion and, from inside its callback, the index query
		// and merge (runWithSema). Returns the resulting completion list.
		// Rvalue-qualified because it moves RecorderOwner away: call it only once.
		CompletionList run(const SemaCompleteInput &SemaCCInput) && {
		  // We run Sema code completion first. It builds an AST and calculates:
		  //  - completion results based on the AST. These are saved for merging.
		  //  - partial identifier and context. We need these for the index query.
		  CompletionList Output;
		  semaCodeComplete(Ctx, std::move(RecorderOwner), Opts.getClangCompleteOpts(),
		                   SemaCCInput, [&] {
		                     // CCSema is only set if Sema invoked the recorder.
		                     if (Recorder.CCSema)
		                       Output = runWithSema();
		                     else
		                       log(Ctx, "Code complete: no Sema callback, 0 results");
		                   });

		  log(Ctx,
		      llvm::formatv("Code complete: {0} results from Sema, {1} from Index, "
		                    "{2} matched, {3} returned{4}.",
		                    NSema, NIndex, NBoth, Output.items.size(),
		                    Output.isIncomplete ? " (incomplete)" : ""));
		  // A Limit of 0 means "unbounded"; otherwise we must not exceed it.
		  assert(!Opts.Limit || Output.items.size() <= Opts.Limit);
		  // We don't assert that isIncomplete means we hit a limit.
		  // Indexes may choose to impose their own limits even if we don't have one.
		  return Output;
		}

		private:
		// Invoked from run()'s callback once Sema has produced its results but
		// before the Sema data structures are torn down. All the real work is here:
		// build the filter, query the index, merge and rank, convert to LSP items.
		CompletionList runWithSema() {
		  Filter = FuzzyMatcher(
		      Recorder.CCSema->getPreprocessor().getCodeCompletionFilter());
		  // Sema provides the needed context to query the index.
		  // FIXME: in addition to querying for extra/overlapping symbols, we should
		  // explicitly request symbols corresponding to Sema results.
		  // We can use their signals even if the index can't suggest them.
		  // We must copy index results to preserve them, but there are at most Limit.
		  SymbolSlab FromIndex = queryIndex();
		  // Combine both sources, score every candidate and keep only the winners.
		  auto Ranked = mergeResults(Recorder.Results, FromIndex);
		  // Turn each surviving (candidate, scores) pair into an LSP CompletionItem.
		  CompletionList Output;
		  for (auto &Entry : Ranked) {
		    const CompletionCandidate &Candidate = Entry.first;
		    const CompletionItemScores &Scores = Entry.second;
		    Output.items.push_back(toCompletionItem(Candidate, Scores));
		  }
		  Output.isIncomplete = Incomplete;
		  return Output;
		}

		// Queries Opts.Index for symbols matching the partial identifier.
		// Returns an empty slab when no index is configured or when allowIndex()
		// rejects the current completion context. Sets Incomplete if fuzzyFind
		// returns false (presumably: the index had more matches than it reported).
		SymbolSlab queryIndex() {
		  if (!Opts.Index || !allowIndex(Recorder.CCContext.getKind()))
		    return SymbolSlab();
		  SymbolSlab::Builder ResultsBuilder;
		  // Build the query.
		  FuzzyFindRequest Req;
		  Req.Query = Filter->pattern();
		  // If the user typed a scope, e.g. a::b::xxx(), restrict to that scope.
		  // FIXME(ioeric): add scopes based on using directives and enclosing ns.
		  if (auto SS = Recorder.CCContext.getCXXScopeSpecifier()) {
		    Req.Scopes = {getSpecifiedScope(Recorder.CCSema, *SS).forIndex()};
		  } else {
		    // Unless the user typed a ns qualifier, complete in global scope only.
		    // FIXME: once we know what namespaces are in scope (D42073), use those.
		    // FIXME: once we can insert namespace qualifiers and use the in-scope
		    // namespaces for scoring, search in all namespaces.
		    Req.Scopes = {""};
		  }
		  // Run the query against the index, copying each hit into our own slab.
		  Incomplete |= !Opts.Index->fuzzyFind(
		      Ctx, Req, [&](const Symbol &Sym) { ResultsBuilder.insert(Sym); });
		  return std::move(ResultsBuilder).build();
		}

		// Merges the Sema and Index results where possible, scores them, and
		// returns the top results from best to worst.
		//
		// SemaResults: completion results recorded from Sema.
		// IndexResults: symbols returned by the index query.
		// A Sema result and an index symbol are merged into one candidate when
		// getSymbolID() of the Sema result is found in IndexResults.
		std::vector<std::pair<CompletionCandidate, CompletionItemScores>>
		mergeResults(const std::vector<CodeCompletionResult> &SemaResults,
		             const SymbolSlab &IndexResults) {
		  // We only keep the best N results at any time, in "native" format.
		  TopN Top(Opts.Limit == 0 ? TopN::Unbounded : Opts.Limit);
		  // Index symbols already attached to a Sema result; these must not be
		  // emitted a second time as index-only candidates.
		  llvm::DenseSet<const Symbol *> UsedIndexResults;
		  auto CorrespondingIndexResult =
		      [&](const CodeCompletionResult &SemaResult) -> const Symbol * {
		    if (auto SymID = getSymbolID(SemaResult)) {
		      auto I = IndexResults.find(*SymID);
		      if (I != IndexResults.end()) {
		        UsedIndexResults.insert(&*I);
		        return &*I;
		      }
		    }
		    return nullptr;
		  };
		  // Emit all Sema results, merging them with Index results if possible.
		  // Iterate the parameter (not Recorder.Results) so the function only
		  // depends on what the caller passed in.
		  for (const auto &SemaResult : SemaResults)
		    addCandidate(Top, &SemaResult, CorrespondingIndexResult(SemaResult));
		  // Now emit any Index-only results.
		  // Review note (hokein / sammccall): llvm::set_difference was suggested
		  // here, but the value types differ (Symbol vs Symbol*), so we filter by
		  // hand.
		  for (const auto &IndexResult : IndexResults) {
		    if (UsedIndexResults.count(&IndexResult))
		      continue;
		    addCandidate(Top, /*SemaResult=*/nullptr, &IndexResult);
		  }
		  return std::move(Top).items();
		}

		// Scores a candidate and adds it to the TopN structure.
		//
		// SemaResult / IndexResult: the underlying results; either may be null, but
		// not both. Candidates whose name does not match the fuzzy filter are
		// dropped without touching the counters. Incomplete is set when
		// Candidates.push() returns true (presumably: a candidate was discarded
		// because of the limit - confirm against TopN).
		void addCandidate(TopN &Candidates, const CodeCompletionResult *SemaResult,
		                  const Symbol *IndexResult) {
		  // *SemaResult is dereferenced below whenever IndexResult is null.
		  assert((SemaResult || IndexResult) && "candidate needs a Sema or Index result");
		  CompletionCandidate C;
		  C.SemaResult = SemaResult;
		  C.IndexResult = IndexResult;
		  // Prefer the index's name when we have one; otherwise ask the recorder.
		  C.Name = IndexResult ? IndexResult->Name : Recorder.getName(*SemaResult);

		  CompletionItemScores Scores;
		  auto FuzzyScore = Filter->match(C.Name);
		  if (!FuzzyScore)
		    return; // Name doesn't match the typed pattern at all.
		  Scores.filterScore = *FuzzyScore;
		  Scores.symbolScore = C.score();
		  // We score candidates by multiplying symbolScore ("quality" of the result)
		  // with filterScore (how well it matched the query).
		  // This is sensitive to the distribution of both component scores!
		  Scores.finalScore = Scores.filterScore * Scores.symbolScore;

		  // Counters are for the log line emitted by run().
		  NSema += bool(SemaResult);
		  NIndex += bool(IndexResult);
		  NBoth += SemaResult && IndexResult;
		  Incomplete |= Candidates.push({C, Scores});
		}

		// Converts a scored candidate into an LSP CompletionItem. A
		// CodeCompletionString is only requested from the recorder when the
		// candidate carries a Sema result; index-only candidates pass nullptr.
		CompletionItem toCompletionItem(const CompletionCandidate &Candidate,
		                                const CompletionItemScores &Scores) {
		  const auto *FromSema = Candidate.SemaResult;
		  CodeCompletionString *SemaCCS =
		      FromSema ? Recorder.codeCompletionString(*FromSema,
		                                               Opts.IncludeBriefComments)
		               : nullptr;
		  return Candidate.build(Scores, Opts, SemaCCS);
		}
		};

// Entry point for code completion at Pos in Contents. In the new revision (right column) it builds a CodeCompleteFlow and returns the result of run(); in the old revision (left column) it calls invokeCodeComplete and then completeWithIndex.
CompletionList codeComplete(const Context &Ctx, PathRef FileName,		CompletionList codeComplete(const Context &Ctx, PathRef FileName,
		ioericUnsubmitted Not Done Reply Inline Actions The overall behavior looks good. And the comments really help understand the code! As chatted offline, we might want to break down this function, and a class that book-keeps all the states might be helpful. ioeric: The overall behavior looks good. And the comments really help understand the code! As chatted…
const tooling::CompileCommand &Command,		const tooling::CompileCommand &Command,
PrecompiledPreamble const *Preamble,		PrecompiledPreamble const *Preamble,
StringRef Contents, Position Pos,		StringRef Contents, Position Pos,
IntrusiveRefCntPtr<vfs::FileSystem> VFS,		IntrusiveRefCntPtr<vfs::FileSystem> VFS,
std::shared_ptr<PCHContainerOperations> PCHs,		std::shared_ptr<PCHContainerOperations> PCHs,
CodeCompleteOptions Opts) {		CodeCompleteOptions Opts) {
CompletionList Results;		return CodeCompleteFlow(Ctx, Opts).run(
NameToComplete CompletedName;		{FileName, Command, Preamble, Contents, Pos, VFS, PCHs});
auto Consumer =
llvm::make_unique<CompletionItemsCollector>(Opts, Results, CompletedName);
invokeCodeComplete(Ctx, std::move(Consumer), Opts.getClangCompleteOpts(),
FileName, Command, Preamble, Contents, Pos, std::move(VFS),
std::move(PCHs));

// Got scope specifier (ns::f^) for code completion from sema, try to query
// global symbols from indexes.
// FIXME: merge with Sema results, and respect limits.
if (CompletedName.SSInfo && Opts.Index)
completeWithIndex(Ctx, Opts.Index, Contents, CompletedName.SSInfo,
CompletedName.Filter, &Results, /DebuggingLabel=/"I");
return Results;
}		}

// Computes signature help at Pos in Contents by running code completion with a SignatureHelpCollector as the consumer. Globals, macros and code patterns are disabled; brief comments are enabled.
SignatureHelp signatureHelp(const Context &Ctx, PathRef FileName,		SignatureHelp signatureHelp(const Context &Ctx, PathRef FileName,
const tooling::CompileCommand &Command,		const tooling::CompileCommand &Command,
PrecompiledPreamble const *Preamble,		PrecompiledPreamble const *Preamble,
StringRef Contents, Position Pos,		StringRef Contents, Position Pos,
IntrusiveRefCntPtr<vfs::FileSystem> VFS,		IntrusiveRefCntPtr<vfs::FileSystem> VFS,
std::shared_ptr<PCHContainerOperations> PCHs) {		std::shared_ptr<PCHContainerOperations> PCHs) {
SignatureHelp Result;		SignatureHelp Result;
clang::CodeCompleteOptions Options;		clang::CodeCompleteOptions Options;
Options.IncludeGlobals = false;		Options.IncludeGlobals = false;
Options.IncludeMacros = false;		Options.IncludeMacros = false;
Options.IncludeCodePatterns = false;		Options.IncludeCodePatterns = false;
Options.IncludeBriefComments = true;		Options.IncludeBriefComments = true;
invokeCodeComplete(Ctx,		semaCodeComplete(
llvm::make_unique<SignatureHelpCollector>(Options, Result),		Ctx, llvm::make_unique<SignatureHelpCollector>(Options, Result), Options,
Options, FileName, Command, Preamble, Contents, Pos,		{FileName, Command, Preamble, Contents, Pos, std::move(VFS),
std::move(VFS), std::move(PCHs));		std::move(PCHs)});
return Result;		return Result;
}		}

} // namespace clangd		} // namespace clangd
} // namespace clang		} // namespace clang
		ioericUnsubmitted Done Reply Inline Actions I think we already only query namespace scopes now? ioeric: I think we already only query namespace scopes now?
		sammccallAuthorUnsubmitted Not Done Reply Inline Actions Nope, we never check the completion context kind, and I think I've seen cases where we end up completing when it's inappropriate. Fixed this (see the new `allowIndex()` check) and removed the fixme. sammccall: Nope, we never check the completion context kind, and I think I've seen cases where we end up…
		ioericUnsubmitted Done Reply Inline Actions It would be a bit more natural if the decision of building CCS is hidden in the candidate. Maybe pass in a callback for creating CCS from a sema result and let candidate decide whether to create CCS or not? This would also get rid of the constraint for `build`. ioeric: It would be a bit more natural if the decision of building CCS is hidden in the candidate.
		sammccallAuthorUnsubmitted Not Done Reply Inline Actions I agree, but trying this out I found it equally hard to read, and not as decoupled as I'd hope. So as discussed offline, sticking with the ugly-and-direct approach :-) sammccall: I agree, but trying this out I found it equally hard to read, and not as decoupled as I'd hope.
		ioericUnsubmitted Done Reply Inline Actions Would it make sense to move the score construction into `build`, by passing in necessary information in `Candidate.second`? ioeric: Would it make sense to move the score construction into `build`, by passing in necessary…
		ioericUnsubmitted Done Reply Inline Actions As discussed offline, we want to defer unqualified completion support (IIRC?) until we have enough information about visible scopes (i.e. after D42073). ioeric: As discussed offline, we want to defer unqualified completion support (IIRC?) until we have…
		sammccallAuthorUnsubmitted Not Done Reply Inline Actions Done - we now complete only symbols in the global scope. I added two FIXMEs describing how we can progressively make this better over time. Do they match your understanding? sammccall: Done - we now complete only symbols in the global scope. I added two FIXMEs describing how we…

clangd/FuzzyMatch.h

	Show All 29 Lines
	public:			public:
	// Characters beyond MaxPat are ignored.			// Characters beyond MaxPat are ignored.
	FuzzyMatcher(llvm::StringRef Pattern);			FuzzyMatcher(llvm::StringRef Pattern);

	// If Word matches the pattern, return a score in [0,1] (higher is better).			// If Word matches the pattern, return a score in [0,1] (higher is better).
	// Characters beyond MaxWord are ignored.			// Characters beyond MaxWord are ignored.
	llvm::Optional<float> match(llvm::StringRef Word);			llvm::Optional<float> match(llvm::StringRef Word);

	bool empty() { return PatN == 0; }			llvm::StringRef pattern() const { return llvm::StringRef(Pat, PatN); }
				bool empty() const { return PatN == 0; }

	// Dump internal state from the last match() to the stream, for debugging.			// Dump internal state from the last match() to the stream, for debugging.
	// Returns the pattern with [] around matched characters, e.g.			// Returns the pattern with [] around matched characters, e.g.
	// [u_p] + "unique_ptr" --> "[u]nique[_p]tr"			// [u_p] + "unique_ptr" --> "[u]nique[_p]tr"
	llvm::SmallString<256> dumpLast(llvm::raw_ostream &) const;			llvm::SmallString<256> dumpLast(llvm::raw_ostream &) const;

	private:			private:
	// We truncate the pattern and the word to bound the cost of matching.			// We truncate the pattern and the word to bound the cost of matching.
	▲ Show 20 Lines • Show All 44 Lines • Show Last 20 Lines

unittests/clangd/CodeCompleteTests.cpp

Show All 11 Lines
#include "CodeComplete.h"		#include "CodeComplete.h"
#include "Compiler.h"		#include "Compiler.h"
#include "Context.h"		#include "Context.h"
#include "Matchers.h"		#include "Matchers.h"
#include "Protocol.h"		#include "Protocol.h"
#include "SourceCode.h"		#include "SourceCode.h"
#include "TestFS.h"		#include "TestFS.h"
#include "index/MemIndex.h"		#include "index/MemIndex.h"
#include "index/Merge.h"
#include "gmock/gmock.h"		#include "gmock/gmock.h"
#include "gtest/gtest.h"		#include "gtest/gtest.h"

namespace clang {		namespace clang {
namespace clangd {		namespace clangd {
// Let GMock print completion items and signature help.		// Let GMock print completion items and signature help.
void PrintTo(const CompletionItem &I, std::ostream *O) {		void PrintTo(const CompletionItem &I, std::ostream *O) {
llvm::raw_os_ostream OS(*O);		llvm::raw_os_ostream OS(*O);
▲ Show 20 Lines • Show All 48 Lines • ▼ Show 20 Lines
MATCHER_P(PlainText, Text, "") {		MATCHER_P(PlainText, Text, "") {
return arg.insertTextFormat == clangd::InsertTextFormat::PlainText &&		return arg.insertTextFormat == clangd::InsertTextFormat::PlainText &&
arg.insertText == Text;		arg.insertText == Text;
}		}
MATCHER_P(Snippet, Text, "") {		MATCHER_P(Snippet, Text, "") {
return arg.insertTextFormat == clangd::InsertTextFormat::Snippet &&		return arg.insertTextFormat == clangd::InsertTextFormat::Snippet &&
arg.insertText == Text;		arg.insertText == Text;
}		}
MATCHER(FilterContainsName, "") {		MATCHER(NameContainsFilter, "") {
if (arg.filterText.empty())		if (arg.filterText.empty())
return true;		return true;
return llvm::StringRef(arg.insertText).contains(arg.filterText);		return llvm::StringRef(arg.insertText).contains(arg.filterText);
}		}
// Shorthand for Contains(Named(Name)).		// Shorthand for Contains(Named(Name)).
Matcher<const std::vector<CompletionItem> &> Has(std::string Name) {		Matcher<const std::vector<CompletionItem> &> Has(std::string Name) {
return Contains(Named(std::move(Name)));		return Contains(Named(std::move(Name)));
}		}
Show All 30 Lines	CompletionList completions(StringRef Text,
auto File = getVirtualTestFilePath("foo.cpp");		auto File = getVirtualTestFilePath("foo.cpp");
Annotations Test(Text);		Annotations Test(Text);
Server.addDocument(Context::empty(), File, Test.code()).wait();		Server.addDocument(Context::empty(), File, Test.code()).wait();
auto CompletionList =		auto CompletionList =
Server.codeComplete(Context::empty(), File, Test.point(), Opts)		Server.codeComplete(Context::empty(), File, Test.point(), Opts)
.get()		.get()
.second.Value;		.second.Value;
// Sanity-check that filterText is valid.		// Sanity-check that filterText is valid.
EXPECT_THAT(CompletionList.items, Each(FilterContainsName()));		EXPECT_THAT(CompletionList.items, Each(NameContainsFilter()));
return CompletionList;		return CompletionList;
}		}

		// Returns a copy of Haystack with every occurrence of Needle replaced by
		// Repl, scanning left to right (matches do not overlap).
		// An empty Needle yields Haystack unchanged.
		std::string replace(StringRef Haystack, StringRef Needle, StringRef Repl) {
		  // An empty needle matches everywhere and would never advance the scan.
		  if (Needle.empty())
		    return Haystack.str();
		  std::string Result;
		  size_t Begin = 0; // Start of the text not yet copied to Result.
		  for (size_t Hit = Haystack.find(Needle, Begin); Hit != StringRef::npos;
		       Hit = Haystack.find(Needle, Begin)) {
		    Result += Haystack.substr(Begin, Hit - Begin);
		    Result += Repl;
		    Begin = Hit + Needle.size();
		  }
		  // Copy whatever follows the last match (or everything, if none matched).
		  Result += Haystack.substr(Begin);
		  return Result;
		}

// Helpers to produce fake index symbols for memIndex() or completions().		// Helpers to produce fake index symbols for memIndex() or completions().
Symbol sym(StringRef QName, index::SymbolKind Kind) {		// USRFormat is a regex replacement string for the unqualified part of the USR.
		Symbol sym(StringRef QName, index::SymbolKind Kind, StringRef USRFormat) {
Symbol Sym;		Symbol Sym;
Sym.ID = SymbolID(QName);		std::string USR = "c:"; // We synthesize a few simple cases of USRs by hand!
size_t Pos = QName.rfind("::");		size_t Pos = QName.rfind("::");
if (Pos == llvm::StringRef::npos) {		if (Pos == llvm::StringRef::npos) {
Sym.Name = QName;		Sym.Name = QName;
Sym.Scope = "";		Sym.Scope = "";
} else {		} else {
Sym.Name = QName.substr(Pos + 2);		Sym.Name = QName.substr(Pos + 2);
Sym.Scope = QName.substr(0, Pos);		Sym.Scope = QName.substr(0, Pos);
		USR += "@N@" + replace(Sym.Scope, "::", "@N@"); // ns:: -> @N@ns
}		}
		USR += Regex("^.*$").sub(USRFormat, Sym.Name); // e.g. func -> @F@func#
		Sym.ID = SymbolID(USR);
Sym.CompletionPlainInsertText = Sym.Name;		Sym.CompletionPlainInsertText = Sym.Name;
		Sym.CompletionSnippetInsertText = Sym.Name;
Sym.CompletionLabel = Sym.Name;		Sym.CompletionLabel = Sym.Name;
Sym.SymInfo.Kind = Kind;		Sym.SymInfo.Kind = Kind;
return Sym;		return Sym;
}		}
Symbol func(StringRef Name) { return sym(Name, index::SymbolKind::Function); }		Symbol func(StringRef Name) { // Assumes the function has no args.
Symbol cls(StringRef Name) { return sym(Name, index::SymbolKind::Class); }		return sym(Name, index::SymbolKind::Function, "@F@\\0#"); // no args
Symbol var(StringRef Name) { return sym(Name, index::SymbolKind::Variable); }		}
		Symbol cls(StringRef Name) {
		return sym(Name, index::SymbolKind::Class, "@S@\\0@S@\\0");
		}
		Symbol var(StringRef Name) {
		return sym(Name, index::SymbolKind::Variable, "@\\0");
		}

TEST(CompletionTest, Limit) {		TEST(CompletionTest, Limit) {
clangd::CodeCompleteOptions Opts;		clangd::CodeCompleteOptions Opts;
Opts.Limit = 2;		Opts.Limit = 2;
auto Results = completions(R"cpp(		auto Results = completions(R"cpp(
struct ClassWithMembers {		struct ClassWithMembers {
int AAA();		int AAA();
int BBB();		int BBB();
▲ Show 20 Lines • Show All 57 Lines • ▼ Show 20 Lines	auto Results = completions(
struct LocalClass {};		struct LocalClass {};

/// Doc for local_var.		/// Doc for local_var.
int local_var;		int local_var;

ClassWithMembers().^		ClassWithMembers().^
}		}
)cpp",		)cpp",
/IndexSymbols=/{}, Opts);		{cls("IndexClass"), var("index_var"), func("index_func")}, Opts);

// Class members. The only items that must be present in after-dot		// Class members. The only items that must be present in after-dot
// completion.		// completion.
EXPECT_THAT(		EXPECT_THAT(
Results.items,		Results.items,
AllOf(Has(Opts.EnableSnippets ? "method()" : "method"), Has("field")));		AllOf(Has(Opts.EnableSnippets ? "method()" : "method"), Has("field")));
EXPECT_IFF(Opts.IncludeIneligibleResults, Results.items,		EXPECT_IFF(Opts.IncludeIneligibleResults, Results.items,
Has("private_field"));		Has("private_field"));
// Global items.		// Global items.
EXPECT_THAT(Results.items, Not(AnyOf(Has("global_var"), Has("global_func"),		EXPECT_THAT(
Has("global_func()"), Has("GlobalClass"),		Results.items,
Has("MACRO"), Has("LocalClass"))));		Not(AnyOf(Has("global_var"), Has("index_var"), Has("global_func"),
		Has("global_func()"), Has("index_func"), Has("GlobalClass"),
		Has("IndexClass"), Has("MACRO"), Has("LocalClass"))));
// There should be no code patterns (aka snippets) in after-dot		// There should be no code patterns (aka snippets) in after-dot
// completion. At least there aren't any we're aware of.		// completion. At least there aren't any we're aware of.
EXPECT_THAT(Results.items, Not(Contains(Kind(CompletionItemKind::Snippet))));		EXPECT_THAT(Results.items, Not(Contains(Kind(CompletionItemKind::Snippet))));
// Check documentation.		// Check documentation.
EXPECT_IFF(Opts.IncludeBriefComments, Results.items,		EXPECT_IFF(Opts.IncludeBriefComments, Results.items,
Contains(IsDocumented()));		Contains(IsDocumented()));
}		}

Show All 16 Lines	auto Results = completions(
struct LocalClass {};		struct LocalClass {};

/// Doc for local_var.		/// Doc for local_var.
int local_var;		int local_var;

^		^
}		}
)cpp",		)cpp",
/IndexSymbols=/{}, Opts);		{cls("IndexClass"), var("index_var"), func("index_func")}, Opts);

// Class members. Should never be present in global completions.		// Class members. Should never be present in global completions.
EXPECT_THAT(Results.items,		EXPECT_THAT(Results.items,
Not(AnyOf(Has("method"), Has("method()"), Has("field"))));		Not(AnyOf(Has("method"), Has("method()"), Has("field"))));
// Global items.		// Global items.
EXPECT_THAT(Results.items,		EXPECT_THAT(Results.items,
AllOf(Has("global_var"),		AllOf(Has("global_var"), Has("index_var"),
Has(Opts.EnableSnippets ? "global_func()" : "global_func"),		Has(Opts.EnableSnippets ? "global_func()" : "global_func"),
Has("GlobalClass")));		Has("index_func" /* our fake symbol doesn't include () */),
		Has("GlobalClass"), Has("IndexClass")));
// A macro.		// A macro.
EXPECT_IFF(Opts.IncludeMacros, Results.items, Has("MACRO"));		EXPECT_IFF(Opts.IncludeMacros, Results.items, Has("MACRO"));
// Local items. Must be present always.		// Local items. Must be present always.
EXPECT_THAT(Results.items,		EXPECT_THAT(Results.items,
AllOf(Has("local_var"), Has("LocalClass"),		AllOf(Has("local_var"), Has("LocalClass"),
Contains(Kind(CompletionItemKind::Snippet))));		Contains(Kind(CompletionItemKind::Snippet))));
// Check documentation.		// Check documentation.
EXPECT_IFF(Opts.IncludeBriefComments, Results.items,		EXPECT_IFF(Opts.IncludeBriefComments, Results.items,
▲ Show 20 Lines • Show All 102 Lines • ▼ Show 20 Lines	auto Results = completions(
)cpp",		)cpp",
/IndexSymbols=/{}, Opts);		/IndexSymbols=/{}, Opts);
EXPECT_THAT(Results.items,		EXPECT_THAT(Results.items,
HasSubsequence(Snippet("a"),		HasSubsequence(Snippet("a"),
Snippet("f(${1:int i}, ${2:const float f})")));		Snippet("f(${1:int i}, ${2:const float f})")));
}		}

TEST(CompletionTest, Kinds) {		TEST(CompletionTest, Kinds) {
auto Results = completions(R"cpp(		auto Results = completions(
		R"cpp(
#define MACRO X		#define MACRO X
int variable;		int variable;
struct Struct {};		struct Struct {};
int function();		int function();
int X = ^		int X = ^
)cpp");		)cpp",
EXPECT_THAT(Results.items, Has("function", CompletionItemKind::Function));		{func("indexFunction"), var("indexVariable"), cls("indexClass")});
EXPECT_THAT(Results.items, Has("variable", CompletionItemKind::Variable));		EXPECT_THAT(Results.items,
EXPECT_THAT(Results.items, Has("int", CompletionItemKind::Keyword));		AllOf(Has("function", CompletionItemKind::Function),
EXPECT_THAT(Results.items, Has("Struct", CompletionItemKind::Class));		Has("variable", CompletionItemKind::Variable),
EXPECT_THAT(Results.items, Has("MACRO", CompletionItemKind::Text));		Has("int", CompletionItemKind::Keyword),
		Has("Struct", CompletionItemKind::Class),
		Has("MACRO", CompletionItemKind::Text),
		Has("indexFunction", CompletionItemKind::Function),
		Has("indexVariable", CompletionItemKind::Variable),
		Has("indexClass", CompletionItemKind::Class)));

Results = completions("nam^");		Results = completions("nam^");
EXPECT_THAT(Results.items, Has("namespace", CompletionItemKind::Snippet));		EXPECT_THAT(Results.items, Has("namespace", CompletionItemKind::Snippet));
}		}

TEST(CompletionTest, NoDuplicates) {		TEST(CompletionTest, NoDuplicates) {
auto Items = completions(R"cpp(		auto Results = completions(
struct Adapter {		R"cpp(
		class Adapter {
void method();		void method();
};		};

void Adapter::method() {		void Adapter::method() {
Adapter^		Adapter^
}		}
)cpp")		)cpp",
.items;		{cls("Adapter")});

// Make sure there are no duplicate entries of 'Adapter'.		// Make sure there are no duplicate entries of 'Adapter'.
EXPECT_THAT(Items, ElementsAre(Named("Adapter"), Named("~Adapter")));		EXPECT_THAT(Results.items, ElementsAre(Named("Adapter"), Named("~Adapter")));
}

TEST(CompletionTest, FuzzyRanking) {
auto Items = completions(R"cpp(
struct fake { int BigBang, Babble, Ball; };
int main() { fake().bb^ }")cpp").items;
// BigBang is a better match than Babble. Ball doesn't match at all.
EXPECT_THAT(Items, ElementsAre(Named("BigBang"), Named("Babble")));
}		}

TEST(CompletionTest, NoIndex) {		TEST(CompletionTest, ScopedNoIndex) {
auto Results = completions(R"cpp(
namespace ns { class Local {}; }
void f() { ns::^ }
)cpp");
EXPECT_THAT(Results.items, Has("Local"));
}

TEST(CompletionTest, StaticAndDynamicIndex) {
clangd::CodeCompleteOptions Opts;
auto StaticIdx = memIndex({cls("ns::XYZ")});
auto DynamicIdx = memIndex({func("ns::foo")});
auto Merge = mergeIndex(DynamicIdx.get(), StaticIdx.get());
Opts.Index = Merge.get();

auto Results = completions(		auto Results = completions(
R"cpp(		R"cpp(
void f() { ::ns::^ }		namespace fake { int BigBang, Babble, Ball; };
)cpp",		int main() { fake::bb^ }
/IndexSymbols=/{}, Opts);		")cpp");
EXPECT_THAT(Results.items, Contains(Labeled("[I]XYZ")));		// BigBang is a better match than Babble. Ball doesn't match at all.
EXPECT_THAT(Results.items, Contains(Labeled("[I]foo")));		EXPECT_THAT(Results.items, ElementsAre(Named("BigBang"), Named("Babble")));
}		}

TEST(CompletionTest, IndexScope) {		TEST(CompletionTest, Scoped) {
auto Results = completions(		auto Results = completions(
R"cpp(		R"cpp(
namespace ns { int local; }		namespace fake { int Babble, Ball; };
void f() { ns::^ }		int main() { fake::bb^ }
)cpp",		")cpp",
{cls("ns::XYZ"), cls("nx::XYZ"), func("ns::foo")});		{var("fake::BigBang")});
EXPECT_THAT(Results.items,		EXPECT_THAT(Results.items, ElementsAre(Named("BigBang"), Named("Babble")));
UnorderedElementsAre(Named("XYZ"), Named("foo"), Named("local")));
}		}

TEST(CompletionTest, IndexBasedWithFilter) {		TEST(CompletionTest, ScopedWithFilter) {
auto Results = completions(		auto Results = completions(
R"cpp(		R"cpp(
void f() { ns::x^ }		void f() { ns::x^ }
)cpp",		)cpp",
{cls("ns::XYZ"), func("ns::foo")});		{cls("ns::XYZ"), func("ns::foo")});
EXPECT_THAT(Results.items,		EXPECT_THAT(Results.items,
UnorderedElementsAre(AllOf(Named("XYZ"), Filter("XYZ"))));		UnorderedElementsAre(AllOf(Named("XYZ"), Filter("XYZ"))));
}		}

TEST(CompletionTest, IndexGlobalQualified) {		TEST(CompletionTest, GlobalQualified) {
auto Results = completions(		auto Results = completions(
R"cpp(		R"cpp(
void f() { ::^ }		void f() { ::^ }
)cpp",		)cpp",
{cls("XYZ")});		{cls("XYZ")});
EXPECT_THAT(Results.items, AllOf(Has("XYZ", CompletionItemKind::Class),		EXPECT_THAT(Results.items, AllOf(Has("XYZ", CompletionItemKind::Class),
Has("f", CompletionItemKind::Function)));		Has("f", CompletionItemKind::Function)));
}		}

TEST(CompletionTest, IndexFullyQualifiedScope) {		TEST(CompletionTest, FullyQualified) {
auto Results = completions(		auto Results = completions(
R"cpp(		R"cpp(
		namespace ns { void bar(); }
void f() { ::ns::^ }		void f() { ::ns::^ }
)cpp",		)cpp",
{cls("ns::XYZ")});		{cls("ns::XYZ")});
EXPECT_THAT(Results.items, Has("XYZ", CompletionItemKind::Class));		EXPECT_THAT(Results.items, AllOf(Has("XYZ", CompletionItemKind::Class),
		Has("bar", CompletionItemKind::Function)));
		}

		TEST(CompletionTest, SemaIndexMerge) {
		auto Results = completions(
		R"cpp(
		namespace ns { int local; void both(); }
		void f() { ::ns::^ }
		)cpp",
		{func("ns::both"), cls("ns::Index")});
		// We get results from both index and sema, with no duplicates.
		EXPECT_THAT(
		Results.items,
		UnorderedElementsAre(Named("local"), Named("Index"), Named("both")));
}		}

TEST(CompletionTest, IndexSuppressesPreambleCompletions) {		TEST(CompletionTest, IndexSuppressesPreambleCompletions) {
MockFSProvider FS;		MockFSProvider FS;
MockCompilationDatabase CDB;		MockCompilationDatabase CDB;
IgnoreDiagnostics DiagConsumer;		IgnoreDiagnostics DiagConsumer;
ClangdServer Server(CDB, DiagConsumer, FS, getDefaultAsyncThreadsCount(),		ClangdServer Server(CDB, DiagConsumer, FS, getDefaultAsyncThreadsCount(),
/StorePreamblesInMemory=/true);		/StorePreamblesInMemory=/true);
▲ Show 20 Lines • Show All 145 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[clangd] Merge index-provided completions with those from Sema.
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 130607

clangd/CodeComplete.cpp

clangd/FuzzyMatch.h

unittests/clangd/CodeCompleteTests.cpp

This is an archive of the discontinued LLVM Phabricator instance.

[clangd] Merge index-provided completions with those from Sema.ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 130607

clangd/CodeComplete.cpp

clangd/FuzzyMatch.h

unittests/clangd/CodeCompleteTests.cpp

[clangd] Merge index-provided completions with those from Sema.
ClosedPublic