diff --git a/clang-tools-extra/clangd/SourceCode.h b/clang-tools-extra/clangd/SourceCode.h --- a/clang-tools-extra/clangd/SourceCode.h +++ b/clang-tools-extra/clangd/SourceCode.h @@ -262,6 +262,25 @@ std::vector visibleNamespaces(llvm::StringRef Code, const format::FormatStyle &Style); +// Represents locations that can accept a definition. +struct EligibleRegion { + /// Namespace that owns all of the EligiblePoints, e.g. + /// namespace a{ namespace b { ^ void foo();^} } + /// It will be “a::b” for both carrot locations. + std::string CurrentNamespace; + /// Offsets into the code marking eligible points to insert a function + /// definition. + std::vector EligiblePoints; +}; + +/// Returns most eligible region to insert a definition for FullyQualifiedName +/// in the Code. Pseudo parses Code under the hood to determine namespace decls +/// and possible insertion points. Choses the region that matches the longest +/// prefix of FullyQualifiedName. +EligibleRegion getEligibleRegion(llvm::StringRef Code, + llvm::StringRef FullyQualifiedName, + const format::FormatStyle &Style); + struct DefinedMacro { llvm::StringRef Name; const MacroInfo *Info; diff --git a/clang-tools-extra/clangd/SourceCode.cpp b/clang-tools-extra/clangd/SourceCode.cpp --- a/clang-tools-extra/clangd/SourceCode.cpp +++ b/clang-tools-extra/clangd/SourceCode.cpp @@ -20,9 +20,11 @@ #include "clang/Format/Format.h" #include "clang/Lex/Lexer.h" #include "clang/Lex/Preprocessor.h" +#include "clang/Lex/Token.h" #include "clang/Tooling/Core/Replacement.h" #include "llvm/ADT/ArrayRef.h" #include "llvm/ADT/None.h" +#include "llvm/ADT/STLExtras.h" #include "llvm/ADT/StringExtras.h" #include "llvm/ADT/StringMap.h" #include "llvm/ADT/StringRef.h" @@ -37,6 +39,9 @@ #include "llvm/Support/VirtualFileSystem.h" #include "llvm/Support/xxhash.h" #include +#include +#include +#include namespace clang { namespace clangd { @@ -327,7 +332,6 @@ } } - static unsigned getTokenLengthAtLoc(SourceLocation Loc, const SourceManager &SM, const LangOptions &LangOpts) { Token TheTok; @@ -646,9 +650,9 @@ return formatReplacements(Code, std::move(*CleanReplaces), Style); } -template -static void lex(llvm::StringRef Code, const format::FormatStyle &Style, - Action A) { +static void +lex(llvm::StringRef Code, const format::FormatStyle &Style, + llvm::function_ref A) { // FIXME: InMemoryFileAdapter crashes unless the buffer is null terminated! std::string NullTerminatedCode = Code.str(); SourceManagerForFile FileSM("dummy.cpp", NullTerminatedCode); @@ -658,16 +662,16 @@ Token Tok; while (!Lex.LexFromRawLexer(Tok)) - A(Tok); + A(Tok, sourceLocToPosition(SM, Tok.getLocation())); // LexFromRawLexer returns true after it lexes last token, so we still have // one more token to report. - A(Tok); + A(Tok, sourceLocToPosition(SM, Tok.getLocation())); } llvm::StringMap collectIdentifiers(llvm::StringRef Content, const format::FormatStyle &Style) { llvm::StringMap Identifiers; - lex(Content, Style, [&](const clang::Token &Tok) { + lex(Content, Style, [&](const clang::Token &Tok, const Position) { switch (Tok.getKind()) { case tok::identifier: ++Identifiers[Tok.getIdentifierInfo()->getName()]; @@ -683,15 +687,20 @@ } namespace { -enum NamespaceEvent { - BeginNamespace, // namespace {. Payload is resolved . - EndNamespace, // } // namespace . Payload is resolved *outer* namespace. - UsingDirective // using namespace . Payload is unresolved . +struct NamespaceEvent { + enum { + BeginNamespace, // namespace {. Payload is resolved . + EndNamespace, // } // namespace . Payload is resolved *outer* + // namespace. + UsingDirective // using namespace . Payload is unresolved . + } Trigger; + std::string Payload; + Position Pos; }; // Scans C++ source code for constructs that change the visible namespaces. -void parseNamespaceEvents( - llvm::StringRef Code, const format::FormatStyle &Style, - llvm::function_ref Callback) { +void parseNamespaceEvents(llvm::StringRef Code, + const format::FormatStyle &Style, + llvm::function_ref Callback) { // Stack of enclosing namespaces, e.g. {"clang", "clangd"} std::vector Enclosing; // Contains e.g. "clang", "clangd" @@ -708,8 +717,10 @@ } State = Default; std::string NSName; - lex(Code, Style, [&](const clang::Token &Tok) { - switch(Tok.getKind()) { + NamespaceEvent Event; + lex(Code, Style, [&](const clang::Token &Tok, const Position P) { + Event.Pos = std::move(P); + switch (Tok.getKind()) { case tok::raw_identifier: // In raw mode, this could be a keyword or a name. switch (State) { @@ -761,7 +772,9 @@ // Parsed: namespace { BraceStack.push_back(true); Enclosing.push_back(NSName); - Callback(BeginNamespace, llvm::join(Enclosing, "::")); + Event.Trigger = NamespaceEvent::BeginNamespace; + Event.Payload = llvm::join(Enclosing, "::"); + Callback(Event); } else { // This case includes anonymous namespaces (State = Namespace). // For our purposes, they're not namespaces and we ignore them. @@ -775,15 +788,20 @@ if (BraceStack.back()) { // Parsed: } // namespace Enclosing.pop_back(); - Callback(EndNamespace, llvm::join(Enclosing, "::")); + Event.Trigger = NamespaceEvent::EndNamespace; + Event.Payload = llvm::join(Enclosing, "::"); + Callback(Event); } BraceStack.pop_back(); } break; case tok::semi: - if (State == UsingNamespaceName) + if (State == UsingNamespaceName) { // Parsed: using namespace ; - Callback(UsingDirective, llvm::StringRef(NSName)); + Event.Trigger = NamespaceEvent::UsingDirective; + Event.Payload = std::move(NSName); + Callback(Event); + } State = Default; break; default: @@ -811,36 +829,34 @@ // Map from namespace to (resolved) namespaces introduced via using directive. llvm::StringMap> UsingDirectives; - parseNamespaceEvents(Code, Style, - [&](NamespaceEvent Event, llvm::StringRef NS) { - switch (Event) { - case BeginNamespace: - case EndNamespace: - Current = NS; - break; - case UsingDirective: - if (NS.consume_front("::")) - UsingDirectives[Current].insert(NS); - else { - for (llvm::StringRef Enclosing : - ancestorNamespaces(Current)) { - if (Enclosing.empty()) - UsingDirectives[Current].insert(NS); - else - UsingDirectives[Current].insert( - (Enclosing + "::" + NS).str()); - } - } - break; - } - }); + parseNamespaceEvents(Code, Style, [&](NamespaceEvent Event) { + llvm::StringRef NS = Event.Payload; + switch (Event.Trigger) { + case NamespaceEvent::BeginNamespace: + case NamespaceEvent::EndNamespace: + Current = std::move(Event.Payload); + break; + case NamespaceEvent::UsingDirective: + if (NS.consume_front("::")) + UsingDirectives[Current].insert(NS); + else { + for (llvm::StringRef Enclosing : ancestorNamespaces(Current)) { + if (Enclosing.empty()) + UsingDirectives[Current].insert(NS); + else + UsingDirectives[Current].insert((Enclosing + "::" + NS).str()); + } + } + break; + } + }); std::vector Found; for (llvm::StringRef Enclosing : ancestorNamespaces(Current)) { Found.push_back(Enclosing); auto It = UsingDirectives.find(Enclosing); if (It != UsingDirectives.end()) - for (const auto& Used : It->second) + for (const auto &Used : It->second) Found.push_back(Used.getKey()); } @@ -971,5 +987,53 @@ return llvm::Error::success(); } +EligibleRegion getEligibleRegion(llvm::StringRef Code, + llvm::StringRef FullyQualifiedName, + const format::FormatStyle &Style) { + EligibleRegion ER; + // Start with global namespace. + std::vector Enclosing = {""}; + // FIXME: In addition to namespaces try to generate events for function + // definitions as well. One might use a closing parantheses(")" followed by an + // opening brace "{" to trigger the start. + parseNamespaceEvents(Code, Style, [&](NamespaceEvent Event) { + // Using Directives only introduces declarations to current scope, they do + // not change the current namespace, so skip them. + if (Event.Trigger == NamespaceEvent::UsingDirective) + return; + // Do not qualify the global namespace. + if (!Event.Payload.empty()) + Event.Payload.append("::"); + + std::string CurrentNamespace; + if (Event.Trigger == NamespaceEvent::BeginNamespace) { + Enclosing.emplace_back(std::move(Event.Payload)); + CurrentNamespace = Enclosing.back(); + // parseNameSpaceEvents reports the beginning position of a token; we want + // to insert after '{', so increment by one. + ++Event.Pos.character; + } else { + // Event.Payload points to outer namespace when exiting a scope, so use + // the namespace we've last entered instead. + CurrentNamespace = std::move(Enclosing.back()); + Enclosing.pop_back(); + assert(Enclosing.back() == Event.Payload); + } + + // Ignore namespaces that are not a prefix of the target. + if (!FullyQualifiedName.startswith(CurrentNamespace)) + return; + + // Prefer the namespace that shares the longest prefix with target. + if (CurrentNamespace.size() > ER.CurrentNamespace.size()) { + ER.EligiblePoints.clear(); + ER.CurrentNamespace = CurrentNamespace; + } + if (CurrentNamespace.size() == ER.CurrentNamespace.size()) + ER.EligiblePoints.emplace_back(std::move(Event.Pos)); + }); + return ER; +} + } // namespace clangd } // namespace clang diff --git a/clang-tools-extra/clangd/unittests/SourceCodeTests.cpp b/clang-tools-extra/clangd/unittests/SourceCodeTests.cpp --- a/clang-tools-extra/clangd/unittests/SourceCodeTests.cpp +++ b/clang-tools-extra/clangd/unittests/SourceCodeTests.cpp @@ -19,6 +19,7 @@ #include "llvm/Testing/Support/Error.h" #include "gmock/gmock.h" #include "gtest/gtest.h" +#include namespace clang { namespace clangd { @@ -603,6 +604,66 @@ Test.llvm::Annotations::point("bar")); } +TEST(SourceCodeTests, GetEligibleRegion) { + constexpr std::tuple + Cases[] = { + {R"cpp(// FIXME: We should also mark positions before and after + //declarations/definitions as eligible. + namespace ns1 { + namespace a { namespace ns2 {} } + namespace ns2 {^ + void foo(); + namespace {} + void bar() {} + namespace ns3 {} + class T {}; + ^} + using namespace ns2; + })cpp", + "ns1::ns2::symbol", "ns1::ns2::"}, + {R"cpp( + namespace ns1 {^ + namespace a { namespace ns2 {} } + namespace b {} + namespace ns {} + ^})cpp", + "ns1::ns2::symbol", "ns1::"}, + {R"cpp( + namespace x { + namespace a { namespace ns2 {} } + namespace b {} + namespace ns {} + })cpp", + "ns1::ns2::symbol", ""}, + {R"cpp( + namespace ns1 { + namespace ns2 {^^} + namespace b {} + namespace ns2 {^^} + } + namespace ns1 {namespace ns2 {^^}})cpp", + "ns1::ns2::symbol", "ns1::ns2::"}, + {R"cpp( + namespace ns1 {^ + namespace ns {} + namespace b {} + namespace ns {} + ^} + namespace ns1 {^namespace ns {}^})cpp", + "ns1::ns2::symbol", "ns1::"}, + }; + for (auto Case : Cases) { + Annotations Test(std::get<0>(Case)); + + auto Res = getEligibleRegion(Test.code(), std::get<1>(Case), + format::getLLVMStyle()); + EXPECT_THAT(Res.EligiblePoints, testing::ElementsAreArray(Test.points())) + << Test.code(); + EXPECT_EQ(Res.CurrentNamespace, std::get<2>(Case)) << Test.code(); + } +} } // namespace } // namespace clangd } // namespace clang