diff --git a/clang-tools-extra/clangd/CollectMacros.h b/clang-tools-extra/clangd/CollectMacros.h --- a/clang-tools-extra/clangd/CollectMacros.h +++ b/clang-tools-extra/clangd/CollectMacros.h @@ -99,6 +99,18 @@ MainFileMacros &Out; }; +/// Represents a `#pragma mark` in the main file. +/// +/// There can be at most one pragma mark per line. +struct PragmaMark { + SourceLocation Loc; + std::string Trivia; +}; + +/// Collect all pragma marks from the main file. +std::unique_ptr +collectPragmaMarksCallback(const SourceManager &, std::vector &Out); + } // namespace clangd } // namespace clang diff --git a/clang-tools-extra/clangd/CollectMacros.cpp b/clang-tools-extra/clangd/CollectMacros.cpp --- a/clang-tools-extra/clangd/CollectMacros.cpp +++ b/clang-tools-extra/clangd/CollectMacros.cpp @@ -10,6 +10,24 @@ #include "clang/Basic/SourceLocation.h" #include "clang/Lex/Lexer.h" +namespace { +class CollectPragmaMarks : public clang::PPCallbacks { +public: + explicit CollectPragmaMarks(const clang::SourceManager &SM, + std::vector &Out) + : SM(SM), Out(Out) {} + void PragmaMark(clang::SourceLocation Loc, clang::StringRef Trivia) override { + if (clang::clangd::isInsideMainFile(Loc, SM)) { + Out.emplace_back(clang::clangd::PragmaMark{Loc, Trivia.str()}); + } + } + +private: + const clang::SourceManager &SM; + std::vector &Out; +}; +} // namespace + namespace clang { namespace clangd { @@ -30,5 +48,12 @@ else Out.UnknownMacros.push_back({Range, IsDefinition}); } + +std::unique_ptr +collectPragmaMarksCallback(const SourceManager &SM, + std::vector &Out) { + return std::make_unique(SM, Out); +} + } // namespace clangd } // namespace clang diff --git a/clang-tools-extra/clangd/FindSymbols.cpp b/clang-tools-extra/clangd/FindSymbols.cpp --- a/clang-tools-extra/clangd/FindSymbols.cpp +++ b/clang-tools-extra/clangd/FindSymbols.cpp @@ -523,9 +523,198 @@ ParsedAST &AST; }; +struct PragmaMarkSymbol { + DocumentSymbol DocSym; + bool IsGroup; +}; + +/// Merge in `PragmaMarkSymbols` into the given `DocumentSymbols`. All symbols +/// should be sorted in ascending order by range. +std::vector mergePragmas(std::vector &Syms, + ArrayRef &Pragmas, + Range ParentRange) { + std::vector Res; + size_t MarkIndex = 0; + bool HaveOpenMarkGroup = false; + auto It = Syms.begin(); + + while (It != Syms.end() && !Pragmas.empty()) { + auto &Sym = *It; + const auto &Pragma = Pragmas.front(); + + // Pragma mark is contained in the current symbol, we need to recurse to + // nest it inside the symbol. + if (Sym.range.contains(Pragma.DocSym.range)) { + Sym.children = mergePragmas(Sym.children, Pragmas, Sym.range); + continue; + } + // Pragma mark is after the current symbol. + if (Sym.range < Pragma.DocSym.range) { + if (HaveOpenMarkGroup) { // Sym belongs to the previous TextMark group. + unionRanges(Res[MarkIndex].range, Sym.range); + Res[MarkIndex].children.push_back(std::move(Sym)); + } else { // Sym doesn't belong to a group. + Res.push_back(std::move(Sym)); + } + It++; + continue; + } + // Pragma mark is before the current symbol, add in a node for the mark. + assert(Pragma.DocSym.range < Sym.range && "Mark should be before Sym"); + if (Pragma.IsGroup) { + MarkIndex = Res.size(); + HaveOpenMarkGroup = true; + } else { // New mark ends the previous group if one existed. + HaveOpenMarkGroup = false; + } + Res.push_back(std::move(Pragma.DocSym)); + Pragmas = Pragmas.drop_front(); + } + + // If we ran out of Symbols, we add any leftover marks as long as they are + // contained in our parent. Otherwise, we can't add them, since they belong + // to a different ancestor besides our parent. + while (!Pragmas.empty()) { + const auto &Pragma = Pragmas.back(); + if (!ParentRange.contains(Pragma.DocSym.range)) + break; + Res.push_back(std::move(Pragma.DocSym)); + Pragmas = Pragmas.drop_front(); + } + + // If we ran out of marks, but still have symbols left, add them. If we have + // a group open, leftover symbols belong to that group. + for (; It != Syms.end(); It++) { + auto &Sym = *It; + if (HaveOpenMarkGroup) { + unionRanges(Res[MarkIndex].range, Sym.range); + Res[MarkIndex].children.push_back(std::move(Sym)); + } else { + Res.push_back(std::move(Sym)); + } + } + return Res; +} + +/// Merge in `PragmaMarkSymbols` into the given `DocumentSymbols`. All symbols +/// should be sorted in ascending order by range. +std::vector mergePragmas2(std::vector &Syms, + ArrayRef &Pragmas, + Range ParentRange) { + std::vector Res; + auto It = Syms.begin(); + + while (!Pragmas.empty()) { + const auto &Pragma = Pragmas.front(); + // If the Pragma isn't contained in our parent, we're done, it must belong + // to a different ancestor. + if (!ParentRange.contains(Pragma.DocSym.range)) + break; + + // No more symbols left, just add the pragma. + if (It == Syms.end()) { + Res.push_back(std::move(Pragma.DocSym)); + Pragmas = Pragmas.drop_front(); + continue; + } + auto &Sym = *It; + + // Pragma mark is contained in the current symbol, we need to recurse to + // nest it inside the symbol. + if (Sym.range.contains(Pragma.DocSym.range)) { + Sym.children = mergePragmas2(Sym.children, Pragmas, Sym.range); + continue; + } + // Pragma mark is after the child node, so we can process the child, it + // doesn't belong to a group. + if (Sym.range < Pragma.DocSym.range) { + Res.push_back(std::move(Sym)); + It++; + continue; + } + // Pragma mark is before the current symbol, add in a node for the mark, and + // any Syms who should belong to the group, if it is one. + assert(Pragma.DocSym.range < Sym.range && "Mark should be before Sym"); + if (!Pragma.IsGroup) { + Res.push_back(std::move(Pragma.DocSym)); + Pragmas = Pragmas.drop_front(); + continue; + } + DocumentSymbol PragmaSym = Pragma.DocSym; + Pragmas = Pragmas.drop_front(); + // We've got a pragma which is a group. We add all Syms we encounter to our + // group until it ends; our group will end if there's a pragma after us + // which implicitly ends our group. + while (It != Syms.end() && PragmaSym.range < It->range) { + auto &Sym = *It; + if (Pragmas.empty() || + It->range < Pragmas.front().DocSym.range) { // Sym is ours. + unionRanges(PragmaSym.range, Sym.range); + PragmaSym.children.push_back(std::move(Sym)); + ++It; + continue; + } + const auto &NextPragma = Pragmas.front(); + // Next pragma is contained in the Sym, it belongs there and doesn't + // affect us at all. + if (Sym.range.contains(NextPragma.DocSym.range)) { + Sym.children = mergePragmas2(Sym.children, Pragmas, Sym.range); + continue; + } + // NextPragma is after us but before the next symbol. Our reign is over. + break; + } + Res.push_back(PragmaSym); + } + // If we ran out of marks, but still have symbols left, add them. + for (; It != Syms.end(); It++) { + Res.push_back(std::move(*It)); + } + return Res; +} + +PragmaMarkSymbol markToSymbol(const PragmaMark &P, const SourceManager &SM) { + StringRef Name = StringRef(P.Trivia).trim(); + bool IsGroup = false; + // "-\s+" or "" after an initial trim. The former is + // considered a group, the latter just a mark. We need to include a name + // here since editors won't properly render the symbol otherwise. + StringRef MaybeGroupName = Name; + if (MaybeGroupName.consume_front("-") && + (MaybeGroupName.ltrim() != MaybeGroupName || MaybeGroupName.empty())) { + Name = MaybeGroupName.empty() ? "(unnamed group)" : MaybeGroupName.ltrim(); + IsGroup = true; + } else if (Name.empty()) { + Name = "(unnamed mark)"; + } + DocumentSymbol Sym; + Sym.name = Name.str(); + Sym.kind = SymbolKind::File; + Position Start = sourceLocToPosition(SM, P.Loc); + Position End = {Start.line + 1, 0}; + Sym.range = Range{Start, End}; + Sym.selectionRange = Range{Start, End}; + return {Sym, IsGroup}; +} + std::vector collectDocSymbols(ParsedAST &AST) { - return DocumentOutline(AST).build(); + std::vector Syms = DocumentOutline(AST).build(); + + const auto &PragmaMarks = AST.getMarks(); + if (PragmaMarks.empty()) + return Syms; + + const auto &SM = AST.getSourceManager(); + std::vector Pragmas; + for (const auto &P : PragmaMarks) + Pragmas.push_back(markToSymbol(P, SM)); + Range EntireFile = { + {-1, -1}, + {std::numeric_limits::max(), std::numeric_limits::max()}}; + ArrayRef PragmasRef(Pragmas); + return mergePragmas2(Syms, PragmasRef, EntireFile); } + } // namespace llvm::Expected> getDocumentSymbols(ParsedAST &AST) { diff --git a/clang-tools-extra/clangd/FindTarget.cpp b/clang-tools-extra/clangd/FindTarget.cpp --- a/clang-tools-extra/clangd/FindTarget.cpp +++ b/clang-tools-extra/clangd/FindTarget.cpp @@ -652,7 +652,7 @@ void visitProtocolList( llvm::iterator_range Protocols, llvm::iterator_range Locations) { - for (const auto &P : llvm::zip(Protocols, Locations)) { + for (auto P : llvm::zip(Protocols, Locations)) { Refs.push_back(ReferenceLoc{NestedNameSpecifierLoc(), std::get<1>(P), /*IsDecl=*/false, diff --git a/clang-tools-extra/clangd/ParsedAST.h b/clang-tools-extra/clangd/ParsedAST.h --- a/clang-tools-extra/clangd/ParsedAST.h +++ b/clang-tools-extra/clangd/ParsedAST.h @@ -101,6 +101,8 @@ /// Gets all macro references (definition, expansions) present in the main /// file, including those in the preamble region. const MainFileMacros &getMacros() const; + /// Gets all pragma marks in the main file. + const std::vector &getMarks() const; /// Tokens recorded while parsing the main file. /// (!) does not have tokens from the preamble. const syntax::TokenBuffer &getTokens() const { return Tokens; } @@ -121,7 +123,8 @@ std::shared_ptr Preamble, std::unique_ptr Clang, std::unique_ptr Action, syntax::TokenBuffer Tokens, - MainFileMacros Macros, std::vector LocalTopLevelDecls, + MainFileMacros Macros, std::vector Marks, + std::vector LocalTopLevelDecls, llvm::Optional> Diags, IncludeStructure Includes, CanonicalIncludes CanonIncludes); @@ -144,6 +147,8 @@ /// All macro definitions and expansions in the main file. MainFileMacros Macros; + // Pragma marks in the main file. + std::vector Marks; // Data, stored after parsing. None if AST was built with a stale preamble. llvm::Optional> Diags; // Top-level decls inside the current file. Not that this does not include diff --git a/clang-tools-extra/clangd/ParsedAST.cpp b/clang-tools-extra/clangd/ParsedAST.cpp --- a/clang-tools-extra/clangd/ParsedAST.cpp +++ b/clang-tools-extra/clangd/ParsedAST.cpp @@ -436,6 +436,12 @@ std::make_unique(Clang->getSourceManager(), Macros)); + std::vector Marks; + if (Preamble) + Marks = Preamble->Marks; + Clang->getPreprocessor().addPPCallbacks( + collectPragmaMarksCallback(Clang->getSourceManager(), Marks)); + // Copy over the includes from the preamble, then combine with the // non-preamble includes below. CanonicalIncludes CanonIncludes; @@ -497,7 +503,7 @@ } return ParsedAST(Inputs.Version, std::move(Preamble), std::move(Clang), std::move(Action), std::move(Tokens), std::move(Macros), - std::move(ParsedDecls), std::move(Diags), + std::move(Marks), std::move(ParsedDecls), std::move(Diags), std::move(Includes), std::move(CanonIncludes)); } @@ -537,6 +543,7 @@ } const MainFileMacros &ParsedAST::getMacros() const { return Macros; } +const std::vector &ParsedAST::getMarks() const { return Marks; } std::size_t ParsedAST::getUsedBytes() const { auto &AST = getASTContext(); @@ -583,12 +590,14 @@ std::unique_ptr Clang, std::unique_ptr Action, syntax::TokenBuffer Tokens, MainFileMacros Macros, + std::vector Marks, std::vector LocalTopLevelDecls, llvm::Optional> Diags, IncludeStructure Includes, CanonicalIncludes CanonIncludes) : Version(Version), Preamble(std::move(Preamble)), Clang(std::move(Clang)), Action(std::move(Action)), Tokens(std::move(Tokens)), - Macros(std::move(Macros)), Diags(std::move(Diags)), + Macros(std::move(Macros)), Marks(std::move(Marks)), + Diags(std::move(Diags)), LocalTopLevelDecls(std::move(LocalTopLevelDecls)), Includes(std::move(Includes)), CanonIncludes(std::move(CanonIncludes)) { Resolver = std::make_unique(getASTContext()); diff --git a/clang-tools-extra/clangd/Preamble.h b/clang-tools-extra/clangd/Preamble.h --- a/clang-tools-extra/clangd/Preamble.h +++ b/clang-tools-extra/clangd/Preamble.h @@ -61,6 +61,8 @@ // Users care about headers vs main-file, not preamble vs non-preamble. // These should be treated as main-file entities e.g. for code completion. MainFileMacros Macros; + // Pragma marks defined in the preamble section of the main file. + std::vector Marks; // Cache of FS operations performed when building the preamble. // When reusing a preamble, this cache can be consumed to save IO. std::unique_ptr StatCache; diff --git a/clang-tools-extra/clangd/Preamble.cpp b/clang-tools-extra/clangd/Preamble.cpp --- a/clang-tools-extra/clangd/Preamble.cpp +++ b/clang-tools-extra/clangd/Preamble.cpp @@ -73,6 +73,8 @@ MainFileMacros takeMacros() { return std::move(Macros); } + std::vector takeMarks() { return std::move(Marks); } + CanonicalIncludes takeCanonicalIncludes() { return std::move(CanonIncludes); } bool isMainFileIncludeGuarded() const { return IsMainFileIncludeGuarded; } @@ -103,7 +105,9 @@ return std::make_unique( collectIncludeStructureCallback(*SourceMgr, &Includes), - std::make_unique(*SourceMgr, Macros)); + std::make_unique( + std::make_unique(*SourceMgr, Macros), + collectPragmaMarksCallback(*SourceMgr, Marks))); } CommentHandler *getCommentHandler() override { @@ -130,6 +134,7 @@ IncludeStructure Includes; CanonicalIncludes CanonIncludes; MainFileMacros Macros; + std::vector Marks; bool IsMainFileIncludeGuarded = false; std::unique_ptr IWYUHandler = nullptr; const clang::LangOptions *LangOpts = nullptr; @@ -387,6 +392,7 @@ Result->Diags = std::move(Diags); Result->Includes = CapturedInfo.takeIncludes(); Result->Macros = CapturedInfo.takeMacros(); + Result->Marks = CapturedInfo.takeMarks(); Result->CanonIncludes = CapturedInfo.takeCanonicalIncludes(); Result->StatCache = std::move(StatCache); Result->MainIsIncludeGuarded = CapturedInfo.isMainFileIncludeGuarded(); diff --git a/clang-tools-extra/clangd/SourceCode.h b/clang-tools-extra/clangd/SourceCode.h --- a/clang-tools-extra/clangd/SourceCode.h +++ b/clang-tools-extra/clangd/SourceCode.h @@ -129,6 +129,9 @@ // Note that clang also uses closed source ranges, which this can't handle! Range halfOpenToRange(const SourceManager &SM, CharSourceRange R); +// Expand range `A` to also contain `B`. +void unionRanges(Range &A, Range B); + // Converts an offset to a clang line/column (1-based, columns are bytes). // The offset must be in range [0, Code.size()]. // Prefer to use SourceManager if one is available. diff --git a/clang-tools-extra/clangd/SourceCode.cpp b/clang-tools-extra/clangd/SourceCode.cpp --- a/clang-tools-extra/clangd/SourceCode.cpp +++ b/clang-tools-extra/clangd/SourceCode.cpp @@ -471,6 +471,13 @@ return {Begin, End}; } +void unionRanges(Range &A, Range B) { + if (B.start < A.start) + A.start = B.start; + if (A.end < B.end) + A.end = B.end; +} + std::pair offsetToClangLineColumn(llvm::StringRef Code, size_t Offset) { Offset = std::min(Code.size(), Offset); diff --git a/clang-tools-extra/clangd/unittests/FindSymbolsTests.cpp b/clang-tools-extra/clangd/unittests/FindSymbolsTests.cpp --- a/clang-tools-extra/clangd/unittests/FindSymbolsTests.cpp +++ b/clang-tools-extra/clangd/unittests/FindSymbolsTests.cpp @@ -1027,6 +1027,105 @@ AllOf(WithName("-pur"), WithKind(SymbolKind::Method)))))); } +TEST(DocumentSymbolsTest, PragmaMarkGroups) { + TestTU TU; + TU.ExtraArgs = {"-xobjective-c++", "-Wno-objc-root-class"}; + Annotations Main(R"cpp( + $DogDef[[@interface Dog + @end]] + + $DogImpl[[@implementation Dog + + + (id)sharedDoggo { return 0; } + + #pragma $Overrides[[mark - Overrides + + - (id)init { + return self; + } + - (void)bark {}]] + + #pragma $Specifics[[mark - Dog Specifics + + - (int)isAGoodBoy { + return 1; + }]] + @]]end // FIXME: Why doesn't this include the 'end'? + + #pragma $End[[mark - End +]] + )cpp"); + TU.Code = Main.code().str(); + EXPECT_THAT( + getSymbols(TU.build()), + ElementsAre( + AllOf(WithName("Dog"), SymRange(Main.range("DogDef"))), + AllOf(WithName("Dog"), SymRange(Main.range("DogImpl")), + Children(AllOf(WithName("+sharedDoggo"), + WithKind(SymbolKind::Method)), + AllOf(WithName("Overrides"), + SymRange(Main.range("Overrides")), + Children(AllOf(WithName("-init"), + WithKind(SymbolKind::Method)), + AllOf(WithName("-bark"), + WithKind(SymbolKind::Method)))), + AllOf(WithName("Dog Specifics"), + SymRange(Main.range("Specifics")), + Children(AllOf(WithName("-isAGoodBoy"), + WithKind(SymbolKind::Method)))))), + AllOf(WithName("End"), SymRange(Main.range("End"))))); +} + +TEST(DocumentSymbolsTest, PragmaMarkGroupsNoNesting) { + TestTU TU; + TU.ExtraArgs = {"-xobjective-c++", "-Wno-objc-root-class"}; + Annotations Main(R"cpp( + #pragma mark Helpers + void helpA(id obj) {} + + #pragma mark - + #pragma mark Core + + void coreMethod() {} + )cpp"); + TU.Code = Main.code().str(); + EXPECT_THAT(getSymbols(TU.build()), + ElementsAre(AllOf(WithName("Helpers")), AllOf(WithName("helpA")), + AllOf(WithName("(unnamed group)")), + AllOf(WithName("Core")), + AllOf(WithName("coreMethod")))); +} + +TEST(DocumentSymbolsTest, SymbolsAreSorted) { + TestTU TU; + TU.ExtraArgs = {"-xobjective-c++", "-Wno-objc-root-class"}; + Annotations Main(R"cpp( + @interface MYObject + @end + + void someFunctionAbove() {} + + @implementation MYObject + - (id)init { return self; } + + void someHelperFunction() {} + + - (void)retain {} + - (void)release {} + @end + )cpp"); + TU.Code = Main.code().str(); + EXPECT_THAT(getSymbols(TU.build()), + ElementsAre(AllOf(WithName("MYObject")), + AllOf(WithName("someFunctionAbove")), + // FIXME: This should be nested under MYObject below. + AllOf(WithName("someHelperFunction")), + AllOf(WithName("MYObject"), + Children(AllOf(WithName("-init")), + AllOf(WithName("-retain")), + AllOf(WithName("-release")))))); +} + } // namespace } // namespace clangd } // namespace clang diff --git a/clang-tools-extra/clangd/unittests/ParsedASTTests.cpp b/clang-tools-extra/clangd/unittests/ParsedASTTests.cpp --- a/clang-tools-extra/clangd/unittests/ParsedASTTests.cpp +++ b/clang-tools-extra/clangd/unittests/ParsedASTTests.cpp @@ -99,6 +99,8 @@ return arg.beginOffset() == R.Begin && arg.endOffset() == R.End; } +MATCHER_P(PragmaTrivia, P, "") { return arg.Trivia == P; } + MATCHER(EqInc, "") { Inclusion Actual = testing::get<0>(arg); Inclusion Expected = testing::get<1>(arg); @@ -886,6 +888,27 @@ EXPECT_FALSE(mainIsGuarded(AST)); } +TEST(ParsedASTTest, DiscoversPragmaMarks) { + TestTU TU; + TU.AdditionalFiles["Header.h"] = R"( + #pragma mark - Something API + int something(); + #pragma mark Something else + )"; + TU.Code = R"cpp( + #include "Header.h" + #pragma mark In Preamble + #pragma mark - Something Impl + int something() { return 1; } + #pragma mark End + )cpp"; + auto AST = TU.build(); + + EXPECT_THAT(AST.getMarks(), ElementsAre(PragmaTrivia(" In Preamble"), + PragmaTrivia(" - Something Impl"), + PragmaTrivia(" End"))); +} + } // namespace } // namespace clangd } // namespace clang diff --git a/clang/include/clang/Lex/PPCallbacks.h b/clang/include/clang/Lex/PPCallbacks.h --- a/clang/include/clang/Lex/PPCallbacks.h +++ b/clang/include/clang/Lex/PPCallbacks.h @@ -492,6 +492,11 @@ Second->PragmaComment(Loc, Kind, Str); } + void PragmaMark(SourceLocation Loc, StringRef Trivia) override { + First->PragmaMark(Loc, Trivia); + Second->PragmaMark(Loc, Trivia); + } + void PragmaDetectMismatch(SourceLocation Loc, StringRef Name, StringRef Value) override { First->PragmaDetectMismatch(Loc, Name, Value);