aboutsummaryrefslogtreecommitdiff
path: root/clang-tools-extra/clangd/IncludeCleaner.cpp
diff options
context:
space:
mode:
authorKirill Bobyrev <kbobyrev@google.com>2021-11-26 16:20:40 +0100
committerKirill Bobyrev <kbobyrev@google.com>2021-11-26 16:20:48 +0100
commit34cc210aa8af2fd33598e5559d0f5b51f9423dd6 (patch)
tree1946391203317eb92d450822815da33c726c10c1 /clang-tools-extra/clangd/IncludeCleaner.cpp
parentfc0aacf324b172309ee10334e2213e1b3df8ea45 (diff)
downloadllvm-34cc210aa8af2fd33598e5559d0f5b51f9423dd6.zip
llvm-34cc210aa8af2fd33598e5559d0f5b51f9423dd6.tar.gz
llvm-34cc210aa8af2fd33598e5559d0f5b51f9423dd6.tar.bz2
[clangd] IncludeCleaner: Attribute symbols from non self-contained headers to their parents
When a symbol comes from the non self-contained header, we recursively uplift the file we consider used to the first includer that has a header guard. We need to do this while we still have FileIDs because every time a non self-contained header is included, it gets a new FileID but is later deduplicated by HeaderID and it's not possible to understand where it was included from. Based on D114370. Reviewed By: sammccall Differential Revision: https://reviews.llvm.org/D114623
Diffstat (limited to 'clang-tools-extra/clangd/IncludeCleaner.cpp')
-rw-r--r--clang-tools-extra/clangd/IncludeCleaner.cpp50
1 files changed, 40 insertions, 10 deletions
diff --git a/clang-tools-extra/clangd/IncludeCleaner.cpp b/clang-tools-extra/clangd/IncludeCleaner.cpp
index a0b9e303e..33964d9f 100644
--- a/clang-tools-extra/clangd/IncludeCleaner.cpp
+++ b/clang-tools-extra/clangd/IncludeCleaner.cpp
@@ -8,6 +8,7 @@
#include "IncludeCleaner.h"
#include "Config.h"
+#include "Headers.h"
#include "ParsedAST.h"
#include "Protocol.h"
#include "SourceCode.h"
@@ -16,6 +17,7 @@
#include "clang/AST/ExprCXX.h"
#include "clang/AST/RecursiveASTVisitor.h"
#include "clang/Basic/SourceLocation.h"
+#include "clang/Basic/SourceManager.h"
#include "clang/Lex/HeaderSearch.h"
#include "clang/Lex/Preprocessor.h"
#include "clang/Tooling/Syntax/Tokens.h"
@@ -221,6 +223,31 @@ bool mayConsiderUnused(const Inclusion &Inc, ParsedAST &AST) {
return true;
}
+// In case symbols are coming from non self-contained header, we need to find
+// its first includer that is self-contained. This is the header users can
+// include, so it will be responsible for bringing the symbols from given
+// header into the scope.
+FileID headerResponsible(FileID ID, const SourceManager &SM,
+ const IncludeStructure &Includes) {
+ // Unroll the chain of non self-contained headers until we find the one that
+ // can be included.
+ for (const FileEntry *FE = SM.getFileEntryForID(ID); ID != SM.getMainFileID();
+ FE = SM.getFileEntryForID(ID)) {
+ // If FE is nullptr, we consider it to be the responsible header.
+ if (!FE)
+ break;
+ auto HID = Includes.getID(FE);
+ assert(HID && "We're iterating over headers already existing in "
+ "IncludeStructure");
+ if (Includes.isSelfContained(*HID))
+ break;
+ // The header is not self-contained: put the responsibility for its symbols
+ // on its includer.
+ ID = SM.getFileID(SM.getIncludeLoc(ID));
+ }
+ return ID;
+}
+
} // namespace
ReferencedLocations findReferencedLocations(ParsedAST &AST) {
@@ -234,20 +261,27 @@ ReferencedLocations findReferencedLocations(ParsedAST &AST) {
llvm::DenseSet<FileID>
findReferencedFiles(const llvm::DenseSet<SourceLocation> &Locs,
- const SourceManager &SM) {
+ const IncludeStructure &Includes, const SourceManager &SM) {
std::vector<SourceLocation> Sorted{Locs.begin(), Locs.end()};
llvm::sort(Sorted); // Group by FileID.
- ReferencedFiles Result(SM);
+ ReferencedFiles Files(SM);
for (auto It = Sorted.begin(); It < Sorted.end();) {
FileID FID = SM.getFileID(*It);
- Result.add(FID, *It);
+ Files.add(FID, *It);
// Cheaply skip over all the other locations from the same FileID.
// This avoids lots of redundant Loc->File lookups for the same file.
do
++It;
while (It != Sorted.end() && SM.isInFileID(*It, FID));
}
- return std::move(Result.Files);
+ // If a header is not self-contained, we consider its symbols a logical part
+ // of the including file. Therefore, mark the parents of all used
+ // non-self-contained FileIDs as used. Perform this on FileIDs rather than
+ // HeaderIDs, as each inclusion of a non-self-contained file is distinct.
+ llvm::DenseSet<FileID> Result;
+ for (FileID ID : Files.Files)
+ Result.insert(headerResponsible(ID, SM, Includes));
+ return Result;
}
std::vector<const Inclusion *>
@@ -304,12 +338,8 @@ std::vector<const Inclusion *> computeUnusedIncludes(ParsedAST &AST) {
const auto &SM = AST.getSourceManager();
auto Refs = findReferencedLocations(AST);
- // FIXME(kirillbobyrev): Attribute the symbols from non self-contained
- // headers to their parents while the information about respective
- // SourceLocations and FileIDs is not lost. It is not possible to do that
- // later when non-guarded headers included multiple times will get same
- // HeaderID.
- auto ReferencedFileIDs = findReferencedFiles(Refs, SM);
+ auto ReferencedFileIDs = findReferencedFiles(Refs, AST.getIncludeStructure(),
+ AST.getSourceManager());
auto ReferencedHeaders =
translateToHeaderIDs(ReferencedFileIDs, AST.getIncludeStructure(), SM);
return getUnused(AST, ReferencedHeaders);