diff options
| author | Vladislav Dzhidzhoev <vdzhidzhoev@accesssoftek.com> | 2026-02-04 00:34:52 +0100 |
|---|---|---|
| committer | GitHub <noreply@github.com> | 2026-02-04 00:34:52 +0100 |
| commit | b9cecee3fb90f5262d85e824f8e80d153e2c3a4c (patch) | |
| tree | dd6390a066a18888e4d64674b0c3e27453c4498c /llvm/lib/Bitcode/Reader | |
| parent | 3bd2ae712755c5b7f7ddc1374c24b197d53bdefe (diff) | |
| download | llvm-b9cecee3fb90f5262d85e824f8e80d153e2c3a4c.tar.gz llvm-b9cecee3fb90f5262d85e824f8e80d153e2c3a4c.tar.bz2 llvm-b9cecee3fb90f5262d85e824f8e80d153e2c3a4c.zip | |
Reland "[DebugMetadata][DwarfDebug] Support function-local types in lexical block scopes (4/7)" (#165032)
This is an attempt to merge https://reviews.llvm.org/D144006 with LTO
fix.
The last merge attempt was
https://github.com/llvm/llvm-project/pull/75385.
The issue with it was investigated in
https://github.com/llvm/llvm-project/pull/75385#issuecomment-2386684121.
The problem happens when
1. Several modules are being linked.
2. There are several DISubprograms that initially belong to different
modules but represent the same source code function (for example, a
function included from the same source code file).
3. Some of such DISubprograms survive IR linking. It may happen if one
of them is inlined somewhere or if the functions that have these
DISubprograms attached have internal linkage.
4. Each of these DISubprograms has a local type that corresponds to the
same source code type. These types are initially from different modules,
but have the same ODR identifier.
If the same (in the sense of ODR identifier/ODR uniquing rules) local
type is present in two modules, and these modules are linked together,
the type gets uniqued. A DIType, that happens to be loaded first,
survives linking, and the references on other types with the same ODR
identifier from the modules loaded later are replaced with the
references on the DIType loaded first. Since defintion subprograms, in
scope of which these types are located, are not deduplicated, the linker
output may contain multiple DISubprogram's having the same (uniqued)
type in their retainedNodes lists.
Further compilation of such modules causes crashes.
To tackle that,
* previous solution to handle LTO linking with local types in
retainedNodes is removed (cloneLocalTypes() function),
* for each loaded distinct (definition) DISubprogram, its retainedNodes
list is scanned after loading, and DITypes with a scope of another
subprogram are removed. If something from a Function corresponding to
the DISubprogram references uniqued type, we rely on cross-CU links.
Additionally:
* a check is added to Verifier to report about local types located in a
wrong retainedNodes list,
Original commit message follows.
---------
RFC https://discourse.llvm.org/t/rfc-dwarfdebug-fix-and-improve-handling-imported-entities-types-and-static-local-in-subprogram-and-lexical-block-scopes/68544
Similar to imported declarations, the patch tracks function-local types in
DISubprogram's 'retainedNodes' field. DwarfDebug is adjusted in accordance with
the aforementioned metadata change and provided a support of function-local
types scoped within a lexical block.
The patch assumes that DICompileUnit's 'enums field' no longer tracks local
types and DwarfDebug would assert if any locally-scoped types get placed there.
Authored-by: Kristina Bessonova <kbessonova@accesssoftek.com>
Co-authored-by: Jeremy Morse <jeremy.morse@sony.com>
Diffstat (limited to 'llvm/lib/Bitcode/Reader')
| -rw-r--r-- | llvm/lib/Bitcode/Reader/MetadataLoader.cpp | 178 |
1 files changed, 124 insertions, 54 deletions
diff --git a/llvm/lib/Bitcode/Reader/MetadataLoader.cpp b/llvm/lib/Bitcode/Reader/MetadataLoader.cpp index a12176d5bfdb..4bc55232a6df 100644 --- a/llvm/lib/Bitcode/Reader/MetadataLoader.cpp +++ b/llvm/lib/Bitcode/Reader/MetadataLoader.cpp @@ -116,6 +116,8 @@ public: RefsUpperBound(std::min((size_t)std::numeric_limits<unsigned>::max(), RefsUpperBound)) {} + using const_iterator = SmallVector<TrackingMDRef, 1>::const_iterator; + // vector compatibility methods unsigned size() const { return MetadataPtrs.size(); } void resize(unsigned N) { MetadataPtrs.resize(N); } @@ -124,6 +126,8 @@ public: Metadata *back() const { return MetadataPtrs.back(); } void pop_back() { MetadataPtrs.pop_back(); } bool empty() const { return MetadataPtrs.empty(); } + const_iterator begin() const { return MetadataPtrs.begin(); } + const_iterator end() const { return MetadataPtrs.end(); } Metadata *operator[](unsigned i) const { return MetadataPtrs[i]; } @@ -448,6 +452,11 @@ class MetadataLoader::MetadataLoaderImpl { /// metadata. SmallDenseMap<Function *, DISubprogram *, 16> FunctionsWithSPs; + /// retainedNodes of these subprograms should be cleaned up from incorrectly + /// scoped local types. + /// See \ref DISubprogram::cleanupRetainedNodes. + SmallVector<DISubprogram *> NewDistinctSPs; + // Map the bitcode's custom MDKind ID to the Module's MDKind ID. DenseMap<unsigned, unsigned> MDKindMap; @@ -538,56 +547,82 @@ class MetadataLoader::MetadataLoaderImpl { /// Move local imports from DICompileUnit's 'imports' field to /// DISubprogram's retainedNodes. + /// Move function-local enums from DICompileUnit's enums + /// to DISubprogram's retainedNodes. void upgradeCULocals() { - if (NamedMDNode *CUNodes = TheModule.getNamedMetadata("llvm.dbg.cu")) { - for (MDNode *N : CUNodes->operands()) { - auto *CU = dyn_cast<DICompileUnit>(N); - if (!CU) - continue; - - if (CU->getRawImportedEntities()) { - // Collect a set of imported entities to be moved. - SetVector<Metadata *> EntitiesToRemove; - for (Metadata *Op : CU->getImportedEntities()->operands()) { - auto *IE = cast<DIImportedEntity>(Op); - if (isa_and_nonnull<DILocalScope>(IE->getScope())) { - EntitiesToRemove.insert(IE); - } - } - - if (!EntitiesToRemove.empty()) { - // Make a new list of CU's 'imports'. - SmallVector<Metadata *> NewImports; - for (Metadata *Op : CU->getImportedEntities()->operands()) { - if (!EntitiesToRemove.contains(cast<DIImportedEntity>(Op))) { - NewImports.push_back(Op); - } - } + NamedMDNode *CUNodes = TheModule.getNamedMetadata("llvm.dbg.cu"); + if (!CUNodes) + return; - // Find DISubprogram corresponding to each entity. - std::map<DISubprogram *, SmallVector<Metadata *>> SPToEntities; - for (auto *I : EntitiesToRemove) { - auto *Entity = cast<DIImportedEntity>(I); - if (auto *SP = findEnclosingSubprogram( - cast<DILocalScope>(Entity->getScope()))) { - SPToEntities[SP].push_back(Entity); - } - } + // Filter out elements of ToRemove from tuple T. + auto FilterTuple = [this](MDNode *T, + const SetVector<Metadata *> &ToRemove) { + SmallVector<Metadata *> Result; + for (Metadata *Op : T->operands()) + if (!ToRemove.contains(Op)) + Result.push_back(Op); + return MDTuple::get(Context, Result); + }; - // Update DISubprograms' retainedNodes. - for (auto I = SPToEntities.begin(); I != SPToEntities.end(); ++I) { - auto *SP = I->first; - auto RetainedNodes = SP->getRetainedNodes(); - SmallVector<Metadata *> MDs(RetainedNodes.begin(), - RetainedNodes.end()); - MDs.append(I->second); - SP->replaceRetainedNodes(MDNode::get(Context, MDs)); - } + // For each CU: + // - Collect local metadata nodes from CU's imports: and enums: lists in + // MetadataToRemove set. + // - Remove metadata nodes of MetadataToRemove set from CU's imports: and + // enums: lists. + // - Group MetadataToRemove items by their parent subprograms (in + // SPToEntities map). + // - For each subprogram SP in SPToEntities: + // - Append collected local metadata nodes to SP's retainedNodes: list. + for (MDNode *N : CUNodes->operands()) { + auto *CU = dyn_cast<DICompileUnit>(N); + if (!CU) + continue; - // Remove entities with local scope from CU. - CU->replaceImportedEntities(MDTuple::get(Context, NewImports)); - } + SetVector<Metadata *> MetadataToRemove; + // Collect imported entities to be moved. + if (CU->getRawImportedEntities()) + for (Metadata *Op : CU->getImportedEntities()->operands()) { + auto *IE = cast<DIImportedEntity>(Op); + if (isa_and_nonnull<DILocalScope>(IE->getScope())) + MetadataToRemove.insert(IE); + } + // Collect enums to be moved. + if (CU->getRawEnumTypes()) + for (Metadata *Op : CU->getEnumTypes()->operands()) { + auto *Enum = cast<DICompositeType>(Op); + if (isa_and_nonnull<DILocalScope>(Enum->getScope())) + MetadataToRemove.insert(Enum); } + + if (MetadataToRemove.empty()) + continue; + + // Remove entities with local scope from CU. + if (CU->getRawImportedEntities()) + CU->replaceImportedEntities( + FilterTuple(CU->getImportedEntities().get(), MetadataToRemove)); + + // Remove enums with local scope from CU. + if (CU->getRawEnumTypes()) + CU->replaceEnumTypes( + FilterTuple(CU->getEnumTypes().get(), MetadataToRemove)); + + // Find DISubprogram corresponding to each entity. + SmallDenseMap<DISubprogram *, SmallVector<Metadata *>> SPToEntities; + for (auto *I : MetadataToRemove) { + DILocalScope *Scope = + DISubprogram::getRetainedNodeScope(cast<DINode>(I)); + if (auto *SP = findEnclosingSubprogram(Scope)) + SPToEntities[SP].push_back(I); + } + + // Update DISubprograms' retainedNodes. + for (auto I = SPToEntities.begin(); I != SPToEntities.end(); ++I) { + auto *SP = I->first; + auto RetainedNodes = SP->getRetainedNodes(); + SmallVector<Metadata *> MDs(RetainedNodes.begin(), RetainedNodes.end()); + MDs.append(I->second); + SP->replaceRetainedNodes(MDNode::get(Context, MDs)); } } @@ -703,13 +738,40 @@ class MetadataLoader::MetadataLoaderImpl { return Error::success(); } - void upgradeDebugInfo(bool ModuleLevel) { + /// Specifies which kind of debug info upgrade should be performed. + /// + /// The upgrade of compile units' enums: and imports: fields is performed + /// only when module level metadata block is loaded (i.e. all elements of + /// "llvm.dbg.cu" named metadata node are loaded). + enum class DebugInfoUpgradeMode { + /// No debug info upgrade. + None, + /// Debug info upgrade after loading function-level metadata block. + Partial, + /// Debug info upgrade after loading module-level metadata block. + ModuleLevel, + }; + + void upgradeDebugInfo(DebugInfoUpgradeMode Mode) { + if (Mode == DebugInfoUpgradeMode::None) + return; upgradeCUSubprograms(); upgradeCUVariables(); - if (ModuleLevel) + if (Mode == DebugInfoUpgradeMode::ModuleLevel) upgradeCULocals(); } + /// Prepare loaded metadata nodes to be used by loader clients. + void resolveLoadedMetadata(PlaceholderQueue &Placeholders, + DebugInfoUpgradeMode DIUpgradeMode) { + resolveForwardRefsAndPlaceholders(Placeholders); + upgradeDebugInfo(DIUpgradeMode); + DISubprogram::cleanupRetainedNodes(NewDistinctSPs); + LLVM_DEBUG(llvm::dbgs() << "Resolved loaded metadata. Cleaned up " + << NewDistinctSPs.size() << " subprogram(s).\n"); + NewDistinctSPs.clear(); + } + void callMDTypeCallback(Metadata **Val, unsigned TypeID); public: @@ -735,7 +797,8 @@ public: if (ID < (MDStringRef.size() + GlobalMetadataBitPosIndex.size())) { PlaceholderQueue Placeholders; lazyLoadOneMetadata(ID, Placeholders); - resolveForwardRefsAndPlaceholders(Placeholders); + LLVM_DEBUG(llvm::dbgs() << "\nLazy metadata loading: "); + resolveLoadedMetadata(Placeholders, DebugInfoUpgradeMode::None); return MetadataList.lookup(ID); } return MetadataList.getMetadataFwdRef(ID); @@ -1060,6 +1123,8 @@ Error MetadataLoader::MetadataLoaderImpl::parseMetadata(bool ModuleLevel) { SmallVector<uint64_t, 64> Record; PlaceholderQueue Placeholders; + auto DIUpgradeMode = ModuleLevel ? DebugInfoUpgradeMode::ModuleLevel + : DebugInfoUpgradeMode::Partial; // We lazy-load module-level metadata: we build an index for each record, and // then load individual record as needed, starting with the named metadata. @@ -1084,8 +1149,8 @@ Error MetadataLoader::MetadataLoaderImpl::parseMetadata(bool ModuleLevel) { // Reading the named metadata created forward references and/or // placeholders, that we flush here. - resolveForwardRefsAndPlaceholders(Placeholders); - upgradeDebugInfo(ModuleLevel); + LLVM_DEBUG(llvm::dbgs() << "\nNamed metadata loading: "); + resolveLoadedMetadata(Placeholders, DIUpgradeMode); // Return at the beginning of the block, since it is easy to skip it // entirely from there. Stream.ReadBlockEnd(); // Pop the abbrev block context. @@ -1115,8 +1180,8 @@ Error MetadataLoader::MetadataLoaderImpl::parseMetadata(bool ModuleLevel) { case BitstreamEntry::Error: return error("Malformed block"); case BitstreamEntry::EndBlock: - resolveForwardRefsAndPlaceholders(Placeholders); - upgradeDebugInfo(ModuleLevel); + LLVM_DEBUG(llvm::dbgs() << "\nEager metadata loading: "); + resolveLoadedMetadata(Placeholders, DIUpgradeMode); return Error::success(); case BitstreamEntry::Record: // The interesting case. @@ -1999,6 +2064,9 @@ Error MetadataLoader::MetadataLoaderImpl::parseOneMetadata( MetadataList.assignValue(SP, NextMetadataNo); NextMetadataNo++; + if (IsDistinct) + NewDistinctSPs.push_back(SP); + // Upgrade sp->function mapping to function->sp mapping. if (HasFn) { if (auto *CMD = dyn_cast_or_null<ConstantAsMetadata>(CUorFn)) @@ -2482,7 +2550,8 @@ Error MetadataLoader::MetadataLoaderImpl::parseMetadataAttachment( case BitstreamEntry::Error: return error("Malformed block"); case BitstreamEntry::EndBlock: - resolveForwardRefsAndPlaceholders(Placeholders); + LLVM_DEBUG(llvm::dbgs() << "\nAttachment metadata loading: "); + resolveLoadedMetadata(Placeholders, DebugInfoUpgradeMode::None); return Error::success(); case BitstreamEntry::Record: // The interesting case. @@ -2525,7 +2594,8 @@ Error MetadataLoader::MetadataLoaderImpl::parseMetadataAttachment( // Load the attachment if it is in the lazy-loadable range and hasn't // been loaded yet. lazyLoadOneMetadata(Idx, Placeholders); - resolveForwardRefsAndPlaceholders(Placeholders); + LLVM_DEBUG(llvm::dbgs() << "\nLazy attachment metadata loading: "); + resolveLoadedMetadata(Placeholders, DebugInfoUpgradeMode::None); } Metadata *Node = MetadataList.getMetadataFwdRef(Idx); |
