diff options
author | DaPorkchop_ <daporkchop@daporkchop.net> | 2024-06-08 15:32:34 +0200 |
---|---|---|
committer | GitHub <noreply@github.com> | 2024-06-08 21:32:34 +0800 |
commit | 540f68c44f4813c2c16f92ccbba5a15e8ff87c85 (patch) | |
tree | 3e907a1604b10fbdbb71b31a5d586cefa3f437c8 /llvm/lib/Transforms/Utils/SimplifyCFG.cpp | |
parent | d4eed43badfcaba044b038b704b57ea130fd5e15 (diff) | |
download | llvm-540f68c44f4813c2c16f92ccbba5a15e8ff87c85.zip llvm-540f68c44f4813c2c16f92ccbba5a15e8ff87c85.tar.gz llvm-540f68c44f4813c2c16f92ccbba5a15e8ff87c85.tar.bz2 |
[SimplifyCFG] Don't use a mask for lookup tables generated from switches with an unreachable default case (#94468)
When transforming a switch with holes into a lookup table, we currently
use a mask to check if the current index is handled by the switch or if
it is a hole. If it is a hole, we skip loading from the lookup table.
Normally, if the switch's default case is unreachable this has no
impact, as the mask test gets optimized away by subsequent passes.
However, if the switch is large enough that the number of lookup table
entries exceeds the target's register width, we won't be able to fit all
the cases into a mask and the switch won't get transformed into a lookup
table. If we know that the switch's default case is unreachable, we know
that the mask is unnecessary and can skip constructing it entirely,
which allows us to transform the switch into a lookup table.
[Example](https://godbolt.org/z/7x7qfx8M1)
In the future, it might be interesting to consider allowing lookup table
masks to be more than one register large (e.g. using a constant array of
bit flags, similar to `std::bitset`).
Diffstat (limited to 'llvm/lib/Transforms/Utils/SimplifyCFG.cpp')
-rw-r--r-- | llvm/lib/Transforms/Utils/SimplifyCFG.cpp | 30 |
1 files changed, 21 insertions, 9 deletions
diff --git a/llvm/lib/Transforms/Utils/SimplifyCFG.cpp b/llvm/lib/Transforms/Utils/SimplifyCFG.cpp index fe6ec88..292739b 100644 --- a/llvm/lib/Transforms/Utils/SimplifyCFG.cpp +++ b/llvm/lib/Transforms/Utils/SimplifyCFG.cpp @@ -6743,8 +6743,25 @@ static bool SwitchToLookupTable(SwitchInst *SI, IRBuilder<> &Builder, TableSize = (MaxCaseVal->getValue() - MinCaseVal->getValue()).getLimitedValue() + 1; + // If the default destination is unreachable, or if the lookup table covers + // all values of the conditional variable, branch directly to the lookup table + // BB. Otherwise, check that the condition is within the case range. + bool DefaultIsReachable = !SI->defaultDestUndefined(); + bool TableHasHoles = (NumResults < TableSize); - bool NeedMask = (TableHasHoles && !HasDefaultResults); + + // If the table has holes but the default destination doesn't produce any + // constant results, the lookup table entries corresponding to the holes will + // contain undefined values. + bool AllHolesAreUndefined = TableHasHoles && !HasDefaultResults; + + // If the default destination doesn't produce a constant result but is still + // reachable, and the lookup table has holes, we need to use a mask to + // determine if the current index should load from the lookup table or jump + // to the default case. + // The mask is unnecessary if the table has holes but the default destination + // is unreachable, as in that case the holes must also be unreachable. + bool NeedMask = AllHolesAreUndefined && DefaultIsReachable; if (NeedMask) { // As an extra penalty for the validity test we require more cases. if (SI->getNumCases() < 4) // FIXME: Find best threshold value (benchmark). @@ -6766,12 +6783,6 @@ static bool SwitchToLookupTable(SwitchInst *SI, IRBuilder<> &Builder, "It is impossible for a switch to have more entries than the max " "representable value of its input integer type's size."); - // If the default destination is unreachable, or if the lookup table covers - // all values of the conditional variable, branch directly to the lookup table - // BB. Otherwise, check that the condition is within the case range. - bool DefaultIsReachable = - !isa<UnreachableInst>(SI->getDefaultDest()->getFirstNonPHIOrDbg()); - // Create the BB that does the lookups. Module &Mod = *CommonDest->getParent()->getParent(); BasicBlock *LookupBB = BasicBlock::Create( @@ -6895,8 +6906,9 @@ static bool SwitchToLookupTable(SwitchInst *SI, IRBuilder<> &Builder, for (PHINode *PHI : PHIs) { const ResultListTy &ResultList = ResultLists[PHI]; - // If using a bitmask, use any value to fill the lookup table holes. - Constant *DV = NeedMask ? ResultLists[PHI][0].second : DefaultResults[PHI]; + // Use any value to fill the lookup table holes. + Constant *DV = + AllHolesAreUndefined ? ResultLists[PHI][0].second : DefaultResults[PHI]; StringRef FuncName = Fn->getName(); SwitchLookupTable Table(Mod, TableSize, TableIndexOffset, ResultList, DV, DL, FuncName); |