aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorAlexey Bataev <a.bataev@outlook.com>2025-04-15 07:18:47 -0700
committerAlexey Bataev <a.bataev@outlook.com>2025-04-15 07:24:17 -0700
commit57025b42c43b2f14f7e58692bc19cd53d1b8a45e (patch)
tree081075b3c5e30ecab1187d71c3c655eb524239eb
parent552902455c7a3958930d4607ac8b85fd39d7c8a3 (diff)
downloadllvm-57025b42c43b2f14f7e58692bc19cd53d1b8a45e.zip
llvm-57025b42c43b2f14f7e58692bc19cd53d1b8a45e.tar.gz
llvm-57025b42c43b2f14f7e58692bc19cd53d1b8a45e.tar.bz2
[SLP]Mark smin reduction as signed compare
Reduction signed min must be marked as signed compare, fixing the analysis for the cases, where the incoming arguments are unsigned. Fixes #133943
-rw-r--r--llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp4
-rw-r--r--llvm/test/Transforms/SLPVectorizer/RISCV/smin-reduction-unsigned-missing-sign.ll5
2 files changed, 7 insertions, 2 deletions
diff --git a/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp b/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp
index 50c4039..f7c37d8 100644
--- a/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp
+++ b/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp
@@ -20170,6 +20170,10 @@ void BoUpSLP::computeMinimumValueSizes() {
IsTruncRoot = true;
}
bool IsSignedCmp = false;
+ if (UserIgnoreList && all_of(*UserIgnoreList, [](Value *V) {
+ return match(V, m_SMin(m_Value(), m_Value()));
+ }))
+ IsSignedCmp = true;
while (NodeIdx < VectorizableTree.size()) {
ArrayRef<Value *> TreeRoot = VectorizableTree[NodeIdx]->Scalars;
unsigned Limit = 2;
diff --git a/llvm/test/Transforms/SLPVectorizer/RISCV/smin-reduction-unsigned-missing-sign.ll b/llvm/test/Transforms/SLPVectorizer/RISCV/smin-reduction-unsigned-missing-sign.ll
index 67f5ccc..cf7127e 100644
--- a/llvm/test/Transforms/SLPVectorizer/RISCV/smin-reduction-unsigned-missing-sign.ll
+++ b/llvm/test/Transforms/SLPVectorizer/RISCV/smin-reduction-unsigned-missing-sign.ll
@@ -7,8 +7,9 @@ define i32 @test(i8 %0) {
; CHECK-NEXT: [[ENTRY:.*:]]
; CHECK-NEXT: [[TMP1:%.*]] = insertelement <4 x i8> <i8 poison, i8 0, i8 0, i8 0>, i8 [[TMP0]], i32 0
; CHECK-NEXT: [[TMP2:%.*]] = icmp ne <4 x i8> [[TMP1]], zeroinitializer
-; CHECK-NEXT: [[TMP3:%.*]] = call i1 @llvm.vector.reduce.smin.v4i1(<4 x i1> [[TMP2]])
-; CHECK-NEXT: [[TMP4:%.*]] = zext i1 [[TMP3]] to i32
+; CHECK-NEXT: [[TMP3:%.*]] = zext <4 x i1> [[TMP2]] to <4 x i8>
+; CHECK-NEXT: [[TMP5:%.*]] = call i8 @llvm.vector.reduce.smin.v4i8(<4 x i8> [[TMP3]])
+; CHECK-NEXT: [[TMP4:%.*]] = zext i8 [[TMP5]] to i32
; CHECK-NEXT: ret i32 [[TMP4]]
;
entry: