diff options
-rw-r--r-- | llvm/test/Transforms/SLPVectorizer/X86/minbitwidth-node-with-multi-users.ll | 69 |
1 files changed, 69 insertions, 0 deletions
diff --git a/llvm/test/Transforms/SLPVectorizer/X86/minbitwidth-node-with-multi-users.ll b/llvm/test/Transforms/SLPVectorizer/X86/minbitwidth-node-with-multi-users.ll new file mode 100644 index 0000000..958761484 --- /dev/null +++ b/llvm/test/Transforms/SLPVectorizer/X86/minbitwidth-node-with-multi-users.ll @@ -0,0 +1,69 @@ +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 4 +; RUN: opt -S --passes=slp-vectorizer -mtriple=x86_64-unknown-linux-gnu < %s | FileCheck %s + +define void @test() { +; CHECK-LABEL: define void @test() { +; CHECK-NEXT: entry: +; CHECK-NEXT: [[TMP0:%.*]] = load i16, ptr null, align 2 +; CHECK-NEXT: [[TMP1:%.*]] = and i8 0, 1 +; CHECK-NEXT: [[TMP2:%.*]] = and i32 0, 0 +; CHECK-NEXT: [[TMP3:%.*]] = select i1 false, i32 0, i32 0 +; CHECK-NEXT: [[TMP4:%.*]] = insertelement <4 x i8> <i8 poison, i8 0, i8 poison, i8 poison>, i8 [[TMP1]], i32 0 +; CHECK-NEXT: [[TMP5:%.*]] = shufflevector <4 x i8> [[TMP4]], <4 x i8> poison, <4 x i32> <i32 0, i32 0, i32 0, i32 1> +; CHECK-NEXT: [[TMP6:%.*]] = trunc <4 x i8> [[TMP5]] to <4 x i1> +; CHECK-NEXT: [[TMP7:%.*]] = zext <4 x i1> [[TMP6]] to <4 x i32> +; CHECK-NEXT: [[TMP8:%.*]] = shufflevector <4 x i8> [[TMP4]], <4 x i8> poison, <4 x i32> zeroinitializer +; CHECK-NEXT: [[TMP9:%.*]] = or <4 x i8> [[TMP8]], zeroinitializer +; CHECK-NEXT: [[TMP10:%.*]] = sext <4 x i8> [[TMP9]] to <4 x i32> +; CHECK-NEXT: [[TMP11:%.*]] = zext <4 x i1> [[TMP6]] to <4 x i32> +; CHECK-NEXT: [[TMP12:%.*]] = or <4 x i32> zeroinitializer, [[TMP11]] +; CHECK-NEXT: [[TMP13:%.*]] = icmp eq <4 x i32> [[TMP10]], [[TMP12]] +; CHECK-NEXT: [[TMP14:%.*]] = shufflevector <4 x i32> <i32 0, i32 0, i32 poison, i32 0>, <4 x i32> [[TMP7]], <4 x i32> <i32 0, i32 1, i32 6, i32 3> +; CHECK-NEXT: [[TMP15:%.*]] = select <4 x i1> [[TMP13]], <4 x i32> [[TMP14]], <4 x i32> zeroinitializer +; CHECK-NEXT: [[TMP16:%.*]] = trunc <4 x i32> [[TMP15]] to <4 x i1> +; CHECK-NEXT: [[TMP17:%.*]] = call i1 @llvm.vector.reduce.and.v4i1(<4 x i1> [[TMP16]]) +; CHECK-NEXT: [[TMP18:%.*]] = zext i1 [[TMP17]] to i32 +; CHECK-NEXT: [[OP_RDX:%.*]] = and i32 0, [[TMP18]] +; CHECK-NEXT: store i32 [[OP_RDX]], ptr null, align 4 +; CHECK-NEXT: ret void +; +entry: + %0 = load i16, ptr null, align 2 + %1 = and i8 0, 1 + %2 = and i32 0, 0 + %3 = select i1 false, i32 0, i32 0 + %i2 = sext i8 %1 to i32 + %i3 = or i8 %1, 0 + %i4 = sext i8 %i3 to i32 + %i5 = or i32 0, %i2 + %b1 = icmp eq i32 %i4, %i5 + %a1 = select i1 %b1, i32 0, i32 0 + %4 = and i32 %a1, 0 + %s1 = and i32 %4, 0 + %i8 = sext i8 %1 to i32 + %i9 = or i8 %1, 0 + %i10 = sext i8 %i9 to i32 + %i11 = or i32 0, %i8 + %b2 = icmp eq i32 %i10, %i11 + %a2 = select i1 %b2, i32 0, i32 0 + %5 = and i32 %a2, 0 + %s2 = and i32 %5, %s1 + %i14 = sext i8 %1 to i32 + %i15 = or i8 %1, 0 + %i16 = sext i8 %i15 to i32 + %i17 = or i32 0, %i14 + %b3 = icmp eq i32 %i16, %i17 + %a3 = select i1 %b3, i32 %i14, i32 0 + %6 = and i32 %a3, 0 + %s3 = and i32 %6, %s2 + %i20 = sext i8 0 to i32 + %i21 = or i8 %1, 0 + %i22 = sext i8 %i21 to i32 + %i23 = or i32 0, %i20 + %b4 = icmp eq i32 %i22, %i23 + %a4 = select i1 %b4, i32 0, i32 0 + %7 = and i32 %a4, 0 + %s4 = and i32 %7, %s3 + store i32 %s4, ptr null, align 4 + ret void +} |