aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorSimon Pilgrim <llvm-dev@redking.me.uk>2022-08-20 14:13:38 +0100
committerSimon Pilgrim <llvm-dev@redking.me.uk>2022-08-20 14:13:44 +0100
commit8faf515a36c07e383310c7b1aa59e42a16b548bf (patch)
tree5e0c26bd080d8fb7d1e61d4f2908d3bf3592452a
parent2ede992c01c4e7faaa9649b56903f0551c190eda (diff)
downloadllvm-8faf515a36c07e383310c7b1aa59e42a16b548bf.zip
llvm-8faf515a36c07e383310c7b1aa59e42a16b548bf.tar.gz
llvm-8faf515a36c07e383310c7b1aa59e42a16b548bf.tar.bz2
[X86] Add vector test coverage of 'one-bit-diff' and/or icmp ne/eq patterns
-rw-r--r--llvm/test/CodeGen/X86/vec_setcc.ll104
1 files changed, 104 insertions, 0 deletions
diff --git a/llvm/test/CodeGen/X86/vec_setcc.ll b/llvm/test/CodeGen/X86/vec_setcc.ll
index 09d655a..faf9dc4 100644
--- a/llvm/test/CodeGen/X86/vec_setcc.ll
+++ b/llvm/test/CodeGen/X86/vec_setcc.ll
@@ -139,6 +139,110 @@ define <4 x i32> @v4i32_icmp_ule(<4 x i32> %a, <4 x i32> %b) nounwind readnone s
ret <4 x i32> %2
}
+define <16 x i8> @or_icmp_eq_const_1bit_diff(<16 x i8> %x) {
+; SSE-LABEL: or_icmp_eq_const_1bit_diff:
+; SSE: # %bb.0:
+; SSE-NEXT: movdqa {{.*#+}} xmm1 = [43,43,43,43,43,43,43,43,43,43,43,43,43,43,43,43]
+; SSE-NEXT: pcmpeqb %xmm0, %xmm1
+; SSE-NEXT: pcmpeqb {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0
+; SSE-NEXT: por %xmm1, %xmm0
+; SSE-NEXT: retq
+;
+; AVX-LABEL: or_icmp_eq_const_1bit_diff:
+; AVX: # %bb.0:
+; AVX-NEXT: vpcmpeqb {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm1
+; AVX-NEXT: vpcmpeqb {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm0
+; AVX-NEXT: vpor %xmm0, %xmm1, %xmm0
+; AVX-NEXT: retq
+ %a = icmp eq <16 x i8> %x, <i8 43, i8 43, i8 43, i8 43, i8 43, i8 43, i8 43, i8 43, i8 43, i8 43, i8 43, i8 43, i8 43, i8 43, i8 43, i8 43>
+ %b = icmp eq <16 x i8> %x, <i8 45, i8 45, i8 45, i8 45, i8 45, i8 45, i8 45, i8 45, i8 45, i8 45, i8 45, i8 45, i8 45, i8 45, i8 45, i8 45>
+ %ax = sext <16 x i1> %a to <16 x i8>
+ %bx = sext <16 x i1> %b to <16 x i8>
+ %r = or <16 x i8> %ax, %bx
+ ret <16 x i8> %r
+}
+
+define <4 x i32> @or_icmp_ne_const_1bit_diff(<4 x i32> %x) {
+; SSE-LABEL: or_icmp_ne_const_1bit_diff:
+; SSE: # %bb.0:
+; SSE-NEXT: movdqa {{.*#+}} xmm1 = [44,60,44,60]
+; SSE-NEXT: pcmpeqd %xmm0, %xmm1
+; SSE-NEXT: pcmpeqd %xmm2, %xmm2
+; SSE-NEXT: pxor %xmm2, %xmm1
+; SSE-NEXT: pcmpeqd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0
+; SSE-NEXT: pxor %xmm2, %xmm0
+; SSE-NEXT: por %xmm1, %xmm0
+; SSE-NEXT: retq
+;
+; AVX-LABEL: or_icmp_ne_const_1bit_diff:
+; AVX: # %bb.0:
+; AVX-NEXT: vpcmpeqd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm1
+; AVX-NEXT: vpcmpeqd %xmm2, %xmm2, %xmm2
+; AVX-NEXT: vpxor %xmm2, %xmm1, %xmm1
+; AVX-NEXT: vpcmpeqd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm0
+; AVX-NEXT: vpxor %xmm2, %xmm0, %xmm0
+; AVX-NEXT: vpor %xmm0, %xmm1, %xmm0
+; AVX-NEXT: retq
+ %a = icmp ne <4 x i32> %x, <i32 44, i32 60, i32 44, i32 60>
+ %b = icmp ne <4 x i32> %x, <i32 60, i32 44, i32 60, i32 44>
+ %ax = sext <4 x i1> %a to <4 x i32>
+ %bx = sext <4 x i1> %b to <4 x i32>
+ %r = or <4 x i32> %ax, %bx
+ ret <4 x i32> %r
+}
+
+define <16 x i8> @and_icmp_eq_const_1bit_diff(<16 x i8> %x) {
+; SSE-LABEL: and_icmp_eq_const_1bit_diff:
+; SSE: # %bb.0:
+; SSE-NEXT: movdqa {{.*#+}} xmm1 = [43,43,45,45,43,43,45,45,43,43,45,45,43,43,45,45]
+; SSE-NEXT: pcmpeqb %xmm0, %xmm1
+; SSE-NEXT: pcmpeqb {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0
+; SSE-NEXT: pand %xmm1, %xmm0
+; SSE-NEXT: retq
+;
+; AVX-LABEL: and_icmp_eq_const_1bit_diff:
+; AVX: # %bb.0:
+; AVX-NEXT: vpcmpeqb {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm1
+; AVX-NEXT: vpcmpeqb {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm0
+; AVX-NEXT: vpand %xmm0, %xmm1, %xmm0
+; AVX-NEXT: retq
+ %a = icmp eq <16 x i8> %x, <i8 43, i8 43, i8 45, i8 45, i8 43, i8 43, i8 45, i8 45, i8 43, i8 43, i8 45, i8 45, i8 43, i8 43, i8 45, i8 45>
+ %b = icmp eq <16 x i8> %x, <i8 45, i8 45, i8 43, i8 43, i8 45, i8 45, i8 43, i8 43, i8 45, i8 45, i8 43, i8 43, i8 45, i8 45, i8 43, i8 43>
+ %ax = sext <16 x i1> %a to <16 x i8>
+ %bx = sext <16 x i1> %b to <16 x i8>
+ %r = and <16 x i8> %ax, %bx
+ ret <16 x i8> %r
+}
+
+define <4 x i32> @and_icmp_ne_const_1bit_diff(<4 x i32> %x) {
+; SSE-LABEL: and_icmp_ne_const_1bit_diff:
+; SSE: # %bb.0:
+; SSE-NEXT: movdqa {{.*#+}} xmm1 = [44,60,54,44]
+; SSE-NEXT: pcmpeqd %xmm0, %xmm1
+; SSE-NEXT: pcmpeqd %xmm2, %xmm2
+; SSE-NEXT: pxor %xmm2, %xmm1
+; SSE-NEXT: pcmpeqd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0
+; SSE-NEXT: pxor %xmm2, %xmm0
+; SSE-NEXT: por %xmm1, %xmm0
+; SSE-NEXT: retq
+;
+; AVX-LABEL: and_icmp_ne_const_1bit_diff:
+; AVX: # %bb.0:
+; AVX-NEXT: vpcmpeqd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm1
+; AVX-NEXT: vpcmpeqd %xmm2, %xmm2, %xmm2
+; AVX-NEXT: vpxor %xmm2, %xmm1, %xmm1
+; AVX-NEXT: vpcmpeqd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm0
+; AVX-NEXT: vpxor %xmm2, %xmm0, %xmm0
+; AVX-NEXT: vpor %xmm0, %xmm1, %xmm0
+; AVX-NEXT: retq
+ %a = icmp ne <4 x i32> %x, <i32 44, i32 60, i32 54, i32 44>
+ %b = icmp ne <4 x i32> %x, <i32 60, i32 52, i32 50, i32 60>
+ %ax = sext <4 x i1> %a to <4 x i32>
+ %bx = sext <4 x i1> %b to <4 x i32>
+ %r = or <4 x i32> %ax, %bx
+ ret <4 x i32> %r
+}
+
; At one point we were incorrectly constant-folding a setcc to 0x1 instead of
; 0xff, leading to a constpool load. The instruction doesn't matter here, but it
; should set all bits to 1.