diff options
author | Simon Pilgrim <llvm-dev@redking.me.uk> | 2022-01-13 15:06:13 +0000 |
---|---|---|
committer | Simon Pilgrim <llvm-dev@redking.me.uk> | 2022-01-13 15:14:20 +0000 |
commit | ec5b63ba968973fa6b17e0bb8eec0c20aaabde2c (patch) | |
tree | 6632e15f77f52a95a1b88ada0ce53a41986ff20b | |
parent | 42185ad870cb750ede2be38cf5ac5326ab9ac424 (diff) | |
download | llvm-ec5b63ba968973fa6b17e0bb8eec0c20aaabde2c.zip llvm-ec5b63ba968973fa6b17e0bb8eec0c20aaabde2c.tar.gz llvm-ec5b63ba968973fa6b17e0bb8eec0c20aaabde2c.tar.bz2 |
[X86] Add tests showing failure to merge shuffles through xop shift binops
-rw-r--r-- | llvm/test/CodeGen/X86/xop-shifts.ll | 38 |
1 files changed, 38 insertions, 0 deletions
diff --git a/llvm/test/CodeGen/X86/xop-shifts.ll b/llvm/test/CodeGen/X86/xop-shifts.ll index 335b3ab..3916fc7 100644 --- a/llvm/test/CodeGen/X86/xop-shifts.ll +++ b/llvm/test/CodeGen/X86/xop-shifts.ll @@ -1,6 +1,10 @@ ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+xop | FileCheck %s +; +; SimplifyDemandedVectorEltsForTargetNode Handling +; + define <16 x i8> @demandedelts_vpshab(<16 x i8> %a0, <16 x i8> %a1) { ; CHECK-LABEL: demandedelts_vpshab: ; CHECK: # %bb.0: @@ -26,6 +30,40 @@ define <4 x i32> @demandedelts_vpshld(<4 x i32> %a0, <4 x i32> %a1) { ret <4 x i32> %result } +; +; isBinOp Handling (TODO) +; + +define <8 x i16> @binop_shuffle_vpshaw(<8 x i16> %a0, <8 x i16> %a1) { +; CHECK-LABEL: binop_shuffle_vpshaw: +; CHECK: # %bb.0: +; CHECK-NEXT: vpshuflw {{.*#+}} xmm0 = xmm0[3,2,1,0,4,5,6,7] +; CHECK-NEXT: vpshuflw {{.*#+}} xmm1 = xmm1[3,2,1,0,4,5,6,7] +; CHECK-NEXT: vpshlw %xmm1, %xmm0, %xmm0 +; CHECK-NEXT: vpshuflw {{.*#+}} xmm0 = xmm0[3,2,1,0,4,5,6,7] +; CHECK-NEXT: retq + %shuffle0 = shufflevector <8 x i16> %a0, <8 x i16> undef, <8 x i32> <i32 3, i32 2, i32 1, i32 0, i32 4, i32 5, i32 6, i32 7> + %shuffle1 = shufflevector <8 x i16> %a1, <8 x i16> undef, <8 x i32> <i32 3, i32 2, i32 1, i32 0, i32 4, i32 5, i32 6, i32 7> + %shift = call <8 x i16> @llvm.x86.xop.vpshlw(<8 x i16> %shuffle0, <8 x i16> %shuffle1) + %result = shufflevector <8 x i16> %shift, <8 x i16> undef, <8 x i32> <i32 3, i32 2, i32 1, i32 0, i32 4, i32 5, i32 6, i32 7> + ret <8 x i16> %result +} + +define <2 x i64> @binop_shuffle_vpshlq(<2 x i64> %a0, <2 x i64> %a1) { +; CHECK-LABEL: binop_shuffle_vpshlq: +; CHECK: # %bb.0: +; CHECK-NEXT: vpshufd {{.*#+}} xmm0 = xmm0[2,3,0,1] +; CHECK-NEXT: vpshufd {{.*#+}} xmm1 = xmm1[0,1,0,1] +; CHECK-NEXT: vpshlq %xmm1, %xmm0, %xmm0 +; CHECK-NEXT: vpshufd {{.*#+}} xmm0 = xmm0[2,3,0,1] +; CHECK-NEXT: retq + %shuffle0 = shufflevector <2 x i64> %a0, <2 x i64> undef, <2 x i32> <i32 1, i32 0> + %shuffle1 = shufflevector <2 x i64> %a1, <2 x i64> undef, <2 x i32> <i32 0, i32 0> + %shift = call <2 x i64> @llvm.x86.xop.vpshlq(<2 x i64> %shuffle0, <2 x i64> %shuffle1) + %result = shufflevector <2 x i64> %shift, <2 x i64> undef, <2 x i32> <i32 1, i32 0> + ret <2 x i64> %result +} + declare <16 x i8> @llvm.x86.xop.vpshab(<16 x i8>, <16 x i8>) nounwind readnone declare <4 x i32> @llvm.x86.xop.vpshad(<4 x i32>, <4 x i32>) nounwind readnone declare <2 x i64> @llvm.x86.xop.vpshaq(<2 x i64>, <2 x i64>) nounwind readnone |