aboutsummaryrefslogtreecommitdiff
path: root/llvm/test/CodeGen/AArch64
diff options
context:
space:
mode:
authorDavid Green <david.green@arm.com>2024-03-22 09:55:18 +0000
committerDavid Green <david.green@arm.com>2024-03-22 09:55:18 +0000
commit99d8c25b3104fc07f46532bd681515c5f3c71133 (patch)
treed75eb14d1cffd34b14bd91e05a778770c6cf989f /llvm/test/CodeGen/AArch64
parent5f1b2cffe5fab0aa733fc8d5f1546c1c800faac4 (diff)
downloadllvm-99d8c25b3104fc07f46532bd681515c5f3c71133.zip
llvm-99d8c25b3104fc07f46532bd681515c5f3c71133.tar.gz
llvm-99d8c25b3104fc07f46532bd681515c5f3c71133.tar.bz2
[AArch64] Extra tests for v2i8 concat loads. NFC
Diffstat (limited to 'llvm/test/CodeGen/AArch64')
-rw-r--r--llvm/test/CodeGen/AArch64/insert-subvector.ll129
1 files changed, 127 insertions, 2 deletions
diff --git a/llvm/test/CodeGen/AArch64/insert-subvector.ll b/llvm/test/CodeGen/AArch64/insert-subvector.ll
index d7656e1..95ad980 100644
--- a/llvm/test/CodeGen/AArch64/insert-subvector.ll
+++ b/llvm/test/CodeGen/AArch64/insert-subvector.ll
@@ -374,6 +374,131 @@ define <16 x i8> @load_v16i8_8_2(float %tmp, <16 x i8> %b, ptr %a) {
ret <16 x i8> %s2
}
+define <8 x i8> @load_v8i8_2_1(float %tmp, <8 x i8> %b, ptr %a) {
+; CHECK-LABEL: load_v8i8_2_1:
+; CHECK: // %bb.0:
+; CHECK-NEXT: ld1 { v2.b }[0], [x0]
+; CHECK-NEXT: add x8, x0, #1
+; CHECK-NEXT: mov v0.16b, v2.16b
+; CHECK-NEXT: ld1 { v0.b }[4], [x8]
+; CHECK-NEXT: mov v2.b[1], v0.b[4]
+; CHECK-NEXT: fmov d0, d1
+; CHECK-NEXT: mov v0.h[0], v2.h[0]
+; CHECK-NEXT: // kill: def $d0 killed $d0 killed $q0
+; CHECK-NEXT: ret
+ %l = load <2 x i8>, ptr %a
+ %s1 = shufflevector <2 x i8> %l, <2 x i8> poison, <8 x i32> <i32 0, i32 1, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef>
+ %s2 = shufflevector <8 x i8> %s1, <8 x i8> %b, <8 x i32> <i32 0, i32 1, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
+ ret <8 x i8> %s2
+}
+
+define <8 x i8> @load_v8i8_2_15(float %tmp, <8 x i8> %b, ptr %a) {
+; CHECK-LABEL: load_v8i8_2_15:
+; CHECK: // %bb.0:
+; CHECK-NEXT: ld1 { v0.b }[0], [x0]
+; CHECK-NEXT: add x8, x0, #1
+; CHECK-NEXT: // kill: def $d1 killed $d1 def $q1
+; CHECK-NEXT: ld1 { v0.b }[4], [x8]
+; CHECK-NEXT: adrp x8, .LCPI33_0
+; CHECK-NEXT: mov v0.b[1], v0.b[4]
+; CHECK-NEXT: mov v0.d[1], v1.d[0]
+; CHECK-NEXT: ldr d1, [x8, :lo12:.LCPI33_0]
+; CHECK-NEXT: tbl v0.8b, { v0.16b }, v1.8b
+; CHECK-NEXT: ret
+ %l = load <2 x i8>, ptr %a
+ %s1 = shufflevector <2 x i8> %l, <2 x i8> poison, <8 x i32> <i32 0, i32 1, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef>
+ %s2 = shufflevector <8 x i8> %s1, <8 x i8> %b, <8 x i32> <i32 8, i32 0, i32 1, i32 11, i32 12, i32 13, i32 14, i32 15>
+ ret <8 x i8> %s2
+}
+
+define <8 x i8> @load_v8i8_2_2(float %tmp, <8 x i8> %b, ptr %a) {
+; CHECK-LABEL: load_v8i8_2_2:
+; CHECK: // %bb.0:
+; CHECK-NEXT: ld1 { v2.b }[0], [x0]
+; CHECK-NEXT: add x8, x0, #1
+; CHECK-NEXT: mov v0.16b, v2.16b
+; CHECK-NEXT: ld1 { v0.b }[4], [x8]
+; CHECK-NEXT: mov v2.b[1], v0.b[4]
+; CHECK-NEXT: fmov d0, d1
+; CHECK-NEXT: mov v0.h[1], v2.h[0]
+; CHECK-NEXT: // kill: def $d0 killed $d0 killed $q0
+; CHECK-NEXT: ret
+ %l = load <2 x i8>, ptr %a
+ %s1 = shufflevector <2 x i8> %l, <2 x i8> poison, <8 x i32> <i32 0, i32 1, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef>
+ %s2 = shufflevector <8 x i8> %s1, <8 x i8> %b, <8 x i32> <i32 8, i32 9, i32 0, i32 1, i32 12, i32 13, i32 14, i32 15>
+ ret <8 x i8> %s2
+}
+
+define <8 x i8> @load_v8i8_2_3(float %tmp, <8 x i8> %b, ptr %a) {
+; CHECK-LABEL: load_v8i8_2_3:
+; CHECK: // %bb.0:
+; CHECK-NEXT: ld1 { v2.b }[0], [x0]
+; CHECK-NEXT: add x8, x0, #1
+; CHECK-NEXT: mov v0.16b, v2.16b
+; CHECK-NEXT: ld1 { v0.b }[4], [x8]
+; CHECK-NEXT: mov v2.b[1], v0.b[4]
+; CHECK-NEXT: fmov d0, d1
+; CHECK-NEXT: mov v0.h[2], v2.h[0]
+; CHECK-NEXT: // kill: def $d0 killed $d0 killed $q0
+; CHECK-NEXT: ret
+ %l = load <2 x i8>, ptr %a
+ %s1 = shufflevector <2 x i8> %l, <2 x i8> poison, <8 x i32> <i32 0, i32 1, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef>
+ %s2 = shufflevector <8 x i8> %s1, <8 x i8> %b, <8 x i32> <i32 8, i32 9, i32 10, i32 11, i32 0, i32 1, i32 14, i32 15>
+ ret <8 x i8> %s2
+}
+
+define <8 x i8> @load_v8i8_2_4(float %tmp, <8 x i8> %b, ptr %a) {
+; CHECK-LABEL: load_v8i8_2_4:
+; CHECK: // %bb.0:
+; CHECK-NEXT: ld1 { v2.b }[0], [x0]
+; CHECK-NEXT: add x8, x0, #1
+; CHECK-NEXT: mov v0.16b, v2.16b
+; CHECK-NEXT: ld1 { v0.b }[4], [x8]
+; CHECK-NEXT: mov v2.b[1], v0.b[4]
+; CHECK-NEXT: fmov d0, d1
+; CHECK-NEXT: mov v0.h[3], v2.h[0]
+; CHECK-NEXT: // kill: def $d0 killed $d0 killed $q0
+; CHECK-NEXT: ret
+ %l = load <2 x i8>, ptr %a
+ %s1 = shufflevector <2 x i8> %l, <2 x i8> poison, <8 x i32> <i32 0, i32 1, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef>
+ %s2 = shufflevector <8 x i8> %s1, <8 x i8> %b, <8 x i32> <i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 0, i32 1>
+ ret <8 x i8> %s2
+}
+
+define <4 x i8> @load_v4i8_2_1(float %tmp, <4 x i8> %b, ptr %a) {
+; CHECK-LABEL: load_v4i8_2_1:
+; CHECK: // %bb.0:
+; CHECK-NEXT: ld1 { v0.b }[0], [x0]
+; CHECK-NEXT: add x8, x0, #1
+; CHECK-NEXT: // kill: def $d1 killed $d1 def $q1
+; CHECK-NEXT: ld1 { v0.b }[4], [x8]
+; CHECK-NEXT: uzp1 v0.4h, v0.4h, v0.4h
+; CHECK-NEXT: mov v0.s[1], v1.s[1]
+; CHECK-NEXT: // kill: def $d0 killed $d0 killed $q0
+; CHECK-NEXT: ret
+ %l = load <2 x i8>, ptr %a
+ %s1 = shufflevector <2 x i8> %l, <2 x i8> poison, <4 x i32> <i32 0, i32 1, i32 undef, i32 undef>
+ %s2 = shufflevector <4 x i8> %s1, <4 x i8> %b, <4 x i32> <i32 0, i32 1, i32 6, i32 7>
+ ret <4 x i8> %s2
+}
+
+define <4 x i8> @load_v4i8_2_2(float %tmp, <4 x i8> %b, ptr %a) {
+; CHECK-LABEL: load_v4i8_2_2:
+; CHECK: // %bb.0:
+; CHECK-NEXT: ld1 { v0.b }[0], [x0]
+; CHECK-NEXT: add x8, x0, #1
+; CHECK-NEXT: ld1 { v0.b }[4], [x8]
+; CHECK-NEXT: uzp1 v2.4h, v0.4h, v0.4h
+; CHECK-NEXT: fmov d0, d1
+; CHECK-NEXT: mov v0.s[1], v2.s[0]
+; CHECK-NEXT: // kill: def $d0 killed $d0 killed $q0
+; CHECK-NEXT: ret
+ %l = load <2 x i8>, ptr %a
+ %s1 = shufflevector <2 x i8> %l, <2 x i8> poison, <4 x i32> <i32 0, i32 1, i32 undef, i32 undef>
+ %s2 = shufflevector <4 x i8> %s1, <4 x i8> %b, <4 x i32> <i32 4, i32 5, i32 0, i32 1>
+ ret <4 x i8> %s2
+}
+
; i16
define <8 x i16> @load_v8i16_2_1(float %tmp, <8 x i16> %b, ptr %a) {
@@ -400,10 +525,10 @@ define <8 x i16> @load_v8i16_2_15(float %tmp, <8 x i16> %b, ptr %a) {
; CHECK-NEXT: add x9, x0, #2
; CHECK-NEXT: // kill: def $q1 killed $q1 def $q0_q1
; CHECK-NEXT: fmov s2, w8
-; CHECK-NEXT: adrp x8, .LCPI33_0
+; CHECK-NEXT: adrp x8, .LCPI40_0
; CHECK-NEXT: ld1 { v2.h }[2], [x9]
; CHECK-NEXT: xtn v0.4h, v2.4s
-; CHECK-NEXT: ldr q2, [x8, :lo12:.LCPI33_0]
+; CHECK-NEXT: ldr q2, [x8, :lo12:.LCPI40_0]
; CHECK-NEXT: tbl v0.16b, { v0.16b, v1.16b }, v2.16b
; CHECK-NEXT: ret
%l = load <2 x i16>, ptr %a