; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py ; RUN: llc < %s -mtriple=x86_64-- -mattr=+movrs,+avx10.2-256 -verify-machineinstrs --show-mc-encoding | FileCheck %s --check-prefixes=CHECK define <2 x i64> @test_mm_movrsb_epu8(ptr %__A) { ; CHECK-LABEL: test_mm_movrsb_epu8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vmovrsb (%rdi), %xmm0 # encoding: [0x62,0xf5,0x7f,0x08,0x6f,0x07] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <16 x i8> @llvm.x86.avx10.vmovrsb128(ptr %__A) %1 = bitcast <16 x i8> %0 to <2 x i64> ret <2 x i64> %1 } define <2 x i64> @test_mm_mask_movrsb_epu8(<2 x i64> %__A, i16 zeroext %__B, ptr %__C) { ; CHECK-LABEL: test_mm_mask_movrsb_epu8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] ; CHECK-NEXT: vmovrsb (%rsi), %xmm0 {%k1} # encoding: [0x62,0xf5,0x7f,0x09,0x6f,0x06] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <16 x i8> @llvm.x86.avx10.vmovrsb128(ptr %__C) %1 = bitcast <2 x i64> %__A to <16 x i8> %2 = bitcast i16 %__B to <16 x i1> %3 = select <16 x i1> %2, <16 x i8> %0, <16 x i8> %1 %4 = bitcast <16 x i8> %3 to <2 x i64> ret <2 x i64> %4 } define <2 x i64> @test_mm_maskz_movrsb_epu8(i16 zeroext %__A, ptr %__B) { ; CHECK-LABEL: test_mm_maskz_movrsb_epu8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] ; CHECK-NEXT: vmovrsb (%rsi), %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7f,0x89,0x6f,0x06] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <16 x i8> @llvm.x86.avx10.vmovrsb128(ptr %__B ) %1 = bitcast i16 %__A to <16 x i1> %2 = select <16 x i1> %1, <16 x i8> %0, <16 x i8> zeroinitializer %3 = bitcast <16 x i8> %2 to <2 x i64> ret <2 x i64> %3 } define <4 x i64> @test_mm256_movrsb_epu8(ptr %__A) { ; CHECK-LABEL: test_mm256_movrsb_epu8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vmovrsb (%rdi), %ymm0 # encoding: [0x62,0xf5,0x7f,0x28,0x6f,0x07] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <32 x i8> @llvm.x86.avx10.vmovrsb256(ptr %__A) %1 = bitcast <32 x i8> %0 to <4 x i64> ret <4 x i64> %1 } define <4 x i64> @test_mm256_mask_movrsb_epu8(<4 x i64> %__A, i32 %__B, ptr %__C) { ; CHECK-LABEL: test_mm256_mask_movrsb_epu8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] ; CHECK-NEXT: vmovrsb (%rsi), %ymm0 {%k1} # encoding: [0x62,0xf5,0x7f,0x29,0x6f,0x06] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <32 x i8> @llvm.x86.avx10.vmovrsb256(ptr %__C) %1 = bitcast <4 x i64> %__A to <32 x i8> %2 = bitcast i32 %__B to <32 x i1> %3 = select <32 x i1> %2, <32 x i8> %0, <32 x i8> %1 %4 = bitcast <32 x i8> %3 to <4 x i64> ret <4 x i64> %4 } define <4 x i64> @test_mm256_maskz_movrsb_epu8(i32 %__A, ptr %__B) { ; CHECK-LABEL: test_mm256_maskz_movrsb_epu8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] ; CHECK-NEXT: vmovrsb (%rsi), %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7f,0xa9,0x6f,0x06] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <32 x i8> @llvm.x86.avx10.vmovrsb256(ptr %__B) %1 = bitcast i32 %__A to <32 x i1> %2 = select <32 x i1> %1, <32 x i8> %0, <32 x i8> zeroinitializer %3 = bitcast <32 x i8> %2 to <4 x i64> ret <4 x i64> %3 } define <2 x i64> @test_mm_movrsd_epu32(ptr %__A) { ; CHECK-LABEL: test_mm_movrsd_epu32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vmovrsd (%rdi), %xmm0 # encoding: [0x62,0xf5,0x7e,0x08,0x6f,0x07] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <4 x i32> @llvm.x86.avx10.vmovrsd128(ptr %__A) %1 = bitcast <4 x i32> %0 to <2 x i64> ret <2 x i64> %1 } define <2 x i64> @test_mm_mask_movrsd_epu32(<2 x i64> %__A, i8 zeroext %__B, ptr %__C) { ; CHECK-LABEL: test_mm_mask_movrsd_epu32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] ; CHECK-NEXT: vmovrsd (%rsi), %xmm0 {%k1} # encoding: [0x62,0xf5,0x7e,0x09,0x6f,0x06] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <4 x i32> @llvm.x86.avx10.vmovrsd128(ptr %__C) %1 = bitcast <2 x i64> %__A to <4 x i32> %2 = bitcast i8 %__B to <8 x i1> %extract.i = shufflevector <8 x i1> %2, <8 x i1> poison, <4 x i32> %3 = select <4 x i1> %extract.i, <4 x i32> %0, <4 x i32> %1 %4 = bitcast <4 x i32> %3 to <2 x i64> ret <2 x i64> %4 } define <2 x i64> @test_mm_maskz_movrsd_epu32(i8 zeroext %__A, ptr %__B) { ; CHECK-LABEL: test_mm_maskz_movrsd_epu32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] ; CHECK-NEXT: vmovrsd (%rsi), %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7e,0x89,0x6f,0x06] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <4 x i32> @llvm.x86.avx10.vmovrsd128(ptr %__B) %1 = bitcast i8 %__A to <8 x i1> %extract.i = shufflevector <8 x i1> %1, <8 x i1> poison, <4 x i32> %2 = select <4 x i1> %extract.i, <4 x i32> %0, <4 x i32> zeroinitializer %3 = bitcast <4 x i32> %2 to <2 x i64> ret <2 x i64> %3 } define <4 x i64> @test_mm256_movrsd_epu32(ptr %__A) { ; CHECK-LABEL: test_mm256_movrsd_epu32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vmovrsd (%rdi), %ymm0 # encoding: [0x62,0xf5,0x7e,0x28,0x6f,0x07] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <8 x i32> @llvm.x86.avx10.vmovrsd256(ptr %__A) %1 = bitcast <8 x i32> %0 to <4 x i64> ret <4 x i64> %1 } define <4 x i64> @test_mm256_mask_movrsd_epu32(<4 x i64> %__A, i8 zeroext %__B, ptr %__C) { ; CHECK-LABEL: test_mm256_mask_movrsd_epu32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] ; CHECK-NEXT: vmovrsd (%rsi), %ymm0 {%k1} # encoding: [0x62,0xf5,0x7e,0x29,0x6f,0x06] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <8 x i32> @llvm.x86.avx10.vmovrsd256(ptr %__C) %1 = bitcast <4 x i64> %__A to <8 x i32> %2 = bitcast i8 %__B to <8 x i1> %3 = select <8 x i1> %2, <8 x i32> %0, <8 x i32> %1 %4 = bitcast <8 x i32> %3 to <4 x i64> ret <4 x i64> %4 } define <4 x i64> @test_mm256_maskz_movrsd_epu32(i8 zeroext %__A, ptr %__B) { ; CHECK-LABEL: test_mm256_maskz_movrsd_epu32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] ; CHECK-NEXT: vmovrsd (%rsi), %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7e,0xa9,0x6f,0x06] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <8 x i32> @llvm.x86.avx10.vmovrsd256(ptr %__B) %1 = bitcast i8 %__A to <8 x i1> %2 = select <8 x i1> %1, <8 x i32> %0, <8 x i32> zeroinitializer %3 = bitcast <8 x i32> %2 to <4 x i64> ret <4 x i64> %3 } define <2 x i64> @test_mm_movrsq_epu64(ptr %__A) { ; CHECK-LABEL: test_mm_movrsq_epu64: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vmovrsq (%rdi), %xmm0 # encoding: [0x62,0xf5,0xfe,0x08,0x6f,0x07] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <2 x i64> @llvm.x86.avx10.vmovrsq128(ptr %__A) ret <2 x i64> %0 } define <2 x i64> @test_mm_mask_movrsq_epu64(<2 x i64> %__A, i8 zeroext %__B, ptr %__C) { ; CHECK-LABEL: test_mm_mask_movrsq_epu64: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] ; CHECK-NEXT: vmovrsq (%rsi), %xmm0 {%k1} # encoding: [0x62,0xf5,0xfe,0x09,0x6f,0x06] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <2 x i64> @llvm.x86.avx10.vmovrsq128(ptr %__C) %1 = bitcast i8 %__B to <8 x i1> %extract.i = shufflevector <8 x i1> %1, <8 x i1> poison, <2 x i32> %2 = select <2 x i1> %extract.i, <2 x i64> %0, <2 x i64> %__A ret <2 x i64> %2 } define <2 x i64> @test_mm_maskz_movrsq_epu64(i8 zeroext %__A, ptr %__B) { ; CHECK-LABEL: test_mm_maskz_movrsq_epu64: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] ; CHECK-NEXT: vmovrsq (%rsi), %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0xfe,0x89,0x6f,0x06] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <2 x i64> @llvm.x86.avx10.vmovrsq128(ptr %__B) %1 = bitcast i8 %__A to <8 x i1> %extract.i = shufflevector <8 x i1> %1, <8 x i1> poison, <2 x i32> %2 = select <2 x i1> %extract.i, <2 x i64> %0, <2 x i64> zeroinitializer ret <2 x i64> %2 } define <4 x i64> @test_mm256_movrsq_epu64(ptr %__A) { ; CHECK-LABEL: test_mm256_movrsq_epu64: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vmovrsq (%rdi), %ymm0 # encoding: [0x62,0xf5,0xfe,0x28,0x6f,0x07] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <4 x i64> @llvm.x86.avx10.vmovrsq256(ptr %__A) ret <4 x i64> %0 } define <4 x i64> @test_mm256_mask_movrsq_epu64(<4 x i64> %__A, i8 zeroext %__B, ptr %__C) { ; CHECK-LABEL: test_mm256_mask_movrsq_epu64: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] ; CHECK-NEXT: vmovrsq (%rsi), %ymm0 {%k1} # encoding: [0x62,0xf5,0xfe,0x29,0x6f,0x06] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <4 x i64> @llvm.x86.avx10.vmovrsq256(ptr %__C) %1 = bitcast i8 %__B to <8 x i1> %extract.i = shufflevector <8 x i1> %1, <8 x i1> poison, <4 x i32> %2 = select <4 x i1> %extract.i, <4 x i64> %0, <4 x i64> %__A ret <4 x i64> %2 } define <4 x i64> @test_mm256_maskz_movrsq_epu64(i8 zeroext %__A, ptr %__B) { ; CHECK-LABEL: test_mm256_maskz_movrsq_epu64: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] ; CHECK-NEXT: vmovrsq (%rsi), %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0xfe,0xa9,0x6f,0x06] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <4 x i64> @llvm.x86.avx10.vmovrsq256(ptr %__B) %1 = bitcast i8 %__A to <8 x i1> %extract.i = shufflevector <8 x i1> %1, <8 x i1> poison, <4 x i32> %2 = select <4 x i1> %extract.i, <4 x i64> %0, <4 x i64> zeroinitializer ret <4 x i64> %2 } define <2 x i64> @test_mm_movrsw_epu16(ptr %__A) { ; CHECK-LABEL: test_mm_movrsw_epu16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vmovrsw (%rdi), %xmm0 # encoding: [0x62,0xf5,0xff,0x08,0x6f,0x07] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <8 x i16> @llvm.x86.avx10.vmovrsw128(ptr %__A) %1 = bitcast <8 x i16> %0 to <2 x i64> ret <2 x i64> %1 } define <2 x i64> @test_mm_mask_movrsw_epu16(<2 x i64> %__A, i8 zeroext %__B, ptr %__C) { ; CHECK-LABEL: test_mm_mask_movrsw_epu16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] ; CHECK-NEXT: vmovrsw (%rsi), %xmm0 {%k1} # encoding: [0x62,0xf5,0xff,0x09,0x6f,0x06] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <8 x i16> @llvm.x86.avx10.vmovrsw128(ptr %__C) %1 = bitcast <2 x i64> %__A to <8 x i16> %2 = bitcast i8 %__B to <8 x i1> %3 = select <8 x i1> %2, <8 x i16> %0, <8 x i16> %1 %4 = bitcast <8 x i16> %3 to <2 x i64> ret <2 x i64> %4 } define <2 x i64> @test_mm_maskz_movrsw_epu16(i8 zeroext %__A, ptr %__B) { ; CHECK-LABEL: test_mm_maskz_movrsw_epu16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] ; CHECK-NEXT: vmovrsw (%rsi), %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0xff,0x89,0x6f,0x06] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <8 x i16> @llvm.x86.avx10.vmovrsw128(ptr %__B) %1 = bitcast i8 %__A to <8 x i1> %2 = select <8 x i1> %1, <8 x i16> %0, <8 x i16> zeroinitializer %3 = bitcast <8 x i16> %2 to <2 x i64> ret <2 x i64> %3 } define <4 x i64> @test_mm256_movrsw_epu16(ptr %__A) { ; CHECK-LABEL: test_mm256_movrsw_epu16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vmovrsw (%rdi), %ymm0 # encoding: [0x62,0xf5,0xff,0x28,0x6f,0x07] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <16 x i16> @llvm.x86.avx10.vmovrsw256(ptr %__A) %1 = bitcast <16 x i16> %0 to <4 x i64> ret <4 x i64> %1 } define <4 x i64> @test_mm256_mask_movrsw_epu16(<4 x i64> %__A, i16 zeroext %__B, ptr %__C) { ; CHECK-LABEL: test_mm256_mask_movrsw_epu16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] ; CHECK-NEXT: vmovrsw (%rsi), %ymm0 {%k1} # encoding: [0x62,0xf5,0xff,0x29,0x6f,0x06] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <16 x i16> @llvm.x86.avx10.vmovrsw256(ptr %__C) %1 = bitcast <4 x i64> %__A to <16 x i16> %2 = bitcast i16 %__B to <16 x i1> %3 = select <16 x i1> %2, <16 x i16> %0, <16 x i16> %1 %4 = bitcast <16 x i16> %3 to <4 x i64> ret <4 x i64> %4 } define <4 x i64> @test_mm256_maskz_movrsw_epu16(i16 zeroext %__A, ptr %__B) { ; CHECK-LABEL: test_mm256_maskz_movrsw_epu16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] ; CHECK-NEXT: vmovrsw (%rsi), %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0xff,0xa9,0x6f,0x06] ; CHECK-NEXT: retq # encoding: [0xc3] entry: %0 = tail call <16 x i16> @llvm.x86.avx10.vmovrsw256(ptr %__B) %1 = bitcast i16 %__A to <16 x i1> %2 = select <16 x i1> %1, <16 x i16> %0, <16 x i16> zeroinitializer %3 = bitcast <16 x i16> %2 to <4 x i64> ret <4 x i64> %3 } declare <16 x i8> @llvm.x86.avx10.vmovrsb128(ptr) declare <32 x i8> @llvm.x86.avx10.vmovrsb256(ptr) declare <4 x i32> @llvm.x86.avx10.vmovrsd128(ptr) declare <8 x i32> @llvm.x86.avx10.vmovrsd256(ptr) declare <2 x i64> @llvm.x86.avx10.vmovrsq128(ptr) declare <4 x i64> @llvm.x86.avx10.vmovrsq256(ptr) declare <8 x i16> @llvm.x86.avx10.vmovrsw128(ptr) declare <16 x i16> @llvm.x86.avx10.vmovrsw256(ptr)