; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5 ; RUN: llc -verify-machineinstrs -mtriple=powerpc64le-unknown-linux-gnu \ ; RUN: -mcpu=future -ppc-asm-full-reg-names \ ; RUN: -ppc-vsr-nums-as-vr < %s | FileCheck %s ; RUN: llc -verify-machineinstrs -mtriple=powerpc64-ibm-aix \ ; RUN: -mcpu=future -ppc-asm-full-reg-names \ ; RUN: -ppc-vsr-nums-as-vr < %s | FileCheck %s --check-prefix=CHECK-BE define void @tdmrz(ptr nocapture readonly %vp1, ptr nocapture %resp) { ; CHECK-LABEL: tdmrz: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: dmsetdmrz dmr0 ; CHECK-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc0, 0 ; CHECK-NEXT: stxvp vsp34, 96(r4) ; CHECK-NEXT: stxvp vsp36, 64(r4) ; CHECK-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc_hi0, 1 ; CHECK-NEXT: stxvp vsp34, 32(r4) ; CHECK-NEXT: stxvp vsp36, 0(r4) ; CHECK-NEXT: blr ; ; CHECK-BE-LABEL: tdmrz: ; CHECK-BE: # %bb.0: # %entry ; CHECK-BE-NEXT: dmsetdmrz dmr0 ; CHECK-BE-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc_hi0, 1 ; CHECK-BE-NEXT: stxvp vsp36, 96(r4) ; CHECK-BE-NEXT: stxvp vsp34, 64(r4) ; CHECK-BE-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc0, 0 ; CHECK-BE-NEXT: stxvp vsp36, 32(r4) ; CHECK-BE-NEXT: stxvp vsp34, 0(r4) ; CHECK-BE-NEXT: blr entry: %z = call <1024 x i1> @llvm.ppc.mma.dmsetdmrz() store <1024 x i1> %z, ptr %resp, align 32 ret void } define void @tdmmr(ptr nocapture readonly %vp1, ptr nocapture %resp) { ; CHECK-LABEL: tdmmr: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: lxvp vsp34, 0(r3) ; CHECK-NEXT: lxvp vsp36, 32(r3) ; CHECK-NEXT: dmxxinstdmr512 wacc_hi0, vsp36, vsp34, 1 ; CHECK-NEXT: lxvp vsp34, 64(r3) ; CHECK-NEXT: lxvp vsp36, 96(r3) ; CHECK-NEXT: dmxxinstdmr512 wacc0, vsp36, vsp34, 0 ; CHECK-NEXT: dmmr dmr0, dmr0 ; CHECK-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc0, 0 ; CHECK-NEXT: stxvp vsp34, 96(r4) ; CHECK-NEXT: stxvp vsp36, 64(r4) ; CHECK-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc_hi0, 1 ; CHECK-NEXT: stxvp vsp34, 32(r4) ; CHECK-NEXT: stxvp vsp36, 0(r4) ; CHECK-NEXT: blr ; ; CHECK-BE-LABEL: tdmmr: ; CHECK-BE: # %bb.0: # %entry ; CHECK-BE-NEXT: lxvp vsp34, 96(r3) ; CHECK-BE-NEXT: lxvp vsp36, 64(r3) ; CHECK-BE-NEXT: dmxxinstdmr512 wacc_hi0, vsp36, vsp34, 1 ; CHECK-BE-NEXT: lxvp vsp34, 32(r3) ; CHECK-BE-NEXT: lxvp vsp36, 0(r3) ; CHECK-BE-NEXT: dmxxinstdmr512 wacc0, vsp36, vsp34, 0 ; CHECK-BE-NEXT: dmmr dmr0, dmr0 ; CHECK-BE-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc_hi0, 1 ; CHECK-BE-NEXT: stxvp vsp36, 96(r4) ; CHECK-BE-NEXT: stxvp vsp34, 64(r4) ; CHECK-BE-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc0, 0 ; CHECK-BE-NEXT: stxvp vsp36, 32(r4) ; CHECK-BE-NEXT: stxvp vsp34, 0(r4) ; CHECK-BE-NEXT: blr entry: %l = load <1024 x i1>, ptr %vp1, align 32 %c = call <1024 x i1> @llvm.ppc.mma.dmmr(<1024 x i1> %l) store <1024 x i1> %c, ptr %resp, align 32 ret void } define void @tdmxor(ptr nocapture readonly %vp1, ptr %vp2, ptr nocapture %resp) { ; CHECK-LABEL: tdmxor: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: lxvp vsp34, 0(r3) ; CHECK-NEXT: lxvp vsp36, 32(r3) ; CHECK-NEXT: dmxxinstdmr512 wacc_hi0, vsp36, vsp34, 1 ; CHECK-NEXT: lxvp vsp34, 64(r3) ; CHECK-NEXT: lxvp vsp36, 96(r3) ; CHECK-NEXT: dmxxinstdmr512 wacc0, vsp36, vsp34, 0 ; CHECK-NEXT: lxvp vsp34, 0(r4) ; CHECK-NEXT: lxvp vsp36, 32(r4) ; CHECK-NEXT: dmxxinstdmr512 wacc_hi1, vsp36, vsp34, 1 ; CHECK-NEXT: lxvp vsp34, 64(r4) ; CHECK-NEXT: lxvp vsp36, 96(r4) ; CHECK-NEXT: dmxxinstdmr512 wacc1, vsp36, vsp34, 0 ; CHECK-NEXT: dmxor dmr0, dmr1 ; CHECK-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc0, 0 ; CHECK-NEXT: stxvp vsp34, 96(r5) ; CHECK-NEXT: stxvp vsp36, 64(r5) ; CHECK-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc_hi0, 1 ; CHECK-NEXT: stxvp vsp34, 32(r5) ; CHECK-NEXT: stxvp vsp36, 0(r5) ; CHECK-NEXT: blr ; ; CHECK-BE-LABEL: tdmxor: ; CHECK-BE: # %bb.0: # %entry ; CHECK-BE-NEXT: lxvp vsp34, 96(r3) ; CHECK-BE-NEXT: lxvp vsp36, 64(r3) ; CHECK-BE-NEXT: dmxxinstdmr512 wacc_hi0, vsp36, vsp34, 1 ; CHECK-BE-NEXT: lxvp vsp34, 32(r3) ; CHECK-BE-NEXT: lxvp vsp36, 0(r3) ; CHECK-BE-NEXT: dmxxinstdmr512 wacc0, vsp36, vsp34, 0 ; CHECK-BE-NEXT: lxvp vsp34, 96(r4) ; CHECK-BE-NEXT: lxvp vsp36, 64(r4) ; CHECK-BE-NEXT: dmxxinstdmr512 wacc_hi1, vsp36, vsp34, 1 ; CHECK-BE-NEXT: lxvp vsp34, 32(r4) ; CHECK-BE-NEXT: lxvp vsp36, 0(r4) ; CHECK-BE-NEXT: dmxxinstdmr512 wacc1, vsp36, vsp34, 0 ; CHECK-BE-NEXT: dmxor dmr0, dmr1 ; CHECK-BE-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc_hi0, 1 ; CHECK-BE-NEXT: stxvp vsp36, 96(r5) ; CHECK-BE-NEXT: stxvp vsp34, 64(r5) ; CHECK-BE-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc0, 0 ; CHECK-BE-NEXT: stxvp vsp36, 32(r5) ; CHECK-BE-NEXT: stxvp vsp34, 0(r5) ; CHECK-BE-NEXT: blr entry: %l = load <1024 x i1>, ptr %vp1, align 32 %r = load <1024 x i1>, ptr %vp2, align 32 %x = call <1024 x i1> @llvm.ppc.mma.dmxor(<1024 x i1> %l, <1024 x i1> %r) store <1024 x i1> %x, ptr %resp, align 32 ret void } define void @text512(ptr %vp1, ptr %rp1, ptr %rp2, ptr %rp3, ptr %rp4) { ; CHECK-LABEL: text512: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: dmsetdmrz dmr0 ; CHECK-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc0, 0 ; CHECK-NEXT: stxv v2, 16(r4) ; CHECK-NEXT: stxv v3, 0(r4) ; CHECK-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc_hi0, 1 ; CHECK-NEXT: stxv v2, 16(r6) ; CHECK-NEXT: stxv v3, 0(r6) ; CHECK-NEXT: blr ; ; CHECK-BE-LABEL: text512: ; CHECK-BE: # %bb.0: # %entry ; CHECK-BE-NEXT: dmsetdmrz dmr0 ; CHECK-BE-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc0, 0 ; CHECK-BE-NEXT: stxv v3, 16(r4) ; CHECK-BE-NEXT: stxv v2, 0(r4) ; CHECK-BE-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc_hi0, 1 ; CHECK-BE-NEXT: stxv v3, 16(r6) ; CHECK-BE-NEXT: stxv v2, 0(r6) ; CHECK-BE-NEXT: blr entry: %z = call <1024 x i1> @llvm.ppc.mma.dmsetdmrz() %x = call { <256 x i1>, <256 x i1> } @llvm.ppc.mma.dmxxextfdmr512(<1024 x i1> %z, i32 0) %p = extractvalue { <256 x i1>, <256 x i1 > } %x, 0 store <256 x i1> %p, ptr %rp1, align 16 %y = call { <256 x i1>, <256 x i1> } @llvm.ppc.mma.dmxxextfdmr512(<1024 x i1> %z, i32 1) %q = extractvalue { <256 x i1>, <256 x i1 > } %y, 0 store <256 x i1> %q, ptr %rp3, align 16 ret void } define void @text256(ptr %vp1, ptr %rp1, ptr %rp2, ptr %rp3, ptr %rp4) { ; CHECK-LABEL: text256: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: dmsetdmrz dmr0 ; CHECK-NEXT: dmxxextfdmr256 vsp34, dmr0, 0 ; CHECK-NEXT: stxv v2, 16(r4) ; CHECK-NEXT: stxv v3, 0(r4) ; CHECK-NEXT: dmxxextfdmr256 vsp34, dmr0, 1 ; CHECK-NEXT: stxv v2, 16(r5) ; CHECK-NEXT: stxv v3, 0(r5) ; CHECK-NEXT: dmxxextfdmr256 vsp34, dmr0, 2 ; CHECK-NEXT: stxv v2, 16(r6) ; CHECK-NEXT: stxv v3, 0(r6) ; CHECK-NEXT: dmxxextfdmr256 vsp34, dmr0, 3 ; CHECK-NEXT: stxv v2, 16(r7) ; CHECK-NEXT: stxv v3, 0(r7) ; CHECK-NEXT: blr ; ; CHECK-BE-LABEL: text256: ; CHECK-BE: # %bb.0: # %entry ; CHECK-BE-NEXT: dmsetdmrz dmr0 ; CHECK-BE-NEXT: dmxxextfdmr256 vsp34, dmr0, 0 ; CHECK-BE-NEXT: stxv v3, 16(r4) ; CHECK-BE-NEXT: stxv v2, 0(r4) ; CHECK-BE-NEXT: dmxxextfdmr256 vsp34, dmr0, 1 ; CHECK-BE-NEXT: stxv v3, 16(r5) ; CHECK-BE-NEXT: stxv v2, 0(r5) ; CHECK-BE-NEXT: dmxxextfdmr256 vsp34, dmr0, 2 ; CHECK-BE-NEXT: stxv v3, 16(r6) ; CHECK-BE-NEXT: stxv v2, 0(r6) ; CHECK-BE-NEXT: dmxxextfdmr256 vsp34, dmr0, 3 ; CHECK-BE-NEXT: stxv v3, 16(r7) ; CHECK-BE-NEXT: stxv v2, 0(r7) ; CHECK-BE-NEXT: blr entry: %z = call <1024 x i1> @llvm.ppc.mma.dmsetdmrz() %x = call <256 x i1> @llvm.ppc.mma.dmxxextfdmr256(<1024 x i1> %z, i32 0) store <256 x i1> %x, ptr %rp1, align 16 %q = call <256 x i1> @llvm.ppc.mma.dmxxextfdmr256(<1024 x i1> %z, i32 1) store <256 x i1> %q, ptr %rp2, align 16 %w = call <256 x i1> @llvm.ppc.mma.dmxxextfdmr256(<1024 x i1> %z, i32 2) store <256 x i1> %w, ptr %rp3, align 16 %y = call <256 x i1> @llvm.ppc.mma.dmxxextfdmr256(<1024 x i1> %z, i32 3) store <256 x i1> %y, ptr %rp4, align 16 ret void } define void @tins512(ptr %vp1, ptr %vp2, ptr %vp3, ptr %vp4, ptr %rp1, ptr %rp2) { ; CHECK-LABEL: tins512: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: lxv v2, 16(r3) ; CHECK-NEXT: lxv v3, 0(r3) ; CHECK-NEXT: lxv v4, 16(r4) ; CHECK-NEXT: lxv v5, 0(r4) ; CHECK-NEXT: dmsetdmrz dmr0 ; CHECK-NEXT: dmxxinstdmr512 wacc0, vsp34, vsp36, 0 ; CHECK-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc0, 0 ; CHECK-NEXT: stxvp vsp34, 96(r7) ; CHECK-NEXT: stxvp vsp36, 64(r7) ; CHECK-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc_hi0, 1 ; CHECK-NEXT: stxvp vsp34, 32(r7) ; CHECK-NEXT: stxvp vsp36, 0(r7) ; CHECK-NEXT: lxv v2, 16(r5) ; CHECK-NEXT: lxv v4, 16(r6) ; CHECK-NEXT: lxv v3, 0(r5) ; CHECK-NEXT: lxv v5, 0(r6) ; CHECK-NEXT: dmxxinstdmr512 wacc_hi0, vsp34, vsp36, 1 ; CHECK-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc0, 0 ; CHECK-NEXT: stxvp vsp34, 96(r8) ; CHECK-NEXT: stxvp vsp36, 64(r8) ; CHECK-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc_hi0, 1 ; CHECK-NEXT: stxvp vsp34, 32(r8) ; CHECK-NEXT: stxvp vsp36, 0(r8) ; CHECK-NEXT: blr ; ; CHECK-BE-LABEL: tins512: ; CHECK-BE: # %bb.0: # %entry ; CHECK-BE-NEXT: lxv v2, 0(r3) ; CHECK-BE-NEXT: lxv v3, 16(r3) ; CHECK-BE-NEXT: lxv v4, 0(r4) ; CHECK-BE-NEXT: lxv v5, 16(r4) ; CHECK-BE-NEXT: dmsetdmrz dmr0 ; CHECK-BE-NEXT: dmxxinstdmr512 wacc0, vsp34, vsp36, 0 ; CHECK-BE-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc_hi0, 1 ; CHECK-BE-NEXT: stxvp vsp36, 96(r7) ; CHECK-BE-NEXT: stxvp vsp34, 64(r7) ; CHECK-BE-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc0, 0 ; CHECK-BE-NEXT: stxvp vsp36, 32(r7) ; CHECK-BE-NEXT: stxvp vsp34, 0(r7) ; CHECK-BE-NEXT: lxv v2, 0(r5) ; CHECK-BE-NEXT: lxv v4, 0(r6) ; CHECK-BE-NEXT: lxv v3, 16(r5) ; CHECK-BE-NEXT: lxv v5, 16(r6) ; CHECK-BE-NEXT: dmxxinstdmr512 wacc_hi0, vsp34, vsp36, 1 ; CHECK-BE-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc_hi0, 1 ; CHECK-BE-NEXT: stxvp vsp36, 96(r8) ; CHECK-BE-NEXT: stxvp vsp34, 64(r8) ; CHECK-BE-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc0, 0 ; CHECK-BE-NEXT: stxvp vsp36, 32(r8) ; CHECK-BE-NEXT: stxvp vsp34, 0(r8) ; CHECK-BE-NEXT: blr entry: %z = call <1024 x i1> @llvm.ppc.mma.dmsetdmrz() %l1 = load <256 x i1>, ptr %vp1, align 16 %r1 = load <256 x i1>, ptr %vp2, align 16 %a = call <1024 x i1> @llvm.ppc.mma.dmxxinstdmr512(<1024 x i1> %z, <256 x i1> %l1, <256 x i1> %r1, i32 0) store <1024 x i1> %a, ptr %rp1, align 16 %l2 = load <256 x i1>, ptr %vp3, align 16 %r2 = load <256 x i1>, ptr %vp4, align 16 %b = call <1024 x i1> @llvm.ppc.mma.dmxxinstdmr512(<1024 x i1> %a, <256 x i1> %l2, <256 x i1> %r2, i32 1) store <1024 x i1> %b, ptr %rp2, align 16 ret void } define void @tins256(ptr %vp1, ptr %vp2, ptr %vp3, ptr %vp4, ptr %rp1, ptr %rp2, ptr %rp3, ptr %rp4) { ; CHECK-LABEL: tins256: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: lxv v2, 16(r3) ; CHECK-NEXT: lxv v3, 0(r3) ; CHECK-NEXT: dmsetdmrz dmr0 ; CHECK-NEXT: dmxxinstdmr256 dmr0, vsp34, 0 ; CHECK-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc0, 0 ; CHECK-NEXT: stxvp vsp34, 96(r7) ; CHECK-NEXT: stxvp vsp36, 64(r7) ; CHECK-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc_hi0, 1 ; CHECK-NEXT: stxvp vsp34, 32(r7) ; CHECK-NEXT: stxvp vsp36, 0(r7) ; CHECK-NEXT: lxv v2, 16(r4) ; CHECK-NEXT: lxv v3, 0(r4) ; CHECK-NEXT: dmxxinstdmr256 dmr0, vsp34, 1 ; CHECK-NEXT: dmxxextfdmr512 vsp36, vsp32, wacc0, 0 ; CHECK-NEXT: stxvp vsp36, 96(r8) ; CHECK-NEXT: stxvp vsp32, 64(r8) ; CHECK-NEXT: dmxxextfdmr512 vsp36, vsp32, wacc_hi0, 1 ; CHECK-NEXT: stxvp vsp36, 32(r8) ; CHECK-NEXT: stxvp vsp32, 0(r8) ; CHECK-NEXT: dmxxinstdmr256 dmr0, vsp34, 2 ; CHECK-NEXT: dmxxextfdmr512 vsp36, vsp32, wacc0, 0 ; CHECK-NEXT: stxvp vsp36, 96(r9) ; CHECK-NEXT: stxvp vsp32, 64(r9) ; CHECK-NEXT: dmxxextfdmr512 vsp36, vsp32, wacc_hi0, 1 ; CHECK-NEXT: stxvp vsp36, 32(r9) ; CHECK-NEXT: stxvp vsp32, 0(r9) ; CHECK-NEXT: dmxxinstdmr256 dmr0, vsp34, 3 ; CHECK-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc0, 0 ; CHECK-NEXT: stxvp vsp34, 96(r10) ; CHECK-NEXT: stxvp vsp36, 64(r10) ; CHECK-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc_hi0, 1 ; CHECK-NEXT: stxvp vsp34, 32(r10) ; CHECK-NEXT: stxvp vsp36, 0(r10) ; CHECK-NEXT: blr ; ; CHECK-BE-LABEL: tins256: ; CHECK-BE: # %bb.0: # %entry ; CHECK-BE-NEXT: lxv v2, 0(r3) ; CHECK-BE-NEXT: lxv v3, 16(r3) ; CHECK-BE-NEXT: dmsetdmrz dmr0 ; CHECK-BE-NEXT: dmxxinstdmr256 dmr0, vsp34, 0 ; CHECK-BE-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc_hi0, 1 ; CHECK-BE-NEXT: stxvp vsp36, 96(r7) ; CHECK-BE-NEXT: stxvp vsp34, 64(r7) ; CHECK-BE-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc0, 0 ; CHECK-BE-NEXT: stxvp vsp36, 32(r7) ; CHECK-BE-NEXT: stxvp vsp34, 0(r7) ; CHECK-BE-NEXT: lxv v2, 0(r4) ; CHECK-BE-NEXT: lxv v3, 16(r4) ; CHECK-BE-NEXT: dmxxinstdmr256 dmr0, vsp34, 1 ; CHECK-BE-NEXT: dmxxextfdmr512 vsp36, vsp32, wacc_hi0, 1 ; CHECK-BE-NEXT: stxvp vsp32, 96(r8) ; CHECK-BE-NEXT: stxvp vsp36, 64(r8) ; CHECK-BE-NEXT: dmxxextfdmr512 vsp36, vsp32, wacc0, 0 ; CHECK-BE-NEXT: stxvp vsp32, 32(r8) ; CHECK-BE-NEXT: stxvp vsp36, 0(r8) ; CHECK-BE-NEXT: dmxxinstdmr256 dmr0, vsp34, 2 ; CHECK-BE-NEXT: dmxxextfdmr512 vsp36, vsp32, wacc_hi0, 1 ; CHECK-BE-NEXT: stxvp vsp32, 96(r9) ; CHECK-BE-NEXT: stxvp vsp36, 64(r9) ; CHECK-BE-NEXT: dmxxextfdmr512 vsp36, vsp32, wacc0, 0 ; CHECK-BE-NEXT: stxvp vsp32, 32(r9) ; CHECK-BE-NEXT: stxvp vsp36, 0(r9) ; CHECK-BE-NEXT: dmxxinstdmr256 dmr0, vsp34, 3 ; CHECK-BE-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc_hi0, 1 ; CHECK-BE-NEXT: stxvp vsp36, 96(r10) ; CHECK-BE-NEXT: stxvp vsp34, 64(r10) ; CHECK-BE-NEXT: dmxxextfdmr512 vsp34, vsp36, wacc0, 0 ; CHECK-BE-NEXT: stxvp vsp36, 32(r10) ; CHECK-BE-NEXT: stxvp vsp34, 0(r10) ; CHECK-BE-NEXT: blr entry: %z = call <1024 x i1> @llvm.ppc.mma.dmsetdmrz() %l1 = load <256 x i1>, ptr %vp1, align 16 %a = call <1024 x i1> @llvm.ppc.mma.dmxxinstdmr256(<1024 x i1> %z, <256 x i1> %l1, i32 0) store <1024 x i1> %a, ptr %rp1, align 16 %l2 = load <256 x i1>, ptr %vp2, align 16 %b = call <1024 x i1> @llvm.ppc.mma.dmxxinstdmr256(<1024 x i1> %a, <256 x i1> %l2, i32 1) store <1024 x i1> %b, ptr %rp2, align 16 %l3 = load <256 x i1>, ptr %vp3, align 16 %c = call <1024 x i1> @llvm.ppc.mma.dmxxinstdmr256(<1024 x i1> %b, <256 x i1> %l2, i32 2) store <1024 x i1> %c, ptr %rp3, align 16 %l4 = load <256 x i1>, ptr %vp4, align 16 %d = call <1024 x i1> @llvm.ppc.mma.dmxxinstdmr256(<1024 x i1> %c, <256 x i1> %l2, i32 3) store <1024 x i1> %d, ptr %rp4, align 16 ret void } declare <1024 x i1> @llvm.ppc.mma.dmsetdmrz() declare <1024 x i1> @llvm.ppc.mma.dmmr(<1024 x i1>) declare <1024 x i1> @llvm.ppc.mma.dmxor(<1024 x i1>, <1024 x i1>) declare <1024 x i1> @llvm.ppc.mma.dmxxinstdmr512(<1024 x i1>, <256 x i1>, <256 x i1>, i32) declare <1024 x i1> @llvm.ppc.mma.dmxxinstdmr256(<1024 x i1>, <256 x i1>, i32) declare { <256 x i1>, <256 x i1> } @llvm.ppc.mma.dmxxextfdmr512(<1024 x i1>, i32) declare <256 x i1> @llvm.ppc.mma.dmxxextfdmr256(<1024 x i1>, i32)