; NOTE: Assertions have been autogenerated by utils/update_test_checks.py ; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-promote-alloca < %s | FileCheck %s ; Check that types where the store/allocation sizes don't match the type size ; don't crash. define <7 x i9> @load_elem_i9_access_7xi9() { ; CHECK-LABEL: @load_elem_i9_access_7xi9( ; CHECK-NEXT: [[P:%.*]] = alloca <16 x i9>, align 1, addrspace(5) ; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4 ; CHECK-NEXT: [[L:%.*]] = load <7 x i9>, ptr addrspace(5) [[G]], align 1 ; CHECK-NEXT: ret <7 x i9> [[L]] ; %p = alloca <16 x i9>, align 1, addrspace(5) %g = getelementptr i8, ptr addrspace(5) %p, i64 4 %l = load <7 x i9>, ptr addrspace(5) %g, align 1 ret <7 x i9> %l } define <8 x i1> @load_elem_i1_access_8xi1() { ; CHECK-LABEL: @load_elem_i1_access_8xi1( ; CHECK-NEXT: [[P:%.*]] = alloca <16 x i1>, align 1, addrspace(5) ; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4 ; CHECK-NEXT: [[L:%.*]] = load <8 x i1>, ptr addrspace(5) [[G]], align 1 ; CHECK-NEXT: ret <8 x i1> [[L]] ; %p = alloca <16 x i1>, align 1, addrspace(5) %g = getelementptr i8, ptr addrspace(5) %p, i64 4 %l = load <8 x i1>, ptr addrspace(5) %g, align 1 ret <8 x i1> %l } define <3 x i1> @load_elem_i1_access_3xi1() { ; CHECK-LABEL: @load_elem_i1_access_3xi1( ; CHECK-NEXT: [[P:%.*]] = alloca <16 x i1>, align 1, addrspace(5) ; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4 ; CHECK-NEXT: [[L:%.*]] = load <3 x i1>, ptr addrspace(5) [[G]], align 1 ; CHECK-NEXT: ret <3 x i1> [[L]] ; %p = alloca <16 x i1>, align 1, addrspace(5) %g = getelementptr i8, ptr addrspace(5) %p, i64 4 %l = load <3 x i1>, ptr addrspace(5) %g, align 1 ret <3 x i1> %l } define <3 x i1> @load_elem_i8_access_3xi1() { ; CHECK-LABEL: @load_elem_i8_access_3xi1( ; CHECK-NEXT: [[P:%.*]] = alloca <8 x i8>, align 1, addrspace(5) ; CHECK-NEXT: store <8 x i8> , ptr addrspace(5) [[P]], align 1 ; CHECK-NEXT: [[G:%.*]] = getelementptr <4 x i8>, ptr addrspace(5) [[P]], i64 1 ; CHECK-NEXT: [[L:%.*]] = load <3 x i1>, ptr addrspace(5) [[G]], align 1 ; CHECK-NEXT: ret <3 x i1> [[L]] ; %p = alloca <8 x i8>, align 1, addrspace(5) store <8 x i8> , ptr addrspace(5) %p, align 1 %g = getelementptr <4 x i8>, ptr addrspace(5) %p, i64 1 %l = load <3 x i1>, ptr addrspace(5) %g, align 1 ret <3 x i1> %l } ; This one is actually not problematic. define <8 x i1> @load_elem_i8_access_8xi1() { ; CHECK-LABEL: @load_elem_i8_access_8xi1( ; CHECK-NEXT: [[P:%.*]] = freeze <8 x i8> poison ; CHECK-NEXT: ret <8 x i1> ; %p = alloca <8 x i8>, align 1, addrspace(5) store <8 x i8> , ptr addrspace(5) %p, align 1 %g = getelementptr <4 x i8>, ptr addrspace(5) %p, i64 1 %l = load <8 x i1>, ptr addrspace(5) %g, align 1 ret <8 x i1> %l } define <8 x i1> @storeload_elem_i1_access_8xi1() { ; CHECK-LABEL: @storeload_elem_i1_access_8xi1( ; CHECK-NEXT: [[P:%.*]] = alloca <16 x i1>, align 1, addrspace(5) ; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4 ; CHECK-NEXT: store <8 x i1> , ptr addrspace(5) [[G]], align 1 ; CHECK-NEXT: [[L:%.*]] = load <8 x i1>, ptr addrspace(5) [[G]], align 1 ; CHECK-NEXT: ret <8 x i1> [[L]] ; %p = alloca <16 x i1>, align 1, addrspace(5) %g = getelementptr i8, ptr addrspace(5) %p, i64 4 store <8 x i1> , ptr addrspace(5) %g, align 1 %l = load <8 x i1>, ptr addrspace(5) %g, align 1 ret <8 x i1> %l } define <3 x i1> @storeload_elem_i1_access_3xi1() { ; CHECK-LABEL: @storeload_elem_i1_access_3xi1( ; CHECK-NEXT: [[P:%.*]] = alloca <16 x i1>, align 1, addrspace(5) ; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4 ; CHECK-NEXT: store <3 x i1> , ptr addrspace(5) [[G]], align 1 ; CHECK-NEXT: [[L:%.*]] = load <3 x i1>, ptr addrspace(5) [[G]], align 1 ; CHECK-NEXT: ret <3 x i1> [[L]] ; %p = alloca <16 x i1>, align 1, addrspace(5) %g = getelementptr i8, ptr addrspace(5) %p, i64 4 store <3 x i1> , ptr addrspace(5) %g, align 1 %l = load <3 x i1>, ptr addrspace(5) %g, align 1 ret <3 x i1> %l } define <3 x i1> @storeload_elem_i8_access_3xi1() { ; CHECK-LABEL: @storeload_elem_i8_access_3xi1( ; CHECK-NEXT: [[P:%.*]] = alloca <8 x i8>, align 1, addrspace(5) ; CHECK-NEXT: store <8 x i8> , ptr addrspace(5) [[P]], align 1 ; CHECK-NEXT: [[G:%.*]] = getelementptr <4 x i8>, ptr addrspace(5) [[P]], i64 1 ; CHECK-NEXT: store <3 x i1> , ptr addrspace(5) [[G]], align 1 ; CHECK-NEXT: [[L:%.*]] = load <3 x i1>, ptr addrspace(5) [[G]], align 1 ; CHECK-NEXT: ret <3 x i1> [[L]] ; %p = alloca <8 x i8>, align 1, addrspace(5) store <8 x i8> , ptr addrspace(5) %p, align 1 %g = getelementptr <4 x i8>, ptr addrspace(5) %p, i64 1 store <3 x i1> , ptr addrspace(5) %g, align 1 %l = load <3 x i1>, ptr addrspace(5) %g, align 1 ret <3 x i1> %l } ; This one is actually not problematic. define <8 x i1> @storeload_elem_i8_access_8xi1() { ; CHECK-LABEL: @storeload_elem_i8_access_8xi1( ; CHECK-NEXT: [[P:%.*]] = freeze <8 x i8> poison ; CHECK-NEXT: ret <8 x i1> ; %p = alloca <8 x i8>, align 1, addrspace(5) store <8 x i8> , ptr addrspace(5) %p, align 1 %g = getelementptr <4 x i8>, ptr addrspace(5) %p, i64 1 store <8 x i1> , ptr addrspace(5) %g, align 1 %l = load <8 x i1>, ptr addrspace(5) %g, align 1 ret <8 x i1> %l } define <8 x i1> @array_of_vec_elem_i1_access_8xi1() { ; CHECK-LABEL: @array_of_vec_elem_i1_access_8xi1( ; CHECK-NEXT: [[P:%.*]] = alloca [2 x <16 x i1>], align 1, addrspace(5) ; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4 ; CHECK-NEXT: store <8 x i1> , ptr addrspace(5) [[G]], align 1 ; CHECK-NEXT: [[L:%.*]] = load <8 x i1>, ptr addrspace(5) [[G]], align 1 ; CHECK-NEXT: ret <8 x i1> [[L]] ; %p = alloca [2 x <16 x i1>], align 1, addrspace(5) %g = getelementptr i8, ptr addrspace(5) %p, i64 4 store <8 x i1> , ptr addrspace(5) %g, align 1 %l = load <8 x i1>, ptr addrspace(5) %g, align 1 ret <8 x i1> %l } define <3 x i1> @array_of_vec_elem_i1_access_3xi1() { ; CHECK-LABEL: @array_of_vec_elem_i1_access_3xi1( ; CHECK-NEXT: [[P:%.*]] = alloca [2 x <16 x i1>], align 1, addrspace(5) ; CHECK-NEXT: [[G:%.*]] = getelementptr i8, ptr addrspace(5) [[P]], i64 4 ; CHECK-NEXT: store <3 x i1> , ptr addrspace(5) [[G]], align 1 ; CHECK-NEXT: [[L:%.*]] = load <3 x i1>, ptr addrspace(5) [[G]], align 1 ; CHECK-NEXT: ret <3 x i1> [[L]] ; %p = alloca [2 x <16 x i1>], align 1, addrspace(5) %g = getelementptr i8, ptr addrspace(5) %p, i64 4 store <3 x i1> , ptr addrspace(5) %g, align 1 %l = load <3 x i1>, ptr addrspace(5) %g, align 1 ret <3 x i1> %l } define <3 x i1> @array_of_vec_elem_i8_access_3xi1() { ; CHECK-LABEL: @array_of_vec_elem_i8_access_3xi1( ; CHECK-NEXT: [[P:%.*]] = alloca [2 x <8 x i8>], align 1, addrspace(5) ; CHECK-NEXT: store <8 x i8> , ptr addrspace(5) [[P]], align 1 ; CHECK-NEXT: [[G:%.*]] = getelementptr <4 x i8>, ptr addrspace(5) [[P]], i64 1 ; CHECK-NEXT: store <3 x i1> , ptr addrspace(5) [[G]], align 1 ; CHECK-NEXT: [[L:%.*]] = load <3 x i1>, ptr addrspace(5) [[G]], align 1 ; CHECK-NEXT: ret <3 x i1> [[L]] ; %p = alloca [2 x <8 x i8>], align 1, addrspace(5) store <8 x i8> , ptr addrspace(5) %p, align 1 %g = getelementptr <4 x i8>, ptr addrspace(5) %p, i64 1 store <3 x i1> , ptr addrspace(5) %g, align 1 %l = load <3 x i1>, ptr addrspace(5) %g, align 1 ret <3 x i1> %l } ; This one is actually not problematic. define <8 x i1> @array_of_vec_elem_i8_access_8xi1() { ; CHECK-LABEL: @array_of_vec_elem_i8_access_8xi1( ; CHECK-NEXT: [[P:%.*]] = freeze <16 x i8> poison ; CHECK-NEXT: [[TMP1:%.*]] = insertelement <16 x i8> [[P]], i8 1, i32 0 ; CHECK-NEXT: [[TMP2:%.*]] = insertelement <16 x i8> [[TMP1]], i8 2, i32 1 ; CHECK-NEXT: [[TMP3:%.*]] = insertelement <16 x i8> [[TMP2]], i8 3, i32 2 ; CHECK-NEXT: [[TMP4:%.*]] = insertelement <16 x i8> [[TMP3]], i8 4, i32 3 ; CHECK-NEXT: [[TMP5:%.*]] = insertelement <16 x i8> [[TMP4]], i8 5, i32 4 ; CHECK-NEXT: [[TMP6:%.*]] = insertelement <16 x i8> [[TMP5]], i8 6, i32 5 ; CHECK-NEXT: [[TMP7:%.*]] = insertelement <16 x i8> [[TMP6]], i8 7, i32 6 ; CHECK-NEXT: [[TMP8:%.*]] = insertelement <16 x i8> [[TMP7]], i8 8, i32 7 ; CHECK-NEXT: [[TMP9:%.*]] = insertelement <16 x i8> [[TMP8]], i8 5, i32 4 ; CHECK-NEXT: ret <8 x i1> ; %p = alloca [2 x <8 x i8>], align 1, addrspace(5) store <8 x i8> , ptr addrspace(5) %p, align 1 %g = getelementptr <4 x i8>, ptr addrspace(5) %p, i64 1 store <8 x i1> , ptr addrspace(5) %g, align 1 %l = load <8 x i1>, ptr addrspace(5) %g, align 1 ret <8 x i1> %l }