// NOTE: Assertions have been autogenerated by utils/update_cc_test_checks.py UTC_ARGS: --version 6 // RUN: %clang_cc1 -triple spirv64-amd-amdhsa -x hip -emit-llvm -fcuda-is-device -O3 \ // RUN: -o - %s | FileCheck --check-prefix=AMDGCNSPIRV %s // RUN: %clang_cc1 -triple amdgcn-amd-amdhsa -x hip -target-cpu gfx906 -emit-llvm -fcuda-is-device -O3 \ // RUN: -o - %s | FileCheck --check-prefix=AMDGPU %s #define __global__ __attribute__((global)) #define __device__ __attribute__((device)) union Transparent { unsigned x; }; using V1 = unsigned __attribute__((ext_vector_type(1))); using V2 = unsigned __attribute__((ext_vector_type(2))); using V3 = unsigned __attribute__((ext_vector_type(3))); using V4 = unsigned __attribute__((ext_vector_type(4))); struct SingleElement { unsigned x; }; struct ByRef { unsigned x[17]; }; // AMDGCNSPIRV-LABEL: define spir_kernel void @_Z2k0s( // AMDGCNSPIRV-SAME: i16 noundef [[TMP0:%.*]]) local_unnamed_addr addrspace(4) #[[ATTR0:[0-9]+]] !max_work_group_size [[META9:![0-9]+]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret void // // AMDGPU-LABEL: define dso_local amdgpu_kernel void @_Z2k0s( // AMDGPU-SAME: i16 noundef [[TMP0:%.*]]) local_unnamed_addr #[[ATTR0:[0-9]+]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret void // __global__ void k0(short) { } // AMDGCNSPIRV-LABEL: define spir_kernel void @_Z2k1j( // AMDGCNSPIRV-SAME: i32 noundef [[TMP0:%.*]]) local_unnamed_addr addrspace(4) #[[ATTR0]] !max_work_group_size [[META9]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret void // // AMDGPU-LABEL: define dso_local amdgpu_kernel void @_Z2k1j( // AMDGPU-SAME: i32 noundef [[TMP0:%.*]]) local_unnamed_addr #[[ATTR0]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret void // __global__ void k1(unsigned) { } // AMDGCNSPIRV-LABEL: define spir_kernel void @_Z2k2d( // AMDGCNSPIRV-SAME: double noundef [[TMP0:%.*]]) local_unnamed_addr addrspace(4) #[[ATTR0]] !max_work_group_size [[META9]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret void // // AMDGPU-LABEL: define dso_local amdgpu_kernel void @_Z2k2d( // AMDGPU-SAME: double noundef [[TMP0:%.*]]) local_unnamed_addr #[[ATTR0]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret void // __global__ void k2(double) { } // AMDGCNSPIRV-LABEL: define spir_kernel void @_Z2k311Transparent( // AMDGCNSPIRV-SAME: i32 [[DOTCOERCE:%.*]]) local_unnamed_addr addrspace(4) #[[ATTR0]] !max_work_group_size [[META9]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret void // // AMDGPU-LABEL: define dso_local amdgpu_kernel void @_Z2k311Transparent( // AMDGPU-SAME: i32 [[DOTCOERCE:%.*]]) local_unnamed_addr #[[ATTR0]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret void // __global__ void k3(Transparent) { } // AMDGCNSPIRV-LABEL: define spir_kernel void @_Z2k413SingleElement( // AMDGCNSPIRV-SAME: i32 [[DOTCOERCE:%.*]]) local_unnamed_addr addrspace(4) #[[ATTR0]] !max_work_group_size [[META9]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret void // // AMDGPU-LABEL: define dso_local amdgpu_kernel void @_Z2k413SingleElement( // AMDGPU-SAME: i32 [[DOTCOERCE:%.*]]) local_unnamed_addr #[[ATTR0]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret void // __global__ void k4(SingleElement) { } // AMDGCNSPIRV-LABEL: define spir_kernel void @_Z2k55ByRef( // AMDGCNSPIRV-SAME: ptr addrspace(2) noundef readnone byref([[STRUCT_BYREF:%.*]]) align 4 captures(none) [[TMP0:%.*]]) local_unnamed_addr addrspace(4) #[[ATTR0]] !max_work_group_size [[META9]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret void // // AMDGPU-LABEL: define dso_local amdgpu_kernel void @_Z2k55ByRef( // AMDGPU-SAME: ptr addrspace(4) noundef readnone byref([[STRUCT_BYREF:%.*]]) align 4 captures(none) [[TMP0:%.*]]) local_unnamed_addr #[[ATTR0]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret void // __global__ void k5(ByRef) { } // AMDGCNSPIRV-LABEL: define spir_kernel void @_Z2k6Dv1_jDv2_jDv3_jDv4_j( // AMDGCNSPIRV-SAME: <1 x i32> noundef [[TMP0:%.*]], <2 x i32> noundef [[TMP1:%.*]], <3 x i32> noundef [[TMP2:%.*]], <4 x i32> noundef [[TMP3:%.*]]) local_unnamed_addr addrspace(4) #[[ATTR0]] !max_work_group_size [[META9]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret void // // AMDGPU-LABEL: define dso_local amdgpu_kernel void @_Z2k6Dv1_jDv2_jDv3_jDv4_j( // AMDGPU-SAME: <1 x i32> noundef [[TMP0:%.*]], <2 x i32> noundef [[TMP1:%.*]], <3 x i32> noundef [[TMP2:%.*]], <4 x i32> noundef [[TMP3:%.*]]) local_unnamed_addr #[[ATTR0]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret void // __global__ void k6(V1, V2, V3, V4) { } // AMDGCNSPIRV-LABEL: define spir_kernel void @_Z2k7Pj( // AMDGCNSPIRV-SAME: ptr addrspace(1) noundef readnone captures(none) [[DOTCOERCE:%.*]]) local_unnamed_addr addrspace(4) #[[ATTR0]] !max_work_group_size [[META9]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret void // // AMDGPU-LABEL: define dso_local amdgpu_kernel void @_Z2k7Pj( // AMDGPU-SAME: ptr addrspace(1) noundef readnone captures(none) [[DOTCOERCE:%.*]]) local_unnamed_addr #[[ATTR0]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret void // __global__ void k7(unsigned*) { } // AMDGCNSPIRV-LABEL: define spir_func void @_Z2f0s( // AMDGCNSPIRV-SAME: i16 noundef signext [[TMP0:%.*]]) local_unnamed_addr addrspace(4) #[[ATTR1:[0-9]+]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret void // // AMDGPU-LABEL: define dso_local void @_Z2f0s( // AMDGPU-SAME: i16 noundef signext [[TMP0:%.*]]) local_unnamed_addr #[[ATTR1:[0-9]+]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret void // __device__ void f0(short) { } // AMDGCNSPIRV-LABEL: define spir_func void @_Z2f1j( // AMDGCNSPIRV-SAME: i32 noundef [[TMP0:%.*]]) local_unnamed_addr addrspace(4) #[[ATTR1]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret void // // AMDGPU-LABEL: define dso_local void @_Z2f1j( // AMDGPU-SAME: i32 noundef [[TMP0:%.*]]) local_unnamed_addr #[[ATTR1]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret void // __device__ void f1(unsigned) { } // AMDGCNSPIRV-LABEL: define spir_func void @_Z2f2d( // AMDGCNSPIRV-SAME: double noundef [[TMP0:%.*]]) local_unnamed_addr addrspace(4) #[[ATTR1]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret void // // AMDGPU-LABEL: define dso_local void @_Z2f2d( // AMDGPU-SAME: double noundef [[TMP0:%.*]]) local_unnamed_addr #[[ATTR1]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret void // __device__ void f2(double) { } // AMDGCNSPIRV-LABEL: define spir_func void @_Z2f311Transparent( // AMDGCNSPIRV-SAME: i32 [[DOTCOERCE:%.*]]) local_unnamed_addr addrspace(4) #[[ATTR1]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret void // // AMDGPU-LABEL: define dso_local void @_Z2f311Transparent( // AMDGPU-SAME: i32 [[DOTCOERCE:%.*]]) local_unnamed_addr #[[ATTR1]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret void // __device__ void f3(Transparent) { } // AMDGCNSPIRV-LABEL: define spir_func void @_Z2f413SingleElement( // AMDGCNSPIRV-SAME: i32 [[DOTCOERCE:%.*]]) local_unnamed_addr addrspace(4) #[[ATTR1]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret void // // AMDGPU-LABEL: define dso_local void @_Z2f413SingleElement( // AMDGPU-SAME: i32 [[DOTCOERCE:%.*]]) local_unnamed_addr #[[ATTR1]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret void // __device__ void f4(SingleElement) { } // AMDGCNSPIRV-LABEL: define spir_func void @_Z2f55ByRef( // AMDGCNSPIRV-SAME: ptr noundef readnone byref([[STRUCT_BYREF:%.*]]) align 4 captures(none) [[TMP0:%.*]]) local_unnamed_addr addrspace(4) #[[ATTR1]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret void // // AMDGPU-LABEL: define dso_local void @_Z2f55ByRef( // AMDGPU-SAME: ptr addrspace(5) noundef readnone byref([[STRUCT_BYREF:%.*]]) align 4 captures(none) [[TMP0:%.*]]) local_unnamed_addr #[[ATTR1]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret void // __device__ void f5(ByRef) { } // AMDGCNSPIRV-LABEL: define spir_func void @_Z2f6Dv1_jDv2_jDv3_jDv4_j( // AMDGCNSPIRV-SAME: <1 x i32> noundef [[TMP0:%.*]], <2 x i32> noundef [[TMP1:%.*]], <3 x i32> noundef [[TMP2:%.*]], <4 x i32> noundef [[TMP3:%.*]]) local_unnamed_addr addrspace(4) #[[ATTR1]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret void // // AMDGPU-LABEL: define dso_local void @_Z2f6Dv1_jDv2_jDv3_jDv4_j( // AMDGPU-SAME: <1 x i32> noundef [[TMP0:%.*]], <2 x i32> noundef [[TMP1:%.*]], <3 x i32> noundef [[TMP2:%.*]], <4 x i32> noundef [[TMP3:%.*]]) local_unnamed_addr #[[ATTR1]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret void // __device__ void f6(V1, V2, V3, V4) { } // AMDGCNSPIRV-LABEL: define spir_func noundef signext i16 @_Z2f7v( // AMDGCNSPIRV-SAME: ) local_unnamed_addr addrspace(4) #[[ATTR1]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret i16 0 // // AMDGPU-LABEL: define dso_local noundef signext i16 @_Z2f7v( // AMDGPU-SAME: ) local_unnamed_addr #[[ATTR1]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret i16 0 // __device__ short f7() { return 0; } // AMDGCNSPIRV-LABEL: define spir_func noundef i32 @_Z2f8v( // AMDGCNSPIRV-SAME: ) local_unnamed_addr addrspace(4) #[[ATTR1]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret i32 0 // // AMDGPU-LABEL: define dso_local noundef i32 @_Z2f8v( // AMDGPU-SAME: ) local_unnamed_addr #[[ATTR1]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret i32 0 // __device__ unsigned f8() { return 0; } // AMDGCNSPIRV-LABEL: define spir_func noundef double @_Z2f9v( // AMDGCNSPIRV-SAME: ) local_unnamed_addr addrspace(4) #[[ATTR1]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret double 0.000000e+00 // // AMDGPU-LABEL: define dso_local noundef double @_Z2f9v( // AMDGPU-SAME: ) local_unnamed_addr #[[ATTR1]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret double 0.000000e+00 // __device__ double f9() { return 0.; } // AMDGCNSPIRV-LABEL: define spir_func noundef i32 @_Z3f10v( // AMDGCNSPIRV-SAME: ) local_unnamed_addr addrspace(4) #[[ATTR1]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret i32 0 // // AMDGPU-LABEL: define dso_local noundef i32 @_Z3f10v( // AMDGPU-SAME: ) local_unnamed_addr #[[ATTR1]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret i32 0 // __device__ Transparent f10() { return {}; } // AMDGCNSPIRV-LABEL: define spir_func noundef i32 @_Z3f11v( // AMDGCNSPIRV-SAME: ) local_unnamed_addr addrspace(4) #[[ATTR1]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret i32 0 // // AMDGPU-LABEL: define dso_local noundef i32 @_Z3f11v( // AMDGPU-SAME: ) local_unnamed_addr #[[ATTR1]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret i32 0 // __device__ SingleElement f11() { return {}; } // AMDGCNSPIRV-LABEL: define spir_func void @_Z3f12v( // AMDGCNSPIRV-SAME: ptr dead_on_unwind noalias writable writeonly sret([[STRUCT_BYREF:%.*]]) align 4 captures(none) initializes((0, 68)) [[AGG_RESULT:%.*]]) local_unnamed_addr addrspace(4) #[[ATTR2:[0-9]+]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: tail call addrspace(4) void @llvm.memset.p0.i64(ptr noundef nonnull align 4 dereferenceable(68) [[AGG_RESULT]], i8 0, i64 68, i1 false) // AMDGCNSPIRV-NEXT: ret void // // AMDGPU-LABEL: define dso_local void @_Z3f12v( // AMDGPU-SAME: ptr addrspace(5) dead_on_unwind noalias writable writeonly sret([[STRUCT_BYREF:%.*]]) align 4 captures(none) initializes((0, 68)) [[AGG_RESULT:%.*]]) local_unnamed_addr #[[ATTR2:[0-9]+]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: tail call void @llvm.memset.p5.i64(ptr addrspace(5) noundef align 4 dereferenceable(68) [[AGG_RESULT]], i8 0, i64 68, i1 false) // AMDGPU-NEXT: ret void // __device__ ByRef f12() { return {}; } // AMDGCNSPIRV-LABEL: define spir_func noundef <1 x i32> @_Z3f13v( // AMDGCNSPIRV-SAME: ) local_unnamed_addr addrspace(4) #[[ATTR1]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret <1 x i32> zeroinitializer // // AMDGPU-LABEL: define dso_local noundef <1 x i32> @_Z3f13v( // AMDGPU-SAME: ) local_unnamed_addr #[[ATTR1]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret <1 x i32> zeroinitializer // __device__ V1 f13() { return {}; } // AMDGCNSPIRV-LABEL: define spir_func noundef <2 x i32> @_Z3f14v( // AMDGCNSPIRV-SAME: ) local_unnamed_addr addrspace(4) #[[ATTR1]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret <2 x i32> zeroinitializer // // AMDGPU-LABEL: define dso_local noundef <2 x i32> @_Z3f14v( // AMDGPU-SAME: ) local_unnamed_addr #[[ATTR1]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret <2 x i32> zeroinitializer // __device__ V2 f14() { return {}; } // AMDGCNSPIRV-LABEL: define spir_func noundef <3 x i32> @_Z3f15v( // AMDGCNSPIRV-SAME: ) local_unnamed_addr addrspace(4) #[[ATTR1]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret <3 x i32> zeroinitializer // // AMDGPU-LABEL: define dso_local noundef <3 x i32> @_Z3f15v( // AMDGPU-SAME: ) local_unnamed_addr #[[ATTR1]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret <3 x i32> zeroinitializer // __device__ V3 f15() { return {}; } // AMDGCNSPIRV-LABEL: define spir_func noundef <4 x i32> @_Z3f16v( // AMDGCNSPIRV-SAME: ) local_unnamed_addr addrspace(4) #[[ATTR1]] { // AMDGCNSPIRV-NEXT: [[ENTRY:.*:]] // AMDGCNSPIRV-NEXT: ret <4 x i32> zeroinitializer // // AMDGPU-LABEL: define dso_local noundef <4 x i32> @_Z3f16v( // AMDGPU-SAME: ) local_unnamed_addr #[[ATTR1]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: ret <4 x i32> zeroinitializer // __device__ V4 f16() { return {}; } //. // AMDGCNSPIRV: [[META9]] = !{i32 1024, i32 1, i32 1} //.