// NOTE: Assertions have been autogenerated by utils/update_cc_test_checks.py UTC_ARGS: --version 5 // RUN: %clang_cc1 -triple nvptx64-nvidia-cuda -emit-llvm \ // RUN: -fvisibility=hidden -o - %s | FileCheck %s --check-prefix=NVPTX // RUN: %clang_cc1 -triple amdgcn-amd-amdhsa -emit-llvm \ // RUN: -fvisibility=hidden -o - %s | FileCheck %s --check-prefix=AMDGPU // NVPTX-LABEL: define hidden void @_Z1fPv( // NVPTX-SAME: ptr noundef [[P:%.*]]) #[[ATTR0:[0-9]+]] { // NVPTX-NEXT: [[ENTRY:.*:]] // NVPTX-NEXT: [[P_ADDR:%.*]] = alloca ptr, align 8 // NVPTX-NEXT: store ptr [[P]], ptr [[P_ADDR]], align 8 // NVPTX-NEXT: ret void // // AMDGPU-LABEL: define hidden void @_Z1fPv( // AMDGPU-SAME: ptr noundef [[P:%.*]]) #[[ATTR0:[0-9]+]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: [[P_ADDR:%.*]] = alloca ptr, align 8, addrspace(5) // AMDGPU-NEXT: [[P_ADDR_ASCAST:%.*]] = addrspacecast ptr addrspace(5) [[P_ADDR]] to ptr // AMDGPU-NEXT: store ptr [[P]], ptr [[P_ADDR_ASCAST]], align 8 // AMDGPU-NEXT: ret void // void f(void *p) {} // NVPTX-LABEL: define hidden void @_Z2p1Pv( // NVPTX-SAME: ptr noundef [[P:%.*]]) #[[ATTR0]] { // NVPTX-NEXT: [[ENTRY:.*:]] // NVPTX-NEXT: [[P_ADDR:%.*]] = alloca ptr, align 8 // NVPTX-NEXT: store ptr [[P]], ptr [[P_ADDR]], align 8 // NVPTX-NEXT: [[TMP0:%.*]] = load ptr, ptr [[P_ADDR]], align 8 // NVPTX-NEXT: call void @_Z1fPv(ptr noundef [[TMP0]]) #[[ATTR1:[0-9]+]] // NVPTX-NEXT: ret void // // AMDGPU-LABEL: define hidden void @_Z2p1Pv( // AMDGPU-SAME: ptr noundef [[P:%.*]]) #[[ATTR0]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: [[P_ADDR:%.*]] = alloca ptr, align 8, addrspace(5) // AMDGPU-NEXT: [[P_ADDR_ASCAST:%.*]] = addrspacecast ptr addrspace(5) [[P_ADDR]] to ptr // AMDGPU-NEXT: store ptr [[P]], ptr [[P_ADDR_ASCAST]], align 8 // AMDGPU-NEXT: [[TMP0:%.*]] = load ptr, ptr [[P_ADDR_ASCAST]], align 8 // AMDGPU-NEXT: call void @_Z1fPv(ptr noundef [[TMP0]]) #[[ATTR1:[0-9]+]] // AMDGPU-NEXT: ret void // void p1(void [[clang::address_space(0)]] * p) { f(p); } // NVPTX-LABEL: define hidden noundef ptr @_Z2p2PU3AS3v( // NVPTX-SAME: ptr addrspace(3) noundef [[P:%.*]]) #[[ATTR0]] { // NVPTX-NEXT: [[ENTRY:.*:]] // NVPTX-NEXT: [[P_ADDR:%.*]] = alloca ptr addrspace(3), align 8 // NVPTX-NEXT: store ptr addrspace(3) [[P]], ptr [[P_ADDR]], align 8 // NVPTX-NEXT: [[TMP0:%.*]] = load ptr addrspace(3), ptr [[P_ADDR]], align 8 // NVPTX-NEXT: [[TMP1:%.*]] = addrspacecast ptr addrspace(3) [[TMP0]] to ptr // NVPTX-NEXT: ret ptr [[TMP1]] // // AMDGPU-LABEL: define hidden noundef ptr @_Z2p2PU3AS3v( // AMDGPU-SAME: ptr addrspace(3) noundef [[P:%.*]]) #[[ATTR0]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: [[RETVAL:%.*]] = alloca ptr, align 8, addrspace(5) // AMDGPU-NEXT: [[P_ADDR:%.*]] = alloca ptr addrspace(3), align 4, addrspace(5) // AMDGPU-NEXT: [[RETVAL_ASCAST:%.*]] = addrspacecast ptr addrspace(5) [[RETVAL]] to ptr // AMDGPU-NEXT: [[P_ADDR_ASCAST:%.*]] = addrspacecast ptr addrspace(5) [[P_ADDR]] to ptr // AMDGPU-NEXT: store ptr addrspace(3) [[P]], ptr [[P_ADDR_ASCAST]], align 4 // AMDGPU-NEXT: [[TMP0:%.*]] = load ptr addrspace(3), ptr [[P_ADDR_ASCAST]], align 4 // AMDGPU-NEXT: [[TMP1:%.*]] = addrspacecast ptr addrspace(3) [[TMP0]] to ptr // AMDGPU-NEXT: ret ptr [[TMP1]] // void *p2(void [[clang::address_space(3)]] * p) { return p; } // NVPTX-LABEL: define hidden noundef ptr @_Z2p3PU3AS3v( // NVPTX-SAME: ptr addrspace(3) noundef [[P:%.*]]) #[[ATTR0]] { // NVPTX-NEXT: [[ENTRY:.*:]] // NVPTX-NEXT: [[P_ADDR:%.*]] = alloca ptr addrspace(3), align 8 // NVPTX-NEXT: store ptr addrspace(3) [[P]], ptr [[P_ADDR]], align 8 // NVPTX-NEXT: [[TMP0:%.*]] = load ptr addrspace(3), ptr [[P_ADDR]], align 8 // NVPTX-NEXT: [[TMP1:%.*]] = addrspacecast ptr addrspace(3) [[TMP0]] to ptr // NVPTX-NEXT: ret ptr [[TMP1]] // // AMDGPU-LABEL: define hidden noundef ptr @_Z2p3PU3AS3v( // AMDGPU-SAME: ptr addrspace(3) noundef [[P:%.*]]) #[[ATTR0]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: [[RETVAL:%.*]] = alloca ptr, align 8, addrspace(5) // AMDGPU-NEXT: [[P_ADDR:%.*]] = alloca ptr addrspace(3), align 4, addrspace(5) // AMDGPU-NEXT: [[RETVAL_ASCAST:%.*]] = addrspacecast ptr addrspace(5) [[RETVAL]] to ptr // AMDGPU-NEXT: [[P_ADDR_ASCAST:%.*]] = addrspacecast ptr addrspace(5) [[P_ADDR]] to ptr // AMDGPU-NEXT: store ptr addrspace(3) [[P]], ptr [[P_ADDR_ASCAST]], align 4 // AMDGPU-NEXT: [[TMP0:%.*]] = load ptr addrspace(3), ptr [[P_ADDR_ASCAST]], align 4 // AMDGPU-NEXT: [[TMP1:%.*]] = addrspacecast ptr addrspace(3) [[TMP0]] to ptr // AMDGPU-NEXT: ret ptr [[TMP1]] // void *p3(void [[clang::address_space(3)]] * p) { return p; } struct S { S() = default; ~S() = default; void foo() {} }; S s1; S [[clang::address_space(1)]] s2; S [[clang::address_space(3)]] s3; template void foo(Ty *) {} // NVPTX-LABEL: define hidden void @_Z2t1Pv( // NVPTX-SAME: ptr noundef [[P:%.*]]) #[[ATTR0]] { // NVPTX-NEXT: [[ENTRY:.*:]] // NVPTX-NEXT: [[P_ADDR:%.*]] = alloca ptr, align 8 // NVPTX-NEXT: store ptr [[P]], ptr [[P_ADDR]], align 8 // NVPTX-NEXT: [[TMP0:%.*]] = load ptr, ptr [[P_ADDR]], align 8 // NVPTX-NEXT: call void @_Z3fooIvEvPT_(ptr noundef [[TMP0]]) #[[ATTR1]] // NVPTX-NEXT: ret void // // AMDGPU-LABEL: define hidden void @_Z2t1Pv( // AMDGPU-SAME: ptr noundef [[P:%.*]]) #[[ATTR0]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: [[P_ADDR:%.*]] = alloca ptr, align 8, addrspace(5) // AMDGPU-NEXT: [[P_ADDR_ASCAST:%.*]] = addrspacecast ptr addrspace(5) [[P_ADDR]] to ptr // AMDGPU-NEXT: store ptr [[P]], ptr [[P_ADDR_ASCAST]], align 8 // AMDGPU-NEXT: [[TMP0:%.*]] = load ptr, ptr [[P_ADDR_ASCAST]], align 8 // AMDGPU-NEXT: call void @_Z3fooIvEvPT_(ptr noundef [[TMP0]]) #[[ATTR1]] // AMDGPU-NEXT: ret void // void t1(void *p) { foo(p); } // NVPTX-LABEL: define hidden void @_Z2t3PU3AS3v( // NVPTX-SAME: ptr addrspace(3) noundef [[P:%.*]]) #[[ATTR0]] { // NVPTX-NEXT: [[ENTRY:.*:]] // NVPTX-NEXT: [[P_ADDR:%.*]] = alloca ptr addrspace(3), align 8 // NVPTX-NEXT: store ptr addrspace(3) [[P]], ptr [[P_ADDR]], align 8 // NVPTX-NEXT: [[TMP0:%.*]] = load ptr addrspace(3), ptr [[P_ADDR]], align 8 // NVPTX-NEXT: call void @_Z3fooIU3AS3vEvPT_(ptr addrspace(3) noundef [[TMP0]]) #[[ATTR1]] // NVPTX-NEXT: ret void // // AMDGPU-LABEL: define hidden void @_Z2t3PU3AS3v( // AMDGPU-SAME: ptr addrspace(3) noundef [[P:%.*]]) #[[ATTR0]] { // AMDGPU-NEXT: [[ENTRY:.*:]] // AMDGPU-NEXT: [[P_ADDR:%.*]] = alloca ptr addrspace(3), align 4, addrspace(5) // AMDGPU-NEXT: [[P_ADDR_ASCAST:%.*]] = addrspacecast ptr addrspace(5) [[P_ADDR]] to ptr // AMDGPU-NEXT: store ptr addrspace(3) [[P]], ptr [[P_ADDR_ASCAST]], align 4 // AMDGPU-NEXT: [[TMP0:%.*]] = load ptr addrspace(3), ptr [[P_ADDR_ASCAST]], align 4 // AMDGPU-NEXT: call void @_Z3fooIU3AS3vEvPT_(ptr addrspace(3) noundef [[TMP0]]) #[[ATTR1]] // AMDGPU-NEXT: ret void // void t3(void [[clang::address_space(3)]] *p) { foo(p); }