diff options
author | Joseph Huber <huberjn@outlook.com> | 2024-04-05 07:38:01 -0500 |
---|---|---|
committer | GitHub <noreply@github.com> | 2024-04-05 07:38:01 -0500 |
commit | 2650375b3beeb60596ca38e2e06685e48e8ed01f (patch) | |
tree | ee9ff1988f16993350d6af43b9e580666d3cc707 /llvm | |
parent | 3b961d113e6986eb9a6b448b72a730c289b8e6ab (diff) | |
download | llvm-2650375b3beeb60596ca38e2e06685e48e8ed01f.zip llvm-2650375b3beeb60596ca38e2e06685e48e8ed01f.tar.gz llvm-2650375b3beeb60596ca38e2e06685e48e8ed01f.tar.bz2 |
[OpenMP] Add amdgpu-num-work-groups attribute to OpenMP kernels (#87695)
Summary:
This new attribute was introduced recently. We already do this for NVPTX
kernels so we should apply this for AMDGPU as well. This patch simply
applies this metadata in cases where a lower bound is known.
Diffstat (limited to 'llvm')
-rw-r--r-- | llvm/lib/Frontend/OpenMP/OMPIRBuilder.cpp | 3 |
1 files changed, 3 insertions, 0 deletions
diff --git a/llvm/lib/Frontend/OpenMP/OMPIRBuilder.cpp b/llvm/lib/Frontend/OpenMP/OMPIRBuilder.cpp
index 16507a6..7fd8474 100644
--- a/llvm/lib/Frontend/OpenMP/OMPIRBuilder.cpp
+++ b/llvm/lib/Frontend/OpenMP/OMPIRBuilder.cpp
@@ -4791,6 +4791,9 @@ void OpenMPIRBuilder::writeTeamsForKernel(const Triple &T, Function &Kernel,
       updateNVPTXMetadata(Kernel, "maxclusterrank", UB, true);
     updateNVPTXMetadata(Kernel, "minctasm", LB, false);
   }
+  if (T.isAMDGPU())
+    Kernel.addFnAttr("amdgpu-max-num-workgroups", llvm::utostr(LB) + ",1,1");
+
   Kernel.addFnAttr("omp_target_num_teams", std::to_string(LB));
 }