diff options
author | Kun Wu <kunww@google.com> | 2023-06-01 17:46:08 +0000 |
---|---|---|
committer | Kun Wu <kunww@google.com> | 2023-06-01 17:52:58 +0000 |
commit | be6c5320059fcc6a86c775108ff440f7e53f84b6 (patch) | |
tree | 4b000617dd35b1c7a8204fd410cb49b756d0e91e | |
parent | b092f417db211b5316b2222c29bc651eaaa86ce1 (diff) | |
download | llvm-be6c5320059fcc6a86c775108ff440f7e53f84b6.zip llvm-be6c5320059fcc6a86c775108ff440f7e53f84b6.tar.gz llvm-be6c5320059fcc6a86c775108ff440f7e53f84b6.tar.bz2 |
[mlir][sparse][gpu] fixing broken literal names in cuda runner macros
Differential Revision: https://reviews.llvm.org/D151910
-rw-r--r-- | mlir/lib/ExecutionEngine/CudaRuntimeWrappers.cpp | 13 |
1 files changed, 6 insertions, 7 deletions
diff --git a/mlir/lib/ExecutionEngine/CudaRuntimeWrappers.cpp b/mlir/lib/ExecutionEngine/CudaRuntimeWrappers.cpp index c7367a8..17be418 100644 --- a/mlir/lib/ExecutionEngine/CudaRuntimeWrappers.cpp +++ b/mlir/lib/ExecutionEngine/CudaRuntimeWrappers.cpp @@ -232,10 +232,10 @@ extern "C" MLIR_CUDA_WRAPPERS_EXPORT void mgpuSetDefaultDevice(int32_t device) { // Some macro magic to get float/double alpha and beta on host. #define ALPHABETA(dtp, alpha, beta) \ - __nv_bfloat16(alpha##bf16) = 1.0f; \ - __nv_bfloat16(beta##bf16) = 1.0f; \ - __half(alpha##f16) = 1.0f; \ - __half(beta##f16) = 1.0f; \ + __nv_bfloat16(alpha##16bf) = 1.0f; \ + __nv_bfloat16(beta##16bf) = 1.0f; \ + __half(alpha##16f) = 1.0f; \ + __half(beta##16f) = 1.0f; \ float(alpha##f) = 1.0f; \ float(beta##f) = 1.0f; \ double(alpha##d) = 1.0; \ @@ -251,11 +251,9 @@ extern "C" MLIR_CUDA_WRAPPERS_EXPORT void mgpuSetDefaultDevice(int32_t device) { } else if (dtp == CUDA_R_32F || dtp == CUDA_C_32F) { \ (alpha##p) = reinterpret_cast<void *>(&(alpha##f)); \ (beta##p) = reinterpret_cast<void *>(&(beta##f)); \ - } else if (dtp == CUDA_R_64F || dtp == CUDA_C_64F) { \ + } else { \ (alpha##p) = reinterpret_cast<void *>(&(alpha##d)); \ (beta##p) = reinterpret_cast<void *>(&(beta##d)); \ - } else { \ - llvm_unreachable("Unsupported data type"); \ } extern "C" MLIR_CUDA_WRAPPERS_EXPORT void * @@ -321,6 +319,7 @@ mgpuCreateCsr(intptr_t rows, intptr_t cols, intptr_t nnz, void *rowPos, cusparseSpMatDescr_t mat = nullptr; auto pTp = static_cast<cusparseIndexType_t>(ptp); auto iTp = static_cast<cusparseIndexType_t>(itp); + auto dTp = static_cast<cudaDataType_t>(dtp); CUSPARSE_REPORT_IF_ERROR(cusparseCreateCsr(&mat, rows, cols, nnz, rowPos, colIdxs, values, pTp, iTp, CUSPARSE_INDEX_BASE_ZERO, dtp)) |