aboutsummaryrefslogtreecommitdiff
path: root/mlir/test/Conversion
diff options
context:
space:
mode:
authorGiuseppe Rossini <giuseppe.rossini@amd.com>2024-09-03 17:47:08 +0100
committerGitHub <noreply@github.com>2024-09-03 17:47:08 +0100
commita8e1c6f99abc273677afed5eaaeee2c0296db59f (patch)
tree5903e0a58aafaa3b867953f424866599a6580e47 /mlir/test/Conversion
parent0b2f2537a5b717539b200bd7fa31cbc24679e96f (diff)
downloadllvm-a8e1c6f99abc273677afed5eaaeee2c0296db59f.zip
llvm-a8e1c6f99abc273677afed5eaaeee2c0296db59f.tar.gz
llvm-a8e1c6f99abc273677afed5eaaeee2c0296db59f.tar.bz2
[MLIR][AMDGPU] Add support for fp8 ops on gfx12 (#106388)
This PR is adding support for `fp8` and `bfp8` on gfx12
Diffstat (limited to 'mlir/test/Conversion')
-rw-r--r--mlir/test/Conversion/AMDGPUToROCDL/wmma-gfx12.mlir9
1 files changed, 9 insertions, 0 deletions
diff --git a/mlir/test/Conversion/AMDGPUToROCDL/wmma-gfx12.mlir b/mlir/test/Conversion/AMDGPUToROCDL/wmma-gfx12.mlir
new file mode 100644
index 0000000..7b2b524
--- /dev/null
+++ b/mlir/test/Conversion/AMDGPUToROCDL/wmma-gfx12.mlir
@@ -0,0 +1,9 @@
+// RUN: mlir-opt %s -convert-amdgpu-to-rocdl=chipset=gfx1200 --allow-unregistered-dialect | FileCheck %s
+func.func @mfma_to_rocdl(%arg0 : vector<8xf8E4M3FN>, %arg1 : vector<8xf8E5M2>, %arg2 : vector<8xf32>) {
+ // CHECK: rocdl.wmma.f32.16x16x16.fp8{{.*}}: (vector<2xi32>, vector<2xi32>, vector<8xf32>) -> vector<8xf32>
+ amdgpu.wmma %arg0 * %arg0 + %arg2: vector<8xf8E4M3FN>, vector<8xf8E4M3FN>, vector<8xf32>
+
+ // CHECK: rocdl.wmma.f32.16x16x16.bf8{{.*}}: (vector<2xi32>, vector<2xi32>, vector<8xf32>) -> vector<8xf32>
+ amdgpu.wmma %arg1 * %arg1 + %arg2: vector<8xf8E5M2>, vector<8xf8E5M2>, vector<8xf32>
+ func.return
+}