//===- TestAllReduceLowering.cpp - Test gpu.all_reduce lowering -----------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // // This file contains test passes for lowering the gpu.all_reduce op. // //===----------------------------------------------------------------------===// #include "mlir/Dialect/AMDGPU/IR/AMDGPUDialect.h" #include "mlir/Dialect/AMDGPU/Utils/Chipset.h" #include "mlir/Dialect/Arith/IR/Arith.h" #include "mlir/Dialect/Func/IR/FuncOps.h" #include "mlir/Dialect/GPU/Transforms/Passes.h" #include "mlir/Dialect/Index/IR/IndexDialect.h" #include "mlir/Dialect/LLVMIR/ROCDLDialect.h" #include "mlir/Dialect/MemRef/IR/MemRef.h" #include "mlir/Dialect/Vector/IR/VectorOps.h" #include "mlir/IR/PatternMatch.h" #include "mlir/Pass/Pass.h" #include "mlir/Transforms/GreedyPatternRewriteDriver.h" using namespace mlir; namespace { struct TestGpuRewritePass : public PassWrapper> { MLIR_DEFINE_EXPLICIT_INTERNAL_INLINE_TYPE_ID(TestGpuRewritePass) void getDependentDialects(DialectRegistry ®istry) const override { registry.insert(); } StringRef getArgument() const final { return "test-gpu-rewrite"; } StringRef getDescription() const final { return "Applies all rewrite patterns within the GPU dialect."; } void runOnOperation() override { RewritePatternSet patterns(&getContext()); populateGpuRewritePatterns(patterns); populateGpuSubgroupIdPatterns(patterns); (void)applyPatternsGreedily(getOperation(), std::move(patterns)); } }; struct TestGpuSubgroupReduceLoweringPass : public PassWrapper> { MLIR_DEFINE_EXPLICIT_INTERNAL_INLINE_TYPE_ID( TestGpuSubgroupReduceLoweringPass) TestGpuSubgroupReduceLoweringPass() = default; TestGpuSubgroupReduceLoweringPass( const TestGpuSubgroupReduceLoweringPass &pass) : PassWrapper(pass) {} void getDependentDialects(DialectRegistry ®istry) const override { registry .insert(); } StringRef getArgument() const final { return "test-gpu-subgroup-reduce-lowering"; } StringRef getDescription() const final { return "Applies gpu.subgroup_reduce lowering patterns."; } Option expandToShuffles{ *this, "expand-to-shuffles", llvm::cl::desc("Expand subgroup_reduce ops to shuffle ops."), llvm::cl::init(false)}; Option target{ *this, "target", llvm::cl::desc("Target backend name which will be used to provide " "compatible lowerings of subgroup reduce."), llvm::cl::init("")}; void runOnOperation() override { RewritePatternSet patterns(&getContext()); // Since both pattern sets match on the same ops, set higher benefit to // perform fewer failing matches. populateGpuBreakDownSubgroupReducePatterns(patterns, /*maxShuffleBitwidth=*/32, PatternBenefit(3)); if (expandToShuffles) { auto maybeChipset = amdgpu::Chipset::parse(target); if (succeeded(maybeChipset)) { populateGpuLowerSubgroupReduceToDPPPatterns( patterns, /*subgroupSize=*/64, *maybeChipset, PatternBenefit(2)); populateGpuLowerClusteredSubgroupReduceToDPPPatterns( patterns, /*subgroupSize=*/64, *maybeChipset, PatternBenefit(2)); } populateGpuLowerSubgroupReduceToShufflePatterns( patterns, /*subgroupSize=*/32, /*shuffleBitwidth=*/32); populateGpuLowerClusteredSubgroupReduceToShufflePatterns( patterns, /*subgroupSize=*/32, /*shuffleBitwidth=*/32); } (void)applyPatternsGreedily(getOperation(), std::move(patterns)); } }; } // namespace namespace mlir { void registerTestGpuLoweringPasses() { PassRegistration(); PassRegistration(); } } // namespace mlir