1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
|
//===- XeGPUFoldAliasOps.cpp - XeGPU alias ops folders ----------*- C++ -*-===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
#include "mlir/Dialect/XeGPU/Transforms/Passes.h"
#include "mlir/Dialect/Affine/ViewLikeInterfaceUtils.h"
#include "mlir/Dialect/MemRef/IR/MemRef.h"
#include "mlir/Dialect/XeGPU/IR/XeGPU.h"
#include "mlir/Dialect/XeGPU/Transforms/Transforms.h"
#include "mlir/Transforms/GreedyPatternRewriteDriver.h"
namespace mlir {
namespace xegpu {
#define GEN_PASS_DEF_XEGPUFOLDALIASOPS
#include "mlir/Dialect/XeGPU/Transforms/Passes.h.inc"
} // namespace xegpu
} // namespace mlir
#define DEBUG_TYPE "xegpu-fold-alias-ops"
#define DBGS() (llvm::dbgs() << "[" DEBUG_TYPE "]: ")
using namespace mlir;
namespace {

/// Rewrite pattern anchored on `xegpu::CreateNdDescOp` that folds a
/// `memref.subview` feeding an `xegpu.create_nd_tdesc` into the descriptor
/// operation itself.
///
/// The rewrite logic lives in the out-of-line `matchAndRewrite` definition.
struct XegpuCreateNdDescOpSubViewOpFolder final
    : OpRewritePattern<xegpu::CreateNdDescOp> {
  // Reuse the base-class constructors unchanged.
  using OpRewritePattern::OpRewritePattern;

  /// Attempts the fold on `descOp`; reports a match failure through
  /// `rewriter` when the pattern does not apply.
  LogicalResult matchAndRewrite(xegpu::CreateNdDescOp descOp,
                                PatternRewriter &rewriter) const override;
};

} // namespace
/// Folds a `memref::SubViewOp` producer into the `xegpu::CreateNdDescOp` that
/// consumes it.
///
/// The pattern applies only when the descriptor's source is defined by a
/// subview that reports unit strides. On success `descOp` is replaced by a new
/// `xegpu::CreateNdDescOp` with the same tensor descriptor type, built on the
/// subview's own source and using the offsets produced by
/// `affine::resolveIndicesIntoOpWithOffsetsAndStrides`.
///
/// \param descOp   The descriptor-creation op being examined.
/// \param rewriter Rewriter used to report match failures and to perform the
///                 replacement.
/// \returns `success()` if `descOp` was replaced, otherwise the failure
///          produced by `notifyMatchFailure`.
LogicalResult XegpuCreateNdDescOpSubViewOpFolder::matchAndRewrite(
    xegpu::CreateNdDescOp descOp, PatternRewriter &rewriter) const {
  // Guard 1: the descriptor must sit directly on top of a memref.subview.
  auto producer = descOp.getSource().getDefiningOp<memref::SubViewOp>();
  if (!producer)
    return rewriter.notifyMatchFailure(descOp, "not a subview producer");

  // Guard 2: subviews with non-unit strides are not folded by this pattern.
  if (!producer.hasUnitStride())
    return rewriter.notifyMatchFailure(descOp, "requires unit strides");

  // Gather the inputs describing how the subview indexes into its source and
  // how the descriptor indexes into the subview.
  auto viewOffsets = producer.getMixedOffsets();
  auto viewStrides = producer.getMixedStrides();
  auto droppedDims = producer.getDroppedDims();
  auto descOffsets = descOp.getMixedOffsets();

  // The affine utility fills `foldedOffsets`; it receives the rewriter and a
  // location, so it presumably may materialize index computations as new IR.
  SmallVector<Value> foldedOffsets;
  affine::resolveIndicesIntoOpWithOffsetsAndStrides(
      rewriter, descOp.getLoc(), viewOffsets, viewStrides, droppedDims,
      descOffsets, foldedOffsets);

  // Rebuild the descriptor on the subview's source, keeping the result type.
  auto descType = descOp.getTensorDesc().getType();
  auto baseMemref = producer.getSource();
  auto newOffsets = getAsOpFoldResult(foldedOffsets);
  rewriter.replaceOpWithNewOp<xegpu::CreateNdDescOp>(descOp, descType,
                                                     baseMemref, newOffsets);
  return success();
}
/// Adds the XeGPU alias-op folding patterns to `patterns`.
///
/// Currently this registers a single pattern,
/// `XegpuCreateNdDescOpSubViewOpFolder`, constructed with the context owned by
/// the pattern set.
///
/// \param patterns The pattern set to extend in place.
void xegpu::populateXeGPUFoldAliasOpsPatterns(RewritePatternSet &patterns) {
  MLIRContext *context = patterns.getContext();
  patterns.add<XegpuCreateNdDescOpSubViewOpFolder>(context);
}
namespace {

/// Pass wrapper around the XeGPU alias-op folding patterns.
///
/// Derives from the tablegen-generated `XeGPUFoldAliasOpsBase` and only
/// overrides `runOnOperation`, which is defined out of line.
struct XeGPUFoldAliasOpsPass final
    : xegpu::impl::XeGPUFoldAliasOpsBase<XeGPUFoldAliasOpsPass> {
  /// Entry point invoked by the pass manager.
  void runOnOperation() override;
};

} // namespace
void XeGPUFoldAliasOpsPass::runOnOperation() {
RewritePatternSet patterns(&getContext());
xegpu::populateXeGPUFoldAliasOpsPatterns(patterns);
(void)applyPatternsGreedily(getOperation(), std::move(patterns));
}
|