1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82
|
//===- XeGPUFoldAliasOps.cpp - XeGPU alias ops folders ----------*- C++ -*-===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
#include "mlir/Dialect/XeGPU/Transforms/Passes.h"
#include "mlir/Dialect/Affine/ViewLikeInterfaceUtils.h"
#include "mlir/Dialect/MemRef/IR/MemRef.h"
#include "mlir/Dialect/XeGPU/IR/XeGPU.h"
#include "mlir/Dialect/XeGPU/Transforms/Transforms.h"
#include "mlir/Pass/Pass.h"
#include "mlir/Transforms/GreedyPatternRewriteDriver.h"
#include "llvm/Support/Debug.h"
namespace mlir {
namespace xegpu {
#define GEN_PASS_DEF_XEGPUFOLDALIASOPS
#include "mlir/Dialect/XeGPU/Transforms/Passes.h.inc"
} // namespace xegpu
} // namespace mlir
#define DEBUG_TYPE "xegpu-fold-alias-ops"
#define DBGS() (llvm::dbgs() << "[" DEBUG_TYPE "]: ")
using namespace mlir;
namespace {
/// Rewrite pattern that merges a `memref.subview` producer into the
/// `xegpu.create_nd_tdesc` operation consuming it. The rewrite logic lives in
/// the out-of-line definition of `matchAndRewrite`.
struct XegpuCreateNdDescOpSubViewOpFolder final
    : OpRewritePattern<xegpu::CreateNdDescOp> {
  // Inherit the base pattern constructors unchanged.
  using OpRewritePattern::OpRewritePattern;

  /// Attempts the fold on `descOp`; reports a match failure through
  /// `rewriter` when the pattern does not apply.
  LogicalResult matchAndRewrite(xegpu::CreateNdDescOp descOp,
                                PatternRewriter &rewriter) const override;
};
} // namespace
/// Replaces `descOp` with a new `xegpu.create_nd_tdesc` that reads directly
/// from the source of the `memref.subview` feeding it.
///
/// The pattern bails out (with a diagnostic match failure) when the
/// descriptor source is not produced by a `memref.subview`, or when that
/// subview does not have unit strides. Otherwise the subview's offsets,
/// strides and dropped dimensions are combined with the descriptor's own
/// offsets via `affine::resolveIndicesIntoOpWithOffsetsAndStrides`, and the
/// resulting offsets are used for the replacement op.
LogicalResult XegpuCreateNdDescOpSubViewOpFolder::matchAndRewrite(
    xegpu::CreateNdDescOp descOp, PatternRewriter &rewriter) const {
  memref::SubViewOp producer =
      descOp.getSource().getDefiningOp<memref::SubViewOp>();

  // Guard clauses: only subview producers with unit strides are handled.
  if (!producer)
    return rewriter.notifyMatchFailure(descOp, "not a subview producer");
  if (!producer.hasUnitStride())
    return rewriter.notifyMatchFailure(descOp, "requires unit strides");

  // Express the descriptor offsets relative to the subview's source.
  Location loc = descOp.getLoc();
  SmallVector<Value> foldedOffsets;
  affine::resolveIndicesIntoOpWithOffsetsAndStrides(
      rewriter, loc, producer.getMixedOffsets(), producer.getMixedStrides(),
      producer.getDroppedDims(), descOp.getMixedOffsets(), foldedOffsets);

  // The result type is preserved; only the source and offsets change.
  auto descType = descOp.getTensorDesc().getType();
  rewriter.replaceOpWithNewOp<xegpu::CreateNdDescOp>(
      descOp, descType, producer.getSource(),
      getAsOpFoldResult(foldedOffsets));
  return success();
}
/// Adds the XeGPU alias-op folding patterns to `patterns`. Currently this is
/// the single pattern that folds a subview into `xegpu.create_nd_tdesc`.
void xegpu::populateXeGPUFoldAliasOpsPatterns(RewritePatternSet &patterns) {
  MLIRContext *ctx = patterns.getContext();
  patterns.add<XegpuCreateNdDescOpSubViewOpFolder>(ctx);
}
namespace {
/// Pass wrapper around the XeGPU alias-op folding patterns. It derives from
/// the tablegen-generated `XeGPUFoldAliasOpsBase`; the work is done in the
/// out-of-line `runOnOperation`.
struct XeGPUFoldAliasOpsPass final
    : xegpu::impl::XeGPUFoldAliasOpsBase<XeGPUFoldAliasOpsPass> {
  /// Entry point invoked by the pass manager.
  void runOnOperation() override;
};
} // namespace
void XeGPUFoldAliasOpsPass::runOnOperation() {
RewritePatternSet patterns(&getContext());
xegpu::populateXeGPUFoldAliasOpsPatterns(patterns);
(void)applyPatternsAndFoldGreedily(getOperation(), std::move(patterns));
}
|