Files
llvm-project/mlir/lib/Dialect/Math/Transforms/SincosFusion.cpp
yebinchon 495e1a4257 [mlir] added a check in the walk to prevent catching a cos in a nested region (#190064)
The walk in SincosFusion may detect a cos within a nested region of the
sin block. This triggers an assertion in `isBeforeInBlock` later on.
Added a check within the walk so it filters operations in nested
regions, which are not in the same block and should not be fused anyway.

---------

Co-authored-by: Yebin Chon <ychon@nvidia.com>
2026-04-01 20:10:56 -07:00

79 lines
2.5 KiB
C++

//===- SincosFusion.cpp - Fuse sin/cos into sincos -----------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
#include "mlir/Dialect/Math/IR/Math.h"
#include "mlir/Dialect/Math/Transforms/Passes.h"
#include "mlir/IR/PatternMatch.h"
#include "mlir/Transforms/GreedyPatternRewriteDriver.h"
using namespace mlir;
using namespace mlir::math;
namespace {
/// Fuse a math.sin and math.cos in the same block that use the same operand and
/// have identical fastmath flags into a single math.sincos.
struct SincosFusionPattern : OpRewritePattern<math::SinOp> {
using Base::Base;
LogicalResult matchAndRewrite(math::SinOp sinOp,
PatternRewriter &rewriter) const override {
Value operand = sinOp.getOperand();
mlir::arith::FastMathFlags sinFastMathFlags = sinOp.getFastmath();
math::CosOp cosOp = nullptr;
for (auto op : sinOp->getBlock()->getOps<math::CosOp>())
if (op.getOperand() == operand && op.getFastmath() == sinFastMathFlags) {
cosOp = op;
break;
}
if (!cosOp)
return failure();
Operation *firstOp = sinOp->isBeforeInBlock(cosOp) ? sinOp.getOperation()
: cosOp.getOperation();
rewriter.setInsertionPoint(firstOp);
Type elemType = sinOp.getType();
auto sincos = math::SincosOp::create(rewriter, firstOp->getLoc(),
TypeRange{elemType, elemType}, operand,
sinOp.getFastmathAttr());
rewriter.replaceOp(sinOp, sincos.getSin());
rewriter.replaceOp(cosOp, sincos.getCos());
return success();
}
};
} // namespace
namespace mlir::math {
#define GEN_PASS_DEF_MATHSINCOSFUSIONPASS
#include "mlir/Dialect/Math/Transforms/Passes.h.inc"
} // namespace mlir::math
namespace {
struct MathSincosFusionPass final
: math::impl::MathSincosFusionPassBase<MathSincosFusionPass> {
using MathSincosFusionPassBase::MathSincosFusionPassBase;
void runOnOperation() override {
RewritePatternSet patterns(&getContext());
patterns.add<SincosFusionPattern>(&getContext());
GreedyRewriteConfig config;
if (failed(
applyPatternsGreedily(getOperation(), std::move(patterns), config)))
return signalPassFailure();
}
};
} // namespace