We see performance improvements from using sincos to reuse calculations in hot loops that compute sin() and cos() of the same operand. Add a pass to identify sin() and cos() calls in the same block with the same operand and fast-math flags, and fuse them into a sincos op. Follow-up to: * #160561 * #160772
81 lines
2.6 KiB
C++
81 lines
2.6 KiB
C++
//===- SincosFusion.cpp - Fuse sin/cos into sincos -----------------------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "mlir/Dialect/Math/IR/Math.h"
|
|
#include "mlir/Dialect/Math/Transforms/Passes.h"
|
|
#include "mlir/IR/PatternMatch.h"
|
|
#include "mlir/Transforms/GreedyPatternRewriteDriver.h"
|
|
|
|
using namespace mlir;
|
|
using namespace mlir::math;
|
|
|
|
namespace {
|
|
|
|
/// Fuse a math.sin and math.cos in the same block that use the same operand and
|
|
/// have identical fastmath flags into a single math.sincos.
|
|
struct SincosFusionPattern : OpRewritePattern<math::SinOp> {
|
|
using Base::Base;
|
|
|
|
LogicalResult matchAndRewrite(math::SinOp sinOp,
|
|
PatternRewriter &rewriter) const override {
|
|
Value operand = sinOp.getOperand();
|
|
mlir::arith::FastMathFlags sinFastMathFlags = sinOp.getFastmath();
|
|
|
|
math::CosOp cosOp = nullptr;
|
|
sinOp->getBlock()->walk([&](math::CosOp op) {
|
|
if (op.getOperand() == operand && op.getFastmath() == sinFastMathFlags) {
|
|
cosOp = op;
|
|
return WalkResult::interrupt();
|
|
}
|
|
return WalkResult::advance();
|
|
});
|
|
|
|
if (!cosOp)
|
|
return failure();
|
|
|
|
Operation *firstOp = sinOp->isBeforeInBlock(cosOp) ? sinOp.getOperation()
|
|
: cosOp.getOperation();
|
|
rewriter.setInsertionPoint(firstOp);
|
|
|
|
Type elemType = sinOp.getType();
|
|
auto sincos = math::SincosOp::create(rewriter, firstOp->getLoc(),
|
|
TypeRange{elemType, elemType}, operand,
|
|
sinOp.getFastmathAttr());
|
|
|
|
rewriter.replaceOp(sinOp, sincos.getSin());
|
|
rewriter.replaceOp(cosOp, sincos.getCos());
|
|
return success();
|
|
}
|
|
};
|
|
|
|
} // namespace
|
|
|
|
namespace mlir::math {
|
|
#define GEN_PASS_DEF_MATHSINCOSFUSIONPASS
|
|
#include "mlir/Dialect/Math/Transforms/Passes.h.inc"
|
|
} // namespace mlir::math
|
|
|
|
namespace {
|
|
|
|
struct MathSincosFusionPass final
|
|
: math::impl::MathSincosFusionPassBase<MathSincosFusionPass> {
|
|
using MathSincosFusionPassBase::MathSincosFusionPassBase;
|
|
|
|
void runOnOperation() override {
|
|
RewritePatternSet patterns(&getContext());
|
|
patterns.add<SincosFusionPattern>(&getContext());
|
|
|
|
GreedyRewriteConfig config;
|
|
if (failed(
|
|
applyPatternsGreedily(getOperation(), std::move(patterns), config)))
|
|
return signalPassFailure();
|
|
}
|
|
};
|
|
|
|
} // namespace
|