insert is soft deprecated, so remove all references so it's less likely to be used and can be easily removed in the future. Differential Revision: https://reviews.llvm.org/D120021
122 lines
4.8 KiB
C++
122 lines
4.8 KiB
C++
//===- TosaDecomposeDepthwise.cpp
|
|
//------------------------------------------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// Decompose TOSA Depthwise operation to a series of TOSA Ops specifically
|
|
// (1) Convert a 1x1 Depthwise to Reshape -> Mul -> Reshape -> Add
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "mlir/Dialect/Tosa/IR/TosaOps.h"
|
|
#include "mlir/Dialect/Tosa/Transforms/Passes.h"
|
|
#include "mlir/Pass/Pass.h"
|
|
|
|
using namespace mlir;
|
|
using namespace mlir::tosa;
|
|
|
|
namespace {
|
|
|
|
struct DepthwiseConv2DIsMul : public OpRewritePattern<tosa::DepthwiseConv2DOp> {
|
|
explicit DepthwiseConv2DIsMul(MLIRContext *context)
|
|
: OpRewritePattern(context) {}
|
|
|
|
LogicalResult matchAndRewrite(tosa::DepthwiseConv2DOp op,
|
|
PatternRewriter &rewriter) const override {
|
|
Value input = op.input();
|
|
Value weight = op.weight();
|
|
ShapedType inputType = input.getType().cast<ShapedType>();
|
|
ShapedType weightType = weight.getType().cast<ShapedType>();
|
|
ShapedType resultType = op.output().getType().cast<ShapedType>();
|
|
Type inputEType = inputType.getElementType();
|
|
|
|
if (!(inputType.hasStaticShape() && weightType.hasStaticShape() &&
|
|
resultType.hasStaticShape())) {
|
|
return failure();
|
|
}
|
|
|
|
// Quantization information needs to still be performed.
|
|
if (op.quantization_info() || !inputEType.isa<FloatType>()) {
|
|
return failure();
|
|
}
|
|
|
|
// Stride must be 1 for this optimization.
|
|
for (Attribute stride : op.stride().getValue()) {
|
|
if (!stride.cast<IntegerAttr>().getValue().isOne()) {
|
|
return failure();
|
|
}
|
|
}
|
|
|
|
// Only works for a 1x1 kernel.
|
|
ArrayRef<int64_t> weightShape = weightType.getShape();
|
|
if (weightShape[0] != 1 || weightShape[1] != 1) {
|
|
return failure();
|
|
}
|
|
|
|
// Reshape input to [N, H, W, C] -> [N, H, W, C, 1].
|
|
ArrayRef<int64_t> inputShape = inputType.getShape();
|
|
llvm::SmallVector<int64_t, 2> revisedInputShape{
|
|
inputShape[0], inputShape[1], inputShape[2], inputShape[3], 1};
|
|
auto revisedInputShapeType = RankedTensorType::get(
|
|
revisedInputShape,
|
|
input.getType().dyn_cast<RankedTensorType>().getElementType());
|
|
auto reshapedInput = rewriter
|
|
.create<tosa::ReshapeOp>(
|
|
op.getLoc(), revisedInputShapeType, input,
|
|
rewriter.getI64ArrayAttr(revisedInputShape))
|
|
.getResult();
|
|
|
|
// Reshape kernel to [KH, KW, C, M] -> [1, 1, 1, C, M].
|
|
llvm::SmallVector<int64_t, 2> revisedWeightShape{1, 1, 1, weightShape[2],
|
|
weightShape[3]};
|
|
auto revisedWeightShapeType = RankedTensorType::get(
|
|
revisedWeightShape,
|
|
weight.getType().dyn_cast<RankedTensorType>().getElementType());
|
|
auto reshapedWeight = rewriter
|
|
.create<tosa::ReshapeOp>(
|
|
op.getLoc(), revisedWeightShapeType, weight,
|
|
rewriter.getI64ArrayAttr(revisedWeightShape))
|
|
.getResult();
|
|
|
|
// Perform an elementwise mul over the reshaped input and weight.
|
|
llvm::SmallVector<int64_t, 2> mulShape{inputShape[0], inputShape[1],
|
|
inputShape[2], inputShape[3],
|
|
weightShape[3]};
|
|
auto mulShapeType = RankedTensorType::get(
|
|
mulShape,
|
|
weight.getType().dyn_cast<RankedTensorType>().getElementType());
|
|
Value mulValue =
|
|
rewriter
|
|
.create<tosa::MulOp>(op.getLoc(), mulShapeType, reshapedInput,
|
|
reshapedWeight, /*shift=*/0)
|
|
.getResult();
|
|
|
|
// Reshape output to [N, H, W, C * M].
|
|
auto outputShape = op.output().getType().cast<ShapedType>().getShape();
|
|
auto outputShapeType = RankedTensorType::get(
|
|
outputShape,
|
|
input.getType().dyn_cast<RankedTensorType>().getElementType());
|
|
auto outputValue =
|
|
rewriter.create<tosa::ReshapeOp>(op.getLoc(), outputShapeType, mulValue,
|
|
rewriter.getI64ArrayAttr(outputShape));
|
|
|
|
// Add in the bias.
|
|
rewriter
|
|
.replaceOpWithNewOp<tosa::AddOp>(op, outputShapeType, outputValue,
|
|
op.bias())
|
|
.getResult();
|
|
return success();
|
|
}
|
|
};
|
|
|
|
} // namespace
|
|
|
|
void mlir::tosa::populateTosaDecomposeDepthwise(MLIRContext *ctx,
|
|
RewritePatternSet &patterns) {
|
|
patterns.add<DepthwiseConv2DIsMul>(ctx);
|
|
}
|