[mlir][arith] Add support for extf, truncf to ArithToAPFloat (#169275)

Add support for `arith.extf` and `arith.truncf`. No support for custom
rounding modes yet.
This commit is contained in:
Matthias Springer 2025-11-25 09:09:26 +08:00 committed by GitHub
parent 2f8e712875
commit 78994706d8
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
4 changed files with 130 additions and 24 deletions

View File

@ -40,6 +40,29 @@ static FuncOp createFnDecl(OpBuilder &b, SymbolOpInterface symTable,
return funcOp;
}
/// Helper function to look up or create the symbol for a runtime library
/// function with the given parameter types. Always returns an int64_t.
static FailureOr<FuncOp>
lookupOrCreateApFloatFn(OpBuilder &b, SymbolOpInterface symTable,
StringRef name, TypeRange paramTypes,
SymbolTableCollection *symbolTables = nullptr) {
auto i64Type = IntegerType::get(symTable->getContext(), 64);
std::string funcName = (llvm::Twine("_mlir_apfloat_") + name).str();
auto funcT = FunctionType::get(b.getContext(), paramTypes, {i64Type});
FailureOr<FuncOp> func =
lookupFnDecl(symTable, funcName, funcT, symbolTables);
// Failed due to type mismatch.
if (failed(func))
return func;
// Successfully matched existing decl.
if (*func)
return *func;
return createFnDecl(b, symTable, funcName, funcT,
/*setPrivate=*/true, symbolTables);
}
/// Helper function to look up or create the symbol for a runtime library
/// function for a binary arithmetic operation.
///
@ -55,21 +78,14 @@ lookupOrCreateBinaryFn(OpBuilder &b, SymbolOpInterface symTable, StringRef name,
SymbolTableCollection *symbolTables = nullptr) {
auto i32Type = IntegerType::get(symTable->getContext(), 32);
auto i64Type = IntegerType::get(symTable->getContext(), 64);
return lookupOrCreateApFloatFn(b, symTable, name, {i32Type, i64Type, i64Type},
symbolTables);
}
std::string funcName = (llvm::Twine("_mlir_apfloat_") + name).str();
FunctionType funcT =
FunctionType::get(b.getContext(), {i32Type, i64Type, i64Type}, {i64Type});
FailureOr<FuncOp> func =
lookupFnDecl(symTable, funcName, funcT, symbolTables);
// Failed due to type mismatch.
if (failed(func))
return func;
// Successfully matched existing decl.
if (*func)
return *func;
return createFnDecl(b, symTable, funcName, funcT,
/*setPrivate=*/true, symbolTables);
static Value getSemanticsValue(OpBuilder &b, Location loc, FloatType floatTy) {
int32_t sem = llvm::APFloatBase::SemanticsToEnum(floatTy.getFloatSemantics());
return arith::ConstantOp::create(b, loc, b.getI32Type(),
b.getIntegerAttr(b.getI32Type(), sem));
}
/// Rewrite a binary arithmetic operation to an APFloat function call.
@ -104,11 +120,7 @@ struct BinaryArithOpToAPFloatConversion final : OpRewritePattern<OpTy> {
arith::BitcastOp::create(rewriter, loc, intWType, op.getRhs()));
// Call APFloat function.
int32_t sem =
llvm::APFloatBase::SemanticsToEnum(floatTy.getFloatSemantics());
Value semValue = arith::ConstantOp::create(
rewriter, loc, rewriter.getI32Type(),
rewriter.getIntegerAttr(rewriter.getI32Type(), sem));
Value semValue = getSemanticsValue(rewriter, loc, floatTy);
SmallVector<Value> params = {semValue, lhsBits, rhsBits};
auto resultOp =
func::CallOp::create(rewriter, loc, TypeRange(rewriter.getI64Type()),
@ -126,6 +138,53 @@ struct BinaryArithOpToAPFloatConversion final : OpRewritePattern<OpTy> {
const char *APFloatName;
};
template <typename OpTy>
struct FpToFpConversion final : OpRewritePattern<OpTy> {
FpToFpConversion(MLIRContext *context, SymbolOpInterface symTable,
PatternBenefit benefit = 1)
: OpRewritePattern<OpTy>(context, benefit), symTable(symTable) {}
LogicalResult matchAndRewrite(OpTy op,
PatternRewriter &rewriter) const override {
// Get APFloat function from runtime library.
auto i32Type = IntegerType::get(symTable->getContext(), 32);
auto i64Type = IntegerType::get(symTable->getContext(), 64);
FailureOr<FuncOp> fn = lookupOrCreateApFloatFn(
rewriter, symTable, "convert", {i32Type, i32Type, i64Type});
if (failed(fn))
return fn;
rewriter.setInsertionPoint(op);
// Cast operands to 64-bit integers.
Location loc = op.getLoc();
auto inFloatTy = cast<FloatType>(op.getOperand().getType());
auto inIntWType = rewriter.getIntegerType(inFloatTy.getWidth());
auto int64Type = rewriter.getI64Type();
Value operandBits = arith::ExtUIOp::create(
rewriter, loc, int64Type,
arith::BitcastOp::create(rewriter, loc, inIntWType, op.getOperand()));
// Call APFloat function.
Value inSemValue = getSemanticsValue(rewriter, loc, inFloatTy);
auto outFloatTy = cast<FloatType>(op.getType());
Value outSemValue = getSemanticsValue(rewriter, loc, outFloatTy);
std::array<Value, 3> params = {inSemValue, outSemValue, operandBits};
auto resultOp =
func::CallOp::create(rewriter, loc, TypeRange(rewriter.getI64Type()),
SymbolRefAttr::get(*fn), params);
// Truncate result to the original width.
auto outIntWType = rewriter.getIntegerType(outFloatTy.getWidth());
Value truncatedBits = arith::TruncIOp::create(rewriter, loc, outIntWType,
resultOp->getResult(0));
rewriter.replaceOp(
op, arith::BitcastOp::create(rewriter, loc, outFloatTy, truncatedBits));
return success();
}
SymbolOpInterface symTable;
};
namespace {
struct ArithToAPFloatConversionPass final
: impl::ArithToAPFloatConversionPassBase<ArithToAPFloatConversionPass> {
@ -147,6 +206,9 @@ void ArithToAPFloatConversionPass::runOnOperation() {
context, "divide", getOperation());
patterns.add<BinaryArithOpToAPFloatConversion<arith::RemFOp>>(
context, "remainder", getOperation());
patterns
.add<FpToFpConversion<arith::ExtFOp>, FpToFpConversion<arith::TruncFOp>>(
context, getOperation());
LogicalResult result = success();
ScopedDiagnosticHandler scopedHandler(context, [&result](Diagnostic &diag) {
if (diag.getSeverity() == DiagnosticSeverity::Error) {

View File

@ -51,7 +51,7 @@
/// Binary operations with rounding mode.
#define APFLOAT_BINARY_OP_ROUNDING_MODE(OP, ROUNDING_MODE) \
MLIR_APFLOAT_WRAPPERS_EXPORT int64_t _mlir_apfloat_##OP( \
MLIR_APFLOAT_WRAPPERS_EXPORT uint64_t _mlir_apfloat_##OP( \
int32_t semantics, uint64_t a, uint64_t b) { \
const llvm::fltSemantics &sem = llvm::APFloatBase::EnumToSemantics( \
static_cast<llvm::APFloatBase::Semantics>(semantics)); \
@ -86,4 +86,19 @@ MLIR_APFLOAT_WRAPPERS_EXPORT void printApFloat(int32_t semantics, uint64_t a) {
double d = x.convertToDouble();
fprintf(stdout, "%lg", d);
}
MLIR_APFLOAT_WRAPPERS_EXPORT uint64_t
_mlir_apfloat_convert(int32_t inSemantics, int32_t outSemantics, uint64_t a) {
const llvm::fltSemantics &inSem = llvm::APFloatBase::EnumToSemantics(
static_cast<llvm::APFloatBase::Semantics>(inSemantics));
const llvm::fltSemantics &outSem = llvm::APFloatBase::EnumToSemantics(
static_cast<llvm::APFloatBase::Semantics>(outSemantics));
unsigned bitWidthIn = llvm::APFloatBase::semanticsSizeInBits(inSem);
llvm::APFloat val(inSem, llvm::APInt(bitWidthIn, a));
// TODO: Custom rounding modes are not supported yet.
bool losesInfo;
val.convert(outSem, llvm::RoundingMode::NearestTiesToEven, &losesInfo);
llvm::APInt result = val.bitcastToAPInt();
return result.getZExtValue();
}
}

View File

@ -126,3 +126,25 @@ func.func @remf(%arg0: f4E2M1FN, %arg1: f4E2M1FN) {
%0 = arith.remf %arg0, %arg1 : f4E2M1FN
return
}
// -----
// CHECK: func.func private @_mlir_apfloat_convert(i32, i32, i64) -> i64
// CHECK: %[[sem_in:.*]] = arith.constant 18 : i32
// CHECK: %[[sem_out:.*]] = arith.constant 2 : i32
// CHECK: call @_mlir_apfloat_convert(%[[sem_in]], %[[sem_out]], %{{.*}}) : (i32, i32, i64) -> i64
func.func @extf(%arg0: f4E2M1FN) {
%0 = arith.extf %arg0 : f4E2M1FN to f32
return
}
// -----
// CHECK: func.func private @_mlir_apfloat_convert(i32, i32, i64) -> i64
// CHECK: %[[sem_in:.*]] = arith.constant 1 : i32
// CHECK: %[[sem_out:.*]] = arith.constant 18 : i32
// CHECK: call @_mlir_apfloat_convert(%[[sem_in]], %[[sem_out]], %{{.*}}) : (i32, i32, i64) -> i64
func.func @truncf(%arg0: bf16) {
%0 = arith.truncf %arg0 : bf16 to f4E2M1FN
return
}

View File

@ -27,14 +27,21 @@ func.func @entry() {
%a1 = arith.constant 1.4 : f8E4M3FN
%a2 = arith.constant 1.4 : f32
%b1, %b2 = func.call @foo() : () -> (f8E4M3FN, f32)
%c1 = arith.addf %a1, %b1 : f8E4M3FN // not supported by LLVM
%c2 = arith.addf %a2, %b2 : f32 // supported by LLVM
// CHECK: 3.5
// CHECK: 2.2
vector.print %b2 : f32
// CHECK-NEXT: 3.5
%c1 = arith.addf %a1, %b1 : f8E4M3FN // not supported by LLVM
vector.print %c1 : f8E4M3FN
// CHECK: 3.6
// CHECK-NEXT: 3.6
%c2 = arith.addf %a2, %b2 : f32 // supported by LLVM
vector.print %c2 : f32
// CHECK-NEXT: 2.25
%cvt = arith.truncf %b2 : f32 to f8E4M3FN
vector.print %cvt : f8E4M3FN
return
}