Conversion/MathToLibm/MathToLibm.cpp

34810e1bSTres Popp//===-- MathToLibm.cpp - conversion from Math to libm calls ---------------===//
34810e1bSTres Popp//
34810e1bSTres Popp// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
34810e1bSTres Popp// See https://llvm.org/LICENSE.txt for license information.
34810e1bSTres Popp// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
34810e1bSTres Popp//
34810e1bSTres Popp//===----------------------------------------------------------------------===//
34810e1bSTres Popp
34810e1bSTres Popp#include "mlir/Conversion/MathToLibm/MathToLibm.h"
34810e1bSTres Popp
abc362a1SJakub Kuderski#include "mlir/Dialect/Arith/IR/Arith.h"
23aa5a74SRiver Riddle#include "mlir/Dialect/Func/IR/FuncOps.h"
9c442c7dSSlava Zakharin#include "mlir/Dialect/LLVMIR/LLVMDialect.h"
34810e1bSTres Popp#include "mlir/Dialect/Math/IR/Math.h"
99ef9eebSMatthias Springer#include "mlir/Dialect/Utils/IndexingUtils.h"
99ef9eebSMatthias Springer#include "mlir/Dialect/Vector/IR/VectorOps.h"
34810e1bSTres Popp#include "mlir/IR/BuiltinDialect.h"
34810e1bSTres Popp#include "mlir/IR/PatternMatch.h"
67d0d7acSMichele Scuttari#include "mlir/Pass/Pass.h"
8a9d4895SAlexander Belyaev#include "mlir/Transforms/DialectConversion.h"
67d0d7acSMichele Scuttari
67d0d7acSMichele Scuttarinamespace mlir {
67d0d7acSMichele Scuttari#define GEN_PASS_DEF_CONVERTMATHTOLIBM
67d0d7acSMichele Scuttari#include "mlir/Conversion/Passes.h.inc"
67d0d7acSMichele Scuttari} // namespace mlir
34810e1bSTres Popp
34810e1bSTres Poppusing namespace mlir;
34810e1bSTres Popp
34810e1bSTres Poppnamespace {
34810e1bSTres Popp// Pattern to convert vector operations to scalar operations. This is needed as
34810e1bSTres Popp// libm calls require scalars.
34810e1bSTres Popptemplate <typename Op>
34810e1bSTres Poppstruct VecOpToScalarOp : public OpRewritePattern<Op> {
34810e1bSTres Popppublic:
34810e1bSTres Popp  using OpRewritePattern<Op>::OpRewritePattern;
34810e1bSTres Popp
34810e1bSTres Popp  LogicalResult matchAndRewrite(Op op, PatternRewriter &rewriter) const final;
34810e1bSTres Popp};
a48adc56SBenjamin Kramer// Pattern to promote an op of a smaller floating point type to F32.
a48adc56SBenjamin Kramertemplate <typename Op>
a48adc56SBenjamin Kramerstruct PromoteOpToF32 : public OpRewritePattern<Op> {
a48adc56SBenjamin Kramerpublic:
a48adc56SBenjamin Kramer  using OpRewritePattern<Op>::OpRewritePattern;
a48adc56SBenjamin Kramer
a48adc56SBenjamin Kramer  LogicalResult matchAndRewrite(Op op, PatternRewriter &rewriter) const final;
a48adc56SBenjamin Kramer};
34810e1bSTres Popp// Pattern to convert scalar math operations to calls to libm functions.
34810e1bSTres Popp// Additionally the libm function signatures are declared.
34810e1bSTres Popptemplate <typename Op>
34810e1bSTres Poppstruct ScalarOpToLibmCall : public OpRewritePattern<Op> {
34810e1bSTres Popppublic:
34810e1bSTres Popp  using OpRewritePattern<Op>::OpRewritePattern;
a4ee55feSAlexander Batashev  ScalarOpToLibmCall(MLIRContext *context, StringRef floatFunc,
8a9d4895SAlexander Belyaev                     StringRef doubleFunc)
8a9d4895SAlexander Belyaev      : OpRewritePattern<Op>(context), floatFunc(floatFunc),
34810e1bSTres Popp        doubleFunc(doubleFunc){};
34810e1bSTres Popp
34810e1bSTres Popp  LogicalResult matchAndRewrite(Op op, PatternRewriter &rewriter) const final;
34810e1bSTres Popp
34810e1bSTres Poppprivate:
34810e1bSTres Popp  std::string floatFunc, doubleFunc;
34810e1bSTres Popp};
3bf1f0e7SAlexander Belyaev
3bf1f0e7SAlexander Belyaevtemplate <typename OpTy>
3bf1f0e7SAlexander Belyaevvoid populatePatternsForOp(RewritePatternSet &patterns, MLIRContext *ctx,
3bf1f0e7SAlexander Belyaev                           StringRef floatFunc, StringRef doubleFunc) {
3bf1f0e7SAlexander Belyaev  patterns.add<VecOpToScalarOp<OpTy>, PromoteOpToF32<OpTy>>(ctx);
3bf1f0e7SAlexander Belyaev  patterns.add<ScalarOpToLibmCall<OpTy>>(ctx, floatFunc, doubleFunc);
3bf1f0e7SAlexander Belyaev}
3bf1f0e7SAlexander Belyaev
34810e1bSTres Popp} // namespace
34810e1bSTres Popp
34810e1bSTres Popptemplate <typename Op>
34810e1bSTres PoppLogicalResult
34810e1bSTres PoppVecOpToScalarOp<Op>::matchAndRewrite(Op op, PatternRewriter &rewriter) const {
34810e1bSTres Popp  auto opType = op.getType();
34810e1bSTres Popp  auto loc = op.getLoc();
5550c821STres Popp  auto vecType = dyn_cast<VectorType>(opType);
34810e1bSTres Popp
34810e1bSTres Popp  if (!vecType)
34810e1bSTres Popp    return failure();
34810e1bSTres Popp  if (!vecType.hasRank())
34810e1bSTres Popp    return failure();
34810e1bSTres Popp  auto shape = vecType.getShape();
921d91f3SAdrian Kuegel  int64_t numElements = vecType.getNumElements();
34810e1bSTres Popp
a54f4eaeSMogball  Value result = rewriter.create<arith::ConstantOp>(
34810e1bSTres Popp      loc, DenseElementsAttr::get(
34810e1bSTres Popp               vecType, FloatAttr::get(vecType.getElementType(), 0.0)));
7a69a9d7SNicolas Vasilache  SmallVector<int64_t> strides = computeStrides(shape);
921d91f3SAdrian Kuegel  for (auto linearIndex = 0; linearIndex < numElements; ++linearIndex) {
203fad47SNicolas Vasilache    SmallVector<int64_t> positions = delinearize(linearIndex, strides);
34810e1bSTres Popp    SmallVector<Value> operands;
34810e1bSTres Popp    for (auto input : op->getOperands())
34810e1bSTres Popp      operands.push_back(
921d91f3SAdrian Kuegel          rewriter.create<vector::ExtractOp>(loc, input, positions));
34810e1bSTres Popp    Value scalarOp =
34810e1bSTres Popp        rewriter.create<Op>(loc, vecType.getElementType(), operands);
921d91f3SAdrian Kuegel    result =
921d91f3SAdrian Kuegel        rewriter.create<vector::InsertOp>(loc, scalarOp, result, positions);
34810e1bSTres Popp  }
34810e1bSTres Popp  rewriter.replaceOp(op, {result});
34810e1bSTres Popp  return success();
34810e1bSTres Popp}
34810e1bSTres Popp
34810e1bSTres Popptemplate <typename Op>
34810e1bSTres PoppLogicalResult
a48adc56SBenjamin KramerPromoteOpToF32<Op>::matchAndRewrite(Op op, PatternRewriter &rewriter) const {
a48adc56SBenjamin Kramer  auto opType = op.getType();
5550c821STres Popp  if (!isa<Float16Type, BFloat16Type>(opType))
a48adc56SBenjamin Kramer    return failure();
a48adc56SBenjamin Kramer
a48adc56SBenjamin Kramer  auto loc = op.getLoc();
a48adc56SBenjamin Kramer  auto f32 = rewriter.getF32Type();
a48adc56SBenjamin Kramer  auto extendedOperands = llvm::to_vector(
a48adc56SBenjamin Kramer      llvm::map_range(op->getOperands(), [&](Value operand) -> Value {
a48adc56SBenjamin Kramer        return rewriter.create<arith::ExtFOp>(loc, f32, operand);
a48adc56SBenjamin Kramer      }));
a48adc56SBenjamin Kramer  auto newOp = rewriter.create<Op>(loc, f32, extendedOperands);
a48adc56SBenjamin Kramer  rewriter.replaceOpWithNewOp<arith::TruncFOp>(op, opType, newOp);
a48adc56SBenjamin Kramer  return success();
a48adc56SBenjamin Kramer}
a48adc56SBenjamin Kramer
a48adc56SBenjamin Kramertemplate <typename Op>
a48adc56SBenjamin KramerLogicalResult
34810e1bSTres PoppScalarOpToLibmCall<Op>::matchAndRewrite(Op op,
34810e1bSTres Popp                                        PatternRewriter &rewriter) const {
1ebf7ce9STres Popp  auto module = SymbolTable::getNearestSymbolTable(op);
34810e1bSTres Popp  auto type = op.getType();
5550c821STres Popp  if (!isa<Float32Type, Float64Type>(type))
34810e1bSTres Popp    return failure();
34810e1bSTres Popp
34810e1bSTres Popp  auto name = type.getIntOrFloatBitWidth() == 64 ? doubleFunc : floatFunc;
1ebf7ce9STres Popp  auto opFunc = dyn_cast_or_null<SymbolOpInterface>(
1ebf7ce9STres Popp      SymbolTable::lookupSymbolIn(module, name));
34810e1bSTres Popp  // Forward declare function if it hasn't already been
34810e1bSTres Popp  if (!opFunc) {
34810e1bSTres Popp    OpBuilder::InsertionGuard guard(rewriter);
1ebf7ce9STres Popp    rewriter.setInsertionPointToStart(&module->getRegion(0).front());
34810e1bSTres Popp    auto opFunctionTy = FunctionType::get(
34810e1bSTres Popp        rewriter.getContext(), op->getOperandTypes(), op->getResultTypes());
58ceae95SRiver Riddle    opFunc = rewriter.create<func::FuncOp>(rewriter.getUnknownLoc(), name,
58ceae95SRiver Riddle                                           opFunctionTy);
34810e1bSTres Popp    opFunc.setPrivate();
9c442c7dSSlava Zakharin
9c442c7dSSlava Zakharin    // By definition Math dialect operations imply LLVM's "readnone"
9c442c7dSSlava Zakharin    // function attribute, so we can set it here to provide more
9c442c7dSSlava Zakharin    // optimization opportunities (e.g. LICM) for backends targeting LLVM IR.
9c442c7dSSlava Zakharin    // This will have to be changed, when strict FP behavior is supported
9c442c7dSSlava Zakharin    // by Math dialect.
9c442c7dSSlava Zakharin    opFunc->setAttr(LLVM::LLVMDialect::getReadnoneAttrName(),
9c442c7dSSlava Zakharin                    UnitAttr::get(rewriter.getContext()));
34810e1bSTres Popp  }
7ceffae1SRiver Riddle  assert(isa<FunctionOpInterface>(SymbolTable::lookupSymbolIn(module, name)));
34810e1bSTres Popp
23aa5a74SRiver Riddle  rewriter.replaceOpWithNewOp<func::CallOp>(op, name, op.getType(),
1ebf7ce9STres Popp                                            op->getOperands());
34810e1bSTres Popp
34810e1bSTres Popp  return success();
34810e1bSTres Popp}
34810e1bSTres Popp
8a9d4895SAlexander Belyaevvoid mlir::populateMathToLibmConversionPatterns(RewritePatternSet &patterns) {
8a9d4895SAlexander Belyaev  MLIRContext *ctx = patterns.getContext();
3bf1f0e7SAlexander Belyaev
50b93733SCorentin Ferry  populatePatternsForOp<math::AbsFOp>(patterns, ctx, "fabsf", "fabs");
f7250179SFrederik Harwath  populatePatternsForOp<math::AcosOp>(patterns, ctx, "acosf", "acos");
b8dca4faSVivek Khandelwal  populatePatternsForOp<math::AcoshOp>(patterns, ctx, "acoshf", "acosh");
b8dca4faSVivek Khandelwal  populatePatternsForOp<math::AsinOp>(patterns, ctx, "asinf", "asin");
b8dca4faSVivek Khandelwal  populatePatternsForOp<math::AsinhOp>(patterns, ctx, "asinhf", "asinh");
3bf1f0e7SAlexander Belyaev  populatePatternsForOp<math::Atan2Op>(patterns, ctx, "atan2f", "atan2");
3bf1f0e7SAlexander Belyaev  populatePatternsForOp<math::AtanOp>(patterns, ctx, "atanf", "atan");
b8dca4faSVivek Khandelwal  populatePatternsForOp<math::AtanhOp>(patterns, ctx, "atanhf", "atanh");
3bf1f0e7SAlexander Belyaev  populatePatternsForOp<math::CbrtOp>(patterns, ctx, "cbrtf", "cbrt");
3bf1f0e7SAlexander Belyaev  populatePatternsForOp<math::CeilOp>(patterns, ctx, "ceilf", "ceil");
3bf1f0e7SAlexander Belyaev  populatePatternsForOp<math::CosOp>(patterns, ctx, "cosf", "cos");
762964e9SSungsoon Cho  populatePatternsForOp<math::CoshOp>(patterns, ctx, "coshf", "cosh");
3bf1f0e7SAlexander Belyaev  populatePatternsForOp<math::ErfOp>(patterns, ctx, "erff", "erf");
50b93733SCorentin Ferry  populatePatternsForOp<math::ExpOp>(patterns, ctx, "expf", "exp");
50b93733SCorentin Ferry  populatePatternsForOp<math::Exp2Op>(patterns, ctx, "exp2f", "exp2");
3bf1f0e7SAlexander Belyaev  populatePatternsForOp<math::ExpM1Op>(patterns, ctx, "expm1f", "expm1");
3bf1f0e7SAlexander Belyaev  populatePatternsForOp<math::FloorOp>(patterns, ctx, "floorf", "floor");
50b93733SCorentin Ferry  populatePatternsForOp<math::FmaOp>(patterns, ctx, "fmaf", "fma");
50b93733SCorentin Ferry  populatePatternsForOp<math::LogOp>(patterns, ctx, "logf", "log");
50b93733SCorentin Ferry  populatePatternsForOp<math::Log2Op>(patterns, ctx, "log2f", "log2");
50b93733SCorentin Ferry  populatePatternsForOp<math::Log10Op>(patterns, ctx, "log10f", "log10");
3bf1f0e7SAlexander Belyaev  populatePatternsForOp<math::Log1pOp>(patterns, ctx, "log1pf", "log1p");
50b93733SCorentin Ferry  populatePatternsForOp<math::PowFOp>(patterns, ctx, "powf", "pow");
3bf1f0e7SAlexander Belyaev  populatePatternsForOp<math::RoundEvenOp>(patterns, ctx, "roundevenf",
8a9d4895SAlexander Belyaev                                           "roundeven");
3bf1f0e7SAlexander Belyaev  populatePatternsForOp<math::RoundOp>(patterns, ctx, "roundf", "round");
3bf1f0e7SAlexander Belyaev  populatePatternsForOp<math::SinOp>(patterns, ctx, "sinf", "sin");
aa165edcSRob Suderman  populatePatternsForOp<math::SinhOp>(patterns, ctx, "sinhf", "sinh");
50b93733SCorentin Ferry  populatePatternsForOp<math::SqrtOp>(patterns, ctx, "sqrtf", "sqrt");
*b96f18b2SIvy Zhang  populatePatternsForOp<math::RsqrtOp>(patterns, ctx, "rsqrtf", "rsqrt");
3bf1f0e7SAlexander Belyaev  populatePatternsForOp<math::TanOp>(patterns, ctx, "tanf", "tan");
3bf1f0e7SAlexander Belyaev  populatePatternsForOp<math::TanhOp>(patterns, ctx, "tanhf", "tanh");
3bf1f0e7SAlexander Belyaev  populatePatternsForOp<math::TruncOp>(patterns, ctx, "truncf", "trunc");
34810e1bSTres Popp}
34810e1bSTres Popp
34810e1bSTres Poppnamespace {
34810e1bSTres Poppstruct ConvertMathToLibmPass
67d0d7acSMichele Scuttari    : public impl::ConvertMathToLibmBase<ConvertMathToLibmPass> {
34810e1bSTres Popp  void runOnOperation() override;
34810e1bSTres Popp};
34810e1bSTres Popp} // namespace
34810e1bSTres Popp
34810e1bSTres Poppvoid ConvertMathToLibmPass::runOnOperation() {
34810e1bSTres Popp  auto module = getOperation();
34810e1bSTres Popp
34810e1bSTres Popp  RewritePatternSet patterns(&getContext());
8a9d4895SAlexander Belyaev  populateMathToLibmConversionPatterns(patterns);
34810e1bSTres Popp
34810e1bSTres Popp  ConversionTarget target(getContext());
abc362a1SJakub Kuderski  target.addLegalDialect<arith::ArithDialect, BuiltinDialect, func::FuncDialect,
abc362a1SJakub Kuderski                         vector::VectorDialect>();
34810e1bSTres Popp  target.addIllegalDialect<math::MathDialect>();
34810e1bSTres Popp  if (failed(applyPartialConversion(module, target, std::move(patterns))))
34810e1bSTres Popp    signalPassFailure();
34810e1bSTres Popp}
34810e1bSTres Popp
34810e1bSTres Poppstd::unique_ptr<OperationPass<ModuleOp>> mlir::createConvertMathToLibmPass() {
34810e1bSTres Popp  return std::make_unique<ConvertMathToLibmPass>();
34810e1bSTres Popp}