Math/Transforms/ExpandPatterns.cpp

10a57f3aSPrashant Kumar//===- ExpandPatterns.cpp - Code to expand various math operations. -------===//
f3bdb56dSRob Suderman//
f3bdb56dSRob Suderman// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
f3bdb56dSRob Suderman// See https://llvm.org/LICENSE.txt for license information.
f3bdb56dSRob Suderman// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
f3bdb56dSRob Suderman//
f3bdb56dSRob Suderman//===----------------------------------------------------------------------===//
f3bdb56dSRob Suderman//
10a57f3aSPrashant Kumar// This file implements expansion of various math operations.
f3bdb56dSRob Suderman//
f3bdb56dSRob Suderman//===----------------------------------------------------------------------===//
f3bdb56dSRob Suderman
abc362a1SJakub Kuderski#include "mlir/Dialect/Arith/IR/Arith.h"
f3bdb56dSRob Suderman#include "mlir/Dialect/Math/IR/Math.h"
f3bdb56dSRob Suderman#include "mlir/Dialect/Math/Transforms/Passes.h"
8b68da2cSAlex Zinenko#include "mlir/Dialect/SCF/IR/SCF.h"
711c5893SRobert Suderman#include "mlir/Dialect/Vector/IR/VectorOps.h"
f3bdb56dSRob Suderman#include "mlir/IR/Builders.h"
740e2e90SRobert Suderman#include "mlir/IR/ImplicitLocOpBuilder.h"
711c5893SRobert Suderman#include "mlir/IR/TypeUtilities.h"
f3bdb56dSRob Suderman#include "mlir/Transforms/DialectConversion.h"
f3bdb56dSRob Suderman
f3bdb56dSRob Sudermanusing namespace mlir;
f3bdb56dSRob Suderman
711c5893SRobert Suderman/// Create a float constant.
10a57f3aSPrashant Kumarstatic Value createFloatConst(Location loc, Type type, APFloat value,
711c5893SRobert Suderman                              OpBuilder &b) {
10a57f3aSPrashant Kumar  bool losesInfo = false;
10a57f3aSPrashant Kumar  auto eltType = getElementTypeOrSelf(type);
10a57f3aSPrashant Kumar  // Convert double to the given `FloatType` with round-to-nearest-ties-to-even.
10a57f3aSPrashant Kumar  value.convert(cast<FloatType>(eltType).getFloatSemantics(),
10a57f3aSPrashant Kumar                APFloat::rmNearestTiesToEven, &losesInfo);
10a57f3aSPrashant Kumar  auto attr = b.getFloatAttr(eltType, value);
711c5893SRobert Suderman  if (auto shapedTy = dyn_cast<ShapedType>(type)) {
711c5893SRobert Suderman    return b.create<arith::ConstantOp>(loc,
711c5893SRobert Suderman                                       DenseElementsAttr::get(shapedTy, attr));
711c5893SRobert Suderman  }
711c5893SRobert Suderman
711c5893SRobert Suderman  return b.create<arith::ConstantOp>(loc, attr);
711c5893SRobert Suderman}
711c5893SRobert Suderman
10a57f3aSPrashant Kumarstatic Value createFloatConst(Location loc, Type type, double value,
10a57f3aSPrashant Kumar                              OpBuilder &b) {
10a57f3aSPrashant Kumar  return createFloatConst(loc, type, APFloat(value), b);
10a57f3aSPrashant Kumar}
10a57f3aSPrashant Kumar
10a57f3aSPrashant Kumar/// Create an integer constant.
711c5893SRobert Sudermanstatic Value createIntConst(Location loc, Type type, int64_t value,
711c5893SRobert Suderman                            OpBuilder &b) {
711c5893SRobert Suderman  auto attr = b.getIntegerAttr(getElementTypeOrSelf(type), value);
711c5893SRobert Suderman  if (auto shapedTy = dyn_cast<ShapedType>(type)) {
711c5893SRobert Suderman    return b.create<arith::ConstantOp>(loc,
711c5893SRobert Suderman                                       DenseElementsAttr::get(shapedTy, attr));
711c5893SRobert Suderman  }
711c5893SRobert Suderman
711c5893SRobert Suderman  return b.create<arith::ConstantOp>(loc, attr);
711c5893SRobert Suderman}
711c5893SRobert Suderman
2217888dSBalaji V. Iyerstatic Value createTruncatedFPValue(Value operand, ImplicitLocOpBuilder &b) {
2217888dSBalaji V. Iyer  Type opType = operand.getType();
44baa655SRamiro Leal-Cavazos  Type i64Ty = b.getI64Type();
44baa655SRamiro Leal-Cavazos  if (auto shapedTy = dyn_cast<ShapedType>(opType))
44baa655SRamiro Leal-Cavazos    i64Ty = shapedTy.clone(i64Ty);
44baa655SRamiro Leal-Cavazos  Value fixedConvert = b.create<arith::FPToSIOp>(i64Ty, operand);
2217888dSBalaji V. Iyer  Value fpFixedConvert = b.create<arith::SIToFPOp>(opType, fixedConvert);
44baa655SRamiro Leal-Cavazos  // The truncation does not preserve the sign when the truncated
44baa655SRamiro Leal-Cavazos  // value is -0. So here the sign is copied again.
44baa655SRamiro Leal-Cavazos  return b.create<math::CopySignOp>(fpFixedConvert, operand);
2217888dSBalaji V. Iyer}
2217888dSBalaji V. Iyer
aa165edcSRob Suderman// sinhf(float x) -> (exp(x) - exp(-x)) / 2
aa165edcSRob Sudermanstatic LogicalResult convertSinhOp(math::SinhOp op, PatternRewriter &rewriter) {
aa165edcSRob Suderman  ImplicitLocOpBuilder b(op->getLoc(), rewriter);
aa165edcSRob Suderman  Value operand = op.getOperand();
aa165edcSRob Suderman  Type opType = operand.getType();
aa165edcSRob Suderman
a62a7024Sjinchen  Value exp = b.create<math::ExpOp>(operand);
a62a7024Sjinchen  Value neg = b.create<arith::NegFOp>(operand);
a62a7024Sjinchen  Value nexp = b.create<math::ExpOp>(neg);
aa165edcSRob Suderman  Value sub = b.create<arith::SubFOp>(exp, nexp);
a62a7024Sjinchen  Value half = createFloatConst(op->getLoc(), opType, 0.5, rewriter);
a62a7024Sjinchen  Value res = b.create<arith::MulFOp>(sub, half);
a62a7024Sjinchen  rewriter.replaceOp(op, res);
aa165edcSRob Suderman  return success();
aa165edcSRob Suderman}
aa165edcSRob Suderman
aa165edcSRob Suderman// coshf(float x) -> (exp(x) + exp(-x)) / 2
aa165edcSRob Sudermanstatic LogicalResult convertCoshOp(math::CoshOp op, PatternRewriter &rewriter) {
aa165edcSRob Suderman  ImplicitLocOpBuilder b(op->getLoc(), rewriter);
aa165edcSRob Suderman  Value operand = op.getOperand();
aa165edcSRob Suderman  Type opType = operand.getType();
aa165edcSRob Suderman
a62a7024Sjinchen  Value exp = b.create<math::ExpOp>(operand);
a62a7024Sjinchen  Value neg = b.create<arith::NegFOp>(operand);
a62a7024Sjinchen  Value nexp = b.create<math::ExpOp>(neg);
aa165edcSRob Suderman  Value add = b.create<arith::AddFOp>(exp, nexp);
a62a7024Sjinchen  Value half = createFloatConst(op->getLoc(), opType, 0.5, rewriter);
a62a7024Sjinchen  Value res = b.create<arith::MulFOp>(add, half);
a62a7024Sjinchen  rewriter.replaceOp(op, res);
aa165edcSRob Suderman  return success();
aa165edcSRob Suderman}
aa165edcSRob Suderman
f3bdb56dSRob Suderman/// Expands tanh op into
d39ac3a8Ssrcarroll/// 1-exp^{-2x} / 1+exp^{-2x}
d39ac3a8Ssrcarroll/// To avoid overflow we exploit the reflection symmetry `tanh(-x) = -tanh(x)`.
d39ac3a8Ssrcarroll/// We compute a "signs" value which is -1 if input is negative and +1 if input
d39ac3a8Ssrcarroll/// is positive.  Then multiply the input by this value, guaranteeing that the
d39ac3a8Ssrcarroll/// result is positive, which also guarantees `exp^{-2x * sign(x)}` is in (0,
d39ac3a8Ssrcarroll/// 1]. Expand the computation on the input `x * sign(x)`, then multiply the
d39ac3a8Ssrcarroll/// result by `sign(x)` to retain sign of the real result.
f3bdb56dSRob Sudermanstatic LogicalResult convertTanhOp(math::TanhOp op, PatternRewriter &rewriter) {
f3bdb56dSRob Suderman  auto floatType = op.getOperand().getType();
f3bdb56dSRob Suderman  Location loc = op.getLoc();
d39ac3a8Ssrcarroll  Value zero = createFloatConst(loc, floatType, 0.0, rewriter);
711c5893SRobert Suderman  Value one = createFloatConst(loc, floatType, 1.0, rewriter);
d39ac3a8Ssrcarroll  Value negTwo = createFloatConst(loc, floatType, -2.0, rewriter);
f3bdb56dSRob Suderman
d39ac3a8Ssrcarroll  // Compute sign(x) = cast<float_type>(x < 0) * (-2) + 1
d39ac3a8Ssrcarroll  Value isNegative = rewriter.create<arith::CmpFOp>(
d39ac3a8Ssrcarroll      loc, arith::CmpFPredicate::OLT, op.getOperand(), zero);
d39ac3a8Ssrcarroll  Value isNegativeFloat =
d39ac3a8Ssrcarroll      rewriter.create<arith::UIToFPOp>(loc, floatType, isNegative);
d39ac3a8Ssrcarroll  Value isNegativeTimesNegTwo =
d39ac3a8Ssrcarroll      rewriter.create<arith::MulFOp>(loc, isNegativeFloat, negTwo);
d39ac3a8Ssrcarroll  Value sign = rewriter.create<arith::AddFOp>(loc, isNegativeTimesNegTwo, one);
d39ac3a8Ssrcarroll
d39ac3a8Ssrcarroll  // Normalize input to positive value: y = sign(x) * x
d39ac3a8Ssrcarroll  Value positiveX = rewriter.create<arith::MulFOp>(loc, sign, op.getOperand());
d39ac3a8Ssrcarroll
d39ac3a8Ssrcarroll  // Decompose on normalized input
d39ac3a8Ssrcarroll  Value negDoubledX = rewriter.create<arith::MulFOp>(loc, negTwo, positiveX);
f3bdb56dSRob Suderman  Value exp2x = rewriter.create<math::ExpOp>(loc, negDoubledX);
f3bdb56dSRob Suderman  Value dividend = rewriter.create<arith::SubFOp>(loc, one, exp2x);
f3bdb56dSRob Suderman  Value divisor = rewriter.create<arith::AddFOp>(loc, one, exp2x);
f3bdb56dSRob Suderman  Value positiveRes = rewriter.create<arith::DivFOp>(loc, dividend, divisor);
f3bdb56dSRob Suderman
d39ac3a8Ssrcarroll  // Multiply result by sign(x) to retain signs from negative inputs
d39ac3a8Ssrcarroll  rewriter.replaceOpWithNewOp<arith::MulFOp>(op, sign, positiveRes);
f3bdb56dSRob Suderman
f3bdb56dSRob Suderman  return success();
f3bdb56dSRob Suderman}
f3bdb56dSRob Suderman
711c5893SRobert Suderman// Converts math.tan to math.sin, math.cos, and arith.divf.
740e2e90SRobert Sudermanstatic LogicalResult convertTanOp(math::TanOp op, PatternRewriter &rewriter) {
740e2e90SRobert Suderman  ImplicitLocOpBuilder b(op->getLoc(), rewriter);
740e2e90SRobert Suderman  Value operand = op.getOperand();
740e2e90SRobert Suderman  Type type = operand.getType();
740e2e90SRobert Suderman  Value sin = b.create<math::SinOp>(type, operand);
740e2e90SRobert Suderman  Value cos = b.create<math::CosOp>(type, operand);
740e2e90SRobert Suderman  Value div = b.create<arith::DivFOp>(type, sin, cos);
740e2e90SRobert Suderman  rewriter.replaceOp(op, div);
740e2e90SRobert Suderman  return success();
740e2e90SRobert Suderman}
740e2e90SRobert Suderman
a62a7024Sjinchen// asinh(float x) -> log(x + sqrt(x**2 + 1))
a62a7024Sjinchenstatic LogicalResult convertAsinhOp(math::AsinhOp op,
a62a7024Sjinchen                                    PatternRewriter &rewriter) {
a62a7024Sjinchen  ImplicitLocOpBuilder b(op->getLoc(), rewriter);
a62a7024Sjinchen  Value operand = op.getOperand();
a62a7024Sjinchen  Type opType = operand.getType();
a62a7024Sjinchen
a62a7024Sjinchen  Value one = createFloatConst(op->getLoc(), opType, 1.0, rewriter);
a62a7024Sjinchen  Value fma = b.create<math::FmaOp>(operand, operand, one);
a62a7024Sjinchen  Value sqrt = b.create<math::SqrtOp>(fma);
a62a7024Sjinchen  Value add = b.create<arith::AddFOp>(operand, sqrt);
a62a7024Sjinchen  Value res = b.create<math::LogOp>(add);
a62a7024Sjinchen  rewriter.replaceOp(op, res);
a62a7024Sjinchen  return success();
a62a7024Sjinchen}
a62a7024Sjinchen
a62a7024Sjinchen// acosh(float x) -> log(x + sqrt(x**2 - 1))
a62a7024Sjinchenstatic LogicalResult convertAcoshOp(math::AcoshOp op,
a62a7024Sjinchen                                    PatternRewriter &rewriter) {
a62a7024Sjinchen  ImplicitLocOpBuilder b(op->getLoc(), rewriter);
a62a7024Sjinchen  Value operand = op.getOperand();
a62a7024Sjinchen  Type opType = operand.getType();
a62a7024Sjinchen
a62a7024Sjinchen  Value negOne = createFloatConst(op->getLoc(), opType, -1.0, rewriter);
a62a7024Sjinchen  Value fma = b.create<math::FmaOp>(operand, operand, negOne);
a62a7024Sjinchen  Value sqrt = b.create<math::SqrtOp>(fma);
a62a7024Sjinchen  Value add = b.create<arith::AddFOp>(operand, sqrt);
a62a7024Sjinchen  Value res = b.create<math::LogOp>(add);
a62a7024Sjinchen  rewriter.replaceOp(op, res);
a62a7024Sjinchen  return success();
a62a7024Sjinchen}
a62a7024Sjinchen
a62a7024Sjinchen// atanh(float x) -> log((1 + x) / (1 - x)) / 2
a62a7024Sjinchenstatic LogicalResult convertAtanhOp(math::AtanhOp op,
a62a7024Sjinchen                                    PatternRewriter &rewriter) {
a62a7024Sjinchen  ImplicitLocOpBuilder b(op->getLoc(), rewriter);
a62a7024Sjinchen  Value operand = op.getOperand();
a62a7024Sjinchen  Type opType = operand.getType();
a62a7024Sjinchen
a62a7024Sjinchen  Value one = createFloatConst(op->getLoc(), opType, 1.0, rewriter);
a62a7024Sjinchen  Value add = b.create<arith::AddFOp>(operand, one);
a62a7024Sjinchen  Value neg = b.create<arith::NegFOp>(operand);
a62a7024Sjinchen  Value sub = b.create<arith::AddFOp>(neg, one);
a62a7024Sjinchen  Value div = b.create<arith::DivFOp>(add, sub);
a62a7024Sjinchen  Value log = b.create<math::LogOp>(div);
a62a7024Sjinchen  Value half = createFloatConst(op->getLoc(), opType, 0.5, rewriter);
a62a7024Sjinchen  Value res = b.create<arith::MulFOp>(log, half);
a62a7024Sjinchen  rewriter.replaceOp(op, res);
a62a7024Sjinchen  return success();
a62a7024Sjinchen}
a62a7024Sjinchen
a7c2102dSBalaji V. Iyerstatic LogicalResult convertFmaFOp(math::FmaOp op, PatternRewriter &rewriter) {
a7c2102dSBalaji V. Iyer  ImplicitLocOpBuilder b(op->getLoc(), rewriter);
a7c2102dSBalaji V. Iyer  Value operandA = op.getOperand(0);
a7c2102dSBalaji V. Iyer  Value operandB = op.getOperand(1);
a7c2102dSBalaji V. Iyer  Value operandC = op.getOperand(2);
a7c2102dSBalaji V. Iyer  Type type = op.getType();
a7c2102dSBalaji V. Iyer  Value mult = b.create<arith::MulFOp>(type, operandA, operandB);
a7c2102dSBalaji V. Iyer  Value add = b.create<arith::AddFOp>(type, mult, operandC);
a7c2102dSBalaji V. Iyer  rewriter.replaceOp(op, add);
a7c2102dSBalaji V. Iyer  return success();
a7c2102dSBalaji V. Iyer}
a7c2102dSBalaji V. Iyer
2217888dSBalaji V. Iyer// Converts a ceilf() function to the following:
2217888dSBalaji V. Iyer// ceilf(float x) ->
2217888dSBalaji V. Iyer//      y = (float)(int) x
2217888dSBalaji V. Iyer//      if (x > y) then incr = 1 else incr = 0
2217888dSBalaji V. Iyer//      y = y + incr   <= replace this op with the ceilf op.
2217888dSBalaji V. Iyerstatic LogicalResult convertCeilOp(math::CeilOp op, PatternRewriter &rewriter) {
2217888dSBalaji V. Iyer  ImplicitLocOpBuilder b(op->getLoc(), rewriter);
2217888dSBalaji V. Iyer  Value operand = op.getOperand();
2217888dSBalaji V. Iyer  Type opType = operand.getType();
2217888dSBalaji V. Iyer  Value fpFixedConvert = createTruncatedFPValue(operand, b);
2217888dSBalaji V. Iyer
2217888dSBalaji V. Iyer  // Creating constants for later use.
2217888dSBalaji V. Iyer  Value zero = createFloatConst(op->getLoc(), opType, 0.00, rewriter);
2217888dSBalaji V. Iyer  Value one = createFloatConst(op->getLoc(), opType, 1.00, rewriter);
2217888dSBalaji V. Iyer
2217888dSBalaji V. Iyer  Value gtCheck = b.create<arith::CmpFOp>(arith::CmpFPredicate::OGT, operand,
2217888dSBalaji V. Iyer                                          fpFixedConvert);
2217888dSBalaji V. Iyer  Value incrValue = b.create<arith::SelectOp>(op->getLoc(), gtCheck, one, zero);
2217888dSBalaji V. Iyer
2217888dSBalaji V. Iyer  Value ret = b.create<arith::AddFOp>(opType, fpFixedConvert, incrValue);
2217888dSBalaji V. Iyer  rewriter.replaceOp(op, ret);
2217888dSBalaji V. Iyer  return success();
2217888dSBalaji V. Iyer}
10a57f3aSPrashant Kumar
10a57f3aSPrashant Kumar// Convert `math.fpowi` to a series of `arith.mulf` operations.
10a57f3aSPrashant Kumar// If the power is negative, we divide one by the result.
10a57f3aSPrashant Kumar// If both the base and power are zero, the result is 1.
5b702be1SPrashant Kumar// In the case of non constant power, we convert the operation to `math.powf`.
5b702be1SPrashant Kumarstatic LogicalResult convertFPowIOp(math::FPowIOp op,
10a57f3aSPrashant Kumar                                    PatternRewriter &rewriter) {
10a57f3aSPrashant Kumar  ImplicitLocOpBuilder b(op->getLoc(), rewriter);
10a57f3aSPrashant Kumar  Value base = op.getOperand(0);
10a57f3aSPrashant Kumar  Value power = op.getOperand(1);
10a57f3aSPrashant Kumar  Type baseType = base.getType();
10a57f3aSPrashant Kumar
5b702be1SPrashant Kumar  auto convertFPowItoPowf = [&]() -> LogicalResult {
5b702be1SPrashant Kumar    Value castPowerToFp =
5b702be1SPrashant Kumar        rewriter.create<arith::SIToFPOp>(op.getLoc(), baseType, power);
5b702be1SPrashant Kumar    Value res = rewriter.create<math::PowFOp>(op.getLoc(), baseType, base,
5b702be1SPrashant Kumar                                              castPowerToFp);
5b702be1SPrashant Kumar    rewriter.replaceOp(op, res);
5b702be1SPrashant Kumar    return success();
5b702be1SPrashant Kumar  };
5b702be1SPrashant Kumar
10a57f3aSPrashant Kumar  Attribute cstAttr;
10a57f3aSPrashant Kumar  if (!matchPattern(power, m_Constant(&cstAttr)))
5b702be1SPrashant Kumar    return convertFPowItoPowf();
10a57f3aSPrashant Kumar
10a57f3aSPrashant Kumar  APInt value;
10a57f3aSPrashant Kumar  if (!matchPattern(cstAttr, m_ConstantInt(&value)))
5b702be1SPrashant Kumar    return convertFPowItoPowf();
10a57f3aSPrashant Kumar
10a57f3aSPrashant Kumar  int64_t powerInt = value.getSExtValue();
10a57f3aSPrashant Kumar  bool isNegative = powerInt < 0;
10a57f3aSPrashant Kumar  int64_t absPower = std::abs(powerInt);
10a57f3aSPrashant Kumar  Value one = createFloatConst(op->getLoc(), baseType, 1.00, rewriter);
10a57f3aSPrashant Kumar  Value res = createFloatConst(op->getLoc(), baseType, 1.00, rewriter);
10a57f3aSPrashant Kumar
10a57f3aSPrashant Kumar  while (absPower > 0) {
10a57f3aSPrashant Kumar    if (absPower & 1)
10a57f3aSPrashant Kumar      res = b.create<arith::MulFOp>(baseType, base, res);
10a57f3aSPrashant Kumar    absPower >>= 1;
10a57f3aSPrashant Kumar    base = b.create<arith::MulFOp>(baseType, base, base);
10a57f3aSPrashant Kumar  }
10a57f3aSPrashant Kumar
10a57f3aSPrashant Kumar  // Make sure not to introduce UB in case of negative power.
10a57f3aSPrashant Kumar  if (isNegative) {
10a57f3aSPrashant Kumar    auto &sem = dyn_cast<mlir::FloatType>(getElementTypeOrSelf(baseType))
10a57f3aSPrashant Kumar                    .getFloatSemantics();
10a57f3aSPrashant Kumar    Value zero =
10a57f3aSPrashant Kumar        createFloatConst(op->getLoc(), baseType,
10a57f3aSPrashant Kumar                         APFloat::getZero(sem, /*Negative=*/false), rewriter);
10a57f3aSPrashant Kumar    Value negZero =
10a57f3aSPrashant Kumar        createFloatConst(op->getLoc(), baseType,
10a57f3aSPrashant Kumar                         APFloat::getZero(sem, /*Negative=*/true), rewriter);
10a57f3aSPrashant Kumar    Value posInfinity =
10a57f3aSPrashant Kumar        createFloatConst(op->getLoc(), baseType,
10a57f3aSPrashant Kumar                         APFloat::getInf(sem, /*Negative=*/false), rewriter);
10a57f3aSPrashant Kumar    Value negInfinity =
10a57f3aSPrashant Kumar        createFloatConst(op->getLoc(), baseType,
10a57f3aSPrashant Kumar                         APFloat::getInf(sem, /*Negative=*/true), rewriter);
10a57f3aSPrashant Kumar    Value zeroEqCheck =
10a57f3aSPrashant Kumar        b.create<arith::CmpFOp>(arith::CmpFPredicate::OEQ, res, zero);
10a57f3aSPrashant Kumar    Value negZeroEqCheck =
10a57f3aSPrashant Kumar        b.create<arith::CmpFOp>(arith::CmpFPredicate::OEQ, res, negZero);
10a57f3aSPrashant Kumar    res = b.create<arith::DivFOp>(baseType, one, res);
10a57f3aSPrashant Kumar    res =
10a57f3aSPrashant Kumar        b.create<arith::SelectOp>(op->getLoc(), zeroEqCheck, posInfinity, res);
10a57f3aSPrashant Kumar    res = b.create<arith::SelectOp>(op->getLoc(), negZeroEqCheck, negInfinity,
10a57f3aSPrashant Kumar                                    res);
10a57f3aSPrashant Kumar  }
10a57f3aSPrashant Kumar
10a57f3aSPrashant Kumar  rewriter.replaceOp(op, res);
10a57f3aSPrashant Kumar  return success();
10a57f3aSPrashant Kumar}
10a57f3aSPrashant Kumar
2d4e8567SBalaji V. Iyer// Converts Powf(float a, float b) (meaning a^b) to exp^(b * ln(a))
*3a337757SHyunsung Lee// Restricting a >= 0
2d4e8567SBalaji V. Iyerstatic LogicalResult convertPowfOp(math::PowFOp op, PatternRewriter &rewriter) {
2d4e8567SBalaji V. Iyer  ImplicitLocOpBuilder b(op->getLoc(), rewriter);
2d4e8567SBalaji V. Iyer  Value operandA = op.getOperand(0);
2d4e8567SBalaji V. Iyer  Value operandB = op.getOperand(1);
2d4e8567SBalaji V. Iyer  Type opType = operandA.getType();
f66e4bd6SBalaji V. Iyer  Value zero = createFloatConst(op->getLoc(), opType, 0.00, rewriter);
a92e3df3SChristopher Bate  Value one = createFloatConst(op->getLoc(), opType, 1.00, rewriter);
2d4e8567SBalaji V. Iyer
*3a337757SHyunsung Lee  Value logA = b.create<math::LogOp>(opType, operandA);
*3a337757SHyunsung Lee  Value mult = b.create<arith::MulFOp>(opType, operandB, logA);
2d4e8567SBalaji V. Iyer  Value expResult = b.create<math::ExpOp>(opType, mult);
f66e4bd6SBalaji V. Iyer
a92e3df3SChristopher Bate  // First, we select between the exp value and the adjusted value for odd
a92e3df3SChristopher Bate  // powers of negatives. Then, we ensure that one is produced if `b` is zero.
a92e3df3SChristopher Bate  // This corresponds to `libm` behavior, even for `0^0`. Without this check,
a92e3df3SChristopher Bate  // `exp(0 * ln(0)) = exp(0 *-inf) = exp(-nan) = -nan`.
a92e3df3SChristopher Bate  Value zeroCheck =
a92e3df3SChristopher Bate      b.create<arith::CmpFOp>(arith::CmpFPredicate::OEQ, operandB, zero);
*3a337757SHyunsung Lee  Value finalResult =
*3a337757SHyunsung Lee      b.create<arith::SelectOp>(op->getLoc(), zeroCheck, one, expResult);
*3a337757SHyunsung Lee  rewriter.replaceOp(op, finalResult);
2d4e8567SBalaji V. Iyer  return success();
2d4e8567SBalaji V. Iyer}
2217888dSBalaji V. Iyer
4da96515SBalaji V. Iyer// exp2f(float x) -> exp(x * ln(2))
4da96515SBalaji V. Iyer//   Proof: Let's say 2^x = y
4da96515SBalaji V. Iyer//   ln(2^x) = ln(y)
4da96515SBalaji V. Iyer//   x * ln(2) = ln(y) => e ^(x*ln(2)) = y
4da96515SBalaji V. Iyerstatic LogicalResult convertExp2fOp(math::Exp2Op op,
4da96515SBalaji V. Iyer                                    PatternRewriter &rewriter) {
4da96515SBalaji V. Iyer  ImplicitLocOpBuilder b(op->getLoc(), rewriter);
4da96515SBalaji V. Iyer  Value operand = op.getOperand();
4da96515SBalaji V. Iyer  Type opType = operand.getType();
4da96515SBalaji V. Iyer  Value ln2 = createFloatConst(op->getLoc(), opType, llvm::numbers::ln2, b);
4da96515SBalaji V. Iyer  Value mult = b.create<arith::MulFOp>(opType, operand, ln2);
4da96515SBalaji V. Iyer  Value exp = b.create<math::ExpOp>(op->getLoc(), mult);
4da96515SBalaji V. Iyer  rewriter.replaceOp(op, exp);
4da96515SBalaji V. Iyer  return success();
4da96515SBalaji V. Iyer}
4da96515SBalaji V. Iyer
be911578SBalaji V. Iyerstatic LogicalResult convertRoundOp(math::RoundOp op,
be911578SBalaji V. Iyer                                    PatternRewriter &rewriter) {
44baa655SRamiro Leal-Cavazos  Location loc = op.getLoc();
44baa655SRamiro Leal-Cavazos  ImplicitLocOpBuilder b(loc, rewriter);
be911578SBalaji V. Iyer  Value operand = op.getOperand();
be911578SBalaji V. Iyer  Type opType = operand.getType();
44baa655SRamiro Leal-Cavazos  Type opEType = getElementTypeOrSelf(opType);
be911578SBalaji V. Iyer
44baa655SRamiro Leal-Cavazos  if (!opEType.isF32()) {
44baa655SRamiro Leal-Cavazos    return rewriter.notifyMatchFailure(op, "not a round of f32.");
44baa655SRamiro Leal-Cavazos  }
be911578SBalaji V. Iyer
44baa655SRamiro Leal-Cavazos  Type i32Ty = b.getI32Type();
44baa655SRamiro Leal-Cavazos  if (auto shapedTy = dyn_cast<ShapedType>(opType))
44baa655SRamiro Leal-Cavazos    i32Ty = shapedTy.clone(i32Ty);
44baa655SRamiro Leal-Cavazos
44baa655SRamiro Leal-Cavazos  Value half = createFloatConst(loc, opType, 0.5, b);
44baa655SRamiro Leal-Cavazos  Value c23 = createIntConst(loc, i32Ty, 23, b);
44baa655SRamiro Leal-Cavazos  Value c127 = createIntConst(loc, i32Ty, 127, b);
44baa655SRamiro Leal-Cavazos  Value expMask = createIntConst(loc, i32Ty, (1 << 8) - 1, b);
44baa655SRamiro Leal-Cavazos
44baa655SRamiro Leal-Cavazos  Value incrValue = b.create<math::CopySignOp>(half, operand);
be911578SBalaji V. Iyer  Value add = b.create<arith::AddFOp>(opType, operand, incrValue);
be911578SBalaji V. Iyer  Value fpFixedConvert = createTruncatedFPValue(add, b);
44baa655SRamiro Leal-Cavazos
44baa655SRamiro Leal-Cavazos  // There are three cases where adding 0.5 to the value and truncating by
44baa655SRamiro Leal-Cavazos  // converting to an i64 does not result in the correct behavior:
44baa655SRamiro Leal-Cavazos  //
44baa655SRamiro Leal-Cavazos  // 1. Special values: +-inf and +-nan
44baa655SRamiro Leal-Cavazos  //     Casting these special values to i64 has undefined behavior. To identify
44baa655SRamiro Leal-Cavazos  //     these values, we use the fact that these values are the only float
44baa655SRamiro Leal-Cavazos  //     values with the maximum possible biased exponent.
44baa655SRamiro Leal-Cavazos  //
44baa655SRamiro Leal-Cavazos  // 2. Large values: 2^23 <= |x| <= INT_64_MAX
44baa655SRamiro Leal-Cavazos  //     Adding 0.5 to a float larger than or equal to 2^23 results in precision
44baa655SRamiro Leal-Cavazos  //     errors that sometimes round the value up and sometimes round the value
44baa655SRamiro Leal-Cavazos  //     down. For example:
44baa655SRamiro Leal-Cavazos  //         8388608.0 + 0.5 = 8388608.0
44baa655SRamiro Leal-Cavazos  //         8388609.0 + 0.5 = 8388610.0
44baa655SRamiro Leal-Cavazos  //
44baa655SRamiro Leal-Cavazos  // 3. Very large values: |x| > INT_64_MAX
44baa655SRamiro Leal-Cavazos  //     Casting to i64 a value greater than the max i64 value will overflow the
44baa655SRamiro Leal-Cavazos  //     i64 leading to wrong outputs.
44baa655SRamiro Leal-Cavazos  //
44baa655SRamiro Leal-Cavazos  // All three cases satisfy the property `biasedExp >= 23`.
44baa655SRamiro Leal-Cavazos  Value operandBitcast = b.create<arith::BitcastOp>(i32Ty, operand);
44baa655SRamiro Leal-Cavazos  Value operandExp = b.create<arith::AndIOp>(
44baa655SRamiro Leal-Cavazos      b.create<arith::ShRUIOp>(operandBitcast, c23), expMask);
44baa655SRamiro Leal-Cavazos  Value operandBiasedExp = b.create<arith::SubIOp>(operandExp, c127);
44baa655SRamiro Leal-Cavazos  Value isSpecialValOrLargeVal =
44baa655SRamiro Leal-Cavazos      b.create<arith::CmpIOp>(arith::CmpIPredicate::sge, operandBiasedExp, c23);
44baa655SRamiro Leal-Cavazos
44baa655SRamiro Leal-Cavazos  Value result = b.create<arith::SelectOp>(isSpecialValOrLargeVal, operand,
44baa655SRamiro Leal-Cavazos                                           fpFixedConvert);
44baa655SRamiro Leal-Cavazos  rewriter.replaceOp(op, result);
be911578SBalaji V. Iyer  return success();
be911578SBalaji V. Iyer}
be911578SBalaji V. Iyer
711c5893SRobert Suderman// Converts math.ctlz to scf and arith operations. This is done
711c5893SRobert Suderman// by performing a binary search on the bits.
f3bdb56dSRob Sudermanstatic LogicalResult convertCtlzOp(math::CountLeadingZerosOp op,
f3bdb56dSRob Suderman                                   PatternRewriter &rewriter) {
f3bdb56dSRob Suderman  auto operand = op.getOperand();
711c5893SRobert Suderman  auto operandTy = operand.getType();
711c5893SRobert Suderman  auto eTy = getElementTypeOrSelf(operandTy);
f3bdb56dSRob Suderman  Location loc = op.getLoc();
f3bdb56dSRob Suderman
711c5893SRobert Suderman  int32_t bitwidth = eTy.getIntOrFloatBitWidth();
711c5893SRobert Suderman  if (bitwidth > 64)
711c5893SRobert Suderman    return failure();
f3bdb56dSRob Suderman
711c5893SRobert Suderman  uint64_t allbits = -1;
711c5893SRobert Suderman  if (bitwidth < 64) {
711c5893SRobert Suderman    allbits = allbits >> (64 - bitwidth);
711c5893SRobert Suderman  }
f3bdb56dSRob Suderman
711c5893SRobert Suderman  Value x = operand;
711c5893SRobert Suderman  Value count = createIntConst(loc, operandTy, 0, rewriter);
711c5893SRobert Suderman  for (int32_t bw = bitwidth; bw > 1; bw = bw / 2) {
711c5893SRobert Suderman    auto half = bw / 2;
711c5893SRobert Suderman    auto bits = createIntConst(loc, operandTy, half, rewriter);
711c5893SRobert Suderman    auto mask = createIntConst(loc, operandTy, allbits >> half, rewriter);
f3bdb56dSRob Suderman
711c5893SRobert Suderman    Value pred =
711c5893SRobert Suderman        rewriter.create<arith::CmpIOp>(loc, arith::CmpIPredicate::ule, x, mask);
711c5893SRobert Suderman    Value add = rewriter.create<arith::AddIOp>(loc, count, bits);
711c5893SRobert Suderman    Value shift = rewriter.create<arith::ShLIOp>(loc, x, bits);
f3bdb56dSRob Suderman
711c5893SRobert Suderman    x = rewriter.create<arith::SelectOp>(loc, pred, shift, x);
711c5893SRobert Suderman    count = rewriter.create<arith::SelectOp>(loc, pred, add, count);
711c5893SRobert Suderman  }
f3bdb56dSRob Suderman
711c5893SRobert Suderman  Value zero = createIntConst(loc, operandTy, 0, rewriter);
711c5893SRobert Suderman  Value pred = rewriter.create<arith::CmpIOp>(loc, arith::CmpIPredicate::eq,
711c5893SRobert Suderman                                              operand, zero);
f3bdb56dSRob Suderman
711c5893SRobert Suderman  Value bwval = createIntConst(loc, operandTy, bitwidth, rewriter);
711c5893SRobert Suderman  Value sel = rewriter.create<arith::SelectOp>(loc, pred, bwval, count);
711c5893SRobert Suderman  rewriter.replaceOp(op, sel);
f3bdb56dSRob Suderman  return success();
f3bdb56dSRob Suderman}
f3bdb56dSRob Suderman
44baa655SRamiro Leal-Cavazos// Convert `math.roundeven` into `math.round` + arith ops
44baa655SRamiro Leal-Cavazosstatic LogicalResult convertRoundEvenOp(math::RoundEvenOp op,
44baa655SRamiro Leal-Cavazos                                        PatternRewriter &rewriter) {
44baa655SRamiro Leal-Cavazos  Location loc = op.getLoc();
44baa655SRamiro Leal-Cavazos  ImplicitLocOpBuilder b(loc, rewriter);
44baa655SRamiro Leal-Cavazos  auto operand = op.getOperand();
44baa655SRamiro Leal-Cavazos  Type operandTy = operand.getType();
44baa655SRamiro Leal-Cavazos  Type resultTy = op.getType();
44baa655SRamiro Leal-Cavazos  Type operandETy = getElementTypeOrSelf(operandTy);
44baa655SRamiro Leal-Cavazos  Type resultETy = getElementTypeOrSelf(resultTy);
44baa655SRamiro Leal-Cavazos
fe355a44SAlexander Shaposhnikov  if (!isa<FloatType>(operandETy) || !isa<FloatType>(resultETy)) {
fe355a44SAlexander Shaposhnikov    return rewriter.notifyMatchFailure(op, "not a roundeven of f16 or f32.");
44baa655SRamiro Leal-Cavazos  }
44baa655SRamiro Leal-Cavazos
fe355a44SAlexander Shaposhnikov  Type fTy = operandTy;
fe355a44SAlexander Shaposhnikov  Type iTy = rewriter.getIntegerType(operandETy.getIntOrFloatBitWidth());
fe355a44SAlexander Shaposhnikov  if (auto shapedTy = dyn_cast<ShapedType>(fTy)) {
fe355a44SAlexander Shaposhnikov    iTy = shapedTy.clone(iTy);
44baa655SRamiro Leal-Cavazos  }
44baa655SRamiro Leal-Cavazos
fe355a44SAlexander Shaposhnikov  unsigned bitWidth = operandETy.getIntOrFloatBitWidth();
fe355a44SAlexander Shaposhnikov  // The width returned by getFPMantissaWidth includes the integer bit.
fe355a44SAlexander Shaposhnikov  unsigned mantissaWidth =
fe355a44SAlexander Shaposhnikov      llvm::cast<FloatType>(operandETy).getFPMantissaWidth() - 1;
fe355a44SAlexander Shaposhnikov  unsigned exponentWidth = bitWidth - mantissaWidth - 1;
44baa655SRamiro Leal-Cavazos
fe355a44SAlexander Shaposhnikov  // The names of the variables correspond to f32.
fe355a44SAlexander Shaposhnikov  // f64: 1 bit sign | 11 bits exponent | 52 bits mantissa.
fe355a44SAlexander Shaposhnikov  // f32: 1 bit sign | 8 bits exponent  | 23 bits mantissa.
fe355a44SAlexander Shaposhnikov  // f16: 1 bit sign | 5 bits exponent  | 10 bits mantissa.
fe355a44SAlexander Shaposhnikov  Value c1Float = createFloatConst(loc, fTy, 1.0, b);
fe355a44SAlexander Shaposhnikov  Value c0 = createIntConst(loc, iTy, 0, b);
fe355a44SAlexander Shaposhnikov  Value c1 = createIntConst(loc, iTy, 1, b);
fe355a44SAlexander Shaposhnikov  Value cNeg1 = createIntConst(loc, iTy, -1, b);
fe355a44SAlexander Shaposhnikov  Value c23 = createIntConst(loc, iTy, mantissaWidth, b);
fe355a44SAlexander Shaposhnikov  Value c31 = createIntConst(loc, iTy, bitWidth - 1, b);
fe355a44SAlexander Shaposhnikov  Value c127 = createIntConst(loc, iTy, (1ull << (exponentWidth - 1)) - 1, b);
fe355a44SAlexander Shaposhnikov  Value c2To22 = createIntConst(loc, iTy, 1ull << (mantissaWidth - 1), b);
fe355a44SAlexander Shaposhnikov  Value c23Mask = createIntConst(loc, iTy, (1ull << mantissaWidth) - 1, b);
fe355a44SAlexander Shaposhnikov  Value expMask = createIntConst(loc, iTy, (1ull << exponentWidth) - 1, b);
fe355a44SAlexander Shaposhnikov
fe355a44SAlexander Shaposhnikov  Value operandBitcast = b.create<arith::BitcastOp>(iTy, operand);
44baa655SRamiro Leal-Cavazos  Value round = b.create<math::RoundOp>(operand);
fe355a44SAlexander Shaposhnikov  Value roundBitcast = b.create<arith::BitcastOp>(iTy, round);
44baa655SRamiro Leal-Cavazos
44baa655SRamiro Leal-Cavazos  // Get biased exponents for operand and round(operand)
44baa655SRamiro Leal-Cavazos  Value operandExp = b.create<arith::AndIOp>(
44baa655SRamiro Leal-Cavazos      b.create<arith::ShRUIOp>(operandBitcast, c23), expMask);
44baa655SRamiro Leal-Cavazos  Value operandBiasedExp = b.create<arith::SubIOp>(operandExp, c127);
44baa655SRamiro Leal-Cavazos  Value roundExp = b.create<arith::AndIOp>(
44baa655SRamiro Leal-Cavazos      b.create<arith::ShRUIOp>(roundBitcast, c23), expMask);
44baa655SRamiro Leal-Cavazos  Value roundBiasedExp = b.create<arith::SubIOp>(roundExp, c127);
44baa655SRamiro Leal-Cavazos
44baa655SRamiro Leal-Cavazos  auto safeShiftRight = [&](Value x, Value shift) -> Value {
fe355a44SAlexander Shaposhnikov    // Clamp shift to valid range [0, bitwidth - 1] to avoid undefined behavior
44baa655SRamiro Leal-Cavazos    Value clampedShift = b.create<arith::MaxSIOp>(shift, c0);
44baa655SRamiro Leal-Cavazos    clampedShift = b.create<arith::MinSIOp>(clampedShift, c31);
44baa655SRamiro Leal-Cavazos    return b.create<arith::ShRUIOp>(x, clampedShift);
44baa655SRamiro Leal-Cavazos  };
44baa655SRamiro Leal-Cavazos
44baa655SRamiro Leal-Cavazos  auto maskMantissa = [&](Value mantissa,
44baa655SRamiro Leal-Cavazos                          Value mantissaMaskRightShift) -> Value {
44baa655SRamiro Leal-Cavazos    Value shiftedMantissaMask = safeShiftRight(c23Mask, mantissaMaskRightShift);
44baa655SRamiro Leal-Cavazos    return b.create<arith::AndIOp>(mantissa, shiftedMantissaMask);
44baa655SRamiro Leal-Cavazos  };
44baa655SRamiro Leal-Cavazos
44baa655SRamiro Leal-Cavazos  // A whole number `x`, such that `|x| != 1`, is even if the mantissa, ignoring
44baa655SRamiro Leal-Cavazos  // the leftmost `clamp(biasedExp - 1, 0, 23)` bits, is zero. Large numbers
44baa655SRamiro Leal-Cavazos  // with `biasedExp > 23` (numbers where there is not enough precision to store
44baa655SRamiro Leal-Cavazos  // decimals) are always even, and they satisfy the even condition trivially
44baa655SRamiro Leal-Cavazos  // since the mantissa without all its bits is zero. The even condition
44baa655SRamiro Leal-Cavazos  // is also true for +-0, since they have `biasedExp = -127` and the entire
44baa655SRamiro Leal-Cavazos  // mantissa is zero. The case of +-1 has to be handled separately. Here
44baa655SRamiro Leal-Cavazos  // we identify these values by noting that +-1 are the only whole numbers with
44baa655SRamiro Leal-Cavazos  // `biasedExp == 0`.
44baa655SRamiro Leal-Cavazos  //
44baa655SRamiro Leal-Cavazos  // The special values +-inf and +-nan also satisfy the same property that
44baa655SRamiro Leal-Cavazos  // whole non-unit even numbers satisfy. In particular, the special values have
44baa655SRamiro Leal-Cavazos  // `biasedExp > 23`, so they get treated as large numbers with no room for
44baa655SRamiro Leal-Cavazos  // decimals, which are always even.
44baa655SRamiro Leal-Cavazos  Value roundBiasedExpEq0 =
44baa655SRamiro Leal-Cavazos      b.create<arith::CmpIOp>(arith::CmpIPredicate::eq, roundBiasedExp, c0);
44baa655SRamiro Leal-Cavazos  Value roundBiasedExpMinus1 = b.create<arith::SubIOp>(roundBiasedExp, c1);
44baa655SRamiro Leal-Cavazos  Value roundMaskedMantissa = maskMantissa(roundBitcast, roundBiasedExpMinus1);
44baa655SRamiro Leal-Cavazos  Value roundIsNotEvenOrSpecialVal = b.create<arith::CmpIOp>(
44baa655SRamiro Leal-Cavazos      arith::CmpIPredicate::ne, roundMaskedMantissa, c0);
44baa655SRamiro Leal-Cavazos  roundIsNotEvenOrSpecialVal =
44baa655SRamiro Leal-Cavazos      b.create<arith::OrIOp>(roundIsNotEvenOrSpecialVal, roundBiasedExpEq0);
44baa655SRamiro Leal-Cavazos
44baa655SRamiro Leal-Cavazos  // A value `x` with `0 <= biasedExp < 23`, is halfway between two consecutive
44baa655SRamiro Leal-Cavazos  // integers if the bit at index `biasedExp` starting from the left in the
44baa655SRamiro Leal-Cavazos  // mantissa is 1 and all the bits to the right are zero. Values with
44baa655SRamiro Leal-Cavazos  // `biasedExp >= 23` don't have decimals, so they are never halfway. The
44baa655SRamiro Leal-Cavazos  // values +-0.5 are the only halfway values that have `biasedExp == -1 < 0`,
44baa655SRamiro Leal-Cavazos  // so these are handled separately. In particular, if `biasedExp == -1`, the
44baa655SRamiro Leal-Cavazos  // value is halfway if the entire mantissa is zero.
44baa655SRamiro Leal-Cavazos  Value operandBiasedExpEqNeg1 = b.create<arith::CmpIOp>(
44baa655SRamiro Leal-Cavazos      arith::CmpIPredicate::eq, operandBiasedExp, cNeg1);
44baa655SRamiro Leal-Cavazos  Value expectedOperandMaskedMantissa = b.create<arith::SelectOp>(
44baa655SRamiro Leal-Cavazos      operandBiasedExpEqNeg1, c0, safeShiftRight(c2To22, operandBiasedExp));
44baa655SRamiro Leal-Cavazos  Value operandMaskedMantissa = maskMantissa(operandBitcast, operandBiasedExp);
44baa655SRamiro Leal-Cavazos  Value operandIsHalfway =
44baa655SRamiro Leal-Cavazos      b.create<arith::CmpIOp>(arith::CmpIPredicate::eq, operandMaskedMantissa,
44baa655SRamiro Leal-Cavazos                              expectedOperandMaskedMantissa);
44baa655SRamiro Leal-Cavazos  // Ensure `biasedExp` is in the valid range for half values.
44baa655SRamiro Leal-Cavazos  Value operandBiasedExpGeNeg1 = b.create<arith::CmpIOp>(
44baa655SRamiro Leal-Cavazos      arith::CmpIPredicate::sge, operandBiasedExp, cNeg1);
44baa655SRamiro Leal-Cavazos  Value operandBiasedExpLt23 =
44baa655SRamiro Leal-Cavazos      b.create<arith::CmpIOp>(arith::CmpIPredicate::slt, operandBiasedExp, c23);
44baa655SRamiro Leal-Cavazos  operandIsHalfway =
44baa655SRamiro Leal-Cavazos      b.create<arith::AndIOp>(operandIsHalfway, operandBiasedExpLt23);
44baa655SRamiro Leal-Cavazos  operandIsHalfway =
44baa655SRamiro Leal-Cavazos      b.create<arith::AndIOp>(operandIsHalfway, operandBiasedExpGeNeg1);
44baa655SRamiro Leal-Cavazos
44baa655SRamiro Leal-Cavazos  // Adjust rounded operand with `round(operand) - sign(operand)` to correct the
44baa655SRamiro Leal-Cavazos  // case where `round` rounded in the opposite direction of `roundeven`.
44baa655SRamiro Leal-Cavazos  Value sign = b.create<math::CopySignOp>(c1Float, operand);
44baa655SRamiro Leal-Cavazos  Value roundShifted = b.create<arith::SubFOp>(round, sign);
44baa655SRamiro Leal-Cavazos  // If the rounded value is even or a special value, we default to the behavior
44baa655SRamiro Leal-Cavazos  // of `math.round`.
44baa655SRamiro Leal-Cavazos  Value needsShift =
44baa655SRamiro Leal-Cavazos      b.create<arith::AndIOp>(roundIsNotEvenOrSpecialVal, operandIsHalfway);
44baa655SRamiro Leal-Cavazos  Value result = b.create<arith::SelectOp>(needsShift, roundShifted, round);
44baa655SRamiro Leal-Cavazos  // The `x - sign` adjustment does not preserve the sign when we are adjusting
44baa655SRamiro Leal-Cavazos  // the value -1 to -0. So here the sign is copied again to ensure that -0.5 is
44baa655SRamiro Leal-Cavazos  // rounded to -0.0.
44baa655SRamiro Leal-Cavazos  result = b.create<math::CopySignOp>(result, operand);
44baa655SRamiro Leal-Cavazos  rewriter.replaceOp(op, result);
44baa655SRamiro Leal-Cavazos  return success();
44baa655SRamiro Leal-Cavazos}
44baa655SRamiro Leal-Cavazos
279a659eSCorentin Ferry// Convert `math.rsqrt` into `arith.divf` + `math.sqrt`
279a659eSCorentin Ferrystatic LogicalResult convertRsqrtOp(math::RsqrtOp op,
279a659eSCorentin Ferry                                    PatternRewriter &rewriter) {
279a659eSCorentin Ferry
279a659eSCorentin Ferry  auto operand = op.getOperand();
279a659eSCorentin Ferry  auto operandTy = operand.getType();
279a659eSCorentin Ferry  auto eTy = getElementTypeOrSelf(operandTy);
279a659eSCorentin Ferry  if (!isa<FloatType>(eTy))
279a659eSCorentin Ferry    return failure();
279a659eSCorentin Ferry
279a659eSCorentin Ferry  Location loc = op->getLoc();
279a659eSCorentin Ferry  auto constOneFloat = createFloatConst(loc, operandTy, 1.0, rewriter);
279a659eSCorentin Ferry  auto sqrtOp = rewriter.create<math::SqrtOp>(loc, operand);
279a659eSCorentin Ferry  rewriter.replaceOpWithNewOp<arith::DivFOp>(op, constOneFloat, sqrtOp);
279a659eSCorentin Ferry  return success();
279a659eSCorentin Ferry}
279a659eSCorentin Ferry
f3bdb56dSRob Sudermanvoid mlir::populateExpandCtlzPattern(RewritePatternSet &patterns) {
f3bdb56dSRob Suderman  patterns.add(convertCtlzOp);
f3bdb56dSRob Suderman}
f3bdb56dSRob Suderman
aa165edcSRob Sudermanvoid mlir::populateExpandSinhPattern(RewritePatternSet &patterns) {
aa165edcSRob Suderman  patterns.add(convertSinhOp);
aa165edcSRob Suderman}
aa165edcSRob Suderman
aa165edcSRob Sudermanvoid mlir::populateExpandCoshPattern(RewritePatternSet &patterns) {
aa165edcSRob Suderman  patterns.add(convertCoshOp);
aa165edcSRob Suderman}
aa165edcSRob Suderman
740e2e90SRobert Sudermanvoid mlir::populateExpandTanPattern(RewritePatternSet &patterns) {
740e2e90SRobert Suderman  patterns.add(convertTanOp);
740e2e90SRobert Suderman}
740e2e90SRobert Suderman
f3bdb56dSRob Sudermanvoid mlir::populateExpandTanhPattern(RewritePatternSet &patterns) {
f3bdb56dSRob Suderman  patterns.add(convertTanhOp);
f3bdb56dSRob Suderman}
a7c2102dSBalaji V. Iyer
a62a7024Sjinchenvoid mlir::populateExpandAsinhPattern(RewritePatternSet &patterns) {
a62a7024Sjinchen  patterns.add(convertAsinhOp);
a62a7024Sjinchen}
a62a7024Sjinchen
a62a7024Sjinchenvoid mlir::populateExpandAcoshPattern(RewritePatternSet &patterns) {
a62a7024Sjinchen  patterns.add(convertAcoshOp);
a62a7024Sjinchen}
a62a7024Sjinchen
a62a7024Sjinchenvoid mlir::populateExpandAtanhPattern(RewritePatternSet &patterns) {
a62a7024Sjinchen  patterns.add(convertAtanhOp);
a62a7024Sjinchen}
a62a7024Sjinchen
a7c2102dSBalaji V. Iyervoid mlir::populateExpandFmaFPattern(RewritePatternSet &patterns) {
a7c2102dSBalaji V. Iyer  patterns.add(convertFmaFOp);
a7c2102dSBalaji V. Iyer}
2217888dSBalaji V. Iyer
2217888dSBalaji V. Iyervoid mlir::populateExpandCeilFPattern(RewritePatternSet &patterns) {
2217888dSBalaji V. Iyer  patterns.add(convertCeilOp);
2217888dSBalaji V. Iyer}
2217888dSBalaji V. Iyer
4da96515SBalaji V. Iyervoid mlir::populateExpandExp2FPattern(RewritePatternSet &patterns) {
4da96515SBalaji V. Iyer  patterns.add(convertExp2fOp);
4da96515SBalaji V. Iyer}
4da96515SBalaji V. Iyer
2d4e8567SBalaji V. Iyervoid mlir::populateExpandPowFPattern(RewritePatternSet &patterns) {
2d4e8567SBalaji V. Iyer  patterns.add(convertPowfOp);
2d4e8567SBalaji V. Iyer}
2d4e8567SBalaji V. Iyer
10a57f3aSPrashant Kumarvoid mlir::populateExpandFPowIPattern(RewritePatternSet &patterns) {
5b702be1SPrashant Kumar  patterns.add(convertFPowIOp);
10a57f3aSPrashant Kumar}
10a57f3aSPrashant Kumar
be911578SBalaji V. Iyervoid mlir::populateExpandRoundFPattern(RewritePatternSet &patterns) {
be911578SBalaji V. Iyer  patterns.add(convertRoundOp);
be911578SBalaji V. Iyer}
be911578SBalaji V. Iyer
44baa655SRamiro Leal-Cavazosvoid mlir::populateExpandRoundEvenPattern(RewritePatternSet &patterns) {
44baa655SRamiro Leal-Cavazos  patterns.add(convertRoundEvenOp);
44baa655SRamiro Leal-Cavazos}
279a659eSCorentin Ferry
279a659eSCorentin Ferryvoid mlir::populateExpandRsqrtPattern(RewritePatternSet &patterns) {
279a659eSCorentin Ferry  patterns.add(convertRsqrtOp);
279a659eSCorentin Ferry}