Conversion/MathToSPIRV/MathToSPIRV.cpp

995c3984SLei Zhang//===- MathToSPIRV.cpp - Math to SPIR-V Patterns --------------------------===//
995c3984SLei Zhang//
995c3984SLei Zhang// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
995c3984SLei Zhang// See https://llvm.org/LICENSE.txt for license information.
995c3984SLei Zhang// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
995c3984SLei Zhang//
995c3984SLei Zhang//===----------------------------------------------------------------------===//
995c3984SLei Zhang//
995c3984SLei Zhang// This file implements patterns to convert Math dialect to SPIR-V dialect.
995c3984SLei Zhang//
995c3984SLei Zhang//===----------------------------------------------------------------------===//
995c3984SLei Zhang
a54f4eaeSMogball#include "../SPIRVCommon/Pattern.h"
995c3984SLei Zhang#include "mlir/Dialect/Math/IR/Math.h"
995c3984SLei Zhang#include "mlir/Dialect/SPIRV/IR/SPIRVDialect.h"
995c3984SLei Zhang#include "mlir/Dialect/SPIRV/IR/SPIRVOps.h"
995c3984SLei Zhang#include "mlir/Dialect/SPIRV/Transforms/SPIRVConversion.h"
533ec929SLei Zhang#include "mlir/IR/BuiltinTypes.h"
b9e642afSRobert Suderman#include "mlir/IR/TypeUtilities.h"
cc020a22SLei Zhang#include "mlir/Transforms/DialectConversion.h"
7f7e33c2SJakub Kuderski#include "llvm/ADT/STLExtras.h"
995c3984SLei Zhang#include "llvm/Support/Debug.h"
7f7e33c2SJakub Kuderski#include "llvm/Support/FormatVariadic.h"
995c3984SLei Zhang
995c3984SLei Zhang#define DEBUG_TYPE "math-to-spirv-pattern"
995c3984SLei Zhang
995c3984SLei Zhangusing namespace mlir;
995c3984SLei Zhang
995c3984SLei Zhang//===----------------------------------------------------------------------===//
cc020a22SLei Zhang// Utility functions
cc020a22SLei Zhang//===----------------------------------------------------------------------===//
cc020a22SLei Zhang
cc020a22SLei Zhang/// Creates a 32-bit scalar/vector integer constant. Returns nullptr if the
cc020a22SLei Zhang/// given type is not a 32-bit scalar/vector type.
cc020a22SLei Zhangstatic Value getScalarOrVectorI32Constant(Type type, int value,
cc020a22SLei Zhang                                          OpBuilder &builder, Location loc) {
5550c821STres Popp  if (auto vectorType = dyn_cast<VectorType>(type)) {
cc020a22SLei Zhang    if (!vectorType.getElementType().isInteger(32))
cc020a22SLei Zhang      return nullptr;
cc020a22SLei Zhang    SmallVector<int> values(vectorType.getNumElements(), value);
cc020a22SLei Zhang    return builder.create<spirv::ConstantOp>(loc, type,
cc020a22SLei Zhang                                             builder.getI32VectorAttr(values));
cc020a22SLei Zhang  }
cc020a22SLei Zhang  if (type.isInteger(32))
cc020a22SLei Zhang    return builder.create<spirv::ConstantOp>(loc, type,
cc020a22SLei Zhang                                             builder.getI32IntegerAttr(value));
cc020a22SLei Zhang
cc020a22SLei Zhang  return nullptr;
cc020a22SLei Zhang}
cc020a22SLei Zhang
7f7e33c2SJakub Kuderski/// Check if the type is supported by math-to-spirv conversion. We expect to
7f7e33c2SJakub Kuderski/// only see scalars and vectors at this point, with higher-level types already
7f7e33c2SJakub Kuderski/// lowered.
7f7e33c2SJakub Kuderskistatic bool isSupportedSourceType(Type originalType) {
7f7e33c2SJakub Kuderski  if (originalType.isIntOrIndexOrFloat())
7f7e33c2SJakub Kuderski    return true;
7f7e33c2SJakub Kuderski
5550c821STres Popp  if (auto vecTy = dyn_cast<VectorType>(originalType)) {
7f7e33c2SJakub Kuderski    if (!vecTy.getElementType().isIntOrIndexOrFloat())
7f7e33c2SJakub Kuderski      return false;
7f7e33c2SJakub Kuderski    if (vecTy.isScalable())
7f7e33c2SJakub Kuderski      return false;
7f7e33c2SJakub Kuderski    if (vecTy.getRank() > 1)
7f7e33c2SJakub Kuderski      return false;
7f7e33c2SJakub Kuderski
7f7e33c2SJakub Kuderski    return true;
7f7e33c2SJakub Kuderski  }
7f7e33c2SJakub Kuderski
7f7e33c2SJakub Kuderski  return false;
7f7e33c2SJakub Kuderski}
7f7e33c2SJakub Kuderski
7f7e33c2SJakub Kuderski/// Check if all `sourceOp` types are supported by math-to-spirv conversion.
7f7e33c2SJakub Kuderski/// Notify of a match failure othwerise and return a `failure` result.
7f7e33c2SJakub Kuderski/// This is intended to simplify type checks in `OpConversionPattern`s.
7f7e33c2SJakub Kuderskistatic LogicalResult checkSourceOpTypes(ConversionPatternRewriter &rewriter,
7f7e33c2SJakub Kuderski                                        Operation *sourceOp) {
7f7e33c2SJakub Kuderski  auto allTypes = llvm::to_vector(sourceOp->getOperandTypes());
7f7e33c2SJakub Kuderski  llvm::append_range(allTypes, sourceOp->getResultTypes());
7f7e33c2SJakub Kuderski
7f7e33c2SJakub Kuderski  for (Type ty : allTypes) {
7f7e33c2SJakub Kuderski    if (!isSupportedSourceType(ty)) {
7f7e33c2SJakub Kuderski      return rewriter.notifyMatchFailure(
7f7e33c2SJakub Kuderski          sourceOp,
7f7e33c2SJakub Kuderski          llvm::formatv(
7f7e33c2SJakub Kuderski              "unsupported source type for Math to SPIR-V conversion: {0}",
7f7e33c2SJakub Kuderski              ty));
7f7e33c2SJakub Kuderski    }
7f7e33c2SJakub Kuderski  }
7f7e33c2SJakub Kuderski
7f7e33c2SJakub Kuderski  return success();
7f7e33c2SJakub Kuderski}
7f7e33c2SJakub Kuderski
cc020a22SLei Zhang//===----------------------------------------------------------------------===//
995c3984SLei Zhang// Operation conversion
995c3984SLei Zhang//===----------------------------------------------------------------------===//
995c3984SLei Zhang
// Note that DRR cannot be used for the patterns in this file: we may need to
// convert types along the way, which requires a ConversionPattern, whereas DRR
// generates a normal RewritePattern.
995c3984SLei Zhang
995c3984SLei Zhangnamespace {
7f7e33c2SJakub Kuderski/// Converts elementwise unary, binary, and ternary standard operations to
7f7e33c2SJakub Kuderski/// SPIR-V operations. Checks that source `Op` types are supported.
7f7e33c2SJakub Kuderskitemplate <typename Op, typename SPIRVOp>
7f7e33c2SJakub Kuderskistruct CheckedElementwiseOpPattern final
7f7e33c2SJakub Kuderski    : public spirv::ElementwiseOpPattern<Op, SPIRVOp> {
7f7e33c2SJakub Kuderski  using BasePattern = typename spirv::ElementwiseOpPattern<Op, SPIRVOp>;
7f7e33c2SJakub Kuderski  using BasePattern::BasePattern;
7f7e33c2SJakub Kuderski
7f7e33c2SJakub Kuderski  LogicalResult
7f7e33c2SJakub Kuderski  matchAndRewrite(Op op, typename Op::Adaptor adaptor,
7f7e33c2SJakub Kuderski                  ConversionPatternRewriter &rewriter) const override {
7f7e33c2SJakub Kuderski    if (LogicalResult res = checkSourceOpTypes(rewriter, op); failed(res))
7f7e33c2SJakub Kuderski      return res;
7f7e33c2SJakub Kuderski
7f7e33c2SJakub Kuderski    return BasePattern::matchAndRewrite(op, adaptor, rewriter);
7f7e33c2SJakub Kuderski  }
7f7e33c2SJakub Kuderski};
7f7e33c2SJakub Kuderski
533ec929SLei Zhang/// Converts math.copysign to SPIR-V ops.
7f7e33c2SJakub Kuderskistruct CopySignPattern final : public OpConversionPattern<math::CopySignOp> {
533ec929SLei Zhang  using OpConversionPattern::OpConversionPattern;
533ec929SLei Zhang
533ec929SLei Zhang  LogicalResult
533ec929SLei Zhang  matchAndRewrite(math::CopySignOp copySignOp, OpAdaptor adaptor,
533ec929SLei Zhang                  ConversionPatternRewriter &rewriter) const override {
7f7e33c2SJakub Kuderski    if (LogicalResult res = checkSourceOpTypes(rewriter, copySignOp);
7f7e33c2SJakub Kuderski        failed(res))
7f7e33c2SJakub Kuderski      return res;
7f7e33c2SJakub Kuderski
7f7e33c2SJakub Kuderski    Type type = getTypeConverter()->convertType(copySignOp.getType());
533ec929SLei Zhang    if (!type)
533ec929SLei Zhang      return failure();
533ec929SLei Zhang
533ec929SLei Zhang    FloatType floatType;
5550c821STres Popp    if (auto scalarType = dyn_cast<FloatType>(copySignOp.getType())) {
533ec929SLei Zhang      floatType = scalarType;
5550c821STres Popp    } else if (auto vectorType = dyn_cast<VectorType>(copySignOp.getType())) {
5550c821STres Popp      floatType = cast<FloatType>(vectorType.getElementType());
533ec929SLei Zhang    } else {
533ec929SLei Zhang      return failure();
533ec929SLei Zhang    }
533ec929SLei Zhang
533ec929SLei Zhang    Location loc = copySignOp.getLoc();
533ec929SLei Zhang    int bitwidth = floatType.getWidth();
533ec929SLei Zhang    Type intType = rewriter.getIntegerType(bitwidth);
5f14aee3SStella Stamenova    uint64_t intValue = uint64_t(1) << (bitwidth - 1);
533ec929SLei Zhang
533ec929SLei Zhang    Value signMask = rewriter.create<spirv::ConstantOp>(
5f14aee3SStella Stamenova        loc, intType, rewriter.getIntegerAttr(intType, intValue));
533ec929SLei Zhang    Value valueMask = rewriter.create<spirv::ConstantOp>(
5f14aee3SStella Stamenova        loc, intType, rewriter.getIntegerAttr(intType, intValue - 1u));
533ec929SLei Zhang
5550c821STres Popp    if (auto vectorType = dyn_cast<VectorType>(type)) {
533ec929SLei Zhang      assert(vectorType.getRank() == 1);
533ec929SLei Zhang      int count = vectorType.getNumElements();
533ec929SLei Zhang      intType = VectorType::get(count, intType);
533ec929SLei Zhang
533ec929SLei Zhang      SmallVector<Value> signSplat(count, signMask);
533ec929SLei Zhang      signMask =
533ec929SLei Zhang          rewriter.create<spirv::CompositeConstructOp>(loc, intType, signSplat);
533ec929SLei Zhang
533ec929SLei Zhang      SmallVector<Value> valueSplat(count, valueMask);
533ec929SLei Zhang      valueMask = rewriter.create<spirv::CompositeConstructOp>(loc, intType,
533ec929SLei Zhang                                                               valueSplat);
533ec929SLei Zhang    }
533ec929SLei Zhang
533ec929SLei Zhang    Value lhsCast =
533ec929SLei Zhang        rewriter.create<spirv::BitcastOp>(loc, intType, adaptor.getLhs());
533ec929SLei Zhang    Value rhsCast =
533ec929SLei Zhang        rewriter.create<spirv::BitcastOp>(loc, intType, adaptor.getRhs());
533ec929SLei Zhang
533ec929SLei Zhang    Value value = rewriter.create<spirv::BitwiseAndOp>(
533ec929SLei Zhang        loc, intType, ValueRange{lhsCast, valueMask});
533ec929SLei Zhang    Value sign = rewriter.create<spirv::BitwiseAndOp>(
533ec929SLei Zhang        loc, intType, ValueRange{rhsCast, signMask});
533ec929SLei Zhang
533ec929SLei Zhang    Value result = rewriter.create<spirv::BitwiseOrOp>(loc, intType,
533ec929SLei Zhang                                                       ValueRange{value, sign});
533ec929SLei Zhang    rewriter.replaceOpWithNewOp<spirv::BitcastOp>(copySignOp, type, result);
533ec929SLei Zhang    return success();
533ec929SLei Zhang  }
533ec929SLei Zhang};
533ec929SLei Zhang
cc020a22SLei Zhang/// Converts math.ctlz to SPIR-V ops.
cc020a22SLei Zhang///
cc020a22SLei Zhang/// SPIR-V does not have a direct operations for counting leading zeros. If
52b630daSJakub Kuderski/// Shader capability is supported, we can leverage GL FindUMsb to calculate
cc020a22SLei Zhang/// it.
7f7e33c2SJakub Kuderskistruct CountLeadingZerosPattern final
cc020a22SLei Zhang    : public OpConversionPattern<math::CountLeadingZerosOp> {
cc020a22SLei Zhang  using OpConversionPattern::OpConversionPattern;
cc020a22SLei Zhang
cc020a22SLei Zhang  LogicalResult
cc020a22SLei Zhang  matchAndRewrite(math::CountLeadingZerosOp countOp, OpAdaptor adaptor,
cc020a22SLei Zhang                  ConversionPatternRewriter &rewriter) const override {
7f7e33c2SJakub Kuderski    if (LogicalResult res = checkSourceOpTypes(rewriter, countOp); failed(res))
7f7e33c2SJakub Kuderski      return res;
7f7e33c2SJakub Kuderski
7f7e33c2SJakub Kuderski    Type type = getTypeConverter()->convertType(countOp.getType());
cc020a22SLei Zhang    if (!type)
cc020a22SLei Zhang      return failure();
cc020a22SLei Zhang
cc020a22SLei Zhang    // We can only support 32-bit integer types for now.
cc020a22SLei Zhang    unsigned bitwidth = 0;
5550c821STres Popp    if (isa<IntegerType>(type))
cc020a22SLei Zhang      bitwidth = type.getIntOrFloatBitWidth();
5550c821STres Popp    if (auto vectorType = dyn_cast<VectorType>(type))
cc020a22SLei Zhang      bitwidth = vectorType.getElementTypeBitWidth();
cc020a22SLei Zhang    if (bitwidth != 32)
cc020a22SLei Zhang      return failure();
cc020a22SLei Zhang
cc020a22SLei Zhang    Location loc = countOp.getLoc();
2320a4aeSLei Zhang    Value input = adaptor.getOperand();
2320a4aeSLei Zhang    Value val1 = getScalarOrVectorI32Constant(type, 1, rewriter, loc);
cc020a22SLei Zhang    Value val31 = getScalarOrVectorI32Constant(type, 31, rewriter, loc);
2320a4aeSLei Zhang    Value val32 = getScalarOrVectorI32Constant(type, 32, rewriter, loc);
2320a4aeSLei Zhang
52b630daSJakub Kuderski    Value msb = rewriter.create<spirv::GLFindUMsbOp>(loc, input);
2320a4aeSLei Zhang    // We need to subtract from 31 given that the index returned by GLSL
2320a4aeSLei Zhang    // FindUMsb is counted from the least significant bit. Theoretically this
2320a4aeSLei Zhang    // also gives the correct result even if the integer has all zero bits, in
52b630daSJakub Kuderski    // which case GL FindUMsb would return -1.
2320a4aeSLei Zhang    Value subMsb = rewriter.create<spirv::ISubOp>(loc, val31, msb);
2320a4aeSLei Zhang    // However, certain Vulkan implementations have driver bugs for the corner
2320a4aeSLei Zhang    // case where the input is zero. And.. it can be smart to optimize a select
2320a4aeSLei Zhang    // only involving the corner case. So separately compute the result when the
2320a4aeSLei Zhang    // input is either zero or one.
2320a4aeSLei Zhang    Value subInput = rewriter.create<spirv::ISubOp>(loc, val32, input);
2320a4aeSLei Zhang    Value cmp = rewriter.create<spirv::ULessThanEqualOp>(loc, input, val1);
2320a4aeSLei Zhang    rewriter.replaceOpWithNewOp<spirv::SelectOp>(countOp, cmp, subInput,
2320a4aeSLei Zhang                                                 subMsb);
cc020a22SLei Zhang    return success();
cc020a22SLei Zhang  }
cc020a22SLei Zhang};
cc020a22SLei Zhang
3e746c6dSRob Suderman/// Converts math.expm1 to SPIR-V ops.
3e746c6dSRob Suderman///
3e746c6dSRob Suderman/// SPIR-V does not have a direct operations for exp(x)-1. Explicitly lower to
3e746c6dSRob Suderman/// these operations.
3e746c6dSRob Sudermantemplate <typename ExpOp>
533ec929SLei Zhangstruct ExpM1OpPattern final : public OpConversionPattern<math::ExpM1Op> {
533ec929SLei Zhang  using OpConversionPattern::OpConversionPattern;
3e746c6dSRob Suderman
3e746c6dSRob Suderman  LogicalResult
3e746c6dSRob Suderman  matchAndRewrite(math::ExpM1Op operation, OpAdaptor adaptor,
3e746c6dSRob Suderman                  ConversionPatternRewriter &rewriter) const override {
3e746c6dSRob Suderman    assert(adaptor.getOperands().size() == 1);
7f7e33c2SJakub Kuderski    if (LogicalResult res = checkSourceOpTypes(rewriter, operation);
7f7e33c2SJakub Kuderski        failed(res))
7f7e33c2SJakub Kuderski      return res;
7f7e33c2SJakub Kuderski
3e746c6dSRob Suderman    Location loc = operation.getLoc();
7f7e33c2SJakub Kuderski    Type type = this->getTypeConverter()->convertType(operation.getType());
7f7e33c2SJakub Kuderski    if (!type)
7f7e33c2SJakub Kuderski      return failure();
7f7e33c2SJakub Kuderski
7f7e33c2SJakub Kuderski    Value exp = rewriter.create<ExpOp>(loc, type, adaptor.getOperand());
3e746c6dSRob Suderman    auto one = spirv::ConstantOp::getOne(type, loc, rewriter);
3e746c6dSRob Suderman    rewriter.replaceOpWithNewOp<spirv::FSubOp>(operation, exp, one);
3e746c6dSRob Suderman    return success();
3e746c6dSRob Suderman  }
3e746c6dSRob Suderman};
3e746c6dSRob Suderman
995c3984SLei Zhang/// Converts math.log1p to SPIR-V ops.
995c3984SLei Zhang///
995c3984SLei Zhang/// SPIR-V does not have a direct operations for log(1+x). Explicitly lower to
995c3984SLei Zhang/// these operations.
75a1bee0SButygintemplate <typename LogOp>
533ec929SLei Zhangstruct Log1pOpPattern final : public OpConversionPattern<math::Log1pOp> {
533ec929SLei Zhang  using OpConversionPattern::OpConversionPattern;
995c3984SLei Zhang
995c3984SLei Zhang  LogicalResult
b54c724bSRiver Riddle  matchAndRewrite(math::Log1pOp operation, OpAdaptor adaptor,
995c3984SLei Zhang                  ConversionPatternRewriter &rewriter) const override {
b54c724bSRiver Riddle    assert(adaptor.getOperands().size() == 1);
7f7e33c2SJakub Kuderski    if (LogicalResult res = checkSourceOpTypes(rewriter, operation);
7f7e33c2SJakub Kuderski        failed(res))
7f7e33c2SJakub Kuderski      return res;
7f7e33c2SJakub Kuderski
995c3984SLei Zhang    Location loc = operation.getLoc();
7f7e33c2SJakub Kuderski    Type type = this->getTypeConverter()->convertType(operation.getType());
7f7e33c2SJakub Kuderski    if (!type)
7f7e33c2SJakub Kuderski      return failure();
7f7e33c2SJakub Kuderski
995c3984SLei Zhang    auto one = spirv::ConstantOp::getOne(type, operation.getLoc(), rewriter);
7f7e33c2SJakub Kuderski    Value onePlus =
3e746c6dSRob Suderman        rewriter.create<spirv::FAddOp>(loc, one, adaptor.getOperand());
75a1bee0SButygin    rewriter.replaceOpWithNewOp<LogOp>(operation, type, onePlus);
995c3984SLei Zhang    return success();
995c3984SLei Zhang  }
995c3984SLei Zhang};
06c6758aSLei Zhang
8d165136Smeehatpa/// Converts math.log2 and math.log10 to SPIR-V ops.
8d165136Smeehatpa///
8d165136Smeehatpa/// SPIR-V does not have direct operations for log2 and log10. Explicitly
8d165136Smeehatpa/// lower to these operations using:
8d165136Smeehatpa///   log2(x) = log(x) * 1/log(2)
8d165136Smeehatpa///   log10(x) = log(x) * 1/log(10)
8d165136Smeehatpa
8d165136Smeehatpatemplate <typename MathLogOp, typename SpirvLogOp>
8d165136Smeehatpastruct Log2Log10OpPattern final : public OpConversionPattern<MathLogOp> {
8d165136Smeehatpa  using OpConversionPattern<MathLogOp>::OpConversionPattern;
8d165136Smeehatpa  using typename OpConversionPattern<MathLogOp>::OpAdaptor;
8d165136Smeehatpa
8d165136Smeehatpa  static constexpr double log2Reciprocal =
8d165136Smeehatpa      1.442695040888963407359924681001892137426645954152985934135449407;
8d165136Smeehatpa  static constexpr double log10Reciprocal =
8d165136Smeehatpa      0.4342944819032518276511289189166050822943970058036665661144537832;
8d165136Smeehatpa
8d165136Smeehatpa  LogicalResult
8d165136Smeehatpa  matchAndRewrite(MathLogOp operation, OpAdaptor adaptor,
8d165136Smeehatpa                  ConversionPatternRewriter &rewriter) const override {
8d165136Smeehatpa    assert(adaptor.getOperands().size() == 1);
8d165136Smeehatpa    if (LogicalResult res = checkSourceOpTypes(rewriter, operation);
8d165136Smeehatpa        failed(res))
8d165136Smeehatpa      return res;
8d165136Smeehatpa
8d165136Smeehatpa    Location loc = operation.getLoc();
8d165136Smeehatpa    Type type = this->getTypeConverter()->convertType(operation.getType());
8d165136Smeehatpa    if (!type)
8d165136Smeehatpa      return rewriter.notifyMatchFailure(operation, "type conversion failed");
8d165136Smeehatpa
8d165136Smeehatpa    auto getConstantValue = [&](double value) {
8d165136Smeehatpa      if (auto floatType = dyn_cast<FloatType>(type)) {
8d165136Smeehatpa        return rewriter.create<spirv::ConstantOp>(
8d165136Smeehatpa            loc, type, rewriter.getFloatAttr(floatType, value));
8d165136Smeehatpa      }
8d165136Smeehatpa      if (auto vectorType = dyn_cast<VectorType>(type)) {
8d165136Smeehatpa        Type elemType = vectorType.getElementType();
8d165136Smeehatpa
8d165136Smeehatpa        if (isa<FloatType>(elemType)) {
8d165136Smeehatpa          return rewriter.create<spirv::ConstantOp>(
8d165136Smeehatpa              loc, type,
8d165136Smeehatpa              DenseFPElementsAttr::get(
8d165136Smeehatpa                  vectorType, FloatAttr::get(elemType, value).getValue()));
8d165136Smeehatpa        }
8d165136Smeehatpa      }
8d165136Smeehatpa
8d165136Smeehatpa      llvm_unreachable("unimplemented types for log2/log10");
8d165136Smeehatpa    };
8d165136Smeehatpa
8d165136Smeehatpa    Value constantValue = getConstantValue(
8d165136Smeehatpa        std::is_same<MathLogOp, math::Log2Op>() ? log2Reciprocal
8d165136Smeehatpa                                                : log10Reciprocal);
8d165136Smeehatpa    Value log = rewriter.create<SpirvLogOp>(loc, adaptor.getOperand());
8d165136Smeehatpa    rewriter.replaceOpWithNewOp<spirv::FMulOp>(operation, type, log,
8d165136Smeehatpa                                               constantValue);
8d165136Smeehatpa    return success();
8d165136Smeehatpa  }
8d165136Smeehatpa};
8d165136Smeehatpa
06c6758aSLei Zhang/// Converts math.powf to SPIRV-Ops.
06c6758aSLei Zhangstruct PowFOpPattern final : public OpConversionPattern<math::PowFOp> {
06c6758aSLei Zhang  using OpConversionPattern::OpConversionPattern;
06c6758aSLei Zhang
06c6758aSLei Zhang  LogicalResult
06c6758aSLei Zhang  matchAndRewrite(math::PowFOp powfOp, OpAdaptor adaptor,
06c6758aSLei Zhang                  ConversionPatternRewriter &rewriter) const override {
7f7e33c2SJakub Kuderski    if (LogicalResult res = checkSourceOpTypes(rewriter, powfOp); failed(res))
7f7e33c2SJakub Kuderski      return res;
7f7e33c2SJakub Kuderski
7f7e33c2SJakub Kuderski    Type dstType = getTypeConverter()->convertType(powfOp.getType());
06c6758aSLei Zhang    if (!dstType)
06c6758aSLei Zhang      return failure();
06c6758aSLei Zhang
58839f2eSDaniel Garvey    // Get the scalar float type.
58839f2eSDaniel Garvey    FloatType scalarFloatType;
5550c821STres Popp    if (auto scalarType = dyn_cast<FloatType>(powfOp.getType())) {
58839f2eSDaniel Garvey      scalarFloatType = scalarType;
5550c821STres Popp    } else if (auto vectorType = dyn_cast<VectorType>(powfOp.getType())) {
5550c821STres Popp      scalarFloatType = cast<FloatType>(vectorType.getElementType());
58839f2eSDaniel Garvey    } else {
58839f2eSDaniel Garvey      return failure();
58839f2eSDaniel Garvey    }
58839f2eSDaniel Garvey
58839f2eSDaniel Garvey    // Get int type of the same shape as the float type.
58839f2eSDaniel Garvey    Type scalarIntType = rewriter.getIntegerType(32);
58839f2eSDaniel Garvey    Type intType = scalarIntType;
*b9314a82SDmitriy Smirnov    auto operandType = adaptor.getRhs().getType();
*b9314a82SDmitriy Smirnov    if (auto vectorType = dyn_cast<VectorType>(operandType)) {
58839f2eSDaniel Garvey      auto shape = vectorType.getShape();
58839f2eSDaniel Garvey      intType = VectorType::get(shape, scalarIntType);
58839f2eSDaniel Garvey    }
58839f2eSDaniel Garvey
52b630daSJakub Kuderski    // Per GL Pow extended instruction spec:
06c6758aSLei Zhang    // "Result is undefined if x < 0. Result is undefined if x = 0 and y <= 0."
06c6758aSLei Zhang    Location loc = powfOp.getLoc();
*b9314a82SDmitriy Smirnov    Value zero = spirv::ConstantOp::getZero(operandType, loc, rewriter);
06c6758aSLei Zhang    Value lessThan =
06c6758aSLei Zhang        rewriter.create<spirv::FOrdLessThanOp>(loc, adaptor.getLhs(), zero);
*b9314a82SDmitriy Smirnov
*b9314a82SDmitriy Smirnov    // Per C/C++ spec:
*b9314a82SDmitriy Smirnov    // > pow(base, exponent) returns NaN (and raises FE_INVALID) if base is
*b9314a82SDmitriy Smirnov    // > finite and negative and exponent is finite and non-integer.
*b9314a82SDmitriy Smirnov    // Calculate the reminder from the exponent and check whether it is zero.
*b9314a82SDmitriy Smirnov    Value floatOne = spirv::ConstantOp::getOne(operandType, loc, rewriter);
*b9314a82SDmitriy Smirnov    Value expRem =
*b9314a82SDmitriy Smirnov        rewriter.create<spirv::FRemOp>(loc, adaptor.getRhs(), floatOne);
*b9314a82SDmitriy Smirnov    Value expRemNonZero =
*b9314a82SDmitriy Smirnov        rewriter.create<spirv::FOrdNotEqualOp>(loc, expRem, zero);
*b9314a82SDmitriy Smirnov    Value cmpNegativeWithFractionalExp =
*b9314a82SDmitriy Smirnov        rewriter.create<spirv::LogicalAndOp>(loc, expRemNonZero, lessThan);
*b9314a82SDmitriy Smirnov    // Create NaN result and replace base value if conditions are met.
*b9314a82SDmitriy Smirnov    const auto &floatSemantics = scalarFloatType.getFloatSemantics();
*b9314a82SDmitriy Smirnov    const auto nan = APFloat::getNaN(floatSemantics);
*b9314a82SDmitriy Smirnov    Attribute nanAttr = rewriter.getFloatAttr(scalarFloatType, nan);
*b9314a82SDmitriy Smirnov    if (auto vectorType = dyn_cast<VectorType>(operandType))
*b9314a82SDmitriy Smirnov      nanAttr = DenseElementsAttr::get(vectorType, nan);
*b9314a82SDmitriy Smirnov
*b9314a82SDmitriy Smirnov    Value NanValue =
*b9314a82SDmitriy Smirnov        rewriter.create<spirv::ConstantOp>(loc, operandType, nanAttr);
*b9314a82SDmitriy Smirnov    Value lhs = rewriter.create<spirv::SelectOp>(
*b9314a82SDmitriy Smirnov        loc, cmpNegativeWithFractionalExp, NanValue, adaptor.getLhs());
*b9314a82SDmitriy Smirnov    Value abs = rewriter.create<spirv::GLFAbsOp>(loc, lhs);
58839f2eSDaniel Garvey
58839f2eSDaniel Garvey    // TODO: The following just forcefully casts y into an integer value in
58839f2eSDaniel Garvey    // order to properly propagate the sign, assuming integer y cases. It
58839f2eSDaniel Garvey    // doesn't cover other cases and should be fixed.
58839f2eSDaniel Garvey
58839f2eSDaniel Garvey    // Cast exponent to integer and calculate exponent % 2 != 0.
58839f2eSDaniel Garvey    Value intRhs =
58839f2eSDaniel Garvey        rewriter.create<spirv::ConvertFToSOp>(loc, intType, adaptor.getRhs());
58839f2eSDaniel Garvey    Value intOne = spirv::ConstantOp::getOne(intType, loc, rewriter);
58839f2eSDaniel Garvey    Value bitwiseAndOne =
58839f2eSDaniel Garvey        rewriter.create<spirv::BitwiseAndOp>(loc, intRhs, intOne);
58839f2eSDaniel Garvey    Value isOdd = rewriter.create<spirv::IEqualOp>(loc, bitwiseAndOne, intOne);
58839f2eSDaniel Garvey
58839f2eSDaniel Garvey    // calculate pow based on abs(lhs)^rhs.
52b630daSJakub Kuderski    Value pow = rewriter.create<spirv::GLPowOp>(loc, abs, adaptor.getRhs());
06c6758aSLei Zhang    Value negate = rewriter.create<spirv::FNegateOp>(loc, pow);
58839f2eSDaniel Garvey    // if the exponent is odd and lhs < 0, negate the result.
58839f2eSDaniel Garvey    Value shouldNegate =
58839f2eSDaniel Garvey        rewriter.create<spirv::LogicalAndOp>(loc, lessThan, isOdd);
58839f2eSDaniel Garvey    rewriter.replaceOpWithNewOp<spirv::SelectOp>(powfOp, shouldNegate, negate,
58839f2eSDaniel Garvey                                                 pow);
06c6758aSLei Zhang    return success();
06c6758aSLei Zhang  }
06c6758aSLei Zhang};
06c6758aSLei Zhang
b9e642afSRobert Suderman/// Converts math.round to GLSL SPIRV extended ops.
b9e642afSRobert Sudermanstruct RoundOpPattern final : public OpConversionPattern<math::RoundOp> {
b9e642afSRobert Suderman  using OpConversionPattern::OpConversionPattern;
b9e642afSRobert Suderman
b9e642afSRobert Suderman  LogicalResult
b9e642afSRobert Suderman  matchAndRewrite(math::RoundOp roundOp, OpAdaptor adaptor,
b9e642afSRobert Suderman                  ConversionPatternRewriter &rewriter) const override {
7f7e33c2SJakub Kuderski    if (LogicalResult res = checkSourceOpTypes(rewriter, roundOp); failed(res))
7f7e33c2SJakub Kuderski      return res;
7f7e33c2SJakub Kuderski
b9e642afSRobert Suderman    Location loc = roundOp.getLoc();
7f7e33c2SJakub Kuderski    Value operand = roundOp.getOperand();
7f7e33c2SJakub Kuderski    Type ty = operand.getType();
7f7e33c2SJakub Kuderski    Type ety = getElementTypeOrSelf(ty);
b9e642afSRobert Suderman
b9e642afSRobert Suderman    auto zero = spirv::ConstantOp::getZero(ty, loc, rewriter);
b9e642afSRobert Suderman    auto one = spirv::ConstantOp::getOne(ty, loc, rewriter);
b9e642afSRobert Suderman    Value half;
5550c821STres Popp    if (VectorType vty = dyn_cast<VectorType>(ty)) {
b9e642afSRobert Suderman      half = rewriter.create<spirv::ConstantOp>(
b9e642afSRobert Suderman          loc, vty,
b9e642afSRobert Suderman          DenseElementsAttr::get(vty,
b9e642afSRobert Suderman                                 rewriter.getFloatAttr(ety, 0.5).getValue()));
b9e642afSRobert Suderman    } else {
b9e642afSRobert Suderman      half = rewriter.create<spirv::ConstantOp>(
b9e642afSRobert Suderman          loc, ty, rewriter.getFloatAttr(ety, 0.5));
b9e642afSRobert Suderman    }
b9e642afSRobert Suderman
52b630daSJakub Kuderski    auto abs = rewriter.create<spirv::GLFAbsOp>(loc, operand);
52b630daSJakub Kuderski    auto floor = rewriter.create<spirv::GLFloorOp>(loc, abs);
b9e642afSRobert Suderman    auto sub = rewriter.create<spirv::FSubOp>(loc, abs, floor);
b9e642afSRobert Suderman    auto greater =
b9e642afSRobert Suderman        rewriter.create<spirv::FOrdGreaterThanEqualOp>(loc, sub, half);
b9e642afSRobert Suderman    auto select = rewriter.create<spirv::SelectOp>(loc, greater, one, zero);
b9e642afSRobert Suderman    auto add = rewriter.create<spirv::FAddOp>(loc, floor, select);
b9e642afSRobert Suderman    rewriter.replaceOpWithNewOp<math::CopySignOp>(roundOp, add, operand);
b9e642afSRobert Suderman    return success();
b9e642afSRobert Suderman  }
b9e642afSRobert Suderman};
b9e642afSRobert Suderman
995c3984SLei Zhang} // namespace
995c3984SLei Zhang
995c3984SLei Zhang//===----------------------------------------------------------------------===//
995c3984SLei Zhang// Pattern population
995c3984SLei Zhang//===----------------------------------------------------------------------===//
995c3984SLei Zhang
995c3984SLei Zhangnamespace mlir {
206fad0eSMatthias Springervoid populateMathToSPIRVPatterns(const SPIRVTypeConverter &typeConverter,
995c3984SLei Zhang                                 RewritePatternSet &patterns) {
533ec929SLei Zhang  // Core patterns
533ec929SLei Zhang  patterns.add<CopySignPattern>(typeConverter, patterns.getContext());
75a1bee0SButygin
75a1bee0SButygin  // GLSL patterns
d9edc1a5SThomas Raoux  patterns
52b630daSJakub Kuderski      .add<CountLeadingZerosPattern, Log1pOpPattern<spirv::GLLogOp>,
8d165136Smeehatpa           Log2Log10OpPattern<math::Log2Op, spirv::GLLogOp>,
8d165136Smeehatpa           Log2Log10OpPattern<math::Log10Op, spirv::GLLogOp>,
52b630daSJakub Kuderski           ExpM1OpPattern<spirv::GLExpOp>, PowFOpPattern, RoundOpPattern,
7f7e33c2SJakub Kuderski           CheckedElementwiseOpPattern<math::AbsFOp, spirv::GLFAbsOp>,
7f7e33c2SJakub Kuderski           CheckedElementwiseOpPattern<math::AbsIOp, spirv::GLSAbsOp>,
49777d7fSmeehatpa           CheckedElementwiseOpPattern<math::AtanOp, spirv::GLAtanOp>,
7f7e33c2SJakub Kuderski           CheckedElementwiseOpPattern<math::CeilOp, spirv::GLCeilOp>,
7f7e33c2SJakub Kuderski           CheckedElementwiseOpPattern<math::CosOp, spirv::GLCosOp>,
7f7e33c2SJakub Kuderski           CheckedElementwiseOpPattern<math::ExpOp, spirv::GLExpOp>,
7f7e33c2SJakub Kuderski           CheckedElementwiseOpPattern<math::FloorOp, spirv::GLFloorOp>,
7f7e33c2SJakub Kuderski           CheckedElementwiseOpPattern<math::FmaOp, spirv::GLFmaOp>,
7f7e33c2SJakub Kuderski           CheckedElementwiseOpPattern<math::LogOp, spirv::GLLogOp>,
7f7e33c2SJakub Kuderski           CheckedElementwiseOpPattern<math::RoundEvenOp, spirv::GLRoundEvenOp>,
7f7e33c2SJakub Kuderski           CheckedElementwiseOpPattern<math::RsqrtOp, spirv::GLInverseSqrtOp>,
7f7e33c2SJakub Kuderski           CheckedElementwiseOpPattern<math::SinOp, spirv::GLSinOp>,
7f7e33c2SJakub Kuderski           CheckedElementwiseOpPattern<math::SqrtOp, spirv::GLSqrtOp>,
7f7e33c2SJakub Kuderski           CheckedElementwiseOpPattern<math::TanhOp, spirv::GLTanhOp>>(
995c3984SLei Zhang          typeConverter, patterns.getContext());
75a1bee0SButygin
75a1bee0SButygin  // OpenCL patterns
3930cc68SJakub Kuderski  patterns.add<Log1pOpPattern<spirv::CLLogOp>, ExpM1OpPattern<spirv::CLExpOp>,
8d165136Smeehatpa               Log2Log10OpPattern<math::Log2Op, spirv::CLLogOp>,
8d165136Smeehatpa               Log2Log10OpPattern<math::Log10Op, spirv::CLLogOp>,
7f7e33c2SJakub Kuderski               CheckedElementwiseOpPattern<math::AbsFOp, spirv::CLFAbsOp>,
266b5bc1SNishant Patel               CheckedElementwiseOpPattern<math::AbsIOp, spirv::CLSAbsOp>,
49777d7fSmeehatpa               CheckedElementwiseOpPattern<math::AtanOp, spirv::CLAtanOp>,
49777d7fSmeehatpa               CheckedElementwiseOpPattern<math::Atan2Op, spirv::CLAtan2Op>,
7f7e33c2SJakub Kuderski               CheckedElementwiseOpPattern<math::CeilOp, spirv::CLCeilOp>,
7f7e33c2SJakub Kuderski               CheckedElementwiseOpPattern<math::CosOp, spirv::CLCosOp>,
7f7e33c2SJakub Kuderski               CheckedElementwiseOpPattern<math::ErfOp, spirv::CLErfOp>,
7f7e33c2SJakub Kuderski               CheckedElementwiseOpPattern<math::ExpOp, spirv::CLExpOp>,
7f7e33c2SJakub Kuderski               CheckedElementwiseOpPattern<math::FloorOp, spirv::CLFloorOp>,
7f7e33c2SJakub Kuderski               CheckedElementwiseOpPattern<math::FmaOp, spirv::CLFmaOp>,
7f7e33c2SJakub Kuderski               CheckedElementwiseOpPattern<math::LogOp, spirv::CLLogOp>,
7f7e33c2SJakub Kuderski               CheckedElementwiseOpPattern<math::PowFOp, spirv::CLPowOp>,
7f7e33c2SJakub Kuderski               CheckedElementwiseOpPattern<math::RoundEvenOp, spirv::CLRintOp>,
7f7e33c2SJakub Kuderski               CheckedElementwiseOpPattern<math::RoundOp, spirv::CLRoundOp>,
7f7e33c2SJakub Kuderski               CheckedElementwiseOpPattern<math::RsqrtOp, spirv::CLRsqrtOp>,
7f7e33c2SJakub Kuderski               CheckedElementwiseOpPattern<math::SinOp, spirv::CLSinOp>,
7f7e33c2SJakub Kuderski               CheckedElementwiseOpPattern<math::SqrtOp, spirv::CLSqrtOp>,
7f7e33c2SJakub Kuderski               CheckedElementwiseOpPattern<math::TanhOp, spirv::CLTanhOp>>(
75a1bee0SButygin      typeConverter, patterns.getContext());
995c3984SLei Zhang}
995c3984SLei Zhang
995c3984SLei Zhang} // namespace mlir