doxygen/MathToROCDL_8cpp_source.html

 //===-- MathToROCDL.cpp - conversion from Math to rocdl calls -------------===//

 //

 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

 // See https://llvm.org/LICENSE.txt for license information.

 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

 //

 //===----------------------------------------------------------------------===//


 #include "mlir/Conversion/MathToROCDL/MathToROCDL.h"

 #include "mlir/Conversion/LLVMCommon/LoweringOptions.h"

 #include "mlir/Conversion/LLVMCommon/TypeConverter.h"

 #include "mlir/Dialect/Func/IR/FuncOps.h"

 #include "mlir/Dialect/LLVMIR/LLVMDialect.h"

 #include "mlir/Dialect/LLVMIR/ROCDLDialect.h"

 #include "mlir/Dialect/Math/IR/Math.h"

 #include "mlir/Dialect/Utils/IndexingUtils.h"

 #include "mlir/Dialect/Vector/IR/VectorOps.h"

 #include "mlir/IR/BuiltinDialect.h"

 #include "mlir/IR/PatternMatch.h"

 #include "mlir/Pass/Pass.h"

 #include "mlir/Transforms/DialectConversion.h"


 #include "../GPUCommon/GPUOpsLowering.h"

 #include "../GPUCommon/IndexIntrinsicsOpLowering.h"

 #include "../GPUCommon/OpToFuncCallLowering.h"

 #include "mlir/Conversion/GPUCommon/GPUCommonPass.h"


 namespace mlir {

 #define GEN_PASS_DEF_CONVERTMATHTOROCDL

 #include "mlir/Conversion/Passes.h.inc"

 } // namespace mlir


 using namespace mlir;


 #define DEBUG_TYPE "math-to-rocdl"

 #define DBGS() (llvm::dbgs() << "[" DEBUG_TYPE "]: ")


 template <typename OpTy>

 static void populateOpPatterns(const LLVMTypeConverter &converter,

                                RewritePatternSet &patterns, StringRef f32Func,

                                StringRef f64Func, StringRef f16Func,

                                StringRef f32ApproxFunc = "") {

   patterns.add<ScalarizeVectorOpLowering<OpTy>>(converter);

   patterns.add<OpToFuncCallLowering<OpTy>>(converter, f32Func, f64Func,

                                            f32ApproxFunc, f16Func);

 }


 void mlir::populateMathToROCDLConversionPatterns(

     const LLVMTypeConverter &converter, RewritePatternSet &patterns) {

   // Handled by mathToLLVM: math::AbsIOp

   // Handled by mathToLLVM: math::AbsFOp

   // Handled by mathToLLVM: math::CopySignOp

   // Handled by mathToLLVM: math::CountLeadingZerosOp

   // Handled by mathToLLVM: math::CountTrailingZerosOp

   // Handled by mathToLLVM: math::CgPopOp

   // Handled by mathToLLVM: math::ExpOp (32-bit only)

   // Handled by mathToLLVM: math::FmaOp

   // Handled by mathToLLVM: math::LogOp (32-bit only)

   // FIXME: math::IPowIOp

   // Handled by mathToLLVM: math::RoundEvenOp

   // Handled by mathToLLVM: math::RoundOp

   // Handled by mathToLLVM: math::SqrtOp

   // Handled by mathToLLVM: math::TruncOp

   populateOpPatterns<math::AcosOp>(converter, patterns, "__ocml_acos_f32",

                                    "__ocml_acos_f64", "__ocml_acos_f16");

   populateOpPatterns<math::AcoshOp>(converter, patterns, "__ocml_acosh_f32",

                                     "__ocml_acosh_f64", "__ocml_acosh_f16");

   populateOpPatterns<math::AsinOp>(converter, patterns, "__ocml_asin_f32",

                                    "__ocml_asin_f64", "__ocml_asin_f16");

   populateOpPatterns<math::AsinhOp>(converter, patterns, "__ocml_asinh_f32",

                                     "__ocml_asinh_f64", "__ocml_asinh_f16");

   populateOpPatterns<math::AtanOp>(converter, patterns, "__ocml_atan_f32",

                                    "__ocml_atan_f64", "__ocml_atan_f16");

   populateOpPatterns<math::AtanhOp>(converter, patterns, "__ocml_atanh_f32",

                                     "__ocml_atanh_f64", "__ocml_atanh_f16");

   populateOpPatterns<math::Atan2Op>(converter, patterns, "__ocml_atan2_f32",

                                     "__ocml_atan2_f64", "__ocml_atan2_f16");

   populateOpPatterns<math::CbrtOp>(converter, patterns, "__ocml_cbrt_f32",

                                    "__ocml_cbrt_f64", "__ocml_cbrt_f16");

   populateOpPatterns<math::CeilOp>(converter, patterns, "__ocml_ceil_f32",

                                    "__ocml_ceil_f64", "__ocml_ceil_f16");

   populateOpPatterns<math::CosOp>(converter, patterns, "__ocml_cos_f32",

                                   "__ocml_cos_f64", "__ocml_cos_f16");

   populateOpPatterns<math::CoshOp>(converter, patterns, "__ocml_cosh_f32",

                                    "__ocml_cosh_f64", "__ocml_cosh_f16");

   populateOpPatterns<math::SinhOp>(converter, patterns, "__ocml_sinh_f32",

                                    "__ocml_sinh_f64", "__ocml_sinh_f16");

   populateOpPatterns<math::ExpOp>(converter, patterns, "", "__ocml_exp_f64",

                                   "__ocml_exp_f16");

   populateOpPatterns<math::Exp2Op>(converter, patterns, "__ocml_exp2_f32",

                                    "__ocml_exp2_f64", "__ocml_exp2_f16");

   populateOpPatterns<math::ExpM1Op>(converter, patterns, "__ocml_expm1_f32",

                                     "__ocml_expm1_f64", "__ocml_expm1_f16");

   populateOpPatterns<math::FloorOp>(converter, patterns, "__ocml_floor_f32",

                                     "__ocml_floor_f64", "__ocml_floor_f16");

   populateOpPatterns<math::LogOp>(converter, patterns, "", "__ocml_log_f64",

                                   "__ocml_log_f16");

   populateOpPatterns<math::Log10Op>(converter, patterns, "__ocml_log10_f32",

                                     "__ocml_log10_f64", "__ocml_log10_f16");

   populateOpPatterns<math::Log1pOp>(converter, patterns, "__ocml_log1p_f32",

                                     "__ocml_log1p_f64", "__ocml_log1p_f16");

   populateOpPatterns<math::Log2Op>(converter, patterns, "__ocml_log2_f32",

                                    "__ocml_log2_f64", "__ocml_log2_f16");

   populateOpPatterns<math::PowFOp>(converter, patterns, "__ocml_pow_f32",

                                    "__ocml_pow_f64", "__ocml_pow_f16");

   populateOpPatterns<math::RsqrtOp>(converter, patterns, "__ocml_rsqrt_f32",

                                     "__ocml_rsqrt_f64", "__ocml_rsqrt_f16");

   populateOpPatterns<math::SinOp>(converter, patterns, "__ocml_sin_f32",

                                   "__ocml_sin_f64", "__ocml_sin_f16");

   populateOpPatterns<math::TanhOp>(converter, patterns, "__ocml_tanh_f32",

                                    "__ocml_tanh_f64", "__ocml_tanh_f16");

   populateOpPatterns<math::TanOp>(converter, patterns, "__ocml_tan_f32",

                                   "__ocml_tan_f64", "__ocml_tan_f16");

   populateOpPatterns<math::ErfOp>(converter, patterns, "__ocml_erf_f32",

                                   "__ocml_erf_f64", "__ocml_erf_f16");

   populateOpPatterns<math::ErfcOp>(converter, patterns, "__ocml_erfc_f32",

                                    "__ocml_erfc_f64", "__ocml_erfc_f16");

   populateOpPatterns<math::FPowIOp>(converter, patterns, "__ocml_pown_f32",

                                     "__ocml_pown_f64", "__ocml_pown_f16");

   // Single arith pattern that needs a ROCDL call, probably not

   // worth creating a separate pass for it.

   populateOpPatterns<arith::RemFOp>(converter, patterns, "__ocml_fmod_f32",

                                     "__ocml_fmod_f64", "__ocml_fmod_f16");

 }


 namespace {

 struct ConvertMathToROCDLPass

     : public impl::ConvertMathToROCDLBase<ConvertMathToROCDLPass> {

   ConvertMathToROCDLPass() = default;

   void runOnOperation() override;

 };

 } // namespace


 void ConvertMathToROCDLPass::runOnOperation() {

   auto m = getOperation();

   MLIRContext *ctx = m.getContext();


   RewritePatternSet patterns(&getContext());

   LowerToLLVMOptions options(ctx, DataLayout(m));

   LLVMTypeConverter converter(ctx, options);

   populateMathToROCDLConversionPatterns(converter, patterns);

   ConversionTarget target(getContext());

   target.addLegalDialect<BuiltinDialect, func::FuncDialect,

                          vector::VectorDialect, LLVM::LLVMDialect>();

   target.addIllegalOp<LLVM::CosOp, LLVM::ExpOp, LLVM::Exp2Op, LLVM::FAbsOp,

                       LLVM::FCeilOp, LLVM::FFloorOp, LLVM::FRemOp, LLVM::LogOp,

                       LLVM::Log10Op, LLVM::Log2Op, LLVM::PowOp, LLVM::SinOp,

                       LLVM::SqrtOp>();

   if (failed(applyPartialConversion(m, target, std::move(patterns))))

     signalPassFailure();

 }

BuiltinDialect.h

DialectConversion.h

FuncOps.h

GPUCommonPass.h

getContext
static MLIRContext * getContext(OpFoldResult val)
Definition: IndexingUtils.cpp:295

IndexingUtils.h

LLVMDialect.h

LoweringOptions.h

populateOpPatterns
static void populateOpPatterns(const LLVMTypeConverter &converter, RewritePatternSet &patterns, StringRef f32Func, StringRef f64Func, StringRef f16Func, StringRef f32ApproxFunc="")
Definition: MathToROCDL.cpp:39

MathToROCDL.h

options
static llvm::ManagedStatic< PassManagerOptions > options
Definition: PassManagerOptions.cpp:89

PatternMatch.h

ROCDLDialect.h

TypeConverter.h

VectorOps.h

mlir::ConversionTarget
This class describes a specific conversion target.
Definition: DialectConversion.h:869

mlir::DataLayout
The main mechanism for performing data layout queries.
Definition: DataLayoutInterfaces.h:212

mlir::LLVMTypeConverter
Conversion from types to the LLVM IR dialect.
Definition: TypeConverter.h:35

mlir::LowerToLLVMOptions
Options to control the LLVM lowering.
Definition: LoweringOptions.h:30

mlir::MLIRContext
MLIRContext is the top-level object for a collection of MLIR operations.
Definition: MLIRContext.h:60

mlir::RewritePatternSet
Definition: PatternMatch.h:772

Pass.h

Math.h

mlir
Include the generated interface declarations.
Definition: LocalAliasAnalysis.h:20

mlir::patterns
const FrozenRewritePatternSet & patterns
Definition: GreedyPatternRewriteDriver.h:283

mlir::applyPartialConversion
LogicalResult applyPartialConversion(ArrayRef< Operation * > ops, const ConversionTarget &target, const FrozenRewritePatternSet &patterns, ConversionConfig config=ConversionConfig())
Below we define several entry points for operation conversion.
Definition: DialectConversion.cpp:3378

mlir::populateMathToROCDLConversionPatterns
void populateMathToROCDLConversionPatterns(const LLVMTypeConverter &converter, RewritePatternSet &patterns)
Populate the given list with patterns that convert from Math to ROCDL calls.
Definition: MathToROCDL.cpp:48

mlir::OpToFuncCallLowering
Rewriting that replaces SourceOp with a CallOp to f32Func or f64Func or f32ApproxFunc or f16Func or i...
Definition: OpToFuncCallLowering.h:55

mlir::ScalarizeVectorOpLowering
Unrolls SourceOp to array/vector elements.
Definition: GPUOpsLowering.h:185