doxygen/GPUToROCDLPass_8h_source.html

 //===- GPUToROCDLPass.h - Convert GPU kernel to ROCDL dialect ---*- C++ -*-===//

 //

 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

 // See https://llvm.org/LICENSE.txt for license information.

 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

 //

 //===----------------------------------------------------------------------===//

 #ifndef MLIR_CONVERSION_GPUTOROCDL_GPUTOROCDLPASS_H_

 #define MLIR_CONVERSION_GPUTOROCDL_GPUTOROCDLPASS_H_


 #include "mlir/Conversion/GPUToROCDL/Runtimes.h"

 #include "mlir/Conversion/LLVMCommon/LoweringOptions.h"

 #include <memory>


 namespace mlir {

 // Forward declarations. The declarations in this header only name these types

 // (as reference parameters, as a by-value parameter of a function that is

 // declared but not defined here, or as template arguments), so their full

 // definitions do not have to be included.

 class LLVMTypeConverter;

 class ConversionTarget;

 class RewritePatternSet;


 // Pass class template, parameterized on the operation type the pass runs on.

 template <typename OpT>

 class OperationPass;


 namespace amdgpu {

 // Passed by value to populateGpuToROCDLConversionPatterns.

 struct Chipset;

 } // namespace amdgpu


 namespace gpu {

 // Operation type used as the anchor of the pass created by

 // createLowerGpuOpsToROCDLOpsPass.

 class GPUModuleOp;

 } // namespace gpu


 // Defining this macro immediately before including Passes.h.inc selects the

 // section of that file guarded by it. NOTE(review): presumably this is the

 // generated options/declarations for the ConvertGpuOpsToROCDLOps pass; confirm

 // against the generated Passes.h.inc.

 #define GEN_PASS_DECL_CONVERTGPUOPSTOROCDLOPS

 #include "mlir/Conversion/Passes.h.inc"


 /// Collect a set of patterns to convert from the GPU dialect to ROCDL.

 /// If `runtime` is Unknown, gpu.printf will not be lowered.

 /// The resulting pattern set should be run over a gpu.module op.

 ///

 /// \param converter Type converter made available to the patterns; taken by

 ///        const reference. NOTE(review): presumably it must outlive the

 ///        pattern set -- confirm against the definition.

 /// \param patterns  Pattern set that receives the collected patterns.

 /// \param runtime   AMD GPU runtime the kernels target; controls whether

 ///        gpu.printf is lowered (see above).

 /// \param chipset   AMD GPU chipset to generate code for.

 void populateGpuToROCDLConversionPatterns(const LLVMTypeConverter &converter,

                                           RewritePatternSet &patterns,

                                           gpu::amd::Runtime runtime,

                                           amdgpu::Chipset chipset);


 /// Configure target to convert from the GPU dialect to ROCDL.

 ///

 /// \param target Conversion target to configure; taken by non-const reference

 ///        and updated in place. Which operations and dialects are marked

 ///        legal or illegal is decided by the definition, not by this header.

 void configureGpuToROCDLConversionLegality(ConversionTarget &target);


 /// Creates a pass that lowers GPU dialect operations to ROCDL counterparts. The

 /// index bitwidth used for the lowering of the device side index computations

 /// is configurable.

 ///

 /// \param chipset            Name of the target chipset; defaults to "gfx900".

 /// \param indexBitwidth      Bitwidth of the index type; the default,

 ///        kDeriveIndexBitwidthFromDataLayout, asks for the width to be derived

 ///        rather than fixed here.

 /// \param useBarePtrCallConv Defaults to false. NOTE(review): presumably

 ///        selects the bare-pointer calling convention for memref arguments --

 ///        confirm against the pass definition.

 /// \param runtime            AMD GPU runtime to target; defaults to Unknown.

 ///        NOTE(review): presumably forwarded to

 ///        populateGpuToROCDLConversionPatterns, in which case gpu.printf is

 ///        not lowered by default -- confirm.

 /// \returns An owning pointer to a new pass anchored on gpu::GPUModuleOp.

 ///

 /// NOTE(review): std::string is used below, but this header includes only

 /// <memory> directly; <string> is presumably reached through another include.

 /// Consider including <string> explicitly.

 std::unique_ptr<OperationPass<gpu::GPUModuleOp>>

 createLowerGpuOpsToROCDLOpsPass(

     const std::string &chipset = "gfx900",

     unsigned indexBitwidth = kDeriveIndexBitwidthFromDataLayout,

     bool useBarePtrCallConv = false,

     gpu::amd::Runtime runtime = gpu::amd::Runtime::Unknown);


 } // namespace mlir


 #endif // MLIR_CONVERSION_GPUTOROCDL_GPUTOROCDLPASS_H_

LoweringOptions.h

Runtimes.h

mlir::gpu::amd::Runtime
Runtime
Potential runtimes for AMD GPU kernels.
Definition: Runtimes.h:15

mlir
Include the generated interface declarations.
Definition: LocalAliasAnalysis.h:20

mlir::populateGpuToROCDLConversionPatterns
void populateGpuToROCDLConversionPatterns(const LLVMTypeConverter &converter, RewritePatternSet &patterns, gpu::amd::Runtime runtime, amdgpu::Chipset chipset)
Collect a set of patterns to convert from the GPU dialect to ROCDL.
Definition: LowerGpuOpsToROCDLOps.cpp:416

mlir::kDeriveIndexBitwidthFromDataLayout
static constexpr unsigned kDeriveIndexBitwidthFromDataLayout
Value to pass as bitwidth for the index type when the converter is expected to derive the bitwidth from the LLVM data layout.
Definition: LoweringOptions.h:26

mlir::configureGpuToROCDLConversionLegality
void configureGpuToROCDLConversionLegality(ConversionTarget &target)
Configure target to convert from the GPU dialect to ROCDL.
Definition: LowerGpuOpsToROCDLOps.cpp:400

mlir::createLowerGpuOpsToROCDLOpsPass
std::unique_ptr< OperationPass< gpu::GPUModuleOp > > createLowerGpuOpsToROCDLOpsPass(const std::string &chipset="gfx900", unsigned indexBitwidth=kDeriveIndexBitwidthFromDataLayout, bool useBarePtrCallConv=false, gpu::amd::Runtime runtime=gpu::amd::Runtime::Unknown)
Creates a pass that lowers GPU dialect operations to ROCDL counterparts.
Definition: LowerGpuOpsToROCDLOps.cpp:463

mlir::patterns
const FrozenRewritePatternSet & patterns
Definition: GreedyPatternRewriteDriver.h:283

mlir::amdgpu::Chipset
Represents the amdgpu gfx chipset version, e.g., gfx90a, gfx942, gfx1103.
Definition: Chipset.h:22