9#ifndef MLIR_DIALECT_GPU_PIPELINES_PASSES_H_
10#define MLIR_DIALECT_GPU_PIPELINES_PASSES_H_
21 *
this,
"index-bitwidth",
22 llvm::cl::desc(
"Bitwidth of the index type for the host (warning this "
23 "should be 64 until the GPU layering is fixed)"),
26 *
this,
"cubin-triple",
27 llvm::cl::desc(
"Triple to use to serialize to cubin."),
28 llvm::cl::init(
"nvptx64-nvidia-cuda")};
30 *
this,
"cubin-chip", llvm::cl::desc(
"Chip to use to serialize to cubin."),
31 llvm::cl::init(
"sm_75")};
33 *
this,
"cubin-features",
34 llvm::cl::desc(
"Features to use to serialize to cubin."),
37 *
this,
"cubin-format",
38 llvm::cl::desc(
"Compilation format to use to serialize to cubin."),
39 llvm::cl::init(
"fatbin")};
41 *
this,
"ptxas-cmd-options",
43 "Command line options to pass to the downstream compiler."),
47 llvm::cl::desc(
"Optimization level for NVVM compilation"),
50 *
this,
"kernel-bare-ptr-calling-convention",
52 "Whether to use the bareptr calling convention on the kernel "
53 "(warning this should be false until the GPU layering is fixed)"),
54 llvm::cl::init(
false)};
56 *
this,
"host-bare-ptr-calling-convention",
58 "Whether to use the bareptr calling convention on the host (warning "
59 "this should be false until the GPU layering is fixed)"),
60 llvm::cl::init(
false)};
62 *
this,
"allow-pattern-rollback",
63 llvm::cl::desc(
"Allow pattern rollback during dialect conversion"),
64 llvm::cl::init(
true)};
71 *
this,
"index-bitwidth",
72 llvm::cl::desc(
"Bitwidth of the index type for the host (warning this "
73 "should be 64 until the GPU layering is fixed)"),
75 PassOptions::Option<std::string>
triple{
77 llvm::cl::desc(
"AMDGPU target triple (e.g. amdgcn-amd-amdhsa)."),
78 llvm::cl::init(
"amdgcn-amd-amdhsa")};
79 PassOptions::Option<std::string>
chip{
82 "AMDGPU target chip (e.g. gfx90a, gfx942, gfx1100). Required: "
83 "AMDGCN binaries are not forward-compatible across chip families.")};
85 *
this,
"features", llvm::cl::desc(
"AMDGPU target features."),
88 *
this,
"binary-format",
89 llvm::cl::desc(
"Final GPU binary emission format (e.g. fatbin, binary, "
90 "isa, llvm, offloading)."),
91 llvm::cl::init(
"fatbin")};
94 llvm::cl::desc(
"AMDHSA ABI version (e.g. \"500\", \"600\")."),
95 llvm::cl::init(
"600")};
98 llvm::cl::desc(
"Use Wave64 mode (default true; wave32 if false, "
99 "appropriate for RDNA / gfx10+ where supported)."),
100 llvm::cl::init(
true)};
103 llvm::cl::desc(
"Optimization level for ROCDL/AMDGPU compilation."),
106 *
this,
"rocdl-cmd-options",
108 "Command line options to pass to the downstream AMDGPU compiler."),
111 *
this,
"kernel-bare-ptr-calling-convention",
112 llvm::cl::desc(
"Use bareptr calling convention for device kernels."),
113 llvm::cl::init(
false)};
115 *
this,
"host-bare-ptr-calling-convention",
116 llvm::cl::desc(
"Use bareptr calling convention for the host."),
117 llvm::cl::init(
false)};
124 *
this,
"xegpu-op-level",
125 llvm::cl::desc(
"Granularity of XeGPU operations to target: workgroup | "
127 llvm::cl::init(
"workgroup")};
130 *
this,
"use-64bit-index",
131 llvm::cl::desc(
"Bitwidth of the index type (host & device)"),
132 llvm::cl::init(
true)};
134 *
this,
"kernel-bare-ptr-calling-convention",
135 llvm::cl::desc(
"Use bare pointer calling convention for device kernels"),
136 llvm::cl::init(
false)};
138 *
this,
"host-bare-ptr-calling-convention",
139 llvm::cl::desc(
"Use bare pointer calling convention for host launches"),
140 llvm::cl::init(
false)};
142 *
this,
"binary-format",
143 llvm::cl::desc(
"Final GPU binary emission format (e.g. fatbin)"),
144 llvm::cl::init(
"fatbin")};
147 *
this,
"xevm-module-matcher",
148 llvm::cl::desc(
"Regex to match gpu.module names for XeVM target attach"),
151 *
this,
"zebin-triple", llvm::cl::desc(
"Target triple for XeVM codegen"),
152 llvm::cl::init(
"spirv64-unknown-unknown")};
154 *
this,
"zebin-chip", llvm::cl::desc(
"Target chip (e.g. pvc, bmg)"),
155 llvm::cl::init(
"bmg")};
158 llvm::cl::desc(
"Optimization level for attached target/codegen"),
161 *
this,
"igc-cmd-options",
162 llvm::cl::desc(
"Additional downstream compiler command line options"),
174 const GPUToNVVMPipelineOptions &
options);
180 const GPUToROCDLPipelineOptions &
options);
186 const GPUToXeVMPipelineOptions &
options);
static llvm::ManagedStatic< PassManagerOptions > options
This class represents a pass manager that runs passes on either a specific operation type,...
void registerGPUToNVVMPipeline()
Register all pipelines for the gpu dialect.
void registerGPUToXeVMPipeline()
void buildLowerToXeVMPassPipeline(OpPassManager &pm, const GPUToXeVMPipelineOptions &options)
Adds the GPU to XeVM pipeline to the given pass manager.
void registerGPUToROCDLPipeline()
void buildLowerToROCDLPassPipeline(OpPassManager &pm, const GPUToROCDLPipelineOptions &options)
Adds the GPU to ROCDL pipeline to the given pass manager.
void buildLowerToNVVMPassPipeline(OpPassManager &pm, const GPUToNVVMPipelineOptions &options)
Adds the GPU to NVVM pipeline to the given pass manager.
Include the generated interface declarations.
Options for the gpu to nvvm pipeline.
PassOptions::Option< std::string > cubinChip
PassOptions::Option< int > optLevel
PassOptions::Option< bool > allowPatternRollback
PassOptions::Option< bool > hostUseBarePtrCallConv
PassOptions::Option< std::string > cmdOptions
PassOptions::Option< std::string > cubinFeatures
PassOptions::Option< std::string > cubinFormat
PassOptions::Option< int64_t > indexBitWidth
PassOptions::Option< std::string > cubinTriple
PassOptions::Option< bool > kernelUseBarePtrCallConv
Options for the gpu to rocdl pipeline.
PassOptions::Option< std::string > chip
PassOptions::Option< std::string > cmdOptions
PassOptions::Option< int64_t > indexBitWidth
PassOptions::Option< std::string > triple
PassOptions::Option< std::string > abiVersion
PassOptions::Option< bool > hostUseBarePtrCallConv
PassOptions::Option< bool > wave64
PassOptions::Option< bool > kernelUseBarePtrCallConv
PassOptions::Option< std::string > binaryFormat
PassOptions::Option< int > optLevel
PassOptions::Option< std::string > features
PassOptions::Option< bool > hostBarePtrCallConv
PassOptions::Option< unsigned > optLevel
PassOptions::Option< std::string > xegpuOpLevel
PassOptions::Option< std::string > xevmModuleMatcher
PassOptions::Option< std::string > zebinTriple
PassOptions::Option< bool > kernelBarePtrCallConv
PassOptions::Option< std::string > binaryFormat
PassOptions::Option< std::string > cmdOptions
PassOptions::Option< bool > use64bitIndex
PassOptions::Option< std::string > zebinChip