13 #ifndef MLIR_DIALECT_NVGPU_NVGPUDIALECT_H_
14 #define MLIR_DIALECT_NVGPU_NVGPUDIALECT_H_
23 #include "mlir/Dialect/NVGPU/IR/NVGPUEnums.h.inc"
40 #define GET_ATTRDEF_CLASSES
41 #include "mlir/Dialect/NVGPU/IR/NVGPUAttrDefs.h.inc"
43 #define GET_TYPEDEF_CLASSES
44 #include "mlir/Dialect/NVGPU/IR/NVGPUTypes.h.inc"
46 #include "mlir/Dialect/NVGPU/IR/NVGPUDialect.h.inc"
48 #define GET_OP_CLASSES
49 #include "mlir/Dialect/NVGPU/IR/NVGPU.h.inc"
constexpr int kWgmmaSizeM
M size of wgmma.mma_async instruction.
constexpr unsigned kMaxTMATensorDimension
Maximum TMA tile dimension (tensorRank) must be non-zero and less than or equal to the maximum supported dimensionality.
constexpr unsigned kMaxTMADimension
Maximum TMA tile size (boxDim), which specifies the number of elements to be traversed along each of the tensorRank dimensions.
constexpr unsigned kMaxTMALastdimByte
Last dimension of 2D+ TMA must be 128 bytes.