doxygen/SCFToGPU_8h_source.html

 //===- SCFToGPU.h - Convert loop nests to GPU kernels -----------*- C++ -*-===//

 //

 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

 // See https://llvm.org/LICENSE.txt for license information.

 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

 //

 //===----------------------------------------------------------------------===//

 #ifndef MLIR_CONVERSION_SCFTOGPU_SCFTOGPU_H_

 #define MLIR_CONVERSION_SCFTOGPU_SCFTOGPU_H_


 #include "mlir/Support/LLVM.h"


 namespace mlir {

 // Forward declarations of the MLIR types named in this header.  The function

 // declarations below reference ConversionTarget, Operation, RewritePatternSet

 // and affine::AffineForOp.  MLIRContext, Value and scf::ForOp are declared

 // here but are not used by any declaration visible in this header.

 class ConversionTarget;

 class MLIRContext;

 class Value;

 class Operation;

 class RewritePatternSet;


 namespace affine {

 class AffineForOp;

 } // namespace affine


 namespace scf {

 class ForOp;

 } // namespace scf


 /// Convert a perfect affine loop nest, whose outermost loop is `forOp`, into a

 /// gpu::Launch operation.

 ///

 /// `numBlockDims` outer loops are mapped to GPU blocks and `numThreadDims`

 /// loops are mapped to GPU threads.  The bounds of each mapped loop should be

 /// independent of the induction variables of the other mapped loops.

 ///

 /// No check is performed on the size of the block or grid, or on the validity

 /// of the parallelization; it is the caller's responsibility to strip-mine the

 /// loops and to perform the dependence analysis before calling the conversion.

 ///

 /// The result is a LogicalResult.  The conditions under which the conversion

 /// fails are determined by the implementation and are not visible in this

 /// header.


 // TODO: Consider removing this in favor of affine.for -> affine.parallel

 // detection followed by an affine.parallel -> scf.parallel -> gpu.launch

 // conversion.

 LogicalResult convertAffineLoopNestToGPULaunch(affine::AffineForOp forOp,

                                                unsigned numBlockDims,

                                                unsigned numThreadDims);


 /// Adds the conversion pattern from `scf.parallel` to `gpu.launch` to the

 /// pattern list `patterns`.  The list is taken by non-const reference and is

 /// extended in place; nothing is returned.

 void populateParallelLoopToGPUPatterns(RewritePatternSet &patterns);


 /// Configures the conversion target `target` such that the only `scf.parallel`

 /// operations considered legal are those that are not rewritten by the

 /// provided patterns.

 ///

 /// NOTE(review): "the provided patterns" presumably refers to the patterns

 /// added by populateParallelLoopToGPUPatterns -- confirm against the

 /// implementation.

 void configureParallelLoopToGPULegality(ConversionTarget &target);


 /// Clean up after an applyPartialConversion/applyFullConversion call.

 ///

 /// NOTE(review): `op` is presumably the operation on which the conversion was

 /// run -- confirm against the implementation.  What exactly is cleaned up is

 /// not visible in this header.

 void finalizeParallelLoopToGPUConversion(Operation *op);


 } // namespace mlir


 #endif // MLIR_CONVERSION_SCFTOGPU_SCFTOGPU_H_

mlir::ConversionTarget
This class describes a specific conversion target.
Definition: DialectConversion.h:868

mlir::Operation
Operation is the basic unit of execution within MLIR.
Definition: Operation.h:88

mlir::RewritePatternSet
Definition: PatternMatch.h:772

LLVM.h

mlir::lsp::CompletionItemKind::Value
@ Value

mlir
Include the generated interface declarations.
Definition: LocalAliasAnalysis.h:20

mlir::finalizeParallelLoopToGPUConversion
void finalizeParallelLoopToGPUConversion(Operation *op)
Clean up after applyPartialConversion/applyFullConversion call.
Definition: SCFToGPU.cpp:719

mlir::populateParallelLoopToGPUPatterns
void populateParallelLoopToGPUPatterns(RewritePatternSet &patterns)
Adds the conversion pattern from scf.parallel to gpu.launch to the provided pattern list.
Definition: SCFToGPU.cpp:707

mlir::convertAffineLoopNestToGPULaunch
LogicalResult convertAffineLoopNestToGPULaunch(affine::AffineForOp forOp, unsigned numBlockDims, unsigned numThreadDims)
Convert a perfect affine loop nest with the outermost loop identified by forOp into a gpu::Launch operation.

mlir::patterns
const FrozenRewritePatternSet & patterns
Definition: GreedyPatternRewriteDriver.h:283

mlir::configureParallelLoopToGPULegality
void configureParallelLoopToGPULegality(ConversionTarget &target)
Configures the rewrite target such that only scf.parallel operations that are not rewritten by the provided patterns are legal.
Definition: SCFToGPU.cpp:711