17#define GEN_PASS_DEF_CONVERTAFFINEFORTOGPUPASS
18#define GEN_PASS_DEF_CONVERTPARALLELLOOPTOGPUPASS
19#include "mlir/Conversion/Passes.h.inc"
33 void runOnOperation()
override {
34 for (Operation &op : llvm::make_early_inc_range(
35 getOperation().getFunctionBody().getOps())) {
36 if (
auto forOp = dyn_cast<affine::AffineForOp>(&op)) {
45struct ParallelLoopToGpuPass
47 void runOnOperation()
override {
51 target.markUnknownOpDynamicallyLegal([](Operation *) {
return true; });
53 if (
failed(applyPartialConversion(getOperation(),
target,
Include the generated interface declarations.
void finalizeParallelLoopToGPUConversion(Operation *op)
Clean up after applyPartialConversion/applyFullConversion call.
void populateParallelLoopToGPUPatterns(RewritePatternSet &patterns)
Adds the conversion pattern from scf.parallel to gpu.launch to the provided pattern list.
LogicalResult convertAffineLoopNestToGPULaunch(affine::AffineForOp forOp, unsigned numBlockDims, unsigned numThreadDims)
Convert a perfect affine loop nest with the outermost loop identified by forOp into a gpu::Launch operation.
const FrozenRewritePatternSet & patterns
void configureParallelLoopToGPULegality(ConversionTarget &target)
Configures the rewrite target such that only scf.parallel operations that are not rewritten by the provided patterns are legal.