MLIR 22.0.0git
OpenMPDialect.cpp
Go to the documentation of this file.
1//===- OpenMPDialect.cpp - MLIR Dialect for OpenMP implementation ---------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file implements the OpenMP dialect and its operations.
10//
11//===----------------------------------------------------------------------===//
12
18#include "mlir/IR/Attributes.h"
23#include "mlir/IR/SymbolTable.h"
25
26#include "llvm/ADT/ArrayRef.h"
27#include "llvm/ADT/PostOrderIterator.h"
28#include "llvm/ADT/STLExtras.h"
29#include "llvm/ADT/STLForwardCompat.h"
30#include "llvm/ADT/SmallString.h"
31#include "llvm/ADT/StringExtras.h"
32#include "llvm/ADT/StringRef.h"
33#include "llvm/ADT/TypeSwitch.h"
34#include "llvm/ADT/bit.h"
35#include "llvm/Support/InterleavedRange.h"
36#include <cstddef>
37#include <iterator>
38#include <optional>
39#include <variant>
40
41#include "mlir/Dialect/OpenMP/OpenMPOpsDialect.cpp.inc"
42#include "mlir/Dialect/OpenMP/OpenMPOpsEnums.cpp.inc"
43#include "mlir/Dialect/OpenMP/OpenMPOpsInterfaces.cpp.inc"
44#include "mlir/Dialect/OpenMP/OpenMPTypeInterfaces.cpp.inc"
45
46using namespace mlir;
47using namespace mlir::omp;
48
// An empty `attrs` list yields a null attribute rather than an empty
// ArrayAttr; otherwise the ArrayAttr is built in `context`.
51 return attrs.empty() ? nullptr : ArrayAttr::get(context, attrs);
52}
53
// An empty `boolArray` yields a null attribute rather than an empty
// DenseBoolArrayAttr; otherwise the attribute is built in `ctx`.
56 return boolArray.empty() ? nullptr : DenseBoolArrayAttr::get(ctx, boolArray);
57}
58
// An empty `intArray` yields a null attribute rather than an empty
// DenseI64ArrayAttr; otherwise the attribute is built in `ctx`.
61 return intArray.empty() ? nullptr : DenseI64ArrayAttr::get(ctx, intArray);
62}
63
64namespace {
65struct MemRefPointerLikeModel
66 : public PointerLikeType::ExternalModel<MemRefPointerLikeModel,
67 MemRefType> {
68 Type getElementType(Type pointer) const {
69 return llvm::cast<MemRefType>(pointer).getElementType();
70 }
71};
72
73struct LLVMPointerPointerLikeModel
74 : public PointerLikeType::ExternalModel<LLVMPointerPointerLikeModel,
75 LLVM::LLVMPointerType> {
76 Type getElementType(Type pointer) const { return Type(); }
77};
78} // namespace
79
80/// Generate a name of a canonical loop nest of the format
81/// `<prefix>(_r<idx>_s<idx>)*`. Hereby, `_r<idx>` identifies the region
82/// argument index of an operation that has multiple regions, if the operation
83/// has multiple regions.
84/// `_s<idx>` identifies the position of an operation within a region, where
85/// only operations that may potentially contain loops ("container operations"
86/// i.e. have region arguments) are counted. Again, it is omitted if there is
87/// only one such operation in a region. If there are canonical loops nested
88/// inside each other, the name may also use the format `_d<num>` where <num> is
89/// the nesting depth of the loop.
90///
91/// The generated name is a best-effort to make canonical loop unique within an
92/// SSA namespace. This also means that regions with IsolatedFromAbove property
93/// do not consider any parents or siblings.
///
/// \param prefix Text the generated name starts with.
/// \param op     The canonical loop whose chain of ancestors is encoded.
/// \returns `prefix` followed by one `_r<idx>`, `_d<num>` or `_s<idx>` suffix
///          for every ancestor component that was not marked as skipped,
///          emitted from the outermost to the innermost component.
94static std::string generateLoopNestingName(StringRef prefix,
95 CanonicalLoopOp op) {
96 struct Component {
97 /// If true, this component describes a region operand of an operation (the
98 /// operand's owner). If false, this component describes an operation
99 /// located in a parent region.
100 bool isRegionArgOfOp;
// Set once the component should not contribute a suffix to the name.
101 bool skip = false;
// True if the component needs no index to be told apart from its siblings.
102 bool isUnique = false;
103
// `idx` and `op` are shared storage: depending on `isRegionArgOfOp` they hold
// either (region index, owner op) or (op position, container op). Use the
// asserting accessors below instead of touching them directly.
104 size_t idx;
105 Operation *op;
106 Region *parentRegion;
107 size_t loopDepth;
108
109 Operation *&getOwnerOp() {
110 assert(isRegionArgOfOp && "Must describe a region operand");
111 return op;
112 }
113 size_t &getArgIdx() {
114 assert(isRegionArgOfOp && "Must describe a region operand");
115 return idx;
116 }
117
118 Operation *&getContainerOp() {
119 assert(!isRegionArgOfOp && "Must describe a operation of a region");
120 return op;
121 }
122 size_t &getOpPos() {
123 assert(!isRegionArgOfOp && "Must describe a operation of a region");
124 return idx;
125 }
126 bool isLoopOp() const {
127 assert(!isRegionArgOfOp && "Must describe a operation of a region");
128 return isa<CanonicalLoopOp>(op);
129 }
130 Region *&getParentRegion() {
131 assert(!isRegionArgOfOp && "Must describe a operation of a region");
132 return parentRegion;
133 }
134 size_t &getLoopDepth() {
135 assert(!isRegionArgOfOp && "Must describe a operation of a region");
136 return loopDepth;
137 }
138
// Skip flags only accumulate: once set, a later `skipIf(false)` keeps it set.
139 void skipIf(bool v = true) { skip = skip || v; }
140 };
141
142 // List of ancestors, from inner to outer.
143 // Alternates between
144 // * region argument of an operation
145 // * operation within a region
146 SmallVector<Component> components;
147
148 // Gather a list of parent regions and operations, and the position within
149 // their parent
150 Operation *o = op.getOperation();
151 while (o) {
152 // Operation within a region
153 Region *r = o->getParentRegion();
154 if (!r)
155 break;
156
// Walk the region's blocks in reverse post-order starting at the entry block
// and count the operations that themselves have regions.
157 llvm::ReversePostOrderTraversal<Block *> traversal(&r->getBlocks().front());
158 size_t idx = 0;
159 bool found = false;
// -1 wraps around to the largest size_t; the value is only replaced if `o` is
// encountered during the traversal below.
160 size_t sequentialIdx = -1;
161 bool isOnlyContainerOp = true;
162 for (Block *b : traversal) {
// Note: this `op` shadows the function parameter of the same name.
163 for (Operation &op : *b) {
164 if (&op == o && !found) {
// Recorded before `idx` is incremented for `o` itself, i.e. the number of
// region-holding operations visited before `o`.
165 sequentialIdx = idx;
166 found = true;
167 }
168 if (op.getNumRegions()) {
169 idx += 1;
170 if (idx > 1)
171 isOnlyContainerOp = false;
172 }
// Both answers are known; this leaves only the inner loop over operations, the
// remaining blocks of the traversal are still visited.
173 if (found && !isOnlyContainerOp)
174 break;
175 }
176 }
177
178 Component &containerOpInRegion = components.emplace_back();
179 containerOpInRegion.isRegionArgOfOp = false;
180 containerOpInRegion.isUnique = isOnlyContainerOp;
181 containerOpInRegion.getContainerOp() = o;
182 containerOpInRegion.getOpPos() = sequentialIdx;
183 containerOpInRegion.getParentRegion() = r;
184
185 Operation *parent = r->getParentOp();
186
187 // Region argument of an operation
188 Component &regionArgOfOperation = components.emplace_back();
189 regionArgOfOperation.isRegionArgOfOp = true;
190 regionArgOfOperation.isUnique = true;
191 regionArgOfOperation.getArgIdx() = 0;
192 regionArgOfOperation.getOwnerOp() = parent;
193
194 // The IsolatedFromAbove trait of the parent operation implies that each
195 // individual region argument has its own separate namespace, so no
196 // ambiguity.
197 if (!parent || parent->hasTrait<mlir::OpTrait::IsIsolatedFromAbove>())
198 break;
199
200 // Component only needed if operation has multiple region operands. Region
201 // arguments may be optional, but we currently do not consider this.
202 if (parent->getRegions().size() > 1) {
203 auto getRegionIndex = [](Operation *o, Region *r) {
204 for (auto [idx, region] : llvm::enumerate(o->getRegions())) {
205 if (&region == r)
206 return idx;
207 }
208 llvm_unreachable("Region not child of its parent operation");
209 };
210 regionArgOfOperation.isUnique = false;
211 regionArgOfOperation.getArgIdx() = getRegionIndex(parent, r);
212 }
213
214 // next parent
215 o = parent;
216 }
217
218 // Determine whether a region-argument component is not needed
219 for (Component &c : components)
220 c.skipIf(c.isRegionArgOfOp && c.isUnique);
221
222 // Find runs of nested loops and determine each loop's depth in the loop nest
// (iterating from the outermost component to the innermost one).
223 size_t numSurroundingLoops = 0;
224 for (Component &c : llvm::reverse(components)) {
225 if (c.skip)
226 continue;
227
228 // non-skipped multi-argument operands interrupt the loop nest
229 if (c.isRegionArgOfOp) {
230 numSurroundingLoops = 0;
231 continue;
232 }
233
234 // Multiple loops in a region means each of them is the outermost loop of a
235 // new loop nest
236 if (!c.isUnique)
237 numSurroundingLoops = 0;
238
239 c.getLoopDepth() = numSurroundingLoops;
240
241 // Next loop is surrounded by one more loop
242 if (isa<CanonicalLoopOp>(c.getContainerOp()))
243 numSurroundingLoops += 1;
244 }
245
246 // In loop nests, skip all but the innermost loop that contains the depth
247 // number
// (iterating from the innermost component to the outermost one).
248 bool isLoopNest = false;
249 for (Component &c : components) {
250 if (c.skip || c.isRegionArgOfOp)
251 continue;
252
253 if (!isLoopNest && c.getLoopDepth() >= 1) {
254 // Innermost loop of a loop nest of at least two loops
255 isLoopNest = true;
256 } else if (isLoopNest) {
257 // Non-innermost loop of a loop nest
258 c.skipIf(c.isUnique);
259
260 // If there is no surrounding loop left, this must have been the outermost
261 // loop; leave loop-nest mode for the next iteration
262 if (c.getLoopDepth() == 0)
263 isLoopNest = false;
264 }
265 }
266
267 // Skip non-loop unambiguous regions (but they should interrupt loop nests, so
268 // we mark them as skipped only after computing loop nests)
269 for (Component &c : components)
270 c.skipIf(!c.isRegionArgOfOp && c.isUnique &&
271 !isa<CanonicalLoopOp>(c.getContainerOp()));
272
273 // Components can be skipped if they are already disambiguated by their parent
274 // (or do not have a parent)
275 bool newRegion = true;
276 for (Component &c : llvm::reverse(components)) {
277 c.skipIf(newRegion && c.isUnique);
278
279 // non-skipped components disambiguate unique children
280 if (!c.skip)
281 newRegion = true;
282
283 // ...except canonical loops that need a suffix for each nest
// NOTE(review): the condition below only tests that the container op pointer
// is non-null, so it holds for every operation component, not just canonical
// loops as the comment above suggests. Confirm whether an
// isa<CanonicalLoopOp> check was intended before changing it, since that
// would alter the generated names.
284 if (!c.isRegionArgOfOp && c.getContainerOp())
285 newRegion = false;
286 }
287
288 // Compile the nesting name string
289 SmallString<64> Name{prefix};
290 llvm::raw_svector_ostream NameOS(Name);
291 for (auto &c : llvm::reverse(components)) {
292 if (c.skip)
293 continue;
294
295 if (c.isRegionArgOfOp)
296 NameOS << "_r" << c.getArgIdx();
297 else if (c.getLoopDepth() >= 1)
298 NameOS << "_d" << c.getLoopDepth();
299 else
300 NameOS << "_s" << c.getOpPos();
301 }
302
303 return NameOS.str().str();
304}
305
// Registers the dialect's operations, attributes and types (taken from the
// generated .inc lists) and attaches the external interface models that the
// OpenMP dialect provides for types and operations of other dialects.
306void OpenMPDialect::initialize() {
307 addOperations<
308#define GET_OP_LIST
309#include "mlir/Dialect/OpenMP/OpenMPOps.cpp.inc"
310 >();
311 addAttributes<
312#define GET_ATTRDEF_LIST
313#include "mlir/Dialect/OpenMP/OpenMPOpsAttributes.cpp.inc"
314 >();
315 addTypes<
316#define GET_TYPEDEF_LIST
317#include "mlir/Dialect/OpenMP/OpenMPOpsTypes.cpp.inc"
318 >();
319
320 declarePromisedInterface<ConvertToLLVMPatternInterface, OpenMPDialect>();
321
// Make memref and LLVM pointer types usable through PointerLikeType.
322 MemRefType::attachInterface<MemRefPointerLikeModel>(*getContext());
323 LLVM::LLVMPointerType::attachInterface<LLVMPointerPointerLikeModel>(
324 *getContext());
325
326 // Attach default offload module interface to module op to access
327 // offload functionality through
328 mlir::ModuleOp::attachInterface<mlir::omp::OffloadModuleDefaultModel>(
329 *getContext());
330
331 // Attach default declare target interfaces to operations which can be marked
332 // as declare target (Global Operations and Functions/Subroutines in dialects
333 // that Fortran (or other languages that lower to MLIR) translates to).
334 mlir::LLVM::GlobalOp::attachInterface<
336 *getContext());
337 mlir::LLVM::LLVMFuncOp::attachInterface<
339 *getContext());
340 mlir::func::FuncOp::attachInterface<
342}
343
344//===----------------------------------------------------------------------===//
345// Parser and printer for Allocate Clause
346//===----------------------------------------------------------------------===//
347
348/// Parse an allocate clause with allocators and a list of operands with types.
349///
350/// allocate-operand-list ::= allocate-operand |
351/// allocate-operand `,` allocate-operand-list
352/// allocate-operand ::= ssa-id-and-type -> ssa-id-and-type
353/// ssa-id-and-type ::= ssa-id `:` type
///
/// In each list element the operand before the arrow is recorded as the
/// allocator and the operand after the arrow as the allocated variable.
/// Fails as soon as any element of the list fails to parse.
354static ParseResult parseAllocateAndAllocator(
355 OpAsmParser &parser,
357 SmallVectorImpl<Type> &allocateTypes,
359 SmallVectorImpl<Type> &allocatorTypes) {
360
361 return parser.parseCommaSeparatedList([&]() {
363 Type type;
// Left-hand side of `->`: the allocator and its type.
364 if (parser.parseOperand(operand) || parser.parseColonType(type))
365 return failure();
366 allocatorVars.push_back(operand);
367 allocatorTypes.push_back(type);
368 if (parser.parseArrow())
369 return failure();
// Right-hand side of `->`: the allocated variable and its type. `operand` and
// `type` are reused for it.
370 if (parser.parseOperand(operand) || parser.parseColonType(type))
371 return failure();
372
373 allocateVars.push_back(operand);
374 allocateTypes.push_back(type);
375 return success();
376 });
377}
378
379/// Print allocate clause
///
/// Emits one `allocator : type -> variable : type` entry per allocated
/// variable, separated by ", ". The allocator ranges are indexed with the same
/// index as `allocateVars`, so they are expected to be at least as long.
381 OperandRange allocateVars,
382 TypeRange allocateTypes,
383 OperandRange allocatorVars,
384 TypeRange allocatorTypes) {
385 for (unsigned i = 0; i < allocateVars.size(); ++i) {
// No trailing separator after the last entry.
386 std::string separator = i == allocateVars.size() - 1 ? "" : ", ";
387 p << allocatorVars[i] << " : " << allocatorTypes[i] << " -> ";
388 p << allocateVars[i] << " : " << allocateTypes[i] << separator;
389 }
390}
391
392//===----------------------------------------------------------------------===//
393// Parser and printer for a clause attribute (StringEnumAttr)
394//===----------------------------------------------------------------------===//
395
396template <typename ClauseAttr>
397static ParseResult parseClauseAttr(AsmParser &parser, ClauseAttr &attr) {
398 using ClauseT = decltype(std::declval<ClauseAttr>().getValue());
399 StringRef enumStr;
400 SMLoc loc = parser.getCurrentLocation();
401 if (parser.parseKeyword(&enumStr))
402 return failure();
403 if (std::optional<ClauseT> enumValue = symbolizeEnum<ClauseT>(enumStr)) {
404 attr = ClauseAttr::get(parser.getContext(), *enumValue);
405 return success();
406 }
407 return parser.emitError(loc, "invalid clause value: '") << enumStr << "'";
408}
409
410template <typename ClauseAttr>
411static void printClauseAttr(OpAsmPrinter &p, Operation *op, ClauseAttr attr) {
412 p << stringifyEnum(attr.getValue());
413}
414
415//===----------------------------------------------------------------------===//
416// Parser and printer for Linear Clause
417//===----------------------------------------------------------------------===//
418
419/// linear ::= `linear` `(` linear-list `)`
420/// linear-list := linear-val | linear-val linear-list
421/// linear-val := ssa-id-and-type `=` ssa-id-and-type
///
/// As implemented, each comma-separated element is parsed as
/// `var = step-var : type`; only one type is read per element and it is
/// appended to `linearTypes`.
422static ParseResult parseLinearClause(
423 OpAsmParser &parser,
425 SmallVectorImpl<Type> &linearTypes,
427 return parser.parseCommaSeparatedList([&]() {
429 Type type;
431 if (parser.parseOperand(var) || parser.parseEqual() ||
432 parser.parseOperand(stepVar) || parser.parseColonType(type))
433 return failure();
434
435 linearVars.push_back(var);
436 linearTypes.push_back(type);
437 linearStepVars.push_back(stepVar);
438 return success();
439 });
440}
441
442/// Print Linear Clause
///
/// Emits `var = step : type` entries separated by ", ". The ` = step` part is
/// left out for variables that have no matching entry in `linearStepVars`.
/// The printed type is taken from the variable itself; `linearTypes` is not
/// read.
444 ValueRange linearVars, TypeRange linearTypes,
445 ValueRange linearStepVars) {
446 size_t linearVarsSize = linearVars.size();
447 for (unsigned i = 0; i < linearVarsSize; ++i) {
// No trailing separator after the last entry.
448 std::string separator = i == linearVarsSize - 1 ? "" : ", ";
449 p << linearVars[i];
450 if (linearStepVars.size() > i)
451 p << " = " << linearStepVars[i];
452 p << " : " << linearVars[i].getType() << separator;
453 }
454}
455
456//===----------------------------------------------------------------------===//
457// Verifier for Nontemporal Clause
458//===----------------------------------------------------------------------===//
459
460static LogicalResult verifyNontemporalClause(Operation *op,
461 OperandRange nontemporalVars) {
462
463 // Check if each var is unique - OpenMP 5.0 -> 2.9.3.1 section
464 DenseSet<Value> nontemporalItems;
465 for (const auto &it : nontemporalVars)
466 if (!nontemporalItems.insert(it).second)
467 return op->emitOpError() << "nontemporal variable used more than once";
468
469 return success();
470}
471
472//===----------------------------------------------------------------------===//
473// Parser, verifier and printer for Aligned Clause
474//===----------------------------------------------------------------------===//
475static LogicalResult verifyAlignedClause(Operation *op,
476 std::optional<ArrayAttr> alignments,
477 OperandRange alignedVars) {
478 // Check if number of alignment values equals to number of aligned variables
479 if (!alignedVars.empty()) {
480 if (!alignments || alignments->size() != alignedVars.size())
481 return op->emitOpError()
482 << "expected as many alignment values as aligned variables";
483 } else {
484 if (alignments)
485 return op->emitOpError() << "unexpected alignment values attribute";
486 return success();
487 }
488
489 // Check if each var is aligned only once - OpenMP 4.5 -> 2.8.1 section
490 DenseSet<Value> alignedItems;
491 for (auto it : alignedVars)
492 if (!alignedItems.insert(it).second)
493 return op->emitOpError() << "aligned variable used more than once";
494
495 if (!alignments)
496 return success();
497
498 // Check if all alignment values are positive - OpenMP 4.5 -> 2.8.1 section
499 for (unsigned i = 0; i < (*alignments).size(); ++i) {
500 if (auto intAttr = llvm::dyn_cast<IntegerAttr>((*alignments)[i])) {
501 if (intAttr.getValue().sle(0))
502 return op->emitOpError() << "alignment should be greater than 0";
503 } else {
504 return op->emitOpError() << "expected integer alignment";
505 }
506 }
507
508 return success();
509}
510
511/// aligned ::= `aligned` `(` aligned-list `)`
512/// aligned-list := aligned-val | aligned-val aligned-list
513/// aligned-val := ssa-id-and-type `->` alignment
///
/// Each comma-separated element is parsed as `var : type -> attribute`. The
/// parsed attributes are collected into `alignmentsAttr`; any attribute kind
/// is accepted here.
514static ParseResult
517 SmallVectorImpl<Type> &alignedTypes,
518 ArrayAttr &alignmentsAttr) {
519 SmallVector<Attribute> alignmentVec;
520 if (failed(parser.parseCommaSeparatedList([&]() {
// Each output slot is created first and then filled in by the parser.
521 if (parser.parseOperand(alignedVars.emplace_back()) ||
522 parser.parseColonType(alignedTypes.emplace_back()) ||
523 parser.parseArrow() ||
524 parser.parseAttribute(alignmentVec.emplace_back())) {
525 return failure();
526 }
527 return success();
528 })))
529 return failure();
530 SmallVector<Attribute> alignments(alignmentVec.begin(), alignmentVec.end());
531 alignmentsAttr = ArrayAttr::get(parser.getContext(), alignments);
532 return success();
533}
534
535/// Print Aligned Clause
///
/// Emits `var : type -> alignment` entries separated by ", ". The type is
/// taken from the variable itself; `alignedTypes` is not read.
537 ValueRange alignedVars, TypeRange alignedTypes,
538 std::optional<ArrayAttr> alignments) {
539 for (unsigned i = 0; i < alignedVars.size(); ++i) {
540 if (i != 0)
541 p << ", ";
542 p << alignedVars[i] << " : " << alignedVars[i].getType();
// NOTE(review): `alignments` is dereferenced without checking that it holds a
// value; this presumably relies on the clause having been verified so that a
// non-empty `alignedVars` implies an alignment array of equal size - confirm.
543 p << " -> " << (*alignments)[i];
544 }
545}
546
547//===----------------------------------------------------------------------===//
548// Parser, printer and verifier for Schedule Clause
549//===----------------------------------------------------------------------===//
550
// Checks the list of schedule modifier spellings and normalizes it in place:
// at most two modifiers are accepted, each must be a known ScheduleModifier,
// and a lone "simd" is moved to index 1 with "none" placed at index 0.
551static ParseResult
553 SmallVectorImpl<SmallString<12>> &modifiers) {
554 if (modifiers.size() > 2)
555 return parser.emitError(parser.getNameLoc()) << " unexpected modifier(s)";
556 for (const auto &mod : modifiers) {
557 // Translate the string. If it has no value, then it was not a valid
558 // modifier!
559 auto symbol = symbolizeScheduleModifier(mod);
560 if (!symbol)
561 return parser.emitError(parser.getNameLoc())
562 << " unknown modifier type: " << mod;
563 }
564
565 // If we have one modifier that is "simd", then stick a "none" modifier in
566 // index 0.
567 if (modifiers.size() == 1) {
568 if (symbolizeScheduleModifier(modifiers[0]) == ScheduleModifier::simd) {
569 modifiers.push_back(modifiers[0]);
570 modifiers[0] = stringifyScheduleModifier(ScheduleModifier::none);
571 }
572 } else if (modifiers.size() == 2) {
573 // If there are two modifiers:
574 // First modifier should not be simd, second one should be simd
575 if (symbolizeScheduleModifier(modifiers[0]) == ScheduleModifier::simd ||
576 symbolizeScheduleModifier(modifiers[1]) != ScheduleModifier::simd)
577 return parser.emitError(parser.getNameLoc())
578 << " incorrect modifier order";
579 }
580 return success();
581}
582
583/// schedule ::= `schedule` `(` sched-list `)`
584/// sched-list ::= sched-val | sched-val sched-list |
585/// sched-val `,` sched-modifier
586/// sched-val ::= sched-with-chunk | sched-wo-chunk
587/// sched-with-chunk ::= sched-with-chunk-types (`=` ssa-id-and-type)?
588/// sched-with-chunk-types ::= `static` | `dynamic` | `guided`
589/// sched-wo-chunk ::= `auto` | `runtime`
590/// sched-modifier ::= sched-mod-val | sched-mod-val `,` sched-mod-val
591/// sched-mod-val ::= `monotonic` | `nonmonotonic` | `simd` | `none`
///
/// On success `scheduleAttr` holds the schedule kind and `chunkSize` is set
/// only if an `= operand : type` chunk was given. `scheduleMod` and
/// `scheduleSimd` are only assigned when modifiers follow the schedule kind.
592static ParseResult
593parseScheduleClause(OpAsmParser &parser, ClauseScheduleKindAttr &scheduleAttr,
594 ScheduleModifierAttr &scheduleMod, UnitAttr &scheduleSimd,
595 std::optional<OpAsmParser::UnresolvedOperand> &chunkSize,
596 Type &chunkType) {
597 StringRef keyword;
598 if (parser.parseKeyword(&keyword))
599 return failure();
600 std::optional<mlir::omp::ClauseScheduleKind> schedule =
601 symbolizeClauseScheduleKind(keyword);
602 if (!schedule)
603 return parser.emitError(parser.getNameLoc()) << " expected schedule kind";
604
605 scheduleAttr = ClauseScheduleKindAttr::get(parser.getContext(), *schedule);
606 switch (*schedule) {
// These kinds may be followed by an optional chunk size.
607 case ClauseScheduleKind::Static:
608 case ClauseScheduleKind::Dynamic:
609 case ClauseScheduleKind::Guided:
610 if (succeeded(parser.parseOptionalEqual())) {
611 chunkSize = OpAsmParser::UnresolvedOperand{};
612 if (parser.parseOperand(*chunkSize) || parser.parseColonType(chunkType))
613 return failure();
614 } else {
615 chunkSize = std::nullopt;
616 }
617 break;
// For these kinds no chunk size is parsed.
618 case ClauseScheduleKind::Auto:
619 case ClauseScheduleKind::Runtime:
620 case ClauseScheduleKind::Distribute:
621 chunkSize = std::nullopt;
622 }
623
624 // If there is a comma, we have one or more modifiers.
626 while (succeeded(parser.parseOptionalComma())) {
627 StringRef mod;
628 if (parser.parseKeyword(&mod))
629 return failure();
630 modifiers.push_back(mod);
631 }
632
// Validates the modifiers and may reorder them so that "simd" ends up at
// index 1.
633 if (verifyScheduleModifiers(parser, modifiers))
634 return failure();
635
636 if (!modifiers.empty()) {
637 SMLoc loc = parser.getCurrentLocation();
638 if (std::optional<ScheduleModifier> mod =
639 symbolizeScheduleModifier(modifiers[0])) {
640 scheduleMod = ScheduleModifierAttr::get(parser.getContext(), *mod);
641 } else {
642 return parser.emitError(loc, "invalid schedule modifier");
643 }
644 // Only SIMD attribute is allowed here!
645 if (modifiers.size() > 1) {
646 assert(symbolizeScheduleModifier(modifiers[1]) == ScheduleModifier::simd);
647 scheduleSimd = UnitAttr::get(parser.getBuilder().getContext());
648 }
649 }
650
651 return success();
652}
653
654/// Print schedule clause
///
/// Emits the schedule kind, then ` = chunk : type` if a chunk value is
/// present, then `, <modifier>` if a modifier attribute is present, then
/// `, simd` if the simd unit attribute is present. The chunk type is taken
/// from the chunk value itself; `scheduleChunkType` is not read.
656 ClauseScheduleKindAttr scheduleKind,
657 ScheduleModifierAttr scheduleMod,
658 UnitAttr scheduleSimd, Value scheduleChunk,
659 Type scheduleChunkType) {
660 p << stringifyClauseScheduleKind(scheduleKind.getValue());
661 if (scheduleChunk)
662 p << " = " << scheduleChunk << " : " << scheduleChunk.getType();
663 if (scheduleMod)
664 p << ", " << stringifyScheduleModifier(scheduleMod.getValue());
665 if (scheduleSimd)
666 p << ", simd";
667}
668
669//===----------------------------------------------------------------------===//
670// Parser and printer for Order Clause
671//===----------------------------------------------------------------------===//
672
673// order ::= `order` `(` [order-modifier ':'] concurrent `)`
674// order-modifier ::= reproducible | unconstrained
675static ParseResult parseOrderClause(OpAsmParser &parser,
676 ClauseOrderKindAttr &order,
677 OrderModifierAttr &orderMod) {
678 StringRef enumStr;
679 SMLoc loc = parser.getCurrentLocation();
680 if (parser.parseKeyword(&enumStr))
681 return failure();
682 if (std::optional<OrderModifier> enumValue =
683 symbolizeOrderModifier(enumStr)) {
684 orderMod = OrderModifierAttr::get(parser.getContext(), *enumValue);
685 if (parser.parseOptionalColon())
686 return failure();
687 loc = parser.getCurrentLocation();
688 if (parser.parseKeyword(&enumStr))
689 return failure();
690 }
691 if (std::optional<ClauseOrderKind> enumValue =
692 symbolizeClauseOrderKind(enumStr)) {
693 order = ClauseOrderKindAttr::get(parser.getContext(), *enumValue);
694 return success();
695 }
696 return parser.emitError(loc, "invalid clause value: '") << enumStr << "'";
697}
698
// Prints `<modifier>:` if a modifier attribute is present, followed by the
// order kind if that attribute is present.
700 ClauseOrderKindAttr order,
701 OrderModifierAttr orderMod) {
702 if (orderMod)
703 p << stringifyOrderModifier(orderMod.getValue()) << ":";
704 if (order)
705 p << stringifyClauseOrderKind(order.getValue());
706}
707
// Shared parser for clauses of the form `[modifier ,] operand : type`.
// `symbolizeClause` converts the optional leading keyword into the modifier
// enum and `clauseName` is only used in diagnostics.
708template <typename ClauseTypeAttr, typename ClauseType>
709static ParseResult
710parseGranularityClause(OpAsmParser &parser, ClauseTypeAttr &prescriptiveness,
711 std::optional<OpAsmParser::UnresolvedOperand> &operand,
712 Type &operandType,
713 std::optional<ClauseType> (*symbolizeClause)(StringRef),
714 StringRef clauseName) {
715 StringRef enumStr;
// Optional modifier keyword; when present it must be followed by a comma.
716 if (succeeded(parser.parseOptionalKeyword(&enumStr))) {
717 if (std::optional<ClauseType> enumValue = symbolizeClause(enumStr)) {
718 prescriptiveness = ClauseTypeAttr::get(parser.getContext(), *enumValue);
719 if (parser.parseComma())
720 return failure();
721 } else {
722 return parser.emitError(parser.getCurrentLocation())
723 << "invalid " << clauseName << " modifier : '" << enumStr << "'";
724 ;
725 }
726 }
727
// The operand itself is mandatory.
729 if (succeeded(parser.parseOperand(var))) {
730 operand = var;
731 } else {
732 return parser.emitError(parser.getCurrentLocation())
733 << "expected " << clauseName << " operand";
734 }
735
736 if (operand.has_value()) {
737 if (parser.parseColonType(operandType))
738 return failure();
739 }
740
741 return success();
742}
743
// Shared printer for the granularity clauses: prints `<modifier>, ` if the
// modifier attribute is present, then `operand: type` if the operand is
// present. `stringifyClauseType` provides the modifier spelling.
744template <typename ClauseTypeAttr, typename ClauseType>
745static void
747 ClauseTypeAttr prescriptiveness, Value operand,
748 mlir::Type operandType,
749 StringRef (*stringifyClauseType)(ClauseType)) {
750
751 if (prescriptiveness)
752 p << stringifyClauseType(prescriptiveness.getValue()) << ", ";
753
754 if (operand)
755 p << operand << ": " << operandType;
756}
757
758//===----------------------------------------------------------------------===//
759// Parser and printer for grainsize Clause
760//===----------------------------------------------------------------------===//
761
762// grainsize ::= `grainsize` `(` [strict ':'] grain-size `)`
// Forwards the grainsize modifier, operand and type together with
// `symbolizeClauseGrainsizeType` and the clause name "grainsize".
763static ParseResult
764parseGrainsizeClause(OpAsmParser &parser, ClauseGrainsizeTypeAttr &grainsizeMod,
765 std::optional<OpAsmParser::UnresolvedOperand> &grainsize,
766 Type &grainsizeType) {
768 parser, grainsizeMod, grainsize, grainsizeType,
769 &symbolizeClauseGrainsizeType, "grainsize");
770}
771
// Forwards the grainsize modifier, operand and type together with
// `stringifyClauseGrainsizeType` for spelling the modifier.
773 ClauseGrainsizeTypeAttr grainsizeMod,
774 Value grainsize, mlir::Type grainsizeType) {
776 p, op, grainsizeMod, grainsize, grainsizeType,
777 &stringifyClauseGrainsizeType);
778}
779
780//===----------------------------------------------------------------------===//
781// Parser and printer for num_tasks Clause
782//===----------------------------------------------------------------------===//
783
784// numtask ::= `num_tasks` `(` [strict ':'] num-tasks `)`
785static ParseResult
786parseNumTasksClause(OpAsmParser &parser, ClauseNumTasksTypeAttr &numTasksMod,
787 std::optional<OpAsmParser::UnresolvedOperand> &numTasks,
788 Type &numTasksType) {
790 parser, numTasksMod, numTasks, numTasksType, &symbolizeClauseNumTasksType,
791 "num_tasks");
792}
793
// Forwards the num_tasks modifier, operand and type together with
// `stringifyClauseNumTasksType` for spelling the modifier.
795 ClauseNumTasksTypeAttr numTasksMod,
796 Value numTasks, mlir::Type numTasksType) {
798 p, op, numTasksMod, numTasks, numTasksType, &stringifyClauseNumTasksType);
799}
800
801//===----------------------------------------------------------------------===//
802// Parsers for operations including clauses that define entry block arguments.
803//===----------------------------------------------------------------------===//
804
805namespace {
806struct MapParseArgs {
807 SmallVectorImpl<OpAsmParser::UnresolvedOperand> &vars;
808 SmallVectorImpl<Type> &types;
809 MapParseArgs(SmallVectorImpl<OpAsmParser::UnresolvedOperand> &vars,
810 SmallVectorImpl<Type> &types)
811 : vars(vars), types(types) {}
812};
813struct PrivateParseArgs {
814 llvm::SmallVectorImpl<OpAsmParser::UnresolvedOperand> &vars;
815 llvm::SmallVectorImpl<Type> &types;
816 ArrayAttr &syms;
817 UnitAttr &needsBarrier;
818 DenseI64ArrayAttr *mapIndices;
819 PrivateParseArgs(SmallVectorImpl<OpAsmParser::UnresolvedOperand> &vars,
820 SmallVectorImpl<Type> &types, ArrayAttr &syms,
821 UnitAttr &needsBarrier,
822 DenseI64ArrayAttr *mapIndices = nullptr)
823 : vars(vars), types(types), syms(syms), needsBarrier(needsBarrier),
824 mapIndices(mapIndices) {}
825};
826
827struct ReductionParseArgs {
828 SmallVectorImpl<OpAsmParser::UnresolvedOperand> &vars;
829 SmallVectorImpl<Type> &types;
830 DenseBoolArrayAttr &byref;
831 ArrayAttr &syms;
832 ReductionModifierAttr *modifier;
833 ReductionParseArgs(SmallVectorImpl<OpAsmParser::UnresolvedOperand> &vars,
834 SmallVectorImpl<Type> &types, DenseBoolArrayAttr &byref,
835 ArrayAttr &syms, ReductionModifierAttr *mod = nullptr)
836 : vars(vars), types(types), byref(byref), syms(syms), modifier(mod) {}
837};
838
839struct AllRegionParseArgs {
840 std::optional<MapParseArgs> hasDeviceAddrArgs;
841 std::optional<MapParseArgs> hostEvalArgs;
842 std::optional<ReductionParseArgs> inReductionArgs;
843 std::optional<MapParseArgs> mapArgs;
844 std::optional<PrivateParseArgs> privateArgs;
845 std::optional<ReductionParseArgs> reductionArgs;
846 std::optional<ReductionParseArgs> taskReductionArgs;
847 std::optional<MapParseArgs> useDeviceAddrArgs;
848 std::optional<MapParseArgs> useDevicePtrArgs;
849};
850} // namespace
851
852static inline constexpr StringRef getPrivateNeedsBarrierSpelling() {
853 return "private_barrier";
854}
855
// Parses a parenthesized clause of the form
//   `(` [`mod` `:` modifier `,`] entry (`,` entry)* `:` type (`,` type)* `)`
// where each entry is `[byref] [symbol] operand -> region-arg [[map_idx = N]]`.
// The optional pieces are only parsed when the matching output pointer
// (`modifier`, `byref`, `symbols`, `mapIndices`, `needsBarrier`) is non-null.
// The parsed types are assigned to the region arguments appended by this call.
856static ParseResult parseClauseWithRegionArgs(
857 OpAsmParser &parser,
861 ArrayAttr *symbols = nullptr, DenseI64ArrayAttr *mapIndices = nullptr,
862 DenseBoolArrayAttr *byref = nullptr,
863 ReductionModifierAttr *modifier = nullptr,
864 UnitAttr *needsBarrier = nullptr) {
866 SmallVector<int64_t> mapIndicesVec;
867 SmallVector<bool> isByRefVec;
// Region arguments parsed by this call start at this index.
868 unsigned regionArgOffset = regionPrivateArgs.size();
869
870 if (parser.parseLParen())
871 return failure();
872
873 if (modifier && succeeded(parser.parseOptionalKeyword("mod"))) {
874 StringRef enumStr;
875 if (parser.parseColon() || parser.parseKeyword(&enumStr) ||
876 parser.parseComma())
877 return failure();
878 std::optional<ReductionModifier> enumValue =
879 symbolizeReductionModifier(enumStr);
880 if (!enumValue.has_value())
881 return failure();
882 *modifier = ReductionModifierAttr::get(parser.getContext(), *enumValue);
883 if (!*modifier)
884 return failure();
885 }
886
887 if (parser.parseCommaSeparatedList([&]() {
888 if (byref)
889 isByRefVec.push_back(
890 parser.parseOptionalKeyword("byref").succeeded());
891
892 if (symbols && parser.parseAttribute(symbolVec.emplace_back()))
893 return failure();
894
895 if (parser.parseOperand(operands.emplace_back()) ||
896 parser.parseArrow() ||
897 parser.parseArgument(regionPrivateArgs.emplace_back()))
898 return failure();
899
900 if (mapIndices) {
901 if (parser.parseOptionalLSquare().succeeded()) {
902 if (parser.parseKeyword("map_idx") || parser.parseEqual() ||
903 parser.parseInteger(mapIndicesVec.emplace_back()) ||
904 parser.parseRSquare())
905 return failure();
906 } else {
// -1 is recorded for entries without an explicit `[map_idx = N]`.
907 mapIndicesVec.push_back(-1);
908 }
909 }
910
911 return success();
912 }))
913 return failure();
914
915 if (parser.parseColon())
916 return failure();
917
918 if (parser.parseCommaSeparatedList([&]() {
919 if (parser.parseType(types.emplace_back()))
920 return failure();
921
922 return success();
923 }))
924 return failure();
925
// Note: this mismatch is reported as a plain failure; no diagnostic is emitted
// here.
926 if (operands.size() != types.size())
927 return failure();
928
929 if (parser.parseRParen())
930 return failure();
931
932 if (needsBarrier) {
934 .succeeded())
935 *needsBarrier = mlir::UnitAttr::get(parser.getContext());
936 }
937
// Give each region argument added by this call its parsed type.
938 auto *argsBegin = regionPrivateArgs.begin();
939 MutableArrayRef argsSubrange(argsBegin + regionArgOffset,
940 argsBegin + regionArgOffset + types.size());
941 for (auto [prv, type] : llvm::zip_equal(argsSubrange, types)) {
942 prv.type = type;
943 }
944
945 if (symbols) {
946 SmallVector<Attribute> symbolAttrs(symbolVec.begin(), symbolVec.end());
947 *symbols = ArrayAttr::get(parser.getContext(), symbolAttrs);
948 }
949
// `mapIndicesVec` is only filled when `mapIndices` is non-null, so the
// dereference below is guarded by the emptiness check.
950 if (!mapIndicesVec.empty())
951 *mapIndices =
952 mlir::DenseI64ArrayAttr::get(parser.getContext(), mapIndicesVec);
953
954 if (byref)
955 *byref = makeDenseBoolArrayAttr(parser.getContext(), isByRefVec);
956
957 return success();
958}
959
// Map-style overload: if `keyword` is present, parses the clause into the
// locations given by `mapArgs`. A missing keyword is not an error. Fails
// without emitting a diagnostic when the keyword is present but `mapArgs` is
// empty.
960static ParseResult parseBlockArgClause(
961 OpAsmParser &parser,
963 StringRef keyword, std::optional<MapParseArgs> mapArgs) {
964 if (succeeded(parser.parseOptionalKeyword(keyword))) {
965 if (!mapArgs)
966 return failure();
967
968 if (failed(parseClauseWithRegionArgs(parser, mapArgs->vars, mapArgs->types,
969 entryBlockArgs)))
970 return failure();
971 }
972 return success();
973}
974
/// Parses the optional clause introduced by `keyword` for clauses described
/// by `PrivateParseArgs`.
///
/// Returns success when the keyword is absent. When it is present, fails if
/// `privateArgs` holds no value or if parseClauseWithRegionArgs fails. In
/// addition to operands and types, the symbol list, the map indices and the
/// needs-barrier attribute are forwarded; no by-ref list and no modifier are
/// requested.
975 static ParseResult parseBlockArgClause(
976 OpAsmParser &parser,
978 StringRef keyword, std::optional<PrivateParseArgs> privateArgs) {
979 if (succeeded(parser.parseOptionalKeyword(keyword))) {
// The keyword was written but the caller supplied no storage for it.
980 if (!privateArgs)
981 return failure();
982
983 if (failed(parseClauseWithRegionArgs(
984 parser, privateArgs->vars, privateArgs->types, entryBlockArgs,
985 &privateArgs->syms, privateArgs->mapIndices, /*byref=*/nullptr,
986 /*modifier=*/nullptr, &privateArgs->needsBarrier)))
987 return failure();
988 }
989 return success();
990 }
991
/// Parses the optional clause introduced by `keyword` for clauses described
/// by `ReductionParseArgs`.
///
/// Returns success when the keyword is absent. When it is present, fails if
/// `reductionArgs` holds no value or if parseClauseWithRegionArgs fails. In
/// addition to operands and types, the symbol list, the by-ref list and the
/// modifier are forwarded; no map indices are requested.
992 static ParseResult parseBlockArgClause(
993 OpAsmParser &parser,
995 StringRef keyword, std::optional<ReductionParseArgs> reductionArgs) {
996 if (succeeded(parser.parseOptionalKeyword(keyword))) {
// The keyword was written but the caller supplied no storage for it.
997 if (!reductionArgs)
998 return failure();
999 if (failed(parseClauseWithRegionArgs(
1000 parser, reductionArgs->vars, reductionArgs->types, entryBlockArgs,
1001 &reductionArgs->syms, /*mapIndices=*/nullptr, &reductionArgs->byref,
1002 reductionArgs->modifier)))
1003 return failure();
1004 }
1005 return success();
1006 }
1007
1008static ParseResult parseBlockArgRegion(OpAsmParser &parser, Region &region,
1009 AllRegionParseArgs args) {
1011
1012 if (failed(parseBlockArgClause(parser, entryBlockArgs, "has_device_addr",
1013 args.hasDeviceAddrArgs)))
1014 return parser.emitError(parser.getCurrentLocation())
1015 << "invalid `has_device_addr` format";
1016
1017 if (failed(parseBlockArgClause(parser, entryBlockArgs, "host_eval",
1018 args.hostEvalArgs)))
1019 return parser.emitError(parser.getCurrentLocation())
1020 << "invalid `host_eval` format";
1021
1022 if (failed(parseBlockArgClause(parser, entryBlockArgs, "in_reduction",
1023 args.inReductionArgs)))
1024 return parser.emitError(parser.getCurrentLocation())
1025 << "invalid `in_reduction` format";
1026
1027 if (failed(parseBlockArgClause(parser, entryBlockArgs, "map_entries",
1028 args.mapArgs)))
1029 return parser.emitError(parser.getCurrentLocation())
1030 << "invalid `map_entries` format";
1031
1032 if (failed(parseBlockArgClause(parser, entryBlockArgs, "private",
1033 args.privateArgs)))
1034 return parser.emitError(parser.getCurrentLocation())
1035 << "invalid `private` format";
1036
1037 if (failed(parseBlockArgClause(parser, entryBlockArgs, "reduction",
1038 args.reductionArgs)))
1039 return parser.emitError(parser.getCurrentLocation())
1040 << "invalid `reduction` format";
1041
1042 if (failed(parseBlockArgClause(parser, entryBlockArgs, "task_reduction",
1043 args.taskReductionArgs)))
1044 return parser.emitError(parser.getCurrentLocation())
1045 << "invalid `task_reduction` format";
1046
1047 if (failed(parseBlockArgClause(parser, entryBlockArgs, "use_device_addr",
1048 args.useDeviceAddrArgs)))
1049 return parser.emitError(parser.getCurrentLocation())
1050 << "invalid `use_device_addr` format";
1051
1052 if (failed(parseBlockArgClause(parser, entryBlockArgs, "use_device_ptr",
1053 args.useDevicePtrArgs)))
1054 return parser.emitError(parser.getCurrentLocation())
1055 << "invalid `use_device_addr` format";
1056
1057 return parser.parseRegion(region, entryBlockArgs);
1058}
1059
1060// These parseXyz functions correspond to the custom<Xyz> definitions
1061// in the .td file(s).
/// Parses the has_device_addr, host_eval, in_reduction, map_entries and
/// private clauses followed by the region. Each group of output parameters
/// is bound to its AllRegionParseArgs slot and the work is delegated to
/// parseBlockArgRegion.
1062 static ParseResult parseTargetOpRegion(
1063 OpAsmParser &parser, Region &region,
1065 SmallVectorImpl<Type> &hasDeviceAddrTypes,
1067 SmallVectorImpl<Type> &hostEvalTypes,
1069 SmallVectorImpl<Type> &inReductionTypes,
1070 DenseBoolArrayAttr &inReductionByref, ArrayAttr &inReductionSyms,
1072 SmallVectorImpl<Type> &mapTypes,
1074 llvm::SmallVectorImpl<Type> &privateTypes, ArrayAttr &privateSyms,
1075 UnitAttr &privateNeedsBarrier, DenseI64ArrayAttr &privateMaps) {
1076 AllRegionParseArgs args;
1077 args.hasDeviceAddrArgs.emplace(hasDeviceAddrVars, hasDeviceAddrTypes);
1078 args.hostEvalArgs.emplace(hostEvalVars, hostEvalTypes);
1079 args.inReductionArgs.emplace(inReductionVars, inReductionTypes,
1080 inReductionByref, inReductionSyms);
1081 args.mapArgs.emplace(mapVars, mapTypes);
// Only this wrapper passes a map-index output for the private clause.
1082 args.privateArgs.emplace(privateVars, privateTypes, privateSyms,
1083 privateNeedsBarrier, &privateMaps);
1084 return parseBlockArgRegion(parser, region, args);
1085 }
1086
/// Region parser accepting the in_reduction and private clauses: binds the
/// output parameters to their AllRegionParseArgs slots and delegates to
/// parseBlockArgRegion.
/// NOTE(review): the line declaring this function's name is not visible
/// here; presumably it implements custom<InReductionPrivateRegion> — confirm
/// against the .td file.
1088 OpAsmParser &parser, Region &region,
1090 SmallVectorImpl<Type> &inReductionTypes,
1091 DenseBoolArrayAttr &inReductionByref, ArrayAttr &inReductionSyms,
1093 llvm::SmallVectorImpl<Type> &privateTypes, ArrayAttr &privateSyms,
1094 UnitAttr &privateNeedsBarrier) {
1095 AllRegionParseArgs args;
1096 args.inReductionArgs.emplace(inReductionVars, inReductionTypes,
1097 inReductionByref, inReductionSyms);
1098 args.privateArgs.emplace(privateVars, privateTypes, privateSyms,
1099 privateNeedsBarrier);
1100 return parseBlockArgRegion(parser, region, args);
1101 }
1102
/// Region parser accepting the in_reduction, private and reduction clauses:
/// binds the output parameters to their AllRegionParseArgs slots and
/// delegates to parseBlockArgRegion. The reduction modifier is passed by
/// address so the clause parser can fill it in.
/// NOTE(review): the line declaring this function's name is not visible
/// here; presumably it implements
/// custom<InReductionPrivateReductionRegion> — confirm against the .td file.
1104 OpAsmParser &parser, Region &region,
1106 SmallVectorImpl<Type> &inReductionTypes,
1107 DenseBoolArrayAttr &inReductionByref, ArrayAttr &inReductionSyms,
1109 llvm::SmallVectorImpl<Type> &privateTypes, ArrayAttr &privateSyms,
1110 UnitAttr &privateNeedsBarrier, ReductionModifierAttr &reductionMod,
1112 SmallVectorImpl<Type> &reductionTypes, DenseBoolArrayAttr &reductionByref,
1113 ArrayAttr &reductionSyms) {
1114 AllRegionParseArgs args;
1115 args.inReductionArgs.emplace(inReductionVars, inReductionTypes,
1116 inReductionByref, inReductionSyms);
1117 args.privateArgs.emplace(privateVars, privateTypes, privateSyms,
1118 privateNeedsBarrier);
1119 args.reductionArgs.emplace(reductionVars, reductionTypes, reductionByref,
1120 reductionSyms, &reductionMod);
1121 return parseBlockArgRegion(parser, region, args);
1122 }
1123
/// Region parser accepting only the private clause: binds the output
/// parameters to the privateArgs slot of AllRegionParseArgs and delegates to
/// parseBlockArgRegion.
1124 static ParseResult parsePrivateRegion(
1125 OpAsmParser &parser, Region &region,
1127 llvm::SmallVectorImpl<Type> &privateTypes, ArrayAttr &privateSyms,
1128 UnitAttr &privateNeedsBarrier) {
1129 AllRegionParseArgs args;
1130 args.privateArgs.emplace(privateVars, privateTypes, privateSyms,
1131 privateNeedsBarrier);
1132 return parseBlockArgRegion(parser, region, args);
1133 }
1134
/// Region parser accepting the private and reduction clauses: binds the
/// output parameters to their AllRegionParseArgs slots and delegates to
/// parseBlockArgRegion. The reduction modifier is passed by address so the
/// clause parser can fill it in.
/// NOTE(review): the line declaring this function's name is not visible
/// here; presumably it implements custom<PrivateReductionRegion> — confirm
/// against the .td file.
1136 OpAsmParser &parser, Region &region,
1138 llvm::SmallVectorImpl<Type> &privateTypes, ArrayAttr &privateSyms,
1139 UnitAttr &privateNeedsBarrier, ReductionModifierAttr &reductionMod,
1141 SmallVectorImpl<Type> &reductionTypes, DenseBoolArrayAttr &reductionByref,
1142 ArrayAttr &reductionSyms) {
1143 AllRegionParseArgs args;
1144 args.privateArgs.emplace(privateVars, privateTypes, privateSyms,
1145 privateNeedsBarrier);
1146 args.reductionArgs.emplace(reductionVars, reductionTypes, reductionByref,
1147 reductionSyms, &reductionMod);
1148 return parseBlockArgRegion(parser, region, args);
1149 }
1150
/// Region parser accepting only the task_reduction clause: binds the output
/// parameters to the taskReductionArgs slot of AllRegionParseArgs and
/// delegates to parseBlockArgRegion.
1151 static ParseResult parseTaskReductionRegion(
1152 OpAsmParser &parser, Region &region,
1154 SmallVectorImpl<Type> &taskReductionTypes,
1155 DenseBoolArrayAttr &taskReductionByref, ArrayAttr &taskReductionSyms) {
1156 AllRegionParseArgs args;
1157 args.taskReductionArgs.emplace(taskReductionVars, taskReductionTypes,
1158 taskReductionByref, taskReductionSyms);
1159 return parseBlockArgRegion(parser, region, args);
1160 }
1161
/// Region parser accepting the use_device_addr and use_device_ptr clauses:
/// binds the output parameters to their AllRegionParseArgs slots and
/// delegates to parseBlockArgRegion.
/// NOTE(review): the line declaring this function's name is not visible
/// here; presumably it implements custom<UseDeviceAddrUseDevicePtrRegion> —
/// confirm against the .td file.
1163 OpAsmParser &parser, Region &region,
1165 SmallVectorImpl<Type> &useDeviceAddrTypes,
1167 SmallVectorImpl<Type> &useDevicePtrTypes) {
1168 AllRegionParseArgs args;
1169 args.useDeviceAddrArgs.emplace(useDeviceAddrVars, useDeviceAddrTypes);
1170 args.useDevicePtrArgs.emplace(useDevicePtrVars, useDevicePtrTypes);
1171 return parseBlockArgRegion(parser, region, args);
1172 }
1173
1174//===----------------------------------------------------------------------===//
1175// Printers for operations including clauses that define entry block arguments.
1176//===----------------------------------------------------------------------===//
1177
1178namespace {
1179struct MapPrintArgs {
1180 ValueRange vars;
1181 TypeRange types;
1182 MapPrintArgs(ValueRange vars, TypeRange types) : vars(vars), types(types) {}
1183};
1184struct PrivatePrintArgs {
1185 ValueRange vars;
1186 TypeRange types;
1187 ArrayAttr syms;
1188 UnitAttr needsBarrier;
1189 DenseI64ArrayAttr mapIndices;
1190 PrivatePrintArgs(ValueRange vars, TypeRange types, ArrayAttr syms,
1191 UnitAttr needsBarrier, DenseI64ArrayAttr mapIndices)
1192 : vars(vars), types(types), syms(syms), needsBarrier(needsBarrier),
1193 mapIndices(mapIndices) {}
1194};
1195struct ReductionPrintArgs {
1196 ValueRange vars;
1197 TypeRange types;
1198 DenseBoolArrayAttr byref;
1199 ArrayAttr syms;
1200 ReductionModifierAttr modifier;
1201 ReductionPrintArgs(ValueRange vars, TypeRange types, DenseBoolArrayAttr byref,
1202 ArrayAttr syms, ReductionModifierAttr mod = nullptr)
1203 : vars(vars), types(types), byref(byref), syms(syms), modifier(mod) {}
1204};
1205struct AllRegionPrintArgs {
1206 std::optional<MapPrintArgs> hasDeviceAddrArgs;
1207 std::optional<MapPrintArgs> hostEvalArgs;
1208 std::optional<ReductionPrintArgs> inReductionArgs;
1209 std::optional<MapPrintArgs> mapArgs;
1210 std::optional<PrivatePrintArgs> privateArgs;
1211 std::optional<ReductionPrintArgs> reductionArgs;
1212 std::optional<ReductionPrintArgs> taskReductionArgs;
1213 std::optional<MapPrintArgs> useDeviceAddrArgs;
1214 std::optional<MapPrintArgs> useDevicePtrArgs;
1215};
1216} // namespace
1217
/// Prints one clause of the form
///   clauseName([mod: M, ] [byref ][sym ]operand -> arg [ [map_idx=N]], ...
///              : types) [needs-barrier-spelling ]
/// Nothing is printed when `argsSubrange` is empty. `symbols`, `mapIndices`
/// and `byref` are optional; when null they are replaced by neutral defaults
/// so that every entry prints without the corresponding decoration.
1219 OpAsmPrinter &p, MLIRContext *ctx, StringRef clauseName,
1220 ValueRange argsSubrange, ValueRange operands, TypeRange types,
1221 ArrayAttr symbols = nullptr, DenseI64ArrayAttr mapIndices = nullptr,
1222 DenseBoolArrayAttr byref = nullptr,
1223 ReductionModifierAttr modifier = nullptr, UnitAttr needsBarrier = nullptr) {
1224 if (argsSubrange.empty())
1225 return;
1226
1227 p << clauseName << "(";
1228
1229 if (modifier)
1230 p << "mod: " << stringifyReductionModifier(modifier.getValue()) << ", ";
1231
// The three defaults below are sized to `operands` so that the zip_equal
// further down sees ranges of matching length.
1232 if (!symbols) {
1233 llvm::SmallVector<Attribute> values(operands.size(), nullptr);
1234 symbols = ArrayAttr::get(ctx, values);
1235 }
1236
1237 if (!mapIndices) {
1238 llvm::SmallVector<int64_t> values(operands.size(), -1);
1239 mapIndices = DenseI64ArrayAttr::get(ctx, values);
1240 }
1241
1242 if (!byref) {
1243 mlir::SmallVector<bool> values(operands.size(), false);
1244 byref = DenseBoolArrayAttr::get(ctx, values);
1245 }
1246
1247 llvm::interleaveComma(llvm::zip_equal(operands, argsSubrange, symbols,
1248 mapIndices.asArrayRef(),
1249 byref.asArrayRef()),
1250 p, [&p](auto t) {
1251 auto [op, arg, sym, map, isByRef] = t;
1252 if (isByRef)
1253 p << "byref ";
1254 if (sym)
1255 p << sym << " ";
1256
1257 p << op << " -> " << arg;
1258
// -1 is the "no map index" value and is not printed.
1259 if (map != -1)
1260 p << " [map_idx=" << map << "]";
1261 });
1262 p << " : ";
1263 llvm::interleaveComma(types, p);
1264 p << ") ";
1265
1266 if (needsBarrier)
1267 p << getPrivateNeedsBarrierSpelling() << " ";
1268 }
1269
/// Prints a clause described by `MapPrintArgs` (operands and types only) via
/// printClauseWithRegionArgs; does nothing when `mapArgs` holds no value.
1271 StringRef clauseName, ValueRange argsSubrange,
1272 std::optional<MapPrintArgs> mapArgs) {
1273 if (mapArgs)
1274 printClauseWithRegionArgs(p, ctx, clauseName, argsSubrange, mapArgs->vars,
1275 mapArgs->types);
1276 }
1277
/// Prints a clause described by `PrivatePrintArgs`; does nothing when
/// `privateArgs` holds no value. Symbols, map indices and the needs-barrier
/// attribute are forwarded, while no by-ref list and no modifier are passed.
1279 StringRef clauseName, ValueRange argsSubrange,
1280 std::optional<PrivatePrintArgs> privateArgs) {
1281 if (privateArgs)
1283 p, ctx, clauseName, argsSubrange, privateArgs->vars, privateArgs->types,
1284 privateArgs->syms, privateArgs->mapIndices, /*byref=*/nullptr,
1285 /*modifier=*/nullptr, privateArgs->needsBarrier);
1286 }
1287
1288static void
1289printBlockArgClause(OpAsmPrinter &p, MLIRContext *ctx, StringRef clauseName,
1290 ValueRange argsSubrange,
1291 std::optional<ReductionPrintArgs> reductionArgs) {
1292 if (reductionArgs)
1293 printClauseWithRegionArgs(p, ctx, clauseName, argsSubrange,
1294 reductionArgs->vars, reductionArgs->types,
1295 reductionArgs->syms, /*mapIndices=*/nullptr,
1296 reductionArgs->byref, reductionArgs->modifier);
1297}
1298
/// Prints every entry-block-argument-defining clause of `op` followed by
/// `region`. The clauses are emitted in the same fixed order in which
/// parseBlockArgRegion expects them; the block arguments for each clause are
/// obtained from the BlockArgOpenMPOpInterface of `op`. The region is printed
/// without its entry block arguments because the clauses already show them.
1300 const AllRegionPrintArgs &args) {
1301 auto iface = llvm::cast<mlir::omp::BlockArgOpenMPOpInterface>(op);
1302 MLIRContext *ctx = op->getContext();
1303
1304 printBlockArgClause(p, ctx, "has_device_addr",
1305 iface.getHasDeviceAddrBlockArgs(),
1306 args.hasDeviceAddrArgs);
1307 printBlockArgClause(p, ctx, "host_eval", iface.getHostEvalBlockArgs(),
1308 args.hostEvalArgs);
1309 printBlockArgClause(p, ctx, "in_reduction", iface.getInReductionBlockArgs(),
1310 args.inReductionArgs);
1311 printBlockArgClause(p, ctx, "map_entries", iface.getMapBlockArgs(),
1312 args.mapArgs);
1313 printBlockArgClause(p, ctx, "private", iface.getPrivateBlockArgs(),
1314 args.privateArgs);
1315 printBlockArgClause(p, ctx, "reduction", iface.getReductionBlockArgs(),
1316 args.reductionArgs);
1317 printBlockArgClause(p, ctx, "task_reduction",
1318 iface.getTaskReductionBlockArgs(),
1319 args.taskReductionArgs);
1320 printBlockArgClause(p, ctx, "use_device_addr",
1321 iface.getUseDeviceAddrBlockArgs(),
1322 args.useDeviceAddrArgs);
1323 printBlockArgClause(p, ctx, "use_device_ptr",
1324 iface.getUseDevicePtrBlockArgs(), args.useDevicePtrArgs);
1325
1326 p.printRegion(region, /*printEntryBlockArgs=*/false);
1327 }
1328
1329 // These printXyz functions correspond to the custom<Xyz> definitions
1330 // in the .td file(s).
/// Region printer for the has_device_addr, host_eval, in_reduction,
/// map_entries and private clauses: packs the inputs into AllRegionPrintArgs
/// and delegates to printBlockArgRegion.
/// NOTE(review): the line declaring this function's name is not visible
/// here; presumably it implements custom<TargetOpRegion> — confirm.
1332 OpAsmPrinter &p, Operation *op, Region &region,
1333 ValueRange hasDeviceAddrVars, TypeRange hasDeviceAddrTypes,
1334 ValueRange hostEvalVars, TypeRange hostEvalTypes,
1335 ValueRange inReductionVars, TypeRange inReductionTypes,
1336 DenseBoolArrayAttr inReductionByref, ArrayAttr inReductionSyms,
1337 ValueRange mapVars, TypeRange mapTypes, ValueRange privateVars,
1338 TypeRange privateTypes, ArrayAttr privateSyms, UnitAttr privateNeedsBarrier,
1339 DenseI64ArrayAttr privateMaps) {
1340 AllRegionPrintArgs args;
1341 args.hasDeviceAddrArgs.emplace(hasDeviceAddrVars, hasDeviceAddrTypes);
1342 args.hostEvalArgs.emplace(hostEvalVars, hostEvalTypes);
1343 args.inReductionArgs.emplace(inReductionVars, inReductionTypes,
1344 inReductionByref, inReductionSyms);
1345 args.mapArgs.emplace(mapVars, mapTypes);
1346 args.privateArgs.emplace(privateVars, privateTypes, privateSyms,
1347 privateNeedsBarrier, privateMaps);
1348 printBlockArgRegion(p, op, region, args);
1349 }
1350
/// Region printer for the in_reduction and private clauses: packs the inputs
/// into AllRegionPrintArgs (without map indices for the private clause) and
/// delegates to printBlockArgRegion.
/// NOTE(review): the line declaring this function's name is not visible
/// here; presumably it implements custom<InReductionPrivateRegion> — confirm.
1352 OpAsmPrinter &p, Operation *op, Region &region, ValueRange inReductionVars,
1353 TypeRange inReductionTypes, DenseBoolArrayAttr inReductionByref,
1354 ArrayAttr inReductionSyms, ValueRange privateVars, TypeRange privateTypes,
1355 ArrayAttr privateSyms, UnitAttr privateNeedsBarrier) {
1356 AllRegionPrintArgs args;
1357 args.inReductionArgs.emplace(inReductionVars, inReductionTypes,
1358 inReductionByref, inReductionSyms);
1359 args.privateArgs.emplace(privateVars, privateTypes, privateSyms,
1360 privateNeedsBarrier,
1361 /*mapIndices=*/nullptr);
1362 printBlockArgRegion(p, op, region, args);
1363 }
1364
/// Region printer for the in_reduction, private and reduction clauses: packs
/// the inputs into AllRegionPrintArgs (without map indices for the private
/// clause) and delegates to printBlockArgRegion.
/// NOTE(review): the line declaring this function's name is not visible
/// here; presumably it implements
/// custom<InReductionPrivateReductionRegion> — confirm.
1366 OpAsmPrinter &p, Operation *op, Region &region, ValueRange inReductionVars,
1367 TypeRange inReductionTypes, DenseBoolArrayAttr inReductionByref,
1368 ArrayAttr inReductionSyms, ValueRange privateVars, TypeRange privateTypes,
1369 ArrayAttr privateSyms, UnitAttr privateNeedsBarrier,
1370 ReductionModifierAttr reductionMod, ValueRange reductionVars,
1371 TypeRange reductionTypes, DenseBoolArrayAttr reductionByref,
1372 ArrayAttr reductionSyms) {
1373 AllRegionPrintArgs args;
1374 args.inReductionArgs.emplace(inReductionVars, inReductionTypes,
1375 inReductionByref, inReductionSyms);
1376 args.privateArgs.emplace(privateVars, privateTypes, privateSyms,
1377 privateNeedsBarrier,
1378 /*mapIndices=*/nullptr);
1379 args.reductionArgs.emplace(reductionVars, reductionTypes, reductionByref,
1380 reductionSyms, reductionMod);
1381 printBlockArgRegion(p, op, region, args);
1382 }
1383
/// Region printer for the private clause only: packs the inputs into
/// AllRegionPrintArgs (without map indices) and delegates to
/// printBlockArgRegion.
/// NOTE(review): the line declaring this function's name and leading
/// parameters is not visible here; presumably it implements
/// custom<PrivateRegion> — confirm.
1385 ValueRange privateVars, TypeRange privateTypes,
1386 ArrayAttr privateSyms,
1387 UnitAttr privateNeedsBarrier) {
1388 AllRegionPrintArgs args;
1389 args.privateArgs.emplace(privateVars, privateTypes, privateSyms,
1390 privateNeedsBarrier,
1391 /*mapIndices=*/nullptr);
1392 printBlockArgRegion(p, op, region, args);
1393 }
1394
/// Region printer for the private and reduction clauses: packs the inputs
/// into AllRegionPrintArgs (without map indices for the private clause) and
/// delegates to printBlockArgRegion.
/// NOTE(review): the line declaring this function's name is not visible
/// here; presumably it implements custom<PrivateReductionRegion> — confirm.
1396 OpAsmPrinter &p, Operation *op, Region &region, ValueRange privateVars,
1397 TypeRange privateTypes, ArrayAttr privateSyms, UnitAttr privateNeedsBarrier,
1398 ReductionModifierAttr reductionMod, ValueRange reductionVars,
1399 TypeRange reductionTypes, DenseBoolArrayAttr reductionByref,
1400 ArrayAttr reductionSyms) {
1401 AllRegionPrintArgs args;
1402 args.privateArgs.emplace(privateVars, privateTypes, privateSyms,
1403 privateNeedsBarrier,
1404 /*mapIndices=*/nullptr);
1405 args.reductionArgs.emplace(reductionVars, reductionTypes, reductionByref,
1406 reductionSyms, reductionMod);
1407 printBlockArgRegion(p, op, region, args);
1408 }
1409
/// Region printer for the task_reduction clause only: packs the inputs into
/// AllRegionPrintArgs and delegates to printBlockArgRegion.
/// NOTE(review): the line declaring this function's name and leading
/// parameters is not visible here; presumably it implements
/// custom<TaskReductionRegion> — confirm.
1411 Region &region,
1412 ValueRange taskReductionVars,
1413 TypeRange taskReductionTypes,
1414 DenseBoolArrayAttr taskReductionByref,
1415 ArrayAttr taskReductionSyms) {
1416 AllRegionPrintArgs args;
1417 args.taskReductionArgs.emplace(taskReductionVars, taskReductionTypes,
1418 taskReductionByref, taskReductionSyms);
1419 printBlockArgRegion(p, op, region, args);
1420 }
1421
/// Region printer for the use_device_addr and use_device_ptr clauses: packs
/// the inputs into AllRegionPrintArgs and delegates to printBlockArgRegion.
/// NOTE(review): the line declaring this function's name and leading
/// parameters is not visible here; presumably it implements
/// custom<UseDeviceAddrUseDevicePtrRegion> — confirm.
1423 Region &region,
1424 ValueRange useDeviceAddrVars,
1425 TypeRange useDeviceAddrTypes,
1426 ValueRange useDevicePtrVars,
1427 TypeRange useDevicePtrTypes) {
1428 AllRegionPrintArgs args;
1429 args.useDeviceAddrArgs.emplace(useDeviceAddrVars, useDeviceAddrTypes);
1430 args.useDevicePtrArgs.emplace(useDevicePtrVars, useDevicePtrTypes);
1431 printBlockArgRegion(p, op, region, args);
1432 }
1433
1434 /// Verifies Reduction Clause
///
/// With reduction variables present, requires exactly one symbol per
/// variable and, if `reductionByref` is given, one by-ref flag per variable.
/// Without variables, a present `reductionSyms` is an error. Each variable
/// may appear only once, every symbol must resolve to a reduction
/// declaration, and a declaration with an accumulator type must match the
/// variable's type.
1435 static LogicalResult
1436 verifyReductionVarList(Operation *op, std::optional<ArrayAttr> reductionSyms,
1437 OperandRange reductionVars,
1438 std::optional<ArrayRef<bool>> reductionByref) {
1439 if (!reductionVars.empty()) {
1440 if (!reductionSyms || reductionSyms->size() != reductionVars.size())
1441 return op->emitOpError()
1442 << "expected as many reduction symbol references "
1443 "as reduction variables";
// NOTE(review): this is the only diagnostic here using emitError() rather
// than emitOpError() — confirm whether that is intentional.
1444 if (reductionByref && reductionByref->size() != reductionVars.size())
1445 return op->emitError() << "expected as many reduction variable by "
1446 "reference attributes as reduction variables";
1447 } else {
1448 if (reductionSyms)
1449 return op->emitOpError() << "unexpected reduction symbol references";
1450 return success();
1451 }
1452
1453 // TODO: The following should be done in
1454 // SymbolUserOpInterface::verifySymbolUses.
1455 DenseSet<Value> accumulators;
1456 for (auto args : llvm::zip(reductionVars, *reductionSyms)) {
1457 Value accum = std::get<0>(args);
1458
// insert() reports whether the value was newly added; a repeat is rejected.
1459 if (!accumulators.insert(accum).second)
1460 return op->emitOpError() << "accumulator variable used more than once";
1461
1462 Type varType = accum.getType();
1463 auto symbolRef = llvm::cast<SymbolRefAttr>(std::get<1>(args));
1464 auto decl =
1466 if (!decl)
1467 return op->emitOpError() << "expected symbol reference " << symbolRef
1468 << " to point to a reduction declaration";
1469
// A declaration without an accumulator type is accepted for any variable.
1470 if (decl.getAccumulatorType() && decl.getAccumulatorType() != varType)
1471 return op->emitOpError()
1472 << "expected accumulator (" << varType
1473 << ") to be the same type as reduction declaration ("
1474 << decl.getAccumulatorType() << ")";
1475 }
1476
1477 return success();
1478 }
1479
1480//===----------------------------------------------------------------------===//
1481// Parser, printer and verifier for Copyprivate
1482//===----------------------------------------------------------------------===//
1483
/// Parses a comma-separated copyprivate list. For every entry the operand is
/// appended to `copyprivateVars`, its type to `copyprivateTypes` and its
/// symbol to a local list that is stored into `copyprivateSyms` as an
/// ArrayAttr once the whole list has been parsed.
///
1484 /// copyprivate-entry-list ::= copyprivate-entry
1485 /// | copyprivate-entry-list `,` copyprivate-entry
1486 /// copyprivate-entry ::= ssa-id `->` symbol-ref `:` type
1487 static ParseResult parseCopyprivate(
1488 OpAsmParser &parser,
1490 SmallVectorImpl<Type> &copyprivateTypes, ArrayAttr &copyprivateSyms) {
1492 if (failed(parser.parseCommaSeparatedList([&]() {
1493 if (parser.parseOperand(copyprivateVars.emplace_back()) ||
1494 parser.parseArrow() ||
1495 parser.parseAttribute(symsVec.emplace_back()) ||
1496 parser.parseColonType(copyprivateTypes.emplace_back()))
1497 return failure();
1498 return success();
1499 })))
1500 return failure();
// Convert the collected symbols to generic attributes for ArrayAttr::get.
1501 SmallVector<Attribute> syms(symsVec.begin(), symsVec.end());
1502 copyprivateSyms = ArrayAttr::get(parser.getContext(), syms);
1503 return success();
1504 }
1505
1506 /// Print Copyprivate clause
///
/// Emits the comma-separated entries `var -> sym : type`. Nothing is printed
/// when `copyprivateSyms` holds no value. llvm::zip is used, so iteration
/// stops at the shortest of the three ranges.
1508 OperandRange copyprivateVars,
1509 TypeRange copyprivateTypes,
1510 std::optional<ArrayAttr> copyprivateSyms) {
1511 if (!copyprivateSyms.has_value())
1512 return;
1513 llvm::interleaveComma(
1514 llvm::zip(copyprivateVars, *copyprivateSyms, copyprivateTypes), p,
1515 [&](const auto &args) {
1516 p << std::get<0>(args) << " -> " << std::get<1>(args) << " : "
1517 << std::get<2>(args);
1518 });
1519 }
1520
1521 /// Verifies CopyPrivate Clause
///
/// Requires as many symbols as copyprivate variables (an absent symbol list
/// counts as zero). Every symbol must resolve to either a func::FuncOp or an
/// LLVM::LLVMFuncOp that takes exactly two arguments of the same type, and
/// that type must equal the type of the corresponding variable.
1522 static LogicalResult
1524 std::optional<ArrayAttr> copyprivateSyms) {
1525 size_t copyprivateSymsSize =
1526 copyprivateSyms.has_value() ? copyprivateSyms->size() : 0;
1527 if (copyprivateSymsSize != copyprivateVars.size())
1528 return op->emitOpError() << "inconsistent number of copyprivate vars (= "
1529 << copyprivateVars.size()
1530 << ") and functions (= " << copyprivateSymsSize
1531 << "), both must be equal";
// Sizes match, so an absent symbol list implies there are no variables.
1532 if (!copyprivateSyms.has_value())
1533 return success();
1534
1535 for (auto copyprivateVarAndSym :
1536 llvm::zip(copyprivateVars, *copyprivateSyms)) {
1537 auto symbolRef =
1538 llvm::cast<SymbolRefAttr>(std::get<1>(copyprivateVarAndSym));
// Holds whichever of the two supported function ops the symbol resolves to;
// stays empty when neither lookup succeeds.
1539 std::optional<std::variant<mlir::func::FuncOp, mlir::LLVM::LLVMFuncOp>>
1540 funcOp;
1541 if (mlir::func::FuncOp mlirFuncOp =
1543 symbolRef))
1544 funcOp = mlirFuncOp;
1545 else if (mlir::LLVM::LLVMFuncOp llvmFuncOp =
1547 op, symbolRef))
1548 funcOp = llvmFuncOp;
1549
// Both helpers dereference `funcOp`; they are only invoked after the
// emptiness check below.
1550 auto getNumArguments = [&] {
1551 return std::visit([](auto &f) { return f.getNumArguments(); }, *funcOp);
1552 };
1553
1554 auto getArgumentType = [&](unsigned i) {
1555 return std::visit([i](auto &f) { return f.getArgumentTypes()[i]; },
1556 *funcOp);
1557 };
1558
1559 if (!funcOp)
1560 return op->emitOpError() << "expected symbol reference " << symbolRef
1561 << " to point to a copy function";
1562
1563 if (getNumArguments() != 2)
1564 return op->emitOpError()
1565 << "expected copy function " << symbolRef << " to have 2 operands";
1566
1567 Type argTy = getArgumentType(0);
1568 if (argTy != getArgumentType(1))
1569 return op->emitOpError() << "expected copy function " << symbolRef
1570 << " arguments to have the same type";
1571
1572 Type varType = std::get<0>(copyprivateVarAndSym).getType();
1573 if (argTy != varType)
1574 return op->emitOpError()
1575 << "expected copy function arguments' type (" << argTy
1576 << ") to be the same as copyprivate variable's type (" << varType
1577 << ")";
1578 }
1579
1580 return success();
1581 }
1582
1583//===----------------------------------------------------------------------===//
1584// Parser, printer and verifier for DependVarList
1585//===----------------------------------------------------------------------===//
1586
/// Parses a comma-separated depend list. For every entry the operand is
/// appended to `dependVars`, its type to `dependTypes` and the symbolized
/// depend kind to a local list that is stored into `dependKinds` as an
/// ArrayAttr once the whole list has been parsed.
///
1587 /// depend-entry-list ::= depend-entry
1588 /// | depend-entry-list `,` depend-entry
1589 /// depend-entry ::= depend-kind `->` ssa-id `:` type
1590 static ParseResult
1593 SmallVectorImpl<Type> &dependTypes, ArrayAttr &dependKinds) {
1595 if (failed(parser.parseCommaSeparatedList([&]() {
1596 StringRef keyword;
1597 if (parser.parseKeyword(&keyword) || parser.parseArrow() ||
1598 parser.parseOperand(dependVars.emplace_back()) ||
1599 parser.parseColonType(dependTypes.emplace_back()))
1600 return failure();
// The kind keyword is validated only after the rest of the entry has been
// consumed. NOTE(review): an unknown keyword fails here without emitting a
// diagnostic of its own.
1601 if (std::optional<ClauseTaskDepend> keywordDepend =
1602 (symbolizeClauseTaskDepend(keyword)))
1603 kindsVec.emplace_back(
1604 ClauseTaskDependAttr::get(parser.getContext(), *keywordDepend));
1605 else
1606 return failure();
1607 return success();
1608 })))
1609 return failure();
// Convert the collected kinds to generic attributes for ArrayAttr::get.
1610 SmallVector<Attribute> kinds(kindsVec.begin(), kindsVec.end());
1611 dependKinds = ArrayAttr::get(parser.getContext(), kinds);
1612 return success();
1613 }
1614
1615 /// Print Depend clause
///
/// Emits the comma-separated entries `kind -> var : type`, one per element
/// of `dependKinds`; `dependVars` and `dependTypes` are indexed in lockstep.
1617 OperandRange dependVars, TypeRange dependTypes,
1618 std::optional<ArrayAttr> dependKinds) {
1619
// NOTE(review): `dependKinds` is dereferenced without a has_value() check;
// this assumes callers only print the clause when the attribute is set —
// confirm.
1620 for (unsigned i = 0, e = dependKinds->size(); i < e; ++i) {
1621 if (i != 0)
1622 p << ", ";
1623 p << stringifyClauseTaskDepend(
1624 llvm::cast<mlir::omp::ClauseTaskDependAttr>((*dependKinds)[i])
1625 .getValue())
1626 << " -> " << dependVars[i] << " : " << dependTypes[i];
1627 }
1628 }
1629
1630/// Verifies Depend clause
1631static LogicalResult verifyDependVarList(Operation *op,
1632 std::optional<ArrayAttr> dependKinds,
1633 OperandRange dependVars) {
1634 if (!dependVars.empty()) {
1635 if (!dependKinds || dependKinds->size() != dependVars.size())
1636 return op->emitOpError() << "expected as many depend values"
1637 " as depend variables";
1638 } else {
1639 if (dependKinds && !dependKinds->empty())
1640 return op->emitOpError() << "unexpected depend values";
1641 return success();
1642 }
1643
1644 return success();
1645}
1646
1647//===----------------------------------------------------------------------===//
1648// Parser, printer and verifier for Synchronization Hint (2.17.12)
1649//===----------------------------------------------------------------------===//
1650
1651/// Parses a Synchronization Hint clause. The value of hint is an integer
1652/// which is a combination of different hints from `omp_sync_hint_t`.
1653///
1654/// hint-clause = `hint` `(` hint-value `)`
1655static ParseResult parseSynchronizationHint(OpAsmParser &parser,
1656 IntegerAttr &hintAttr) {
1657 StringRef hintKeyword;
1658 int64_t hint = 0;
1659 if (succeeded(parser.parseOptionalKeyword("none"))) {
1660 hintAttr = IntegerAttr::get(parser.getBuilder().getI64Type(), 0);
1661 return success();
1662 }
1663 auto parseKeyword = [&]() -> ParseResult {
1664 if (failed(parser.parseKeyword(&hintKeyword)))
1665 return failure();
1666 if (hintKeyword == "uncontended")
1667 hint |= 1;
1668 else if (hintKeyword == "contended")
1669 hint |= 2;
1670 else if (hintKeyword == "nonspeculative")
1671 hint |= 4;
1672 else if (hintKeyword == "speculative")
1673 hint |= 8;
1674 else
1675 return parser.emitError(parser.getCurrentLocation())
1676 << hintKeyword << " is not a valid hint";
1677 return success();
1678 };
1679 if (parser.parseCommaSeparatedList(parseKeyword))
1680 return failure();
1681 hintAttr = IntegerAttr::get(parser.getBuilder().getI64Type(), hint);
1682 return success();
1683}
1684
1685 /// Prints a Synchronization Hint clause
///
/// A hint of 0 prints as `none`. Otherwise the names of the set bits among
/// bit 0 (uncontended), bit 1 (contended), bit 2 (nonspeculative) and bit 3
/// (speculative) are printed as a comma-separated list, in that order.
1687 IntegerAttr hintAttr) {
1688 int64_t hint = hintAttr.getInt();
1689
1690 if (hint == 0) {
1691 p << "none";
1692 return;
1693 }
1694
1695 // Helper function to get n-th bit from the right end of `value`
// The helper takes `int`, so the 64-bit hint is narrowed when passed in;
// only bits 0-3 are inspected below.
1696 auto bitn = [](int value, int n) -> bool { return value & (1 << n); };
1697
1698 bool uncontended = bitn(hint, 0);
1699 bool contended = bitn(hint, 1);
1700 bool nonspeculative = bitn(hint, 2);
1701 bool speculative = bitn(hint, 3);
1702
1704 if (uncontended)
1705 hints.push_back("uncontended");
1706 if (contended)
1707 hints.push_back("contended");
1708 if (nonspeculative)
1709 hints.push_back("nonspeculative");
1710 if (speculative)
1711 hints.push_back("speculative");
1712
1713 llvm::interleaveComma(hints, p);
1714 }
1715
1716/// Verifies a synchronization hint clause
1717static LogicalResult verifySynchronizationHint(Operation *op, uint64_t hint) {
1718
1719 // Helper function to get n-th bit from the right end of `value`
1720 auto bitn = [](int value, int n) -> bool { return value & (1 << n); };
1721
1722 bool uncontended = bitn(hint, 0);
1723 bool contended = bitn(hint, 1);
1724 bool nonspeculative = bitn(hint, 2);
1725 bool speculative = bitn(hint, 3);
1726
1727 if (uncontended && contended)
1728 return op->emitOpError() << "the hints omp_sync_hint_uncontended and "
1729 "omp_sync_hint_contended cannot be combined";
1730 if (nonspeculative && speculative)
1731 return op->emitOpError() << "the hints omp_sync_hint_nonspeculative and "
1732 "omp_sync_hint_speculative cannot be combined.";
1733 return success();
1734}
1735
1736//===----------------------------------------------------------------------===//
1737// Parser, printer and verifier for Target
1738//===----------------------------------------------------------------------===//
1739
1740// Helper function to get bitwise AND of `value` and 'flag' then return it as a
1741// boolean
1742static bool mapTypeToBool(ClauseMapFlags value, ClauseMapFlags flag) {
1743 return (value & flag) == flag;
1744}
1745
1746/// Parses a map_entries map type from a string format back into its numeric
1747/// value.
1748///
1749/// map-clause = `map_clauses ( ( `(` `always, `? `implicit, `? `ompx_hold, `?
1750/// `close, `? `present, `? ( `to` | `from` | `delete` `)` )+ `)` )
1751static ParseResult parseMapClause(OpAsmParser &parser,
1752 ClauseMapFlagsAttr &mapType) {
1753 ClauseMapFlags mapTypeBits = ClauseMapFlags::none;
1754 // This simply verifies the correct keyword is read in, the
1755 // keyword itself is stored inside of the operation
1756 auto parseTypeAndMod = [&]() -> ParseResult {
1757 StringRef mapTypeMod;
1758 if (parser.parseKeyword(&mapTypeMod))
1759 return failure();
1760
1761 if (mapTypeMod == "always")
1762 mapTypeBits |= ClauseMapFlags::always;
1763
1764 if (mapTypeMod == "implicit")
1765 mapTypeBits |= ClauseMapFlags::implicit;
1766
1767 if (mapTypeMod == "ompx_hold")
1768 mapTypeBits |= ClauseMapFlags::ompx_hold;
1769
1770 if (mapTypeMod == "close")
1771 mapTypeBits |= ClauseMapFlags::close;
1772
1773 if (mapTypeMod == "present")
1774 mapTypeBits |= ClauseMapFlags::present;
1775
1776 if (mapTypeMod == "to")
1777 mapTypeBits |= ClauseMapFlags::to;
1778
1779 if (mapTypeMod == "from")
1780 mapTypeBits |= ClauseMapFlags::from;
1781
1782 if (mapTypeMod == "tofrom")
1783 mapTypeBits |= ClauseMapFlags::to | ClauseMapFlags::from;
1784
1785 if (mapTypeMod == "delete")
1786 mapTypeBits |= ClauseMapFlags::del;
1787
1788 if (mapTypeMod == "storage")
1789 mapTypeBits |= ClauseMapFlags::storage;
1790
1791 if (mapTypeMod == "return_param")
1792 mapTypeBits |= ClauseMapFlags::return_param;
1793
1794 if (mapTypeMod == "private")
1795 mapTypeBits |= ClauseMapFlags::priv;
1796
1797 if (mapTypeMod == "literal")
1798 mapTypeBits |= ClauseMapFlags::literal;
1799
1800 if (mapTypeMod == "attach")
1801 mapTypeBits |= ClauseMapFlags::attach;
1802
1803 if (mapTypeMod == "attach_always")
1804 mapTypeBits |= ClauseMapFlags::attach_always;
1805
1806 if (mapTypeMod == "attach_none")
1807 mapTypeBits |= ClauseMapFlags::attach_none;
1808
1809 if (mapTypeMod == "attach_auto")
1810 mapTypeBits |= ClauseMapFlags::attach_auto;
1811
1812 if (mapTypeMod == "ref_ptr")
1813 mapTypeBits |= ClauseMapFlags::ref_ptr;
1814
1815 if (mapTypeMod == "ref_ptee")
1816 mapTypeBits |= ClauseMapFlags::ref_ptee;
1817
1818 if (mapTypeMod == "ref_ptr_ptee")
1819 mapTypeBits |= ClauseMapFlags::ref_ptr_ptee;
1820
1821 if (mapTypeMod == "is_device_ptr")
1822 mapTypeBits |= ClauseMapFlags::is_device_ptr;
1823
1824 return success();
1825 };
1826
1827 if (parser.parseCommaSeparatedList(parseTypeAndMod))
1828 return failure();
1829
1830 mapType =
1831 parser.getBuilder().getAttr<mlir::omp::ClauseMapFlagsAttr>(mapTypeBits);
1832
1833 return success();
1834}
1835
1836/// Prints the map type flags carried by `mapType` as a list of keywords
1837/// separated by ", ".
/// The keyword `none` is printed when the flag value equals
/// ClauseMapFlags::none. `op` is not referenced in the visible body.
1838static void printMapClause(OpAsmPrinter &p, Operation *op,
1839 ClauseMapFlagsAttr mapType) {
 // NOTE(review): source line 1840 is absent from this listing; it presumably
 // declares `mapTypeStrs`, the list of keyword strings filled in below --
 // confirm against the upstream file.
1841 ClauseMapFlags mapFlags = mapType.getValue();
1842
1843 // The always, implicit, ompx_hold, close and present modifiers are placed at
1844 // the beginning of the string to aid readability.
1845 if (mapTypeToBool(mapFlags, ClauseMapFlags::always))
1846 mapTypeStrs.push_back("always");
1847 if (mapTypeToBool(mapFlags, ClauseMapFlags::implicit))
1848 mapTypeStrs.push_back("implicit");
1849 if (mapTypeToBool(mapFlags, ClauseMapFlags::ompx_hold))
1850 mapTypeStrs.push_back("ompx_hold");
1851 if (mapTypeToBool(mapFlags, ClauseMapFlags::close))
1852 mapTypeStrs.push_back("close");
1853 if (mapTypeToBool(mapFlags, ClauseMapFlags::present))
1854 mapTypeStrs.push_back("present");
1855
1856 // Special handling of to/from/tofrom/delete and release/alloc: release and
1857 // alloc are the absence of one of the other flags, whereas tofrom requires
1858 // both the to and from flags to be set.
1859 bool to = mapTypeToBool(mapFlags, ClauseMapFlags::to);
1860 bool from = mapTypeToBool(mapFlags, ClauseMapFlags::from);
1861
1862 if (to && from)
1863 mapTypeStrs.push_back("tofrom");
1864 else if (from)
1865 mapTypeStrs.push_back("from");
1866 else if (to)
1867 mapTypeStrs.push_back("to");
1868
 // Every remaining flag maps to exactly one keyword.
1869 if (mapTypeToBool(mapFlags, ClauseMapFlags::del))
1870 mapTypeStrs.push_back("delete");
1871 if (mapTypeToBool(mapFlags, ClauseMapFlags::return_param))
1872 mapTypeStrs.push_back("return_param");
1873 if (mapTypeToBool(mapFlags, ClauseMapFlags::storage))
1874 mapTypeStrs.push_back("storage");
1875 if (mapTypeToBool(mapFlags, ClauseMapFlags::priv))
1876 mapTypeStrs.push_back("private");
1877 if (mapTypeToBool(mapFlags, ClauseMapFlags::literal))
1878 mapTypeStrs.push_back("literal");
1879 if (mapTypeToBool(mapFlags, ClauseMapFlags::attach))
1880 mapTypeStrs.push_back("attach");
1881 if (mapTypeToBool(mapFlags, ClauseMapFlags::attach_always))
1882 mapTypeStrs.push_back("attach_always");
1883 if (mapTypeToBool(mapFlags, ClauseMapFlags::attach_none))
1884 mapTypeStrs.push_back("attach_none");
1885 if (mapTypeToBool(mapFlags, ClauseMapFlags::attach_auto))
1886 mapTypeStrs.push_back("attach_auto");
1887 if (mapTypeToBool(mapFlags, ClauseMapFlags::ref_ptr))
1888 mapTypeStrs.push_back("ref_ptr");
1889 if (mapTypeToBool(mapFlags, ClauseMapFlags::ref_ptee))
1890 mapTypeStrs.push_back("ref_ptee");
1891 if (mapTypeToBool(mapFlags, ClauseMapFlags::ref_ptr_ptee))
1892 mapTypeStrs.push_back("ref_ptr_ptee");
1893 if (mapTypeToBool(mapFlags, ClauseMapFlags::is_device_ptr))
1894 mapTypeStrs.push_back("is_device_ptr");
1895 if (mapFlags == ClauseMapFlags::none)
1896 mapTypeStrs.push_back("none");
1897
 // Emit the collected keywords, inserting ", " between consecutive entries.
1898 for (unsigned int i = 0; i < mapTypeStrs.size(); ++i) {
1899 p << mapTypeStrs[i];
1900 if (i + 1 < mapTypeStrs.size()) {
1901 p << ", ";
1902 }
1903 }
1904}
1905
1906static ParseResult parseMembersIndex(OpAsmParser &parser,
1907 ArrayAttr &membersIdx) {
1908 SmallVector<Attribute> values, memberIdxs;
1909
1910 auto parseIndices = [&]() -> ParseResult {
1911 int64_t value;
1912 if (parser.parseInteger(value))
1913 return failure();
1914 values.push_back(IntegerAttr::get(parser.getBuilder().getIntegerType(64),
1915 APInt(64, value, /*isSigned=*/false)));
1916 return success();
1917 };
1918
1919 do {
1920 if (failed(parser.parseLSquare()))
1921 return failure();
1922
1923 if (parser.parseCommaSeparatedList(parseIndices))
1924 return failure();
1925
1926 if (failed(parser.parseRSquare()))
1927 return failure();
1928
1929 memberIdxs.push_back(ArrayAttr::get(parser.getContext(), values));
1930 values.clear();
1931 } while (succeeded(parser.parseOptionalComma()));
1932
1933 if (!memberIdxs.empty())
1934 membersIdx = ArrayAttr::get(parser.getContext(), memberIdxs);
1935
1936 return success();
1937}
1938
1939static void printMembersIndex(OpAsmPrinter &p, MapInfoOp op,
1940 ArrayAttr membersIdx) {
1941 if (!membersIdx)
1942 return;
1943
1944 llvm::interleaveComma(membersIdx, p, [&p](Attribute v) {
1945 p << "[";
1946 auto memberIdx = cast<ArrayAttr>(v);
1947 llvm::interleaveComma(memberIdx.getValue(), p, [&p](Attribute v2) {
1948 p << cast<IntegerAttr>(v2).getInt();
1949 });
1950 p << "]";
1951 });
1952}
1953
1955 VariableCaptureKindAttr mapCaptureType) {
 // NOTE(review): the first line of this function's signature (source line
 // 1954) is absent from this listing -- confirm it against the upstream file.
 //
 // Prints the keyword matching the capture kind held by `mapCaptureType`:
 // "ByRef", "ByCopy", "VLAType" or "This". If the value matches none of the
 // four kinds compared below, an empty string is printed.
1956 std::string typeCapStr;
1957 llvm::raw_string_ostream typeCap(typeCapStr);
1958 if (mapCaptureType.getValue() == mlir::omp::VariableCaptureKind::ByRef)
1959 typeCap << "ByRef";
1960 if (mapCaptureType.getValue() == mlir::omp::VariableCaptureKind::ByCopy)
1961 typeCap << "ByCopy";
1962 if (mapCaptureType.getValue() == mlir::omp::VariableCaptureKind::VLAType)
1963 typeCap << "VLAType";
1964 if (mapCaptureType.getValue() == mlir::omp::VariableCaptureKind::This)
1965 typeCap << "This";
 // The keyword is assembled in `typeCapStr` through the string stream above.
1966 p << typeCapStr;
1967}
1968
1969static ParseResult parseCaptureType(OpAsmParser &parser,
1970 VariableCaptureKindAttr &mapCaptureType) {
1971 StringRef mapCaptureKey;
1972 if (parser.parseKeyword(&mapCaptureKey))
1973 return failure();
1974
1975 if (mapCaptureKey == "This")
1976 mapCaptureType = mlir::omp::VariableCaptureKindAttr::get(
1977 parser.getContext(), mlir::omp::VariableCaptureKind::This);
1978 if (mapCaptureKey == "ByRef")
1979 mapCaptureType = mlir::omp::VariableCaptureKindAttr::get(
1980 parser.getContext(), mlir::omp::VariableCaptureKind::ByRef);
1981 if (mapCaptureKey == "ByCopy")
1982 mapCaptureType = mlir::omp::VariableCaptureKindAttr::get(
1983 parser.getContext(), mlir::omp::VariableCaptureKind::ByCopy);
1984 if (mapCaptureKey == "VLAType")
1985 mapCaptureType = mlir::omp::VariableCaptureKindAttr::get(
1986 parser.getContext(), mlir::omp::VariableCaptureKind::VLAType);
1987
1988 return success();
1989}
1990
/// Verifies the map operands (`mapVars`) of `op`.
///
/// Every operand must be defined by an operation. Operands defined by a
/// MapInfoOp are checked against the map type restrictions of the kind of
/// operation `op` is; any other defining operation is rejected unless `op` is
/// a DeclareMapperInfoOp. The first violation is reported as an error at the
/// location of `op`.
1991static LogicalResult verifyMapClause(Operation *op, OperandRange mapVars) {
 // NOTE(review): source lines 1992-1993 are absent from this listing; they
 // presumably declare the `updateToVars` and `updateFromVars` sets used
 // below -- confirm against the upstream file.
1994
1995 for (auto mapOp : mapVars) {
1996 if (!mapOp.getDefiningOp())
1997 return emitError(op->getLoc(), "missing map operation");
1998
1999 if (auto mapInfoOp = mapOp.getDefiningOp<mlir::omp::MapInfoOp>()) {
2000 mlir::omp::ClauseMapFlags mapTypeBits = mapInfoOp.getMapType();
2001
 // Decode the individual map type and modifier flags that are checked below.
2002 bool to = mapTypeToBool(mapTypeBits, ClauseMapFlags::to);
2003 bool from = mapTypeToBool(mapTypeBits, ClauseMapFlags::from);
2004 bool del = mapTypeToBool(mapTypeBits, ClauseMapFlags::del);
2005
2006 bool always = mapTypeToBool(mapTypeBits, ClauseMapFlags::always);
2007 bool close = mapTypeToBool(mapTypeBits, ClauseMapFlags::close);
2008 bool implicit = mapTypeToBool(mapTypeBits, ClauseMapFlags::implicit);
2009
 // TargetDataOp and TargetOp reject the delete map type.
2010 if ((isa<TargetDataOp>(op) || isa<TargetOp>(op)) && del)
2011 return emitError(op->getLoc(),
2012 "to, from, tofrom and alloc map types are permitted");
2013
 // TargetEnterDataOp rejects the from and delete map types.
2014 if (isa<TargetEnterDataOp>(op) && (from || del))
2015 return emitError(op->getLoc(), "to and alloc map types are permitted");
2016
 // TargetExitDataOp rejects the to map type.
2017 if (isa<TargetExitDataOp>(op) && to)
2018 return emitError(op->getLoc(),
2019 "from, release and delete map types are permitted");
2020
2021 if (isa<TargetUpdateOp>(op)) {
2022 if (del) {
2023 return emitError(op->getLoc(),
2024 "at least one of to or from map types must be "
2025 "specified, other map types are not permitted");
2026 }
2027
2028 if (!to && !from) {
2029 return emitError(op->getLoc(),
2030 "at least one of to or from map types must be "
2031 "specified, other map types are not permitted");
2032 }
2033
2034 auto updateVar = mapInfoOp.getVarPtr();
2035
 // A variable may be updated in one direction only: reject an entry that
 // sets both flags, and reject a variable already recorded for the
 // opposite direction by an earlier map entry of this op.
2036 if ((to && from) || (to && updateFromVars.contains(updateVar)) ||
2037 (from && updateToVars.contains(updateVar))) {
2038 return emitError(
2039 op->getLoc(),
2040 "either to or from map types can be specified, not both");
2041 }
2042
 // The always, close and implicit modifiers are rejected here.
2043 if (always || close || implicit) {
2044 return emitError(
2045 op->getLoc(),
2046 "present, mapper and iterator map type modifiers are permitted");
2047 }
2048
 // Record the direction of this variable for the checks on later entries.
2049 to ? updateToVars.insert(updateVar) : updateFromVars.insert(updateVar);
2050 }
2051 } else if (!isa<DeclareMapperInfoOp>(op)) {
2052 return emitError(op->getLoc(),
2053 "map argument is not a map entry operation");
2054 }
2055 }
2056
2057 return success();
2058}
2059
2060static LogicalResult verifyPrivateVarsMapping(TargetOp targetOp) {
2061 std::optional<DenseI64ArrayAttr> privateMapIndices =
2062 targetOp.getPrivateMapsAttr();
2063
2064 // None of the private operands are mapped.
2065 if (!privateMapIndices.has_value() || !privateMapIndices.value())
2066 return success();
2067
2068 OperandRange privateVars = targetOp.getPrivateVars();
2069
2070 if (privateMapIndices.value().size() !=
2071 static_cast<int64_t>(privateVars.size()))
2072 return emitError(targetOp.getLoc(), "sizes of `private` operand range and "
2073 "`private_maps` attribute mismatch");
2074
2075 return success();
2076}
2077
2078//===----------------------------------------------------------------------===//
2079// MapInfoOp
2080//===----------------------------------------------------------------------===//
2081
2082static LogicalResult verifyMapInfoDefinedArgs(Operation *op,
2083 StringRef clauseName,
2084 OperandRange vars) {
2085 for (Value var : vars)
2086 if (!llvm::isa_and_present<MapInfoOp>(var.getDefiningOp()))
2087 return op->emitOpError()
2088 << "'" << clauseName
2089 << "' arguments must be defined by 'omp.map.info' ops";
2090 return success();
2091}
2092
/// Verifies this map entry: a mapper id, when present, must pass the lookup
/// below, and every `members` operand must be defined by a MapInfoOp.
2093LogicalResult MapInfoOp::verify() {
 // NOTE(review): source line 2095 (the callee of the lookup whose arguments
 // appear on the next visible line) is absent from this listing -- confirm
 // against the upstream file.
2094 if (getMapperId() &&
2096 *this, getMapperIdAttr())) {
2097 return emitError("invalid mapper id");
2098 }
2099
2100 if (failed(verifyMapInfoDefinedArgs(*this, "members", getMembers())))
2101 return failure();
2102
2103 return success();
2104}
2105
2106//===----------------------------------------------------------------------===//
2107// TargetDataOp
2108//===----------------------------------------------------------------------===//
2109
/// Builds a TargetDataOp from a TargetDataOperands clause structure by
/// forwarding its device, ifExpr, mapVars, useDeviceAddrVars and
/// useDevicePtrVars fields, in that order, to the overload that takes them as
/// individual arguments.
2110void TargetDataOp::build(OpBuilder &builder, OperationState &state,
2111 const TargetDataOperands &clauses) {
2112 TargetDataOp::build(builder, state, clauses.device, clauses.ifExpr,
2113 clauses.mapVars, clauses.useDeviceAddrVars,
2114 clauses.useDevicePtrVars);
2115}
2116
2117LogicalResult TargetDataOp::verify() {
2118 if (getMapVars().empty() && getUseDevicePtrVars().empty() &&
2119 getUseDeviceAddrVars().empty()) {
2120 return ::emitError(this->getLoc(),
2121 "At least one of map, use_device_ptr_vars, or "
2122 "use_device_addr_vars operand must be present");
2123 }
2124
2125 if (failed(verifyMapInfoDefinedArgs(*this, "use_device_ptr",
2126 getUseDevicePtrVars())))
2127 return failure();
2128
2129 if (failed(verifyMapInfoDefinedArgs(*this, "use_device_addr",
2130 getUseDeviceAddrVars())))
2131 return failure();
2132
2133 return verifyMapClause(*this, getMapVars());
2134}
2135
2136//===----------------------------------------------------------------------===//
2137// TargetEnterDataOp
2138//===----------------------------------------------------------------------===//
2139
/// Builds a TargetEnterDataOp from a TargetEnterExitUpdateDataOperands clause
/// structure. The dependKinds list is converted to an attribute through
/// makeArrayAttr; the dependVars, device, ifExpr, mapVars and nowait fields
/// are forwarded unchanged to the overload taking individual arguments.
2140void TargetEnterDataOp::build(
2141 OpBuilder &builder, OperationState &state,
2142 const TargetEnterExitUpdateDataOperands &clauses) {
2143 MLIRContext *ctx = builder.getContext();
2144 TargetEnterDataOp::build(builder, state,
2145 makeArrayAttr(ctx, clauses.dependKinds),
2146 clauses.dependVars, clauses.device, clauses.ifExpr,
2147 clauses.mapVars, clauses.nowait);
2148}
2149
2150LogicalResult TargetEnterDataOp::verify() {
2151 LogicalResult verifyDependVars =
2152 verifyDependVarList(*this, getDependKinds(), getDependVars());
2153 return failed(verifyDependVars) ? verifyDependVars
2154 : verifyMapClause(*this, getMapVars());
2155}
2156
2157//===----------------------------------------------------------------------===//
2158// TargetExitDataOp
2159//===----------------------------------------------------------------------===//
2160
/// Builds a TargetExitDataOp from a TargetEnterExitUpdateDataOperands clause
/// structure. The dependKinds list is converted to an attribute through
/// makeArrayAttr; the dependVars, device, ifExpr, mapVars and nowait fields
/// are forwarded unchanged to the overload taking individual arguments.
2161void TargetExitDataOp::build(OpBuilder &builder, OperationState &state,
2162 const TargetEnterExitUpdateDataOperands &clauses) {
2163 MLIRContext *ctx = builder.getContext();
2164 TargetExitDataOp::build(builder, state,
2165 makeArrayAttr(ctx, clauses.dependKinds),
2166 clauses.dependVars, clauses.device, clauses.ifExpr,
2167 clauses.mapVars, clauses.nowait);
2168}
2169
2170LogicalResult TargetExitDataOp::verify() {
2171 LogicalResult verifyDependVars =
2172 verifyDependVarList(*this, getDependKinds(), getDependVars());
2173 return failed(verifyDependVars) ? verifyDependVars
2174 : verifyMapClause(*this, getMapVars());
2175}
2176
2177//===----------------------------------------------------------------------===//
2178// TargetUpdateOp
2179//===----------------------------------------------------------------------===//
2180
/// Builds a TargetUpdateOp from a TargetEnterExitUpdateDataOperands clause
/// structure. The dependKinds list is converted to an attribute through
/// makeArrayAttr; the dependVars, device, ifExpr, mapVars and nowait fields
/// are forwarded unchanged to the overload taking individual arguments.
2181void TargetUpdateOp::build(OpBuilder &builder, OperationState &state,
2182 const TargetEnterExitUpdateDataOperands &clauses) {
2183 MLIRContext *ctx = builder.getContext();
2184 TargetUpdateOp::build(builder, state, makeArrayAttr(ctx, clauses.dependKinds),
2185 clauses.dependVars, clauses.device, clauses.ifExpr,
2186 clauses.mapVars, clauses.nowait);
2187}
2188
2189LogicalResult TargetUpdateOp::verify() {
2190 LogicalResult verifyDependVars =
2191 verifyDependVarList(*this, getDependKinds(), getDependVars());
2192 return failed(verifyDependVars) ? verifyDependVars
2193 : verifyMapClause(*this, getMapVars());
2194}
2195
2196//===----------------------------------------------------------------------===//
2197// TargetOp
2198//===----------------------------------------------------------------------===//
2199
/// Builds a TargetOp from a TargetOperands clause structure by forwarding its
/// fields to the overload taking individual arguments. The dependKinds and
/// privateSyms lists are converted to attributes through makeArrayAttr. The
/// allocate and in_reduction arguments are passed as empty/null (see the TODO
/// below), and private_maps is passed as null.
2200void TargetOp::build(OpBuilder &builder, OperationState &state,
2201 const TargetOperands &clauses) {
2202 MLIRContext *ctx = builder.getContext();
2203 // TODO Store clauses in op: allocateVars, allocatorVars, inReductionVars,
2204 // inReductionByref, inReductionSyms.
2205 TargetOp::build(builder, state, /*allocate_vars=*/{}, /*allocator_vars=*/{},
2206 clauses.bare, makeArrayAttr(ctx, clauses.dependKinds),
2207 clauses.dependVars, clauses.device, clauses.hasDeviceAddrVars,
2208 clauses.hostEvalVars, clauses.ifExpr,
2209 /*in_reduction_vars=*/{}, /*in_reduction_byref=*/nullptr,
2210 /*in_reduction_syms=*/nullptr, clauses.isDevicePtrVars,
2211 clauses.mapVars, clauses.nowait, clauses.privateVars,
2212 makeArrayAttr(ctx, clauses.privateSyms),
2213 clauses.privateNeedsBarrier, clauses.threadLimit,
2214 /*private_maps=*/nullptr);
2215}
2216
2217LogicalResult TargetOp::verify() {
2218 if (failed(verifyDependVarList(*this, getDependKinds(), getDependVars())))
2219 return failure();
2220
2221 if (failed(verifyMapInfoDefinedArgs(*this, "has_device_addr",
2222 getHasDeviceAddrVars())))
2223 return failure();
2224
2225 if (failed(verifyMapClause(*this, getMapVars())))
2226 return failure();
2227
2228 return verifyPrivateVarsMapping(*this);
2229}
2230
2231LogicalResult TargetOp::verifyRegions() {
2232 auto teamsOps = getOps<TeamsOp>();
2233 if (std::distance(teamsOps.begin(), teamsOps.end()) > 1)
2234 return emitError("target containing multiple 'omp.teams' nested ops");
2235
2236 // Check that host_eval values are only used in legal ways.
2237 Operation *capturedOp = getInnermostCapturedOmpOp();
2238 TargetRegionFlags execFlags = getKernelExecFlags(capturedOp);
2239 for (Value hostEvalArg :
2240 cast<BlockArgOpenMPOpInterface>(getOperation()).getHostEvalBlockArgs()) {
2241 for (Operation *user : hostEvalArg.getUsers()) {
2242 if (auto teamsOp = dyn_cast<TeamsOp>(user)) {
2243 if (llvm::is_contained({teamsOp.getNumTeamsLower(),
2244 teamsOp.getNumTeamsUpper(),
2245 teamsOp.getThreadLimit()},
2246 hostEvalArg))
2247 continue;
2248
2249 return emitOpError() << "host_eval argument only legal as 'num_teams' "
2250 "and 'thread_limit' in 'omp.teams'";
2251 }
2252 if (auto parallelOp = dyn_cast<ParallelOp>(user)) {
2253 if (bitEnumContainsAny(execFlags, TargetRegionFlags::spmd) &&
2254 parallelOp->isAncestor(capturedOp) &&
2255 hostEvalArg == parallelOp.getNumThreads())
2256 continue;
2257
2258 return emitOpError()
2259 << "host_eval argument only legal as 'num_threads' in "
2260 "'omp.parallel' when representing target SPMD";
2261 }
2262 if (auto loopNestOp = dyn_cast<LoopNestOp>(user)) {
2263 if (bitEnumContainsAny(execFlags, TargetRegionFlags::trip_count) &&
2264 loopNestOp.getOperation() == capturedOp &&
2265 (llvm::is_contained(loopNestOp.getLoopLowerBounds(), hostEvalArg) ||
2266 llvm::is_contained(loopNestOp.getLoopUpperBounds(), hostEvalArg) ||
2267 llvm::is_contained(loopNestOp.getLoopSteps(), hostEvalArg)))
2268 continue;
2269
2270 return emitOpError() << "host_eval argument only legal as loop bounds "
2271 "and steps in 'omp.loop_nest' when trip count "
2272 "must be evaluated in the host";
2273 }
2274
2275 return emitOpError() << "host_eval argument illegal use in '"
2276 << user->getName() << "' operation";
2277 }
2278 }
2279 return success();
2280}
2281
/// Walks the operations nested in `rootOp` in pre-order and returns the last
/// one recorded as captured, or null if none was recorded.
///
/// \param rootOp root of the walk; must not be null. It is never itself
///        recorded as captured.
/// \param checkSingleMandatoryExec when true, the walk is also interrupted at
///        an operation whose block can be reached again from its successors,
///        or whose block does not dominate every reachable block without
///        successors in its parent region.
/// \param siblingAllowedFn predicate called on every other operation of the
///        candidate's parent region; the walk is interrupted as soon as it
///        returns false for one of them.
2282static Operation *
2283findCapturedOmpOp(Operation *rootOp, bool checkSingleMandatoryExec,
2284 llvm::function_ref<bool(Operation *)> siblingAllowedFn) {
2285 assert(rootOp && "expected valid operation");
2286
2287 Dialect *ompDialect = rootOp->getDialect();
2288 Operation *capturedOp = nullptr;
2289 DominanceInfo domInfo;
2290
2291 // Process in pre-order to check operations from outermost to innermost,
2292 // ensuring we only enter the region of an operation if it meets the criteria
2293 // for being captured. We stop the exploration of nested operations as soon as
2294 // we process a region holding no operations to be captured.
2295 rootOp->walk<WalkOrder::PreOrder>([&](Operation *op) {
2296 if (op == rootOp)
2297 return WalkResult::advance();
2298
2299 // Ignore operations of other dialects or omp operations with no regions,
2300 // because these will only be checked if they are siblings of an omp
2301 // operation that can potentially be captured.
2302 bool isOmpDialect = op->getDialect() == ompDialect;
2303 bool hasRegions = op->getNumRegions() > 0;
2304 if (!isOmpDialect || !hasRegions)
2305 return WalkResult::skip();
2306
2307 // This operation cannot be captured if it can be executed more than once
2308 // (i.e. its block's successors can reach it) or if it's not guaranteed to
2309 // be executed before all exits of the region (i.e. it doesn't dominate all
2310 // blocks with no successors reachable from the entry block).
2311 if (checkSingleMandatoryExec) {
2312 Region *parentRegion = op->getParentRegion();
2313 Block *parentBlock = op->getBlock();
2314
2315 for (Block *successor : parentBlock->getSuccessors())
2316 if (successor->isReachable(parentBlock))
2317 return WalkResult::interrupt();
2318
2319 for (Block &block : *parentRegion)
2320 if (domInfo.isReachableFromEntry(&block) && block.hasNoSuccessors() &&
2321 !domInfo.dominates(parentBlock, &block))
2322 return WalkResult::interrupt();
2323 }
2324
2325 // Don't capture this op if it has a not-allowed sibling, and stop recursing
2326 // into nested operations.
2327 for (Operation &sibling : op->getParentRegion()->getOps())
2328 if (&sibling != op && !siblingAllowedFn(&sibling))
2329 return WalkResult::interrupt();
2330
2331 // Don't continue capturing nested operations if we reach an omp.loop_nest.
2332 // Otherwise, process the contents of this operation.
2333 capturedOp = op;
 // NOTE(review): the else-branch of the conditional below (source line 2335)
 // is absent from this listing -- confirm against the upstream file.
2334 return llvm::isa<LoopNestOp>(op) ? WalkResult::interrupt()
2336 });
2337
2338 return capturedOp;
2339}
2340
/// Returns the result of findCapturedOmpOp() on this target operation, run
/// with the single-mandatory-execution check enabled and the sibling filter
/// defined below.
2341Operation *TargetOp::getInnermostCapturedOmpOp() {
2342 auto *ompDialect = getContext()->getLoadedDialect<omp::OpenMPDialect>();
2343
2344 // Sibling filter: OpenMP ops are only allowed if they are terminators. Other
2345 // ops are allowed unless they report a write to an automatic allocation scope.
2346 return findCapturedOmpOp(
2347 *this, /*checkSingleMandatoryExec=*/true, [&](Operation *sibling) {
2348 if (!sibling)
2349 return false;
2350
2351 if (ompDialect == sibling->getDialect())
2352 return sibling->hasTrait<OpTrait::IsTerminator>();
2353
 // Ops implementing MemoryEffectOpInterface are rejected only when one of
 // their effects is a write on the automatic allocation scope resource.
 // NOTE(review): the type of `effects` (source line 2355) is absent from
 // this listing -- confirm against the upstream file.
2354 if (auto memOp = dyn_cast<MemoryEffectOpInterface>(sibling)) {
2356 effects;
2357 memOp.getEffects(effects);
2358 return !llvm::any_of(
2359 effects, [&](MemoryEffects::EffectInstance &effect) {
2360 return isa<MemoryEffects::Write>(effect.getEffect()) &&
2361 isa<SideEffects::AutomaticAllocationScopeResource>(
2362 effect.getResource());
2363 });
2364 }
 // Ops that do not implement the interface are allowed.
2365 return true;
2366 });
2367}
2368
2369/// Check if we can promote SPMD kernel to No-Loop kernel.
2370static bool canPromoteToNoLoop(Operation *capturedOp, TeamsOp teamsOp,
2371 WsloopOp *wsLoopOp) {
2372 // num_teams clause can break no-loop teams/threads assumption.
2373 if (teamsOp.getNumTeamsUpper())
2374 return false;
2375
2376 // Reduction kernels are slower in no-loop mode.
2377 if (teamsOp.getNumReductionVars())
2378 return false;
2379 if (wsLoopOp->getNumReductionVars())
2380 return false;
2381
2382 // Check if the user allows the promotion of kernels to no-loop mode.
2383 OffloadModuleInterface offloadMod =
2384 capturedOp->getParentOfType<omp::OffloadModuleInterface>();
2385 if (!offloadMod)
2386 return false;
2387 auto ompFlags = offloadMod.getFlags();
2388 if (!ompFlags)
2389 return false;
2390 return ompFlags.getAssumeTeamsOversubscription() &&
2391 ompFlags.getAssumeThreadsOversubscription();
2392}
2393
/// Computes the kernel execution flags for a target region from the operation
/// captured by getInnermostCapturedOmpOp().
///
/// Returns `generic` unless `capturedOp` is a LoopNestOp whose wrappers match
/// one of these nests directly inside the target op:
///  - teams / parallel / distribute / wsloop [/ simd]: `spmd | trip_count`,
///    plus `no_loop` when canPromoteToNoLoop() allows it;
///  - teams / loop: `spmd | trip_count`;
///  - teams / distribute [/ simd]: `generic | trip_count`, plus `spmd` when
///    the operation directly nested in `capturedOp` on the path to the nested
///    captured op is a ParallelOp;
///  - parallel / wsloop [/ simd]: `spmd`.
2394TargetRegionFlags TargetOp::getKernelExecFlags(Operation *capturedOp) {
2395 // A non-null captured op is only valid if it resides inside of a TargetOp
2396 // and is the result of calling getInnermostCapturedOmpOp() on it.
2397 TargetOp targetOp =
2398 capturedOp ? capturedOp->getParentOfType<TargetOp>() : nullptr;
2399 assert((!capturedOp ||
2400 (targetOp && targetOp.getInnermostCapturedOmpOp() == capturedOp)) &&
2401 "unexpected captured op");
2402
2403 // If it's not capturing a loop, it's a default target region.
2404 if (!isa_and_present<LoopNestOp>(capturedOp))
2405 return TargetRegionFlags::generic;
2406
2407 // Get the innermost non-simd loop wrapper.
 // NOTE(review): the declaration of `loopWrappers` (source line 2408) is
 // absent from this listing -- confirm against the upstream file.
2409 cast<LoopNestOp>(capturedOp).gatherWrappers(loopWrappers);
2410 assert(!loopWrappers.empty());
2411
2412 LoopWrapperInterface *innermostWrapper = loopWrappers.begin();
2413 if (isa<SimdOp>(innermostWrapper))
2414 innermostWrapper = std::next(innermostWrapper);
2415
 // Only one or two wrappers (not counting a skipped simd) can match below.
2416 auto numWrappers = std::distance(innermostWrapper, loopWrappers.end());
2417 if (numWrappers != 1 && numWrappers != 2)
2418 return TargetRegionFlags::generic;
2419
2420 // Detect target-teams-distribute-parallel-wsloop[-simd].
2421 if (numWrappers == 2) {
2422 WsloopOp *wsloopOp = dyn_cast<WsloopOp>(innermostWrapper);
2423 if (!wsloopOp)
2424 return TargetRegionFlags::generic;
2425
2426 innermostWrapper = std::next(innermostWrapper);
2427 if (!isa<DistributeOp>(innermostWrapper))
2428 return TargetRegionFlags::generic;
2429
2430 Operation *parallelOp = (*innermostWrapper)->getParentOp();
2431 if (!isa_and_present<ParallelOp>(parallelOp))
2432 return TargetRegionFlags::generic;
2433
2434 TeamsOp teamsOp = dyn_cast<TeamsOp>(parallelOp->getParentOp());
2435 if (!teamsOp)
2436 return TargetRegionFlags::generic;
2437
 // If the teams op is not directly nested in the target op, control falls
 // through to the final `generic` return.
2438 if (teamsOp->getParentOp() == targetOp.getOperation()) {
2439 TargetRegionFlags result =
2440 TargetRegionFlags::spmd | TargetRegionFlags::trip_count;
2441 if (canPromoteToNoLoop(capturedOp, teamsOp, wsloopOp))
2442 result = result | TargetRegionFlags::no_loop;
2443 return result;
2444 }
2445 }
2446 // Detect target-teams-distribute[-simd] and target-teams-loop.
2447 else if (isa<DistributeOp, LoopOp>(innermostWrapper)) {
2448 Operation *teamsOp = (*innermostWrapper)->getParentOp();
2449 if (!isa_and_present<TeamsOp>(teamsOp))
2450 return TargetRegionFlags::generic;
2451
2452 if (teamsOp->getParentOp() != targetOp.getOperation())
2453 return TargetRegionFlags::generic;
2454
2455 if (isa<LoopOp>(innermostWrapper))
2456 return TargetRegionFlags::spmd | TargetRegionFlags::trip_count;
2457
2458 // Find single immediately nested captured omp.parallel and add spmd flag
2459 // (generic-spmd case).
2460 //
2461 // TODO: This shouldn't have to be done here, as it is too easy to break.
2462 // The openmp-opt pass should be updated to be able to promote kernels like
2463 // this from "Generic" to "Generic-SPMD". However, the use of the
2464 // `kmpc_distribute_static_loop` family of functions produced by the
2465 // OMPIRBuilder for these kernels prevents that from working.
2466 Dialect *ompDialect = targetOp->getDialect();
2467 Operation *nestedCapture = findCapturedOmpOp(
2468 capturedOp, /*checkSingleMandatoryExec=*/false,
2469 [&](Operation *sibling) {
2470 return sibling && (ompDialect != sibling->getDialect() ||
2471 sibling->hasTrait<OpTrait::IsTerminator>());
2472 });
2473
2474 TargetRegionFlags result =
2475 TargetRegionFlags::generic | TargetRegionFlags::trip_count;
2476
2477 if (!nestedCapture)
2478 return result;
2479
 // Climb from the nested capture to the operation directly nested in
 // `capturedOp`.
2480 while (nestedCapture->getParentOp() != capturedOp)
2481 nestedCapture = nestedCapture->getParentOp();
2482
2483 return isa<ParallelOp>(nestedCapture) ? result | TargetRegionFlags::spmd
2484 : result;
2485 }
2486 // Detect target-parallel-wsloop[-simd].
2487 else if (isa<WsloopOp>(innermostWrapper)) {
2488 Operation *parallelOp = (*innermostWrapper)->getParentOp();
2489 if (!isa_and_present<ParallelOp>(parallelOp))
2490 return TargetRegionFlags::generic;
2491
2492 if (parallelOp->getParentOp() == targetOp.getOperation())
2493 return TargetRegionFlags::spmd;
2494 }
2495
2496 return TargetRegionFlags::generic;
2497}
2498
2499//===----------------------------------------------------------------------===//
2500// ParallelOp
2501//===----------------------------------------------------------------------===//
2502
/// Builds a ParallelOp with every clause operand empty and every clause
/// attribute null, then adds `attributes` to the operation state.
2503void ParallelOp::build(OpBuilder &builder, OperationState &state,
2504 ArrayRef<NamedAttribute> attributes) {
2505 ParallelOp::build(builder, state, /*allocate_vars=*/ValueRange(),
2506 /*allocator_vars=*/ValueRange(), /*if_expr=*/nullptr,
2507 /*num_threads=*/nullptr, /*private_vars=*/ValueRange(),
2508 /*private_syms=*/nullptr, /*private_needs_barrier=*/nullptr,
2509 /*proc_bind_kind=*/nullptr,
2510 /*reduction_mod =*/nullptr, /*reduction_vars=*/ValueRange(),
2511 /*reduction_byref=*/nullptr, /*reduction_syms=*/nullptr);
2512 state.addAttributes(attributes);
2513}
2514
/// Builds a ParallelOp from a ParallelOperands clause structure by forwarding
/// its fields to the overload taking individual arguments. The privateSyms and
/// reductionSyms lists are converted through makeArrayAttr and the
/// reductionByref list through makeDenseBoolArrayAttr.
2515void ParallelOp::build(OpBuilder &builder, OperationState &state,
2516 const ParallelOperands &clauses) {
2517 MLIRContext *ctx = builder.getContext();
2518 ParallelOp::build(builder, state, clauses.allocateVars, clauses.allocatorVars,
2519 clauses.ifExpr, clauses.numThreads, clauses.privateVars,
2520 makeArrayAttr(ctx, clauses.privateSyms),
2521 clauses.privateNeedsBarrier, clauses.procBindKind,
2522 clauses.reductionMod, clauses.reductionVars,
2523 makeDenseBoolArrayAttr(ctx, clauses.reductionByref),
2524 makeArrayAttr(ctx, clauses.reductionSyms));
2525}
2526
/// Verifies that the private variables of `op` agree with its privatizer
/// symbols: both lists must have the same length, every symbol must resolve
/// to a privatizer op, and each variable's type must equal the argument type
/// of its privatizer when that type is non-null.
2527template <typename OpType>
2528static LogicalResult verifyPrivateVarList(OpType &op) {
2529 auto privateVars = op.getPrivateVars();
2530 auto privateSyms = op.getPrivateSymsAttr();
2531
 // Nothing to verify when there are neither variables nor symbols.
2532 if (privateVars.empty() && (privateSyms == nullptr || privateSyms.empty()))
2533 return success();
2534
2535 auto numPrivateVars = privateVars.size();
2536 auto numPrivateSyms = (privateSyms == nullptr) ? 0 : privateSyms.size();
2537
2538 if (numPrivateVars != numPrivateSyms)
2539 return op.emitError() << "inconsistent number of private variables and "
2540 "privatizer op symbols, private vars: "
2541 << numPrivateVars
2542 << " vs. privatizer op symbols: " << numPrivateSyms;
2543
2544 for (auto privateVarInfo : llvm::zip_equal(privateVars, privateSyms)) {
2545 Type varType = std::get<0>(privateVarInfo).getType();
2546 SymbolRefAttr privateSym = cast<SymbolRefAttr>(std::get<1>(privateVarInfo));
 // NOTE(review): the initializer of `privatizerOp` (source line 2548) is
 // absent from this listing; it presumably looks the privatizer up by
 // `privateSym` -- confirm against the upstream file.
2547 PrivateClauseOp privatizerOp =
2549
2550 if (privatizerOp == nullptr)
2551 return op.emitError() << "failed to lookup privatizer op with symbol: '"
2552 << privateSym << "'";
2553
2554 Type privatizerType = privatizerOp.getArgType();
2555
 // The diagnostic names the clause kind according to the privatizer's
 // data sharing type.
2556 if (privatizerType && (varType != privatizerType))
2557 return op.emitError()
2558 << "type mismatch between a "
2559 << (privatizerOp.getDataSharingType() ==
2560 DataSharingClauseType::Private
2561 ? "private"
2562 : "firstprivate")
2563 << " variable and its privatizer op, var type: " << varType
2564 << " vs. privatizer op type: " << privatizerType;
2565 }
2566
2567 return success();
2568}
2569
2570LogicalResult ParallelOp::verify() {
2571 if (getAllocateVars().size() != getAllocatorVars().size())
2572 return emitError(
2573 "expected equal sizes for allocate and allocator variables");
2574
2575 if (failed(verifyPrivateVarList(*this)))
2576 return failure();
2577
2578 return verifyReductionVarList(*this, getReductionSyms(), getReductionVars(),
2579 getReductionByref());
2580}
2581
2582LogicalResult ParallelOp::verifyRegions() {
2583 auto distChildOps = getOps<DistributeOp>();
2584 int numDistChildOps = std::distance(distChildOps.begin(), distChildOps.end());
2585 if (numDistChildOps > 1)
2586 return emitError()
2587 << "multiple 'omp.distribute' nested inside of 'omp.parallel'";
2588
2589 if (numDistChildOps == 1) {
2590 if (!isComposite())
2591 return emitError()
2592 << "'omp.composite' attribute missing from composite operation";
2593
2594 auto *ompDialect = getContext()->getLoadedDialect<OpenMPDialect>();
2595 Operation &distributeOp = **distChildOps.begin();
2596 for (Operation &childOp : getOps()) {
2597 if (&childOp == &distributeOp || ompDialect != childOp.getDialect())
2598 continue;
2599
2600 if (!childOp.hasTrait<OpTrait::IsTerminator>())
2601 return emitError() << "unexpected OpenMP operation inside of composite "
2602 "'omp.parallel': "
2603 << childOp.getName();
2604 }
2605 } else if (isComposite()) {
2606 return emitError()
2607 << "'omp.composite' attribute present in non-composite operation";
2608 }
2609 return success();
2610}
2611
2612//===----------------------------------------------------------------------===//
2613// TeamsOp
2614//===----------------------------------------------------------------------===//
2615
 // NOTE(review): the signature of this function (source line 2616) is absent
 // from this listing -- confirm its name and parameters against the upstream
 // file.
 //
 // Walks up the ancestors of `op`: returns false as soon as one of them
 // belongs to the OpenMP dialect, and true when no ancestor does.
2617 while ((op = op->getParentOp()))
2618 if (isa<OpenMPDialect>(op->getDialect()))
2619 return false;
2620 return true;
2621}
2622
/// Builds a TeamsOp from a TeamsOperands clause structure by forwarding its
/// fields to the overload taking individual arguments. The reductionByref
/// list is converted through makeDenseBoolArrayAttr and the reductionSyms list
/// through makeArrayAttr. The private clause arguments are passed as
/// empty/null (see the TODO below).
2623void TeamsOp::build(OpBuilder &builder, OperationState &state,
2624 const TeamsOperands &clauses) {
2625 MLIRContext *ctx = builder.getContext();
2626 // TODO Store clauses in op: privateVars, privateSyms, privateNeedsBarrier
2627 TeamsOp::build(builder, state, clauses.allocateVars, clauses.allocatorVars,
2628 clauses.ifExpr, clauses.numTeamsLower, clauses.numTeamsUpper,
2629 /*private_vars=*/{}, /*private_syms=*/nullptr,
2630 /*private_needs_barrier=*/nullptr, clauses.reductionMod,
2631 clauses.reductionVars,
2632 makeDenseBoolArrayAttr(ctx, clauses.reductionByref),
2633 makeArrayAttr(ctx, clauses.reductionSyms),
2634 clauses.threadLimit);
2635}
2636
/// Verifies the nesting of this op, the num_teams bounds, the allocate clause
/// and the reduction clause, reporting the first violation found.
2637LogicalResult TeamsOp::verify() {
2638 // Check parent region
2639 // TODO If nested inside of a target region, also check that it does not
2640 // contain any statements, declarations or directives other than this
2641 // omp.teams construct. The issue is how to support the initialization of
2642 // this operation's own arguments (allow SSA values across omp.target?).
2643 Operation *op = getOperation();
 // NOTE(review): the second operand of the condition below (source line
 // 2645) is absent from this listing -- confirm against the upstream file.
2644 if (!isa<TargetOp>(op->getParentOp()) &&
2646 return emitError("expected to be nested inside of omp.target or not nested "
2647 "in any OpenMP dialect operations");
2648
2649 // Check for num_teams clause restrictions
 // A lower bound requires an upper bound of the same type.
2650 if (auto numTeamsLowerBound = getNumTeamsLower()) {
2651 auto numTeamsUpperBound = getNumTeamsUpper();
2652 if (!numTeamsUpperBound)
2653 return emitError("expected num_teams upper bound to be defined if the "
2654 "lower bound is defined");
2655 if (numTeamsLowerBound.getType() != numTeamsUpperBound.getType())
2656 return emitError(
2657 "expected num_teams upper bound and lower bound to be the same type");
2658 }
2659
2660 // Check for allocate clause restrictions
2661 if (getAllocateVars().size() != getAllocatorVars().size())
2662 return emitError(
2663 "expected equal sizes for allocate and allocator variables");
2664
2665 return verifyReductionVarList(*this, getReductionSyms(), getReductionVars(),
2666 getReductionByref());
2667}
2668
2669//===----------------------------------------------------------------------===//
2670// SectionOp
2671//===----------------------------------------------------------------------===//
2672
/// Returns the private variables of the parent operation.
2673OperandRange SectionOp::getPrivateVars() {
2674 return getParentOp().getPrivateVars();
2675}
2676
/// Returns the reduction variables of the parent operation.
2677OperandRange SectionOp::getReductionVars() {
2678 return getParentOp().getReductionVars();
2679}
2680
2681//===----------------------------------------------------------------------===//
2682// SectionsOp
2683//===----------------------------------------------------------------------===//
2684
/// Builds a SectionsOp from a SectionsOperands clause structure by forwarding
/// its fields to the overload taking individual arguments. The reductionByref
/// list is converted through makeDenseBoolArrayAttr and the reductionSyms list
/// through makeArrayAttr. The private clause arguments are passed as
/// empty/null (see the TODO below).
2685void SectionsOp::build(OpBuilder &builder, OperationState &state,
2686 const SectionsOperands &clauses) {
2687 MLIRContext *ctx = builder.getContext();
2688 // TODO Store clauses in op: privateVars, privateSyms, privateNeedsBarrier
2689 SectionsOp::build(builder, state, clauses.allocateVars, clauses.allocatorVars,
2690 clauses.nowait, /*private_vars=*/{},
2691 /*private_syms=*/nullptr, /*private_needs_barrier=*/nullptr,
2692 clauses.reductionMod, clauses.reductionVars,
2693 makeDenseBoolArrayAttr(ctx, clauses.reductionByref),
2694 makeArrayAttr(ctx, clauses.reductionSyms));
2695}
2696
2697LogicalResult SectionsOp::verify() {
2698 if (getAllocateVars().size() != getAllocatorVars().size())
2699 return emitError(
2700 "expected equal sizes for allocate and allocator variables");
2701
2702 return verifyReductionVarList(*this, getReductionSyms(), getReductionVars(),
2703 getReductionByref());
2704}
2705
2706LogicalResult SectionsOp::verifyRegions() {
2707 for (auto &inst : *getRegion().begin()) {
2708 if (!(isa<SectionOp>(inst) || isa<TerminatorOp>(inst))) {
2709 return emitOpError()
2710 << "expected omp.section op or terminator op inside region";
2711 }
2712 }
2713
2714 return success();
2715}
2716
2717//===----------------------------------------------------------------------===//
2718// SingleOp
2719//===----------------------------------------------------------------------===//
2720
2721void SingleOp::build(OpBuilder &builder, OperationState &state,
2722 const SingleOperands &clauses) {
2723 MLIRContext *ctx = builder.getContext();
2724 // TODO Store clauses in op: privateVars, privateSyms, privateNeedsBarrier
2725 SingleOp::build(builder, state, clauses.allocateVars, clauses.allocatorVars,
2726 clauses.copyprivateVars,
2727 makeArrayAttr(ctx, clauses.copyprivateSyms), clauses.nowait,
2728 /*private_vars=*/{}, /*private_syms=*/nullptr,
2729 /*private_needs_barrier=*/nullptr);
2730}
2731
2732LogicalResult SingleOp::verify() {
2733 // Check for allocate clause restrictions
2734 if (getAllocateVars().size() != getAllocatorVars().size())
2735 return emitError(
2736 "expected equal sizes for allocate and allocator variables");
2737
2738 return verifyCopyprivateVarList(*this, getCopyprivateVars(),
2739 getCopyprivateSyms());
2740}
2741
2742//===----------------------------------------------------------------------===//
2743// WorkshareOp
2744//===----------------------------------------------------------------------===//
2745
2746void WorkshareOp::build(OpBuilder &builder, OperationState &state,
2747 const WorkshareOperands &clauses) {
2748 WorkshareOp::build(builder, state, clauses.nowait);
2749}
2750
2751//===----------------------------------------------------------------------===//
2752// WorkshareLoopWrapperOp
2753//===----------------------------------------------------------------------===//
2754
2755LogicalResult WorkshareLoopWrapperOp::verify() {
2756 if (!(*this)->getParentOfType<WorkshareOp>())
2757 return emitOpError() << "must be nested in an omp.workshare";
2758 return success();
2759}
2760
2761LogicalResult WorkshareLoopWrapperOp::verifyRegions() {
2762 if (isa_and_nonnull<LoopWrapperInterface>((*this)->getParentOp()) ||
2763 getNestedWrapper())
2764 return emitOpError() << "expected to be a standalone loop wrapper";
2765
2766 return success();
2767}
2768
2769//===----------------------------------------------------------------------===//
2770// LoopWrapperInterface
2771//===----------------------------------------------------------------------===//
2772
2773LogicalResult LoopWrapperInterface::verifyImpl() {
2774 Operation *op = this->getOperation();
2775 if (!op->hasTrait<OpTrait::NoTerminator>() ||
2777 return emitOpError() << "loop wrapper must also have the `NoTerminator` "
2778 "and `SingleBlock` traits";
2779
2780 if (op->getNumRegions() != 1)
2781 return emitOpError() << "loop wrapper does not contain exactly one region";
2782
2783 Region &region = op->getRegion(0);
2784 if (range_size(region.getOps()) != 1)
2785 return emitOpError()
2786 << "loop wrapper does not contain exactly one nested op";
2787
2788 Operation &firstOp = *region.op_begin();
2789 if (!isa<LoopNestOp, LoopWrapperInterface>(firstOp))
2790 return emitOpError() << "nested in loop wrapper is not another loop "
2791 "wrapper or `omp.loop_nest`";
2792
2793 return success();
2794}
2795
2796//===----------------------------------------------------------------------===//
2797// LoopOp
2798//===----------------------------------------------------------------------===//
2799
2800void LoopOp::build(OpBuilder &builder, OperationState &state,
2801 const LoopOperands &clauses) {
2802 MLIRContext *ctx = builder.getContext();
2803
2804 LoopOp::build(builder, state, clauses.bindKind, clauses.privateVars,
2805 makeArrayAttr(ctx, clauses.privateSyms),
2806 clauses.privateNeedsBarrier, clauses.order, clauses.orderMod,
2807 clauses.reductionMod, clauses.reductionVars,
2808 makeDenseBoolArrayAttr(ctx, clauses.reductionByref),
2809 makeArrayAttr(ctx, clauses.reductionSyms));
2810}
2811
2812LogicalResult LoopOp::verify() {
2813 return verifyReductionVarList(*this, getReductionSyms(), getReductionVars(),
2814 getReductionByref());
2815}
2816
2817LogicalResult LoopOp::verifyRegions() {
2818 if (llvm::isa_and_nonnull<LoopWrapperInterface>((*this)->getParentOp()) ||
2819 getNestedWrapper())
2820 return emitOpError() << "expected to be a standalone loop wrapper";
2821
2822 return success();
2823}
2824
2825//===----------------------------------------------------------------------===//
2826// WsloopOp
2827//===----------------------------------------------------------------------===//
2828
2829void WsloopOp::build(OpBuilder &builder, OperationState &state,
2830 ArrayRef<NamedAttribute> attributes) {
2831 build(builder, state, /*allocate_vars=*/{}, /*allocator_vars=*/{},
2832 /*linear_vars=*/ValueRange(), /*linear_step_vars=*/ValueRange(),
2833 /*linear_var_types*/ nullptr,
2834 /*nowait=*/false, /*order=*/nullptr, /*order_mod=*/nullptr,
2835 /*ordered=*/nullptr, /*private_vars=*/{}, /*private_syms=*/nullptr,
2836 /*private_needs_barrier=*/false,
2837 /*reduction_mod=*/nullptr, /*reduction_vars=*/ValueRange(),
2838 /*reduction_byref=*/nullptr,
2839 /*reduction_syms=*/nullptr, /*schedule_kind=*/nullptr,
2840 /*schedule_chunk=*/nullptr, /*schedule_mod=*/nullptr,
2841 /*schedule_simd=*/false);
2842 state.addAttributes(attributes);
2843}
2844
2845void WsloopOp::build(OpBuilder &builder, OperationState &state,
2846 const WsloopOperands &clauses) {
2847 MLIRContext *ctx = builder.getContext();
2848 // TODO: Store clauses in op: allocateVars, allocatorVars
2849 WsloopOp::build(
2850 builder, state,
2851 /*allocate_vars=*/{}, /*allocator_vars=*/{}, clauses.linearVars,
2852 clauses.linearStepVars, clauses.linearVarTypes, clauses.nowait,
2853 clauses.order, clauses.orderMod, clauses.ordered, clauses.privateVars,
2854 makeArrayAttr(ctx, clauses.privateSyms), clauses.privateNeedsBarrier,
2855 clauses.reductionMod, clauses.reductionVars,
2856 makeDenseBoolArrayAttr(ctx, clauses.reductionByref),
2857 makeArrayAttr(ctx, clauses.reductionSyms), clauses.scheduleKind,
2858 clauses.scheduleChunk, clauses.scheduleMod, clauses.scheduleSimd);
2859}
2860
2861LogicalResult WsloopOp::verify() {
2862 return verifyReductionVarList(*this, getReductionSyms(), getReductionVars(),
2863 getReductionByref());
2864}
2865
2866LogicalResult WsloopOp::verifyRegions() {
2867 bool isCompositeChildLeaf =
2868 llvm::dyn_cast_if_present<LoopWrapperInterface>((*this)->getParentOp());
2869
2870 if (LoopWrapperInterface nested = getNestedWrapper()) {
2871 if (!isComposite())
2872 return emitError()
2873 << "'omp.composite' attribute missing from composite wrapper";
2874
2875 // Check for the allowed leaf constructs that may appear in a composite
2876 // construct directly after DO/FOR.
2877 if (!isa<SimdOp>(nested))
2878 return emitError() << "only supported nested wrapper is 'omp.simd'";
2879
2880 } else if (isComposite() && !isCompositeChildLeaf) {
2881 return emitError()
2882 << "'omp.composite' attribute present in non-composite wrapper";
2883 } else if (!isComposite() && isCompositeChildLeaf) {
2884 return emitError()
2885 << "'omp.composite' attribute missing from composite wrapper";
2886 }
2887
2888 return success();
2889}
2890
2891//===----------------------------------------------------------------------===//
2892// Simd construct [2.9.3.1]
2893//===----------------------------------------------------------------------===//
2894
2895void SimdOp::build(OpBuilder &builder, OperationState &state,
2896 const SimdOperands &clauses) {
2897 MLIRContext *ctx = builder.getContext();
2898 SimdOp::build(
2899 builder, state, clauses.alignedVars,
2900 makeArrayAttr(ctx, clauses.alignments), clauses.ifExpr,
2901 clauses.linearVars, clauses.linearStepVars, clauses.linearVarTypes,
2902 clauses.nontemporalVars, clauses.order, clauses.orderMod,
2903 clauses.privateVars, makeArrayAttr(ctx, clauses.privateSyms),
2904 clauses.privateNeedsBarrier, clauses.reductionMod, clauses.reductionVars,
2905 makeDenseBoolArrayAttr(ctx, clauses.reductionByref),
2906 makeArrayAttr(ctx, clauses.reductionSyms), clauses.safelen,
2907 clauses.simdlen);
2908}
2909
2910LogicalResult SimdOp::verify() {
2911 if (getSimdlen().has_value() && getSafelen().has_value() &&
2912 getSimdlen().value() > getSafelen().value())
2913 return emitOpError()
2914 << "simdlen clause and safelen clause are both present, but the "
2915 "simdlen value is not less than or equal to safelen value";
2916
2917 if (verifyAlignedClause(*this, getAlignments(), getAlignedVars()).failed())
2918 return failure();
2919
2920 if (verifyNontemporalClause(*this, getNontemporalVars()).failed())
2921 return failure();
2922
2923 bool isCompositeChildLeaf =
2924 llvm::dyn_cast_if_present<LoopWrapperInterface>((*this)->getParentOp());
2925
2926 if (!isComposite() && isCompositeChildLeaf)
2927 return emitError()
2928 << "'omp.composite' attribute missing from composite wrapper";
2929
2930 if (isComposite() && !isCompositeChildLeaf)
2931 return emitError()
2932 << "'omp.composite' attribute present in non-composite wrapper";
2933
2934 // Firstprivate is not allowed for SIMD in the standard. Check that none of
2935 // the private decls are for firstprivate.
2936 std::optional<ArrayAttr> privateSyms = getPrivateSyms();
2937 if (privateSyms) {
2938 for (const Attribute &sym : *privateSyms) {
2939 auto symRef = cast<SymbolRefAttr>(sym);
2940 omp::PrivateClauseOp privatizer =
2942 getOperation(), symRef);
2943 if (!privatizer)
2944 return emitError() << "Cannot find privatizer '" << symRef << "'";
2945 if (privatizer.getDataSharingType() ==
2946 DataSharingClauseType::FirstPrivate)
2947 return emitError() << "FIRSTPRIVATE cannot be used with SIMD";
2948 }
2949 }
2950
2951 return success();
2952}
2953
2954LogicalResult SimdOp::verifyRegions() {
2955 if (getNestedWrapper())
2956 return emitOpError() << "must wrap an 'omp.loop_nest' directly";
2957
2958 return success();
2959}
2960
2961//===----------------------------------------------------------------------===//
2962// Distribute construct [2.9.4.1]
2963//===----------------------------------------------------------------------===//
2964
2965void DistributeOp::build(OpBuilder &builder, OperationState &state,
2966 const DistributeOperands &clauses) {
2967 DistributeOp::build(builder, state, clauses.allocateVars,
2968 clauses.allocatorVars, clauses.distScheduleStatic,
2969 clauses.distScheduleChunkSize, clauses.order,
2970 clauses.orderMod, clauses.privateVars,
2971 makeArrayAttr(builder.getContext(), clauses.privateSyms),
2972 clauses.privateNeedsBarrier);
2973}
2974
2975LogicalResult DistributeOp::verify() {
2976 if (this->getDistScheduleChunkSize() && !this->getDistScheduleStatic())
2977 return emitOpError() << "chunk size set without "
2978 "dist_schedule_static being present";
2979
2980 if (getAllocateVars().size() != getAllocatorVars().size())
2981 return emitError(
2982 "expected equal sizes for allocate and allocator variables");
2983
2984 return success();
2985}
2986
2987LogicalResult DistributeOp::verifyRegions() {
2988 if (LoopWrapperInterface nested = getNestedWrapper()) {
2989 if (!isComposite())
2990 return emitError()
2991 << "'omp.composite' attribute missing from composite wrapper";
2992 // Check for the allowed leaf constructs that may appear in a composite
2993 // construct directly after DISTRIBUTE.
2994 if (isa<WsloopOp>(nested)) {
2995 Operation *parentOp = (*this)->getParentOp();
2996 if (!llvm::dyn_cast_if_present<ParallelOp>(parentOp) ||
2997 !cast<ComposableOpInterface>(parentOp).isComposite()) {
2998 return emitError() << "an 'omp.wsloop' nested wrapper is only allowed "
2999 "when a composite 'omp.parallel' is the direct "
3000 "parent";
3001 }
3002 } else if (!isa<SimdOp>(nested))
3003 return emitError() << "only supported nested wrappers are 'omp.simd' and "
3004 "'omp.wsloop'";
3005 } else if (isComposite()) {
3006 return emitError()
3007 << "'omp.composite' attribute present in non-composite wrapper";
3008 }
3009
3010 return success();
3011}
3012
3013//===----------------------------------------------------------------------===//
3014// DeclareMapperOp / DeclareMapperInfoOp
3015//===----------------------------------------------------------------------===//
3016
3017LogicalResult DeclareMapperInfoOp::verify() {
3018 return verifyMapClause(*this, getMapVars());
3019}
3020
3021LogicalResult DeclareMapperOp::verifyRegions() {
3022 if (!llvm::isa_and_present<DeclareMapperInfoOp>(
3023 getRegion().getBlocks().front().getTerminator()))
3024 return emitOpError() << "expected terminator to be a DeclareMapperInfoOp";
3025
3026 return success();
3027}
3028
3029//===----------------------------------------------------------------------===//
3030// DeclareReductionOp
3031//===----------------------------------------------------------------------===//
3032
3033LogicalResult DeclareReductionOp::verifyRegions() {
3034 if (!getAllocRegion().empty()) {
3035 for (YieldOp yieldOp : getAllocRegion().getOps<YieldOp>()) {
3036 if (yieldOp.getResults().size() != 1 ||
3037 yieldOp.getResults().getTypes()[0] != getType())
3038 return emitOpError() << "expects alloc region to yield a value "
3039 "of the reduction type";
3040 }
3041 }
3042
3043 if (getInitializerRegion().empty())
3044 return emitOpError() << "expects non-empty initializer region";
3045 Block &initializerEntryBlock = getInitializerRegion().front();
3046
3047 if (initializerEntryBlock.getNumArguments() == 1) {
3048 if (!getAllocRegion().empty())
3049 return emitOpError() << "expects two arguments to the initializer region "
3050 "when an allocation region is used";
3051 } else if (initializerEntryBlock.getNumArguments() == 2) {
3052 if (getAllocRegion().empty())
3053 return emitOpError() << "expects one argument to the initializer region "
3054 "when no allocation region is used";
3055 } else {
3056 return emitOpError()
3057 << "expects one or two arguments to the initializer region";
3058 }
3059
3060 for (mlir::Value arg : initializerEntryBlock.getArguments())
3061 if (arg.getType() != getType())
3062 return emitOpError() << "expects initializer region argument to match "
3063 "the reduction type";
3064
3065 for (YieldOp yieldOp : getInitializerRegion().getOps<YieldOp>()) {
3066 if (yieldOp.getResults().size() != 1 ||
3067 yieldOp.getResults().getTypes()[0] != getType())
3068 return emitOpError() << "expects initializer region to yield a value "
3069 "of the reduction type";
3070 }
3071
3072 if (getReductionRegion().empty())
3073 return emitOpError() << "expects non-empty reduction region";
3074 Block &reductionEntryBlock = getReductionRegion().front();
3075 if (reductionEntryBlock.getNumArguments() != 2 ||
3076 reductionEntryBlock.getArgumentTypes()[0] !=
3077 reductionEntryBlock.getArgumentTypes()[1] ||
3078 reductionEntryBlock.getArgumentTypes()[0] != getType())
3079 return emitOpError() << "expects reduction region with two arguments of "
3080 "the reduction type";
3081 for (YieldOp yieldOp : getReductionRegion().getOps<YieldOp>()) {
3082 if (yieldOp.getResults().size() != 1 ||
3083 yieldOp.getResults().getTypes()[0] != getType())
3084 return emitOpError() << "expects reduction region to yield a value "
3085 "of the reduction type";
3086 }
3087
3088 if (!getAtomicReductionRegion().empty()) {
3089 Block &atomicReductionEntryBlock = getAtomicReductionRegion().front();
3090 if (atomicReductionEntryBlock.getNumArguments() != 2 ||
3091 atomicReductionEntryBlock.getArgumentTypes()[0] !=
3092 atomicReductionEntryBlock.getArgumentTypes()[1])
3093 return emitOpError() << "expects atomic reduction region with two "
3094 "arguments of the same type";
3095 auto ptrType = llvm::dyn_cast<PointerLikeType>(
3096 atomicReductionEntryBlock.getArgumentTypes()[0]);
3097 if (!ptrType ||
3098 (ptrType.getElementType() && ptrType.getElementType() != getType()))
3099 return emitOpError() << "expects atomic reduction region arguments to "
3100 "be accumulators containing the reduction type";
3101 }
3102
3103 if (getCleanupRegion().empty())
3104 return success();
3105 Block &cleanupEntryBlock = getCleanupRegion().front();
3106 if (cleanupEntryBlock.getNumArguments() != 1 ||
3107 cleanupEntryBlock.getArgument(0).getType() != getType())
3108 return emitOpError() << "expects cleanup region with one argument "
3109 "of the reduction type";
3110
3111 return success();
3112}
3113
3114//===----------------------------------------------------------------------===//
3115// TaskOp
3116//===----------------------------------------------------------------------===//
3117
3118void TaskOp::build(OpBuilder &builder, OperationState &state,
3119 const TaskOperands &clauses) {
3120 MLIRContext *ctx = builder.getContext();
3121 TaskOp::build(builder, state, clauses.allocateVars, clauses.allocatorVars,
3122 makeArrayAttr(ctx, clauses.dependKinds), clauses.dependVars,
3123 clauses.final, clauses.ifExpr, clauses.inReductionVars,
3124 makeDenseBoolArrayAttr(ctx, clauses.inReductionByref),
3125 makeArrayAttr(ctx, clauses.inReductionSyms), clauses.mergeable,
3126 clauses.priority, /*private_vars=*/clauses.privateVars,
3127 /*private_syms=*/makeArrayAttr(ctx, clauses.privateSyms),
3128 clauses.privateNeedsBarrier, clauses.untied,
3129 clauses.eventHandle);
3130}
3131
3132LogicalResult TaskOp::verify() {
3133 LogicalResult verifyDependVars =
3134 verifyDependVarList(*this, getDependKinds(), getDependVars());
3135 return failed(verifyDependVars)
3136 ? verifyDependVars
3137 : verifyReductionVarList(*this, getInReductionSyms(),
3138 getInReductionVars(),
3139 getInReductionByref());
3140}
3141
3142//===----------------------------------------------------------------------===//
3143// TaskgroupOp
3144//===----------------------------------------------------------------------===//
3145
3146void TaskgroupOp::build(OpBuilder &builder, OperationState &state,
3147 const TaskgroupOperands &clauses) {
3148 MLIRContext *ctx = builder.getContext();
3149 TaskgroupOp::build(builder, state, clauses.allocateVars,
3150 clauses.allocatorVars, clauses.taskReductionVars,
3151 makeDenseBoolArrayAttr(ctx, clauses.taskReductionByref),
3152 makeArrayAttr(ctx, clauses.taskReductionSyms));
3153}
3154
3155LogicalResult TaskgroupOp::verify() {
3156 return verifyReductionVarList(*this, getTaskReductionSyms(),
3157 getTaskReductionVars(),
3158 getTaskReductionByref());
3159}
3160
3161//===----------------------------------------------------------------------===//
3162// TaskloopOp
3163//===----------------------------------------------------------------------===//
3164
3165void TaskloopOp::build(OpBuilder &builder, OperationState &state,
3166 const TaskloopOperands &clauses) {
3167 MLIRContext *ctx = builder.getContext();
3168 TaskloopOp::build(
3169 builder, state, clauses.allocateVars, clauses.allocatorVars,
3170 clauses.final, clauses.grainsizeMod, clauses.grainsize, clauses.ifExpr,
3171 clauses.inReductionVars,
3172 makeDenseBoolArrayAttr(ctx, clauses.inReductionByref),
3173 makeArrayAttr(ctx, clauses.inReductionSyms), clauses.mergeable,
3174 clauses.nogroup, clauses.numTasksMod, clauses.numTasks, clauses.priority,
3175 /*private_vars=*/clauses.privateVars,
3176 /*private_syms=*/makeArrayAttr(ctx, clauses.privateSyms),
3177 clauses.privateNeedsBarrier, clauses.reductionMod, clauses.reductionVars,
3178 makeDenseBoolArrayAttr(ctx, clauses.reductionByref),
3179 makeArrayAttr(ctx, clauses.reductionSyms), clauses.untied);
3180}
3181
3182LogicalResult TaskloopOp::verify() {
3183 if (getAllocateVars().size() != getAllocatorVars().size())
3184 return emitError(
3185 "expected equal sizes for allocate and allocator variables");
3186 if (failed(verifyReductionVarList(*this, getReductionSyms(),
3187 getReductionVars(), getReductionByref())) ||
3188 failed(verifyReductionVarList(*this, getInReductionSyms(),
3189 getInReductionVars(),
3190 getInReductionByref())))
3191 return failure();
3192
3193 if (!getReductionVars().empty() && getNogroup())
3194 return emitError("if a reduction clause is present on the taskloop "
3195 "directive, the nogroup clause must not be specified");
3196 for (auto var : getReductionVars()) {
3197 if (llvm::is_contained(getInReductionVars(), var))
3198 return emitError("the same list item cannot appear in both a reduction "
3199 "and an in_reduction clause");
3200 }
3201
3202 if (getGrainsize() && getNumTasks()) {
3203 return emitError(
3204 "the grainsize clause and num_tasks clause are mutually exclusive and "
3205 "may not appear on the same taskloop directive");
3206 }
3207
3208 return success();
3209}
3210
3211LogicalResult TaskloopOp::verifyRegions() {
3212 if (LoopWrapperInterface nested = getNestedWrapper()) {
3213 if (!isComposite())
3214 return emitError()
3215 << "'omp.composite' attribute missing from composite wrapper";
3216
3217 // Check for the allowed leaf constructs that may appear in a composite
3218 // construct directly after TASKLOOP.
3219 if (!isa<SimdOp>(nested))
3220 return emitError() << "only supported nested wrapper is 'omp.simd'";
3221 } else if (isComposite()) {
3222 return emitError()
3223 << "'omp.composite' attribute present in non-composite wrapper";
3224 }
3225
3226 return success();
3227}
3228
3229//===----------------------------------------------------------------------===//
3230// LoopNestOp
3231//===----------------------------------------------------------------------===//
3232
3233ParseResult LoopNestOp::parse(OpAsmParser &parser, OperationState &result) {
3234 // Parse an opening `(` followed by induction variables followed by `)`
3237 Type loopVarType;
3239 parser.parseColonType(loopVarType) ||
3240 // Parse loop bounds.
3241 parser.parseEqual() ||
3242 parser.parseOperandList(lbs, ivs.size(), OpAsmParser::Delimiter::Paren) ||
3243 parser.parseKeyword("to") ||
3244 parser.parseOperandList(ubs, ivs.size(), OpAsmParser::Delimiter::Paren))
3245 return failure();
3246
3247 for (auto &iv : ivs)
3248 iv.type = loopVarType;
3249
3250 auto *ctx = parser.getBuilder().getContext();
3251 // Parse "inclusive" flag.
3252 if (succeeded(parser.parseOptionalKeyword("inclusive")))
3253 result.addAttribute("loop_inclusive", UnitAttr::get(ctx));
3254
3255 // Parse step values.
3257 if (parser.parseKeyword("step") ||
3258 parser.parseOperandList(steps, ivs.size(), OpAsmParser::Delimiter::Paren))
3259 return failure();
3260
3261 // Parse collapse
3262 int64_t value = 0;
3263 if (!parser.parseOptionalKeyword("collapse") &&
3264 (parser.parseLParen() || parser.parseInteger(value) ||
3265 parser.parseRParen()))
3266 return failure();
3267 if (value > 1)
3268 result.addAttribute(
3269 "collapse_num_loops",
3270 IntegerAttr::get(parser.getBuilder().getI64Type(), value));
3271
3272 // Parse tiles
3274 auto parseTiles = [&]() -> ParseResult {
3275 int64_t tile;
3276 if (parser.parseInteger(tile))
3277 return failure();
3278 tiles.push_back(tile);
3279 return success();
3280 };
3281
3282 if (!parser.parseOptionalKeyword("tiles") &&
3283 (parser.parseLParen() || parser.parseCommaSeparatedList(parseTiles) ||
3284 parser.parseRParen()))
3285 return failure();
3286
3287 if (tiles.size() > 0)
3288 result.addAttribute("tile_sizes", DenseI64ArrayAttr::get(ctx, tiles));
3289
3290 // Parse the body.
3291 Region *region = result.addRegion();
3292 if (parser.parseRegion(*region, ivs))
3293 return failure();
3294
3295 // Resolve operands.
3296 if (parser.resolveOperands(lbs, loopVarType, result.operands) ||
3297 parser.resolveOperands(ubs, loopVarType, result.operands) ||
3298 parser.resolveOperands(steps, loopVarType, result.operands))
3299 return failure();
3300
3301 // Parse the optional attribute list.
3302 return parser.parseOptionalAttrDict(result.attributes);
3303}
3304
3305void LoopNestOp::print(OpAsmPrinter &p) {
3306 Region &region = getRegion();
3307 auto args = region.getArguments();
3308 p << " (" << args << ") : " << args[0].getType() << " = ("
3309 << getLoopLowerBounds() << ") to (" << getLoopUpperBounds() << ") ";
3310 if (getLoopInclusive())
3311 p << "inclusive ";
3312 p << "step (" << getLoopSteps() << ") ";
3313 if (int64_t numCollapse = getCollapseNumLoops())
3314 if (numCollapse > 1)
3315 p << "collapse(" << numCollapse << ") ";
3316
3317 if (const auto tiles = getTileSizes())
3318 p << "tiles(" << tiles.value() << ") ";
3319
3320 p.printRegion(region, /*printEntryBlockArgs=*/false);
3321}
3322
3323void LoopNestOp::build(OpBuilder &builder, OperationState &state,
3324 const LoopNestOperands &clauses) {
3325 MLIRContext *ctx = builder.getContext();
3326 LoopNestOp::build(builder, state, clauses.collapseNumLoops,
3327 clauses.loopLowerBounds, clauses.loopUpperBounds,
3328 clauses.loopSteps, clauses.loopInclusive,
3329 makeDenseI64ArrayAttr(ctx, clauses.tileSizes));
3330}
3331
3332LogicalResult LoopNestOp::verify() {
3333 if (getLoopLowerBounds().empty())
3334 return emitOpError() << "must represent at least one loop";
3335
3336 if (getLoopLowerBounds().size() != getIVs().size())
3337 return emitOpError() << "number of range arguments and IVs do not match";
3338
3339 for (auto [lb, iv] : llvm::zip_equal(getLoopLowerBounds(), getIVs())) {
3340 if (lb.getType() != iv.getType())
3341 return emitOpError()
3342 << "range argument type does not match corresponding IV type";
3343 }
3344
3345 uint64_t numIVs = getIVs().size();
3346
3347 if (const auto &numCollapse = getCollapseNumLoops())
3348 if (numCollapse > numIVs)
3349 return emitOpError()
3350 << "collapse value is larger than the number of loops";
3351
3352 if (const auto &tiles = getTileSizes())
3353 if (tiles.value().size() > numIVs)
3354 return emitOpError() << "too few canonical loops for tile dimensions";
3355
3356 if (!llvm::dyn_cast_if_present<LoopWrapperInterface>((*this)->getParentOp()))
3357 return emitOpError() << "expects parent op to be a loop wrapper";
3358
3359 return success();
3360}
3361
3362void LoopNestOp::gatherWrappers(
3364 Operation *parent = (*this)->getParentOp();
3365 while (auto wrapper =
3366 llvm::dyn_cast_if_present<LoopWrapperInterface>(parent)) {
3367 wrappers.push_back(wrapper);
3368 parent = parent->getParentOp();
3369 }
3370}
3371
3372//===----------------------------------------------------------------------===//
3373// OpenMP canonical loop handling
3374//===----------------------------------------------------------------------===//
3375
3376std::tuple<NewCliOp, OpOperand *, OpOperand *>
3377mlir::omp ::decodeCli(Value cli) {
3378
3379 // Defining a CLI for a generated loop is optional; if there is none then
3380 // there is no followup-tranformation
3381 if (!cli)
3382 return {{}, nullptr, nullptr};
3383
3384 assert(cli.getType() == CanonicalLoopInfoType::get(cli.getContext()) &&
3385 "Unexpected type of cli");
3386
3387 NewCliOp create = cast<NewCliOp>(cli.getDefiningOp());
3388 OpOperand *gen = nullptr;
3389 OpOperand *cons = nullptr;
3390 for (OpOperand &use : cli.getUses()) {
3391 auto op = cast<LoopTransformationInterface>(use.getOwner());
3392
3393 unsigned opnum = use.getOperandNumber();
3394 if (op.isGeneratee(opnum)) {
3395 assert(!gen && "Each CLI may have at most one def");
3396 gen = &use;
3397 } else if (op.isApplyee(opnum)) {
3398 assert(!cons && "Each CLI may have at most one consumer");
3399 cons = &use;
3400 } else {
3401 llvm_unreachable("Unexpected operand for a CLI");
3402 }
3403 }
3404
3405 return {create, gen, cons};
3406}
3407
3408void NewCliOp::build(::mlir::OpBuilder &odsBuilder,
3409 ::mlir::OperationState &odsState) {
3410 odsState.addTypes(CanonicalLoopInfoType::get(odsBuilder.getContext()));
3411}
3412
3413void NewCliOp::getAsmResultNames(OpAsmSetValueNameFn setNameFn) {
3414 Value result = getResult();
3415 auto [newCli, gen, cons] = decodeCli(result);
3416
3417 // Structured binding `gen` cannot be captured in lambdas before C++20
3418 OpOperand *generator = gen;
3419
3420 // Derive the CLI variable name from its generator:
3421 // * "canonloop" for omp.canonical_loop
3422 // * custom name for loop transformation generatees
3423 // * "cli" as fallback if no generator
3424 // * "_r<idx>" suffix for nested loops, where <idx> is the sequential order
3425 // at that level
3426 // * "_s<idx>" suffix for operations with multiple regions, where <idx> is
3427 // the index of that region
3428 std::string cliName{"cli"};
3429 if (gen) {
3430 cliName =
3432 .Case([&](CanonicalLoopOp op) {
3433 return generateLoopNestingName("canonloop", op);
3434 })
3435 .Case([&](UnrollHeuristicOp op) -> std::string {
3436 llvm_unreachable("heuristic unrolling does not generate a loop");
3437 })
3438 .Case([&](TileOp op) -> std::string {
3439 auto [generateesFirst, generateesCount] =
3440 op.getGenerateesODSOperandIndexAndLength();
3441 unsigned firstGrid = generateesFirst;
3442 unsigned firstIntratile = generateesFirst + generateesCount / 2;
3443 unsigned end = generateesFirst + generateesCount;
3444 unsigned opnum = generator->getOperandNumber();
3445 // In the OpenMP apply and looprange clauses, indices are 1-based
3446 if (firstGrid <= opnum && opnum < firstIntratile) {
3447 unsigned gridnum = opnum - firstGrid + 1;
3448 return ("grid" + Twine(gridnum)).str();
3449 }
3450 if (firstIntratile <= opnum && opnum < end) {
3451 unsigned intratilenum = opnum - firstIntratile + 1;
3452 return ("intratile" + Twine(intratilenum)).str();
3453 }
3454 llvm_unreachable("Unexpected generatee argument");
3455 })
3456 .DefaultUnreachable("TODO: Custom name for this operation");
3457 }
3458
3459 setNameFn(result, cliName);
3460}
3461
3462LogicalResult NewCliOp::verify() {
3463 Value cli = getResult();
3464
3465 assert(cli.getType() == CanonicalLoopInfoType::get(cli.getContext()) &&
3466 "Unexpected type of cli");
3467
3468 // Check that the CLI is used in at most generator and one consumer
3469 OpOperand *gen = nullptr;
3470 OpOperand *cons = nullptr;
3471 for (mlir::OpOperand &use : cli.getUses()) {
3472 auto op = cast<mlir::omp::LoopTransformationInterface>(use.getOwner());
3473
3474 unsigned opnum = use.getOperandNumber();
3475 if (op.isGeneratee(opnum)) {
3476 if (gen) {
3477 InFlightDiagnostic error =
3478 emitOpError("CLI must have at most one generator");
3479 error.attachNote(gen->getOwner()->getLoc())
3480 .append("first generator here:");
3481 error.attachNote(use.getOwner()->getLoc())
3482 .append("second generator here:");
3483 return error;
3484 }
3485
3486 gen = &use;
3487 } else if (op.isApplyee(opnum)) {
3488 if (cons) {
3489 InFlightDiagnostic error =
3490 emitOpError("CLI must have at most one consumer");
3491 error.attachNote(cons->getOwner()->getLoc())
3492 .append("first consumer here:")
3493 .appendOp(*cons->getOwner(),
3494 OpPrintingFlags().printGenericOpForm());
3495 error.attachNote(use.getOwner()->getLoc())
3496 .append("second consumer here:")
3497 .appendOp(*use.getOwner(), OpPrintingFlags().printGenericOpForm());
3498 return error;
3499 }
3500
3501 cons = &use;
3502 } else {
3503 llvm_unreachable("Unexpected operand for a CLI");
3504 }
3505 }
3506
3507 // If the CLI is source of a transformation, it must have a generator
3508 if (cons && !gen) {
3509 InFlightDiagnostic error = emitOpError("CLI has no generator");
3510 error.attachNote(cons->getOwner()->getLoc())
3511 .append("see consumer here: ")
3512 .appendOp(*cons->getOwner(), OpPrintingFlags().printGenericOpForm());
3513 return error;
3514 }
3515
3516 return success();
3517}
3518
3519void CanonicalLoopOp::build(OpBuilder &odsBuilder, OperationState &odsState,
3520 Value tripCount) {
3521 odsState.addOperands(tripCount);
3522 odsState.addOperands(Value());
3523 (void)odsState.addRegion();
3524}
3525
3526void CanonicalLoopOp::build(OpBuilder &odsBuilder, OperationState &odsState,
3527 Value tripCount, ::mlir::Value cli) {
3528 odsState.addOperands(tripCount);
3529 odsState.addOperands(cli);
3530 (void)odsState.addRegion();
3531}
3532
3533void CanonicalLoopOp::getAsmBlockNames(OpAsmSetBlockNameFn setNameFn) {
3534 setNameFn(&getRegion().front(), "body_entry");
3535}
3536
3537void CanonicalLoopOp::getAsmBlockArgumentNames(Region &region,
3538 OpAsmSetValueNameFn setNameFn) {
3539 std::string ivName = generateLoopNestingName("iv", *this);
3540 setNameFn(region.getArgument(0), ivName);
3541}
3542
3543void CanonicalLoopOp::print(OpAsmPrinter &p) {
3544 if (getCli())
3545 p << '(' << getCli() << ')';
3546 p << ' ' << getInductionVar() << " : " << getInductionVar().getType()
3547 << " in range(" << getTripCount() << ") ";
3548
3549 p.printRegion(getRegion(), /*printEntryBlockArgs=*/false,
3550 /*printBlockTerminators=*/true);
3551
3552 p.printOptionalAttrDict((*this)->getAttrs());
3553}
3554
/// Parses the custom assembly form of omp.canonical_loop: an optional
/// parenthesized CLI operand, the typed induction variable, the
/// `in range(<tripcount>)` clause, the body region and an optional attribute
/// dictionary. Returns failure as soon as any component fails to parse.
// NOTE(review): this listing is missing some lines of the function (the end of
// the signature and the declarations of `cli` and `tripcount`); confirm
// against the real source file.
3555mlir::ParseResult CanonicalLoopOp::parse(::mlir::OpAsmParser &parser,
3557 CanonicalLoopInfoType cliType =
3558 CanonicalLoopInfoType::get(parser.getContext());
3559
3560 // Parse the (optional) omp.cli identifier.
3562 SmallVector<mlir::Value, 1> cliOperand;
3563 if (!parser.parseOptionalLParen()) {
3564 if (parser.parseOperand(cli) ||
3565 parser.resolveOperand(cli, cliType, cliOperand) || parser.parseRParen())
3566 return failure();
3567 }
3568
3569 // We derive the type of tripCount from inductionVariable. MLIR requires the
3570 // type of tripCount to be known when calling resolveOperand, so we have to
3571 // parse the type before processing the inductionVariable.
3572 OpAsmParser::Argument inductionVariable;
3574 if (parser.parseArgument(inductionVariable, /*allowType*/ true) ||
3575 parser.parseKeyword("in") || parser.parseKeyword("range") ||
3576 parser.parseLParen() || parser.parseOperand(tripcount) ||
3577 parser.parseRParen() ||
3578 parser.resolveOperand(tripcount, inductionVariable.type, result.operands))
3579 return failure();
3580
3581 // Parse the loop body.
3582 Region *region = result.addRegion();
3583 if (parser.parseRegion(*region, {inductionVariable}))
3584 return failure();
3585
3586 // We parsed the cli operand first, but because it is optional, it must be
3587 // last in the operand list.
3588 result.operands.append(cliOperand);
3589
3590 // Parse the optional attribute list.
3591 if (parser.parseOptionalAttrDict(result.attributes))
3592 return failure();
3593
3594 return mlir::success();
3595}
3596
3597LogicalResult CanonicalLoopOp::verify() {
3598 // The region's entry must accept the induction variable
3599 // It can also be empty if just created
3600 if (!getRegion().empty()) {
3601 Region &region = getRegion();
3602 if (region.getNumArguments() != 1)
3603 return emitOpError(
3604 "Canonical loop region must have exactly one argument");
3605
3606 if (getInductionVar().getType() != getTripCount().getType())
3607 return emitOpError(
3608 "Region argument must be the same type as the trip count");
3609 }
3610
3611 return success();
3612}
3613
3614Value CanonicalLoopOp::getInductionVar() { return getRegion().getArgument(0); }
3615
3616std::pair<unsigned, unsigned>
3617CanonicalLoopOp::getApplyeesODSOperandIndexAndLength() {
3618 // No applyees
3619 return {0, 0};
3620}
3621
3622std::pair<unsigned, unsigned>
3623CanonicalLoopOp::getGenerateesODSOperandIndexAndLength() {
3624 return getODSOperandIndexAndLength(odsIndex_cli);
3625}
3626
3627//===----------------------------------------------------------------------===//
3628// UnrollHeuristicOp
3629//===----------------------------------------------------------------------===//
3630
3631void UnrollHeuristicOp::build(::mlir::OpBuilder &odsBuilder,
3632 ::mlir::OperationState &odsState,
3633 ::mlir::Value cli) {
3634 odsState.addOperands(cli);
3635}
3636
3637void UnrollHeuristicOp::print(OpAsmPrinter &p) {
3638 p << '(' << getApplyee() << ')';
3639
3640 p.printOptionalAttrDict((*this)->getAttrs());
3641}
3642
/// Parses `(` applyee `)`, an optional `-> ()` denoting an empty list of
/// generated loops, and an optional attribute dictionary. The applyee is
/// resolved with the CLI type and appended to the result operands.
// NOTE(review): this listing is missing some lines of the function (the end of
// the signature and the declaration of `applyee`); confirm against the real
// source file.
3643mlir::ParseResult UnrollHeuristicOp::parse(::mlir::OpAsmParser &parser,
3645 auto cliType = CanonicalLoopInfoType::get(parser.getContext());
3646
3647 if (parser.parseLParen())
3648 return failure();
3649
3651 if (parser.parseOperand(applyee) ||
3652 parser.resolveOperand(applyee, cliType, result.operands))
3653 return failure();
3654
3655 if (parser.parseRParen())
3656 return failure();
3657
3658 // Optional output loop (full unrolling has none)
3659 if (!parser.parseOptionalArrow()) {
3660 if (parser.parseLParen() || parser.parseRParen())
3661 return failure();
3662 }
3663
3664 // Parse the optional attribute list.
3665 if (parser.parseOptionalAttrDict(result.attributes))
3666 return failure();
3667
3668 return mlir::success();
3669}
3670
3671std::pair<unsigned, unsigned>
3672UnrollHeuristicOp ::getApplyeesODSOperandIndexAndLength() {
3673 return getODSOperandIndexAndLength(odsIndex_applyee);
3674}
3675
3676std::pair<unsigned, unsigned>
3677UnrollHeuristicOp::getGenerateesODSOperandIndexAndLength() {
3678 return {0, 0};
3679}
3680
3681//===----------------------------------------------------------------------===//
3682// TileOp
3683//===----------------------------------------------------------------------===//
3684
3685static void printLoopTransformClis(OpAsmPrinter &p, TileOp op,
3686 OperandRange generatees,
3687 OperandRange applyees) {
3688 if (!generatees.empty())
3689 p << '(' << llvm::interleaved(generatees) << ')';
3690
3691 if (!applyees.empty())
3692 p << " <- (" << llvm::interleaved(applyees) << ')';
3693}
3694
/// Parses the CLI lists of a loop transformation: an optional generatee list,
/// the `<-` token, and the applyee list. When the input does not start with
/// `<`, a generatee operand list is parsed first.
// NOTE(review): this listing is missing some lines of the function (the
// remaining parameters and the trailing arguments of both parseOperandList
// calls); confirm against the real source file.
3695static ParseResult parseLoopTransformClis(
3696 OpAsmParser &parser,
3699 if (parser.parseOptionalLess()) {
3700 // Syntax 1: generatees present
3701
3702 if (parser.parseOperandList(generateesOperands,
3704 return failure();
3705
3706 if (parser.parseLess())
3707 return failure();
3708 } else {
3709 // Syntax 2: generatees omitted
3710 }
3711
3712 // Parse `<-` (`<` has already been parsed)
3713 if (parser.parseMinus())
3714 return failure();
3715
3716 if (parser.parseOperandList(applyeesOperands,
3718 return failure();
3719
3720 return success();
3721}
3722
3723LogicalResult TileOp::verify() {
3724 if (getApplyees().empty())
3725 return emitOpError() << "must apply to at least one loop";
3726
3727 if (getSizes().size() != getApplyees().size())
3728 return emitOpError() << "there must be one tile size for each applyee";
3729
3730 if (!getGeneratees().empty() &&
3731 2 * getSizes().size() != getGeneratees().size())
3732 return emitOpError()
3733 << "expecting two times the number of generatees than applyees";
3734
3735 DenseSet<Value> parentIVs;
3736
3737 Value parent = getApplyees().front();
3738 for (auto &&applyee : llvm::drop_begin(getApplyees())) {
3739 auto [parentCreate, parentGen, parentCons] = decodeCli(parent);
3740 auto [create, gen, cons] = decodeCli(applyee);
3741
3742 if (!parentGen)
3743 return emitOpError() << "applyee CLI has no generator";
3744
3745 auto parentLoop = dyn_cast_or_null<CanonicalLoopOp>(parentGen->getOwner());
3746 if (!parentGen)
3747 return emitOpError()
3748 << "currently only supports omp.canonical_loop as applyee";
3749
3750 parentIVs.insert(parentLoop.getInductionVar());
3751
3752 if (!gen)
3753 return emitOpError() << "applyee CLI has no generator";
3754 auto loop = dyn_cast_or_null<CanonicalLoopOp>(gen->getOwner());
3755 if (!loop)
3756 return emitOpError()
3757 << "currently only supports omp.canonical_loop as applyee";
3758
3759 // Canonical loop must be perfectly nested, i.e. the body of the parent must
3760 // only contain the omp.canonical_loop of the nested loops, and
3761 // omp.terminator
3762 bool isPerfectlyNested = [&]() {
3763 auto &parentBody = parentLoop.getRegion();
3764 if (!parentBody.hasOneBlock())
3765 return false;
3766 auto &parentBlock = parentBody.getBlocks().front();
3767
3768 auto nestedLoopIt = parentBlock.begin();
3769 if (nestedLoopIt == parentBlock.end() ||
3770 (&*nestedLoopIt != loop.getOperation()))
3771 return false;
3772
3773 auto termIt = std::next(nestedLoopIt);
3774 if (termIt == parentBlock.end() || !isa<TerminatorOp>(termIt))
3775 return false;
3776
3777 if (std::next(termIt) != parentBlock.end())
3778 return false;
3779
3780 return true;
3781 }();
3782 if (!isPerfectlyNested)
3783 return emitOpError() << "tiled loop nest must be perfectly nested";
3784
3785 if (parentIVs.contains(loop.getTripCount()))
3786 return emitOpError() << "tiled loop nest must be rectangular";
3787
3788 parent = applyee;
3789 }
3790
3791 // TODO: The tile sizes must be computed before the loop, but checking this
3792 // requires dominance analysis. For instance:
3793 //
3794 // %canonloop = omp.new_cli
3795 // omp.canonical_loop(%canonloop) %iv : i32 in range(%tc) {
3796 // // write to %x
3797 // omp.terminator
3798 // }
3799 // %ts = llvm.load %x
3800 // omp.tile <- (%canonloop) sizes(%ts : i32)
3801
3802 return success();
3803}
3804
3805std::pair<unsigned, unsigned> TileOp ::getApplyeesODSOperandIndexAndLength() {
3806 return getODSOperandIndexAndLength(odsIndex_applyees);
3807}
3808
3809std::pair<unsigned, unsigned> TileOp::getGenerateesODSOperandIndexAndLength() {
3810 return getODSOperandIndexAndLength(odsIndex_generatees);
3811}
3812
3813//===----------------------------------------------------------------------===//
3814// Critical construct (2.17.1)
3815//===----------------------------------------------------------------------===//
3816
3817void CriticalDeclareOp::build(OpBuilder &builder, OperationState &state,
3818 const CriticalDeclareOperands &clauses) {
3819 CriticalDeclareOp::build(builder, state, clauses.symName, clauses.hint);
3820}
3821
3822LogicalResult CriticalDeclareOp::verify() {
3823 return verifySynchronizationHint(*this, getHint());
3824}
3825
3826LogicalResult CriticalOp::verifySymbolUses(SymbolTableCollection &symbolTable) {
3827 if (getNameAttr()) {
3828 SymbolRefAttr symbolRef = getNameAttr();
3829 auto decl = symbolTable.lookupNearestSymbolFrom<CriticalDeclareOp>(
3830 *this, symbolRef);
3831 if (!decl) {
3832 return emitOpError() << "expected symbol reference " << symbolRef
3833 << " to point to a critical declaration";
3834 }
3835 }
3836
3837 return success();
3838}
3839
3840//===----------------------------------------------------------------------===//
3841// Ordered construct
3842//===----------------------------------------------------------------------===//
3843
3844static LogicalResult verifyOrderedParent(Operation &op) {
3845 bool hasRegion = op.getNumRegions() > 0;
3846 auto loopOp = op.getParentOfType<LoopNestOp>();
3847 if (!loopOp) {
3848 if (hasRegion)
3849 return success();
3850
3851 // TODO: Consider if this needs to be the case only for the standalone
3852 // variant of the ordered construct.
3853 return op.emitOpError() << "must be nested inside of a loop";
3854 }
3855
3856 Operation *wrapper = loopOp->getParentOp();
3857 if (auto wsloopOp = dyn_cast<WsloopOp>(wrapper)) {
3858 IntegerAttr orderedAttr = wsloopOp.getOrderedAttr();
3859 if (!orderedAttr)
3860 return op.emitOpError() << "the enclosing worksharing-loop region must "
3861 "have an ordered clause";
3862
3863 if (hasRegion && orderedAttr.getInt() != 0)
3864 return op.emitOpError() << "the enclosing loop's ordered clause must not "
3865 "have a parameter present";
3866
3867 if (!hasRegion && orderedAttr.getInt() == 0)
3868 return op.emitOpError() << "the enclosing loop's ordered clause must "
3869 "have a parameter present";
3870 } else if (!isa<SimdOp>(wrapper)) {
3871 return op.emitOpError() << "must be nested inside of a worksharing, simd "
3872 "or worksharing simd loop";
3873 }
3874 return success();
3875}
3876
3877void OrderedOp::build(OpBuilder &builder, OperationState &state,
3878 const OrderedOperands &clauses) {
3879 OrderedOp::build(builder, state, clauses.doacrossDependType,
3880 clauses.doacrossNumLoops, clauses.doacrossDependVars);
3881}
3882
3883LogicalResult OrderedOp::verify() {
3884 if (failed(verifyOrderedParent(**this)))
3885 return failure();
3886
3887 auto wrapper = (*this)->getParentOfType<WsloopOp>();
3888 if (!wrapper || *wrapper.getOrdered() != *getDoacrossNumLoops())
3889 return emitOpError() << "number of variables in depend clause does not "
3890 << "match number of iteration variables in the "
3891 << "doacross loop";
3892
3893 return success();
3894}
3895
3896void OrderedRegionOp::build(OpBuilder &builder, OperationState &state,
3897 const OrderedRegionOperands &clauses) {
3898 OrderedRegionOp::build(builder, state, clauses.parLevelSimd);
3899}
3900
3901LogicalResult OrderedRegionOp::verify() { return verifyOrderedParent(**this); }
3902
3903//===----------------------------------------------------------------------===//
3904// TaskwaitOp
3905//===----------------------------------------------------------------------===//
3906
3907void TaskwaitOp::build(OpBuilder &builder, OperationState &state,
3908 const TaskwaitOperands &clauses) {
3909 // TODO Store clauses in op: dependKinds, dependVars, nowait.
3910 TaskwaitOp::build(builder, state, /*depend_kinds=*/nullptr,
3911 /*depend_vars=*/{}, /*nowait=*/nullptr);
3912}
3913
3914//===----------------------------------------------------------------------===//
3915// Verifier for AtomicReadOp
3916//===----------------------------------------------------------------------===//
3917
3918LogicalResult AtomicReadOp::verify() {
3919 if (verifyCommon().failed())
3920 return mlir::failure();
3921
3922 if (auto mo = getMemoryOrder()) {
3923 if (*mo == ClauseMemoryOrderKind::Acq_rel ||
3924 *mo == ClauseMemoryOrderKind::Release) {
3925 return emitError(
3926 "memory-order must not be acq_rel or release for atomic reads");
3927 }
3928 }
3929 return verifySynchronizationHint(*this, getHint());
3930}
3931
3932//===----------------------------------------------------------------------===//
3933// Verifier for AtomicWriteOp
3934//===----------------------------------------------------------------------===//
3935
3936LogicalResult AtomicWriteOp::verify() {
3937 if (verifyCommon().failed())
3938 return mlir::failure();
3939
3940 if (auto mo = getMemoryOrder()) {
3941 if (*mo == ClauseMemoryOrderKind::Acq_rel ||
3942 *mo == ClauseMemoryOrderKind::Acquire) {
3943 return emitError(
3944 "memory-order must not be acq_rel or acquire for atomic writes");
3945 }
3946 }
3947 return verifySynchronizationHint(*this, getHint());
3948}
3949
3950//===----------------------------------------------------------------------===//
3951// Verifier for AtomicUpdateOp
3952//===----------------------------------------------------------------------===//
3953
3954LogicalResult AtomicUpdateOp::canonicalize(AtomicUpdateOp op,
3955 PatternRewriter &rewriter) {
3956 if (op.isNoOp()) {
3957 rewriter.eraseOp(op);
3958 return success();
3959 }
3960 if (Value writeVal = op.getWriteOpVal()) {
3961 rewriter.replaceOpWithNewOp<AtomicWriteOp>(
3962 op, op.getX(), writeVal, op.getHintAttr(), op.getMemoryOrderAttr());
3963 return success();
3964 }
3965 return failure();
3966}
3967
3968LogicalResult AtomicUpdateOp::verify() {
3969 if (verifyCommon().failed())
3970 return mlir::failure();
3971
3972 if (auto mo = getMemoryOrder()) {
3973 if (*mo == ClauseMemoryOrderKind::Acq_rel ||
3974 *mo == ClauseMemoryOrderKind::Acquire) {
3975 return emitError(
3976 "memory-order must not be acq_rel or acquire for atomic updates");
3977 }
3978 }
3979
3980 return verifySynchronizationHint(*this, getHint());
3981}
3982
3983LogicalResult AtomicUpdateOp::verifyRegions() { return verifyRegionsCommon(); }
3984
3985//===----------------------------------------------------------------------===//
3986// Verifier for AtomicCaptureOp
3987//===----------------------------------------------------------------------===//
3988
3989AtomicReadOp AtomicCaptureOp::getAtomicReadOp() {
3990 if (auto op = dyn_cast<AtomicReadOp>(getFirstOp()))
3991 return op;
3992 return dyn_cast<AtomicReadOp>(getSecondOp());
3993}
3994
3995AtomicWriteOp AtomicCaptureOp::getAtomicWriteOp() {
3996 if (auto op = dyn_cast<AtomicWriteOp>(getFirstOp()))
3997 return op;
3998 return dyn_cast<AtomicWriteOp>(getSecondOp());
3999}
4000
4001AtomicUpdateOp AtomicCaptureOp::getAtomicUpdateOp() {
4002 if (auto op = dyn_cast<AtomicUpdateOp>(getFirstOp()))
4003 return op;
4004 return dyn_cast<AtomicUpdateOp>(getSecondOp());
4005}
4006
4007LogicalResult AtomicCaptureOp::verify() {
4008 return verifySynchronizationHint(*this, getHint());
4009}
4010
4011LogicalResult AtomicCaptureOp::verifyRegions() {
4012 if (verifyRegionsCommon().failed())
4013 return mlir::failure();
4014
4015 if (getFirstOp()->getAttr("hint") || getSecondOp()->getAttr("hint"))
4016 return emitOpError(
4017 "operations inside capture region must not have hint clause");
4018
4019 if (getFirstOp()->getAttr("memory_order") ||
4020 getSecondOp()->getAttr("memory_order"))
4021 return emitOpError(
4022 "operations inside capture region must not have memory_order clause");
4023 return success();
4024}
4025
4026//===----------------------------------------------------------------------===//
4027// CancelOp
4028//===----------------------------------------------------------------------===//
4029
4030void CancelOp::build(OpBuilder &builder, OperationState &state,
4031 const CancelOperands &clauses) {
4032 CancelOp::build(builder, state, clauses.cancelDirective, clauses.ifExpr);
4033}
4034
// NOTE(review): the signature line of this helper is missing from this
// listing; the verifiers below call it as `getParentInSameDialect(op)`.
// Walks up the chain of parent operations of `thisOp` and returns the first
// ancestor that belongs to the same dialect as `thisOp`, or nullptr if there
// is none.
4036 Operation *parent = thisOp->getParentOp();
4037 while (parent) {
4038 if (parent->getDialect() == thisOp->getDialect())
4039 return parent;
4040 parent = parent->getParentOp();
4041 }
4042 return nullptr;
4043}
4044
4045LogicalResult CancelOp::verify() {
4046 ClauseCancellationConstructType cct = getCancelDirective();
4047 // The next OpenMP operation in the chain of parents
4048 Operation *structuralParent = getParentInSameDialect((*this).getOperation());
4049 if (!structuralParent)
4050 return emitOpError() << "Orphaned cancel construct";
4051
4052 if ((cct == ClauseCancellationConstructType::Parallel) &&
4053 !mlir::isa<ParallelOp>(structuralParent)) {
4054 return emitOpError() << "cancel parallel must appear "
4055 << "inside a parallel region";
4056 }
4057 if (cct == ClauseCancellationConstructType::Loop) {
4058 // structural parent will be omp.loop_nest, directly nested inside
4059 // omp.wsloop
4060 auto wsloopOp = mlir::dyn_cast<WsloopOp>(structuralParent->getParentOp());
4061
4062 if (!wsloopOp) {
4063 return emitOpError()
4064 << "cancel loop must appear inside a worksharing-loop region";
4065 }
4066 if (wsloopOp.getNowaitAttr()) {
4067 return emitError() << "A worksharing construct that is canceled "
4068 << "must not have a nowait clause";
4069 }
4070 if (wsloopOp.getOrderedAttr()) {
4071 return emitError() << "A worksharing construct that is canceled "
4072 << "must not have an ordered clause";
4073 }
4074
4075 } else if (cct == ClauseCancellationConstructType::Sections) {
4076 // structural parent will be an omp.section, directly nested inside
4077 // omp.sections
4078 auto sectionsOp =
4079 mlir::dyn_cast<SectionsOp>(structuralParent->getParentOp());
4080 if (!sectionsOp) {
4081 return emitOpError() << "cancel sections must appear "
4082 << "inside a sections region";
4083 }
4084 if (sectionsOp.getNowait()) {
4085 return emitError() << "A sections construct that is canceled "
4086 << "must not have a nowait clause";
4087 }
4088 }
4089 if ((cct == ClauseCancellationConstructType::Taskgroup) &&
4090 (!mlir::isa<omp::TaskOp>(structuralParent) &&
4091 !mlir::isa<omp::TaskloopOp>(structuralParent->getParentOp()))) {
4092 return emitOpError() << "cancel taskgroup must appear "
4093 << "inside a task region";
4094 }
4095 return success();
4096}
4097
4098//===----------------------------------------------------------------------===//
4099// CancellationPointOp
4100//===----------------------------------------------------------------------===//
4101
4102void CancellationPointOp::build(OpBuilder &builder, OperationState &state,
4103 const CancellationPointOperands &clauses) {
4104 CancellationPointOp::build(builder, state, clauses.cancelDirective);
4105}
4106
4107LogicalResult CancellationPointOp::verify() {
4108 ClauseCancellationConstructType cct = getCancelDirective();
4109 // The next OpenMP operation in the chain of parents
4110 Operation *structuralParent = getParentInSameDialect((*this).getOperation());
4111 if (!structuralParent)
4112 return emitOpError() << "Orphaned cancellation point";
4113
4114 if ((cct == ClauseCancellationConstructType::Parallel) &&
4115 !mlir::isa<ParallelOp>(structuralParent)) {
4116 return emitOpError() << "cancellation point parallel must appear "
4117 << "inside a parallel region";
4118 }
4119 // Strucutal parent here will be an omp.loop_nest. Get the parent of that to
4120 // find the wsloop
4121 if ((cct == ClauseCancellationConstructType::Loop) &&
4122 !mlir::isa<WsloopOp>(structuralParent->getParentOp())) {
4123 return emitOpError() << "cancellation point loop must appear "
4124 << "inside a worksharing-loop region";
4125 }
4126 if ((cct == ClauseCancellationConstructType::Sections) &&
4127 !mlir::isa<omp::SectionOp>(structuralParent)) {
4128 return emitOpError() << "cancellation point sections must appear "
4129 << "inside a sections region";
4130 }
4131 if ((cct == ClauseCancellationConstructType::Taskgroup) &&
4132 !mlir::isa<omp::TaskOp>(structuralParent)) {
4133 return emitOpError() << "cancellation point taskgroup must appear "
4134 << "inside a task region";
4135 }
4136 return success();
4137}
4138
4139//===----------------------------------------------------------------------===//
4140// MapBoundsOp
4141//===----------------------------------------------------------------------===//
4142
4143LogicalResult MapBoundsOp::verify() {
4144 auto extent = getExtent();
4145 auto upperbound = getUpperBound();
4146 if (!extent && !upperbound)
4147 return emitError("expected extent or upperbound.");
4148 return success();
4149}
4150
4151void PrivateClauseOp::build(OpBuilder &odsBuilder, OperationState &odsState,
4152 TypeRange /*result_types*/, StringAttr symName,
4153 TypeAttr type) {
4154 PrivateClauseOp::build(
4155 odsBuilder, odsState, symName, type,
4156 DataSharingClauseTypeAttr::get(odsBuilder.getContext(),
4157 DataSharingClauseType::Private));
4158}
4159
4160LogicalResult PrivateClauseOp::verifyRegions() {
4161 Type argType = getArgType();
4162 auto verifyTerminator = [&](Operation *terminator,
4163 bool yieldsValue) -> LogicalResult {
4164 if (!terminator->getBlock()->getSuccessors().empty())
4165 return success();
4166
4167 if (!llvm::isa<YieldOp>(terminator))
4168 return mlir::emitError(terminator->getLoc())
4169 << "expected exit block terminator to be an `omp.yield` op.";
4170
4171 YieldOp yieldOp = llvm::cast<YieldOp>(terminator);
4172 TypeRange yieldedTypes = yieldOp.getResults().getTypes();
4173
4174 if (!yieldsValue) {
4175 if (yieldedTypes.empty())
4176 return success();
4177
4178 return mlir::emitError(terminator->getLoc())
4179 << "Did not expect any values to be yielded.";
4180 }
4181
4182 if (yieldedTypes.size() == 1 && yieldedTypes.front() == argType)
4183 return success();
4184
4185 auto error = mlir::emitError(yieldOp.getLoc())
4186 << "Invalid yielded value. Expected type: " << argType
4187 << ", got: ";
4188
4189 if (yieldedTypes.empty())
4190 error << "None";
4191 else
4192 error << yieldedTypes;
4193
4194 return error;
4195 };
4196
4197 auto verifyRegion = [&](Region &region, unsigned expectedNumArgs,
4198 StringRef regionName,
4199 bool yieldsValue) -> LogicalResult {
4200 assert(!region.empty());
4201
4202 if (region.getNumArguments() != expectedNumArgs)
4203 return mlir::emitError(region.getLoc())
4204 << "`" << regionName << "`: "
4205 << "expected " << expectedNumArgs
4206 << " region arguments, got: " << region.getNumArguments();
4207
4208 for (Block &block : region) {
4209 // MLIR will verify the absence of the terminator for us.
4210 if (!block.mightHaveTerminator())
4211 continue;
4212
4213 if (failed(verifyTerminator(block.getTerminator(), yieldsValue)))
4214 return failure();
4215 }
4216
4217 return success();
4218 };
4219
4220 // Ensure all of the region arguments have the same type
4221 for (Region *region : getRegions())
4222 for (Type ty : region->getArgumentTypes())
4223 if (ty != argType)
4224 return emitError() << "Region argument type mismatch: got " << ty
4225 << " expected " << argType << ".";
4226
4227 mlir::Region &initRegion = getInitRegion();
4228 if (!initRegion.empty() &&
4229 failed(verifyRegion(getInitRegion(), /*expectedNumArgs=*/2, "init",
4230 /*yieldsValue=*/true)))
4231 return failure();
4232
4233 DataSharingClauseType dsType = getDataSharingType();
4234
4235 if (dsType == DataSharingClauseType::Private && !getCopyRegion().empty())
4236 return emitError("`private` clauses do not require a `copy` region.");
4237
4238 if (dsType == DataSharingClauseType::FirstPrivate && getCopyRegion().empty())
4239 return emitError(
4240 "`firstprivate` clauses require at least a `copy` region.");
4241
4242 if (dsType == DataSharingClauseType::FirstPrivate &&
4243 failed(verifyRegion(getCopyRegion(), /*expectedNumArgs=*/2, "copy",
4244 /*yieldsValue=*/true)))
4245 return failure();
4246
4247 if (!getDeallocRegion().empty() &&
4248 failed(verifyRegion(getDeallocRegion(), /*expectedNumArgs=*/1, "dealloc",
4249 /*yieldsValue=*/false)))
4250 return failure();
4251
4252 return success();
4253}
4254
4255//===----------------------------------------------------------------------===//
4256// Spec 5.2: Masked construct (10.5)
4257//===----------------------------------------------------------------------===//
4258
4259void MaskedOp::build(OpBuilder &builder, OperationState &state,
4260 const MaskedOperands &clauses) {
4261 MaskedOp::build(builder, state, clauses.filteredThreadId);
4262}
4263
4264//===----------------------------------------------------------------------===//
4265// Spec 5.2: Scan construct (5.6)
4266//===----------------------------------------------------------------------===//
4267
4268void ScanOp::build(OpBuilder &builder, OperationState &state,
4269 const ScanOperands &clauses) {
4270 ScanOp::build(builder, state, clauses.inclusiveVars, clauses.exclusiveVars);
4271}
4272
4273LogicalResult ScanOp::verify() {
4274 if (hasExclusiveVars() == hasInclusiveVars())
4275 return emitError(
4276 "Exactly one of EXCLUSIVE or INCLUSIVE clause is expected");
4277 if (WsloopOp parentWsLoopOp = (*this)->getParentOfType<WsloopOp>()) {
4278 if (parentWsLoopOp.getReductionModAttr() &&
4279 parentWsLoopOp.getReductionModAttr().getValue() ==
4280 ReductionModifier::inscan)
4281 return success();
4282 }
4283 if (SimdOp parentSimdOp = (*this)->getParentOfType<SimdOp>()) {
4284 if (parentSimdOp.getReductionModAttr() &&
4285 parentSimdOp.getReductionModAttr().getValue() ==
4286 ReductionModifier::inscan)
4287 return success();
4288 }
4289 return emitError("SCAN directive needs to be enclosed within a parent "
4290 "worksharing loop construct or SIMD construct with INSCAN "
4291 "reduction modifier");
4292}
4293
4294/// Verifies align clause in allocate directive
4295
4296LogicalResult AllocateDirOp::verify() {
4297 std::optional<uint64_t> align = this->getAlign();
4298
4299 if (align.has_value()) {
4300 if ((align.value() > 0) && !llvm::has_single_bit(align.value()))
4301 return emitError() << "ALIGN value : " << align.value()
4302 << " must be power of 2";
4303 }
4304
4305 return success();
4306}
4307
4308//===----------------------------------------------------------------------===//
4309// TargetAllocMemOp
4310//===----------------------------------------------------------------------===//
4311
4312mlir::Type omp::TargetAllocMemOp::getAllocatedType() {
4313 return getInTypeAttr().getValue();
4314}
4315
// NOTE(review): this listing is missing some lines of the function (the end of
// the signature, the declarations of `deviceOperand`, `operands` and
// `typeVec`, and the start of the two operand-list parsing conditions);
// confirm against the real source file.
4316/// operation ::= %res = (`omp.target_alloc_mem`) $device : devicetype,
4317/// $in_type ( `(` $typeparams `)` )? ( `,` $shape )?
4318/// attr-dict-without-keyword
4319static mlir::ParseResult parseTargetAllocMemOp(mlir::OpAsmParser &parser,
4321 auto &builder = parser.getBuilder();
4322 bool hasOperands = false;
4323 std::int32_t typeparamsSize = 0;
4324
4325 // Parse device number as a new operand
4327 mlir::Type deviceType;
4328 if (parser.parseOperand(deviceOperand) || parser.parseColonType(deviceType))
4329 return mlir::failure();
4330 if (parser.resolveOperand(deviceOperand, deviceType, result.operands))
4331 return mlir::failure();
4332 if (parser.parseComma())
4333 return mlir::failure();
4334
// The allocated type is stored as the `in_type` attribute.
4335 mlir::Type intype;
4336 if (parser.parseType(intype))
4337 return mlir::failure();
4338 result.addAttribute("in_type", mlir::TypeAttr::get(intype));
4341 if (!parser.parseOptionalLParen()) {
4342 // parse the LEN params of the derived type. (<params> : <types>)
4344 parser.parseColonTypeList(typeVec) || parser.parseRParen())
4345 return mlir::failure();
4346 typeparamsSize = operands.size();
4347 hasOperands = true;
4348 }
4349 std::int32_t shapeSize = 0;
4350 if (!parser.parseOptionalComma()) {
4351 // parse size to scale by, vector of n dimensions of type index
4353 return mlir::failure();
// Everything parsed after the type parameters is a shape operand; each one
// is given the index type.
4354 shapeSize = operands.size() - typeparamsSize;
4355 auto idxTy = builder.getIndexType();
4356 for (std::int32_t i = typeparamsSize, end = operands.size(); i != end; ++i)
4357 typeVec.push_back(idxTy);
4358 hasOperands = true;
4359 }
4360 if (hasOperands &&
4361 parser.resolveOperands(operands, typeVec, parser.getNameLoc(),
4362 result.operands))
4363 return mlir::failure();
4364
// The result type is always a 64-bit integer.
4365 mlir::Type restype = builder.getIntegerType(64);
4366 if (!restype) {
4367 parser.emitError(parser.getNameLoc(), "invalid allocate type: ") << intype;
4368 return mlir::failure();
4369 }
// Operand segments: one device operand, then the type parameters, then the
// shape operands.
4370 llvm::SmallVector<std::int32_t> segmentSizes{1, typeparamsSize, shapeSize};
4371 result.addAttribute("operandSegmentSizes",
4372 builder.getDenseI32ArrayAttr(segmentSizes));
4373 if (parser.parseOptionalAttrDict(result.attributes) ||
4374 parser.addTypeToList(restype, result.types))
4375 return mlir::failure();
4376 return mlir::success();
4377}
4378
/// Parses the custom assembly form by delegating to parseTargetAllocMemOp.
// NOTE(review): the second line of the signature (declaring `result`) is
// missing from this listing; confirm against the real source file.
4379mlir::ParseResult omp::TargetAllocMemOp::parse(mlir::OpAsmParser &parser,
4381 return parseTargetAllocMemOp(parser, result);
4382}
4383
/// Prints the custom assembly form: the device type, the allocated type, the
/// optional parenthesized type parameters with their types, the
/// comma-separated shape operands, and the remaining attributes.
// NOTE(review): one line is missing from this listing between the leading
// space and " : " (presumably it prints the device operand); confirm against
// the real source file.
4384void omp::TargetAllocMemOp::print(mlir::OpAsmPrinter &p) {
4385 p << " ";
4387 p << " : ";
4388 p << getDevice().getType();
4389 p << ", ";
4390 p << getInType();
4391 if (!getTypeparams().empty()) {
4392 p << '(' << getTypeparams() << " : " << getTypeparams().getTypes() << ')';
4393 }
4394 for (auto sh : getShape()) {
4395 p << ", ";
4396 p.printOperand(sh);
4397 }
// `in_type` and `operandSegmentSizes` are excluded from the printed
// attribute dictionary.
4398 p.printOptionalAttrDict((*this)->getAttrs(),
4399 {"in_type", "operandSegmentSizes"});
4400}
4401
4402llvm::LogicalResult omp::TargetAllocMemOp::verify() {
4403 mlir::Type outType = getType();
4404 if (!mlir::dyn_cast<IntegerType>(outType))
4405 return emitOpError("must be a integer type");
4406 return mlir::success();
4407}
4408
4409//===----------------------------------------------------------------------===//
4410// WorkdistributeOp
4411//===----------------------------------------------------------------------===//
4412
4413LogicalResult WorkdistributeOp::verify() {
4414 // Check that region exists and is not empty
4415 Region &region = getRegion();
4416 if (region.empty())
4417 return emitOpError("region cannot be empty");
4418 // Verify single entry point.
4419 Block &entryBlock = region.front();
4420 if (entryBlock.empty())
4421 return emitOpError("region must contain a structured block");
4422 // Verify single exit point.
4423 bool hasTerminator = false;
4424 for (Block &block : region) {
4425 if (isa<TerminatorOp>(block.back())) {
4426 if (hasTerminator) {
4427 return emitOpError("region must have exactly one terminator");
4428 }
4429 hasTerminator = true;
4430 }
4431 }
4432 if (!hasTerminator) {
4433 return emitOpError("region must be terminated with omp.terminator");
4434 }
4435 auto walkResult = region.walk([&](Operation *op) -> WalkResult {
4436 // No implicit barrier at end
4437 if (isa<BarrierOp>(op)) {
4438 return emitOpError(
4439 "explicit barriers are not allowed in workdistribute region");
4440 }
4441 // Check for invalid nested constructs
4442 if (isa<ParallelOp>(op)) {
4443 return emitOpError(
4444 "nested parallel constructs not allowed in workdistribute");
4445 }
4446 if (isa<TeamsOp>(op)) {
4447 return emitOpError(
4448 "nested teams constructs not allowed in workdistribute");
4449 }
4450 return WalkResult::advance();
4451 });
4452 if (walkResult.wasInterrupted())
4453 return failure();
4454
4455 Operation *parentOp = (*this)->getParentOp();
4456 if (!llvm::dyn_cast<TeamsOp>(parentOp))
4457 return emitOpError("workdistribute must be nested under teams");
4458 return success();
4459}
4460
4461#define GET_ATTRDEF_CLASSES
4462#include "mlir/Dialect/OpenMP/OpenMPOpsAttributes.cpp.inc"
4463
4464#define GET_OP_CLASSES
4465#include "mlir/Dialect/OpenMP/OpenMPOps.cpp.inc"
4466
4467#define GET_TYPEDEF_CLASSES
4468#include "mlir/Dialect/OpenMP/OpenMPOpsTypes.cpp.inc"
static SmallVector< Value > getTileSizes(Location loc, amx::TileType tType, RewriterBase &rewriter)
Maps the 2-dim vector shape to the two 16-bit tile sizes.
return success()
p<< " : "<< getMemRefType()<< ", "<< getType();}static LogicalResult verifyVectorMemoryOp(Operation *op, MemRefType memrefType, VectorType vectorType) { if(memrefType.getElementType() !=vectorType.getElementType()) return op-> emitOpError("requires memref and vector types of the same elemental type")
Given a list of lists of parsed operands, populates uniqueOperands with unique operands.
static std::optional< int64_t > getUpperBound(Value iv)
Gets the constant upper bound on an affine.for iv.
static LogicalResult verifyRegion(emitc::SwitchOp op, Region &region, const Twine &name)
Definition EmitC.cpp:1400
static Type getElementType(Type type)
Determine the element type of type.
static ze_device_handle_t getDevice(const uint32_t driverIdx=0, const int32_t devIdx=0)
b
Return true if permutation is a valid permutation of the outer_dims_perm (case OuterOrInnerPerm::Oute...
ArrayAttr()
b getContext())
static const mlir::GenInfo * generator
static LogicalResult verifyNontemporalClause(Operation *op, OperandRange nontemporalVars)
static DenseI64ArrayAttr makeDenseI64ArrayAttr(MLIRContext *ctx, const ArrayRef< int64_t > intArray)
static constexpr StringRef getPrivateNeedsBarrierSpelling()
static LogicalResult verifyMapClause(Operation *op, OperandRange mapVars)
static LogicalResult verifyReductionVarList(Operation *op, std::optional< ArrayAttr > reductionSyms, OperandRange reductionVars, std::optional< ArrayRef< bool > > reductionByref)
Verifies Reduction Clause.
static ParseResult parseInReductionPrivateRegion(OpAsmParser &parser, Region &region, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &inReductionVars, SmallVectorImpl< Type > &inReductionTypes, DenseBoolArrayAttr &inReductionByref, ArrayAttr &inReductionSyms, llvm::SmallVectorImpl< OpAsmParser::UnresolvedOperand > &privateVars, llvm::SmallVectorImpl< Type > &privateTypes, ArrayAttr &privateSyms, UnitAttr &privateNeedsBarrier)
static ArrayAttr makeArrayAttr(MLIRContext *context, llvm::ArrayRef< Attribute > attrs)
static ParseResult parseClauseAttr(AsmParser &parser, ClauseAttr &attr)
static void printAllocateAndAllocator(OpAsmPrinter &p, Operation *op, OperandRange allocateVars, TypeRange allocateTypes, OperandRange allocatorVars, TypeRange allocatorTypes)
Print allocate clause.
static DenseBoolArrayAttr makeDenseBoolArrayAttr(MLIRContext *ctx, const ArrayRef< bool > boolArray)
static std::string generateLoopNestingName(StringRef prefix, CanonicalLoopOp op)
Generate a name of a canonical loop nest of the format <prefix>(_r<idx>_s<idx>)*.
static void printClauseWithRegionArgs(OpAsmPrinter &p, MLIRContext *ctx, StringRef clauseName, ValueRange argsSubrange, ValueRange operands, TypeRange types, ArrayAttr symbols=nullptr, DenseI64ArrayAttr mapIndices=nullptr, DenseBoolArrayAttr byref=nullptr, ReductionModifierAttr modifier=nullptr, UnitAttr needsBarrier=nullptr)
static void printBlockArgClause(OpAsmPrinter &p, MLIRContext *ctx, StringRef clauseName, ValueRange argsSubrange, std::optional< MapPrintArgs > mapArgs)
static void printBlockArgRegion(OpAsmPrinter &p, Operation *op, Region &region, const AllRegionPrintArgs &args)
static ParseResult parseGranularityClause(OpAsmParser &parser, ClauseTypeAttr &prescriptiveness, std::optional< OpAsmParser::UnresolvedOperand > &operand, Type &operandType, std::optional< ClauseType >(*symbolizeClause)(StringRef), StringRef clauseName)
static ParseResult parseBlockArgRegion(OpAsmParser &parser, Region &region, AllRegionParseArgs args)
static ParseResult parseLoopTransformClis(OpAsmParser &parser, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &generateesOperands, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &applyeesOperands)
static ParseResult parseSynchronizationHint(OpAsmParser &parser, IntegerAttr &hintAttr)
Parses a Synchronization Hint clause.
static ParseResult parseLinearClause(OpAsmParser &parser, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &linearVars, SmallVectorImpl< Type > &linearTypes, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &linearStepVars)
linear ::= linear ( linear-list ) linear-list := linear-val | linear-val linear-list linear-val := ss...
static void printScheduleClause(OpAsmPrinter &p, Operation *op, ClauseScheduleKindAttr scheduleKind, ScheduleModifierAttr scheduleMod, UnitAttr scheduleSimd, Value scheduleChunk, Type scheduleChunkType)
Print schedule clause.
static void printCopyprivate(OpAsmPrinter &p, Operation *op, OperandRange copyprivateVars, TypeRange copyprivateTypes, std::optional< ArrayAttr > copyprivateSyms)
Print Copyprivate clause.
static ParseResult parseOrderClause(OpAsmParser &parser, ClauseOrderKindAttr &order, OrderModifierAttr &orderMod)
static bool mapTypeToBool(ClauseMapFlags value, ClauseMapFlags flag)
static void printAlignedClause(OpAsmPrinter &p, Operation *op, ValueRange alignedVars, TypeRange alignedTypes, std::optional< ArrayAttr > alignments)
Print Aligned Clause.
static LogicalResult verifySynchronizationHint(Operation *op, uint64_t hint)
Verifies a synchronization hint clause.
static ParseResult parseUseDeviceAddrUseDevicePtrRegion(OpAsmParser &parser, Region &region, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &useDeviceAddrVars, SmallVectorImpl< Type > &useDeviceAddrTypes, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &useDevicePtrVars, SmallVectorImpl< Type > &useDevicePtrTypes)
static void printLinearClause(OpAsmPrinter &p, Operation *op, ValueRange linearVars, TypeRange linearTypes, ValueRange linearStepVars)
Print Linear Clause.
static mlir::ParseResult parseTargetAllocMemOp(mlir::OpAsmParser &parser, mlir::OperationState &result)
operation ::= res = (omp.target_alloc_mem) $device : devicetype, $in_type ( ( $typeparams ) )?...
static Operation * findCapturedOmpOp(Operation *rootOp, bool checkSingleMandatoryExec, llvm::function_ref< bool(Operation *)> siblingAllowedFn)
static void printInReductionPrivateReductionRegion(OpAsmPrinter &p, Operation *op, Region &region, ValueRange inReductionVars, TypeRange inReductionTypes, DenseBoolArrayAttr inReductionByref, ArrayAttr inReductionSyms, ValueRange privateVars, TypeRange privateTypes, ArrayAttr privateSyms, UnitAttr privateNeedsBarrier, ReductionModifierAttr reductionMod, ValueRange reductionVars, TypeRange reductionTypes, DenseBoolArrayAttr reductionByref, ArrayAttr reductionSyms)
static void printInReductionPrivateRegion(OpAsmPrinter &p, Operation *op, Region &region, ValueRange inReductionVars, TypeRange inReductionTypes, DenseBoolArrayAttr inReductionByref, ArrayAttr inReductionSyms, ValueRange privateVars, TypeRange privateTypes, ArrayAttr privateSyms, UnitAttr privateNeedsBarrier)
static void printSynchronizationHint(OpAsmPrinter &p, Operation *op, IntegerAttr hintAttr)
Prints a Synchronization Hint clause.
static void printGranularityClause(OpAsmPrinter &p, Operation *op, ClauseTypeAttr prescriptiveness, Value operand, mlir::Type operandType, StringRef(*stringifyClauseType)(ClauseType))
static void printDependVarList(OpAsmPrinter &p, Operation *op, OperandRange dependVars, TypeRange dependTypes, std::optional< ArrayAttr > dependKinds)
Print Depend clause.
static void printTargetOpRegion(OpAsmPrinter &p, Operation *op, Region &region, ValueRange hasDeviceAddrVars, TypeRange hasDeviceAddrTypes, ValueRange hostEvalVars, TypeRange hostEvalTypes, ValueRange inReductionVars, TypeRange inReductionTypes, DenseBoolArrayAttr inReductionByref, ArrayAttr inReductionSyms, ValueRange mapVars, TypeRange mapTypes, ValueRange privateVars, TypeRange privateTypes, ArrayAttr privateSyms, UnitAttr privateNeedsBarrier, DenseI64ArrayAttr privateMaps)
static Operation * getParentInSameDialect(Operation *thisOp)
static LogicalResult verifyCopyprivateVarList(Operation *op, OperandRange copyprivateVars, std::optional< ArrayAttr > copyprivateSyms)
Verifies CopyPrivate Clause.
static LogicalResult verifyAlignedClause(Operation *op, std::optional< ArrayAttr > alignments, OperandRange alignedVars)
static ParseResult parseTargetOpRegion(OpAsmParser &parser, Region &region, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &hasDeviceAddrVars, SmallVectorImpl< Type > &hasDeviceAddrTypes, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &hostEvalVars, SmallVectorImpl< Type > &hostEvalTypes, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &inReductionVars, SmallVectorImpl< Type > &inReductionTypes, DenseBoolArrayAttr &inReductionByref, ArrayAttr &inReductionSyms, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &mapVars, SmallVectorImpl< Type > &mapTypes, llvm::SmallVectorImpl< OpAsmParser::UnresolvedOperand > &privateVars, llvm::SmallVectorImpl< Type > &privateTypes, ArrayAttr &privateSyms, UnitAttr &privateNeedsBarrier, DenseI64ArrayAttr &privateMaps)
static ParseResult parsePrivateRegion(OpAsmParser &parser, Region &region, llvm::SmallVectorImpl< OpAsmParser::UnresolvedOperand > &privateVars, llvm::SmallVectorImpl< Type > &privateTypes, ArrayAttr &privateSyms, UnitAttr &privateNeedsBarrier)
static void printNumTasksClause(OpAsmPrinter &p, Operation *op, ClauseNumTasksTypeAttr numTasksMod, Value numTasks, mlir::Type numTasksType)
static void printLoopTransformClis(OpAsmPrinter &p, TileOp op, OperandRange generatees, OperandRange applyees)
static void printPrivateRegion(OpAsmPrinter &p, Operation *op, Region &region, ValueRange privateVars, TypeRange privateTypes, ArrayAttr privateSyms, UnitAttr privateNeedsBarrier)
static void printPrivateReductionRegion(OpAsmPrinter &p, Operation *op, Region &region, ValueRange privateVars, TypeRange privateTypes, ArrayAttr privateSyms, UnitAttr privateNeedsBarrier, ReductionModifierAttr reductionMod, ValueRange reductionVars, TypeRange reductionTypes, DenseBoolArrayAttr reductionByref, ArrayAttr reductionSyms)
static void printTaskReductionRegion(OpAsmPrinter &p, Operation *op, Region &region, ValueRange taskReductionVars, TypeRange taskReductionTypes, DenseBoolArrayAttr taskReductionByref, ArrayAttr taskReductionSyms)
return success()
static LogicalResult verifyOrderedParent(Operation &op)
static void printOrderClause(OpAsmPrinter &p, Operation *op, ClauseOrderKindAttr order, OrderModifierAttr orderMod)
static ParseResult parseBlockArgClause(OpAsmParser &parser, llvm::SmallVectorImpl< OpAsmParser::Argument > &entryBlockArgs, StringRef keyword, std::optional< MapParseArgs > mapArgs)
static ParseResult parseClauseWithRegionArgs(OpAsmParser &parser, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &operands, SmallVectorImpl< Type > &types, SmallVectorImpl< OpAsmParser::Argument > &regionPrivateArgs, ArrayAttr *symbols=nullptr, DenseI64ArrayAttr *mapIndices=nullptr, DenseBoolArrayAttr *byref=nullptr, ReductionModifierAttr *modifier=nullptr, UnitAttr *needsBarrier=nullptr)
static LogicalResult verifyPrivateVarsMapping(TargetOp targetOp)
static ParseResult parseScheduleClause(OpAsmParser &parser, ClauseScheduleKindAttr &scheduleAttr, ScheduleModifierAttr &scheduleMod, UnitAttr &scheduleSimd, std::optional< OpAsmParser::UnresolvedOperand > &chunkSize, Type &chunkType)
schedule ::= schedule ( sched-list ) sched-list ::= sched-val | sched-val sched-list | sched-val ,...
static void printClauseAttr(OpAsmPrinter &p, Operation *op, ClauseAttr attr)
static ParseResult parseAllocateAndAllocator(OpAsmParser &parser, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &allocateVars, SmallVectorImpl< Type > &allocateTypes, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &allocatorVars, SmallVectorImpl< Type > &allocatorTypes)
Parse an allocate clause with allocators and a list of operands with types.
static void printMembersIndex(OpAsmPrinter &p, MapInfoOp op, ArrayAttr membersIdx)
static bool canPromoteToNoLoop(Operation *capturedOp, TeamsOp teamsOp, WsloopOp *wsLoopOp)
Check if we can promote SPMD kernel to No-Loop kernel.
static void printCaptureType(OpAsmPrinter &p, Operation *op, VariableCaptureKindAttr mapCaptureType)
static bool opInGlobalImplicitParallelRegion(Operation *op)
static void printUseDeviceAddrUseDevicePtrRegion(OpAsmPrinter &p, Operation *op, Region &region, ValueRange useDeviceAddrVars, TypeRange useDeviceAddrTypes, ValueRange useDevicePtrVars, TypeRange useDevicePtrTypes)
static LogicalResult verifyPrivateVarList(OpType &op)
static ParseResult parseNumTasksClause(OpAsmParser &parser, ClauseNumTasksTypeAttr &numTasksMod, std::optional< OpAsmParser::UnresolvedOperand > &numTasks, Type &numTasksType)
static ParseResult parseAlignedClause(OpAsmParser &parser, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &alignedVars, SmallVectorImpl< Type > &alignedTypes, ArrayAttr &alignmentsAttr)
aligned ::= aligned ( aligned-list ) aligned-list := aligned-val | aligned-val aligned-list aligned-v...
static ParseResult parsePrivateReductionRegion(OpAsmParser &parser, Region &region, llvm::SmallVectorImpl< OpAsmParser::UnresolvedOperand > &privateVars, llvm::SmallVectorImpl< Type > &privateTypes, ArrayAttr &privateSyms, UnitAttr &privateNeedsBarrier, ReductionModifierAttr &reductionMod, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &reductionVars, SmallVectorImpl< Type > &reductionTypes, DenseBoolArrayAttr &reductionByref, ArrayAttr &reductionSyms)
static ParseResult parseInReductionPrivateReductionRegion(OpAsmParser &parser, Region &region, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &inReductionVars, SmallVectorImpl< Type > &inReductionTypes, DenseBoolArrayAttr &inReductionByref, ArrayAttr &inReductionSyms, llvm::SmallVectorImpl< OpAsmParser::UnresolvedOperand > &privateVars, llvm::SmallVectorImpl< Type > &privateTypes, ArrayAttr &privateSyms, UnitAttr &privateNeedsBarrier, ReductionModifierAttr &reductionMod, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &reductionVars, SmallVectorImpl< Type > &reductionTypes, DenseBoolArrayAttr &reductionByref, ArrayAttr &reductionSyms)
static ParseResult parseCaptureType(OpAsmParser &parser, VariableCaptureKindAttr &mapCaptureType)
static ParseResult parseTaskReductionRegion(OpAsmParser &parser, Region &region, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &taskReductionVars, SmallVectorImpl< Type > &taskReductionTypes, DenseBoolArrayAttr &taskReductionByref, ArrayAttr &taskReductionSyms)
static ParseResult parseGrainsizeClause(OpAsmParser &parser, ClauseGrainsizeTypeAttr &grainsizeMod, std::optional< OpAsmParser::UnresolvedOperand > &grainsize, Type &grainsizeType)
static ParseResult parseCopyprivate(OpAsmParser &parser, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &copyprivateVars, SmallVectorImpl< Type > &copyprivateTypes, ArrayAttr &copyprivateSyms)
copyprivate-entry-list ::= copyprivate-entry | copyprivate-entry-list , copyprivate-entry copyprivate...
static LogicalResult verifyDependVarList(Operation *op, std::optional< ArrayAttr > dependKinds, OperandRange dependVars)
Verifies Depend clause.
static ParseResult parseDependVarList(OpAsmParser &parser, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &dependVars, SmallVectorImpl< Type > &dependTypes, ArrayAttr &dependKinds)
depend-entry-list ::= depend-entry | depend-entry-list , depend-entry depend-entry ::= depend-kind ->...
static LogicalResult verifyMapInfoDefinedArgs(Operation *op, StringRef clauseName, OperandRange vars)
static void printGrainsizeClause(OpAsmPrinter &p, Operation *op, ClauseGrainsizeTypeAttr grainsizeMod, Value grainsize, mlir::Type grainsizeType)
static ParseResult verifyScheduleModifiers(OpAsmParser &parser, SmallVectorImpl< SmallString< 12 > > &modifiers)
static bool isUnique(It begin, It end)
Definition ShardOps.cpp:161
static ArrayRef< int64_t > getShape(Type type)
Returns the shape of the given type.
Definition Traits.cpp:117
This base class exposes generic asm parser hooks, usable across the various derived parsers.
virtual ParseResult parseMinus()=0
Parse a '-' token.
@ Paren
Parens surrounding zero or more operands.
@ None
Zero or more operands with no delimiters.
virtual ParseResult parseColonTypeList(SmallVectorImpl< Type > &result)=0
Parse a colon followed by a type list, which must have at least one type.
virtual Builder & getBuilder() const =0
Return a builder which provides useful access to MLIRContext, global objects like types and attribute...
virtual ParseResult parseCommaSeparatedList(Delimiter delimiter, function_ref< ParseResult()> parseElementFn, StringRef contextMessage=StringRef())=0
Parse a list of comma-separated items with an optional delimiter.
virtual ParseResult parseOptionalAttrDict(NamedAttrList &result)=0
Parse a named dictionary into 'result' if it is present.
virtual ParseResult parseOptionalEqual()=0
Parse a = token if present.
virtual ParseResult parseOptionalKeyword(StringRef keyword)=0
Parse the given keyword if present.
MLIRContext * getContext() const
virtual ParseResult parseRParen()=0
Parse a ) token.
virtual InFlightDiagnostic emitError(SMLoc loc, const Twine &message={})=0
Emit a diagnostic at the specified location and return failure.
virtual ParseResult parseOptionalColon()=0
Parse a : token if present.
virtual ParseResult parseLSquare()=0
Parse a [ token.
virtual ParseResult parseRSquare()=0
Parse a ] token.
ParseResult parseInteger(IntT &result)
Parse an integer value from the stream.
virtual ParseResult parseOptionalArrow()=0
Parse a '->' token if present.
ParseResult addTypeToList(Type type, SmallVectorImpl< Type > &result)
Add the specified type to the end of the specified type list and return success.
virtual ParseResult parseLess()=0
Parse a '<' token.
virtual ParseResult parseEqual()=0
Parse a = token.
virtual ParseResult parseColonType(Type &result)=0
Parse a colon followed by a type.
virtual SMLoc getCurrentLocation()=0
Get the location of the next token and store it into the argument.
virtual ParseResult parseOptionalComma()=0
Parse a , token if present.
virtual ParseResult parseColon()=0
Parse a : token.
virtual SMLoc getNameLoc() const =0
Return the location of the original name token.
virtual ParseResult parseOptionalLess()=0
Parse a '<' token if present.
virtual ParseResult parseArrow()=0
Parse a '->' token.
virtual ParseResult parseLParen()=0
Parse a ( token.
virtual ParseResult parseType(Type &result)=0
Parse a type.
virtual ParseResult parseComma()=0
Parse a , token.
virtual ParseResult parseOptionalLParen()=0
Parse a ( token if present.
ParseResult parseKeyword(StringRef keyword)
Parse a given keyword.
Attributes are known-constant values of operations.
Definition Attributes.h:25
Block represents an ordered list of Operations.
Definition Block.h:33
ValueTypeRange< BlockArgListType > getArgumentTypes()
Return a range containing the types of the arguments for this block.
Definition Block.cpp:149
bool empty()
Definition Block.h:148
BlockArgument getArgument(unsigned i)
Definition Block.h:129
unsigned getNumArguments()
Definition Block.h:128
Operation & front()
Definition Block.h:153
SuccessorRange getSuccessors()
Definition Block.h:270
BlockArgListType getArguments()
Definition Block.h:87
DenseI32ArrayAttr getDenseI32ArrayAttr(ArrayRef< int32_t > values)
Definition Builders.cpp:163
IntegerType getI64Type()
Definition Builders.cpp:65
IntegerType getIntegerType(unsigned width)
Definition Builders.cpp:67
MLIRContext * getContext() const
Definition Builders.h:56
IndexType getIndexType()
Definition Builders.cpp:51
Attr getAttr(Args &&...args)
Get or construct an instance of the attribute Attr with provided arguments.
Definition Builders.h:98
Diagnostic & append(Arg1 &&arg1, Arg2 &&arg2, Args &&...args)
Append arguments to the diagnostic.
Diagnostic & appendOp(Operation &op, const OpPrintingFlags &flags)
Append an operation with the given printing flags.
Dialects are groups of MLIR operations, types and attributes, as well as behavior associated with the...
Definition Dialect.h:38
A class for computing basic dominance information.
Definition Dominance.h:140
bool dominates(Operation *a, Operation *b) const
Return true if operation A dominates operation B, i.e.
Definition Dominance.h:158
This class represents a diagnostic that is inflight and set to be reported.
Diagnostic & attachNote(std::optional< Location > noteLoc=std::nullopt)
Attaches a note to this diagnostic.
MLIRContext is the top-level object for a collection of MLIR operations.
Definition MLIRContext.h:63
The OpAsmParser has methods for interacting with the asm parser: parsing things from it,...
virtual ParseResult parseRegion(Region &region, ArrayRef< Argument > arguments={}, bool enableNameShadowing=false)=0
Parses a region.
virtual ParseResult parseArgument(Argument &result, bool allowType=false, bool allowAttrs=false)=0
Parse a single argument with the following syntax:
virtual ParseResult parseArgumentList(SmallVectorImpl< Argument > &result, Delimiter delimiter=Delimiter::None, bool allowType=false, bool allowAttrs=false)=0
Parse zero or more arguments with a specified surrounding delimiter.
virtual ParseResult resolveOperand(const UnresolvedOperand &operand, Type type, SmallVectorImpl< Value > &result)=0
Resolve an operand to an SSA value, emitting an error on failure.
ParseResult resolveOperands(Operands &&operands, Type type, SmallVectorImpl< Value > &result)
Resolve a list of operands to SSA values, emitting an error on failure, or appending the results to t...
virtual ParseResult parseOperand(UnresolvedOperand &result, bool allowResultNumber=true)=0
Parse a single SSA value operand name along with a result number if allowResultNumber is true.
virtual ParseResult parseOperandList(SmallVectorImpl< UnresolvedOperand > &result, Delimiter delimiter=Delimiter::None, bool allowResultNumber=true, int requiredOperandCount=-1)=0
Parse zero or more SSA comma-separated operand references with a specified surrounding delimiter,...
This is a pure-virtual base class that exposes the asmprinter hooks necessary to implement a custom p...
virtual void printOptionalAttrDict(ArrayRef< NamedAttribute > attrs, ArrayRef< StringRef > elidedAttrs={})=0
If the specified operation has attributes, print out an attribute dictionary with their values.
virtual void printRegion(Region &blocks, bool printEntryBlockArgs=true, bool printBlockTerminators=true, bool printEmptyBlock=false)=0
Prints a region.
virtual void printOperand(Value value)=0
Print implementations for various things an operation contains.
This class helps build Operations.
Definition Builders.h:207
This class represents an operand of an operation.
Definition Value.h:257
Set of flags used to control the behavior of the various IR print methods (e.g.
This class provides the API for ops that are known to be isolated from above.
This class provides the API for ops that are known to be terminators.
This class indicates that the regions associated with this op don't have terminators.
This class implements the operand iterators for the Operation class.
Definition ValueRange.h:43
Operation is the basic unit of execution within MLIR.
Definition Operation.h:88
Dialect * getDialect()
Return the dialect this operation is associated with, or nullptr if the associated dialect is not loa...
Definition Operation.h:220
Region & getRegion(unsigned index)
Returns the region held by this operation at position 'index'.
Definition Operation.h:686
bool hasTrait()
Returns true if the operation was registered with a particular trait, e.g.
Definition Operation.h:749
Block * getBlock()
Returns the operation block that contains this operation.
Definition Operation.h:213
unsigned getNumRegions()
Returns the number of regions held by this operation.
Definition Operation.h:674
Location getLoc()
The source location the operation was defined or derived from.
Definition Operation.h:223
Operation * getParentOp()
Returns the closest surrounding operation that contains this operation or nullptr if this is a top-le...
Definition Operation.h:234
InFlightDiagnostic emitError(const Twine &message={})
Emit an error about fatal conditions with this operation, reporting up to any diagnostic handlers tha...
OpTy getParentOfType()
Return the closest surrounding parent operation that is of type 'OpTy'.
Definition Operation.h:238
MutableArrayRef< Region > getRegions()
Returns the regions held by this operation.
Definition Operation.h:677
std::enable_if_t< llvm::function_traits< std::decay_t< FnT > >::num_args==1, RetT > walk(FnT &&callback)
Walk the operation by calling the callback for each nested operation (including this one),...
Definition Operation.h:797
user_range getUsers()
Returns a range of all users.
Definition Operation.h:873
Region * getParentRegion()
Returns the region to which the instruction belongs.
Definition Operation.h:230
MLIRContext * getContext()
Return the context this operation is associated with.
Definition Operation.h:216
InFlightDiagnostic emitOpError(const Twine &message={})
Emit an error with the op name prefixed, like "'dim' op " which is convenient for verifiers.
A special type of RewriterBase that coordinates the application of a rewrite pattern on the current I...
This class contains a list of basic blocks and a link to the parent operation it is attached to.
Definition Region.h:26
Block & front()
Definition Region.h:65
BlockArgListType getArguments()
Definition Region.h:81
OpIterator op_begin()
Return iterators that walk the operations nested directly within this region.
Definition Region.h:170
iterator_range< OpIterator > getOps()
Definition Region.h:172
bool empty()
Definition Region.h:60
unsigned getNumArguments()
Definition Region.h:123
Location getLoc()
Return a location for this region.
Definition Region.cpp:31
BlockArgument getArgument(unsigned i)
Definition Region.h:124
Operation * getParentOp()
Return the parent operation this region is attached to.
Definition Region.h:200
BlockListType & getBlocks()
Definition Region.h:45
virtual void eraseOp(Operation *op)
This method erases an operation that is known to have no uses.
OpTy replaceOpWithNewOp(Operation *op, Args &&...args)
Replace the results of the given (original) op with a new op that is created without verification (re...
Resource * getResource() const
Return the resource that the effect applies to.
EffectT * getEffect() const
Return the effect being applied.
This class represents a collection of SymbolTables.
virtual Operation * lookupNearestSymbolFrom(Operation *from, StringAttr symbol)
Returns the operation registered with the given symbol name within the closest parent operation of,...
static Operation * lookupNearestSymbolFrom(Operation *from, StringAttr symbol)
Returns the operation registered with the given symbol name within the closest parent operation of,...
This class provides an abstraction over the various different ranges of value types.
Definition TypeRange.h:37
Instances of the Type class are uniqued, have an immutable identifier and an optional mutable compone...
Definition Types.h:74
This class provides an abstraction over the different types of ranges over Values.
Definition ValueRange.h:387
type_range getType() const
This class represents an instance of an SSA value in the MLIR system, representing a computable value...
Definition Value.h:96
MLIRContext * getContext() const
Utility to get the associated MLIRContext that this value is defined in.
Definition Value.h:108
Type getType() const
Return the type of this value.
Definition Value.h:105
use_range getUses() const
Returns a range of all uses, which is useful for iterating over all uses.
Definition Value.h:188
Operation * getDefiningOp() const
If this value is the result of an operation, return the operation that defines it.
Definition Value.cpp:18
A utility result that is used to signal how to proceed with an ongoing walk:
Definition WalkResult.h:29
static WalkResult skip()
Definition WalkResult.h:48
static WalkResult advance()
Definition WalkResult.h:47
static WalkResult interrupt()
Definition WalkResult.h:46
static DenseArrayAttrImpl get(MLIRContext *context, ArrayRef< bool > content)
bool isReachableFromEntry(Block *a) const
Return true if the specified block is reachable from the entry block of its region.
Operation * getOwner() const
Return the owner of this operand.
Definition UseDefLists.h:38
SideEffects::EffectInstance< Effect > EffectInstance
bool isPerfectlyNested(ArrayRef< AffineForOp > loops)
Returns true if loops is a perfectly nested loop nest, where loops appear in it from outermost to inn...
TargetEnterDataOperands TargetEnterExitUpdateDataOperands
omp.target_enter_data, omp.target_exit_data and omp.target_update take the same clauses,...
std::tuple< NewCliOp, OpOperand *, OpOperand * > decodeCli(mlir::Value cli)
Find the omp.new_cli, generator, and consumer of a canonical loop info.
detail::InFlightRemark failed(Location loc, RemarkOpts opts)
Report an optimization remark that failed.
Definition Remarks.h:573
Include the generated interface declarations.
detail::DenseArrayAttrImpl< int64_t > DenseI64ArrayAttr
function_ref< void(Value, StringRef)> OpAsmSetValueNameFn
A functor used to set the name of the start of a result group of an operation.
Type getType(OpFoldResult ofr)
Returns the int type of the integer in ofr.
Definition Utils.cpp:304
llvm::DenseSet< ValueT, ValueInfoT > DenseSet
Definition LLVM.h:128
InFlightDiagnostic emitError(Location loc)
Utility method to emit an error message using this location.
llvm::TypeSwitch< T, ResultT > TypeSwitch
Definition LLVM.h:144
SmallVector< Loops, 8 > tile(ArrayRef< scf::ForOp > forOps, ArrayRef< Value > sizes, ArrayRef< scf::ForOp > targets)
Performs tiling of imperfectly nested loops (with interchange) by strip-mining the forOps by sizes an...
Definition Utils.cpp:1293
detail::DenseArrayAttrImpl< bool > DenseBoolArrayAttr
function_ref< void(Block *, StringRef)> OpAsmSetBlockNameFn
A functor used to set the name of blocks in regions directly nested under an operation.
This is the representation of an operand reference.
This class provides APIs and verifiers for ops with regions having a single block.
This represents an operation in an abstracted form, suitable for use with the builder APIs.
void addOperands(ValueRange newOperands)
void addAttributes(ArrayRef< NamedAttribute > newAttributes)
Add an array of named attributes.
void addTypes(ArrayRef< Type > newTypes)
Region * addRegion()
Create a region that should be attached to the operation.