MLIR 22.0.0git
OpenMPDialect.cpp
Go to the documentation of this file.
1//===- OpenMPDialect.cpp - MLIR Dialect for OpenMP implementation ---------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file implements the OpenMP dialect and its operations.
10//
11//===----------------------------------------------------------------------===//
12
18#include "mlir/IR/Attributes.h"
23#include "mlir/IR/SymbolTable.h"
25
26#include "llvm/ADT/ArrayRef.h"
27#include "llvm/ADT/PostOrderIterator.h"
28#include "llvm/ADT/STLExtras.h"
29#include "llvm/ADT/STLForwardCompat.h"
30#include "llvm/ADT/SmallString.h"
31#include "llvm/ADT/StringExtras.h"
32#include "llvm/ADT/StringRef.h"
33#include "llvm/ADT/TypeSwitch.h"
34#include "llvm/ADT/bit.h"
35#include "llvm/Support/InterleavedRange.h"
36#include <cstddef>
37#include <iterator>
38#include <optional>
39#include <variant>
40
41#include "mlir/Dialect/OpenMP/OpenMPOpsDialect.cpp.inc"
42#include "mlir/Dialect/OpenMP/OpenMPOpsEnums.cpp.inc"
43#include "mlir/Dialect/OpenMP/OpenMPOpsInterfaces.cpp.inc"
44#include "mlir/Dialect/OpenMP/OpenMPTypeInterfaces.cpp.inc"
45
46using namespace mlir;
47using namespace mlir::omp;
48
51 return attrs.empty() ? nullptr : ArrayAttr::get(context, attrs);
52}
53
56 return boolArray.empty() ? nullptr : DenseBoolArrayAttr::get(ctx, boolArray);
57}
58
61 return intArray.empty() ? nullptr : DenseI64ArrayAttr::get(ctx, intArray);
62}
63
64namespace {
65struct MemRefPointerLikeModel
66 : public PointerLikeType::ExternalModel<MemRefPointerLikeModel,
67 MemRefType> {
68 Type getElementType(Type pointer) const {
69 return llvm::cast<MemRefType>(pointer).getElementType();
70 }
71};
72
73struct LLVMPointerPointerLikeModel
74 : public PointerLikeType::ExternalModel<LLVMPointerPointerLikeModel,
75 LLVM::LLVMPointerType> {
76 Type getElementType(Type pointer) const { return Type(); }
77};
78} // namespace
79
80/// Generate a name of a canonical loop nest of the format
81/// `<prefix>(_r<idx>_s<idx>)*`. Hereby, `_r<idx>` identifies the region
82/// argument index of an operation that has multiple regions, if the operation
83/// has multiple regions.
84/// `_s<idx>` identifies the position of an operation within a region, where
85/// only operations that may potentially contain loops ("container operations"
86/// i.e. have region arguments) are counted. Again, it is omitted if there is
87/// only one such operation in a region. If there are canonical loops nested
88/// inside each other, also may also use the format `_d<num>` where <num> is the
89/// nesting depth of the loop.
90///
91/// The generated name is a best-effort to make canonical loop unique within an
92/// SSA namespace. This also means that regions with IsolatedFromAbove property
93/// do not consider any parents or siblings.
94static std::string generateLoopNestingName(StringRef prefix,
95 CanonicalLoopOp op) {
96 struct Component {
97 /// If true, this component describes a region operand of an operation (the
98 /// operand's owner) If false, this component describes an operation located
99 /// in a parent region
100 bool isRegionArgOfOp;
101 bool skip = false;
102 bool isUnique = false;
103
104 size_t idx;
105 Operation *op;
106 Region *parentRegion;
107 size_t loopDepth;
108
109 Operation *&getOwnerOp() {
110 assert(isRegionArgOfOp && "Must describe a region operand");
111 return op;
112 }
113 size_t &getArgIdx() {
114 assert(isRegionArgOfOp && "Must describe a region operand");
115 return idx;
116 }
117
118 Operation *&getContainerOp() {
119 assert(!isRegionArgOfOp && "Must describe a operation of a region");
120 return op;
121 }
122 size_t &getOpPos() {
123 assert(!isRegionArgOfOp && "Must describe a operation of a region");
124 return idx;
125 }
126 bool isLoopOp() const {
127 assert(!isRegionArgOfOp && "Must describe a operation of a region");
128 return isa<CanonicalLoopOp>(op);
129 }
130 Region *&getParentRegion() {
131 assert(!isRegionArgOfOp && "Must describe a operation of a region");
132 return parentRegion;
133 }
134 size_t &getLoopDepth() {
135 assert(!isRegionArgOfOp && "Must describe a operation of a region");
136 return loopDepth;
137 }
138
139 void skipIf(bool v = true) { skip = skip || v; }
140 };
141
142 // List of ancestors, from inner to outer.
143 // Alternates between
144 // * region argument of an operation
145 // * operation within a region
146 SmallVector<Component> components;
147
148 // Gather a list of parent regions and operations, and the position within
149 // their parent
150 Operation *o = op.getOperation();
151 while (o) {
152 // Operation within a region
153 Region *r = o->getParentRegion();
154 if (!r)
155 break;
156
157 llvm::ReversePostOrderTraversal<Block *> traversal(&r->getBlocks().front());
158 size_t idx = 0;
159 bool found = false;
160 size_t sequentialIdx = -1;
161 bool isOnlyContainerOp = true;
162 for (Block *b : traversal) {
163 for (Operation &op : *b) {
164 if (&op == o && !found) {
165 sequentialIdx = idx;
166 found = true;
167 }
168 if (op.getNumRegions()) {
169 idx += 1;
170 if (idx > 1)
171 isOnlyContainerOp = false;
172 }
173 if (found && !isOnlyContainerOp)
174 break;
175 }
176 }
177
178 Component &containerOpInRegion = components.emplace_back();
179 containerOpInRegion.isRegionArgOfOp = false;
180 containerOpInRegion.isUnique = isOnlyContainerOp;
181 containerOpInRegion.getContainerOp() = o;
182 containerOpInRegion.getOpPos() = sequentialIdx;
183 containerOpInRegion.getParentRegion() = r;
184
185 Operation *parent = r->getParentOp();
186
187 // Region argument of an operation
188 Component &regionArgOfOperation = components.emplace_back();
189 regionArgOfOperation.isRegionArgOfOp = true;
190 regionArgOfOperation.isUnique = true;
191 regionArgOfOperation.getArgIdx() = 0;
192 regionArgOfOperation.getOwnerOp() = parent;
193
194 // The IsolatedFromAbove trait of the parent operation implies that each
195 // individual region argument has its own separate namespace, so no
196 // ambiguity.
197 if (!parent || parent->hasTrait<mlir::OpTrait::IsIsolatedFromAbove>())
198 break;
199
200 // Component only needed if operation has multiple region operands. Region
201 // arguments may be optional, but we currently do not consider this.
202 if (parent->getRegions().size() > 1) {
203 auto getRegionIndex = [](Operation *o, Region *r) {
204 for (auto [idx, region] : llvm::enumerate(o->getRegions())) {
205 if (&region == r)
206 return idx;
207 }
208 llvm_unreachable("Region not child of its parent operation");
209 };
210 regionArgOfOperation.isUnique = false;
211 regionArgOfOperation.getArgIdx() = getRegionIndex(parent, r);
212 }
213
214 // next parent
215 o = parent;
216 }
217
218 // Determine whether a region-argument component is not needed
219 for (Component &c : components)
220 c.skipIf(c.isRegionArgOfOp && c.isUnique);
221
222 // Find runs of nested loops and determine each loop's depth in the loop nest
223 size_t numSurroundingLoops = 0;
224 for (Component &c : llvm::reverse(components)) {
225 if (c.skip)
226 continue;
227
228 // non-skipped multi-argument operands interrupt the loop nest
229 if (c.isRegionArgOfOp) {
230 numSurroundingLoops = 0;
231 continue;
232 }
233
234 // Multiple loops in a region means each of them is the outermost loop of a
235 // new loop nest
236 if (!c.isUnique)
237 numSurroundingLoops = 0;
238
239 c.getLoopDepth() = numSurroundingLoops;
240
241 // Next loop is surrounded by one more loop
242 if (isa<CanonicalLoopOp>(c.getContainerOp()))
243 numSurroundingLoops += 1;
244 }
245
246 // In loop nests, skip all but the innermost loop that contains the depth
247 // number
248 bool isLoopNest = false;
249 for (Component &c : components) {
250 if (c.skip || c.isRegionArgOfOp)
251 continue;
252
253 if (!isLoopNest && c.getLoopDepth() >= 1) {
254 // Innermost loop of a loop nest of at least two loops
255 isLoopNest = true;
256 } else if (isLoopNest) {
257 // Non-innermost loop of a loop nest
258 c.skipIf(c.isUnique);
259
260 // If there is no surrounding loop left, this must have been the outermost
261 // loop; leave loop-nest mode for the next iteration
262 if (c.getLoopDepth() == 0)
263 isLoopNest = false;
264 }
265 }
266
267 // Skip non-loop unambiguous regions (but they should interrupt loop nests, so
268 // we mark them as skipped only after computing loop nests)
269 for (Component &c : components)
270 c.skipIf(!c.isRegionArgOfOp && c.isUnique &&
271 !isa<CanonicalLoopOp>(c.getContainerOp()));
272
273 // Components can be skipped if they are already disambiguated by their parent
274 // (or does not have a parent)
275 bool newRegion = true;
276 for (Component &c : llvm::reverse(components)) {
277 c.skipIf(newRegion && c.isUnique);
278
279 // non-skipped components disambiguate unique children
280 if (!c.skip)
281 newRegion = true;
282
283 // ...except canonical loops that need a suffix for each nest
284 if (!c.isRegionArgOfOp && c.getContainerOp())
285 newRegion = false;
286 }
287
288 // Compile the nesting name string
289 SmallString<64> Name{prefix};
290 llvm::raw_svector_ostream NameOS(Name);
291 for (auto &c : llvm::reverse(components)) {
292 if (c.skip)
293 continue;
294
295 if (c.isRegionArgOfOp)
296 NameOS << "_r" << c.getArgIdx();
297 else if (c.getLoopDepth() >= 1)
298 NameOS << "_d" << c.getLoopDepth();
299 else
300 NameOS << "_s" << c.getOpPos();
301 }
302
303 return NameOS.str().str();
304}
305
306void OpenMPDialect::initialize() {
307 addOperations<
308#define GET_OP_LIST
309#include "mlir/Dialect/OpenMP/OpenMPOps.cpp.inc"
310 >();
311 addAttributes<
312#define GET_ATTRDEF_LIST
313#include "mlir/Dialect/OpenMP/OpenMPOpsAttributes.cpp.inc"
314 >();
315 addTypes<
316#define GET_TYPEDEF_LIST
317#include "mlir/Dialect/OpenMP/OpenMPOpsTypes.cpp.inc"
318 >();
319
320 declarePromisedInterface<ConvertToLLVMPatternInterface, OpenMPDialect>();
321
322 MemRefType::attachInterface<MemRefPointerLikeModel>(*getContext());
323 LLVM::LLVMPointerType::attachInterface<LLVMPointerPointerLikeModel>(
324 *getContext());
325
326 // Attach default offload module interface to module op to access
327 // offload functionality through
328 mlir::ModuleOp::attachInterface<mlir::omp::OffloadModuleDefaultModel>(
329 *getContext());
330
331 // Attach default declare target interfaces to operations which can be marked
332 // as declare target (Global Operations and Functions/Subroutines in dialects
333 // that Fortran (or other languages that lower to MLIR) translates too
334 mlir::LLVM::GlobalOp::attachInterface<
336 *getContext());
337 mlir::LLVM::LLVMFuncOp::attachInterface<
339 *getContext());
340 mlir::func::FuncOp::attachInterface<
342}
343
344//===----------------------------------------------------------------------===//
345// Parser and printer for Allocate Clause
346//===----------------------------------------------------------------------===//
347
348/// Parse an allocate clause with allocators and a list of operands with types.
349///
350/// allocate-operand-list :: = allocate-operand |
351/// allocator-operand `,` allocate-operand-list
352/// allocate-operand :: = ssa-id-and-type -> ssa-id-and-type
353/// ssa-id-and-type ::= ssa-id `:` type
354static ParseResult parseAllocateAndAllocator(
355 OpAsmParser &parser,
357 SmallVectorImpl<Type> &allocateTypes,
359 SmallVectorImpl<Type> &allocatorTypes) {
360
361 return parser.parseCommaSeparatedList([&]() {
363 Type type;
364 if (parser.parseOperand(operand) || parser.parseColonType(type))
365 return failure();
366 allocatorVars.push_back(operand);
367 allocatorTypes.push_back(type);
368 if (parser.parseArrow())
369 return failure();
370 if (parser.parseOperand(operand) || parser.parseColonType(type))
371 return failure();
372
373 allocateVars.push_back(operand);
374 allocateTypes.push_back(type);
375 return success();
376 });
377}
378
379/// Print allocate clause
381 OperandRange allocateVars,
382 TypeRange allocateTypes,
383 OperandRange allocatorVars,
384 TypeRange allocatorTypes) {
385 for (unsigned i = 0; i < allocateVars.size(); ++i) {
386 std::string separator = i == allocateVars.size() - 1 ? "" : ", ";
387 p << allocatorVars[i] << " : " << allocatorTypes[i] << " -> ";
388 p << allocateVars[i] << " : " << allocateTypes[i] << separator;
389 }
390}
391
392//===----------------------------------------------------------------------===//
393// Parser and printer for a clause attribute (StringEnumAttr)
394//===----------------------------------------------------------------------===//
395
396template <typename ClauseAttr>
397static ParseResult parseClauseAttr(AsmParser &parser, ClauseAttr &attr) {
398 using ClauseT = decltype(std::declval<ClauseAttr>().getValue());
399 StringRef enumStr;
400 SMLoc loc = parser.getCurrentLocation();
401 if (parser.parseKeyword(&enumStr))
402 return failure();
403 if (std::optional<ClauseT> enumValue = symbolizeEnum<ClauseT>(enumStr)) {
404 attr = ClauseAttr::get(parser.getContext(), *enumValue);
405 return success();
406 }
407 return parser.emitError(loc, "invalid clause value: '") << enumStr << "'";
408}
409
410template <typename ClauseAttr>
411static void printClauseAttr(OpAsmPrinter &p, Operation *op, ClauseAttr attr) {
412 p << stringifyEnum(attr.getValue());
413}
414
415//===----------------------------------------------------------------------===//
416// Parser and printer for Linear Clause
417//===----------------------------------------------------------------------===//
418
419/// linear ::= `linear` `(` linear-list `)`
420/// linear-list := linear-val | linear-val linear-list
421/// linear-val := ssa-id-and-type `=` ssa-id-and-type
422static ParseResult parseLinearClause(
423 OpAsmParser &parser,
425 SmallVectorImpl<Type> &linearTypes,
427 return parser.parseCommaSeparatedList([&]() {
429 Type type;
431 if (parser.parseOperand(var) || parser.parseEqual() ||
432 parser.parseOperand(stepVar) || parser.parseColonType(type))
433 return failure();
434
435 linearVars.push_back(var);
436 linearTypes.push_back(type);
437 linearStepVars.push_back(stepVar);
438 return success();
439 });
440}
441
442/// Print Linear Clause
444 ValueRange linearVars, TypeRange linearTypes,
445 ValueRange linearStepVars) {
446 size_t linearVarsSize = linearVars.size();
447 for (unsigned i = 0; i < linearVarsSize; ++i) {
448 std::string separator = i == linearVarsSize - 1 ? "" : ", ";
449 p << linearVars[i];
450 if (linearStepVars.size() > i)
451 p << " = " << linearStepVars[i];
452 p << " : " << linearVars[i].getType() << separator;
453 }
454}
455
456//===----------------------------------------------------------------------===//
457// Verifier for Nontemporal Clause
458//===----------------------------------------------------------------------===//
459
460static LogicalResult verifyNontemporalClause(Operation *op,
461 OperandRange nontemporalVars) {
462
463 // Check if each var is unique - OpenMP 5.0 -> 2.9.3.1 section
464 DenseSet<Value> nontemporalItems;
465 for (const auto &it : nontemporalVars)
466 if (!nontemporalItems.insert(it).second)
467 return op->emitOpError() << "nontemporal variable used more than once";
468
469 return success();
470}
471
472//===----------------------------------------------------------------------===//
473// Parser, verifier and printer for Aligned Clause
474//===----------------------------------------------------------------------===//
475static LogicalResult verifyAlignedClause(Operation *op,
476 std::optional<ArrayAttr> alignments,
477 OperandRange alignedVars) {
478 // Check if number of alignment values equals to number of aligned variables
479 if (!alignedVars.empty()) {
480 if (!alignments || alignments->size() != alignedVars.size())
481 return op->emitOpError()
482 << "expected as many alignment values as aligned variables";
483 } else {
484 if (alignments)
485 return op->emitOpError() << "unexpected alignment values attribute";
486 return success();
487 }
488
489 // Check if each var is aligned only once - OpenMP 4.5 -> 2.8.1 section
490 DenseSet<Value> alignedItems;
491 for (auto it : alignedVars)
492 if (!alignedItems.insert(it).second)
493 return op->emitOpError() << "aligned variable used more than once";
494
495 if (!alignments)
496 return success();
497
498 // Check if all alignment values are positive - OpenMP 4.5 -> 2.8.1 section
499 for (unsigned i = 0; i < (*alignments).size(); ++i) {
500 if (auto intAttr = llvm::dyn_cast<IntegerAttr>((*alignments)[i])) {
501 if (intAttr.getValue().sle(0))
502 return op->emitOpError() << "alignment should be greater than 0";
503 } else {
504 return op->emitOpError() << "expected integer alignment";
505 }
506 }
507
508 return success();
509}
510
511/// aligned ::= `aligned` `(` aligned-list `)`
512/// aligned-list := aligned-val | aligned-val aligned-list
513/// aligned-val := ssa-id-and-type `->` alignment
514static ParseResult
517 SmallVectorImpl<Type> &alignedTypes,
518 ArrayAttr &alignmentsAttr) {
519 SmallVector<Attribute> alignmentVec;
520 if (failed(parser.parseCommaSeparatedList([&]() {
521 if (parser.parseOperand(alignedVars.emplace_back()) ||
522 parser.parseColonType(alignedTypes.emplace_back()) ||
523 parser.parseArrow() ||
524 parser.parseAttribute(alignmentVec.emplace_back())) {
525 return failure();
526 }
527 return success();
528 })))
529 return failure();
530 SmallVector<Attribute> alignments(alignmentVec.begin(), alignmentVec.end());
531 alignmentsAttr = ArrayAttr::get(parser.getContext(), alignments);
532 return success();
533}
534
535/// Print Aligned Clause
537 ValueRange alignedVars, TypeRange alignedTypes,
538 std::optional<ArrayAttr> alignments) {
539 for (unsigned i = 0; i < alignedVars.size(); ++i) {
540 if (i != 0)
541 p << ", ";
542 p << alignedVars[i] << " : " << alignedVars[i].getType();
543 p << " -> " << (*alignments)[i];
544 }
545}
546
547//===----------------------------------------------------------------------===//
548// Parser, printer and verifier for Schedule Clause
549//===----------------------------------------------------------------------===//
550
551static ParseResult
553 SmallVectorImpl<SmallString<12>> &modifiers) {
554 if (modifiers.size() > 2)
555 return parser.emitError(parser.getNameLoc()) << " unexpected modifier(s)";
556 for (const auto &mod : modifiers) {
557 // Translate the string. If it has no value, then it was not a valid
558 // modifier!
559 auto symbol = symbolizeScheduleModifier(mod);
560 if (!symbol)
561 return parser.emitError(parser.getNameLoc())
562 << " unknown modifier type: " << mod;
563 }
564
565 // If we have one modifier that is "simd", then stick a "none" modiifer in
566 // index 0.
567 if (modifiers.size() == 1) {
568 if (symbolizeScheduleModifier(modifiers[0]) == ScheduleModifier::simd) {
569 modifiers.push_back(modifiers[0]);
570 modifiers[0] = stringifyScheduleModifier(ScheduleModifier::none);
571 }
572 } else if (modifiers.size() == 2) {
573 // If there are two modifier:
574 // First modifier should not be simd, second one should be simd
575 if (symbolizeScheduleModifier(modifiers[0]) == ScheduleModifier::simd ||
576 symbolizeScheduleModifier(modifiers[1]) != ScheduleModifier::simd)
577 return parser.emitError(parser.getNameLoc())
578 << " incorrect modifier order";
579 }
580 return success();
581}
582
583/// schedule ::= `schedule` `(` sched-list `)`
584/// sched-list ::= sched-val | sched-val sched-list |
585/// sched-val `,` sched-modifier
586/// sched-val ::= sched-with-chunk | sched-wo-chunk
587/// sched-with-chunk ::= sched-with-chunk-types (`=` ssa-id-and-type)?
588/// sched-with-chunk-types ::= `static` | `dynamic` | `guided`
589/// sched-wo-chunk ::= `auto` | `runtime`
590/// sched-modifier ::= sched-mod-val | sched-mod-val `,` sched-mod-val
591/// sched-mod-val ::= `monotonic` | `nonmonotonic` | `simd` | `none`
592static ParseResult
593parseScheduleClause(OpAsmParser &parser, ClauseScheduleKindAttr &scheduleAttr,
594 ScheduleModifierAttr &scheduleMod, UnitAttr &scheduleSimd,
595 std::optional<OpAsmParser::UnresolvedOperand> &chunkSize,
596 Type &chunkType) {
597 StringRef keyword;
598 if (parser.parseKeyword(&keyword))
599 return failure();
600 std::optional<mlir::omp::ClauseScheduleKind> schedule =
601 symbolizeClauseScheduleKind(keyword);
602 if (!schedule)
603 return parser.emitError(parser.getNameLoc()) << " expected schedule kind";
604
605 scheduleAttr = ClauseScheduleKindAttr::get(parser.getContext(), *schedule);
606 switch (*schedule) {
607 case ClauseScheduleKind::Static:
608 case ClauseScheduleKind::Dynamic:
609 case ClauseScheduleKind::Guided:
610 if (succeeded(parser.parseOptionalEqual())) {
611 chunkSize = OpAsmParser::UnresolvedOperand{};
612 if (parser.parseOperand(*chunkSize) || parser.parseColonType(chunkType))
613 return failure();
614 } else {
615 chunkSize = std::nullopt;
616 }
617 break;
618 case ClauseScheduleKind::Auto:
619 case ClauseScheduleKind::Runtime:
620 case ClauseScheduleKind::Distribute:
621 chunkSize = std::nullopt;
622 }
623
624 // If there is a comma, we have one or more modifiers..
626 while (succeeded(parser.parseOptionalComma())) {
627 StringRef mod;
628 if (parser.parseKeyword(&mod))
629 return failure();
630 modifiers.push_back(mod);
631 }
632
633 if (verifyScheduleModifiers(parser, modifiers))
634 return failure();
635
636 if (!modifiers.empty()) {
637 SMLoc loc = parser.getCurrentLocation();
638 if (std::optional<ScheduleModifier> mod =
639 symbolizeScheduleModifier(modifiers[0])) {
640 scheduleMod = ScheduleModifierAttr::get(parser.getContext(), *mod);
641 } else {
642 return parser.emitError(loc, "invalid schedule modifier");
643 }
644 // Only SIMD attribute is allowed here!
645 if (modifiers.size() > 1) {
646 assert(symbolizeScheduleModifier(modifiers[1]) == ScheduleModifier::simd);
647 scheduleSimd = UnitAttr::get(parser.getBuilder().getContext());
648 }
649 }
650
651 return success();
652}
653
654/// Print schedule clause
656 ClauseScheduleKindAttr scheduleKind,
657 ScheduleModifierAttr scheduleMod,
658 UnitAttr scheduleSimd, Value scheduleChunk,
659 Type scheduleChunkType) {
660 p << stringifyClauseScheduleKind(scheduleKind.getValue());
661 if (scheduleChunk)
662 p << " = " << scheduleChunk << " : " << scheduleChunk.getType();
663 if (scheduleMod)
664 p << ", " << stringifyScheduleModifier(scheduleMod.getValue());
665 if (scheduleSimd)
666 p << ", simd";
667}
668
669//===----------------------------------------------------------------------===//
670// Parser and printer for Order Clause
671//===----------------------------------------------------------------------===//
672
673// order ::= `order` `(` [order-modifier ':'] concurrent `)`
674// order-modifier ::= reproducible | unconstrained
675static ParseResult parseOrderClause(OpAsmParser &parser,
676 ClauseOrderKindAttr &order,
677 OrderModifierAttr &orderMod) {
678 StringRef enumStr;
679 SMLoc loc = parser.getCurrentLocation();
680 if (parser.parseKeyword(&enumStr))
681 return failure();
682 if (std::optional<OrderModifier> enumValue =
683 symbolizeOrderModifier(enumStr)) {
684 orderMod = OrderModifierAttr::get(parser.getContext(), *enumValue);
685 if (parser.parseOptionalColon())
686 return failure();
687 loc = parser.getCurrentLocation();
688 if (parser.parseKeyword(&enumStr))
689 return failure();
690 }
691 if (std::optional<ClauseOrderKind> enumValue =
692 symbolizeClauseOrderKind(enumStr)) {
693 order = ClauseOrderKindAttr::get(parser.getContext(), *enumValue);
694 return success();
695 }
696 return parser.emitError(loc, "invalid clause value: '") << enumStr << "'";
697}
698
700 ClauseOrderKindAttr order,
701 OrderModifierAttr orderMod) {
702 if (orderMod)
703 p << stringifyOrderModifier(orderMod.getValue()) << ":";
704 if (order)
705 p << stringifyClauseOrderKind(order.getValue());
706}
707
708template <typename ClauseTypeAttr, typename ClauseType>
709static ParseResult
710parseGranularityClause(OpAsmParser &parser, ClauseTypeAttr &prescriptiveness,
711 std::optional<OpAsmParser::UnresolvedOperand> &operand,
712 Type &operandType,
713 std::optional<ClauseType> (*symbolizeClause)(StringRef),
714 StringRef clauseName) {
715 StringRef enumStr;
716 if (succeeded(parser.parseOptionalKeyword(&enumStr))) {
717 if (std::optional<ClauseType> enumValue = symbolizeClause(enumStr)) {
718 prescriptiveness = ClauseTypeAttr::get(parser.getContext(), *enumValue);
719 if (parser.parseComma())
720 return failure();
721 } else {
722 return parser.emitError(parser.getCurrentLocation())
723 << "invalid " << clauseName << " modifier : '" << enumStr << "'";
724 ;
725 }
726 }
727
729 if (succeeded(parser.parseOperand(var))) {
730 operand = var;
731 } else {
732 return parser.emitError(parser.getCurrentLocation())
733 << "expected " << clauseName << " operand";
734 }
735
736 if (operand.has_value()) {
737 if (parser.parseColonType(operandType))
738 return failure();
739 }
740
741 return success();
742}
743
744template <typename ClauseTypeAttr, typename ClauseType>
745static void
747 ClauseTypeAttr prescriptiveness, Value operand,
748 mlir::Type operandType,
749 StringRef (*stringifyClauseType)(ClauseType)) {
750
751 if (prescriptiveness)
752 p << stringifyClauseType(prescriptiveness.getValue()) << ", ";
753
754 if (operand)
755 p << operand << ": " << operandType;
756}
757
758//===----------------------------------------------------------------------===//
759// Parser and printer for grainsize Clause
760//===----------------------------------------------------------------------===//
761
762// grainsize ::= `grainsize` `(` [strict ':'] grain-size `)`
763static ParseResult
764parseGrainsizeClause(OpAsmParser &parser, ClauseGrainsizeTypeAttr &grainsizeMod,
765 std::optional<OpAsmParser::UnresolvedOperand> &grainsize,
766 Type &grainsizeType) {
768 parser, grainsizeMod, grainsize, grainsizeType,
769 &symbolizeClauseGrainsizeType, "grainsize");
770}
771
773 ClauseGrainsizeTypeAttr grainsizeMod,
774 Value grainsize, mlir::Type grainsizeType) {
776 p, op, grainsizeMod, grainsize, grainsizeType,
777 &stringifyClauseGrainsizeType);
778}
779
780//===----------------------------------------------------------------------===//
781// Parser and printer for num_tasks Clause
782//===----------------------------------------------------------------------===//
783
784// numtask ::= `num_tasks` `(` [strict ':'] num-tasks `)`
785static ParseResult
786parseNumTasksClause(OpAsmParser &parser, ClauseNumTasksTypeAttr &numTasksMod,
787 std::optional<OpAsmParser::UnresolvedOperand> &numTasks,
788 Type &numTasksType) {
790 parser, numTasksMod, numTasks, numTasksType, &symbolizeClauseNumTasksType,
791 "num_tasks");
792}
793
795 ClauseNumTasksTypeAttr numTasksMod,
796 Value numTasks, mlir::Type numTasksType) {
798 p, op, numTasksMod, numTasks, numTasksType, &stringifyClauseNumTasksType);
799}
800
801//===----------------------------------------------------------------------===//
802// Parsers for operations including clauses that define entry block arguments.
803//===----------------------------------------------------------------------===//
804
805namespace {
806struct MapParseArgs {
807 SmallVectorImpl<OpAsmParser::UnresolvedOperand> &vars;
808 SmallVectorImpl<Type> &types;
809 MapParseArgs(SmallVectorImpl<OpAsmParser::UnresolvedOperand> &vars,
810 SmallVectorImpl<Type> &types)
811 : vars(vars), types(types) {}
812};
813struct PrivateParseArgs {
814 llvm::SmallVectorImpl<OpAsmParser::UnresolvedOperand> &vars;
815 llvm::SmallVectorImpl<Type> &types;
816 ArrayAttr &syms;
817 UnitAttr &needsBarrier;
818 DenseI64ArrayAttr *mapIndices;
819 PrivateParseArgs(SmallVectorImpl<OpAsmParser::UnresolvedOperand> &vars,
820 SmallVectorImpl<Type> &types, ArrayAttr &syms,
821 UnitAttr &needsBarrier,
822 DenseI64ArrayAttr *mapIndices = nullptr)
823 : vars(vars), types(types), syms(syms), needsBarrier(needsBarrier),
824 mapIndices(mapIndices) {}
825};
826
827struct ReductionParseArgs {
828 SmallVectorImpl<OpAsmParser::UnresolvedOperand> &vars;
829 SmallVectorImpl<Type> &types;
830 DenseBoolArrayAttr &byref;
831 ArrayAttr &syms;
832 ReductionModifierAttr *modifier;
833 ReductionParseArgs(SmallVectorImpl<OpAsmParser::UnresolvedOperand> &vars,
834 SmallVectorImpl<Type> &types, DenseBoolArrayAttr &byref,
835 ArrayAttr &syms, ReductionModifierAttr *mod = nullptr)
836 : vars(vars), types(types), byref(byref), syms(syms), modifier(mod) {}
837};
838
839struct AllRegionParseArgs {
840 std::optional<MapParseArgs> hasDeviceAddrArgs;
841 std::optional<MapParseArgs> hostEvalArgs;
842 std::optional<ReductionParseArgs> inReductionArgs;
843 std::optional<MapParseArgs> mapArgs;
844 std::optional<PrivateParseArgs> privateArgs;
845 std::optional<ReductionParseArgs> reductionArgs;
846 std::optional<ReductionParseArgs> taskReductionArgs;
847 std::optional<MapParseArgs> useDeviceAddrArgs;
848 std::optional<MapParseArgs> useDevicePtrArgs;
849};
850} // namespace
851
852static inline constexpr StringRef getPrivateNeedsBarrierSpelling() {
853 return "private_barrier";
854}
855
856static ParseResult parseClauseWithRegionArgs(
857 OpAsmParser &parser,
861 ArrayAttr *symbols = nullptr, DenseI64ArrayAttr *mapIndices = nullptr,
862 DenseBoolArrayAttr *byref = nullptr,
863 ReductionModifierAttr *modifier = nullptr,
864 UnitAttr *needsBarrier = nullptr) {
866 SmallVector<int64_t> mapIndicesVec;
867 SmallVector<bool> isByRefVec;
868 unsigned regionArgOffset = regionPrivateArgs.size();
869
870 if (parser.parseLParen())
871 return failure();
872
873 if (modifier && succeeded(parser.parseOptionalKeyword("mod"))) {
874 StringRef enumStr;
875 if (parser.parseColon() || parser.parseKeyword(&enumStr) ||
876 parser.parseComma())
877 return failure();
878 std::optional<ReductionModifier> enumValue =
879 symbolizeReductionModifier(enumStr);
880 if (!enumValue.has_value())
881 return failure();
882 *modifier = ReductionModifierAttr::get(parser.getContext(), *enumValue);
883 if (!*modifier)
884 return failure();
885 }
886
887 if (parser.parseCommaSeparatedList([&]() {
888 if (byref)
889 isByRefVec.push_back(
890 parser.parseOptionalKeyword("byref").succeeded());
891
892 if (symbols && parser.parseAttribute(symbolVec.emplace_back()))
893 return failure();
894
895 if (parser.parseOperand(operands.emplace_back()) ||
896 parser.parseArrow() ||
897 parser.parseArgument(regionPrivateArgs.emplace_back()))
898 return failure();
899
900 if (mapIndices) {
901 if (parser.parseOptionalLSquare().succeeded()) {
902 if (parser.parseKeyword("map_idx") || parser.parseEqual() ||
903 parser.parseInteger(mapIndicesVec.emplace_back()) ||
904 parser.parseRSquare())
905 return failure();
906 } else {
907 mapIndicesVec.push_back(-1);
908 }
909 }
910
911 return success();
912 }))
913 return failure();
914
915 if (parser.parseColon())
916 return failure();
917
918 if (parser.parseCommaSeparatedList([&]() {
919 if (parser.parseType(types.emplace_back()))
920 return failure();
921
922 return success();
923 }))
924 return failure();
925
926 if (operands.size() != types.size())
927 return failure();
928
929 if (parser.parseRParen())
930 return failure();
931
932 if (needsBarrier) {
934 .succeeded())
935 *needsBarrier = mlir::UnitAttr::get(parser.getContext());
936 }
937
938 auto *argsBegin = regionPrivateArgs.begin();
939 MutableArrayRef argsSubrange(argsBegin + regionArgOffset,
940 argsBegin + regionArgOffset + types.size());
941 for (auto [prv, type] : llvm::zip_equal(argsSubrange, types)) {
942 prv.type = type;
943 }
944
945 if (symbols) {
946 SmallVector<Attribute> symbolAttrs(symbolVec.begin(), symbolVec.end());
947 *symbols = ArrayAttr::get(parser.getContext(), symbolAttrs);
948 }
949
950 if (!mapIndicesVec.empty())
951 *mapIndices =
952 mlir::DenseI64ArrayAttr::get(parser.getContext(), mapIndicesVec);
953
954 if (byref)
955 *byref = makeDenseBoolArrayAttr(parser.getContext(), isByRefVec);
956
957 return success();
958}
959
960static ParseResult parseBlockArgClause(
961 OpAsmParser &parser,
963 StringRef keyword, std::optional<MapParseArgs> mapArgs) {
964 if (succeeded(parser.parseOptionalKeyword(keyword))) {
965 if (!mapArgs)
966 return failure();
967
968 if (failed(parseClauseWithRegionArgs(parser, mapArgs->vars, mapArgs->types,
969 entryBlockArgs)))
970 return failure();
971 }
972 return success();
973}
974
975static ParseResult parseBlockArgClause(
976 OpAsmParser &parser,
978 StringRef keyword, std::optional<PrivateParseArgs> privateArgs) {
979 if (succeeded(parser.parseOptionalKeyword(keyword))) {
980 if (!privateArgs)
981 return failure();
982
983 if (failed(parseClauseWithRegionArgs(
984 parser, privateArgs->vars, privateArgs->types, entryBlockArgs,
985 &privateArgs->syms, privateArgs->mapIndices, /*byref=*/nullptr,
986 /*modifier=*/nullptr, &privateArgs->needsBarrier)))
987 return failure();
988 }
989 return success();
990}
991
992static ParseResult parseBlockArgClause(
993 OpAsmParser &parser,
995 StringRef keyword, std::optional<ReductionParseArgs> reductionArgs) {
996 if (succeeded(parser.parseOptionalKeyword(keyword))) {
997 if (!reductionArgs)
998 return failure();
999 if (failed(parseClauseWithRegionArgs(
1000 parser, reductionArgs->vars, reductionArgs->types, entryBlockArgs,
1001 &reductionArgs->syms, /*mapIndices=*/nullptr, &reductionArgs->byref,
1002 reductionArgs->modifier)))
1003 return failure();
1004 }
1005 return success();
1006}
1007
1008static ParseResult parseBlockArgRegion(OpAsmParser &parser, Region &region,
1009 AllRegionParseArgs args) {
1011
1012 if (failed(parseBlockArgClause(parser, entryBlockArgs, "has_device_addr",
1013 args.hasDeviceAddrArgs)))
1014 return parser.emitError(parser.getCurrentLocation())
1015 << "invalid `has_device_addr` format";
1016
1017 if (failed(parseBlockArgClause(parser, entryBlockArgs, "host_eval",
1018 args.hostEvalArgs)))
1019 return parser.emitError(parser.getCurrentLocation())
1020 << "invalid `host_eval` format";
1021
1022 if (failed(parseBlockArgClause(parser, entryBlockArgs, "in_reduction",
1023 args.inReductionArgs)))
1024 return parser.emitError(parser.getCurrentLocation())
1025 << "invalid `in_reduction` format";
1026
1027 if (failed(parseBlockArgClause(parser, entryBlockArgs, "map_entries",
1028 args.mapArgs)))
1029 return parser.emitError(parser.getCurrentLocation())
1030 << "invalid `map_entries` format";
1031
1032 if (failed(parseBlockArgClause(parser, entryBlockArgs, "private",
1033 args.privateArgs)))
1034 return parser.emitError(parser.getCurrentLocation())
1035 << "invalid `private` format";
1036
1037 if (failed(parseBlockArgClause(parser, entryBlockArgs, "reduction",
1038 args.reductionArgs)))
1039 return parser.emitError(parser.getCurrentLocation())
1040 << "invalid `reduction` format";
1041
1042 if (failed(parseBlockArgClause(parser, entryBlockArgs, "task_reduction",
1043 args.taskReductionArgs)))
1044 return parser.emitError(parser.getCurrentLocation())
1045 << "invalid `task_reduction` format";
1046
1047 if (failed(parseBlockArgClause(parser, entryBlockArgs, "use_device_addr",
1048 args.useDeviceAddrArgs)))
1049 return parser.emitError(parser.getCurrentLocation())
1050 << "invalid `use_device_addr` format";
1051
1052 if (failed(parseBlockArgClause(parser, entryBlockArgs, "use_device_ptr",
1053 args.useDevicePtrArgs)))
1054 return parser.emitError(parser.getCurrentLocation())
1055 << "invalid `use_device_addr` format";
1056
1057 return parser.parseRegion(region, entryBlockArgs);
1058}
1059
1060// These parseXyz functions correspond to the custom<Xyz> definitions
1061// in the .td file(s).
1062static ParseResult parseTargetOpRegion(
1063 OpAsmParser &parser, Region &region,
1065 SmallVectorImpl<Type> &hasDeviceAddrTypes,
1067 SmallVectorImpl<Type> &hostEvalTypes,
1069 SmallVectorImpl<Type> &inReductionTypes,
1070 DenseBoolArrayAttr &inReductionByref, ArrayAttr &inReductionSyms,
1072 SmallVectorImpl<Type> &mapTypes,
1074 llvm::SmallVectorImpl<Type> &privateTypes, ArrayAttr &privateSyms,
1075 UnitAttr &privateNeedsBarrier, DenseI64ArrayAttr &privateMaps) {
1076 AllRegionParseArgs args;
1077 args.hasDeviceAddrArgs.emplace(hasDeviceAddrVars, hasDeviceAddrTypes);
1078 args.hostEvalArgs.emplace(hostEvalVars, hostEvalTypes);
1079 args.inReductionArgs.emplace(inReductionVars, inReductionTypes,
1080 inReductionByref, inReductionSyms);
1081 args.mapArgs.emplace(mapVars, mapTypes);
1082 args.privateArgs.emplace(privateVars, privateTypes, privateSyms,
1083 privateNeedsBarrier, &privateMaps);
1084 return parseBlockArgRegion(parser, region, args);
1085}
1086
1088 OpAsmParser &parser, Region &region,
1090 SmallVectorImpl<Type> &inReductionTypes,
1091 DenseBoolArrayAttr &inReductionByref, ArrayAttr &inReductionSyms,
1093 llvm::SmallVectorImpl<Type> &privateTypes, ArrayAttr &privateSyms,
1094 UnitAttr &privateNeedsBarrier) {
1095 AllRegionParseArgs args;
1096 args.inReductionArgs.emplace(inReductionVars, inReductionTypes,
1097 inReductionByref, inReductionSyms);
1098 args.privateArgs.emplace(privateVars, privateTypes, privateSyms,
1099 privateNeedsBarrier);
1100 return parseBlockArgRegion(parser, region, args);
1101}
1102
1104 OpAsmParser &parser, Region &region,
1106 SmallVectorImpl<Type> &inReductionTypes,
1107 DenseBoolArrayAttr &inReductionByref, ArrayAttr &inReductionSyms,
1109 llvm::SmallVectorImpl<Type> &privateTypes, ArrayAttr &privateSyms,
1110 UnitAttr &privateNeedsBarrier, ReductionModifierAttr &reductionMod,
1112 SmallVectorImpl<Type> &reductionTypes, DenseBoolArrayAttr &reductionByref,
1113 ArrayAttr &reductionSyms) {
1114 AllRegionParseArgs args;
1115 args.inReductionArgs.emplace(inReductionVars, inReductionTypes,
1116 inReductionByref, inReductionSyms);
1117 args.privateArgs.emplace(privateVars, privateTypes, privateSyms,
1118 privateNeedsBarrier);
1119 args.reductionArgs.emplace(reductionVars, reductionTypes, reductionByref,
1120 reductionSyms, &reductionMod);
1121 return parseBlockArgRegion(parser, region, args);
1122}
1123
1124static ParseResult parsePrivateRegion(
1125 OpAsmParser &parser, Region &region,
1127 llvm::SmallVectorImpl<Type> &privateTypes, ArrayAttr &privateSyms,
1128 UnitAttr &privateNeedsBarrier) {
1129 AllRegionParseArgs args;
1130 args.privateArgs.emplace(privateVars, privateTypes, privateSyms,
1131 privateNeedsBarrier);
1132 return parseBlockArgRegion(parser, region, args);
1133}
1134
1136 OpAsmParser &parser, Region &region,
1138 llvm::SmallVectorImpl<Type> &privateTypes, ArrayAttr &privateSyms,
1139 UnitAttr &privateNeedsBarrier, ReductionModifierAttr &reductionMod,
1141 SmallVectorImpl<Type> &reductionTypes, DenseBoolArrayAttr &reductionByref,
1142 ArrayAttr &reductionSyms) {
1143 AllRegionParseArgs args;
1144 args.privateArgs.emplace(privateVars, privateTypes, privateSyms,
1145 privateNeedsBarrier);
1146 args.reductionArgs.emplace(reductionVars, reductionTypes, reductionByref,
1147 reductionSyms, &reductionMod);
1148 return parseBlockArgRegion(parser, region, args);
1149}
1150
1151static ParseResult parseTaskReductionRegion(
1152 OpAsmParser &parser, Region &region,
1154 SmallVectorImpl<Type> &taskReductionTypes,
1155 DenseBoolArrayAttr &taskReductionByref, ArrayAttr &taskReductionSyms) {
1156 AllRegionParseArgs args;
1157 args.taskReductionArgs.emplace(taskReductionVars, taskReductionTypes,
1158 taskReductionByref, taskReductionSyms);
1159 return parseBlockArgRegion(parser, region, args);
1160}
1161
1163 OpAsmParser &parser, Region &region,
1165 SmallVectorImpl<Type> &useDeviceAddrTypes,
1167 SmallVectorImpl<Type> &useDevicePtrTypes) {
1168 AllRegionParseArgs args;
1169 args.useDeviceAddrArgs.emplace(useDeviceAddrVars, useDeviceAddrTypes);
1170 args.useDevicePtrArgs.emplace(useDevicePtrVars, useDevicePtrTypes);
1171 return parseBlockArgRegion(parser, region, args);
1172}
1173
1174//===----------------------------------------------------------------------===//
1175// Printers for operations including clauses that define entry block arguments.
1176//===----------------------------------------------------------------------===//
1177
1178namespace {
1179struct MapPrintArgs {
1180 ValueRange vars;
1181 TypeRange types;
1182 MapPrintArgs(ValueRange vars, TypeRange types) : vars(vars), types(types) {}
1183};
1184struct PrivatePrintArgs {
1185 ValueRange vars;
1186 TypeRange types;
1187 ArrayAttr syms;
1188 UnitAttr needsBarrier;
1189 DenseI64ArrayAttr mapIndices;
1190 PrivatePrintArgs(ValueRange vars, TypeRange types, ArrayAttr syms,
1191 UnitAttr needsBarrier, DenseI64ArrayAttr mapIndices)
1192 : vars(vars), types(types), syms(syms), needsBarrier(needsBarrier),
1193 mapIndices(mapIndices) {}
1194};
1195struct ReductionPrintArgs {
1196 ValueRange vars;
1197 TypeRange types;
1198 DenseBoolArrayAttr byref;
1199 ArrayAttr syms;
1200 ReductionModifierAttr modifier;
1201 ReductionPrintArgs(ValueRange vars, TypeRange types, DenseBoolArrayAttr byref,
1202 ArrayAttr syms, ReductionModifierAttr mod = nullptr)
1203 : vars(vars), types(types), byref(byref), syms(syms), modifier(mod) {}
1204};
1205struct AllRegionPrintArgs {
1206 std::optional<MapPrintArgs> hasDeviceAddrArgs;
1207 std::optional<MapPrintArgs> hostEvalArgs;
1208 std::optional<ReductionPrintArgs> inReductionArgs;
1209 std::optional<MapPrintArgs> mapArgs;
1210 std::optional<PrivatePrintArgs> privateArgs;
1211 std::optional<ReductionPrintArgs> reductionArgs;
1212 std::optional<ReductionPrintArgs> taskReductionArgs;
1213 std::optional<MapPrintArgs> useDeviceAddrArgs;
1214 std::optional<MapPrintArgs> useDevicePtrArgs;
1215};
1216} // namespace
1217
1219 OpAsmPrinter &p, MLIRContext *ctx, StringRef clauseName,
1220 ValueRange argsSubrange, ValueRange operands, TypeRange types,
1221 ArrayAttr symbols = nullptr, DenseI64ArrayAttr mapIndices = nullptr,
1222 DenseBoolArrayAttr byref = nullptr,
1223 ReductionModifierAttr modifier = nullptr, UnitAttr needsBarrier = nullptr) {
1224 if (argsSubrange.empty())
1225 return;
1226
1227 p << clauseName << "(";
1228
1229 if (modifier)
1230 p << "mod: " << stringifyReductionModifier(modifier.getValue()) << ", ";
1231
1232 if (!symbols) {
1233 llvm::SmallVector<Attribute> values(operands.size(), nullptr);
1234 symbols = ArrayAttr::get(ctx, values);
1235 }
1236
1237 if (!mapIndices) {
1238 llvm::SmallVector<int64_t> values(operands.size(), -1);
1239 mapIndices = DenseI64ArrayAttr::get(ctx, values);
1240 }
1241
1242 if (!byref) {
1243 mlir::SmallVector<bool> values(operands.size(), false);
1244 byref = DenseBoolArrayAttr::get(ctx, values);
1245 }
1246
1247 llvm::interleaveComma(llvm::zip_equal(operands, argsSubrange, symbols,
1248 mapIndices.asArrayRef(),
1249 byref.asArrayRef()),
1250 p, [&p](auto t) {
1251 auto [op, arg, sym, map, isByRef] = t;
1252 if (isByRef)
1253 p << "byref ";
1254 if (sym)
1255 p << sym << " ";
1256
1257 p << op << " -> " << arg;
1258
1259 if (map != -1)
1260 p << " [map_idx=" << map << "]";
1261 });
1262 p << " : ";
1263 llvm::interleaveComma(types, p);
1264 p << ") ";
1265
1266 if (needsBarrier)
1267 p << getPrivateNeedsBarrierSpelling() << " ";
1268}
1269
1271 StringRef clauseName, ValueRange argsSubrange,
1272 std::optional<MapPrintArgs> mapArgs) {
1273 if (mapArgs)
1274 printClauseWithRegionArgs(p, ctx, clauseName, argsSubrange, mapArgs->vars,
1275 mapArgs->types);
1276}
1277
1279 StringRef clauseName, ValueRange argsSubrange,
1280 std::optional<PrivatePrintArgs> privateArgs) {
1281 if (privateArgs)
1283 p, ctx, clauseName, argsSubrange, privateArgs->vars, privateArgs->types,
1284 privateArgs->syms, privateArgs->mapIndices, /*byref=*/nullptr,
1285 /*modifier=*/nullptr, privateArgs->needsBarrier);
1286}
1287
1288static void
1289printBlockArgClause(OpAsmPrinter &p, MLIRContext *ctx, StringRef clauseName,
1290 ValueRange argsSubrange,
1291 std::optional<ReductionPrintArgs> reductionArgs) {
1292 if (reductionArgs)
1293 printClauseWithRegionArgs(p, ctx, clauseName, argsSubrange,
1294 reductionArgs->vars, reductionArgs->types,
1295 reductionArgs->syms, /*mapIndices=*/nullptr,
1296 reductionArgs->byref, reductionArgs->modifier);
1297}
1298
1300 const AllRegionPrintArgs &args) {
1301 auto iface = llvm::cast<mlir::omp::BlockArgOpenMPOpInterface>(op);
1302 MLIRContext *ctx = op->getContext();
1303
1304 printBlockArgClause(p, ctx, "has_device_addr",
1305 iface.getHasDeviceAddrBlockArgs(),
1306 args.hasDeviceAddrArgs);
1307 printBlockArgClause(p, ctx, "host_eval", iface.getHostEvalBlockArgs(),
1308 args.hostEvalArgs);
1309 printBlockArgClause(p, ctx, "in_reduction", iface.getInReductionBlockArgs(),
1310 args.inReductionArgs);
1311 printBlockArgClause(p, ctx, "map_entries", iface.getMapBlockArgs(),
1312 args.mapArgs);
1313 printBlockArgClause(p, ctx, "private", iface.getPrivateBlockArgs(),
1314 args.privateArgs);
1315 printBlockArgClause(p, ctx, "reduction", iface.getReductionBlockArgs(),
1316 args.reductionArgs);
1317 printBlockArgClause(p, ctx, "task_reduction",
1318 iface.getTaskReductionBlockArgs(),
1319 args.taskReductionArgs);
1320 printBlockArgClause(p, ctx, "use_device_addr",
1321 iface.getUseDeviceAddrBlockArgs(),
1322 args.useDeviceAddrArgs);
1323 printBlockArgClause(p, ctx, "use_device_ptr",
1324 iface.getUseDevicePtrBlockArgs(), args.useDevicePtrArgs);
1325
1326 p.printRegion(region, /*printEntryBlockArgs=*/false);
1327}
1328
1329// These parseXyz functions correspond to the custom<Xyz> definitions
1330// in the .td file(s).
1332 OpAsmPrinter &p, Operation *op, Region &region,
1333 ValueRange hasDeviceAddrVars, TypeRange hasDeviceAddrTypes,
1334 ValueRange hostEvalVars, TypeRange hostEvalTypes,
1335 ValueRange inReductionVars, TypeRange inReductionTypes,
1336 DenseBoolArrayAttr inReductionByref, ArrayAttr inReductionSyms,
1337 ValueRange mapVars, TypeRange mapTypes, ValueRange privateVars,
1338 TypeRange privateTypes, ArrayAttr privateSyms, UnitAttr privateNeedsBarrier,
1339 DenseI64ArrayAttr privateMaps) {
1340 AllRegionPrintArgs args;
1341 args.hasDeviceAddrArgs.emplace(hasDeviceAddrVars, hasDeviceAddrTypes);
1342 args.hostEvalArgs.emplace(hostEvalVars, hostEvalTypes);
1343 args.inReductionArgs.emplace(inReductionVars, inReductionTypes,
1344 inReductionByref, inReductionSyms);
1345 args.mapArgs.emplace(mapVars, mapTypes);
1346 args.privateArgs.emplace(privateVars, privateTypes, privateSyms,
1347 privateNeedsBarrier, privateMaps);
1348 printBlockArgRegion(p, op, region, args);
1349}
1350
1352 OpAsmPrinter &p, Operation *op, Region &region, ValueRange inReductionVars,
1353 TypeRange inReductionTypes, DenseBoolArrayAttr inReductionByref,
1354 ArrayAttr inReductionSyms, ValueRange privateVars, TypeRange privateTypes,
1355 ArrayAttr privateSyms, UnitAttr privateNeedsBarrier) {
1356 AllRegionPrintArgs args;
1357 args.inReductionArgs.emplace(inReductionVars, inReductionTypes,
1358 inReductionByref, inReductionSyms);
1359 args.privateArgs.emplace(privateVars, privateTypes, privateSyms,
1360 privateNeedsBarrier,
1361 /*mapIndices=*/nullptr);
1362 printBlockArgRegion(p, op, region, args);
1363}
1364
1366 OpAsmPrinter &p, Operation *op, Region &region, ValueRange inReductionVars,
1367 TypeRange inReductionTypes, DenseBoolArrayAttr inReductionByref,
1368 ArrayAttr inReductionSyms, ValueRange privateVars, TypeRange privateTypes,
1369 ArrayAttr privateSyms, UnitAttr privateNeedsBarrier,
1370 ReductionModifierAttr reductionMod, ValueRange reductionVars,
1371 TypeRange reductionTypes, DenseBoolArrayAttr reductionByref,
1372 ArrayAttr reductionSyms) {
1373 AllRegionPrintArgs args;
1374 args.inReductionArgs.emplace(inReductionVars, inReductionTypes,
1375 inReductionByref, inReductionSyms);
1376 args.privateArgs.emplace(privateVars, privateTypes, privateSyms,
1377 privateNeedsBarrier,
1378 /*mapIndices=*/nullptr);
1379 args.reductionArgs.emplace(reductionVars, reductionTypes, reductionByref,
1380 reductionSyms, reductionMod);
1381 printBlockArgRegion(p, op, region, args);
1382}
1383
1385 ValueRange privateVars, TypeRange privateTypes,
1386 ArrayAttr privateSyms,
1387 UnitAttr privateNeedsBarrier) {
1388 AllRegionPrintArgs args;
1389 args.privateArgs.emplace(privateVars, privateTypes, privateSyms,
1390 privateNeedsBarrier,
1391 /*mapIndices=*/nullptr);
1392 printBlockArgRegion(p, op, region, args);
1393}
1394
1396 OpAsmPrinter &p, Operation *op, Region &region, ValueRange privateVars,
1397 TypeRange privateTypes, ArrayAttr privateSyms, UnitAttr privateNeedsBarrier,
1398 ReductionModifierAttr reductionMod, ValueRange reductionVars,
1399 TypeRange reductionTypes, DenseBoolArrayAttr reductionByref,
1400 ArrayAttr reductionSyms) {
1401 AllRegionPrintArgs args;
1402 args.privateArgs.emplace(privateVars, privateTypes, privateSyms,
1403 privateNeedsBarrier,
1404 /*mapIndices=*/nullptr);
1405 args.reductionArgs.emplace(reductionVars, reductionTypes, reductionByref,
1406 reductionSyms, reductionMod);
1407 printBlockArgRegion(p, op, region, args);
1408}
1409
1411 Region &region,
1412 ValueRange taskReductionVars,
1413 TypeRange taskReductionTypes,
1414 DenseBoolArrayAttr taskReductionByref,
1415 ArrayAttr taskReductionSyms) {
1416 AllRegionPrintArgs args;
1417 args.taskReductionArgs.emplace(taskReductionVars, taskReductionTypes,
1418 taskReductionByref, taskReductionSyms);
1419 printBlockArgRegion(p, op, region, args);
1420}
1421
1423 Region &region,
1424 ValueRange useDeviceAddrVars,
1425 TypeRange useDeviceAddrTypes,
1426 ValueRange useDevicePtrVars,
1427 TypeRange useDevicePtrTypes) {
1428 AllRegionPrintArgs args;
1429 args.useDeviceAddrArgs.emplace(useDeviceAddrVars, useDeviceAddrTypes);
1430 args.useDevicePtrArgs.emplace(useDevicePtrVars, useDevicePtrTypes);
1431 printBlockArgRegion(p, op, region, args);
1432}
1433
1434/// Verifies Reduction Clause
1435static LogicalResult
1436verifyReductionVarList(Operation *op, std::optional<ArrayAttr> reductionSyms,
1437 OperandRange reductionVars,
1438 std::optional<ArrayRef<bool>> reductionByref) {
1439 if (!reductionVars.empty()) {
1440 if (!reductionSyms || reductionSyms->size() != reductionVars.size())
1441 return op->emitOpError()
1442 << "expected as many reduction symbol references "
1443 "as reduction variables";
1444 if (reductionByref && reductionByref->size() != reductionVars.size())
1445 return op->emitError() << "expected as many reduction variable by "
1446 "reference attributes as reduction variables";
1447 } else {
1448 if (reductionSyms)
1449 return op->emitOpError() << "unexpected reduction symbol references";
1450 return success();
1451 }
1452
1453 // TODO: The followings should be done in
1454 // SymbolUserOpInterface::verifySymbolUses.
1455 DenseSet<Value> accumulators;
1456 for (auto args : llvm::zip(reductionVars, *reductionSyms)) {
1457 Value accum = std::get<0>(args);
1458
1459 if (!accumulators.insert(accum).second)
1460 return op->emitOpError() << "accumulator variable used more than once";
1461
1462 Type varType = accum.getType();
1463 auto symbolRef = llvm::cast<SymbolRefAttr>(std::get<1>(args));
1464 auto decl =
1466 if (!decl)
1467 return op->emitOpError() << "expected symbol reference " << symbolRef
1468 << " to point to a reduction declaration";
1469
1470 if (decl.getAccumulatorType() && decl.getAccumulatorType() != varType)
1471 return op->emitOpError()
1472 << "expected accumulator (" << varType
1473 << ") to be the same type as reduction declaration ("
1474 << decl.getAccumulatorType() << ")";
1475 }
1476
1477 return success();
1478}
1479
1480//===----------------------------------------------------------------------===//
1481// Parser, printer and verifier for Copyprivate
1482//===----------------------------------------------------------------------===//
1483
1484/// copyprivate-entry-list ::= copyprivate-entry
1485/// | copyprivate-entry-list `,` copyprivate-entry
1486/// copyprivate-entry ::= ssa-id `->` symbol-ref `:` type
1487static ParseResult parseCopyprivate(
1488 OpAsmParser &parser,
1490 SmallVectorImpl<Type> &copyprivateTypes, ArrayAttr &copyprivateSyms) {
1492 if (failed(parser.parseCommaSeparatedList([&]() {
1493 if (parser.parseOperand(copyprivateVars.emplace_back()) ||
1494 parser.parseArrow() ||
1495 parser.parseAttribute(symsVec.emplace_back()) ||
1496 parser.parseColonType(copyprivateTypes.emplace_back()))
1497 return failure();
1498 return success();
1499 })))
1500 return failure();
1501 SmallVector<Attribute> syms(symsVec.begin(), symsVec.end());
1502 copyprivateSyms = ArrayAttr::get(parser.getContext(), syms);
1503 return success();
1504}
1505
1506/// Print Copyprivate clause
1508 OperandRange copyprivateVars,
1509 TypeRange copyprivateTypes,
1510 std::optional<ArrayAttr> copyprivateSyms) {
1511 if (!copyprivateSyms.has_value())
1512 return;
1513 llvm::interleaveComma(
1514 llvm::zip(copyprivateVars, *copyprivateSyms, copyprivateTypes), p,
1515 [&](const auto &args) {
1516 p << std::get<0>(args) << " -> " << std::get<1>(args) << " : "
1517 << std::get<2>(args);
1518 });
1519}
1520
1521/// Verifies CopyPrivate Clause
1522static LogicalResult
1524 std::optional<ArrayAttr> copyprivateSyms) {
1525 size_t copyprivateSymsSize =
1526 copyprivateSyms.has_value() ? copyprivateSyms->size() : 0;
1527 if (copyprivateSymsSize != copyprivateVars.size())
1528 return op->emitOpError() << "inconsistent number of copyprivate vars (= "
1529 << copyprivateVars.size()
1530 << ") and functions (= " << copyprivateSymsSize
1531 << "), both must be equal";
1532 if (!copyprivateSyms.has_value())
1533 return success();
1534
1535 for (auto copyprivateVarAndSym :
1536 llvm::zip(copyprivateVars, *copyprivateSyms)) {
1537 auto symbolRef =
1538 llvm::cast<SymbolRefAttr>(std::get<1>(copyprivateVarAndSym));
1539 std::optional<std::variant<mlir::func::FuncOp, mlir::LLVM::LLVMFuncOp>>
1540 funcOp;
1541 if (mlir::func::FuncOp mlirFuncOp =
1543 symbolRef))
1544 funcOp = mlirFuncOp;
1545 else if (mlir::LLVM::LLVMFuncOp llvmFuncOp =
1547 op, symbolRef))
1548 funcOp = llvmFuncOp;
1549
1550 auto getNumArguments = [&] {
1551 return std::visit([](auto &f) { return f.getNumArguments(); }, *funcOp);
1552 };
1553
1554 auto getArgumentType = [&](unsigned i) {
1555 return std::visit([i](auto &f) { return f.getArgumentTypes()[i]; },
1556 *funcOp);
1557 };
1558
1559 if (!funcOp)
1560 return op->emitOpError() << "expected symbol reference " << symbolRef
1561 << " to point to a copy function";
1562
1563 if (getNumArguments() != 2)
1564 return op->emitOpError()
1565 << "expected copy function " << symbolRef << " to have 2 operands";
1566
1567 Type argTy = getArgumentType(0);
1568 if (argTy != getArgumentType(1))
1569 return op->emitOpError() << "expected copy function " << symbolRef
1570 << " arguments to have the same type";
1571
1572 Type varType = std::get<0>(copyprivateVarAndSym).getType();
1573 if (argTy != varType)
1574 return op->emitOpError()
1575 << "expected copy function arguments' type (" << argTy
1576 << ") to be the same as copyprivate variable's type (" << varType
1577 << ")";
1578 }
1579
1580 return success();
1581}
1582
1583//===----------------------------------------------------------------------===//
1584// Parser, printer and verifier for DependVarList
1585//===----------------------------------------------------------------------===//
1586
1587/// depend-entry-list ::= depend-entry
1588/// | depend-entry-list `,` depend-entry
1589/// depend-entry ::= depend-kind `->` ssa-id `:` type
1590static ParseResult
1593 SmallVectorImpl<Type> &dependTypes, ArrayAttr &dependKinds) {
1595 if (failed(parser.parseCommaSeparatedList([&]() {
1596 StringRef keyword;
1597 if (parser.parseKeyword(&keyword) || parser.parseArrow() ||
1598 parser.parseOperand(dependVars.emplace_back()) ||
1599 parser.parseColonType(dependTypes.emplace_back()))
1600 return failure();
1601 if (std::optional<ClauseTaskDepend> keywordDepend =
1602 (symbolizeClauseTaskDepend(keyword)))
1603 kindsVec.emplace_back(
1604 ClauseTaskDependAttr::get(parser.getContext(), *keywordDepend));
1605 else
1606 return failure();
1607 return success();
1608 })))
1609 return failure();
1610 SmallVector<Attribute> kinds(kindsVec.begin(), kindsVec.end());
1611 dependKinds = ArrayAttr::get(parser.getContext(), kinds);
1612 return success();
1613}
1614
1615/// Print Depend clause
1617 OperandRange dependVars, TypeRange dependTypes,
1618 std::optional<ArrayAttr> dependKinds) {
1619
1620 for (unsigned i = 0, e = dependKinds->size(); i < e; ++i) {
1621 if (i != 0)
1622 p << ", ";
1623 p << stringifyClauseTaskDepend(
1624 llvm::cast<mlir::omp::ClauseTaskDependAttr>((*dependKinds)[i])
1625 .getValue())
1626 << " -> " << dependVars[i] << " : " << dependTypes[i];
1627 }
1628}
1629
1630/// Verifies Depend clause
1631static LogicalResult verifyDependVarList(Operation *op,
1632 std::optional<ArrayAttr> dependKinds,
1633 OperandRange dependVars) {
1634 if (!dependVars.empty()) {
1635 if (!dependKinds || dependKinds->size() != dependVars.size())
1636 return op->emitOpError() << "expected as many depend values"
1637 " as depend variables";
1638 } else {
1639 if (dependKinds && !dependKinds->empty())
1640 return op->emitOpError() << "unexpected depend values";
1641 return success();
1642 }
1643
1644 return success();
1645}
1646
1647//===----------------------------------------------------------------------===//
1648// Parser, printer and verifier for Synchronization Hint (2.17.12)
1649//===----------------------------------------------------------------------===//
1650
1651/// Parses a Synchronization Hint clause. The value of hint is an integer
1652/// which is a combination of different hints from `omp_sync_hint_t`.
1653///
1654/// hint-clause = `hint` `(` hint-value `)`
1655static ParseResult parseSynchronizationHint(OpAsmParser &parser,
1656 IntegerAttr &hintAttr) {
1657 StringRef hintKeyword;
1658 int64_t hint = 0;
1659 if (succeeded(parser.parseOptionalKeyword("none"))) {
1660 hintAttr = IntegerAttr::get(parser.getBuilder().getI64Type(), 0);
1661 return success();
1662 }
1663 auto parseKeyword = [&]() -> ParseResult {
1664 if (failed(parser.parseKeyword(&hintKeyword)))
1665 return failure();
1666 if (hintKeyword == "uncontended")
1667 hint |= 1;
1668 else if (hintKeyword == "contended")
1669 hint |= 2;
1670 else if (hintKeyword == "nonspeculative")
1671 hint |= 4;
1672 else if (hintKeyword == "speculative")
1673 hint |= 8;
1674 else
1675 return parser.emitError(parser.getCurrentLocation())
1676 << hintKeyword << " is not a valid hint";
1677 return success();
1678 };
1679 if (parser.parseCommaSeparatedList(parseKeyword))
1680 return failure();
1681 hintAttr = IntegerAttr::get(parser.getBuilder().getI64Type(), hint);
1682 return success();
1683}
1684
1685/// Prints a Synchronization Hint clause
1687 IntegerAttr hintAttr) {
1688 int64_t hint = hintAttr.getInt();
1689
1690 if (hint == 0) {
1691 p << "none";
1692 return;
1693 }
1694
1695 // Helper function to get n-th bit from the right end of `value`
1696 auto bitn = [](int value, int n) -> bool { return value & (1 << n); };
1697
1698 bool uncontended = bitn(hint, 0);
1699 bool contended = bitn(hint, 1);
1700 bool nonspeculative = bitn(hint, 2);
1701 bool speculative = bitn(hint, 3);
1702
1704 if (uncontended)
1705 hints.push_back("uncontended");
1706 if (contended)
1707 hints.push_back("contended");
1708 if (nonspeculative)
1709 hints.push_back("nonspeculative");
1710 if (speculative)
1711 hints.push_back("speculative");
1712
1713 llvm::interleaveComma(hints, p);
1714}
1715
1716/// Verifies a synchronization hint clause
1717static LogicalResult verifySynchronizationHint(Operation *op, uint64_t hint) {
1718
1719 // Helper function to get n-th bit from the right end of `value`
1720 auto bitn = [](int value, int n) -> bool { return value & (1 << n); };
1721
1722 bool uncontended = bitn(hint, 0);
1723 bool contended = bitn(hint, 1);
1724 bool nonspeculative = bitn(hint, 2);
1725 bool speculative = bitn(hint, 3);
1726
1727 if (uncontended && contended)
1728 return op->emitOpError() << "the hints omp_sync_hint_uncontended and "
1729 "omp_sync_hint_contended cannot be combined";
1730 if (nonspeculative && speculative)
1731 return op->emitOpError() << "the hints omp_sync_hint_nonspeculative and "
1732 "omp_sync_hint_speculative cannot be combined.";
1733 return success();
1734}
1735
1736//===----------------------------------------------------------------------===//
1737// Parser, printer and verifier for Target
1738//===----------------------------------------------------------------------===//
1739
1740// Helper function to get bitwise AND of `value` and 'flag' then return it as a
1741// boolean
1742static bool mapTypeToBool(ClauseMapFlags value, ClauseMapFlags flag) {
1743 return (value & flag) == flag;
1744}
1745
1746/// Parses a map_entries map type from a string format back into its numeric
1747/// value.
1748///
1749/// map-clause = `map_clauses ( ( `(` `always, `? `implicit, `? `ompx_hold, `?
1750/// `close, `? `present, `? ( `to` | `from` | `delete` `)` )+ `)` )
1751static ParseResult parseMapClause(OpAsmParser &parser,
1752 ClauseMapFlagsAttr &mapType) {
1753 ClauseMapFlags mapTypeBits = ClauseMapFlags::none;
1754 // This simply verifies the correct keyword is read in, the
1755 // keyword itself is stored inside of the operation
1756 auto parseTypeAndMod = [&]() -> ParseResult {
1757 StringRef mapTypeMod;
1758 if (parser.parseKeyword(&mapTypeMod))
1759 return failure();
1760
1761 if (mapTypeMod == "always")
1762 mapTypeBits |= ClauseMapFlags::always;
1763
1764 if (mapTypeMod == "implicit")
1765 mapTypeBits |= ClauseMapFlags::implicit;
1766
1767 if (mapTypeMod == "ompx_hold")
1768 mapTypeBits |= ClauseMapFlags::ompx_hold;
1769
1770 if (mapTypeMod == "close")
1771 mapTypeBits |= ClauseMapFlags::close;
1772
1773 if (mapTypeMod == "present")
1774 mapTypeBits |= ClauseMapFlags::present;
1775
1776 if (mapTypeMod == "to")
1777 mapTypeBits |= ClauseMapFlags::to;
1778
1779 if (mapTypeMod == "from")
1780 mapTypeBits |= ClauseMapFlags::from;
1781
1782 if (mapTypeMod == "tofrom")
1783 mapTypeBits |= ClauseMapFlags::to | ClauseMapFlags::from;
1784
1785 if (mapTypeMod == "delete")
1786 mapTypeBits |= ClauseMapFlags::del;
1787
1788 if (mapTypeMod == "storage")
1789 mapTypeBits |= ClauseMapFlags::storage;
1790
1791 if (mapTypeMod == "return_param")
1792 mapTypeBits |= ClauseMapFlags::return_param;
1793
1794 if (mapTypeMod == "private")
1795 mapTypeBits |= ClauseMapFlags::priv;
1796
1797 if (mapTypeMod == "literal")
1798 mapTypeBits |= ClauseMapFlags::literal;
1799
1800 if (mapTypeMod == "attach")
1801 mapTypeBits |= ClauseMapFlags::attach;
1802
1803 if (mapTypeMod == "attach_always")
1804 mapTypeBits |= ClauseMapFlags::attach_always;
1805
1806 if (mapTypeMod == "attach_none")
1807 mapTypeBits |= ClauseMapFlags::attach_none;
1808
1809 if (mapTypeMod == "attach_auto")
1810 mapTypeBits |= ClauseMapFlags::attach_auto;
1811
1812 if (mapTypeMod == "ref_ptr")
1813 mapTypeBits |= ClauseMapFlags::ref_ptr;
1814
1815 if (mapTypeMod == "ref_ptee")
1816 mapTypeBits |= ClauseMapFlags::ref_ptee;
1817
1818 if (mapTypeMod == "ref_ptr_ptee")
1819 mapTypeBits |= ClauseMapFlags::ref_ptr_ptee;
1820
1821 if (mapTypeMod == "is_device_ptr")
1822 mapTypeBits |= ClauseMapFlags::is_device_ptr;
1823
1824 return success();
1825 };
1826
1827 if (parser.parseCommaSeparatedList(parseTypeAndMod))
1828 return failure();
1829
1830 mapType =
1831 parser.getBuilder().getAttr<mlir::omp::ClauseMapFlagsAttr>(mapTypeBits);
1832
1833 return success();
1834}
1835
1836/// Prints a map_entries map type from its numeric value out into its string
1837/// format.
1838static void printMapClause(OpAsmPrinter &p, Operation *op,
1839 ClauseMapFlagsAttr mapType) {
1841 ClauseMapFlags mapFlags = mapType.getValue();
1842
1843 // handling of always, close, present placed at the beginning of the string
1844 // to aid readability
1845 if (mapTypeToBool(mapFlags, ClauseMapFlags::always))
1846 mapTypeStrs.push_back("always");
1847 if (mapTypeToBool(mapFlags, ClauseMapFlags::implicit))
1848 mapTypeStrs.push_back("implicit");
1849 if (mapTypeToBool(mapFlags, ClauseMapFlags::ompx_hold))
1850 mapTypeStrs.push_back("ompx_hold");
1851 if (mapTypeToBool(mapFlags, ClauseMapFlags::close))
1852 mapTypeStrs.push_back("close");
1853 if (mapTypeToBool(mapFlags, ClauseMapFlags::present))
1854 mapTypeStrs.push_back("present");
1855
1856 // special handling of to/from/tofrom/delete and release/alloc, release +
1857 // alloc are the abscense of one of the other flags, whereas tofrom requires
1858 // both the to and from flag to be set.
1859 bool to = mapTypeToBool(mapFlags, ClauseMapFlags::to);
1860 bool from = mapTypeToBool(mapFlags, ClauseMapFlags::from);
1861
1862 if (to && from)
1863 mapTypeStrs.push_back("tofrom");
1864 else if (from)
1865 mapTypeStrs.push_back("from");
1866 else if (to)
1867 mapTypeStrs.push_back("to");
1868
1869 if (mapTypeToBool(mapFlags, ClauseMapFlags::del))
1870 mapTypeStrs.push_back("delete");
1871 if (mapTypeToBool(mapFlags, ClauseMapFlags::return_param))
1872 mapTypeStrs.push_back("return_param");
1873 if (mapTypeToBool(mapFlags, ClauseMapFlags::storage))
1874 mapTypeStrs.push_back("storage");
1875 if (mapTypeToBool(mapFlags, ClauseMapFlags::priv))
1876 mapTypeStrs.push_back("private");
1877 if (mapTypeToBool(mapFlags, ClauseMapFlags::literal))
1878 mapTypeStrs.push_back("literal");
1879 if (mapTypeToBool(mapFlags, ClauseMapFlags::attach))
1880 mapTypeStrs.push_back("attach");
1881 if (mapTypeToBool(mapFlags, ClauseMapFlags::attach_always))
1882 mapTypeStrs.push_back("attach_always");
1883 if (mapTypeToBool(mapFlags, ClauseMapFlags::attach_none))
1884 mapTypeStrs.push_back("attach_none");
1885 if (mapTypeToBool(mapFlags, ClauseMapFlags::attach_auto))
1886 mapTypeStrs.push_back("attach_auto");
1887 if (mapTypeToBool(mapFlags, ClauseMapFlags::ref_ptr))
1888 mapTypeStrs.push_back("ref_ptr");
1889 if (mapTypeToBool(mapFlags, ClauseMapFlags::ref_ptee))
1890 mapTypeStrs.push_back("ref_ptee");
1891 if (mapTypeToBool(mapFlags, ClauseMapFlags::ref_ptr_ptee))
1892 mapTypeStrs.push_back("ref_ptr_ptee");
1893 if (mapTypeToBool(mapFlags, ClauseMapFlags::is_device_ptr))
1894 mapTypeStrs.push_back("is_device_ptr");
1895 if (mapFlags == ClauseMapFlags::none)
1896 mapTypeStrs.push_back("none");
1897
1898 for (unsigned int i = 0; i < mapTypeStrs.size(); ++i) {
1899 p << mapTypeStrs[i];
1900 if (i + 1 < mapTypeStrs.size()) {
1901 p << ", ";
1902 }
1903 }
1904}
1905
1906static ParseResult parseMembersIndex(OpAsmParser &parser,
1907 ArrayAttr &membersIdx) {
1908 SmallVector<Attribute> values, memberIdxs;
1909
1910 auto parseIndices = [&]() -> ParseResult {
1911 int64_t value;
1912 if (parser.parseInteger(value))
1913 return failure();
1914 values.push_back(IntegerAttr::get(parser.getBuilder().getIntegerType(64),
1915 APInt(64, value, /*isSigned=*/false)));
1916 return success();
1917 };
1918
1919 do {
1920 if (failed(parser.parseLSquare()))
1921 return failure();
1922
1923 if (parser.parseCommaSeparatedList(parseIndices))
1924 return failure();
1925
1926 if (failed(parser.parseRSquare()))
1927 return failure();
1928
1929 memberIdxs.push_back(ArrayAttr::get(parser.getContext(), values));
1930 values.clear();
1931 } while (succeeded(parser.parseOptionalComma()));
1932
1933 if (!memberIdxs.empty())
1934 membersIdx = ArrayAttr::get(parser.getContext(), memberIdxs);
1935
1936 return success();
1937}
1938
1939static void printMembersIndex(OpAsmPrinter &p, MapInfoOp op,
1940 ArrayAttr membersIdx) {
1941 if (!membersIdx)
1942 return;
1943
1944 llvm::interleaveComma(membersIdx, p, [&p](Attribute v) {
1945 p << "[";
1946 auto memberIdx = cast<ArrayAttr>(v);
1947 llvm::interleaveComma(memberIdx.getValue(), p, [&p](Attribute v2) {
1948 p << cast<IntegerAttr>(v2).getInt();
1949 });
1950 p << "]";
1951 });
1952}
1953
1955 VariableCaptureKindAttr mapCaptureType) {
1956 std::string typeCapStr;
1957 llvm::raw_string_ostream typeCap(typeCapStr);
1958 if (mapCaptureType.getValue() == mlir::omp::VariableCaptureKind::ByRef)
1959 typeCap << "ByRef";
1960 if (mapCaptureType.getValue() == mlir::omp::VariableCaptureKind::ByCopy)
1961 typeCap << "ByCopy";
1962 if (mapCaptureType.getValue() == mlir::omp::VariableCaptureKind::VLAType)
1963 typeCap << "VLAType";
1964 if (mapCaptureType.getValue() == mlir::omp::VariableCaptureKind::This)
1965 typeCap << "This";
1966 p << typeCapStr;
1967}
1968
1969static ParseResult parseCaptureType(OpAsmParser &parser,
1970 VariableCaptureKindAttr &mapCaptureType) {
1971 StringRef mapCaptureKey;
1972 if (parser.parseKeyword(&mapCaptureKey))
1973 return failure();
1974
1975 if (mapCaptureKey == "This")
1976 mapCaptureType = mlir::omp::VariableCaptureKindAttr::get(
1977 parser.getContext(), mlir::omp::VariableCaptureKind::This);
1978 if (mapCaptureKey == "ByRef")
1979 mapCaptureType = mlir::omp::VariableCaptureKindAttr::get(
1980 parser.getContext(), mlir::omp::VariableCaptureKind::ByRef);
1981 if (mapCaptureKey == "ByCopy")
1982 mapCaptureType = mlir::omp::VariableCaptureKindAttr::get(
1983 parser.getContext(), mlir::omp::VariableCaptureKind::ByCopy);
1984 if (mapCaptureKey == "VLAType")
1985 mapCaptureType = mlir::omp::VariableCaptureKindAttr::get(
1986 parser.getContext(), mlir::omp::VariableCaptureKind::VLAType);
1987
1988 return success();
1989}
1990
1991static LogicalResult verifyMapClause(Operation *op, OperandRange mapVars) {
1994
1995 for (auto mapOp : mapVars) {
1996 if (!mapOp.getDefiningOp())
1997 return emitError(op->getLoc(), "missing map operation");
1998
1999 if (auto mapInfoOp = mapOp.getDefiningOp<mlir::omp::MapInfoOp>()) {
2000 mlir::omp::ClauseMapFlags mapTypeBits = mapInfoOp.getMapType();
2001
2002 bool to = mapTypeToBool(mapTypeBits, ClauseMapFlags::to);
2003 bool from = mapTypeToBool(mapTypeBits, ClauseMapFlags::from);
2004 bool del = mapTypeToBool(mapTypeBits, ClauseMapFlags::del);
2005
2006 bool always = mapTypeToBool(mapTypeBits, ClauseMapFlags::always);
2007 bool close = mapTypeToBool(mapTypeBits, ClauseMapFlags::close);
2008 bool implicit = mapTypeToBool(mapTypeBits, ClauseMapFlags::implicit);
2009
2010 if ((isa<TargetDataOp>(op) || isa<TargetOp>(op)) && del)
2011 return emitError(op->getLoc(),
2012 "to, from, tofrom and alloc map types are permitted");
2013
2014 if (isa<TargetEnterDataOp>(op) && (from || del))
2015 return emitError(op->getLoc(), "to and alloc map types are permitted");
2016
2017 if (isa<TargetExitDataOp>(op) && to)
2018 return emitError(op->getLoc(),
2019 "from, release and delete map types are permitted");
2020
2021 if (isa<TargetUpdateOp>(op)) {
2022 if (del) {
2023 return emitError(op->getLoc(),
2024 "at least one of to or from map types must be "
2025 "specified, other map types are not permitted");
2026 }
2027
2028 if (!to && !from) {
2029 return emitError(op->getLoc(),
2030 "at least one of to or from map types must be "
2031 "specified, other map types are not permitted");
2032 }
2033
2034 auto updateVar = mapInfoOp.getVarPtr();
2035
2036 if ((to && from) || (to && updateFromVars.contains(updateVar)) ||
2037 (from && updateToVars.contains(updateVar))) {
2038 return emitError(
2039 op->getLoc(),
2040 "either to or from map types can be specified, not both");
2041 }
2042
2043 if (always || close || implicit) {
2044 return emitError(
2045 op->getLoc(),
2046 "present, mapper and iterator map type modifiers are permitted");
2047 }
2048
2049 to ? updateToVars.insert(updateVar) : updateFromVars.insert(updateVar);
2050 }
2051 } else if (!isa<DeclareMapperInfoOp>(op)) {
2052 return emitError(op->getLoc(),
2053 "map argument is not a map entry operation");
2054 }
2055 }
2056
2057 return success();
2058}
2059
2060static LogicalResult verifyPrivateVarsMapping(TargetOp targetOp) {
2061 std::optional<DenseI64ArrayAttr> privateMapIndices =
2062 targetOp.getPrivateMapsAttr();
2063
2064 // None of the private operands are mapped.
2065 if (!privateMapIndices.has_value() || !privateMapIndices.value())
2066 return success();
2067
2068 OperandRange privateVars = targetOp.getPrivateVars();
2069
2070 if (privateMapIndices.value().size() !=
2071 static_cast<int64_t>(privateVars.size()))
2072 return emitError(targetOp.getLoc(), "sizes of `private` operand range and "
2073 "`private_maps` attribute mismatch");
2074
2075 return success();
2076}
2077
2078//===----------------------------------------------------------------------===//
2079// MapInfoOp
2080//===----------------------------------------------------------------------===//
2081
2082static LogicalResult verifyMapInfoDefinedArgs(Operation *op,
2083 StringRef clauseName,
2084 OperandRange vars) {
2085 for (Value var : vars)
2086 if (!llvm::isa_and_present<MapInfoOp>(var.getDefiningOp()))
2087 return op->emitOpError()
2088 << "'" << clauseName
2089 << "' arguments must be defined by 'omp.map.info' ops";
2090 return success();
2091}
2092
2093LogicalResult MapInfoOp::verify() {
2094 if (getMapperId() &&
2096 *this, getMapperIdAttr())) {
2097 return emitError("invalid mapper id");
2098 }
2099
2100 if (failed(verifyMapInfoDefinedArgs(*this, "members", getMembers())))
2101 return failure();
2102
2103 return success();
2104}
2105
2106//===----------------------------------------------------------------------===//
2107// TargetDataOp
2108//===----------------------------------------------------------------------===//
2109
2110void TargetDataOp::build(OpBuilder &builder, OperationState &state,
2111 const TargetDataOperands &clauses) {
2112 TargetDataOp::build(builder, state, clauses.device, clauses.ifExpr,
2113 clauses.mapVars, clauses.useDeviceAddrVars,
2114 clauses.useDevicePtrVars);
2115}
2116
2117LogicalResult TargetDataOp::verify() {
2118 if (getMapVars().empty() && getUseDevicePtrVars().empty() &&
2119 getUseDeviceAddrVars().empty()) {
2120 return ::emitError(this->getLoc(),
2121 "At least one of map, use_device_ptr_vars, or "
2122 "use_device_addr_vars operand must be present");
2123 }
2124
2125 if (failed(verifyMapInfoDefinedArgs(*this, "use_device_ptr",
2126 getUseDevicePtrVars())))
2127 return failure();
2128
2129 if (failed(verifyMapInfoDefinedArgs(*this, "use_device_addr",
2130 getUseDeviceAddrVars())))
2131 return failure();
2132
2133 return verifyMapClause(*this, getMapVars());
2134}
2135
2136//===----------------------------------------------------------------------===//
2137// TargetEnterDataOp
2138//===----------------------------------------------------------------------===//
2139
2140void TargetEnterDataOp::build(
2141 OpBuilder &builder, OperationState &state,
2142 const TargetEnterExitUpdateDataOperands &clauses) {
2143 MLIRContext *ctx = builder.getContext();
2144 TargetEnterDataOp::build(builder, state,
2145 makeArrayAttr(ctx, clauses.dependKinds),
2146 clauses.dependVars, clauses.device, clauses.ifExpr,
2147 clauses.mapVars, clauses.nowait);
2148}
2149
2150LogicalResult TargetEnterDataOp::verify() {
2151 LogicalResult verifyDependVars =
2152 verifyDependVarList(*this, getDependKinds(), getDependVars());
2153 return failed(verifyDependVars) ? verifyDependVars
2154 : verifyMapClause(*this, getMapVars());
2155}
2156
2157//===----------------------------------------------------------------------===//
2158// TargetExitDataOp
2159//===----------------------------------------------------------------------===//
2160
2161void TargetExitDataOp::build(OpBuilder &builder, OperationState &state,
2162 const TargetEnterExitUpdateDataOperands &clauses) {
2163 MLIRContext *ctx = builder.getContext();
2164 TargetExitDataOp::build(builder, state,
2165 makeArrayAttr(ctx, clauses.dependKinds),
2166 clauses.dependVars, clauses.device, clauses.ifExpr,
2167 clauses.mapVars, clauses.nowait);
2168}
2169
2170LogicalResult TargetExitDataOp::verify() {
2171 LogicalResult verifyDependVars =
2172 verifyDependVarList(*this, getDependKinds(), getDependVars());
2173 return failed(verifyDependVars) ? verifyDependVars
2174 : verifyMapClause(*this, getMapVars());
2175}
2176
2177//===----------------------------------------------------------------------===//
2178// TargetUpdateOp
2179//===----------------------------------------------------------------------===//
2180
2181void TargetUpdateOp::build(OpBuilder &builder, OperationState &state,
2182 const TargetEnterExitUpdateDataOperands &clauses) {
2183 MLIRContext *ctx = builder.getContext();
2184 TargetUpdateOp::build(builder, state, makeArrayAttr(ctx, clauses.dependKinds),
2185 clauses.dependVars, clauses.device, clauses.ifExpr,
2186 clauses.mapVars, clauses.nowait);
2187}
2188
2189LogicalResult TargetUpdateOp::verify() {
2190 LogicalResult verifyDependVars =
2191 verifyDependVarList(*this, getDependKinds(), getDependVars());
2192 return failed(verifyDependVars) ? verifyDependVars
2193 : verifyMapClause(*this, getMapVars());
2194}
2195
2196//===----------------------------------------------------------------------===//
2197// TargetOp
2198//===----------------------------------------------------------------------===//
2199
2200void TargetOp::build(OpBuilder &builder, OperationState &state,
2201 const TargetOperands &clauses) {
2202 MLIRContext *ctx = builder.getContext();
2203 // TODO Store clauses in op: allocateVars, allocatorVars, inReductionVars,
2204 // inReductionByref, inReductionSyms.
2205 TargetOp::build(builder, state, /*allocate_vars=*/{}, /*allocator_vars=*/{},
2206 clauses.bare, makeArrayAttr(ctx, clauses.dependKinds),
2207 clauses.dependVars, clauses.device, clauses.hasDeviceAddrVars,
2208 clauses.hostEvalVars, clauses.ifExpr,
2209 /*in_reduction_vars=*/{}, /*in_reduction_byref=*/nullptr,
2210 /*in_reduction_syms=*/nullptr, clauses.isDevicePtrVars,
2211 clauses.mapVars, clauses.nowait, clauses.privateVars,
2212 makeArrayAttr(ctx, clauses.privateSyms),
2213 clauses.privateNeedsBarrier, clauses.threadLimit,
2214 /*private_maps=*/nullptr);
2215}
2216
2217LogicalResult TargetOp::verify() {
2218 if (failed(verifyDependVarList(*this, getDependKinds(), getDependVars())))
2219 return failure();
2220
2221 if (failed(verifyMapInfoDefinedArgs(*this, "has_device_addr",
2222 getHasDeviceAddrVars())))
2223 return failure();
2224
2225 if (failed(verifyMapClause(*this, getMapVars())))
2226 return failure();
2227
2228 return verifyPrivateVarsMapping(*this);
2229}
2230
2231LogicalResult TargetOp::verifyRegions() {
2232 auto teamsOps = getOps<TeamsOp>();
2233 if (std::distance(teamsOps.begin(), teamsOps.end()) > 1)
2234 return emitError("target containing multiple 'omp.teams' nested ops");
2235
2236 // Check that host_eval values are only used in legal ways.
2237 Operation *capturedOp = getInnermostCapturedOmpOp();
2238 TargetRegionFlags execFlags = getKernelExecFlags(capturedOp);
2239 for (Value hostEvalArg :
2240 cast<BlockArgOpenMPOpInterface>(getOperation()).getHostEvalBlockArgs()) {
2241 for (Operation *user : hostEvalArg.getUsers()) {
2242 if (auto teamsOp = dyn_cast<TeamsOp>(user)) {
2243 if (llvm::is_contained({teamsOp.getNumTeamsLower(),
2244 teamsOp.getNumTeamsUpper(),
2245 teamsOp.getThreadLimit()},
2246 hostEvalArg))
2247 continue;
2248
2249 return emitOpError() << "host_eval argument only legal as 'num_teams' "
2250 "and 'thread_limit' in 'omp.teams'";
2251 }
2252 if (auto parallelOp = dyn_cast<ParallelOp>(user)) {
2253 if (bitEnumContainsAny(execFlags, TargetRegionFlags::spmd) &&
2254 parallelOp->isAncestor(capturedOp) &&
2255 hostEvalArg == parallelOp.getNumThreads())
2256 continue;
2257
2258 return emitOpError()
2259 << "host_eval argument only legal as 'num_threads' in "
2260 "'omp.parallel' when representing target SPMD";
2261 }
2262 if (auto loopNestOp = dyn_cast<LoopNestOp>(user)) {
2263 if (bitEnumContainsAny(execFlags, TargetRegionFlags::trip_count) &&
2264 loopNestOp.getOperation() == capturedOp &&
2265 (llvm::is_contained(loopNestOp.getLoopLowerBounds(), hostEvalArg) ||
2266 llvm::is_contained(loopNestOp.getLoopUpperBounds(), hostEvalArg) ||
2267 llvm::is_contained(loopNestOp.getLoopSteps(), hostEvalArg)))
2268 continue;
2269
2270 return emitOpError() << "host_eval argument only legal as loop bounds "
2271 "and steps in 'omp.loop_nest' when trip count "
2272 "must be evaluated in the host";
2273 }
2274
2275 return emitOpError() << "host_eval argument illegal use in '"
2276 << user->getName() << "' operation";
2277 }
2278 }
2279 return success();
2280}
2281
2282static Operation *
2283findCapturedOmpOp(Operation *rootOp, bool checkSingleMandatoryExec,
2284 llvm::function_ref<bool(Operation *)> siblingAllowedFn) {
2285 assert(rootOp && "expected valid operation");
2286
2287 Dialect *ompDialect = rootOp->getDialect();
2288 Operation *capturedOp = nullptr;
2289 DominanceInfo domInfo;
2290
2291 // Process in pre-order to check operations from outermost to innermost,
2292 // ensuring we only enter the region of an operation if it meets the criteria
2293 // for being captured. We stop the exploration of nested operations as soon as
2294 // we process a region holding no operations to be captured.
2295 rootOp->walk<WalkOrder::PreOrder>([&](Operation *op) {
2296 if (op == rootOp)
2297 return WalkResult::advance();
2298
2299 // Ignore operations of other dialects or omp operations with no regions,
2300 // because these will only be checked if they are siblings of an omp
2301 // operation that can potentially be captured.
2302 bool isOmpDialect = op->getDialect() == ompDialect;
2303 bool hasRegions = op->getNumRegions() > 0;
2304 if (!isOmpDialect || !hasRegions)
2305 return WalkResult::skip();
2306
2307 // This operation cannot be captured if it can be executed more than once
2308 // (i.e. its block's successors can reach it) or if it's not guaranteed to
2309 // be executed before all exits of the region (i.e. it doesn't dominate all
2310 // blocks with no successors reachable from the entry block).
2311 if (checkSingleMandatoryExec) {
2312 Region *parentRegion = op->getParentRegion();
2313 Block *parentBlock = op->getBlock();
2314
2315 for (Block *successor : parentBlock->getSuccessors())
2316 if (successor->isReachable(parentBlock))
2317 return WalkResult::interrupt();
2318
2319 for (Block &block : *parentRegion)
2320 if (domInfo.isReachableFromEntry(&block) && block.hasNoSuccessors() &&
2321 !domInfo.dominates(parentBlock, &block))
2322 return WalkResult::interrupt();
2323 }
2324
2325 // Don't capture this op if it has a not-allowed sibling, and stop recursing
2326 // into nested operations.
2327 for (Operation &sibling : op->getParentRegion()->getOps())
2328 if (&sibling != op && !siblingAllowedFn(&sibling))
2329 return WalkResult::interrupt();
2330
2331 // Don't continue capturing nested operations if we reach an omp.loop_nest.
2332 // Otherwise, process the contents of this operation.
2333 capturedOp = op;
2334 return llvm::isa<LoopNestOp>(op) ? WalkResult::interrupt()
2336 });
2337
2338 return capturedOp;
2339}
2340
2341Operation *TargetOp::getInnermostCapturedOmpOp() {
2342 auto *ompDialect = getContext()->getLoadedDialect<omp::OpenMPDialect>();
2343
2344 // Only allow OpenMP terminators and non-OpenMP ops that have known memory
2345 // effects, but don't include a memory write effect.
2346 return findCapturedOmpOp(
2347 *this, /*checkSingleMandatoryExec=*/true, [&](Operation *sibling) {
2348 if (!sibling)
2349 return false;
2350
2351 if (ompDialect == sibling->getDialect())
2352 return sibling->hasTrait<OpTrait::IsTerminator>();
2353
2354 if (auto memOp = dyn_cast<MemoryEffectOpInterface>(sibling)) {
2356 effects;
2357 memOp.getEffects(effects);
2358 return !llvm::any_of(
2359 effects, [&](MemoryEffects::EffectInstance &effect) {
2360 return isa<MemoryEffects::Write>(effect.getEffect()) &&
2361 isa<SideEffects::AutomaticAllocationScopeResource>(
2362 effect.getResource());
2363 });
2364 }
2365 return true;
2366 });
2367}
2368
2369/// Check if we can promote SPMD kernel to No-Loop kernel.
2370static bool canPromoteToNoLoop(Operation *capturedOp, TeamsOp teamsOp,
2371 WsloopOp *wsLoopOp) {
2372 // num_teams clause can break no-loop teams/threads assumption.
2373 if (teamsOp.getNumTeamsUpper())
2374 return false;
2375
2376 // Reduction kernels are slower in no-loop mode.
2377 if (teamsOp.getNumReductionVars())
2378 return false;
2379 if (wsLoopOp->getNumReductionVars())
2380 return false;
2381
2382 // Check if the user allows the promotion of kernels to no-loop mode.
2383 OffloadModuleInterface offloadMod =
2384 capturedOp->getParentOfType<omp::OffloadModuleInterface>();
2385 if (!offloadMod)
2386 return false;
2387 auto ompFlags = offloadMod.getFlags();
2388 if (!ompFlags)
2389 return false;
2390 return ompFlags.getAssumeTeamsOversubscription() &&
2391 ompFlags.getAssumeThreadsOversubscription();
2392}
2393
2394TargetRegionFlags TargetOp::getKernelExecFlags(Operation *capturedOp) {
2395 // A non-null captured op is only valid if it resides inside of a TargetOp
2396 // and is the result of calling getInnermostCapturedOmpOp() on it.
2397 TargetOp targetOp =
2398 capturedOp ? capturedOp->getParentOfType<TargetOp>() : nullptr;
2399 assert((!capturedOp ||
2400 (targetOp && targetOp.getInnermostCapturedOmpOp() == capturedOp)) &&
2401 "unexpected captured op");
2402
2403 // If it's not capturing a loop, it's a default target region.
2404 if (!isa_and_present<LoopNestOp>(capturedOp))
2405 return TargetRegionFlags::generic;
2406
2407 // Get the innermost non-simd loop wrapper.
2409 cast<LoopNestOp>(capturedOp).gatherWrappers(loopWrappers);
2410 assert(!loopWrappers.empty());
2411
2412 LoopWrapperInterface *innermostWrapper = loopWrappers.begin();
2413 if (isa<SimdOp>(innermostWrapper))
2414 innermostWrapper = std::next(innermostWrapper);
2415
2416 auto numWrappers = std::distance(innermostWrapper, loopWrappers.end());
2417 if (numWrappers != 1 && numWrappers != 2)
2418 return TargetRegionFlags::generic;
2419
2420 // Detect target-teams-distribute-parallel-wsloop[-simd].
2421 if (numWrappers == 2) {
2422 WsloopOp *wsloopOp = dyn_cast<WsloopOp>(innermostWrapper);
2423 if (!wsloopOp)
2424 return TargetRegionFlags::generic;
2425
2426 innermostWrapper = std::next(innermostWrapper);
2427 if (!isa<DistributeOp>(innermostWrapper))
2428 return TargetRegionFlags::generic;
2429
2430 Operation *parallelOp = (*innermostWrapper)->getParentOp();
2431 if (!isa_and_present<ParallelOp>(parallelOp))
2432 return TargetRegionFlags::generic;
2433
2434 TeamsOp teamsOp = dyn_cast<TeamsOp>(parallelOp->getParentOp());
2435 if (!teamsOp)
2436 return TargetRegionFlags::generic;
2437
2438 if (teamsOp->getParentOp() == targetOp.getOperation()) {
2439 TargetRegionFlags result =
2440 TargetRegionFlags::spmd | TargetRegionFlags::trip_count;
2441 if (canPromoteToNoLoop(capturedOp, teamsOp, wsloopOp))
2442 result = result | TargetRegionFlags::no_loop;
2443 return result;
2444 }
2445 }
2446 // Detect target-teams-distribute[-simd] and target-teams-loop.
2447 else if (isa<DistributeOp, LoopOp>(innermostWrapper)) {
2448 Operation *teamsOp = (*innermostWrapper)->getParentOp();
2449 if (!isa_and_present<TeamsOp>(teamsOp))
2450 return TargetRegionFlags::generic;
2451
2452 if (teamsOp->getParentOp() != targetOp.getOperation())
2453 return TargetRegionFlags::generic;
2454
2455 if (isa<LoopOp>(innermostWrapper))
2456 return TargetRegionFlags::spmd | TargetRegionFlags::trip_count;
2457
2458 // Find single immediately nested captured omp.parallel and add spmd flag
2459 // (generic-spmd case).
2460 //
2461 // TODO: This shouldn't have to be done here, as it is too easy to break.
2462 // The openmp-opt pass should be updated to be able to promote kernels like
2463 // this from "Generic" to "Generic-SPMD". However, the use of the
2464 // `kmpc_distribute_static_loop` family of functions produced by the
2465 // OMPIRBuilder for these kernels prevents that from working.
2466 Dialect *ompDialect = targetOp->getDialect();
2467 Operation *nestedCapture = findCapturedOmpOp(
2468 capturedOp, /*checkSingleMandatoryExec=*/false,
2469 [&](Operation *sibling) {
2470 return sibling && (ompDialect != sibling->getDialect() ||
2471 sibling->hasTrait<OpTrait::IsTerminator>());
2472 });
2473
2474 TargetRegionFlags result =
2475 TargetRegionFlags::generic | TargetRegionFlags::trip_count;
2476
2477 if (!nestedCapture)
2478 return result;
2479
2480 while (nestedCapture->getParentOp() != capturedOp)
2481 nestedCapture = nestedCapture->getParentOp();
2482
2483 return isa<ParallelOp>(nestedCapture) ? result | TargetRegionFlags::spmd
2484 : result;
2485 }
2486 // Detect target-parallel-wsloop[-simd].
2487 else if (isa<WsloopOp>(innermostWrapper)) {
2488 Operation *parallelOp = (*innermostWrapper)->getParentOp();
2489 if (!isa_and_present<ParallelOp>(parallelOp))
2490 return TargetRegionFlags::generic;
2491
2492 if (parallelOp->getParentOp() == targetOp.getOperation())
2493 return TargetRegionFlags::spmd;
2494 }
2495
2496 return TargetRegionFlags::generic;
2497}
2498
2499//===----------------------------------------------------------------------===//
2500// ParallelOp
2501//===----------------------------------------------------------------------===//
2502
2503void ParallelOp::build(OpBuilder &builder, OperationState &state,
2504 ArrayRef<NamedAttribute> attributes) {
2505 ParallelOp::build(builder, state, /*allocate_vars=*/ValueRange(),
2506 /*allocator_vars=*/ValueRange(), /*if_expr=*/nullptr,
2507 /*num_threads=*/nullptr, /*private_vars=*/ValueRange(),
2508 /*private_syms=*/nullptr, /*private_needs_barrier=*/nullptr,
2509 /*proc_bind_kind=*/nullptr,
2510 /*reduction_mod =*/nullptr, /*reduction_vars=*/ValueRange(),
2511 /*reduction_byref=*/nullptr, /*reduction_syms=*/nullptr);
2512 state.addAttributes(attributes);
2513}
2514
2515void ParallelOp::build(OpBuilder &builder, OperationState &state,
2516 const ParallelOperands &clauses) {
2517 MLIRContext *ctx = builder.getContext();
2518 ParallelOp::build(builder, state, clauses.allocateVars, clauses.allocatorVars,
2519 clauses.ifExpr, clauses.numThreads, clauses.privateVars,
2520 makeArrayAttr(ctx, clauses.privateSyms),
2521 clauses.privateNeedsBarrier, clauses.procBindKind,
2522 clauses.reductionMod, clauses.reductionVars,
2523 makeDenseBoolArrayAttr(ctx, clauses.reductionByref),
2524 makeArrayAttr(ctx, clauses.reductionSyms));
2525}
2526
2527template <typename OpType>
2528static LogicalResult verifyPrivateVarList(OpType &op) {
2529 auto privateVars = op.getPrivateVars();
2530 auto privateSyms = op.getPrivateSymsAttr();
2531
2532 if (privateVars.empty() && (privateSyms == nullptr || privateSyms.empty()))
2533 return success();
2534
2535 auto numPrivateVars = privateVars.size();
2536 auto numPrivateSyms = (privateSyms == nullptr) ? 0 : privateSyms.size();
2537
2538 if (numPrivateVars != numPrivateSyms)
2539 return op.emitError() << "inconsistent number of private variables and "
2540 "privatizer op symbols, private vars: "
2541 << numPrivateVars
2542 << " vs. privatizer op symbols: " << numPrivateSyms;
2543
2544 for (auto privateVarInfo : llvm::zip_equal(privateVars, privateSyms)) {
2545 Type varType = std::get<0>(privateVarInfo).getType();
2546 SymbolRefAttr privateSym = cast<SymbolRefAttr>(std::get<1>(privateVarInfo));
2547 PrivateClauseOp privatizerOp =
2549
2550 if (privatizerOp == nullptr)
2551 return op.emitError() << "failed to lookup privatizer op with symbol: '"
2552 << privateSym << "'";
2553
2554 Type privatizerType = privatizerOp.getArgType();
2555
2556 if (privatizerType && (varType != privatizerType))
2557 return op.emitError()
2558 << "type mismatch between a "
2559 << (privatizerOp.getDataSharingType() ==
2560 DataSharingClauseType::Private
2561 ? "private"
2562 : "firstprivate")
2563 << " variable and its privatizer op, var type: " << varType
2564 << " vs. privatizer op type: " << privatizerType;
2565 }
2566
2567 return success();
2568}
2569
2570LogicalResult ParallelOp::verify() {
2571 if (getAllocateVars().size() != getAllocatorVars().size())
2572 return emitError(
2573 "expected equal sizes for allocate and allocator variables");
2574
2575 if (failed(verifyPrivateVarList(*this)))
2576 return failure();
2577
2578 return verifyReductionVarList(*this, getReductionSyms(), getReductionVars(),
2579 getReductionByref());
2580}
2581
2582LogicalResult ParallelOp::verifyRegions() {
2583 auto distChildOps = getOps<DistributeOp>();
2584 int numDistChildOps = std::distance(distChildOps.begin(), distChildOps.end());
2585 if (numDistChildOps > 1)
2586 return emitError()
2587 << "multiple 'omp.distribute' nested inside of 'omp.parallel'";
2588
2589 if (numDistChildOps == 1) {
2590 if (!isComposite())
2591 return emitError()
2592 << "'omp.composite' attribute missing from composite operation";
2593
2594 auto *ompDialect = getContext()->getLoadedDialect<OpenMPDialect>();
2595 Operation &distributeOp = **distChildOps.begin();
2596 for (Operation &childOp : getOps()) {
2597 if (&childOp == &distributeOp || ompDialect != childOp.getDialect())
2598 continue;
2599
2600 if (!childOp.hasTrait<OpTrait::IsTerminator>())
2601 return emitError() << "unexpected OpenMP operation inside of composite "
2602 "'omp.parallel': "
2603 << childOp.getName();
2604 }
2605 } else if (isComposite()) {
2606 return emitError()
2607 << "'omp.composite' attribute present in non-composite operation";
2608 }
2609 return success();
2610}
2611
2612//===----------------------------------------------------------------------===//
2613// TeamsOp
2614//===----------------------------------------------------------------------===//
2615
2617 while ((op = op->getParentOp()))
2618 if (isa<OpenMPDialect>(op->getDialect()))
2619 return false;
2620 return true;
2621}
2622
2623void TeamsOp::build(OpBuilder &builder, OperationState &state,
2624 const TeamsOperands &clauses) {
2625 MLIRContext *ctx = builder.getContext();
2626 // TODO Store clauses in op: privateVars, privateSyms, privateNeedsBarrier
2627 TeamsOp::build(builder, state, clauses.allocateVars, clauses.allocatorVars,
2628 clauses.ifExpr, clauses.numTeamsLower, clauses.numTeamsUpper,
2629 /*private_vars=*/{}, /*private_syms=*/nullptr,
2630 /*private_needs_barrier=*/nullptr, clauses.reductionMod,
2631 clauses.reductionVars,
2632 makeDenseBoolArrayAttr(ctx, clauses.reductionByref),
2633 makeArrayAttr(ctx, clauses.reductionSyms),
2634 clauses.threadLimit);
2635}
2636
2637LogicalResult TeamsOp::verify() {
2638 // Check parent region
2639 // TODO If nested inside of a target region, also check that it does not
2640 // contain any statements, declarations or directives other than this
2641 // omp.teams construct. The issue is how to support the initialization of
2642 // this operation's own arguments (allow SSA values across omp.target?).
2643 Operation *op = getOperation();
2644 if (!isa<TargetOp>(op->getParentOp()) &&
2646 return emitError("expected to be nested inside of omp.target or not nested "
2647 "in any OpenMP dialect operations");
2648
2649 // Check for num_teams clause restrictions
2650 if (auto numTeamsLowerBound = getNumTeamsLower()) {
2651 auto numTeamsUpperBound = getNumTeamsUpper();
2652 if (!numTeamsUpperBound)
2653 return emitError("expected num_teams upper bound to be defined if the "
2654 "lower bound is defined");
2655 if (numTeamsLowerBound.getType() != numTeamsUpperBound.getType())
2656 return emitError(
2657 "expected num_teams upper bound and lower bound to be the same type");
2658 }
2659
2660 // Check for allocate clause restrictions
2661 if (getAllocateVars().size() != getAllocatorVars().size())
2662 return emitError(
2663 "expected equal sizes for allocate and allocator variables");
2664
2665 return verifyReductionVarList(*this, getReductionSyms(), getReductionVars(),
2666 getReductionByref());
2667}
2668
2669//===----------------------------------------------------------------------===//
2670// SectionOp
2671//===----------------------------------------------------------------------===//
2672
2673OperandRange SectionOp::getPrivateVars() {
2674 return getParentOp().getPrivateVars();
2675}
2676
2677OperandRange SectionOp::getReductionVars() {
2678 return getParentOp().getReductionVars();
2679}
2680
2681//===----------------------------------------------------------------------===//
2682// SectionsOp
2683//===----------------------------------------------------------------------===//
2684
2685void SectionsOp::build(OpBuilder &builder, OperationState &state,
2686 const SectionsOperands &clauses) {
2687 MLIRContext *ctx = builder.getContext();
2688 // TODO Store clauses in op: privateVars, privateSyms, privateNeedsBarrier
2689 SectionsOp::build(builder, state, clauses.allocateVars, clauses.allocatorVars,
2690 clauses.nowait, /*private_vars=*/{},
2691 /*private_syms=*/nullptr, /*private_needs_barrier=*/nullptr,
2692 clauses.reductionMod, clauses.reductionVars,
2693 makeDenseBoolArrayAttr(ctx, clauses.reductionByref),
2694 makeArrayAttr(ctx, clauses.reductionSyms));
2695}
2696
2697LogicalResult SectionsOp::verify() {
2698 if (getAllocateVars().size() != getAllocatorVars().size())
2699 return emitError(
2700 "expected equal sizes for allocate and allocator variables");
2701
2702 return verifyReductionVarList(*this, getReductionSyms(), getReductionVars(),
2703 getReductionByref());
2704}
2705
2706LogicalResult SectionsOp::verifyRegions() {
2707 for (auto &inst : *getRegion().begin()) {
2708 if (!(isa<SectionOp>(inst) || isa<TerminatorOp>(inst))) {
2709 return emitOpError()
2710 << "expected omp.section op or terminator op inside region";
2711 }
2712 }
2713
2714 return success();
2715}
2716
2717//===----------------------------------------------------------------------===//
2718// SingleOp
2719//===----------------------------------------------------------------------===//
2720
2721void SingleOp::build(OpBuilder &builder, OperationState &state,
2722 const SingleOperands &clauses) {
2723 MLIRContext *ctx = builder.getContext();
2724 // TODO Store clauses in op: privateVars, privateSyms, privateNeedsBarrier
2725 SingleOp::build(builder, state, clauses.allocateVars, clauses.allocatorVars,
2726 clauses.copyprivateVars,
2727 makeArrayAttr(ctx, clauses.copyprivateSyms), clauses.nowait,
2728 /*private_vars=*/{}, /*private_syms=*/nullptr,
2729 /*private_needs_barrier=*/nullptr);
2730}
2731
2732LogicalResult SingleOp::verify() {
2733 // Check for allocate clause restrictions
2734 if (getAllocateVars().size() != getAllocatorVars().size())
2735 return emitError(
2736 "expected equal sizes for allocate and allocator variables");
2737
2738 return verifyCopyprivateVarList(*this, getCopyprivateVars(),
2739 getCopyprivateSyms());
2740}
2741
2742//===----------------------------------------------------------------------===//
2743// WorkshareOp
2744//===----------------------------------------------------------------------===//
2745
2746void WorkshareOp::build(OpBuilder &builder, OperationState &state,
2747 const WorkshareOperands &clauses) {
2748 WorkshareOp::build(builder, state, clauses.nowait);
2749}
2750
2751//===----------------------------------------------------------------------===//
2752// WorkshareLoopWrapperOp
2753//===----------------------------------------------------------------------===//
2754
2755LogicalResult WorkshareLoopWrapperOp::verify() {
2756 if (!(*this)->getParentOfType<WorkshareOp>())
2757 return emitOpError() << "must be nested in an omp.workshare";
2758 return success();
2759}
2760
2761LogicalResult WorkshareLoopWrapperOp::verifyRegions() {
2762 if (isa_and_nonnull<LoopWrapperInterface>((*this)->getParentOp()) ||
2763 getNestedWrapper())
2764 return emitOpError() << "expected to be a standalone loop wrapper";
2765
2766 return success();
2767}
2768
2769//===----------------------------------------------------------------------===//
2770// LoopWrapperInterface
2771//===----------------------------------------------------------------------===//
2772
2773LogicalResult LoopWrapperInterface::verifyImpl() {
2774 Operation *op = this->getOperation();
2775 if (!op->hasTrait<OpTrait::NoTerminator>() ||
2777 return emitOpError() << "loop wrapper must also have the `NoTerminator` "
2778 "and `SingleBlock` traits";
2779
2780 if (op->getNumRegions() != 1)
2781 return emitOpError() << "loop wrapper does not contain exactly one region";
2782
2783 Region &region = op->getRegion(0);
2784 if (range_size(region.getOps()) != 1)
2785 return emitOpError()
2786 << "loop wrapper does not contain exactly one nested op";
2787
2788 Operation &firstOp = *region.op_begin();
2789 if (!isa<LoopNestOp, LoopWrapperInterface>(firstOp))
2790 return emitOpError() << "nested in loop wrapper is not another loop "
2791 "wrapper or `omp.loop_nest`";
2792
2793 return success();
2794}
2795
2796//===----------------------------------------------------------------------===//
2797// LoopOp
2798//===----------------------------------------------------------------------===//
2799
2800void LoopOp::build(OpBuilder &builder, OperationState &state,
2801 const LoopOperands &clauses) {
2802 MLIRContext *ctx = builder.getContext();
2803
2804 LoopOp::build(builder, state, clauses.bindKind, clauses.privateVars,
2805 makeArrayAttr(ctx, clauses.privateSyms),
2806 clauses.privateNeedsBarrier, clauses.order, clauses.orderMod,
2807 clauses.reductionMod, clauses.reductionVars,
2808 makeDenseBoolArrayAttr(ctx, clauses.reductionByref),
2809 makeArrayAttr(ctx, clauses.reductionSyms));
2810}
2811
2812LogicalResult LoopOp::verify() {
2813 return verifyReductionVarList(*this, getReductionSyms(), getReductionVars(),
2814 getReductionByref());
2815}
2816
2817LogicalResult LoopOp::verifyRegions() {
2818 if (llvm::isa_and_nonnull<LoopWrapperInterface>((*this)->getParentOp()) ||
2819 getNestedWrapper())
2820 return emitOpError() << "expected to be a standalone loop wrapper";
2821
2822 return success();
2823}
2824
2825//===----------------------------------------------------------------------===//
2826// WsloopOp
2827//===----------------------------------------------------------------------===//
2828
2829void WsloopOp::build(OpBuilder &builder, OperationState &state,
2830 ArrayRef<NamedAttribute> attributes) {
2831 build(builder, state, /*allocate_vars=*/{}, /*allocator_vars=*/{},
2832 /*linear_vars=*/ValueRange(), /*linear_step_vars=*/ValueRange(),
2833 /*linear_var_types*/ nullptr,
2834 /*nowait=*/false, /*order=*/nullptr, /*order_mod=*/nullptr,
2835 /*ordered=*/nullptr, /*private_vars=*/{}, /*private_syms=*/nullptr,
2836 /*private_needs_barrier=*/false,
2837 /*reduction_mod=*/nullptr, /*reduction_vars=*/ValueRange(),
2838 /*reduction_byref=*/nullptr,
2839 /*reduction_syms=*/nullptr, /*schedule_kind=*/nullptr,
2840 /*schedule_chunk=*/nullptr, /*schedule_mod=*/nullptr,
2841 /*schedule_simd=*/false);
2842 state.addAttributes(attributes);
2843}
2844
2845void WsloopOp::build(OpBuilder &builder, OperationState &state,
2846 const WsloopOperands &clauses) {
2847 MLIRContext *ctx = builder.getContext();
2848 // TODO: Store clauses in op: allocateVars, allocatorVars
2849 WsloopOp::build(
2850 builder, state,
2851 /*allocate_vars=*/{}, /*allocator_vars=*/{}, clauses.linearVars,
2852 clauses.linearStepVars, clauses.linearVarTypes, clauses.nowait,
2853 clauses.order, clauses.orderMod, clauses.ordered, clauses.privateVars,
2854 makeArrayAttr(ctx, clauses.privateSyms), clauses.privateNeedsBarrier,
2855 clauses.reductionMod, clauses.reductionVars,
2856 makeDenseBoolArrayAttr(ctx, clauses.reductionByref),
2857 makeArrayAttr(ctx, clauses.reductionSyms), clauses.scheduleKind,
2858 clauses.scheduleChunk, clauses.scheduleMod, clauses.scheduleSimd);
2859}
2860
2861LogicalResult WsloopOp::verify() {
2862 if (getLinearVars().size() &&
2863 getLinearVarTypes().value().size() != getLinearVars().size())
2864 return emitError() << "Ill-formed type attributes for linear variables";
2865 return verifyReductionVarList(*this, getReductionSyms(), getReductionVars(),
2866 getReductionByref());
2867}
2868
2869LogicalResult WsloopOp::verifyRegions() {
2870 bool isCompositeChildLeaf =
2871 llvm::dyn_cast_if_present<LoopWrapperInterface>((*this)->getParentOp());
2872
2873 if (LoopWrapperInterface nested = getNestedWrapper()) {
2874 if (!isComposite())
2875 return emitError()
2876 << "'omp.composite' attribute missing from composite wrapper";
2877
2878 // Check for the allowed leaf constructs that may appear in a composite
2879 // construct directly after DO/FOR.
2880 if (!isa<SimdOp>(nested))
2881 return emitError() << "only supported nested wrapper is 'omp.simd'";
2882
2883 } else if (isComposite() && !isCompositeChildLeaf) {
2884 return emitError()
2885 << "'omp.composite' attribute present in non-composite wrapper";
2886 } else if (!isComposite() && isCompositeChildLeaf) {
2887 return emitError()
2888 << "'omp.composite' attribute missing from composite wrapper";
2889 }
2890
2891 return success();
2892}
2893
2894//===----------------------------------------------------------------------===//
2895// Simd construct [2.9.3.1]
2896//===----------------------------------------------------------------------===//
2897
2898void SimdOp::build(OpBuilder &builder, OperationState &state,
2899 const SimdOperands &clauses) {
2900 MLIRContext *ctx = builder.getContext();
2901 SimdOp::build(
2902 builder, state, clauses.alignedVars,
2903 makeArrayAttr(ctx, clauses.alignments), clauses.ifExpr,
2904 clauses.linearVars, clauses.linearStepVars, clauses.linearVarTypes,
2905 clauses.nontemporalVars, clauses.order, clauses.orderMod,
2906 clauses.privateVars, makeArrayAttr(ctx, clauses.privateSyms),
2907 clauses.privateNeedsBarrier, clauses.reductionMod, clauses.reductionVars,
2908 makeDenseBoolArrayAttr(ctx, clauses.reductionByref),
2909 makeArrayAttr(ctx, clauses.reductionSyms), clauses.safelen,
2910 clauses.simdlen);
2911}
2912
2913LogicalResult SimdOp::verify() {
2914 if (getSimdlen().has_value() && getSafelen().has_value() &&
2915 getSimdlen().value() > getSafelen().value())
2916 return emitOpError()
2917 << "simdlen clause and safelen clause are both present, but the "
2918 "simdlen value is not less than or equal to safelen value";
2919
2920 if (verifyAlignedClause(*this, getAlignments(), getAlignedVars()).failed())
2921 return failure();
2922
2923 if (verifyNontemporalClause(*this, getNontemporalVars()).failed())
2924 return failure();
2925
2926 bool isCompositeChildLeaf =
2927 llvm::dyn_cast_if_present<LoopWrapperInterface>((*this)->getParentOp());
2928
2929 if (!isComposite() && isCompositeChildLeaf)
2930 return emitError()
2931 << "'omp.composite' attribute missing from composite wrapper";
2932
2933 if (isComposite() && !isCompositeChildLeaf)
2934 return emitError()
2935 << "'omp.composite' attribute present in non-composite wrapper";
2936
2937 // Firstprivate is not allowed for SIMD in the standard. Check that none of
2938 // the private decls are for firstprivate.
2939 std::optional<ArrayAttr> privateSyms = getPrivateSyms();
2940 if (privateSyms) {
2941 for (const Attribute &sym : *privateSyms) {
2942 auto symRef = cast<SymbolRefAttr>(sym);
2943 omp::PrivateClauseOp privatizer =
2945 getOperation(), symRef);
2946 if (!privatizer)
2947 return emitError() << "Cannot find privatizer '" << symRef << "'";
2948 if (privatizer.getDataSharingType() ==
2949 DataSharingClauseType::FirstPrivate)
2950 return emitError() << "FIRSTPRIVATE cannot be used with SIMD";
2951 }
2952 }
2953
2954 if (getLinearVars().size() &&
2955 getLinearVarTypes().value().size() != getLinearVars().size())
2956 return emitError() << "Ill-formed type attributes for linear variables";
2957 return success();
2958}
2959
2960LogicalResult SimdOp::verifyRegions() {
2961 if (getNestedWrapper())
2962 return emitOpError() << "must wrap an 'omp.loop_nest' directly";
2963
2964 return success();
2965}
2966
2967//===----------------------------------------------------------------------===//
2968// Distribute construct [2.9.4.1]
2969//===----------------------------------------------------------------------===//
2970
2971void DistributeOp::build(OpBuilder &builder, OperationState &state,
2972 const DistributeOperands &clauses) {
2973 DistributeOp::build(builder, state, clauses.allocateVars,
2974 clauses.allocatorVars, clauses.distScheduleStatic,
2975 clauses.distScheduleChunkSize, clauses.order,
2976 clauses.orderMod, clauses.privateVars,
2977 makeArrayAttr(builder.getContext(), clauses.privateSyms),
2978 clauses.privateNeedsBarrier);
2979}
2980
2981LogicalResult DistributeOp::verify() {
2982 if (this->getDistScheduleChunkSize() && !this->getDistScheduleStatic())
2983 return emitOpError() << "chunk size set without "
2984 "dist_schedule_static being present";
2985
2986 if (getAllocateVars().size() != getAllocatorVars().size())
2987 return emitError(
2988 "expected equal sizes for allocate and allocator variables");
2989
2990 return success();
2991}
2992
2993LogicalResult DistributeOp::verifyRegions() {
2994 if (LoopWrapperInterface nested = getNestedWrapper()) {
2995 if (!isComposite())
2996 return emitError()
2997 << "'omp.composite' attribute missing from composite wrapper";
2998 // Check for the allowed leaf constructs that may appear in a composite
2999 // construct directly after DISTRIBUTE.
3000 if (isa<WsloopOp>(nested)) {
3001 Operation *parentOp = (*this)->getParentOp();
3002 if (!llvm::dyn_cast_if_present<ParallelOp>(parentOp) ||
3003 !cast<ComposableOpInterface>(parentOp).isComposite()) {
3004 return emitError() << "an 'omp.wsloop' nested wrapper is only allowed "
3005 "when a composite 'omp.parallel' is the direct "
3006 "parent";
3007 }
3008 } else if (!isa<SimdOp>(nested))
3009 return emitError() << "only supported nested wrappers are 'omp.simd' and "
3010 "'omp.wsloop'";
3011 } else if (isComposite()) {
3012 return emitError()
3013 << "'omp.composite' attribute present in non-composite wrapper";
3014 }
3015
3016 return success();
3017}
3018
3019//===----------------------------------------------------------------------===//
3020// DeclareMapperOp / DeclareMapperInfoOp
3021//===----------------------------------------------------------------------===//
3022
3023LogicalResult DeclareMapperInfoOp::verify() {
3024 return verifyMapClause(*this, getMapVars());
3025}
3026
3027LogicalResult DeclareMapperOp::verifyRegions() {
3028 if (!llvm::isa_and_present<DeclareMapperInfoOp>(
3029 getRegion().getBlocks().front().getTerminator()))
3030 return emitOpError() << "expected terminator to be a DeclareMapperInfoOp";
3031
3032 return success();
3033}
3034
3035//===----------------------------------------------------------------------===//
3036// DeclareReductionOp
3037//===----------------------------------------------------------------------===//
3038
3039LogicalResult DeclareReductionOp::verifyRegions() {
3040 if (!getAllocRegion().empty()) {
3041 for (YieldOp yieldOp : getAllocRegion().getOps<YieldOp>()) {
3042 if (yieldOp.getResults().size() != 1 ||
3043 yieldOp.getResults().getTypes()[0] != getType())
3044 return emitOpError() << "expects alloc region to yield a value "
3045 "of the reduction type";
3046 }
3047 }
3048
3049 if (getInitializerRegion().empty())
3050 return emitOpError() << "expects non-empty initializer region";
3051 Block &initializerEntryBlock = getInitializerRegion().front();
3052
3053 if (initializerEntryBlock.getNumArguments() == 1) {
3054 if (!getAllocRegion().empty())
3055 return emitOpError() << "expects two arguments to the initializer region "
3056 "when an allocation region is used";
3057 } else if (initializerEntryBlock.getNumArguments() == 2) {
3058 if (getAllocRegion().empty())
3059 return emitOpError() << "expects one argument to the initializer region "
3060 "when no allocation region is used";
3061 } else {
3062 return emitOpError()
3063 << "expects one or two arguments to the initializer region";
3064 }
3065
3066 for (mlir::Value arg : initializerEntryBlock.getArguments())
3067 if (arg.getType() != getType())
3068 return emitOpError() << "expects initializer region argument to match "
3069 "the reduction type";
3070
3071 for (YieldOp yieldOp : getInitializerRegion().getOps<YieldOp>()) {
3072 if (yieldOp.getResults().size() != 1 ||
3073 yieldOp.getResults().getTypes()[0] != getType())
3074 return emitOpError() << "expects initializer region to yield a value "
3075 "of the reduction type";
3076 }
3077
3078 if (getReductionRegion().empty())
3079 return emitOpError() << "expects non-empty reduction region";
3080 Block &reductionEntryBlock = getReductionRegion().front();
3081 if (reductionEntryBlock.getNumArguments() != 2 ||
3082 reductionEntryBlock.getArgumentTypes()[0] !=
3083 reductionEntryBlock.getArgumentTypes()[1] ||
3084 reductionEntryBlock.getArgumentTypes()[0] != getType())
3085 return emitOpError() << "expects reduction region with two arguments of "
3086 "the reduction type";
3087 for (YieldOp yieldOp : getReductionRegion().getOps<YieldOp>()) {
3088 if (yieldOp.getResults().size() != 1 ||
3089 yieldOp.getResults().getTypes()[0] != getType())
3090 return emitOpError() << "expects reduction region to yield a value "
3091 "of the reduction type";
3092 }
3093
3094 if (!getAtomicReductionRegion().empty()) {
3095 Block &atomicReductionEntryBlock = getAtomicReductionRegion().front();
3096 if (atomicReductionEntryBlock.getNumArguments() != 2 ||
3097 atomicReductionEntryBlock.getArgumentTypes()[0] !=
3098 atomicReductionEntryBlock.getArgumentTypes()[1])
3099 return emitOpError() << "expects atomic reduction region with two "
3100 "arguments of the same type";
3101 auto ptrType = llvm::dyn_cast<PointerLikeType>(
3102 atomicReductionEntryBlock.getArgumentTypes()[0]);
3103 if (!ptrType ||
3104 (ptrType.getElementType() && ptrType.getElementType() != getType()))
3105 return emitOpError() << "expects atomic reduction region arguments to "
3106 "be accumulators containing the reduction type";
3107 }
3108
3109 if (getCleanupRegion().empty())
3110 return success();
3111 Block &cleanupEntryBlock = getCleanupRegion().front();
3112 if (cleanupEntryBlock.getNumArguments() != 1 ||
3113 cleanupEntryBlock.getArgument(0).getType() != getType())
3114 return emitOpError() << "expects cleanup region with one argument "
3115 "of the reduction type";
3116
3117 return success();
3118}
3119
3120//===----------------------------------------------------------------------===//
3121// TaskOp
3122//===----------------------------------------------------------------------===//
3123
3124void TaskOp::build(OpBuilder &builder, OperationState &state,
3125 const TaskOperands &clauses) {
3126 MLIRContext *ctx = builder.getContext();
3127 TaskOp::build(builder, state, clauses.allocateVars, clauses.allocatorVars,
3128 makeArrayAttr(ctx, clauses.dependKinds), clauses.dependVars,
3129 clauses.final, clauses.ifExpr, clauses.inReductionVars,
3130 makeDenseBoolArrayAttr(ctx, clauses.inReductionByref),
3131 makeArrayAttr(ctx, clauses.inReductionSyms), clauses.mergeable,
3132 clauses.priority, /*private_vars=*/clauses.privateVars,
3133 /*private_syms=*/makeArrayAttr(ctx, clauses.privateSyms),
3134 clauses.privateNeedsBarrier, clauses.untied,
3135 clauses.eventHandle);
3136}
3137
3138LogicalResult TaskOp::verify() {
3139 LogicalResult verifyDependVars =
3140 verifyDependVarList(*this, getDependKinds(), getDependVars());
3141 return failed(verifyDependVars)
3142 ? verifyDependVars
3143 : verifyReductionVarList(*this, getInReductionSyms(),
3144 getInReductionVars(),
3145 getInReductionByref());
3146}
3147
3148//===----------------------------------------------------------------------===//
3149// TaskgroupOp
3150//===----------------------------------------------------------------------===//
3151
3152void TaskgroupOp::build(OpBuilder &builder, OperationState &state,
3153 const TaskgroupOperands &clauses) {
3154 MLIRContext *ctx = builder.getContext();
3155 TaskgroupOp::build(builder, state, clauses.allocateVars,
3156 clauses.allocatorVars, clauses.taskReductionVars,
3157 makeDenseBoolArrayAttr(ctx, clauses.taskReductionByref),
3158 makeArrayAttr(ctx, clauses.taskReductionSyms));
3159}
3160
3161LogicalResult TaskgroupOp::verify() {
3162 return verifyReductionVarList(*this, getTaskReductionSyms(),
3163 getTaskReductionVars(),
3164 getTaskReductionByref());
3165}
3166
3167//===----------------------------------------------------------------------===//
3168// TaskloopOp
3169//===----------------------------------------------------------------------===//
3170
3171void TaskloopOp::build(OpBuilder &builder, OperationState &state,
3172 const TaskloopOperands &clauses) {
3173 MLIRContext *ctx = builder.getContext();
3174 TaskloopOp::build(
3175 builder, state, clauses.allocateVars, clauses.allocatorVars,
3176 clauses.final, clauses.grainsizeMod, clauses.grainsize, clauses.ifExpr,
3177 clauses.inReductionVars,
3178 makeDenseBoolArrayAttr(ctx, clauses.inReductionByref),
3179 makeArrayAttr(ctx, clauses.inReductionSyms), clauses.mergeable,
3180 clauses.nogroup, clauses.numTasksMod, clauses.numTasks, clauses.priority,
3181 /*private_vars=*/clauses.privateVars,
3182 /*private_syms=*/makeArrayAttr(ctx, clauses.privateSyms),
3183 clauses.privateNeedsBarrier, clauses.reductionMod, clauses.reductionVars,
3184 makeDenseBoolArrayAttr(ctx, clauses.reductionByref),
3185 makeArrayAttr(ctx, clauses.reductionSyms), clauses.untied);
3186}
3187
3188LogicalResult TaskloopOp::verify() {
3189 if (getAllocateVars().size() != getAllocatorVars().size())
3190 return emitError(
3191 "expected equal sizes for allocate and allocator variables");
3192 if (failed(verifyReductionVarList(*this, getReductionSyms(),
3193 getReductionVars(), getReductionByref())) ||
3194 failed(verifyReductionVarList(*this, getInReductionSyms(),
3195 getInReductionVars(),
3196 getInReductionByref())))
3197 return failure();
3198
3199 if (!getReductionVars().empty() && getNogroup())
3200 return emitError("if a reduction clause is present on the taskloop "
3201 "directive, the nogroup clause must not be specified");
3202 for (auto var : getReductionVars()) {
3203 if (llvm::is_contained(getInReductionVars(), var))
3204 return emitError("the same list item cannot appear in both a reduction "
3205 "and an in_reduction clause");
3206 }
3207
3208 if (getGrainsize() && getNumTasks()) {
3209 return emitError(
3210 "the grainsize clause and num_tasks clause are mutually exclusive and "
3211 "may not appear on the same taskloop directive");
3212 }
3213
3214 return success();
3215}
3216
3217LogicalResult TaskloopOp::verifyRegions() {
3218 if (LoopWrapperInterface nested = getNestedWrapper()) {
3219 if (!isComposite())
3220 return emitError()
3221 << "'omp.composite' attribute missing from composite wrapper";
3222
3223 // Check for the allowed leaf constructs that may appear in a composite
3224 // construct directly after TASKLOOP.
3225 if (!isa<SimdOp>(nested))
3226 return emitError() << "only supported nested wrapper is 'omp.simd'";
3227 } else if (isComposite()) {
3228 return emitError()
3229 << "'omp.composite' attribute present in non-composite wrapper";
3230 }
3231
3232 return success();
3233}
3234
3235//===----------------------------------------------------------------------===//
3236// LoopNestOp
3237//===----------------------------------------------------------------------===//
3238
3239ParseResult LoopNestOp::parse(OpAsmParser &parser, OperationState &result) {
3240 // Parse an opening `(` followed by induction variables followed by `)`
3243 Type loopVarType;
3245 parser.parseColonType(loopVarType) ||
3246 // Parse loop bounds.
3247 parser.parseEqual() ||
3248 parser.parseOperandList(lbs, ivs.size(), OpAsmParser::Delimiter::Paren) ||
3249 parser.parseKeyword("to") ||
3250 parser.parseOperandList(ubs, ivs.size(), OpAsmParser::Delimiter::Paren))
3251 return failure();
3252
3253 for (auto &iv : ivs)
3254 iv.type = loopVarType;
3255
3256 auto *ctx = parser.getBuilder().getContext();
3257 // Parse "inclusive" flag.
3258 if (succeeded(parser.parseOptionalKeyword("inclusive")))
3259 result.addAttribute("loop_inclusive", UnitAttr::get(ctx));
3260
3261 // Parse step values.
3263 if (parser.parseKeyword("step") ||
3264 parser.parseOperandList(steps, ivs.size(), OpAsmParser::Delimiter::Paren))
3265 return failure();
3266
3267 // Parse collapse
3268 int64_t value = 0;
3269 if (!parser.parseOptionalKeyword("collapse") &&
3270 (parser.parseLParen() || parser.parseInteger(value) ||
3271 parser.parseRParen()))
3272 return failure();
3273 if (value > 1)
3274 result.addAttribute(
3275 "collapse_num_loops",
3276 IntegerAttr::get(parser.getBuilder().getI64Type(), value));
3277
3278 // Parse tiles
3280 auto parseTiles = [&]() -> ParseResult {
3281 int64_t tile;
3282 if (parser.parseInteger(tile))
3283 return failure();
3284 tiles.push_back(tile);
3285 return success();
3286 };
3287
3288 if (!parser.parseOptionalKeyword("tiles") &&
3289 (parser.parseLParen() || parser.parseCommaSeparatedList(parseTiles) ||
3290 parser.parseRParen()))
3291 return failure();
3292
3293 if (tiles.size() > 0)
3294 result.addAttribute("tile_sizes", DenseI64ArrayAttr::get(ctx, tiles));
3295
3296 // Parse the body.
3297 Region *region = result.addRegion();
3298 if (parser.parseRegion(*region, ivs))
3299 return failure();
3300
3301 // Resolve operands.
3302 if (parser.resolveOperands(lbs, loopVarType, result.operands) ||
3303 parser.resolveOperands(ubs, loopVarType, result.operands) ||
3304 parser.resolveOperands(steps, loopVarType, result.operands))
3305 return failure();
3306
3307 // Parse the optional attribute list.
3308 return parser.parseOptionalAttrDict(result.attributes);
3309}
3310
3311void LoopNestOp::print(OpAsmPrinter &p) {
3312 Region &region = getRegion();
3313 auto args = region.getArguments();
3314 p << " (" << args << ") : " << args[0].getType() << " = ("
3315 << getLoopLowerBounds() << ") to (" << getLoopUpperBounds() << ") ";
3316 if (getLoopInclusive())
3317 p << "inclusive ";
3318 p << "step (" << getLoopSteps() << ") ";
3319 if (int64_t numCollapse = getCollapseNumLoops())
3320 if (numCollapse > 1)
3321 p << "collapse(" << numCollapse << ") ";
3322
3323 if (const auto tiles = getTileSizes())
3324 p << "tiles(" << tiles.value() << ") ";
3325
3326 p.printRegion(region, /*printEntryBlockArgs=*/false);
3327}
3328
3329void LoopNestOp::build(OpBuilder &builder, OperationState &state,
3330 const LoopNestOperands &clauses) {
3331 MLIRContext *ctx = builder.getContext();
3332 LoopNestOp::build(builder, state, clauses.collapseNumLoops,
3333 clauses.loopLowerBounds, clauses.loopUpperBounds,
3334 clauses.loopSteps, clauses.loopInclusive,
3335 makeDenseI64ArrayAttr(ctx, clauses.tileSizes));
3336}
3337
3338LogicalResult LoopNestOp::verify() {
3339 if (getLoopLowerBounds().empty())
3340 return emitOpError() << "must represent at least one loop";
3341
3342 if (getLoopLowerBounds().size() != getIVs().size())
3343 return emitOpError() << "number of range arguments and IVs do not match";
3344
3345 for (auto [lb, iv] : llvm::zip_equal(getLoopLowerBounds(), getIVs())) {
3346 if (lb.getType() != iv.getType())
3347 return emitOpError()
3348 << "range argument type does not match corresponding IV type";
3349 }
3350
3351 uint64_t numIVs = getIVs().size();
3352
3353 if (const auto &numCollapse = getCollapseNumLoops())
3354 if (numCollapse > numIVs)
3355 return emitOpError()
3356 << "collapse value is larger than the number of loops";
3357
3358 if (const auto &tiles = getTileSizes())
3359 if (tiles.value().size() > numIVs)
3360 return emitOpError() << "too few canonical loops for tile dimensions";
3361
3362 if (!llvm::dyn_cast_if_present<LoopWrapperInterface>((*this)->getParentOp()))
3363 return emitOpError() << "expects parent op to be a loop wrapper";
3364
3365 return success();
3366}
3367
3368void LoopNestOp::gatherWrappers(
3370 Operation *parent = (*this)->getParentOp();
3371 while (auto wrapper =
3372 llvm::dyn_cast_if_present<LoopWrapperInterface>(parent)) {
3373 wrappers.push_back(wrapper);
3374 parent = parent->getParentOp();
3375 }
3376}
3377
3378//===----------------------------------------------------------------------===//
3379// OpenMP canonical loop handling
3380//===----------------------------------------------------------------------===//
3381
3382std::tuple<NewCliOp, OpOperand *, OpOperand *>
3383mlir::omp ::decodeCli(Value cli) {
3384
3385 // Defining a CLI for a generated loop is optional; if there is none then
3386 // there is no followup-tranformation
3387 if (!cli)
3388 return {{}, nullptr, nullptr};
3389
3390 assert(cli.getType() == CanonicalLoopInfoType::get(cli.getContext()) &&
3391 "Unexpected type of cli");
3392
3393 NewCliOp create = cast<NewCliOp>(cli.getDefiningOp());
3394 OpOperand *gen = nullptr;
3395 OpOperand *cons = nullptr;
3396 for (OpOperand &use : cli.getUses()) {
3397 auto op = cast<LoopTransformationInterface>(use.getOwner());
3398
3399 unsigned opnum = use.getOperandNumber();
3400 if (op.isGeneratee(opnum)) {
3401 assert(!gen && "Each CLI may have at most one def");
3402 gen = &use;
3403 } else if (op.isApplyee(opnum)) {
3404 assert(!cons && "Each CLI may have at most one consumer");
3405 cons = &use;
3406 } else {
3407 llvm_unreachable("Unexpected operand for a CLI");
3408 }
3409 }
3410
3411 return {create, gen, cons};
3412}
3413
3414void NewCliOp::build(::mlir::OpBuilder &odsBuilder,
3415 ::mlir::OperationState &odsState) {
3416 odsState.addTypes(CanonicalLoopInfoType::get(odsBuilder.getContext()));
3417}
3418
3419void NewCliOp::getAsmResultNames(OpAsmSetValueNameFn setNameFn) {
3420 Value result = getResult();
3421 auto [newCli, gen, cons] = decodeCli(result);
3422
3423 // Structured binding `gen` cannot be captured in lambdas before C++20
3424 OpOperand *generator = gen;
3425
3426 // Derive the CLI variable name from its generator:
3427 // * "canonloop" for omp.canonical_loop
3428 // * custom name for loop transformation generatees
3429 // * "cli" as fallback if no generator
3430 // * "_r<idx>" suffix for nested loops, where <idx> is the sequential order
3431 // at that level
3432 // * "_s<idx>" suffix for operations with multiple regions, where <idx> is
3433 // the index of that region
3434 std::string cliName{"cli"};
3435 if (gen) {
3436 cliName =
3438 .Case([&](CanonicalLoopOp op) {
3439 return generateLoopNestingName("canonloop", op);
3440 })
3441 .Case([&](UnrollHeuristicOp op) -> std::string {
3442 llvm_unreachable("heuristic unrolling does not generate a loop");
3443 })
3444 .Case([&](TileOp op) -> std::string {
3445 auto [generateesFirst, generateesCount] =
3446 op.getGenerateesODSOperandIndexAndLength();
3447 unsigned firstGrid = generateesFirst;
3448 unsigned firstIntratile = generateesFirst + generateesCount / 2;
3449 unsigned end = generateesFirst + generateesCount;
3450 unsigned opnum = generator->getOperandNumber();
3451 // In the OpenMP apply and looprange clauses, indices are 1-based
3452 if (firstGrid <= opnum && opnum < firstIntratile) {
3453 unsigned gridnum = opnum - firstGrid + 1;
3454 return ("grid" + Twine(gridnum)).str();
3455 }
3456 if (firstIntratile <= opnum && opnum < end) {
3457 unsigned intratilenum = opnum - firstIntratile + 1;
3458 return ("intratile" + Twine(intratilenum)).str();
3459 }
3460 llvm_unreachable("Unexpected generatee argument");
3461 })
3462 .DefaultUnreachable("TODO: Custom name for this operation");
3463 }
3464
3465 setNameFn(result, cliName);
3466}
3467
3468LogicalResult NewCliOp::verify() {
3469 Value cli = getResult();
3470
3471 assert(cli.getType() == CanonicalLoopInfoType::get(cli.getContext()) &&
3472 "Unexpected type of cli");
3473
3474 // Check that the CLI is used in at most generator and one consumer
3475 OpOperand *gen = nullptr;
3476 OpOperand *cons = nullptr;
3477 for (mlir::OpOperand &use : cli.getUses()) {
3478 auto op = cast<mlir::omp::LoopTransformationInterface>(use.getOwner());
3479
3480 unsigned opnum = use.getOperandNumber();
3481 if (op.isGeneratee(opnum)) {
3482 if (gen) {
3483 InFlightDiagnostic error =
3484 emitOpError("CLI must have at most one generator");
3485 error.attachNote(gen->getOwner()->getLoc())
3486 .append("first generator here:");
3487 error.attachNote(use.getOwner()->getLoc())
3488 .append("second generator here:");
3489 return error;
3490 }
3491
3492 gen = &use;
3493 } else if (op.isApplyee(opnum)) {
3494 if (cons) {
3495 InFlightDiagnostic error =
3496 emitOpError("CLI must have at most one consumer");
3497 error.attachNote(cons->getOwner()->getLoc())
3498 .append("first consumer here:")
3499 .appendOp(*cons->getOwner(),
3500 OpPrintingFlags().printGenericOpForm());
3501 error.attachNote(use.getOwner()->getLoc())
3502 .append("second consumer here:")
3503 .appendOp(*use.getOwner(), OpPrintingFlags().printGenericOpForm());
3504 return error;
3505 }
3506
3507 cons = &use;
3508 } else {
3509 llvm_unreachable("Unexpected operand for a CLI");
3510 }
3511 }
3512
3513 // If the CLI is source of a transformation, it must have a generator
3514 if (cons && !gen) {
3515 InFlightDiagnostic error = emitOpError("CLI has no generator");
3516 error.attachNote(cons->getOwner()->getLoc())
3517 .append("see consumer here: ")
3518 .appendOp(*cons->getOwner(), OpPrintingFlags().printGenericOpForm());
3519 return error;
3520 }
3521
3522 return success();
3523}
3524
3525void CanonicalLoopOp::build(OpBuilder &odsBuilder, OperationState &odsState,
3526 Value tripCount) {
3527 odsState.addOperands(tripCount);
3528 odsState.addOperands(Value());
3529 (void)odsState.addRegion();
3530}
3531
3532void CanonicalLoopOp::build(OpBuilder &odsBuilder, OperationState &odsState,
3533 Value tripCount, ::mlir::Value cli) {
3534 odsState.addOperands(tripCount);
3535 odsState.addOperands(cli);
3536 (void)odsState.addRegion();
3537}
3538
3539void CanonicalLoopOp::getAsmBlockNames(OpAsmSetBlockNameFn setNameFn) {
3540 setNameFn(&getRegion().front(), "body_entry");
3541}
3542
3543void CanonicalLoopOp::getAsmBlockArgumentNames(Region &region,
3544 OpAsmSetValueNameFn setNameFn) {
3545 std::string ivName = generateLoopNestingName("iv", *this);
3546 setNameFn(region.getArgument(0), ivName);
3547}
3548
3549void CanonicalLoopOp::print(OpAsmPrinter &p) {
3550 if (getCli())
3551 p << '(' << getCli() << ')';
3552 p << ' ' << getInductionVar() << " : " << getInductionVar().getType()
3553 << " in range(" << getTripCount() << ") ";
3554
3555 p.printRegion(getRegion(), /*printEntryBlockArgs=*/false,
3556 /*printBlockTerminators=*/true);
3557
3558 p.printOptionalAttrDict((*this)->getAttrs());
3559}
3560
3561mlir::ParseResult CanonicalLoopOp::parse(::mlir::OpAsmParser &parser,
3563 CanonicalLoopInfoType cliType =
3564 CanonicalLoopInfoType::get(parser.getContext());
3565
3566 // Parse (optional) omp.cli identifier
3568 SmallVector<mlir::Value, 1> cliOperand;
3569 if (!parser.parseOptionalLParen()) {
3570 if (parser.parseOperand(cli) ||
3571 parser.resolveOperand(cli, cliType, cliOperand) || parser.parseRParen())
3572 return failure();
3573 }
3574
3575 // We derive the type of tripCount from inductionVariable. MLIR requires the
3576 // type of tripCount to be known when calling resolveOperand so we have parse
3577 // the type before processing the inductionVariable.
3578 OpAsmParser::Argument inductionVariable;
3580 if (parser.parseArgument(inductionVariable, /*allowType*/ true) ||
3581 parser.parseKeyword("in") || parser.parseKeyword("range") ||
3582 parser.parseLParen() || parser.parseOperand(tripcount) ||
3583 parser.parseRParen() ||
3584 parser.resolveOperand(tripcount, inductionVariable.type, result.operands))
3585 return failure();
3586
3587 // Parse the loop body.
3588 Region *region = result.addRegion();
3589 if (parser.parseRegion(*region, {inductionVariable}))
3590 return failure();
3591
3592 // We parsed the cli operand forst, but because it is optional, it must be
3593 // last in the operand list.
3594 result.operands.append(cliOperand);
3595
3596 // Parse the optional attribute list.
3597 if (parser.parseOptionalAttrDict(result.attributes))
3598 return failure();
3599
3600 return mlir::success();
3601}
3602
3603LogicalResult CanonicalLoopOp::verify() {
3604 // The region's entry must accept the induction variable
3605 // It can also be empty if just created
3606 if (!getRegion().empty()) {
3607 Region &region = getRegion();
3608 if (region.getNumArguments() != 1)
3609 return emitOpError(
3610 "Canonical loop region must have exactly one argument");
3611
3612 if (getInductionVar().getType() != getTripCount().getType())
3613 return emitOpError(
3614 "Region argument must be the same type as the trip count");
3615 }
3616
3617 return success();
3618}
3619
3620Value CanonicalLoopOp::getInductionVar() { return getRegion().getArgument(0); }
3621
3622std::pair<unsigned, unsigned>
3623CanonicalLoopOp::getApplyeesODSOperandIndexAndLength() {
3624 // No applyees
3625 return {0, 0};
3626}
3627
3628std::pair<unsigned, unsigned>
3629CanonicalLoopOp::getGenerateesODSOperandIndexAndLength() {
3630 return getODSOperandIndexAndLength(odsIndex_cli);
3631}
3632
3633//===----------------------------------------------------------------------===//
3634// UnrollHeuristicOp
3635//===----------------------------------------------------------------------===//
3636
3637void UnrollHeuristicOp::build(::mlir::OpBuilder &odsBuilder,
3638 ::mlir::OperationState &odsState,
3639 ::mlir::Value cli) {
3640 odsState.addOperands(cli);
3641}
3642
3643void UnrollHeuristicOp::print(OpAsmPrinter &p) {
3644 p << '(' << getApplyee() << ')';
3645
3646 p.printOptionalAttrDict((*this)->getAttrs());
3647}
3648
3649mlir::ParseResult UnrollHeuristicOp::parse(::mlir::OpAsmParser &parser,
3651 auto cliType = CanonicalLoopInfoType::get(parser.getContext());
3652
3653 if (parser.parseLParen())
3654 return failure();
3655
3657 if (parser.parseOperand(applyee) ||
3658 parser.resolveOperand(applyee, cliType, result.operands))
3659 return failure();
3660
3661 if (parser.parseRParen())
3662 return failure();
3663
3664 // Optional output loop (full unrolling has none)
3665 if (!parser.parseOptionalArrow()) {
3666 if (parser.parseLParen() || parser.parseRParen())
3667 return failure();
3668 }
3669
3670 // Parse the optional attribute list.
3671 if (parser.parseOptionalAttrDict(result.attributes))
3672 return failure();
3673
3674 return mlir::success();
3675}
3676
3677std::pair<unsigned, unsigned>
3678UnrollHeuristicOp ::getApplyeesODSOperandIndexAndLength() {
3679 return getODSOperandIndexAndLength(odsIndex_applyee);
3680}
3681
3682std::pair<unsigned, unsigned>
3683UnrollHeuristicOp::getGenerateesODSOperandIndexAndLength() {
3684 return {0, 0};
3685}
3686
3687//===----------------------------------------------------------------------===//
3688// TileOp
3689//===----------------------------------------------------------------------===//
3690
3691static void printLoopTransformClis(OpAsmPrinter &p, TileOp op,
3692 OperandRange generatees,
3693 OperandRange applyees) {
3694 if (!generatees.empty())
3695 p << '(' << llvm::interleaved(generatees) << ')';
3696
3697 if (!applyees.empty())
3698 p << " <- (" << llvm::interleaved(applyees) << ')';
3699}
3700
3701static ParseResult parseLoopTransformClis(
3702 OpAsmParser &parser,
3705 if (parser.parseOptionalLess()) {
3706 // Syntax 1: generatees present
3707
3708 if (parser.parseOperandList(generateesOperands,
3710 return failure();
3711
3712 if (parser.parseLess())
3713 return failure();
3714 } else {
3715 // Syntax 2: generatees omitted
3716 }
3717
3718 // Parse `<-` (`<` has already been parsed)
3719 if (parser.parseMinus())
3720 return failure();
3721
3722 if (parser.parseOperandList(applyeesOperands,
3724 return failure();
3725
3726 return success();
3727}
3728
3729LogicalResult TileOp::verify() {
3730 if (getApplyees().empty())
3731 return emitOpError() << "must apply to at least one loop";
3732
3733 if (getSizes().size() != getApplyees().size())
3734 return emitOpError() << "there must be one tile size for each applyee";
3735
3736 if (!getGeneratees().empty() &&
3737 2 * getSizes().size() != getGeneratees().size())
3738 return emitOpError()
3739 << "expecting two times the number of generatees than applyees";
3740
3741 DenseSet<Value> parentIVs;
3742
3743 Value parent = getApplyees().front();
3744 for (auto &&applyee : llvm::drop_begin(getApplyees())) {
3745 auto [parentCreate, parentGen, parentCons] = decodeCli(parent);
3746 auto [create, gen, cons] = decodeCli(applyee);
3747
3748 if (!parentGen)
3749 return emitOpError() << "applyee CLI has no generator";
3750
3751 auto parentLoop = dyn_cast_or_null<CanonicalLoopOp>(parentGen->getOwner());
3752 if (!parentGen)
3753 return emitOpError()
3754 << "currently only supports omp.canonical_loop as applyee";
3755
3756 parentIVs.insert(parentLoop.getInductionVar());
3757
3758 if (!gen)
3759 return emitOpError() << "applyee CLI has no generator";
3760 auto loop = dyn_cast_or_null<CanonicalLoopOp>(gen->getOwner());
3761 if (!loop)
3762 return emitOpError()
3763 << "currently only supports omp.canonical_loop as applyee";
3764
3765 // Canonical loop must be perfectly nested, i.e. the body of the parent must
3766 // only contain the omp.canonical_loop of the nested loops, and
3767 // omp.terminator
3768 bool isPerfectlyNested = [&]() {
3769 auto &parentBody = parentLoop.getRegion();
3770 if (!parentBody.hasOneBlock())
3771 return false;
3772 auto &parentBlock = parentBody.getBlocks().front();
3773
3774 auto nestedLoopIt = parentBlock.begin();
3775 if (nestedLoopIt == parentBlock.end() ||
3776 (&*nestedLoopIt != loop.getOperation()))
3777 return false;
3778
3779 auto termIt = std::next(nestedLoopIt);
3780 if (termIt == parentBlock.end() || !isa<TerminatorOp>(termIt))
3781 return false;
3782
3783 if (std::next(termIt) != parentBlock.end())
3784 return false;
3785
3786 return true;
3787 }();
3788 if (!isPerfectlyNested)
3789 return emitOpError() << "tiled loop nest must be perfectly nested";
3790
3791 if (parentIVs.contains(loop.getTripCount()))
3792 return emitOpError() << "tiled loop nest must be rectangular";
3793
3794 parent = applyee;
3795 }
3796
3797 // TODO: The tile sizes must be computed before the loop, but checking this
3798 // requires dominance analysis. For instance:
3799 //
3800 // %canonloop = omp.new_cli
3801 // omp.canonical_loop(%canonloop) %iv : i32 in range(%tc) {
3802 // // write to %x
3803 // omp.terminator
3804 // }
3805 // %ts = llvm.load %x
3806 // omp.tile <- (%canonloop) sizes(%ts : i32)
3807
3808 return success();
3809}
3810
3811std::pair<unsigned, unsigned> TileOp ::getApplyeesODSOperandIndexAndLength() {
3812 return getODSOperandIndexAndLength(odsIndex_applyees);
3813}
3814
3815std::pair<unsigned, unsigned> TileOp::getGenerateesODSOperandIndexAndLength() {
3816 return getODSOperandIndexAndLength(odsIndex_generatees);
3817}
3818
3819//===----------------------------------------------------------------------===//
3820// Critical construct (2.17.1)
3821//===----------------------------------------------------------------------===//
3822
3823void CriticalDeclareOp::build(OpBuilder &builder, OperationState &state,
3824 const CriticalDeclareOperands &clauses) {
3825 CriticalDeclareOp::build(builder, state, clauses.symName, clauses.hint);
3826}
3827
3828LogicalResult CriticalDeclareOp::verify() {
3829 return verifySynchronizationHint(*this, getHint());
3830}
3831
3832LogicalResult CriticalOp::verifySymbolUses(SymbolTableCollection &symbolTable) {
3833 if (getNameAttr()) {
3834 SymbolRefAttr symbolRef = getNameAttr();
3835 auto decl = symbolTable.lookupNearestSymbolFrom<CriticalDeclareOp>(
3836 *this, symbolRef);
3837 if (!decl) {
3838 return emitOpError() << "expected symbol reference " << symbolRef
3839 << " to point to a critical declaration";
3840 }
3841 }
3842
3843 return success();
3844}
3845
3846//===----------------------------------------------------------------------===//
3847// Ordered construct
3848//===----------------------------------------------------------------------===//
3849
3850static LogicalResult verifyOrderedParent(Operation &op) {
3851 bool hasRegion = op.getNumRegions() > 0;
3852 auto loopOp = op.getParentOfType<LoopNestOp>();
3853 if (!loopOp) {
3854 if (hasRegion)
3855 return success();
3856
3857 // TODO: Consider if this needs to be the case only for the standalone
3858 // variant of the ordered construct.
3859 return op.emitOpError() << "must be nested inside of a loop";
3860 }
3861
3862 Operation *wrapper = loopOp->getParentOp();
3863 if (auto wsloopOp = dyn_cast<WsloopOp>(wrapper)) {
3864 IntegerAttr orderedAttr = wsloopOp.getOrderedAttr();
3865 if (!orderedAttr)
3866 return op.emitOpError() << "the enclosing worksharing-loop region must "
3867 "have an ordered clause";
3868
3869 if (hasRegion && orderedAttr.getInt() != 0)
3870 return op.emitOpError() << "the enclosing loop's ordered clause must not "
3871 "have a parameter present";
3872
3873 if (!hasRegion && orderedAttr.getInt() == 0)
3874 return op.emitOpError() << "the enclosing loop's ordered clause must "
3875 "have a parameter present";
3876 } else if (!isa<SimdOp>(wrapper)) {
3877 return op.emitOpError() << "must be nested inside of a worksharing, simd "
3878 "or worksharing simd loop";
3879 }
3880 return success();
3881}
3882
3883void OrderedOp::build(OpBuilder &builder, OperationState &state,
3884 const OrderedOperands &clauses) {
3885 OrderedOp::build(builder, state, clauses.doacrossDependType,
3886 clauses.doacrossNumLoops, clauses.doacrossDependVars);
3887}
3888
3889LogicalResult OrderedOp::verify() {
3890 if (failed(verifyOrderedParent(**this)))
3891 return failure();
3892
3893 auto wrapper = (*this)->getParentOfType<WsloopOp>();
3894 if (!wrapper || *wrapper.getOrdered() != *getDoacrossNumLoops())
3895 return emitOpError() << "number of variables in depend clause does not "
3896 << "match number of iteration variables in the "
3897 << "doacross loop";
3898
3899 return success();
3900}
3901
3902void OrderedRegionOp::build(OpBuilder &builder, OperationState &state,
3903 const OrderedRegionOperands &clauses) {
3904 OrderedRegionOp::build(builder, state, clauses.parLevelSimd);
3905}
3906
3907LogicalResult OrderedRegionOp::verify() { return verifyOrderedParent(**this); }
3908
3909//===----------------------------------------------------------------------===//
3910// TaskwaitOp
3911//===----------------------------------------------------------------------===//
3912
3913void TaskwaitOp::build(OpBuilder &builder, OperationState &state,
3914 const TaskwaitOperands &clauses) {
3915 // TODO Store clauses in op: dependKinds, dependVars, nowait.
3916 TaskwaitOp::build(builder, state, /*depend_kinds=*/nullptr,
3917 /*depend_vars=*/{}, /*nowait=*/nullptr);
3918}
3919
3920//===----------------------------------------------------------------------===//
3921// Verifier for AtomicReadOp
3922//===----------------------------------------------------------------------===//
3923
3924LogicalResult AtomicReadOp::verify() {
3925 if (verifyCommon().failed())
3926 return mlir::failure();
3927
3928 if (auto mo = getMemoryOrder()) {
3929 if (*mo == ClauseMemoryOrderKind::Acq_rel ||
3930 *mo == ClauseMemoryOrderKind::Release) {
3931 return emitError(
3932 "memory-order must not be acq_rel or release for atomic reads");
3933 }
3934 }
3935 return verifySynchronizationHint(*this, getHint());
3936}
3937
3938//===----------------------------------------------------------------------===//
3939// Verifier for AtomicWriteOp
3940//===----------------------------------------------------------------------===//
3941
3942LogicalResult AtomicWriteOp::verify() {
3943 if (verifyCommon().failed())
3944 return mlir::failure();
3945
3946 if (auto mo = getMemoryOrder()) {
3947 if (*mo == ClauseMemoryOrderKind::Acq_rel ||
3948 *mo == ClauseMemoryOrderKind::Acquire) {
3949 return emitError(
3950 "memory-order must not be acq_rel or acquire for atomic writes");
3951 }
3952 }
3953 return verifySynchronizationHint(*this, getHint());
3954}
3955
3956//===----------------------------------------------------------------------===//
3957// Verifier for AtomicUpdateOp
3958//===----------------------------------------------------------------------===//
3959
3960LogicalResult AtomicUpdateOp::canonicalize(AtomicUpdateOp op,
3961 PatternRewriter &rewriter) {
3962 if (op.isNoOp()) {
3963 rewriter.eraseOp(op);
3964 return success();
3965 }
3966 if (Value writeVal = op.getWriteOpVal()) {
3967 rewriter.replaceOpWithNewOp<AtomicWriteOp>(
3968 op, op.getX(), writeVal, op.getHintAttr(), op.getMemoryOrderAttr());
3969 return success();
3970 }
3971 return failure();
3972}
3973
3974LogicalResult AtomicUpdateOp::verify() {
3975 if (verifyCommon().failed())
3976 return mlir::failure();
3977
3978 if (auto mo = getMemoryOrder()) {
3979 if (*mo == ClauseMemoryOrderKind::Acq_rel ||
3980 *mo == ClauseMemoryOrderKind::Acquire) {
3981 return emitError(
3982 "memory-order must not be acq_rel or acquire for atomic updates");
3983 }
3984 }
3985
3986 return verifySynchronizationHint(*this, getHint());
3987}
3988
3989LogicalResult AtomicUpdateOp::verifyRegions() { return verifyRegionsCommon(); }
3990
3991//===----------------------------------------------------------------------===//
3992// Verifier for AtomicCaptureOp
3993//===----------------------------------------------------------------------===//
3994
3995AtomicReadOp AtomicCaptureOp::getAtomicReadOp() {
3996 if (auto op = dyn_cast<AtomicReadOp>(getFirstOp()))
3997 return op;
3998 return dyn_cast<AtomicReadOp>(getSecondOp());
3999}
4000
4001AtomicWriteOp AtomicCaptureOp::getAtomicWriteOp() {
4002 if (auto op = dyn_cast<AtomicWriteOp>(getFirstOp()))
4003 return op;
4004 return dyn_cast<AtomicWriteOp>(getSecondOp());
4005}
4006
4007AtomicUpdateOp AtomicCaptureOp::getAtomicUpdateOp() {
4008 if (auto op = dyn_cast<AtomicUpdateOp>(getFirstOp()))
4009 return op;
4010 return dyn_cast<AtomicUpdateOp>(getSecondOp());
4011}
4012
4013LogicalResult AtomicCaptureOp::verify() {
4014 return verifySynchronizationHint(*this, getHint());
4015}
4016
4017LogicalResult AtomicCaptureOp::verifyRegions() {
4018 if (verifyRegionsCommon().failed())
4019 return mlir::failure();
4020
4021 if (getFirstOp()->getAttr("hint") || getSecondOp()->getAttr("hint"))
4022 return emitOpError(
4023 "operations inside capture region must not have hint clause");
4024
4025 if (getFirstOp()->getAttr("memory_order") ||
4026 getSecondOp()->getAttr("memory_order"))
4027 return emitOpError(
4028 "operations inside capture region must not have memory_order clause");
4029 return success();
4030}
4031
4032//===----------------------------------------------------------------------===//
4033// CancelOp
4034//===----------------------------------------------------------------------===//
4035
4036void CancelOp::build(OpBuilder &builder, OperationState &state,
4037 const CancelOperands &clauses) {
4038 CancelOp::build(builder, state, clauses.cancelDirective, clauses.ifExpr);
4039}
4040
4042 Operation *parent = thisOp->getParentOp();
4043 while (parent) {
4044 if (parent->getDialect() == thisOp->getDialect())
4045 return parent;
4046 parent = parent->getParentOp();
4047 }
4048 return nullptr;
4049}
4050
4051LogicalResult CancelOp::verify() {
4052 ClauseCancellationConstructType cct = getCancelDirective();
4053 // The next OpenMP operation in the chain of parents
4054 Operation *structuralParent = getParentInSameDialect((*this).getOperation());
4055 if (!structuralParent)
4056 return emitOpError() << "Orphaned cancel construct";
4057
4058 if ((cct == ClauseCancellationConstructType::Parallel) &&
4059 !mlir::isa<ParallelOp>(structuralParent)) {
4060 return emitOpError() << "cancel parallel must appear "
4061 << "inside a parallel region";
4062 }
4063 if (cct == ClauseCancellationConstructType::Loop) {
4064 // structural parent will be omp.loop_nest, directly nested inside
4065 // omp.wsloop
4066 auto wsloopOp = mlir::dyn_cast<WsloopOp>(structuralParent->getParentOp());
4067
4068 if (!wsloopOp) {
4069 return emitOpError()
4070 << "cancel loop must appear inside a worksharing-loop region";
4071 }
4072 if (wsloopOp.getNowaitAttr()) {
4073 return emitError() << "A worksharing construct that is canceled "
4074 << "must not have a nowait clause";
4075 }
4076 if (wsloopOp.getOrderedAttr()) {
4077 return emitError() << "A worksharing construct that is canceled "
4078 << "must not have an ordered clause";
4079 }
4080
4081 } else if (cct == ClauseCancellationConstructType::Sections) {
4082 // structural parent will be an omp.section, directly nested inside
4083 // omp.sections
4084 auto sectionsOp =
4085 mlir::dyn_cast<SectionsOp>(structuralParent->getParentOp());
4086 if (!sectionsOp) {
4087 return emitOpError() << "cancel sections must appear "
4088 << "inside a sections region";
4089 }
4090 if (sectionsOp.getNowait()) {
4091 return emitError() << "A sections construct that is canceled "
4092 << "must not have a nowait clause";
4093 }
4094 }
4095 if ((cct == ClauseCancellationConstructType::Taskgroup) &&
4096 (!mlir::isa<omp::TaskOp>(structuralParent) &&
4097 !mlir::isa<omp::TaskloopOp>(structuralParent->getParentOp()))) {
4098 return emitOpError() << "cancel taskgroup must appear "
4099 << "inside a task region";
4100 }
4101 return success();
4102}
4103
4104//===----------------------------------------------------------------------===//
4105// CancellationPointOp
4106//===----------------------------------------------------------------------===//
4107
4108void CancellationPointOp::build(OpBuilder &builder, OperationState &state,
4109 const CancellationPointOperands &clauses) {
4110 CancellationPointOp::build(builder, state, clauses.cancelDirective);
4111}
4112
4113LogicalResult CancellationPointOp::verify() {
4114 ClauseCancellationConstructType cct = getCancelDirective();
4115 // The next OpenMP operation in the chain of parents
4116 Operation *structuralParent = getParentInSameDialect((*this).getOperation());
4117 if (!structuralParent)
4118 return emitOpError() << "Orphaned cancellation point";
4119
4120 if ((cct == ClauseCancellationConstructType::Parallel) &&
4121 !mlir::isa<ParallelOp>(structuralParent)) {
4122 return emitOpError() << "cancellation point parallel must appear "
4123 << "inside a parallel region";
4124 }
4125 // Strucutal parent here will be an omp.loop_nest. Get the parent of that to
4126 // find the wsloop
4127 if ((cct == ClauseCancellationConstructType::Loop) &&
4128 !mlir::isa<WsloopOp>(structuralParent->getParentOp())) {
4129 return emitOpError() << "cancellation point loop must appear "
4130 << "inside a worksharing-loop region";
4131 }
4132 if ((cct == ClauseCancellationConstructType::Sections) &&
4133 !mlir::isa<omp::SectionOp>(structuralParent)) {
4134 return emitOpError() << "cancellation point sections must appear "
4135 << "inside a sections region";
4136 }
4137 if ((cct == ClauseCancellationConstructType::Taskgroup) &&
4138 (!mlir::isa<omp::TaskOp>(structuralParent) &&
4139 !mlir::isa<omp::TaskloopOp>(structuralParent->getParentOp()))) {
4140 return emitOpError() << "cancellation point taskgroup must appear "
4141 << "inside a task region";
4142 }
4143 return success();
4144}
4145
4146//===----------------------------------------------------------------------===//
4147// MapBoundsOp
4148//===----------------------------------------------------------------------===//
4149
4150LogicalResult MapBoundsOp::verify() {
4151 auto extent = getExtent();
4152 auto upperbound = getUpperBound();
4153 if (!extent && !upperbound)
4154 return emitError("expected extent or upperbound.");
4155 return success();
4156}
4157
4158void PrivateClauseOp::build(OpBuilder &odsBuilder, OperationState &odsState,
4159 TypeRange /*result_types*/, StringAttr symName,
4160 TypeAttr type) {
4161 PrivateClauseOp::build(
4162 odsBuilder, odsState, symName, type,
4163 DataSharingClauseTypeAttr::get(odsBuilder.getContext(),
4164 DataSharingClauseType::Private));
4165}
4166
4167LogicalResult PrivateClauseOp::verifyRegions() {
4168 Type argType = getArgType();
4169 auto verifyTerminator = [&](Operation *terminator,
4170 bool yieldsValue) -> LogicalResult {
4171 if (!terminator->getBlock()->getSuccessors().empty())
4172 return success();
4173
4174 if (!llvm::isa<YieldOp>(terminator))
4175 return mlir::emitError(terminator->getLoc())
4176 << "expected exit block terminator to be an `omp.yield` op.";
4177
4178 YieldOp yieldOp = llvm::cast<YieldOp>(terminator);
4179 TypeRange yieldedTypes = yieldOp.getResults().getTypes();
4180
4181 if (!yieldsValue) {
4182 if (yieldedTypes.empty())
4183 return success();
4184
4185 return mlir::emitError(terminator->getLoc())
4186 << "Did not expect any values to be yielded.";
4187 }
4188
4189 if (yieldedTypes.size() == 1 && yieldedTypes.front() == argType)
4190 return success();
4191
4192 auto error = mlir::emitError(yieldOp.getLoc())
4193 << "Invalid yielded value. Expected type: " << argType
4194 << ", got: ";
4195
4196 if (yieldedTypes.empty())
4197 error << "None";
4198 else
4199 error << yieldedTypes;
4200
4201 return error;
4202 };
4203
4204 auto verifyRegion = [&](Region &region, unsigned expectedNumArgs,
4205 StringRef regionName,
4206 bool yieldsValue) -> LogicalResult {
4207 assert(!region.empty());
4208
4209 if (region.getNumArguments() != expectedNumArgs)
4210 return mlir::emitError(region.getLoc())
4211 << "`" << regionName << "`: "
4212 << "expected " << expectedNumArgs
4213 << " region arguments, got: " << region.getNumArguments();
4214
4215 for (Block &block : region) {
4216 // MLIR will verify the absence of the terminator for us.
4217 if (!block.mightHaveTerminator())
4218 continue;
4219
4220 if (failed(verifyTerminator(block.getTerminator(), yieldsValue)))
4221 return failure();
4222 }
4223
4224 return success();
4225 };
4226
4227 // Ensure all of the region arguments have the same type
4228 for (Region *region : getRegions())
4229 for (Type ty : region->getArgumentTypes())
4230 if (ty != argType)
4231 return emitError() << "Region argument type mismatch: got " << ty
4232 << " expected " << argType << ".";
4233
4234 mlir::Region &initRegion = getInitRegion();
4235 if (!initRegion.empty() &&
4236 failed(verifyRegion(getInitRegion(), /*expectedNumArgs=*/2, "init",
4237 /*yieldsValue=*/true)))
4238 return failure();
4239
4240 DataSharingClauseType dsType = getDataSharingType();
4241
4242 if (dsType == DataSharingClauseType::Private && !getCopyRegion().empty())
4243 return emitError("`private` clauses do not require a `copy` region.");
4244
4245 if (dsType == DataSharingClauseType::FirstPrivate && getCopyRegion().empty())
4246 return emitError(
4247 "`firstprivate` clauses require at least a `copy` region.");
4248
4249 if (dsType == DataSharingClauseType::FirstPrivate &&
4250 failed(verifyRegion(getCopyRegion(), /*expectedNumArgs=*/2, "copy",
4251 /*yieldsValue=*/true)))
4252 return failure();
4253
4254 if (!getDeallocRegion().empty() &&
4255 failed(verifyRegion(getDeallocRegion(), /*expectedNumArgs=*/1, "dealloc",
4256 /*yieldsValue=*/false)))
4257 return failure();
4258
4259 return success();
4260}
4261
4262//===----------------------------------------------------------------------===//
4263// Spec 5.2: Masked construct (10.5)
4264//===----------------------------------------------------------------------===//
4265
4266void MaskedOp::build(OpBuilder &builder, OperationState &state,
4267 const MaskedOperands &clauses) {
4268 MaskedOp::build(builder, state, clauses.filteredThreadId);
4269}
4270
4271//===----------------------------------------------------------------------===//
4272// Spec 5.2: Scan construct (5.6)
4273//===----------------------------------------------------------------------===//
4274
4275void ScanOp::build(OpBuilder &builder, OperationState &state,
4276 const ScanOperands &clauses) {
4277 ScanOp::build(builder, state, clauses.inclusiveVars, clauses.exclusiveVars);
4278}
4279
4280LogicalResult ScanOp::verify() {
4281 if (hasExclusiveVars() == hasInclusiveVars())
4282 return emitError(
4283 "Exactly one of EXCLUSIVE or INCLUSIVE clause is expected");
4284 if (WsloopOp parentWsLoopOp = (*this)->getParentOfType<WsloopOp>()) {
4285 if (parentWsLoopOp.getReductionModAttr() &&
4286 parentWsLoopOp.getReductionModAttr().getValue() ==
4287 ReductionModifier::inscan)
4288 return success();
4289 }
4290 if (SimdOp parentSimdOp = (*this)->getParentOfType<SimdOp>()) {
4291 if (parentSimdOp.getReductionModAttr() &&
4292 parentSimdOp.getReductionModAttr().getValue() ==
4293 ReductionModifier::inscan)
4294 return success();
4295 }
4296 return emitError("SCAN directive needs to be enclosed within a parent "
4297 "worksharing loop construct or SIMD construct with INSCAN "
4298 "reduction modifier");
4299}
4300
4301/// Verifies align clause in allocate directive
4302
4303LogicalResult AllocateDirOp::verify() {
4304 std::optional<uint64_t> align = this->getAlign();
4305
4306 if (align.has_value()) {
4307 if ((align.value() > 0) && !llvm::has_single_bit(align.value()))
4308 return emitError() << "ALIGN value : " << align.value()
4309 << " must be power of 2";
4310 }
4311
4312 return success();
4313}
4314
4315//===----------------------------------------------------------------------===//
4316// TargetAllocMemOp
4317//===----------------------------------------------------------------------===//
4318
4319mlir::Type omp::TargetAllocMemOp::getAllocatedType() {
4320 return getInTypeAttr().getValue();
4321}
4322
4323/// operation ::= %res = (`omp.target_alloc_mem`) $device : devicetype,
4324/// $in_type ( `(` $typeparams `)` )? ( `,` $shape )?
4325/// attr-dict-without-keyword
4326static mlir::ParseResult parseTargetAllocMemOp(mlir::OpAsmParser &parser,
4328 auto &builder = parser.getBuilder();
4329 bool hasOperands = false;
4330 std::int32_t typeparamsSize = 0;
4331
4332 // Parse device number as a new operand
4334 mlir::Type deviceType;
4335 if (parser.parseOperand(deviceOperand) || parser.parseColonType(deviceType))
4336 return mlir::failure();
4337 if (parser.resolveOperand(deviceOperand, deviceType, result.operands))
4338 return mlir::failure();
4339 if (parser.parseComma())
4340 return mlir::failure();
4341
4342 mlir::Type intype;
4343 if (parser.parseType(intype))
4344 return mlir::failure();
4345 result.addAttribute("in_type", mlir::TypeAttr::get(intype));
4348 if (!parser.parseOptionalLParen()) {
4349 // parse the LEN params of the derived type. (<params> : <types>)
4351 parser.parseColonTypeList(typeVec) || parser.parseRParen())
4352 return mlir::failure();
4353 typeparamsSize = operands.size();
4354 hasOperands = true;
4355 }
4356 std::int32_t shapeSize = 0;
4357 if (!parser.parseOptionalComma()) {
4358 // parse size to scale by, vector of n dimensions of type index
4360 return mlir::failure();
4361 shapeSize = operands.size() - typeparamsSize;
4362 auto idxTy = builder.getIndexType();
4363 for (std::int32_t i = typeparamsSize, end = operands.size(); i != end; ++i)
4364 typeVec.push_back(idxTy);
4365 hasOperands = true;
4366 }
4367 if (hasOperands &&
4368 parser.resolveOperands(operands, typeVec, parser.getNameLoc(),
4369 result.operands))
4370 return mlir::failure();
4371
4372 mlir::Type restype = builder.getIntegerType(64);
4373 if (!restype) {
4374 parser.emitError(parser.getNameLoc(), "invalid allocate type: ") << intype;
4375 return mlir::failure();
4376 }
4377 llvm::SmallVector<std::int32_t> segmentSizes{1, typeparamsSize, shapeSize};
4378 result.addAttribute("operandSegmentSizes",
4379 builder.getDenseI32ArrayAttr(segmentSizes));
4380 if (parser.parseOptionalAttrDict(result.attributes) ||
4381 parser.addTypeToList(restype, result.types))
4382 return mlir::failure();
4383 return mlir::success();
4384}
4385
4386mlir::ParseResult omp::TargetAllocMemOp::parse(mlir::OpAsmParser &parser,
4388 return parseTargetAllocMemOp(parser, result);
4389}
4390
4391void omp::TargetAllocMemOp::print(mlir::OpAsmPrinter &p) {
4392 p << " ";
4394 p << " : ";
4395 p << getDevice().getType();
4396 p << ", ";
4397 p << getInType();
4398 if (!getTypeparams().empty()) {
4399 p << '(' << getTypeparams() << " : " << getTypeparams().getTypes() << ')';
4400 }
4401 for (auto sh : getShape()) {
4402 p << ", ";
4403 p.printOperand(sh);
4404 }
4405 p.printOptionalAttrDict((*this)->getAttrs(),
4406 {"in_type", "operandSegmentSizes"});
4407}
4408
4409llvm::LogicalResult omp::TargetAllocMemOp::verify() {
4410 mlir::Type outType = getType();
4411 if (!mlir::dyn_cast<IntegerType>(outType))
4412 return emitOpError("must be a integer type");
4413 return mlir::success();
4414}
4415
4416//===----------------------------------------------------------------------===//
4417// WorkdistributeOp
4418//===----------------------------------------------------------------------===//
4419
4420LogicalResult WorkdistributeOp::verify() {
4421 // Check that region exists and is not empty
4422 Region &region = getRegion();
4423 if (region.empty())
4424 return emitOpError("region cannot be empty");
4425 // Verify single entry point.
4426 Block &entryBlock = region.front();
4427 if (entryBlock.empty())
4428 return emitOpError("region must contain a structured block");
4429 // Verify single exit point.
4430 bool hasTerminator = false;
4431 for (Block &block : region) {
4432 if (isa<TerminatorOp>(block.back())) {
4433 if (hasTerminator) {
4434 return emitOpError("region must have exactly one terminator");
4435 }
4436 hasTerminator = true;
4437 }
4438 }
4439 if (!hasTerminator) {
4440 return emitOpError("region must be terminated with omp.terminator");
4441 }
4442 auto walkResult = region.walk([&](Operation *op) -> WalkResult {
4443 // No implicit barrier at end
4444 if (isa<BarrierOp>(op)) {
4445 return emitOpError(
4446 "explicit barriers are not allowed in workdistribute region");
4447 }
4448 // Check for invalid nested constructs
4449 if (isa<ParallelOp>(op)) {
4450 return emitOpError(
4451 "nested parallel constructs not allowed in workdistribute");
4452 }
4453 if (isa<TeamsOp>(op)) {
4454 return emitOpError(
4455 "nested teams constructs not allowed in workdistribute");
4456 }
4457 return WalkResult::advance();
4458 });
4459 if (walkResult.wasInterrupted())
4460 return failure();
4461
4462 Operation *parentOp = (*this)->getParentOp();
4463 if (!llvm::dyn_cast<TeamsOp>(parentOp))
4464 return emitOpError("workdistribute must be nested under teams");
4465 return success();
4466}
4467
4468#define GET_ATTRDEF_CLASSES
4469#include "mlir/Dialect/OpenMP/OpenMPOpsAttributes.cpp.inc"
4470
4471#define GET_OP_CLASSES
4472#include "mlir/Dialect/OpenMP/OpenMPOps.cpp.inc"
4473
4474#define GET_TYPEDEF_CLASSES
4475#include "mlir/Dialect/OpenMP/OpenMPOpsTypes.cpp.inc"
static SmallVector< Value > getTileSizes(Location loc, amx::TileType tType, RewriterBase &rewriter)
Maps the 2-dim vector shape to the two 16-bit tile sizes.
return success()
p<< " : "<< getMemRefType()<< ", "<< getType();}static LogicalResult verifyVectorMemoryOp(Operation *op, MemRefType memrefType, VectorType vectorType) { if(memrefType.getElementType() !=vectorType.getElementType()) return op-> emitOpError("requires memref and vector types of the same elemental type")
Given a list of lists of parsed operands, populates uniqueOperands with unique operands.
static std::optional< int64_t > getUpperBound(Value iv)
Gets the constant upper bound on an affine.for iv.
static LogicalResult verifyRegion(emitc::SwitchOp op, Region &region, const Twine &name)
Definition EmitC.cpp:1400
static Type getElementType(Type type)
Determine the element type of type.
static ze_device_handle_t getDevice(const uint32_t driverIdx=0, const int32_t devIdx=0)
b
Return true if permutation is a valid permutation of the outer_dims_perm (case OuterOrInnerPerm::Oute...
ArrayAttr()
b getContext())
static const mlir::GenInfo * generator
static LogicalResult verifyNontemporalClause(Operation *op, OperandRange nontemporalVars)
static DenseI64ArrayAttr makeDenseI64ArrayAttr(MLIRContext *ctx, const ArrayRef< int64_t > intArray)
static constexpr StringRef getPrivateNeedsBarrierSpelling()
static LogicalResult verifyMapClause(Operation *op, OperandRange mapVars)
static LogicalResult verifyReductionVarList(Operation *op, std::optional< ArrayAttr > reductionSyms, OperandRange reductionVars, std::optional< ArrayRef< bool > > reductionByref)
Verifies Reduction Clause.
static ParseResult parseInReductionPrivateRegion(OpAsmParser &parser, Region &region, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &inReductionVars, SmallVectorImpl< Type > &inReductionTypes, DenseBoolArrayAttr &inReductionByref, ArrayAttr &inReductionSyms, llvm::SmallVectorImpl< OpAsmParser::UnresolvedOperand > &privateVars, llvm::SmallVectorImpl< Type > &privateTypes, ArrayAttr &privateSyms, UnitAttr &privateNeedsBarrier)
static ArrayAttr makeArrayAttr(MLIRContext *context, llvm::ArrayRef< Attribute > attrs)
static ParseResult parseClauseAttr(AsmParser &parser, ClauseAttr &attr)
static void printAllocateAndAllocator(OpAsmPrinter &p, Operation *op, OperandRange allocateVars, TypeRange allocateTypes, OperandRange allocatorVars, TypeRange allocatorTypes)
Print allocate clause.
static DenseBoolArrayAttr makeDenseBoolArrayAttr(MLIRContext *ctx, const ArrayRef< bool > boolArray)
static std::string generateLoopNestingName(StringRef prefix, CanonicalLoopOp op)
Generate a name of a canonical loop nest of the format <prefix>(_r<idx>_s<idx>)*.
static void printClauseWithRegionArgs(OpAsmPrinter &p, MLIRContext *ctx, StringRef clauseName, ValueRange argsSubrange, ValueRange operands, TypeRange types, ArrayAttr symbols=nullptr, DenseI64ArrayAttr mapIndices=nullptr, DenseBoolArrayAttr byref=nullptr, ReductionModifierAttr modifier=nullptr, UnitAttr needsBarrier=nullptr)
static void printBlockArgClause(OpAsmPrinter &p, MLIRContext *ctx, StringRef clauseName, ValueRange argsSubrange, std::optional< MapPrintArgs > mapArgs)
static void printBlockArgRegion(OpAsmPrinter &p, Operation *op, Region &region, const AllRegionPrintArgs &args)
static ParseResult parseGranularityClause(OpAsmParser &parser, ClauseTypeAttr &prescriptiveness, std::optional< OpAsmParser::UnresolvedOperand > &operand, Type &operandType, std::optional< ClauseType >(*symbolizeClause)(StringRef), StringRef clauseName)
static ParseResult parseBlockArgRegion(OpAsmParser &parser, Region &region, AllRegionParseArgs args)
static ParseResult parseLoopTransformClis(OpAsmParser &parser, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &generateesOperands, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &applyeesOperands)
static ParseResult parseSynchronizationHint(OpAsmParser &parser, IntegerAttr &hintAttr)
Parses a Synchronization Hint clause.
static ParseResult parseLinearClause(OpAsmParser &parser, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &linearVars, SmallVectorImpl< Type > &linearTypes, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &linearStepVars)
linear ::= linear ( linear-list ) linear-list := linear-val | linear-val linear-list linear-val := ss...
static void printScheduleClause(OpAsmPrinter &p, Operation *op, ClauseScheduleKindAttr scheduleKind, ScheduleModifierAttr scheduleMod, UnitAttr scheduleSimd, Value scheduleChunk, Type scheduleChunkType)
Print schedule clause.
static void printCopyprivate(OpAsmPrinter &p, Operation *op, OperandRange copyprivateVars, TypeRange copyprivateTypes, std::optional< ArrayAttr > copyprivateSyms)
Print Copyprivate clause.
static ParseResult parseOrderClause(OpAsmParser &parser, ClauseOrderKindAttr &order, OrderModifierAttr &orderMod)
static bool mapTypeToBool(ClauseMapFlags value, ClauseMapFlags flag)
static void printAlignedClause(OpAsmPrinter &p, Operation *op, ValueRange alignedVars, TypeRange alignedTypes, std::optional< ArrayAttr > alignments)
Print Aligned Clause.
static LogicalResult verifySynchronizationHint(Operation *op, uint64_t hint)
Verifies a synchronization hint clause.
static ParseResult parseUseDeviceAddrUseDevicePtrRegion(OpAsmParser &parser, Region &region, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &useDeviceAddrVars, SmallVectorImpl< Type > &useDeviceAddrTypes, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &useDevicePtrVars, SmallVectorImpl< Type > &useDevicePtrTypes)
static void printLinearClause(OpAsmPrinter &p, Operation *op, ValueRange linearVars, TypeRange linearTypes, ValueRange linearStepVars)
Print Linear Clause.
*attr dict without keyword *static mlir::ParseResult parseTargetAllocMemOp(mlir::OpAsmParser &parser, mlir::OperationState &result)
operation ::= res = (omp.target_alloc_mem) $device : devicetype, $in_type ( ( $typeparams ) )?...
static Operation * findCapturedOmpOp(Operation *rootOp, bool checkSingleMandatoryExec, llvm::function_ref< bool(Operation *)> siblingAllowedFn)
static void printInReductionPrivateReductionRegion(OpAsmPrinter &p, Operation *op, Region &region, ValueRange inReductionVars, TypeRange inReductionTypes, DenseBoolArrayAttr inReductionByref, ArrayAttr inReductionSyms, ValueRange privateVars, TypeRange privateTypes, ArrayAttr privateSyms, UnitAttr privateNeedsBarrier, ReductionModifierAttr reductionMod, ValueRange reductionVars, TypeRange reductionTypes, DenseBoolArrayAttr reductionByref, ArrayAttr reductionSyms)
static void printInReductionPrivateRegion(OpAsmPrinter &p, Operation *op, Region &region, ValueRange inReductionVars, TypeRange inReductionTypes, DenseBoolArrayAttr inReductionByref, ArrayAttr inReductionSyms, ValueRange privateVars, TypeRange privateTypes, ArrayAttr privateSyms, UnitAttr privateNeedsBarrier)
static void printSynchronizationHint(OpAsmPrinter &p, Operation *op, IntegerAttr hintAttr)
Prints a Synchronization Hint clause.
static void printGranularityClause(OpAsmPrinter &p, Operation *op, ClauseTypeAttr prescriptiveness, Value operand, mlir::Type operandType, StringRef(*stringifyClauseType)(ClauseType))
static void printDependVarList(OpAsmPrinter &p, Operation *op, OperandRange dependVars, TypeRange dependTypes, std::optional< ArrayAttr > dependKinds)
Print Depend clause.
static void printTargetOpRegion(OpAsmPrinter &p, Operation *op, Region &region, ValueRange hasDeviceAddrVars, TypeRange hasDeviceAddrTypes, ValueRange hostEvalVars, TypeRange hostEvalTypes, ValueRange inReductionVars, TypeRange inReductionTypes, DenseBoolArrayAttr inReductionByref, ArrayAttr inReductionSyms, ValueRange mapVars, TypeRange mapTypes, ValueRange privateVars, TypeRange privateTypes, ArrayAttr privateSyms, UnitAttr privateNeedsBarrier, DenseI64ArrayAttr privateMaps)
static Operation * getParentInSameDialect(Operation *thisOp)
static LogicalResult verifyCopyprivateVarList(Operation *op, OperandRange copyprivateVars, std::optional< ArrayAttr > copyprivateSyms)
Verifies CopyPrivate Clause.
static LogicalResult verifyAlignedClause(Operation *op, std::optional< ArrayAttr > alignments, OperandRange alignedVars)
static ParseResult parseTargetOpRegion(OpAsmParser &parser, Region &region, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &hasDeviceAddrVars, SmallVectorImpl< Type > &hasDeviceAddrTypes, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &hostEvalVars, SmallVectorImpl< Type > &hostEvalTypes, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &inReductionVars, SmallVectorImpl< Type > &inReductionTypes, DenseBoolArrayAttr &inReductionByref, ArrayAttr &inReductionSyms, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &mapVars, SmallVectorImpl< Type > &mapTypes, llvm::SmallVectorImpl< OpAsmParser::UnresolvedOperand > &privateVars, llvm::SmallVectorImpl< Type > &privateTypes, ArrayAttr &privateSyms, UnitAttr &privateNeedsBarrier, DenseI64ArrayAttr &privateMaps)
static ParseResult parsePrivateRegion(OpAsmParser &parser, Region &region, llvm::SmallVectorImpl< OpAsmParser::UnresolvedOperand > &privateVars, llvm::SmallVectorImpl< Type > &privateTypes, ArrayAttr &privateSyms, UnitAttr &privateNeedsBarrier)
static void printNumTasksClause(OpAsmPrinter &p, Operation *op, ClauseNumTasksTypeAttr numTasksMod, Value numTasks, mlir::Type numTasksType)
static void printLoopTransformClis(OpAsmPrinter &p, TileOp op, OperandRange generatees, OperandRange applyees)
static void printPrivateRegion(OpAsmPrinter &p, Operation *op, Region &region, ValueRange privateVars, TypeRange privateTypes, ArrayAttr privateSyms, UnitAttr privateNeedsBarrier)
static void printPrivateReductionRegion(OpAsmPrinter &p, Operation *op, Region &region, ValueRange privateVars, TypeRange privateTypes, ArrayAttr privateSyms, UnitAttr privateNeedsBarrier, ReductionModifierAttr reductionMod, ValueRange reductionVars, TypeRange reductionTypes, DenseBoolArrayAttr reductionByref, ArrayAttr reductionSyms)
static void printTaskReductionRegion(OpAsmPrinter &p, Operation *op, Region &region, ValueRange taskReductionVars, TypeRange taskReductionTypes, DenseBoolArrayAttr taskReductionByref, ArrayAttr taskReductionSyms)
return success()
static LogicalResult verifyOrderedParent(Operation &op)
static void printOrderClause(OpAsmPrinter &p, Operation *op, ClauseOrderKindAttr order, OrderModifierAttr orderMod)
static ParseResult parseBlockArgClause(OpAsmParser &parser, llvm::SmallVectorImpl< OpAsmParser::Argument > &entryBlockArgs, StringRef keyword, std::optional< MapParseArgs > mapArgs)
static ParseResult parseClauseWithRegionArgs(OpAsmParser &parser, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &operands, SmallVectorImpl< Type > &types, SmallVectorImpl< OpAsmParser::Argument > &regionPrivateArgs, ArrayAttr *symbols=nullptr, DenseI64ArrayAttr *mapIndices=nullptr, DenseBoolArrayAttr *byref=nullptr, ReductionModifierAttr *modifier=nullptr, UnitAttr *needsBarrier=nullptr)
static LogicalResult verifyPrivateVarsMapping(TargetOp targetOp)
static ParseResult parseScheduleClause(OpAsmParser &parser, ClauseScheduleKindAttr &scheduleAttr, ScheduleModifierAttr &scheduleMod, UnitAttr &scheduleSimd, std::optional< OpAsmParser::UnresolvedOperand > &chunkSize, Type &chunkType)
schedule ::= schedule ( sched-list ) sched-list ::= sched-val | sched-val sched-list | sched-val ,...
static void printClauseAttr(OpAsmPrinter &p, Operation *op, ClauseAttr attr)
static ParseResult parseAllocateAndAllocator(OpAsmParser &parser, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &allocateVars, SmallVectorImpl< Type > &allocateTypes, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &allocatorVars, SmallVectorImpl< Type > &allocatorTypes)
Parse an allocate clause with allocators and a list of operands with types.
static void printMembersIndex(OpAsmPrinter &p, MapInfoOp op, ArrayAttr membersIdx)
static bool canPromoteToNoLoop(Operation *capturedOp, TeamsOp teamsOp, WsloopOp *wsLoopOp)
Check if we can promote SPMD kernel to No-Loop kernel.
static void printCaptureType(OpAsmPrinter &p, Operation *op, VariableCaptureKindAttr mapCaptureType)
static bool opInGlobalImplicitParallelRegion(Operation *op)
static void printUseDeviceAddrUseDevicePtrRegion(OpAsmPrinter &p, Operation *op, Region &region, ValueRange useDeviceAddrVars, TypeRange useDeviceAddrTypes, ValueRange useDevicePtrVars, TypeRange useDevicePtrTypes)
static LogicalResult verifyPrivateVarList(OpType &op)
static ParseResult parseNumTasksClause(OpAsmParser &parser, ClauseNumTasksTypeAttr &numTasksMod, std::optional< OpAsmParser::UnresolvedOperand > &numTasks, Type &numTasksType)
static ParseResult parseAlignedClause(OpAsmParser &parser, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &alignedVars, SmallVectorImpl< Type > &alignedTypes, ArrayAttr &alignmentsAttr)
aligned ::= aligned ( aligned-list ) aligned-list := aligned-val | aligned-val aligned-list aligned-v...
static ParseResult parsePrivateReductionRegion(OpAsmParser &parser, Region &region, llvm::SmallVectorImpl< OpAsmParser::UnresolvedOperand > &privateVars, llvm::SmallVectorImpl< Type > &privateTypes, ArrayAttr &privateSyms, UnitAttr &privateNeedsBarrier, ReductionModifierAttr &reductionMod, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &reductionVars, SmallVectorImpl< Type > &reductionTypes, DenseBoolArrayAttr &reductionByref, ArrayAttr &reductionSyms)
static ParseResult parseInReductionPrivateReductionRegion(OpAsmParser &parser, Region &region, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &inReductionVars, SmallVectorImpl< Type > &inReductionTypes, DenseBoolArrayAttr &inReductionByref, ArrayAttr &inReductionSyms, llvm::SmallVectorImpl< OpAsmParser::UnresolvedOperand > &privateVars, llvm::SmallVectorImpl< Type > &privateTypes, ArrayAttr &privateSyms, UnitAttr &privateNeedsBarrier, ReductionModifierAttr &reductionMod, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &reductionVars, SmallVectorImpl< Type > &reductionTypes, DenseBoolArrayAttr &reductionByref, ArrayAttr &reductionSyms)
static ParseResult parseCaptureType(OpAsmParser &parser, VariableCaptureKindAttr &mapCaptureType)
static ParseResult parseTaskReductionRegion(OpAsmParser &parser, Region &region, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &taskReductionVars, SmallVectorImpl< Type > &taskReductionTypes, DenseBoolArrayAttr &taskReductionByref, ArrayAttr &taskReductionSyms)
static ParseResult parseGrainsizeClause(OpAsmParser &parser, ClauseGrainsizeTypeAttr &grainsizeMod, std::optional< OpAsmParser::UnresolvedOperand > &grainsize, Type &grainsizeType)
static ParseResult parseCopyprivate(OpAsmParser &parser, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &copyprivateVars, SmallVectorImpl< Type > &copyprivateTypes, ArrayAttr &copyprivateSyms)
copyprivate-entry-list ::= copyprivate-entry | copyprivate-entry-list , copyprivate-entry copyprivate...
static LogicalResult verifyDependVarList(Operation *op, std::optional< ArrayAttr > dependKinds, OperandRange dependVars)
Verifies Depend clause.
static ParseResult parseDependVarList(OpAsmParser &parser, SmallVectorImpl< OpAsmParser::UnresolvedOperand > &dependVars, SmallVectorImpl< Type > &dependTypes, ArrayAttr &dependKinds)
depend-entry-list ::= depend-entry | depend-entry-list , depend-entry depend-entry ::= depend-kind ->...
static LogicalResult verifyMapInfoDefinedArgs(Operation *op, StringRef clauseName, OperandRange vars)
static void printGrainsizeClause(OpAsmPrinter &p, Operation *op, ClauseGrainsizeTypeAttr grainsizeMod, Value grainsize, mlir::Type grainsizeType)
static ParseResult verifyScheduleModifiers(OpAsmParser &parser, SmallVectorImpl< SmallString< 12 > > &modifiers)
static bool isUnique(It begin, It end)
Definition ShardOps.cpp:161
static ArrayRef< int64_t > getShape(Type type)
Returns the shape of the given type.
Definition Traits.cpp:117
This base class exposes generic asm parser hooks, usable across the various derived parsers.
virtual ParseResult parseMinus()=0
Parse a '-' token.
@ Paren
Parens surrounding zero or more operands.
@ None
Zero or more operands with no delimiters.
virtual ParseResult parseColonTypeList(SmallVectorImpl< Type > &result)=0
Parse a colon followed by a type list, which must have at least one type.
virtual Builder & getBuilder() const =0
Return a builder which provides useful access to MLIRContext, global objects like types and attribute...
virtual ParseResult parseCommaSeparatedList(Delimiter delimiter, function_ref< ParseResult()> parseElementFn, StringRef contextMessage=StringRef())=0
Parse a list of comma-separated items with an optional delimiter.
virtual ParseResult parseOptionalAttrDict(NamedAttrList &result)=0
Parse a named dictionary into 'result' if it is present.
virtual ParseResult parseOptionalEqual()=0
Parse a = token if present.
virtual ParseResult parseOptionalKeyword(StringRef keyword)=0
Parse the given keyword if present.
MLIRContext * getContext() const
virtual ParseResult parseRParen()=0
Parse a ) token.
virtual InFlightDiagnostic emitError(SMLoc loc, const Twine &message={})=0
Emit a diagnostic at the specified location and return failure.
virtual ParseResult parseOptionalColon()=0
Parse a : token if present.
virtual ParseResult parseLSquare()=0
Parse a [ token.
virtual ParseResult parseRSquare()=0
Parse a ] token.
ParseResult parseInteger(IntT &result)
Parse an integer value from the stream.
virtual ParseResult parseOptionalArrow()=0
Parse a '->' token if present.
ParseResult addTypeToList(Type type, SmallVectorImpl< Type > &result)
Add the specified type to the end of the specified type list and return success.
virtual ParseResult parseLess()=0
Parse a '<' token.
virtual ParseResult parseEqual()=0
Parse a = token.
virtual ParseResult parseColonType(Type &result)=0
Parse a colon followed by a type.
virtual SMLoc getCurrentLocation()=0
Get the location of the next token and store it into the argument.
virtual ParseResult parseOptionalComma()=0
Parse a , token if present.
virtual ParseResult parseColon()=0
Parse a : token.
virtual SMLoc getNameLoc() const =0
Return the location of the original name token.
virtual ParseResult parseOptionalLess()=0
Parse a '<' token if present.
virtual ParseResult parseArrow()=0
Parse a '->' token.
virtual ParseResult parseLParen()=0
Parse a ( token.
virtual ParseResult parseType(Type &result)=0
Parse a type.
virtual ParseResult parseComma()=0
Parse a , token.
virtual ParseResult parseOptionalLParen()=0
Parse a ( token if present.
ParseResult parseKeyword(StringRef keyword)
Parse a given keyword.
Attributes are known-constant values of operations.
Definition Attributes.h:25
Block represents an ordered list of Operations.
Definition Block.h:33
ValueTypeRange< BlockArgListType > getArgumentTypes()
Return a range containing the types of the arguments for this block.
Definition Block.cpp:154
bool empty()
Definition Block.h:158
BlockArgument getArgument(unsigned i)
Definition Block.h:139
unsigned getNumArguments()
Definition Block.h:138
Operation & front()
Definition Block.h:163
SuccessorRange getSuccessors()
Definition Block.h:280
BlockArgListType getArguments()
Definition Block.h:97
DenseI32ArrayAttr getDenseI32ArrayAttr(ArrayRef< int32_t > values)
Definition Builders.cpp:163
IntegerType getI64Type()
Definition Builders.cpp:65
IntegerType getIntegerType(unsigned width)
Definition Builders.cpp:67
MLIRContext * getContext() const
Definition Builders.h:56
IndexType getIndexType()
Definition Builders.cpp:51
Attr getAttr(Args &&...args)
Get or construct an instance of the attribute Attr with provided arguments.
Definition Builders.h:98
Diagnostic & append(Arg1 &&arg1, Arg2 &&arg2, Args &&...args)
Append arguments to the diagnostic.
Diagnostic & appendOp(Operation &op, const OpPrintingFlags &flags)
Append an operation with the given printing flags.
Dialects are groups of MLIR operations, types and attributes, as well as behavior associated with the...
Definition Dialect.h:38
A class for computing basic dominance information.
Definition Dominance.h:140
bool dominates(Operation *a, Operation *b) const
Return true if operation A dominates operation B, i.e.
Definition Dominance.h:158
This class represents a diagnostic that is inflight and set to be reported.
Diagnostic & attachNote(std::optional< Location > noteLoc=std::nullopt)
Attaches a note to this diagnostic.
MLIRContext is the top-level object for a collection of MLIR operations.
Definition MLIRContext.h:63
The OpAsmParser has methods for interacting with the asm parser: parsing things from it,...
virtual ParseResult parseRegion(Region &region, ArrayRef< Argument > arguments={}, bool enableNameShadowing=false)=0
Parses a region.
virtual ParseResult parseArgument(Argument &result, bool allowType=false, bool allowAttrs=false)=0
Parse a single argument with the following syntax:
virtual ParseResult parseArgumentList(SmallVectorImpl< Argument > &result, Delimiter delimiter=Delimiter::None, bool allowType=false, bool allowAttrs=false)=0
Parse zero or more arguments with a specified surrounding delimiter.
virtual ParseResult resolveOperand(const UnresolvedOperand &operand, Type type, SmallVectorImpl< Value > &result)=0
Resolve an operand to an SSA value, emitting an error on failure.
ParseResult resolveOperands(Operands &&operands, Type type, SmallVectorImpl< Value > &result)
Resolve a list of operands to SSA values, emitting an error on failure, or appending the results to t...
virtual ParseResult parseOperand(UnresolvedOperand &result, bool allowResultNumber=true)=0
Parse a single SSA value operand name along with a result number if allowResultNumber is true.
virtual ParseResult parseOperandList(SmallVectorImpl< UnresolvedOperand > &result, Delimiter delimiter=Delimiter::None, bool allowResultNumber=true, int requiredOperandCount=-1)=0
Parse zero or more SSA comma-separated operand references with a specified surrounding delimiter,...
This is a pure-virtual base class that exposes the asmprinter hooks necessary to implement a custom p...
virtual void printOptionalAttrDict(ArrayRef< NamedAttribute > attrs, ArrayRef< StringRef > elidedAttrs={})=0
If the specified operation has attributes, print out an attribute dictionary with their values.
virtual void printRegion(Region &blocks, bool printEntryBlockArgs=true, bool printBlockTerminators=true, bool printEmptyBlock=false)=0
Prints a region.
virtual void printOperand(Value value)=0
Print implementations for various things an operation contains.
This class helps build Operations.
Definition Builders.h:207
This class represents an operand of an operation.
Definition Value.h:257
Set of flags used to control the behavior of the various IR print methods (e.g.
This class provides the API for ops that are known to be isolated from above.
This class provides the API for ops that are known to be terminators.
This class indicates that the regions associated with this op don't have terminators.
This class implements the operand iterators for the Operation class.
Definition ValueRange.h:43
Operation is the basic unit of execution within MLIR.
Definition Operation.h:88
Dialect * getDialect()
Return the dialect this operation is associated with, or nullptr if the associated dialect is not loa...
Definition Operation.h:220
Region & getRegion(unsigned index)
Returns the region held by this operation at position 'index'.
Definition Operation.h:686
bool hasTrait()
Returns true if the operation was registered with a particular trait, e.g.
Definition Operation.h:749
Block * getBlock()
Returns the operation block that contains this operation.
Definition Operation.h:213
unsigned getNumRegions()
Returns the number of regions held by this operation.
Definition Operation.h:674
Location getLoc()
The source location the operation was defined or derived from.
Definition Operation.h:223
Operation * getParentOp()
Returns the closest surrounding operation that contains this operation or nullptr if this is a top-le...
Definition Operation.h:234
InFlightDiagnostic emitError(const Twine &message={})
Emit an error about fatal conditions with this operation, reporting up to any diagnostic handlers tha...
OpTy getParentOfType()
Return the closest surrounding parent operation that is of type 'OpTy'.
Definition Operation.h:238
MutableArrayRef< Region > getRegions()
Returns the regions held by this operation.
Definition Operation.h:677
std::enable_if_t< llvm::function_traits< std::decay_t< FnT > >::num_args==1, RetT > walk(FnT &&callback)
Walk the operation by calling the callback for each nested operation (including this one),...
Definition Operation.h:797
user_range getUsers()
Returns a range of all users.
Definition Operation.h:873
Region * getParentRegion()
Returns the region to which the instruction belongs.
Definition Operation.h:230
MLIRContext * getContext()
Return the context this operation is associated with.
Definition Operation.h:216
InFlightDiagnostic emitOpError(const Twine &message={})
Emit an error with the op name prefixed, like "'dim' op " which is convenient for verifiers.
A special type of RewriterBase that coordinates the application of a rewrite pattern on the current I...
This class contains a list of basic blocks and a link to the parent operation it is attached to.
Definition Region.h:26
Block & front()
Definition Region.h:65
BlockArgListType getArguments()
Definition Region.h:81
OpIterator op_begin()
Return iterators that walk the operations nested directly within this region.
Definition Region.h:170
iterator_range< OpIterator > getOps()
Definition Region.h:172
bool empty()
Definition Region.h:60
unsigned getNumArguments()
Definition Region.h:123
Location getLoc()
Return a location for this region.
Definition Region.cpp:31
BlockArgument getArgument(unsigned i)
Definition Region.h:124
Operation * getParentOp()
Return the parent operation this region is attached to.
Definition Region.h:200
BlockListType & getBlocks()
Definition Region.h:45
virtual void eraseOp(Operation *op)
This method erases an operation that is known to have no uses.
OpTy replaceOpWithNewOp(Operation *op, Args &&...args)
Replace the results of the given (original) op with a new op that is created without verification (re...
Resource * getResource() const
Return the resource that the effect applies to.
EffectT * getEffect() const
Return the effect being applied.
This class represents a collection of SymbolTables.
virtual Operation * lookupNearestSymbolFrom(Operation *from, StringAttr symbol)
Returns the operation registered with the given symbol name within the closest parent operation of,...
static Operation * lookupNearestSymbolFrom(Operation *from, StringAttr symbol)
Returns the operation registered with the given symbol name within the closest parent operation of,...
This class provides an abstraction over the various different ranges of value types.
Definition TypeRange.h:37
Instances of the Type class are uniqued, have an immutable identifier and an optional mutable compone...
Definition Types.h:74
This class provides an abstraction over the different types of ranges over Values.
Definition ValueRange.h:387
type_range getType() const
This class represents an instance of an SSA value in the MLIR system, representing a computable value...
Definition Value.h:96
MLIRContext * getContext() const
Utility to get the associated MLIRContext that this value is defined in.
Definition Value.h:108
Type getType() const
Return the type of this value.
Definition Value.h:105
use_range getUses() const
Returns a range of all uses, which is useful for iterating over all uses.
Definition Value.h:188
Operation * getDefiningOp() const
If this value is the result of an operation, return the operation that defines it.
Definition Value.cpp:18
A utility result that is used to signal how to proceed with an ongoing walk:
Definition WalkResult.h:29
static WalkResult skip()
Definition WalkResult.h:48
static WalkResult advance()
Definition WalkResult.h:47
static WalkResult interrupt()
Definition WalkResult.h:46
static DenseArrayAttrImpl get(MLIRContext *context, ArrayRef< bool > content)
bool isReachableFromEntry(Block *a) const
Return true if the specified block is reachable from the entry block of its region.
Operation * getOwner() const
Return the owner of this operand.
Definition UseDefLists.h:38
SideEffects::EffectInstance< Effect > EffectInstance
bool isPerfectlyNested(ArrayRef< AffineForOp > loops)
Returns true if loops is a perfectly nested loop nest, where loops appear in it from outermost to inn...
TargetEnterDataOperands TargetEnterExitUpdateDataOperands
omp.target_enter_data, omp.target_exit_data and omp.target_update take the same clauses,...
std::tuple< NewCliOp, OpOperand *, OpOperand * > decodeCli(mlir::Value cli)
Find the omp.new_cli, generator, and consumer of a canonical loop info.
detail::InFlightRemark failed(Location loc, RemarkOpts opts)
Report an optimization remark that failed.
Definition Remarks.h:573
Include the generated interface declarations.
detail::DenseArrayAttrImpl< int64_t > DenseI64ArrayAttr
function_ref< void(Value, StringRef)> OpAsmSetValueNameFn
A functor used to set the name of the start of a result group of an operation.
Type getType(OpFoldResult ofr)
Returns the int type of the integer in ofr.
Definition Utils.cpp:304
llvm::DenseSet< ValueT, ValueInfoT > DenseSet
Definition LLVM.h:128
InFlightDiagnostic emitError(Location loc)
Utility method to emit an error message using this location.
llvm::TypeSwitch< T, ResultT > TypeSwitch
Definition LLVM.h:144
SmallVector< Loops, 8 > tile(ArrayRef< scf::ForOp > forOps, ArrayRef< Value > sizes, ArrayRef< scf::ForOp > targets)
Performs tiling fo imperfectly nested loops (with interchange) by strip-mining the forOps by sizes an...
Definition Utils.cpp:1293
detail::DenseArrayAttrImpl< bool > DenseBoolArrayAttr
function_ref< void(Block *, StringRef)> OpAsmSetBlockNameFn
A functor used to set the name of blocks in regions directly nested under an operation.
This is the representation of an operand reference.
This class provides APIs and verifiers for ops with regions having a single block.
This represents an operation in an abstracted form, suitable for use with the builder APIs.
void addOperands(ValueRange newOperands)
void addAttributes(ArrayRef< NamedAttribute > newAttributes)
Add an array of named attributes.
void addTypes(ArrayRef< Type > newTypes)
Region * addRegion()
Create a region that should be attached to the operation.