31 #include "llvm/ADT/APInt.h"
32 #include "llvm/ADT/DenseSet.h"
33 #include "llvm/ADT/STLExtras.h"
34 #include "llvm/ADT/SmallVector.h"
35 #include "llvm/Support/Casting.h"
39 #include <type_traits>
43 template <
typename SourceAxes,
typename TargetAxes>
45 const TargetAxes &targetAxes) {
46 return llvm::all_of(targetAxes, [&sourceAxes](
auto &targetAxis) {
47 return sourceAxes.contains(targetAxis);
62 if (sourceSharding.getPartialAxes().empty() &&
63 targetSharding.getPartialAxes().empty()) {
64 return {sourceShard, sourceSharding};
66 assert(targetSharding.getPartialAxes().empty() ||
67 (!sourceSharding.getPartialAxes().empty() &&
68 sourceSharding.getPartialType() == targetSharding.getPartialType()));
69 using Axis = std::decay_t<decltype(sourceSharding.getPartialAxes().front())>;
70 using AxisSet = llvm::SmallDenseSet<Axis>;
71 AxisSet sourceShardingPartialAxesSet(sourceSharding.getPartialAxes().begin(),
72 sourceSharding.getPartialAxes().end());
73 AxisSet targetShardingPartialAxesSet(targetSharding.getPartialAxes().begin(),
74 targetSharding.getPartialAxes().end());
76 targetShardingPartialAxesSet));
78 llvm::copy_if(sourceShardingPartialAxesSet,
79 std::back_inserter(allReduceMeshAxes),
80 [&targetShardingPartialAxesSet](Axis a) {
81 return !targetShardingPartialAxesSet.contains(a);
83 if (allReduceMeshAxes.empty()) {
84 return {sourceShard, sourceSharding};
90 .
create<AllReduceOp>(sourceShard.getLoc(), sourceShard.getType(),
91 sourceSharding.getMesh().getLeafReference(),
92 allReduceMeshAxes, sourceShard,
93 sourceSharding.getPartialType())
97 llvm::copy_if(sourceShardingPartialAxesSet,
98 std::back_inserter(allReduceMeshAxes),
99 [&targetShardingPartialAxesSet](Axis a) {
100 return targetShardingPartialAxesSet.contains(a);
104 sourceSharding.getSplitAxes(), remainingPartialAxes,
105 sourceSharding.getPartialType());
106 return {resultValue, resultSharding};
111 int64_t splitTensorAxis,
MeshAxis splitMeshAxis) {
113 llvm::to_vector(sourceSharding.getSplitAxes());
114 while (
static_cast<int64_t
>(targetShardingSplitAxes.size()) <=
118 auto targetSplitAxes =
119 llvm::to_vector(targetShardingSplitAxes[splitTensorAxis].asArrayRef());
120 targetSplitAxes.push_back(splitMeshAxis);
121 targetShardingSplitAxes[splitTensorAxis] =
124 ctx, sourceSharding.getMesh(), targetShardingSplitAxes,
125 sourceSharding.getPartialAxes(), sourceSharding.getPartialType());
135 int64_t splitTensorAxis,
MeshAxis splitMeshAxis) {
138 .
create<AllSliceOp>(sourceShard, mesh,
143 builder.
getContext(), sourceSharding, splitTensorAxis, splitMeshAxis);
144 return {targetShard, targetSharding};
152 static std::optional<std::tuple<int64_t, MeshAxis>>
155 for (
size_t tensorAxis = 0; tensorAxis < targetSharding.getSplitAxes().size();
157 if (sourceSharding.getSplitAxes().size() > tensorAxis) {
158 if (sourceSharding.getSplitAxes()[tensorAxis].size() + 1 !=
159 targetSharding.getSplitAxes()[tensorAxis].size()) {
163 sourceSharding.getSplitAxes()[tensorAxis].asArrayRef(),
165 targetSharding.getSplitAxes()[tensorAxis]
168 targetSharding.getSplitAxes()[tensorAxis].asArrayRef().end() -
173 if (targetSharding.getSplitAxes()[tensorAxis].size() != 1) {
177 return std::make_tuple(
179 targetSharding.getSplitAxes()[tensorAxis].asArrayRef().back());
191 auto [tensorAxis, meshAxis] = detectRes.value();
193 tensorAxis, meshAxis);
202 static std::optional<std::tuple<int64_t, MeshAxis>>
205 for (
size_t tensorAxis = 0; tensorAxis < sourceSharding.getSplitAxes().size();
207 if (targetSharding.getSplitAxes().size() > tensorAxis) {
208 if (sourceSharding.getSplitAxes()[tensorAxis].size() !=
209 targetSharding.getSplitAxes()[tensorAxis].size() + 1)
213 sourceSharding.getSplitAxes()[tensorAxis]
216 sourceSharding.getSplitAxes()[tensorAxis].asArrayRef().end() -
218 targetSharding.getSplitAxes()[tensorAxis].asArrayRef()))
221 if (sourceSharding.getSplitAxes()[tensorAxis].size() != 1)
224 return std::make_tuple(
226 sourceSharding.getSplitAxes()[tensorAxis].asArrayRef().back());
234 int64_t splitTensorAxis) {
236 llvm::to_vector(sourceSharding.getSplitAxes());
237 assert(
static_cast<int64_t
>(targetShardingSplitAxes.size()) >
239 auto targetSplitAxes =
240 llvm::to_vector(targetShardingSplitAxes[splitTensorAxis].asArrayRef());
242 targetSplitAxes.pop_back();
243 targetShardingSplitAxes[splitTensorAxis] =
246 ctx, sourceSharding.getMesh(), targetShardingSplitAxes,
247 sourceSharding.getPartialAxes(), sourceSharding.getPartialType());
251 ShapedType sourceShape, int64_t splitCount, int64_t splitTensorAxis) {
253 targetShape[splitTensorAxis] =
255 return sourceShape.cloneWith(targetShape, sourceShape.getElementType());
261 ShapedType sourceUnshardedShape,
263 int64_t splitTensorAxis,
MeshAxis splitMeshAxis) {
270 sourceShard.getType(), mesh.getShape()[splitMeshAxis], splitTensorAxis);
271 Value allGatherResult = builder.
create<AllGatherOp>(
273 allGatherResultShape.getElementType()),
275 APInt(64, splitTensorAxis));
276 ShapedType targetShape =
279 builder.
create<tensor::CastOp>(targetShape, allGatherResult).getResult());
280 return {targetShard, targetSharding};
287 ShapedType sourceUnshardedShape,
291 auto [tensorAxis, meshAxis] = detectRes.value();
293 sourceUnshardedShape, sourceShard, mesh,
294 tensorAxis, meshAxis);
305 static std::optional<std::tuple<int64_t, int64_t, MeshAxis>>
308 for (
size_t sourceTensorAxis = 0;
309 sourceTensorAxis < sourceSharding.getSplitAxes().size();
310 ++sourceTensorAxis) {
311 for (
size_t targetTensorAxis = 0;
312 targetTensorAxis < targetSharding.getSplitAxes().size();
313 ++targetTensorAxis) {
314 if (sourceTensorAxis == targetTensorAxis)
316 if (sourceSharding.getSplitAxes()[sourceTensorAxis].empty() ||
317 targetSharding.getSplitAxes()[targetTensorAxis].empty() ||
318 sourceSharding.getSplitAxes()[sourceTensorAxis].asArrayRef().back() !=
319 targetSharding.getSplitAxes()[targetTensorAxis]
324 llvm::make_range(sourceSharding.getSplitAxes()[sourceTensorAxis]
327 sourceSharding.getSplitAxes()[sourceTensorAxis]
331 llvm::make_range(targetSharding.getSplitAxes()[targetTensorAxis]
334 targetSharding.getSplitAxes()[targetTensorAxis]
339 return std::make_tuple(
340 sourceTensorAxis, targetTensorAxis,
341 sourceSharding.getSplitAxes()[sourceTensorAxis].asArrayRef().back());
349 int64_t sourceTensorAxis,
350 int64_t targetTensorAxis) {
352 llvm::to_vector(sourceSharding.getSplitAxes());
353 while (
static_cast<int64_t
>(targetShardingSplitAxes.size()) <=
358 auto sourceSplitAxes =
359 llvm::to_vector(targetShardingSplitAxes[sourceTensorAxis].asArrayRef());
360 assert(!sourceSplitAxes.empty());
361 auto meshAxis = sourceSplitAxes.back();
362 sourceSplitAxes.pop_back();
363 targetShardingSplitAxes[sourceTensorAxis] =
366 auto targetSplitAxes =
367 llvm::to_vector(targetShardingSplitAxes[targetTensorAxis].asArrayRef());
368 targetSplitAxes.push_back(meshAxis);
369 targetShardingSplitAxes[targetTensorAxis] =
373 ctx, sourceSharding.getMesh(), targetShardingSplitAxes,
374 sourceSharding.getPartialAxes(), sourceSharding.getPartialType());
379 int64_t sourceTensorAxis,
380 int64_t targetTensorAxis) {
382 targetShape[sourceTensorAxis] =
384 targetShape[targetTensorAxis] =
386 return sourceShape.cloneWith(targetShape, sourceShape.getElementType());
392 ShapedType sourceUnshardedShape,
394 int64_t sourceTensorAxis,
395 int64_t targetTensorAxis,
MeshAxis meshAxis) {
400 ctx, sourceSharding, sourceTensorAxis, targetTensorAxis);
402 sourceShard.getType(), mesh.getShape()[meshAxis], sourceTensorAxis,
406 allToAllResultShape.getElementType()),
408 APInt(64, targetTensorAxis), APInt(64, sourceTensorAxis));
409 ShapedType targetShape =
412 builder.
create<tensor::CastOp>(targetShape, allToAllResult).getResult());
413 return {targetShard, targetSharding};
420 ShapedType sourceUnshardedShape,
424 auto [sourceTensorAxis, targetTensorAxis, meshAxis] = detectRes.value();
426 builder, mesh, sourceSharding, sourceUnshardedShape, sourceShard,
427 sourceTensorAxis, targetTensorAxis, meshAxis);
442 assert(sourceShard.getType() ==
443 shardShapedType(sourceUnshardedValue.getType(), mesh, sourceSharding));
444 [[maybe_unused]] ShapedType targetShardType =
446 assert(sourceShard.getType().getRank() == targetShardType.getRank());
447 assert(mesh.getRank() == 1 &&
"Only 1D meshes are currently supported.");
449 auto [reducedSourceShard, reducedSourceSharding] =
453 if (reducedSourceSharding == targetSharding) {
454 return reducedSourceShard;
460 builder, mesh, reducedSourceSharding, targetSharding,
461 sourceUnshardedValue.
getType(), reducedSourceShard)) {
462 std::tie(targetShard, actualTargetSharding) = tryRes.value();
464 builder, mesh, reducedSourceSharding, targetSharding,
465 reducedSourceShard)) {
466 std::tie(targetShard, actualTargetSharding) = tryRes.value();
468 builder, mesh, reducedSourceSharding, targetSharding,
469 sourceUnshardedValue.
getType(), reducedSourceShard)) {
470 std::tie(targetShard, actualTargetSharding) = tryRes.value();
472 assert(
false &&
"Did not find any pattern to apply.");
475 assert(actualTargetSharding == targetSharding);
476 assert(targetShard.getType() == targetShardType);
489 sourceUnshardedValue, sourceShard);
495 assert(source.getResult() == target.getOperand());
498 implicitLocOpBuilder, mesh, source.getShard(), target.getShard(),
507 assert(srcMesh && srcMesh ==
getMesh(target, symbolTableCollection));
508 return reshard(builder, srcMesh, source, target, sourceShardValue);
512 registry.
insert<mesh::MeshDialect, tensor::TensorDialect>();
515 #define GEN_PASS_DEF_SPMDIZATION
516 #include "mlir/Dialect/Mesh/Transforms/Passes.h.inc"
530 auto rankedTensorArg = dyn_cast<TypedValue<RankedTensorType>>(arg);
531 if (!rankedTensorArg) {
532 return arg.getType();
535 assert(rankedTensorArg.hasOneUse());
537 ShardOp shardOp = llvm::dyn_cast<ShardOp>(useOp);
541 shardOp.getShardAttr()));
551 ShardingInterface shardingInterface = llvm::dyn_cast<ShardingInterface>(op);
552 if (!shardingInterface) {
556 resultShardings, spmdizationMap,
557 symbolTableCollection, builder);
559 if (failed(shardingInterface.spmdize(spmdizedOperands, operandShardings,
560 resultShardings, spmdizationMap,
561 symbolTableCollection, builder))) {
566 assert(llvm::all_of(op.getResults(), [&spmdizationMap](
OpResult result) {
567 return spmdizationMap.contains(result);
577 res.reserve(op.getNumOperands());
578 llvm::transform(op.getOperands(), std::back_inserter(res), [](
Value operand) {
579 TypedValue<RankedTensorType> rankedTensor =
580 dyn_cast<TypedValue<RankedTensorType>>(operand);
582 return MeshShardingAttr();
587 ShardOp shardOp = llvm::cast<ShardOp>(definingOp);
588 return shardOp.getShard();
597 res.reserve(op.getNumResults());
598 llvm::transform(op.getResults(), std::back_inserter(res),
600 TypedValue<RankedTensorType> rankedTensor =
601 dyn_cast<TypedValue<RankedTensorType>>(result);
603 return MeshShardingAttr();
608 ShardOp shardOp = llvm::cast<ShardOp>(userOp);
609 return shardOp.getShard();
618 Value targetSpmdValue;
623 dyn_cast_or_null<ShardOp>(shardOp.getOperand().getDefiningOp());
625 targetSpmdValue = spmdizationMap.
lookup(shardOp.getOperand());
629 spmdizationMap.
lookup(srcShardOp.getOperand()));
630 targetSpmdValue =
reshard(builder, srcShardOp, shardOp, srcSpmdValue,
631 symbolTableCollection);
634 assert(!spmdizationMap.
contains(shardOp.getResult()));
635 spmdizationMap.
map(shardOp.getResult(), targetSpmdValue);
643 ShardOp shardOp = llvm::dyn_cast<ShardOp>(op);
650 llvm::transform(op.getOperands(), std::back_inserter(spmdizedOperands),
651 [&spmdizationMap](
Value operand) {
652 assert(spmdizationMap.contains(operand));
653 return spmdizationMap.lookup(operand);
657 symbolTableCollection, builder);
664 llvm::transform(block.
getArguments(), std::back_inserter(argLocations),
669 for (
auto [unshardedBlockArg, spmdizedBlockArg] :
671 spmdizationMap.
map(unshardedBlockArg, spmdizedBlockArg);
694 llvm::transform(op.getBlocks(), std::back_inserter(originalBlocks),
695 [](
Block &b) { return &b; });
697 for (
Block *block : originalBlocks) {
698 if (failed(
spmdizeBlock(*block, spmdizationMap, symbolTableCollection,
704 for (
Block *block : originalBlocks) {
711 for (
Block &block : op.getFunctionBody()) {
717 returnOp = &block.back();
723 op.getFunctionBody().front().getArgumentTypes(),
731 struct Spmdization :
public impl::SpmdizationBase<Spmdization> {
732 void runOnOperation()
override {
736 symbolTableCollection))) {
737 return signalPassFailure();
741 void getDependentDialects(DialectRegistry ®istry)
const override {
743 registry.insert<mesh::MeshDialect>();
This class represents an argument of a Block.
Block represents an ordered list of Operations.
Region * getParent() const
Provide a 'getParent' method for ilist_node_with_parent methods.
OpListType & getOperations()
BlockArgListType getArguments()
Ty getType(Args &&...args)
Get or construct an instance of the type Ty with provided arguments.
MLIRContext * getContext() const
The DialectRegistry maps a dialect namespace to a constructor for the matching dialect.
This is a utility class for mapping one set of IR entities to another.
auto lookup(T from) const
Lookup a mapped value within the map.
void map(Value from, Value to)
Inserts a new mapping for 'from' to 'to'.
bool contains(T from) const
Checks to see if a mapping for 'from' exists.
ImplicitLocOpBuilder maintains a 'current location', allowing use of the create<> method without specifying the location parameter.
OpTy create(Args &&...args)
Create an operation of specific op type at the current insertion point and location.
MLIRContext is the top-level object for a collection of MLIR operations.
RAII guard to reset the insertion point of the builder when destroyed.
This class helps build Operations.
void setInsertionPointToEnd(Block *block)
Sets the insertion point to the end of the specified block.
Block * createBlock(Region *parent, Region::iterator insertPt={}, TypeRange argTypes=std::nullopt, ArrayRef< Location > locs=std::nullopt)
Add new block with 'argTypes' arguments and set the insertion point to the end of it.
void setInsertionPointAfterValue(Value val)
Sets the insertion point to the node after the specified value.
Operation * create(const OperationState &state)
Creates an operation given the fields represented as an OperationState.
This is a value defined by a result of an operation.
Operation is the basic unit of execution within MLIR.
operand_type_range getOperandTypes()
user_range getUsers()
Returns a range of all users.
This class represents a collection of SymbolTables.
This class represents an instance of an SSA value in the MLIR system, representing a computable value that has a type and a set of users.
user_range getUsers() const
bool hasOneUse() const
Returns true if this value has exactly one use.
Operation * getDefiningOp() const
If this value is the result of an operation, return the operation that defines it.
static DenseArrayAttrImpl get(MLIRContext *context, ArrayRef< T > content)
Builder from ArrayRef<T>.
mesh::MeshShardingAttr MeshShardingAttr
static LogicalResult spmdizeFuncOp(FunctionOpInterface op, IRMapping &spmdizationMap, SymbolTableCollection &symbolTableCollection)
SmallVector< Type > shardedBlockArgumentTypes(Block &block, SymbolTableCollection &symbolTableCollection)
static std::optional< std::tuple< int64_t, int64_t, MeshAxis > > detectMoveLastSplitAxisInResharding(MeshShardingAttr sourceSharding, MeshShardingAttr targetSharding)
static std::optional< std::tuple< TypedValue< ShapedType >, MeshShardingAttr > > tryMoveLastSplitAxisInResharding(ImplicitLocOpBuilder &builder, MeshOp mesh, MeshShardingAttr sourceSharding, MeshShardingAttr targetSharding, ShapedType sourceUnshardedShape, TypedValue< ShapedType > sourceShard)
static ShapedType allGatherResultShapeInUnsplitLastAxis(ShapedType sourceShape, int64_t splitCount, int64_t splitTensorAxis)
void spmdizeFullyReplicatedOperation(Operation &op, ArrayRef< Value > spmdizedOperands, ArrayRef< MeshShardingAttr > operandShardings, ArrayRef< MeshShardingAttr > resultShardings, IRMapping &spmdizationMap, SymbolTableCollection &symbolTable, OpBuilder &builder)
static std::tuple< TypedValue< ShapedType >, MeshShardingAttr > moveLastSplitAxisInResharding(ImplicitLocOpBuilder &builder, MeshOp mesh, MeshShardingAttr sourceSharding, ShapedType sourceUnshardedShape, TypedValue< ShapedType > sourceShard, int64_t sourceTensorAxis, int64_t targetTensorAxis, MeshAxis meshAxis)
static std::tuple< TypedValue< ShapedType >, MeshShardingAttr > handlePartialAxesDuringResharding(OpBuilder &builder, MeshShardingAttr sourceSharding, MeshShardingAttr targetSharding, TypedValue< ShapedType > sourceShard)
static std::optional< std::tuple< TypedValue< ShapedType >, MeshShardingAttr > > tryUnsplitLastAxisInResharding(ImplicitLocOpBuilder &builder, MeshOp mesh, MeshShardingAttr sourceSharding, MeshShardingAttr targetSharding, ShapedType sourceUnshardedShape, TypedValue< ShapedType > sourceShard)
static std::tuple< TypedValue< ShapedType >, MeshShardingAttr > unsplitLastAxisInResharding(ImplicitLocOpBuilder &builder, MeshShardingAttr sourceSharding, ShapedType sourceUnshardedShape, TypedValue< ShapedType > sourceShard, MeshOp mesh, int64_t splitTensorAxis, MeshAxis splitMeshAxis)
static ShapedType allToAllResultShapeInMoveLastAxis(ShapedType sourceShape, int64_t splitCount, int64_t sourceTensorAxis, int64_t targetTensorAxis)
static bool arePartialAxesCompatible(const SourceAxes &sourceAxes, const TargetAxes &targetAxes)
int64_t gatherDimension(int64_t dimSize, int64_t shardCount)
static std::optional< std::tuple< int64_t, MeshAxis > > detectUnsplitLastAxisInResharding(MeshShardingAttr sourceSharding, MeshShardingAttr targetSharding)
mesh::MeshOp getMesh(Operation *op, FlatSymbolRefAttr meshSymbol, SymbolTableCollection &symbolTableCollection)
static SmallVector< MeshShardingAttr > getOperandShardings(Operation &op)
int64_t shardDimension(int64_t dimSize, int64_t shardCount)
static MeshShardingAttr targetShardingInUnsplitLastAxis(MLIRContext *ctx, MeshShardingAttr sourceSharding, int64_t splitTensorAxis)
TypedValue< ShapedType > reshard(OpBuilder &builder, MeshOp mesh, ShardOp source, ShardOp target, TypedValue< ShapedType > sourceShardValue)
static std::tuple< TypedValue< ShapedType >, MeshShardingAttr > splitLastAxisInResharding(ImplicitLocOpBuilder &builder, MeshShardingAttr sourceSharding, TypedValue< ShapedType > sourceShard, MeshOp mesh, int64_t splitTensorAxis, MeshAxis splitMeshAxis)
static SmallVector< MeshShardingAttr > getResultShardings(Operation &op)
static std::optional< std::tuple< TypedValue< ShapedType >, MeshShardingAttr > > trySplitLastAxisInResharding(ImplicitLocOpBuilder &builder, MeshOp mesh, MeshShardingAttr sourceSharding, MeshShardingAttr targetSharding, TypedValue< ShapedType > sourceShard)
void reshardingRegisterDependentDialects(DialectRegistry &registry)
static std::optional< std::tuple< int64_t, MeshAxis > > detectSplitLastAxisInResharding(MeshShardingAttr sourceSharding, MeshShardingAttr targetSharding)
ShapedType shardShapedType(ShapedType shape, MeshOp mesh, MeshShardingAttr sharding)
TypedValue< ShapedType > reshard(ImplicitLocOpBuilder &builder, MeshOp mesh, MeshShardingAttr sourceSharding, MeshShardingAttr targetSharding, TypedValue< ShapedType > sourceUnshardedValue, TypedValue< ShapedType > sourceShard)
static TypedValue< ShapedType > reshardOn1DMesh(ImplicitLocOpBuilder &builder, MeshOp mesh, MeshShardingAttr sourceSharding, MeshShardingAttr targetSharding, TypedValue< ShapedType > sourceUnshardedValue, TypedValue< ShapedType > sourceShard)
static MeshShardingAttr targetShardingInMoveLastAxis(MLIRContext *ctx, MeshShardingAttr sourceSharding, int64_t sourceTensorAxis, int64_t targetTensorAxis)
static MeshShardingAttr targetShardingInSplitLastAxis(MLIRContext *ctx, MeshShardingAttr sourceSharding, int64_t splitTensorAxis, MeshAxis splitMeshAxis)
static LogicalResult spmdizeOperation(Operation &op, IRMapping &spmdizationMap, SymbolTableCollection &symbolTableCollection, OpBuilder &builder)
static LogicalResult spmdizeBlock(Block &block, IRMapping &spmdizationMap, SymbolTableCollection &symbolTableCollection, OpBuilder &builder)
std::conditional_t< std::is_same_v< Ty, mlir::Type >, mlir::Value, detail::TypedValue< Ty > > TypedValue
If Ty is mlir::Type this will select Value instead of having a wrapper around it.
auto get(MLIRContext *context, Ts &&...params)
Helper method that injects context only if needed; this helps unify some of the attribute construction methods.
This trait indicates that a terminator operation is "return-like".