doxygen/SerializeToBlob_8cpp_source.html

 //===- SerializeToBlob.cpp - MLIR GPU lowering pass -----------------------===//

 //

 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

 // See https://llvm.org/LICENSE.txt for license information.

 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

 //

 //===----------------------------------------------------------------------===//

 //

 // This file implements a base class for a pass to serialize a gpu module

 // into a binary blob that can be executed on a GPU. The binary blob is added

 // as a string attribute to the gpu module.

 //

 //===----------------------------------------------------------------------===//


 #include "mlir/Dialect/GPU/IR/GPUDialect.h"

 #include "mlir/Dialect/GPU/Transforms/Passes.h"

 #include "mlir/Dialect/LLVMIR/LLVMDialect.h"

 #include "mlir/ExecutionEngine/OptUtils.h"

 #include "mlir/Pass/Pass.h"

 #include "mlir/Target/LLVMIR/Dialect/GPU/GPUToLLVMIRTranslation.h"

 #include "mlir/Target/LLVMIR/Dialect/LLVMIR/LLVMToLLVMIRTranslation.h"

 #include "mlir/Target/LLVMIR/Export.h"

 #include "llvm/IR/LegacyPassManager.h"

 #include "llvm/MC/TargetRegistry.h"

 #include "llvm/Support/TargetSelect.h"

 #include "llvm/Target/TargetMachine.h"


 #include <optional>

 #include <string>


 #define DEBUG_TYPE "serialize-to-blob"


 using namespace mlir;


 /// Returns the default annotation name used for GPU binary blobs.
 std::string gpu::getDefaultGpuBinaryAnnotation() {
   return std::string("gpu.binary");
 }


 /// Constructs the pass by forwarding `passID` to the
 /// `OperationPass<gpu::GPUModuleOp>` base class.
 gpu::SerializeToBlobPass::SerializeToBlobPass(TypeID passID)
     : OperationPass<gpu::GPUModuleOp>(passID) {
 }


 /// Copy constructor: forwards `other` to the
 /// `OperationPass<gpu::GPUModuleOp>` base class copy constructor.
 gpu::SerializeToBlobPass::SerializeToBlobPass(const SerializeToBlobPass &other)
     : OperationPass<gpu::GPUModuleOp>(other) {
 }


 /// Optimizes `llvmModule` and emits it as an assembly file for
 /// `targetMachine`, returning the emitted text.
 ///
 /// The module's data layout is first replaced by the one created by
 /// `targetMachine`. Returns `std::nullopt` when `optimizeLlvm` fails or when
 /// `addPassesToEmitFile` reports (by returning true) that it could not set up
 /// the emission passes.
 std::optional<std::string>
 gpu::SerializeToBlobPass::translateToISA(llvm::Module &llvmModule,
                                          llvm::TargetMachine &targetMachine) {
   llvmModule.setDataLayout(targetMachine.createDataLayout());

   if (failed(optimizeLlvm(llvmModule, targetMachine)))
     return std::nullopt;

   std::string isaText;
   llvm::raw_string_ostream isaStream(isaText);

   {
     // The buffering stream lives in its own scope so that it is dropped
     // before the result is read; otherwise the ISA could stay stuck in the
     // buffer.
     llvm::buffer_ostream bufferedStream(isaStream);
     llvm::legacy::PassManager emitPasses;

     const bool cannotEmit = targetMachine.addPassesToEmitFile(
         emitPasses, bufferedStream, nullptr,
         llvm::CodeGenFileType::AssemblyFile);
     if (cannotEmit)
       return std::nullopt;

     emitPasses.run(llvmModule);
   }

   return isaStream.str();
 }


 void gpu::SerializeToBlobPass::runOnOperation() {

   // Lower the module to an LLVM IR module using a separate context to enable

   // multi-threaded processing.

   llvm::LLVMContext llvmContext;

   std::unique_ptr<llvm::Module> llvmModule = translateToLLVMIR(llvmContext);

   if (!llvmModule)

     return signalPassFailure();


   // Lower the LLVM IR module to target ISA.

   std::unique_ptr<llvm::TargetMachine> targetMachine = createTargetMachine();

   if (!targetMachine)

     return signalPassFailure();


   std::optional<std::string> maybeTargetISA =

       translateToISA(*llvmModule, *targetMachine);


   if (!maybeTargetISA.has_value())

     return signalPassFailure();


   std::string targetISA = std::move(*maybeTargetISA);


   LLVM_DEBUG({

     llvm::dbgs() << "ISA for module: " << getOperation().getNameAttr() << "\n";

     llvm::dbgs() << targetISA << "\n";

     llvm::dbgs().flush();

   });


   // Serialize the target ISA.

   std::unique_ptr<std::vector<char>> blob = serializeISA(targetISA);

   if (!blob)

     return signalPassFailure();


   // Add the blob as module attribute.

   auto attr =

       StringAttr::get(&getContext(), StringRef(blob->data(), blob->size()));

   getOperation()->setAttr(gpuBinaryAnnotation, attr);

 }


 /// Applies LLVM IR optimizations to `llvmModule` before code generation.
 ///
 /// Reads the pass's `optLevel` option; values outside [0, 3] produce an
 /// "invalid optimization level" error on the current operation. Otherwise the
 /// level is set on `targetMachine` and the transformer built by
 /// `makeOptimizingTransformer` is run on the module. Any error it returns is
 /// reported as an MLIR diagnostic on the current operation.
 ///
 /// Returns success when the transformer reports no error, failure otherwise.
 LogicalResult
 gpu::SerializeToBlobPass::optimizeLlvm(llvm::Module &llvmModule,
                                        llvm::TargetMachine &targetMachine) {
   int level = this->optLevel.getValue();
   const bool levelInRange = level >= 0 && level <= 3;
   if (!levelInRange)
     return getOperation().emitError()
            << "invalid optimization level " << level;

   targetMachine.setOptLevel(static_cast<llvm::CodeGenOptLevel>(level));

   auto optimize =
       makeOptimizingTransformer(level, /*sizeLevel=*/0, &targetMachine);
   auto optimizeError = optimize(&llvmModule);
   if (!optimizeError)
     return success();

   // Forward every LLVM error message into a single MLIR diagnostic.
   InFlightDiagnostic diagnostic = getOperation()->emitError();
   llvm::handleAllErrors(
       std::move(optimizeError),
       [&diagnostic](const llvm::ErrorInfoBase &info) {
         diagnostic << "could not optimize LLVM IR: " << info.message();
       });
   return diagnostic;
 }


 std::unique_ptr<llvm::TargetMachine>

 gpu::SerializeToBlobPass::createTargetMachine() {

   Location loc = getOperation().getLoc();

   std::string error;

   const llvm::Target *target =

       llvm::TargetRegistry::lookupTarget(triple, error);

   if (!target) {

     emitError(loc, Twine("failed to lookup target: ") + error);

     return {};

   }

   llvm::TargetMachine *machine =

       target->createTargetMachine(triple, chip, features, {}, {});

   if (!machine) {

     emitError(loc, "failed to create target machine");

     return {};

   }


   return std::unique_ptr<llvm::TargetMachine>{machine};

 }


 /// Translates the operation returned by `getOperation()` into an LLVM IR
 /// module named "LLVMDialectModule" that lives in `llvmContext`.
 ///
 /// Returns whatever `translateModuleToLLVMIR` returns; `runOnOperation`
 /// treats a null result as a failure.
 std::unique_ptr<llvm::Module>
 gpu::SerializeToBlobPass::translateToLLVMIR(llvm::LLVMContext &llvmContext) {
   const char *moduleName = "LLVMDialectModule";
   return translateModuleToLLVMIR(getOperation(), llvmContext, moduleName);
 }

Passes.h

Export.h

GPUDialect.h

GPUToLLVMIRTranslation.h

getContext
static MLIRContext * getContext(OpFoldResult val)
Definition: IndexingUtils.cpp:269

LLVMDialect.h

LLVMToLLVMIRTranslation.h

OptUtils.h

mlir::InFlightDiagnostic
This class represents a diagnostic that is inflight and set to be reported.
Definition: Diagnostics.h:308

mlir::Location
This class defines the main interface for locations in MLIR and acts as a non-nullable wrapper around...
Definition: Location.h:63

mlir::OperationPass
Pass to transform an operation of a specific type.
Definition: Pass.h:356

mlir::TypeID
This class provides an efficient unique identifier for a specific C++ type.
Definition: TypeID.h:104

mlir::gpu::SerializeToBlobPass
Base pass class to serialize kernel functions through LLVM into user-specified IR and add the resulti...
Definition: Passes.h:97

mlir::gpu::SerializeToBlobPass::runOnOperation
void runOnOperation() final
The polymorphic API that runs the pass over the currently held operation.
Definition: SerializeToBlob.cpp:67

mlir::gpu::SerializeToBlobPass::SerializeToBlobPass
SerializeToBlobPass(TypeID passID)
Definition: SerializeToBlob.cpp:37

mlir::gpu::SerializeToBlobPass::translateToLLVMIR
virtual std::unique_ptr< llvm::Module > translateToLLVMIR(llvm::LLVMContext &llvmContext)
Translates the 'getOperation()' result to an LLVM module.
Definition: SerializeToBlob.cpp:150

mlir::gpu::SerializeToBlobPass::optimizeLlvm
virtual LogicalResult optimizeLlvm(llvm::Module &llvmModule, llvm::TargetMachine &targetMachine)
Hook allowing the application of optimizations before codegen. By default, does nothing.
Definition: SerializeToBlob.cpp:106

Pass.h

mlir::gpu::getDefaultGpuBinaryAnnotation
std::string getDefaultGpuBinaryAnnotation()
Returns the default annotation name for GPU binary blobs.
Definition: SerializeToBlob.cpp:35

mlir
Include the generated interface declarations.
Definition: LocalAliasAnalysis.h:20

mlir::emitError
InFlightDiagnostic emitError(Location loc)
Utility method to emit an error message using this location.
Definition: Diagnostics.cpp:328

mlir::success
LogicalResult success(bool isSuccess=true)
Utility function to generate a LogicalResult.
Definition: LogicalResult.h:56

mlir::makeOptimizingTransformer
std::function< llvm::Error(llvm::Module *)> makeOptimizingTransformer(unsigned optLevel, unsigned sizeLevel, llvm::TargetMachine *targetMachine)
Create a module transformer function for MLIR ExecutionEngine that runs LLVM IR passes corresponding ...

mlir::get
auto get(MLIRContext *context, Ts &&...params)
Helper method that injects context only if needed, this helps unify some of the attribute constructio...
Definition: BytecodeImplementation.h:510

mlir::translateModuleToLLVMIR
std::unique_ptr< llvm::Module > translateModuleToLLVMIR(Operation *module, llvm::LLVMContext &llvmContext, llvm::StringRef name="LLVMDialectModule")
Translate operation that satisfies LLVM dialect module requirements into an LLVM IR module living in ...

mlir::failed
bool failed(LogicalResult result)
Utility function that returns true if the provided LogicalResult corresponds to a failure value.
Definition: LogicalResult.h:72

mlir::LogicalResult
This class represents an efficient way to signal success or failure.
Definition: LogicalResult.h:26