bolt/deps/llvm-18.1.8/mlir/lib/Conversion/GPUToSPIRV/GPUToSPIRVPass.cpp

//===- GPUToSPIRVPass.cpp - GPU to SPIR-V Passes --------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file implements a pass to convert a kernel function in the GPU Dialect
// into a spirv.module operation.
//
//===----------------------------------------------------------------------===//

#include "mlir/Conversion/GPUToSPIRV/GPUToSPIRVPass.h"

#include "mlir/Conversion/ArithToSPIRV/ArithToSPIRV.h"
#include "mlir/Conversion/FuncToSPIRV/FuncToSPIRV.h"
#include "mlir/Conversion/GPUToSPIRV/GPUToSPIRV.h"
#include "mlir/Conversion/MemRefToSPIRV/MemRefToSPIRV.h"
#include "mlir/Conversion/SCFToSPIRV/SCFToSPIRV.h"
#include "mlir/Dialect/Func/IR/FuncOps.h"
#include "mlir/Dialect/GPU/IR/GPUDialect.h"
#include "mlir/Dialect/SPIRV/IR/SPIRVDialect.h"
#include "mlir/Dialect/SPIRV/IR/SPIRVOps.h"
#include "mlir/Dialect/SPIRV/Transforms/SPIRVConversion.h"

namespace mlir {
#define GEN_PASS_DEF_CONVERTGPUTOSPIRV
#include "mlir/Conversion/Passes.h.inc"
} // namespace mlir

using namespace mlir;

namespace {
/// Pass to lower GPU Dialect to SPIR-V. The pass only converts the gpu.func ops
/// inside gpu.module ops. i.e., the function that are referenced in
/// gpu.launch_func ops. For each such function
///
/// 1) Create a spirv::ModuleOp, and clone the function into spirv::ModuleOp
/// (the original function is still needed by the gpu::LaunchKernelOp, so cannot
/// replace it).
///
/// 2) Lower the body of the spirv::ModuleOp.
struct GPUToSPIRVPass final : impl::ConvertGPUToSPIRVBase<GPUToSPIRVPass> {
  explicit GPUToSPIRVPass(bool mapMemorySpace)
      : mapMemorySpace(mapMemorySpace) {}
  void runOnOperation() override;

private:
  bool mapMemorySpace;
};

void GPUToSPIRVPass::runOnOperation() {
  MLIRContext *context = &getContext();
  ModuleOp module = getOperation();

  SmallVector<Operation *, 1> gpuModules;
  OpBuilder builder(context);

  auto targetEnvSupportsKernelCapability = [](gpu::GPUModuleOp moduleOp) {
    Operation *gpuModule = moduleOp.getOperation();
    auto targetAttr = spirv::lookupTargetEnvOrDefault(gpuModule);
    spirv::TargetEnv targetEnv(targetAttr);
    return targetEnv.allows(spirv::Capability::Kernel);
  };

  module.walk([&](gpu::GPUModuleOp moduleOp) {
    // Clone each GPU kernel module for conversion, given that the GPU
    // launch op still needs the original GPU kernel module.
    // For Vulkan Shader capabilities, we insert the newly converted SPIR-V
    // module right after the original GPU module, as that's the expectation of
    // the in-tree Vulkan runner.
    // For OpenCL Kernel capabilities, we insert the newly converted SPIR-V
    // module inside the original GPU module, as that's the expectaion of the
    // normal GPU compilation pipeline.
    if (targetEnvSupportsKernelCapability(moduleOp)) {
      builder.setInsertionPoint(moduleOp.getBody(),
                                moduleOp.getBody()->begin());
    } else {
      builder.setInsertionPoint(moduleOp.getOperation());
    }
    gpuModules.push_back(builder.clone(*moduleOp.getOperation()));
  });

  // Run conversion for each module independently as they can have different
  // TargetEnv attributes.
  for (Operation *gpuModule : gpuModules) {
    spirv::TargetEnvAttr targetAttr =
        spirv::lookupTargetEnvOrDefault(gpuModule);

    // Map MemRef memory space to SPIR-V storage class first if requested.
    if (mapMemorySpace) {
      std::unique_ptr<ConversionTarget> target =
          spirv::getMemorySpaceToStorageClassTarget(*context);
      spirv::MemorySpaceToStorageClassMap memorySpaceMap =
          targetEnvSupportsKernelCapability(
              dyn_cast<gpu::GPUModuleOp>(gpuModule))
              ? spirv::mapMemorySpaceToOpenCLStorageClass
              : spirv::mapMemorySpaceToVulkanStorageClass;
      spirv::MemorySpaceToStorageClassConverter converter(memorySpaceMap);

      RewritePatternSet patterns(context);
      spirv::populateMemorySpaceToStorageClassPatterns(converter, patterns);

      if (failed(applyFullConversion(gpuModule, *target, std::move(patterns))))
        return signalPassFailure();
    }

    std::unique_ptr<ConversionTarget> target =
        SPIRVConversionTarget::get(targetAttr);

    SPIRVConversionOptions options;
    options.use64bitIndex = this->use64bitIndex;
    SPIRVTypeConverter typeConverter(targetAttr, options);
    populateMMAToSPIRVCoopMatrixTypeConversion(typeConverter);

    RewritePatternSet patterns(context);
    populateGPUToSPIRVPatterns(typeConverter, patterns);
    populateGpuWMMAToSPIRVCoopMatrixKHRConversionPatterns(typeConverter,
                                                          patterns);

    // TODO: Change SPIR-V conversion to be progressive and remove the following
    // patterns.
    ScfToSPIRVContext scfContext;
    populateSCFToSPIRVPatterns(typeConverter, scfContext, patterns);
    mlir::arith::populateArithToSPIRVPatterns(typeConverter, patterns);
    populateMemRefToSPIRVPatterns(typeConverter, patterns);
    populateFuncToSPIRVPatterns(typeConverter, patterns);

    if (failed(applyFullConversion(gpuModule, *target, std::move(patterns))))
      return signalPassFailure();
  }

  // For OpenCL, the gpu.func op in the original gpu.module op needs to be
  // replaced with an empty func.func op with the same arguments as the gpu.func
  // op. The func.func op needs gpu.kernel attribute set.
  module.walk([&](gpu::GPUModuleOp moduleOp) {
    if (targetEnvSupportsKernelCapability(moduleOp)) {
      moduleOp.walk([&](gpu::GPUFuncOp funcOp) {
        builder.setInsertionPoint(funcOp);
        auto newFuncOp = builder.create<func::FuncOp>(
            funcOp.getLoc(), funcOp.getName(), funcOp.getFunctionType());
        auto entryBlock = newFuncOp.addEntryBlock();
        builder.setInsertionPointToEnd(entryBlock);
        builder.create<func::ReturnOp>(funcOp.getLoc());
        newFuncOp->setAttr(gpu::GPUDialect::getKernelFuncAttrName(),
                           builder.getUnitAttr());
        funcOp.erase();
      });
    }
  });
}

} // namespace

std::unique_ptr<OperationPass<ModuleOp>>
mlir::createConvertGPUToSPIRVPass(bool mapMemorySpace) {
  return std::make_unique<GPUToSPIRVPass>(mapMemorySpace);
}
Embed LLVM 18.1.8 2025-02-14 19:21:04 +01:00			`//===- GPUToSPIRVPass.cpp - GPU to SPIR-V Passes --------------------------===//`
			`//`
			`// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.`
			`// See https://llvm.org/LICENSE.txt for license information.`
			`// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception`
			`//`
			`//===----------------------------------------------------------------------===//`
			`//`
			`// This file implements a pass to convert a kernel function in the GPU Dialect`
			`// into a spirv.module operation.`
			`//`
			`//===----------------------------------------------------------------------===//`

			`#include "mlir/Conversion/GPUToSPIRV/GPUToSPIRVPass.h"`

			`#include "mlir/Conversion/ArithToSPIRV/ArithToSPIRV.h"`
			`#include "mlir/Conversion/FuncToSPIRV/FuncToSPIRV.h"`
			`#include "mlir/Conversion/GPUToSPIRV/GPUToSPIRV.h"`
			`#include "mlir/Conversion/MemRefToSPIRV/MemRefToSPIRV.h"`
			`#include "mlir/Conversion/SCFToSPIRV/SCFToSPIRV.h"`
			`#include "mlir/Dialect/Func/IR/FuncOps.h"`
			`#include "mlir/Dialect/GPU/IR/GPUDialect.h"`
			`#include "mlir/Dialect/SPIRV/IR/SPIRVDialect.h"`
			`#include "mlir/Dialect/SPIRV/IR/SPIRVOps.h"`
			`#include "mlir/Dialect/SPIRV/Transforms/SPIRVConversion.h"`

			`namespace mlir {`
			`#define GEN_PASS_DEF_CONVERTGPUTOSPIRV`
			`#include "mlir/Conversion/Passes.h.inc"`
			`} // namespace mlir`

			`using namespace mlir;`

			`namespace {`
			`/// Pass to lower GPU Dialect to SPIR-V. The pass only converts the gpu.func ops`
			`/// inside gpu.module ops. i.e., the function that are referenced in`
			`/// gpu.launch_func ops. For each such function`
			`///`
			`/// 1) Create a spirv::ModuleOp, and clone the function into spirv::ModuleOp`
			`/// (the original function is still needed by the gpu::LaunchKernelOp, so cannot`
			`/// replace it).`
			`///`
			`/// 2) Lower the body of the spirv::ModuleOp.`
			`struct GPUToSPIRVPass final : impl::ConvertGPUToSPIRVBase<GPUToSPIRVPass> {`
			`explicit GPUToSPIRVPass(bool mapMemorySpace)`
			`: mapMemorySpace(mapMemorySpace) {}`
			`void runOnOperation() override;`

			`private:`
			`bool mapMemorySpace;`
			`};`

			`void GPUToSPIRVPass::runOnOperation() {`
			`MLIRContext *context = &getContext();`
			`ModuleOp module = getOperation();`

			`SmallVector<Operation *, 1> gpuModules;`
			`OpBuilder builder(context);`

			`auto targetEnvSupportsKernelCapability = [](gpu::GPUModuleOp moduleOp) {`
			`Operation *gpuModule = moduleOp.getOperation();`
			`auto targetAttr = spirv::lookupTargetEnvOrDefault(gpuModule);`
			`spirv::TargetEnv targetEnv(targetAttr);`
			`return targetEnv.allows(spirv::Capability::Kernel);`
			`};`

			`module.walk([&](gpu::GPUModuleOp moduleOp) {`
			`// Clone each GPU kernel module for conversion, given that the GPU`
			`// launch op still needs the original GPU kernel module.`
			`// For Vulkan Shader capabilities, we insert the newly converted SPIR-V`
			`// module right after the original GPU module, as that's the expectation of`
			`// the in-tree Vulkan runner.`
			`// For OpenCL Kernel capabilities, we insert the newly converted SPIR-V`
			`// module inside the original GPU module, as that's the expectaion of the`
			`// normal GPU compilation pipeline.`
			`if (targetEnvSupportsKernelCapability(moduleOp)) {`
			`builder.setInsertionPoint(moduleOp.getBody(),`
			`moduleOp.getBody()->begin());`
			`} else {`
			`builder.setInsertionPoint(moduleOp.getOperation());`
			`}`
			`gpuModules.push_back(builder.clone(*moduleOp.getOperation()));`
			`});`

			`// Run conversion for each module independently as they can have different`
			`// TargetEnv attributes.`
			`for (Operation *gpuModule : gpuModules) {`
			`spirv::TargetEnvAttr targetAttr =`
			`spirv::lookupTargetEnvOrDefault(gpuModule);`

			`// Map MemRef memory space to SPIR-V storage class first if requested.`
			`if (mapMemorySpace) {`
			`std::unique_ptr<ConversionTarget> target =`
			`spirv::getMemorySpaceToStorageClassTarget(*context);`
			`spirv::MemorySpaceToStorageClassMap memorySpaceMap =`
			`targetEnvSupportsKernelCapability(`
			`dyn_cast<gpu::GPUModuleOp>(gpuModule))`
			`? spirv::mapMemorySpaceToOpenCLStorageClass`
			`: spirv::mapMemorySpaceToVulkanStorageClass;`
			`spirv::MemorySpaceToStorageClassConverter converter(memorySpaceMap);`

			`RewritePatternSet patterns(context);`
			`spirv::populateMemorySpaceToStorageClassPatterns(converter, patterns);`

			`if (failed(applyFullConversion(gpuModule, *target, std::move(patterns))))`
			`return signalPassFailure();`
			`}`

			`std::unique_ptr<ConversionTarget> target =`
			`SPIRVConversionTarget::get(targetAttr);`

			`SPIRVConversionOptions options;`
			`options.use64bitIndex = this->use64bitIndex;`
			`SPIRVTypeConverter typeConverter(targetAttr, options);`
			`populateMMAToSPIRVCoopMatrixTypeConversion(typeConverter);`

			`RewritePatternSet patterns(context);`
			`populateGPUToSPIRVPatterns(typeConverter, patterns);`
			`populateGpuWMMAToSPIRVCoopMatrixKHRConversionPatterns(typeConverter,`
			`patterns);`

			`// TODO: Change SPIR-V conversion to be progressive and remove the following`
			`// patterns.`
			`ScfToSPIRVContext scfContext;`
			`populateSCFToSPIRVPatterns(typeConverter, scfContext, patterns);`
			`mlir::arith::populateArithToSPIRVPatterns(typeConverter, patterns);`
			`populateMemRefToSPIRVPatterns(typeConverter, patterns);`
			`populateFuncToSPIRVPatterns(typeConverter, patterns);`

			`if (failed(applyFullConversion(gpuModule, *target, std::move(patterns))))`
			`return signalPassFailure();`
			`}`

			`// For OpenCL, the gpu.func op in the original gpu.module op needs to be`
			`// replaced with an empty func.func op with the same arguments as the gpu.func`
			`// op. The func.func op needs gpu.kernel attribute set.`
			`module.walk([&](gpu::GPUModuleOp moduleOp) {`
			`if (targetEnvSupportsKernelCapability(moduleOp)) {`
			`moduleOp.walk([&](gpu::GPUFuncOp funcOp) {`
			`builder.setInsertionPoint(funcOp);`
			`auto newFuncOp = builder.create<func::FuncOp>(`
			`funcOp.getLoc(), funcOp.getName(), funcOp.getFunctionType());`
			`auto entryBlock = newFuncOp.addEntryBlock();`
			`builder.setInsertionPointToEnd(entryBlock);`
			`builder.create<func::ReturnOp>(funcOp.getLoc());`
			`newFuncOp->setAttr(gpu::GPUDialect::getKernelFuncAttrName(),`
			`builder.getUnitAttr());`
			`funcOp.erase();`
			`});`
			`}`
			`});`
			`}`

			`} // namespace`

			`std::unique_ptr<OperationPass<ModuleOp>>`
			`mlir::createConvertGPUToSPIRVPass(bool mapMemorySpace) {`
			`return std::make_unique<GPUToSPIRVPass>(mapMemorySpace);`
			`}`