
The front-end and backend already default to code object version 6 (COV6); this PR makes the same change for MLIR. Note that COV6 requires ROCm 6.3 or newer.
277 lines
10 KiB
C++
277 lines
10 KiB
C++
//===- SerializeROCDLTarget.cpp ---------------------------------*- C++ -*-===//
|
|
//
|
|
// This file is licensed under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "mlir/Dialect/GPU/IR/GPUDialect.h"
|
|
#include "mlir/Dialect/LLVMIR/ROCDLDialect.h"
|
|
#include "mlir/IR/MLIRContext.h"
|
|
#include "mlir/InitAllDialects.h"
|
|
#include "mlir/Parser/Parser.h"
|
|
#include "mlir/Target/LLVM/ROCDL/Target.h"
|
|
#include "mlir/Target/LLVM/ROCDL/Utils.h"
|
|
#include "mlir/Target/LLVMIR/Dialect/Builtin/BuiltinToLLVMIRTranslation.h"
|
|
#include "mlir/Target/LLVMIR/Dialect/GPU/GPUToLLVMIRTranslation.h"
|
|
#include "mlir/Target/LLVMIR/Dialect/LLVMIR/LLVMToLLVMIRTranslation.h"
|
|
#include "mlir/Target/LLVMIR/Dialect/ROCDL/ROCDLToLLVMIRTranslation.h"
|
|
|
|
#include "llvm/IRReader/IRReader.h"
|
|
#include "llvm/Support/FileSystem.h"
|
|
#include "llvm/Support/MemoryBufferRef.h"
|
|
#include "llvm/Support/Path.h"
|
|
#include "llvm/Support/TargetSelect.h"
|
|
#include "llvm/Support/raw_ostream.h"
|
|
#include "llvm/TargetParser/Host.h"
|
|
|
|
#include "gmock/gmock.h"
|
|
|
|
using namespace mlir;
|
|
|
|
// Wraps a test name so that the test is disabled (through GoogleTest's
// `DISABLED_` name prefix) unless MLIR_ENABLE_ROCM_CONVERSIONS is set, i.e.
// unless the AMDGPU target was built.
#if !MLIR_ENABLE_ROCM_CONVERSIONS
#define SKIP_WITHOUT_AMDGPU(x) DISABLED_##x
#else
#define SKIP_WITHOUT_AMDGPU(x) x
#endif
|
|
|
|
class MLIRTargetLLVMROCDL : public ::testing::Test {
|
|
protected:
|
|
void SetUp() override {
|
|
registerBuiltinDialectTranslation(registry);
|
|
registerLLVMDialectTranslation(registry);
|
|
registerGPUDialectTranslation(registry);
|
|
registerROCDLDialectTranslation(registry);
|
|
ROCDL::registerROCDLTargetInterfaceExternalModels(registry);
|
|
}
|
|
|
|
// Checks if a ROCm installation is available.
|
|
bool hasROCMTools() {
|
|
StringRef rocmPath = ROCDL::getROCMPath();
|
|
if (rocmPath.empty())
|
|
return false;
|
|
llvm::SmallString<128> lldPath(rocmPath);
|
|
llvm::sys::path::append(lldPath, "llvm", "bin", "ld.lld");
|
|
return llvm::sys::fs::can_execute(lldPath);
|
|
}
|
|
|
|
// Dialect registry.
|
|
DialectRegistry registry;
|
|
|
|
// MLIR module used for the tests.
|
|
const std::string moduleStr = R"mlir(
|
|
gpu.module @rocdl_test {
|
|
llvm.func @rocdl_kernel(%arg0: f32) attributes {gpu.kernel, rocdl.kernel} {
|
|
llvm.return
|
|
}
|
|
})mlir";
|
|
};
|
|
|
|
// Test ROCDL serialization to LLVM.
|
|
TEST_F(MLIRTargetLLVMROCDL, SKIP_WITHOUT_AMDGPU(SerializeROCDLToLLVM)) {
|
|
MLIRContext context(registry);
|
|
|
|
OwningOpRef<ModuleOp> module =
|
|
parseSourceString<ModuleOp>(moduleStr, &context);
|
|
ASSERT_TRUE(!!module);
|
|
|
|
// Create a ROCDL target.
|
|
ROCDL::ROCDLTargetAttr target = ROCDL::ROCDLTargetAttr::get(&context);
|
|
|
|
// Serialize the module.
|
|
auto serializer = dyn_cast<gpu::TargetAttrInterface>(target);
|
|
ASSERT_TRUE(!!serializer);
|
|
gpu::TargetOptions options("", {}, "", "", gpu::CompilationTarget::Offload);
|
|
for (auto gpuModule : (*module).getBody()->getOps<gpu::GPUModuleOp>()) {
|
|
std::optional<SmallVector<char, 0>> object =
|
|
serializer.serializeToObject(gpuModule, options);
|
|
// Check that the serializer was successful.
|
|
ASSERT_TRUE(object != std::nullopt);
|
|
ASSERT_TRUE(!object->empty());
|
|
|
|
// Read the serialized module.
|
|
llvm::MemoryBufferRef buffer(StringRef(object->data(), object->size()),
|
|
"module");
|
|
llvm::LLVMContext llvmContext;
|
|
llvm::Expected<std::unique_ptr<llvm::Module>> llvmModule =
|
|
llvm::getLazyBitcodeModule(buffer, llvmContext);
|
|
ASSERT_TRUE(!!llvmModule);
|
|
ASSERT_TRUE(!!*llvmModule);
|
|
|
|
// Check that it has a function named `foo`.
|
|
ASSERT_TRUE((*llvmModule)->getFunction("rocdl_kernel") != nullptr);
|
|
}
|
|
}
|
|
// Test ROCDL serialization to ISA with default code object version.
|
|
TEST_F(MLIRTargetLLVMROCDL,
|
|
SKIP_WITHOUT_AMDGPU(SerializeROCDLToISAWithDefaultCOV)) {
|
|
MLIRContext context(registry);
|
|
|
|
OwningOpRef<ModuleOp> module =
|
|
parseSourceString<ModuleOp>(moduleStr, &context);
|
|
ASSERT_TRUE(!!module);
|
|
|
|
// Create a ROCDL target.
|
|
ROCDL::ROCDLTargetAttr target = ROCDL::ROCDLTargetAttr::get(&context);
|
|
|
|
// Serialize the module.
|
|
auto serializer = dyn_cast<gpu::TargetAttrInterface>(target);
|
|
ASSERT_TRUE(!!serializer);
|
|
gpu::TargetOptions options("", {}, "", "", gpu::CompilationTarget::Assembly);
|
|
for (auto gpuModule : (*module).getBody()->getOps<gpu::GPUModuleOp>()) {
|
|
std::optional<SmallVector<char, 0>> object =
|
|
serializer.serializeToObject(gpuModule, options);
|
|
// Check that the serializer was successful.
|
|
EXPECT_TRUE(StringRef(object->data(), object->size())
|
|
.contains(".amdhsa_code_object_version 6"));
|
|
}
|
|
}
|
|
|
|
// Test ROCDL serialization to ISA with non-default code object version.
|
|
TEST_F(MLIRTargetLLVMROCDL,
|
|
SKIP_WITHOUT_AMDGPU(SerializeROCDLToISAWithNonDefaultCOV)) {
|
|
MLIRContext context(registry);
|
|
|
|
OwningOpRef<ModuleOp> module =
|
|
parseSourceString<ModuleOp>(moduleStr, &context);
|
|
ASSERT_TRUE(!!module);
|
|
|
|
// Create a ROCDL target.
|
|
ROCDL::ROCDLTargetAttr target = ROCDL::ROCDLTargetAttr::get(
|
|
&context, 2, "amdgcn-amd-amdhsa", "gfx900", "", "400");
|
|
|
|
// Serialize the module.
|
|
auto serializer = dyn_cast<gpu::TargetAttrInterface>(target);
|
|
ASSERT_TRUE(!!serializer);
|
|
gpu::TargetOptions options("", {}, "", "", gpu::CompilationTarget::Assembly);
|
|
for (auto gpuModule : (*module).getBody()->getOps<gpu::GPUModuleOp>()) {
|
|
std::optional<SmallVector<char, 0>> object =
|
|
serializer.serializeToObject(gpuModule, options);
|
|
// Check that the serializer was successful.
|
|
EXPECT_TRUE(StringRef(object->data(), object->size())
|
|
.contains(".amdhsa_code_object_version 4"));
|
|
}
|
|
}
|
|
|
|
// Test ROCDL serialization to PTX.
|
|
TEST_F(MLIRTargetLLVMROCDL, SKIP_WITHOUT_AMDGPU(SerializeROCDLToPTX)) {
|
|
MLIRContext context(registry);
|
|
|
|
OwningOpRef<ModuleOp> module =
|
|
parseSourceString<ModuleOp>(moduleStr, &context);
|
|
ASSERT_TRUE(!!module);
|
|
|
|
// Create a ROCDL target.
|
|
ROCDL::ROCDLTargetAttr target = ROCDL::ROCDLTargetAttr::get(&context);
|
|
|
|
// Serialize the module.
|
|
auto serializer = dyn_cast<gpu::TargetAttrInterface>(target);
|
|
ASSERT_TRUE(!!serializer);
|
|
gpu::TargetOptions options("", {}, "", "", gpu::CompilationTarget::Assembly);
|
|
for (auto gpuModule : (*module).getBody()->getOps<gpu::GPUModuleOp>()) {
|
|
std::optional<SmallVector<char, 0>> object =
|
|
serializer.serializeToObject(gpuModule, options);
|
|
// Check that the serializer was successful.
|
|
ASSERT_TRUE(object != std::nullopt);
|
|
ASSERT_TRUE(!object->empty());
|
|
|
|
ASSERT_TRUE(
|
|
StringRef(object->data(), object->size()).contains("rocdl_kernel"));
|
|
}
|
|
}
|
|
|
|
// Test ROCDL serialization to Binary.
|
|
TEST_F(MLIRTargetLLVMROCDL, SKIP_WITHOUT_AMDGPU(SerializeROCDLToBinary)) {
|
|
if (!hasROCMTools())
|
|
GTEST_SKIP() << "ROCm installation not found, skipping test.";
|
|
|
|
MLIRContext context(registry);
|
|
|
|
OwningOpRef<ModuleOp> module =
|
|
parseSourceString<ModuleOp>(moduleStr, &context);
|
|
ASSERT_TRUE(!!module);
|
|
|
|
// Create a ROCDL target.
|
|
ROCDL::ROCDLTargetAttr target = ROCDL::ROCDLTargetAttr::get(&context);
|
|
|
|
// Serialize the module.
|
|
auto serializer = dyn_cast<gpu::TargetAttrInterface>(target);
|
|
ASSERT_TRUE(!!serializer);
|
|
gpu::TargetOptions options("", {}, "", "", gpu::CompilationTarget::Binary);
|
|
for (auto gpuModule : (*module).getBody()->getOps<gpu::GPUModuleOp>()) {
|
|
std::optional<SmallVector<char, 0>> object =
|
|
serializer.serializeToObject(gpuModule, options);
|
|
// Check that the serializer was successful.
|
|
ASSERT_TRUE(object != std::nullopt);
|
|
ASSERT_FALSE(object->empty());
|
|
}
|
|
}
|
|
|
|
// Test ROCDL metadata.
|
|
TEST_F(MLIRTargetLLVMROCDL, SKIP_WITHOUT_AMDGPU(GetELFMetadata)) {
|
|
if (!hasROCMTools())
|
|
GTEST_SKIP() << "ROCm installation not found, skipping test.";
|
|
|
|
MLIRContext context(registry);
|
|
|
|
// MLIR module used for the tests.
|
|
const std::string moduleStr = R"mlir(
|
|
gpu.module @rocdl_test {
|
|
llvm.func @rocdl_kernel_1(%arg0: f32) attributes {gpu.kernel, rocdl.kernel} {
|
|
llvm.return
|
|
}
|
|
llvm.func @rocdl_kernel_0(%arg0: f32) attributes {gpu.kernel, rocdl.kernel} {
|
|
llvm.return
|
|
}
|
|
llvm.func @rocdl_kernel_2(%arg0: f32) attributes {gpu.kernel, rocdl.kernel} {
|
|
llvm.return
|
|
}
|
|
llvm.func @a_kernel(%arg0: f32) attributes {gpu.kernel, rocdl.kernel} {
|
|
llvm.return
|
|
}
|
|
})mlir";
|
|
|
|
OwningOpRef<ModuleOp> module =
|
|
parseSourceString<ModuleOp>(moduleStr, &context);
|
|
ASSERT_TRUE(!!module);
|
|
|
|
// Create a ROCDL target.
|
|
ROCDL::ROCDLTargetAttr target = ROCDL::ROCDLTargetAttr::get(&context);
|
|
|
|
// Serialize the module.
|
|
auto serializer = dyn_cast<gpu::TargetAttrInterface>(target);
|
|
ASSERT_TRUE(!!serializer);
|
|
gpu::TargetOptions options("", {}, "", "", gpu::CompilationTarget::Binary);
|
|
for (auto gpuModule : (*module).getBody()->getOps<gpu::GPUModuleOp>()) {
|
|
std::optional<SmallVector<char, 0>> object =
|
|
serializer.serializeToObject(gpuModule, options);
|
|
// Check that the serializer was successful.
|
|
ASSERT_TRUE(object != std::nullopt);
|
|
ASSERT_FALSE(object->empty());
|
|
if (!object)
|
|
continue;
|
|
// Get the metadata.
|
|
gpu::KernelTableAttr metadata =
|
|
ROCDL::getKernelMetadata(gpuModule, *object);
|
|
ASSERT_TRUE(metadata != nullptr);
|
|
// There should be 4 kernels.
|
|
ASSERT_TRUE(metadata.size() == 4);
|
|
// Check that the lookup method returns finds the kernel.
|
|
ASSERT_TRUE(metadata.lookup("a_kernel") != nullptr);
|
|
ASSERT_TRUE(metadata.lookup("rocdl_kernel_0") != nullptr);
|
|
// Check that the kernel doesn't exist.
|
|
ASSERT_TRUE(metadata.lookup("not_existent_kernel") == nullptr);
|
|
// Test the `KernelMetadataAttr` iterators.
|
|
for (gpu::KernelMetadataAttr kernel : metadata) {
|
|
// Check that the ELF metadata is present.
|
|
ASSERT_TRUE(kernel.getMetadata() != nullptr);
|
|
// Verify that `sgpr_count` is present and it is an integer attribute.
|
|
ASSERT_TRUE(kernel.getAttr<IntegerAttr>("sgpr_count") != nullptr);
|
|
// Verify that `vgpr_count` is present and it is an integer attribute.
|
|
ASSERT_TRUE(kernel.getAttr<IntegerAttr>("vgpr_count") != nullptr);
|
|
}
|
|
}
|
|
}
|