forked from OSchip/llvm-project
Reapply "[AMDGPU][OpenMP] Add amdgpu-arch tool to list AMD GPUs installed"
This reverts commit 93604305bb
.
This commit is contained in:
parent
4581bf31bb
commit
59ad4e0f01
|
@ -67,6 +67,8 @@ def err_drv_no_hip_runtime : Error<
|
||||||
"cannot find HIP runtime. Provide its path via --rocm-path, or pass "
|
"cannot find HIP runtime. Provide its path via --rocm-path, or pass "
|
||||||
"-nogpuinc to build without HIP runtime.">;
|
"-nogpuinc to build without HIP runtime.">;
|
||||||
|
|
||||||
|
def err_drv_undetermined_amdgpu_arch : Error<
|
||||||
|
"Cannot determine AMDGPU architecture: %0. Consider passing it via --march.">;
|
||||||
def err_drv_cuda_version_unsupported : Error<
|
def err_drv_cuda_version_unsupported : Error<
|
||||||
"GPU arch %0 is supported by CUDA versions between %1 and %2 (inclusive), "
|
"GPU arch %0 is supported by CUDA versions between %1 and %2 (inclusive), "
|
||||||
"but installation at %3 is %4. Use --cuda-path to specify a different CUDA "
|
"but installation at %3 is %4. Use --cuda-path to specify a different CUDA "
|
||||||
|
|
|
@ -924,6 +924,8 @@ def rocm_path_EQ : Joined<["--"], "rocm-path=">, Group<i_Group>,
|
||||||
HelpText<"ROCm installation path, used for finding and automatically linking required bitcode libraries.">;
|
HelpText<"ROCm installation path, used for finding and automatically linking required bitcode libraries.">;
|
||||||
def hip_path_EQ : Joined<["--"], "hip-path=">, Group<i_Group>,
|
def hip_path_EQ : Joined<["--"], "hip-path=">, Group<i_Group>,
|
||||||
HelpText<"HIP runtime installation path, used for finding HIP version and adding HIP include path.">;
|
HelpText<"HIP runtime installation path, used for finding HIP version and adding HIP include path.">;
|
||||||
|
def amdgpu_arch_tool_EQ : Joined<["--"], "amdgpu-arch-tool=">, Group<i_Group>,
|
||||||
|
HelpText<"Tool used for detecting AMD GPU arch in the system.">;
|
||||||
def rocm_device_lib_path_EQ : Joined<["--"], "rocm-device-lib-path=">, Group<Link_Group>,
|
def rocm_device_lib_path_EQ : Joined<["--"], "rocm-device-lib-path=">, Group<Link_Group>,
|
||||||
HelpText<"ROCm device library path. Alternative to rocm-path.">;
|
HelpText<"ROCm device library path. Alternative to rocm-path.">;
|
||||||
def : Joined<["--"], "hip-device-lib-path=">, Alias<rocm_device_lib_path_EQ>;
|
def : Joined<["--"], "hip-device-lib-path=">, Alias<rocm_device_lib_path_EQ>;
|
||||||
|
|
|
@ -12,9 +12,16 @@
|
||||||
#include "clang/Basic/TargetID.h"
|
#include "clang/Basic/TargetID.h"
|
||||||
#include "clang/Driver/Compilation.h"
|
#include "clang/Driver/Compilation.h"
|
||||||
#include "clang/Driver/DriverDiagnostic.h"
|
#include "clang/Driver/DriverDiagnostic.h"
|
||||||
|
#include "clang/Driver/Options.h"
|
||||||
#include "llvm/Option/ArgList.h"
|
#include "llvm/Option/ArgList.h"
|
||||||
|
#include "llvm/Support/Error.h"
|
||||||
|
#include "llvm/Support/FileUtilities.h"
|
||||||
|
#include "llvm/Support/LineIterator.h"
|
||||||
#include "llvm/Support/Path.h"
|
#include "llvm/Support/Path.h"
|
||||||
#include "llvm/Support/VirtualFileSystem.h"
|
#include "llvm/Support/VirtualFileSystem.h"
|
||||||
|
#include <system_error>
|
||||||
|
|
||||||
|
#define AMDGPU_ARCH_PROGRAM_NAME "amdgpu-arch"
|
||||||
|
|
||||||
using namespace clang::driver;
|
using namespace clang::driver;
|
||||||
using namespace clang::driver::tools;
|
using namespace clang::driver::tools;
|
||||||
|
@ -715,6 +722,78 @@ void AMDGPUToolChain::checkTargetID(
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
llvm::Error
|
||||||
|
AMDGPUToolChain::detectSystemGPUs(const ArgList &Args,
|
||||||
|
SmallVector<std::string, 1> &GPUArchs) const {
|
||||||
|
std::string Program;
|
||||||
|
if (Arg *A = Args.getLastArg(options::OPT_amdgpu_arch_tool_EQ))
|
||||||
|
Program = A->getValue();
|
||||||
|
else
|
||||||
|
Program = GetProgramPath(AMDGPU_ARCH_PROGRAM_NAME);
|
||||||
|
llvm::SmallString<64> OutputFile;
|
||||||
|
llvm::sys::fs::createTemporaryFile("print-system-gpus", "" /* No Suffix */,
|
||||||
|
OutputFile);
|
||||||
|
llvm::FileRemover OutputRemover(OutputFile.c_str());
|
||||||
|
llvm::Optional<llvm::StringRef> Redirects[] = {
|
||||||
|
{""},
|
||||||
|
StringRef(OutputFile),
|
||||||
|
{""},
|
||||||
|
};
|
||||||
|
|
||||||
|
std::string ErrorMessage;
|
||||||
|
if (int Result = llvm::sys::ExecuteAndWait(
|
||||||
|
Program.c_str(), {}, {}, Redirects, /* SecondsToWait */ 0,
|
||||||
|
/*MemoryLimit*/ 0, &ErrorMessage)) {
|
||||||
|
if (Result > 0) {
|
||||||
|
ErrorMessage = "Exited with error code " + std::to_string(Result);
|
||||||
|
} else if (Result == -1) {
|
||||||
|
ErrorMessage = "Execute failed: " + ErrorMessage;
|
||||||
|
} else {
|
||||||
|
ErrorMessage = "Crashed: " + ErrorMessage;
|
||||||
|
}
|
||||||
|
|
||||||
|
return llvm::createStringError(std::error_code(),
|
||||||
|
Program + ": " + ErrorMessage);
|
||||||
|
}
|
||||||
|
|
||||||
|
llvm::ErrorOr<std::unique_ptr<llvm::MemoryBuffer>> OutputBuf =
|
||||||
|
llvm::MemoryBuffer::getFile(OutputFile.c_str());
|
||||||
|
if (!OutputBuf) {
|
||||||
|
return llvm::createStringError(OutputBuf.getError(),
|
||||||
|
"Failed to read stdout of " + Program +
|
||||||
|
": " + OutputBuf.getError().message());
|
||||||
|
}
|
||||||
|
|
||||||
|
for (llvm::line_iterator LineIt(**OutputBuf); !LineIt.is_at_end(); ++LineIt) {
|
||||||
|
GPUArchs.push_back(LineIt->str());
|
||||||
|
}
|
||||||
|
return llvm::Error::success();
|
||||||
|
}
|
||||||
|
|
||||||
|
llvm::Error AMDGPUToolChain::getSystemGPUArch(const ArgList &Args,
|
||||||
|
std::string &GPUArch) const {
|
||||||
|
// detect the AMDGPU installed in system
|
||||||
|
SmallVector<std::string, 1> GPUArchs;
|
||||||
|
auto Err = detectSystemGPUs(Args, GPUArchs);
|
||||||
|
if (Err) {
|
||||||
|
return Err;
|
||||||
|
}
|
||||||
|
if (GPUArchs.empty()) {
|
||||||
|
return llvm::createStringError(std::error_code(),
|
||||||
|
"No AMD GPU detected in the system");
|
||||||
|
}
|
||||||
|
GPUArch = GPUArchs[0];
|
||||||
|
if (GPUArchs.size() > 1) {
|
||||||
|
bool AllSame = std::all_of(
|
||||||
|
GPUArchs.begin(), GPUArchs.end(),
|
||||||
|
[&](const StringRef &GPUArch) { return GPUArch == GPUArchs.front(); });
|
||||||
|
if (!AllSame)
|
||||||
|
return llvm::createStringError(
|
||||||
|
std::error_code(), "Multiple AMD GPUs found with different archs");
|
||||||
|
}
|
||||||
|
return llvm::Error::success();
|
||||||
|
}
|
||||||
|
|
||||||
void ROCMToolChain::addClangTargetOptions(
|
void ROCMToolChain::addClangTargetOptions(
|
||||||
const llvm::opt::ArgList &DriverArgs, llvm::opt::ArgStringList &CC1Args,
|
const llvm::opt::ArgList &DriverArgs, llvm::opt::ArgStringList &CC1Args,
|
||||||
Action::OffloadKind DeviceOffloadingKind) const {
|
Action::OffloadKind DeviceOffloadingKind) const {
|
||||||
|
|
|
@ -100,12 +100,20 @@ public:
|
||||||
/// Should skip argument.
|
/// Should skip argument.
|
||||||
bool shouldSkipArgument(const llvm::opt::Arg *Arg) const;
|
bool shouldSkipArgument(const llvm::opt::Arg *Arg) const;
|
||||||
|
|
||||||
|
/// Uses amdgpu_arch tool to get arch of the system GPU. Will return error
|
||||||
|
/// if unable to find one.
|
||||||
|
llvm::Error getSystemGPUArch(const llvm::opt::ArgList &Args,
|
||||||
|
std::string &GPUArch) const;
|
||||||
|
|
||||||
protected:
|
protected:
|
||||||
/// Check and diagnose invalid target ID specified by -mcpu.
|
/// Check and diagnose invalid target ID specified by -mcpu.
|
||||||
void checkTargetID(const llvm::opt::ArgList &DriverArgs) const;
|
void checkTargetID(const llvm::opt::ArgList &DriverArgs) const;
|
||||||
|
|
||||||
/// Get GPU arch from -mcpu without checking.
|
/// Get GPU arch from -mcpu without checking.
|
||||||
StringRef getGPUArch(const llvm::opt::ArgList &DriverArgs) const;
|
StringRef getGPUArch(const llvm::opt::ArgList &DriverArgs) const;
|
||||||
|
|
||||||
|
llvm::Error detectSystemGPUs(const llvm::opt::ArgList &Args,
|
||||||
|
SmallVector<std::string, 1> &GPUArchs) const;
|
||||||
};
|
};
|
||||||
|
|
||||||
class LLVM_LIBRARY_VISIBILITY ROCMToolChain : public AMDGPUToolChain {
|
class LLVM_LIBRARY_VISIBILITY ROCMToolChain : public AMDGPUToolChain {
|
||||||
|
|
|
@ -10,11 +10,14 @@
|
||||||
#include "AMDGPU.h"
|
#include "AMDGPU.h"
|
||||||
#include "CommonArgs.h"
|
#include "CommonArgs.h"
|
||||||
#include "InputInfo.h"
|
#include "InputInfo.h"
|
||||||
|
#include "clang/Basic/DiagnosticDriver.h"
|
||||||
#include "clang/Driver/Compilation.h"
|
#include "clang/Driver/Compilation.h"
|
||||||
#include "clang/Driver/Driver.h"
|
#include "clang/Driver/Driver.h"
|
||||||
#include "clang/Driver/DriverDiagnostic.h"
|
#include "clang/Driver/DriverDiagnostic.h"
|
||||||
#include "clang/Driver/Options.h"
|
#include "clang/Driver/Options.h"
|
||||||
#include "llvm/Support/FileSystem.h"
|
#include "llvm/Support/FileSystem.h"
|
||||||
|
#include "llvm/Support/FormatAdapters.h"
|
||||||
|
#include "llvm/Support/FormatVariadic.h"
|
||||||
#include "llvm/Support/Path.h"
|
#include "llvm/Support/Path.h"
|
||||||
|
|
||||||
using namespace clang::driver;
|
using namespace clang::driver;
|
||||||
|
@ -66,6 +69,18 @@ static void addLLCOptArg(const llvm::opt::ArgList &Args,
|
||||||
CmdArgs.push_back(Args.MakeArgString("-O" + OOpt));
|
CmdArgs.push_back(Args.MakeArgString("-O" + OOpt));
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
static bool checkSystemForAMDGPU(const ArgList &Args, const AMDGPUToolChain &TC,
|
||||||
|
std::string &GPUArch) {
|
||||||
|
if (auto Err = TC.getSystemGPUArch(Args, GPUArch)) {
|
||||||
|
std::string ErrMsg =
|
||||||
|
llvm::formatv("{0}", llvm::fmt_consume(std::move(Err)));
|
||||||
|
TC.getDriver().Diag(diag::err_drv_undetermined_amdgpu_arch) << ErrMsg;
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
return true;
|
||||||
|
}
|
||||||
} // namespace
|
} // namespace
|
||||||
|
|
||||||
const char *AMDGCN::OpenMPLinker::constructLLVMLinkCommand(
|
const char *AMDGCN::OpenMPLinker::constructLLVMLinkCommand(
|
||||||
|
@ -145,17 +160,23 @@ void AMDGCN::OpenMPLinker::ConstructJob(Compilation &C, const JobAction &JA,
|
||||||
const InputInfoList &Inputs,
|
const InputInfoList &Inputs,
|
||||||
const ArgList &Args,
|
const ArgList &Args,
|
||||||
const char *LinkingOutput) const {
|
const char *LinkingOutput) const {
|
||||||
|
const ToolChain &TC = getToolChain();
|
||||||
assert(getToolChain().getTriple().isAMDGCN() && "Unsupported target");
|
assert(getToolChain().getTriple().isAMDGCN() && "Unsupported target");
|
||||||
|
|
||||||
StringRef GPUArch = Args.getLastArgValue(options::OPT_march_EQ);
|
const toolchains::AMDGPUOpenMPToolChain &AMDGPUOpenMPTC =
|
||||||
assert(GPUArch.startswith("gfx") && "Unsupported sub arch");
|
static_cast<const toolchains::AMDGPUOpenMPToolChain &>(TC);
|
||||||
|
|
||||||
|
std::string GPUArch = Args.getLastArgValue(options::OPT_march_EQ).str();
|
||||||
|
if (GPUArch.empty()) {
|
||||||
|
if (!checkSystemForAMDGPU(Args, AMDGPUOpenMPTC, GPUArch))
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
// Prefix for temporary file name.
|
// Prefix for temporary file name.
|
||||||
std::string Prefix;
|
std::string Prefix;
|
||||||
for (const auto &II : Inputs)
|
for (const auto &II : Inputs)
|
||||||
if (II.isFilename())
|
if (II.isFilename())
|
||||||
Prefix =
|
Prefix = llvm::sys::path::stem(II.getFilename()).str() + "-" + GPUArch;
|
||||||
llvm::sys::path::stem(II.getFilename()).str() + "-" + GPUArch.str();
|
|
||||||
assert(Prefix.length() && "no linker inputs are files ");
|
assert(Prefix.length() && "no linker inputs are files ");
|
||||||
|
|
||||||
// Each command outputs different files.
|
// Each command outputs different files.
|
||||||
|
@ -186,18 +207,22 @@ void AMDGPUOpenMPToolChain::addClangTargetOptions(
|
||||||
Action::OffloadKind DeviceOffloadingKind) const {
|
Action::OffloadKind DeviceOffloadingKind) const {
|
||||||
HostTC.addClangTargetOptions(DriverArgs, CC1Args, DeviceOffloadingKind);
|
HostTC.addClangTargetOptions(DriverArgs, CC1Args, DeviceOffloadingKind);
|
||||||
|
|
||||||
StringRef GpuArch = DriverArgs.getLastArgValue(options::OPT_march_EQ);
|
std::string GPUArch = DriverArgs.getLastArgValue(options::OPT_march_EQ).str();
|
||||||
assert(!GpuArch.empty() && "Must have an explicit GPU arch.");
|
if (GPUArch.empty()) {
|
||||||
|
if (!checkSystemForAMDGPU(DriverArgs, *this, GPUArch))
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
assert(DeviceOffloadingKind == Action::OFK_OpenMP &&
|
assert(DeviceOffloadingKind == Action::OFK_OpenMP &&
|
||||||
"Only OpenMP offloading kinds are supported.");
|
"Only OpenMP offloading kinds are supported.");
|
||||||
|
|
||||||
CC1Args.push_back("-target-cpu");
|
CC1Args.push_back("-target-cpu");
|
||||||
CC1Args.push_back(DriverArgs.MakeArgStringRef(GpuArch));
|
CC1Args.push_back(DriverArgs.MakeArgStringRef(GPUArch));
|
||||||
CC1Args.push_back("-fcuda-is-device");
|
CC1Args.push_back("-fcuda-is-device");
|
||||||
|
|
||||||
if (DriverArgs.hasArg(options::OPT_nogpulib))
|
if (DriverArgs.hasArg(options::OPT_nogpulib))
|
||||||
return;
|
return;
|
||||||
std::string BitcodeSuffix = "amdgcn-" + GpuArch.str();
|
std::string BitcodeSuffix = "amdgcn-" + GPUArch;
|
||||||
addOpenMPDeviceRTL(getDriver(), DriverArgs, CC1Args, BitcodeSuffix,
|
addOpenMPDeviceRTL(getDriver(), DriverArgs, CC1Args, BitcodeSuffix,
|
||||||
getTriple());
|
getTriple());
|
||||||
}
|
}
|
||||||
|
|
|
@ -0,0 +1,4 @@
|
||||||
|
#!/bin/sh
|
||||||
|
echo gfx908
|
||||||
|
echo gfx906
|
||||||
|
exit 0
|
|
@ -0,0 +1,2 @@
|
||||||
|
#!/bin/sh
|
||||||
|
exit 1
|
|
@ -0,0 +1,3 @@
|
||||||
|
#!/bin/sh
|
||||||
|
echo "gfx906"
|
||||||
|
exit 0
|
|
@ -0,0 +1,4 @@
|
||||||
|
#!/bin/sh
|
||||||
|
echo gfx908
|
||||||
|
echo gfx908
|
||||||
|
exit 0
|
|
@ -0,0 +1,28 @@
|
||||||
|
// REQUIRES: system-linux
|
||||||
|
// REQUIRES: x86-registered-target
|
||||||
|
// REQUIRES: amdgpu-registered-target
|
||||||
|
// REQUIRES: shell
|
||||||
|
|
||||||
|
// RUN: mkdir -p %t
|
||||||
|
// RUN: rm -f %t/amdgpu_arch_fail %t/amdgpu_arch_different
|
||||||
|
// RUN: cp %S/Inputs/amdgpu-arch/amdgpu_arch_fail %t/
|
||||||
|
// RUN: cp %S/Inputs/amdgpu-arch/amdgpu_arch_different %t/
|
||||||
|
// RUN: echo '#!/bin/sh' > %t/amdgpu_arch_empty
|
||||||
|
// RUN: chmod +x %t/amdgpu_arch_fail
|
||||||
|
// RUN: chmod +x %t/amdgpu_arch_different
|
||||||
|
// RUN: chmod +x %t/amdgpu_arch_empty
|
||||||
|
|
||||||
|
// case when amdgpu_arch returns nothing or fails
|
||||||
|
// RUN: %clang -### --target=x86_64-unknown-linux-gnu -fopenmp -fopenmp-targets=amdgcn-amd-amdhsa -nogpulib --amdgpu-arch-tool=%t/amdgpu_arch_fail %s 2>&1 \
|
||||||
|
// RUN: | FileCheck %s --check-prefix=NO-OUTPUT-ERROR
|
||||||
|
// NO-OUTPUT-ERROR: error: Cannot determine AMDGPU architecture{{.*}}Exited with error code 1. Consider passing it via --march
|
||||||
|
|
||||||
|
// case when amdgpu_arch returns multiple gpus but all are different
|
||||||
|
// RUN: %clang -### --target=x86_64-unknown-linux-gnu -fopenmp -fopenmp-targets=amdgcn-amd-amdhsa -nogpulib --amdgpu-arch-tool=%t/amdgpu_arch_different %s 2>&1 \
|
||||||
|
// RUN: | FileCheck %s --check-prefix=MULTIPLE-OUTPUT-ERROR
|
||||||
|
// MULTIPLE-OUTPUT-ERROR: error: Cannot determine AMDGPU architecture: Multiple AMD GPUs found with different archs. Consider passing it via --march
|
||||||
|
|
||||||
|
// case when amdgpu_arch does not return anything with successful execution
|
||||||
|
// RUN: %clang -### --target=x86_64-unknown-linux-gnu -fopenmp -fopenmp-targets=amdgcn-amd-amdhsa -nogpulib --amdgpu-arch-tool=%t/amdgpu_arch_empty %s 2>&1 \
|
||||||
|
// RUN: | FileCheck %s --check-prefix=EMPTY-OUTPUT
|
||||||
|
// EMPTY-OUTPUT: error: Cannot determine AMDGPU architecture: No AMD GPU detected in the system. Consider passing it via --march
|
|
@ -0,0 +1,24 @@
|
||||||
|
// REQUIRES: system-linux
|
||||||
|
// REQUIRES: x86-registered-target
|
||||||
|
// REQUIRES: amdgpu-registered-target
|
||||||
|
// REQUIRES: shell
|
||||||
|
|
||||||
|
// RUN: mkdir -p %t
|
||||||
|
// RUN: rm -f %t/amdgpu_arch_gfx906
|
||||||
|
// RUN: cp %S/Inputs/amdgpu-arch/amdgpu_arch_gfx906 %t/
|
||||||
|
// RUN: cp %S/Inputs/amdgpu-arch/amdgpu_arch_gfx908_gfx908 %t/
|
||||||
|
// RUN: chmod +x %t/amdgpu_arch_gfx906
|
||||||
|
// RUN: chmod +x %t/amdgpu_arch_gfx908_gfx908
|
||||||
|
|
||||||
|
// RUN: %clang -### --target=x86_64-unknown-linux-gnu -fopenmp -fopenmp-targets=amdgcn-amd-amdhsa -nogpulib --amdgpu-arch-tool=%t/amdgpu_arch_gfx906 %s 2>&1 \
|
||||||
|
// RUN: | FileCheck %s
|
||||||
|
// CHECK: clang{{.*}}"-cc1"{{.*}}"-triple" "amdgcn-amd-amdhsa"{{.*}}"-target-cpu" "[[GFX:gfx906]]"
|
||||||
|
// CHECK: llvm-link{{.*}}"-o" "{{.*}}amdgpu-openmp-system-arch-{{.*}}-[[GFX]]-linked-{{.*}}.bc"
|
||||||
|
// CHECK: llc{{.*}}amdgpu-openmp-system-arch-{{.*}}-[[GFX]]-linked-{{.*}}.bc" "-mtriple=amdgcn-amd-amdhsa" "-mcpu=[[GFX]]" "-filetype=obj" "-o"{{.*}}amdgpu-openmp-system-arch-{{.*}}-[[GFX]]-{{.*}}.o"
|
||||||
|
|
||||||
|
// case when amdgpu_arch returns multiple gpus but of same arch
|
||||||
|
// RUN: %clang -### --target=x86_64-unknown-linux-gnu -fopenmp -fopenmp-targets=amdgcn-amd-amdhsa -nogpulib --amdgpu-arch-tool=%t/amdgpu_arch_gfx908_gfx908 %s 2>&1 \
|
||||||
|
// RUN: | FileCheck %s --check-prefix=CHECK-MULTIPLE
|
||||||
|
// CHECK-MULTIPLE: clang{{.*}}"-cc1"{{.*}}"-triple" "amdgcn-amd-amdhsa"{{.*}}"-target-cpu" "[[GFX:gfx908]]"
|
||||||
|
// CHECK-MULTIPLE: llvm-link{{.*}}"-o" "{{.*}}amdgpu-openmp-system-arch-{{.*}}-[[GFX]]-linked-{{.*}}.bc"
|
||||||
|
// CHECK-MULTIPLE: llc{{.*}}amdgpu-openmp-system-arch-{{.*}}-[[GFX]]-linked-{{.*}}.bc" "-mtriple=amdgcn-amd-amdhsa" "-mcpu=[[GFX]]" "-filetype=obj" "-o"{{.*}}amdgpu-openmp-system-arch-{{.*}}-[[GFX]]-{{.*}}.o"
|
|
@ -43,3 +43,5 @@ add_llvm_external_project(clang-tools-extra extra)
|
||||||
|
|
||||||
# libclang may require clang-tidy in clang-tools-extra.
|
# libclang may require clang-tidy in clang-tools-extra.
|
||||||
add_clang_subdirectory(libclang)
|
add_clang_subdirectory(libclang)
|
||||||
|
|
||||||
|
add_clang_subdirectory(amdgpu-arch)
|
||||||
|
|
|
@ -0,0 +1,59 @@
|
||||||
|
//===- AMDGPUArch.cpp - list AMDGPU installed ----------*- C++ -*---------===//
|
||||||
|
//
|
||||||
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
||||||
|
// See https://llvm.org/LICENSE.txt for license information.
|
||||||
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
||||||
|
//
|
||||||
|
//===----------------------------------------------------------------------===//
|
||||||
|
//
|
||||||
|
// This file implements a tool for detecting name of AMDGPU installed in system
|
||||||
|
// using HSA. This tool is used by AMDGPU OpenMP driver.
|
||||||
|
//
|
||||||
|
//===----------------------------------------------------------------------===//
|
||||||
|
|
||||||
|
#include <hsa.h>
|
||||||
|
#include <string>
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
static hsa_status_t iterateAgentsCallback(hsa_agent_t Agent, void *Data) {
|
||||||
|
hsa_device_type_t DeviceType;
|
||||||
|
hsa_status_t Status =
|
||||||
|
hsa_agent_get_info(Agent, HSA_AGENT_INFO_DEVICE, &DeviceType);
|
||||||
|
|
||||||
|
// continue only if device type if GPU
|
||||||
|
if (Status != HSA_STATUS_SUCCESS || DeviceType != HSA_DEVICE_TYPE_GPU) {
|
||||||
|
return Status;
|
||||||
|
}
|
||||||
|
|
||||||
|
std::vector<std::string> *GPUs =
|
||||||
|
static_cast<std::vector<std::string> *>(Data);
|
||||||
|
char GPUName[64];
|
||||||
|
Status = hsa_agent_get_info(Agent, HSA_AGENT_INFO_NAME, GPUName);
|
||||||
|
if (Status != HSA_STATUS_SUCCESS) {
|
||||||
|
return Status;
|
||||||
|
}
|
||||||
|
GPUs->push_back(GPUName);
|
||||||
|
return HSA_STATUS_SUCCESS;
|
||||||
|
}
|
||||||
|
|
||||||
|
int main() {
|
||||||
|
hsa_status_t Status = hsa_init();
|
||||||
|
if (Status != HSA_STATUS_SUCCESS) {
|
||||||
|
return 1;
|
||||||
|
}
|
||||||
|
|
||||||
|
std::vector<std::string> GPUs;
|
||||||
|
Status = hsa_iterate_agents(iterateAgentsCallback, &GPUs);
|
||||||
|
if (Status != HSA_STATUS_SUCCESS) {
|
||||||
|
return 1;
|
||||||
|
}
|
||||||
|
|
||||||
|
for (const auto &GPU : GPUs)
|
||||||
|
printf("%s\n", GPU.c_str());
|
||||||
|
|
||||||
|
if (GPUs.size() < 1)
|
||||||
|
return 1;
|
||||||
|
|
||||||
|
hsa_shut_down();
|
||||||
|
return 0;
|
||||||
|
}
|
|
@ -0,0 +1,17 @@
|
||||||
|
# //===----------------------------------------------------------------------===//
|
||||||
|
# //
|
||||||
|
# // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
||||||
|
# // See https://llvm.org/LICENSE.txt for details.
|
||||||
|
# // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
||||||
|
# //
|
||||||
|
# //===----------------------------------------------------------------------===//
|
||||||
|
|
||||||
|
find_package(hsa-runtime64 QUIET 1.2.0 HINTS ${CMAKE_INSTALL_PREFIX} PATHS /opt/rocm)
|
||||||
|
if (NOT ${hsa-runtime64_FOUND})
|
||||||
|
message(STATUS "Not building amdgpu-arch: hsa-runtime64 not found")
|
||||||
|
return()
|
||||||
|
endif()
|
||||||
|
|
||||||
|
add_clang_tool(amdgpu-arch AMDGPUArch.cpp)
|
||||||
|
|
||||||
|
clang_target_link_libraries(amdgpu-arch PRIVATE hsa-runtime64::hsa-runtime64)
|
Loading…
Reference in New Issue