forked from OSchip/llvm-project
379 lines
10 KiB
C++
379 lines
10 KiB
C++
#include "clang/Basic/Cuda.h"
|
|
|
|
#include "llvm/ADT/StringRef.h"
|
|
#include "llvm/ADT/StringSwitch.h"
|
|
#include "llvm/Support/ErrorHandling.h"
|
|
#include "llvm/Support/VersionTuple.h"
|
|
|
|
namespace clang {
|
|
|
|
const char *CudaVersionToString(CudaVersion V) {
|
|
switch (V) {
|
|
case CudaVersion::UNKNOWN:
|
|
return "unknown";
|
|
case CudaVersion::CUDA_70:
|
|
return "7.0";
|
|
case CudaVersion::CUDA_75:
|
|
return "7.5";
|
|
case CudaVersion::CUDA_80:
|
|
return "8.0";
|
|
case CudaVersion::CUDA_90:
|
|
return "9.0";
|
|
case CudaVersion::CUDA_91:
|
|
return "9.1";
|
|
case CudaVersion::CUDA_92:
|
|
return "9.2";
|
|
case CudaVersion::CUDA_100:
|
|
return "10.0";
|
|
case CudaVersion::CUDA_101:
|
|
return "10.1";
|
|
}
|
|
llvm_unreachable("invalid enum");
|
|
}
|
|
|
|
CudaVersion CudaStringToVersion(llvm::StringRef S) {
|
|
return llvm::StringSwitch<CudaVersion>(S)
|
|
.Case("7.0", CudaVersion::CUDA_70)
|
|
.Case("7.5", CudaVersion::CUDA_75)
|
|
.Case("8.0", CudaVersion::CUDA_80)
|
|
.Case("9.0", CudaVersion::CUDA_90)
|
|
.Case("9.1", CudaVersion::CUDA_91)
|
|
.Case("9.2", CudaVersion::CUDA_92)
|
|
.Case("10.0", CudaVersion::CUDA_100)
|
|
.Case("10.1", CudaVersion::CUDA_101);
|
|
}
|
|
|
|
const char *CudaArchToString(CudaArch A) {
|
|
switch (A) {
|
|
case CudaArch::LAST:
|
|
break;
|
|
case CudaArch::UNKNOWN:
|
|
return "unknown";
|
|
case CudaArch::SM_20:
|
|
return "sm_20";
|
|
case CudaArch::SM_21:
|
|
return "sm_21";
|
|
case CudaArch::SM_30:
|
|
return "sm_30";
|
|
case CudaArch::SM_32:
|
|
return "sm_32";
|
|
case CudaArch::SM_35:
|
|
return "sm_35";
|
|
case CudaArch::SM_37:
|
|
return "sm_37";
|
|
case CudaArch::SM_50:
|
|
return "sm_50";
|
|
case CudaArch::SM_52:
|
|
return "sm_52";
|
|
case CudaArch::SM_53:
|
|
return "sm_53";
|
|
case CudaArch::SM_60:
|
|
return "sm_60";
|
|
case CudaArch::SM_61:
|
|
return "sm_61";
|
|
case CudaArch::SM_62:
|
|
return "sm_62";
|
|
case CudaArch::SM_70:
|
|
return "sm_70";
|
|
case CudaArch::SM_72:
|
|
return "sm_72";
|
|
case CudaArch::SM_75:
|
|
return "sm_75";
|
|
case CudaArch::GFX600: // tahiti
|
|
return "gfx600";
|
|
case CudaArch::GFX601: // pitcairn, verde, oland,hainan
|
|
return "gfx601";
|
|
case CudaArch::GFX700: // kaveri
|
|
return "gfx700";
|
|
case CudaArch::GFX701: // hawaii
|
|
return "gfx701";
|
|
case CudaArch::GFX702: // 290,290x,R390,R390x
|
|
return "gfx702";
|
|
case CudaArch::GFX703: // kabini mullins
|
|
return "gfx703";
|
|
case CudaArch::GFX704: // bonaire
|
|
return "gfx704";
|
|
case CudaArch::GFX801: // carrizo
|
|
return "gfx801";
|
|
case CudaArch::GFX802: // tonga,iceland
|
|
return "gfx802";
|
|
case CudaArch::GFX803: // fiji,polaris10
|
|
return "gfx803";
|
|
case CudaArch::GFX810: // stoney
|
|
return "gfx810";
|
|
case CudaArch::GFX900: // vega, instinct
|
|
return "gfx900";
|
|
case CudaArch::GFX902: // TBA
|
|
return "gfx902";
|
|
case CudaArch::GFX904: // TBA
|
|
return "gfx904";
|
|
case CudaArch::GFX906: // TBA
|
|
return "gfx906";
|
|
case CudaArch::GFX909: // TBA
|
|
return "gfx909";
|
|
}
|
|
llvm_unreachable("invalid enum");
|
|
}
|
|
|
|
CudaArch StringToCudaArch(llvm::StringRef S) {
|
|
return llvm::StringSwitch<CudaArch>(S)
|
|
.Case("sm_20", CudaArch::SM_20)
|
|
.Case("sm_21", CudaArch::SM_21)
|
|
.Case("sm_30", CudaArch::SM_30)
|
|
.Case("sm_32", CudaArch::SM_32)
|
|
.Case("sm_35", CudaArch::SM_35)
|
|
.Case("sm_37", CudaArch::SM_37)
|
|
.Case("sm_50", CudaArch::SM_50)
|
|
.Case("sm_52", CudaArch::SM_52)
|
|
.Case("sm_53", CudaArch::SM_53)
|
|
.Case("sm_60", CudaArch::SM_60)
|
|
.Case("sm_61", CudaArch::SM_61)
|
|
.Case("sm_62", CudaArch::SM_62)
|
|
.Case("sm_70", CudaArch::SM_70)
|
|
.Case("sm_72", CudaArch::SM_72)
|
|
.Case("sm_75", CudaArch::SM_75)
|
|
.Case("gfx600", CudaArch::GFX600)
|
|
.Case("gfx601", CudaArch::GFX601)
|
|
.Case("gfx700", CudaArch::GFX700)
|
|
.Case("gfx701", CudaArch::GFX701)
|
|
.Case("gfx702", CudaArch::GFX702)
|
|
.Case("gfx703", CudaArch::GFX703)
|
|
.Case("gfx704", CudaArch::GFX704)
|
|
.Case("gfx801", CudaArch::GFX801)
|
|
.Case("gfx802", CudaArch::GFX802)
|
|
.Case("gfx803", CudaArch::GFX803)
|
|
.Case("gfx810", CudaArch::GFX810)
|
|
.Case("gfx900", CudaArch::GFX900)
|
|
.Case("gfx902", CudaArch::GFX902)
|
|
.Case("gfx904", CudaArch::GFX904)
|
|
.Case("gfx906", CudaArch::GFX906)
|
|
.Case("gfx909", CudaArch::GFX909)
|
|
.Default(CudaArch::UNKNOWN);
|
|
}
|
|
|
|
const char *CudaVirtualArchToString(CudaVirtualArch A) {
|
|
switch (A) {
|
|
case CudaVirtualArch::UNKNOWN:
|
|
return "unknown";
|
|
case CudaVirtualArch::COMPUTE_20:
|
|
return "compute_20";
|
|
case CudaVirtualArch::COMPUTE_30:
|
|
return "compute_30";
|
|
case CudaVirtualArch::COMPUTE_32:
|
|
return "compute_32";
|
|
case CudaVirtualArch::COMPUTE_35:
|
|
return "compute_35";
|
|
case CudaVirtualArch::COMPUTE_37:
|
|
return "compute_37";
|
|
case CudaVirtualArch::COMPUTE_50:
|
|
return "compute_50";
|
|
case CudaVirtualArch::COMPUTE_52:
|
|
return "compute_52";
|
|
case CudaVirtualArch::COMPUTE_53:
|
|
return "compute_53";
|
|
case CudaVirtualArch::COMPUTE_60:
|
|
return "compute_60";
|
|
case CudaVirtualArch::COMPUTE_61:
|
|
return "compute_61";
|
|
case CudaVirtualArch::COMPUTE_62:
|
|
return "compute_62";
|
|
case CudaVirtualArch::COMPUTE_70:
|
|
return "compute_70";
|
|
case CudaVirtualArch::COMPUTE_72:
|
|
return "compute_72";
|
|
case CudaVirtualArch::COMPUTE_75:
|
|
return "compute_75";
|
|
case CudaVirtualArch::COMPUTE_AMDGCN:
|
|
return "compute_amdgcn";
|
|
}
|
|
llvm_unreachable("invalid enum");
|
|
}
|
|
|
|
CudaVirtualArch StringToCudaVirtualArch(llvm::StringRef S) {
|
|
return llvm::StringSwitch<CudaVirtualArch>(S)
|
|
.Case("compute_20", CudaVirtualArch::COMPUTE_20)
|
|
.Case("compute_30", CudaVirtualArch::COMPUTE_30)
|
|
.Case("compute_32", CudaVirtualArch::COMPUTE_32)
|
|
.Case("compute_35", CudaVirtualArch::COMPUTE_35)
|
|
.Case("compute_37", CudaVirtualArch::COMPUTE_37)
|
|
.Case("compute_50", CudaVirtualArch::COMPUTE_50)
|
|
.Case("compute_52", CudaVirtualArch::COMPUTE_52)
|
|
.Case("compute_53", CudaVirtualArch::COMPUTE_53)
|
|
.Case("compute_60", CudaVirtualArch::COMPUTE_60)
|
|
.Case("compute_61", CudaVirtualArch::COMPUTE_61)
|
|
.Case("compute_62", CudaVirtualArch::COMPUTE_62)
|
|
.Case("compute_70", CudaVirtualArch::COMPUTE_70)
|
|
.Case("compute_72", CudaVirtualArch::COMPUTE_72)
|
|
.Case("compute_75", CudaVirtualArch::COMPUTE_75)
|
|
.Case("compute_amdgcn", CudaVirtualArch::COMPUTE_AMDGCN)
|
|
.Default(CudaVirtualArch::UNKNOWN);
|
|
}
|
|
|
|
CudaVirtualArch VirtualArchForCudaArch(CudaArch A) {
|
|
switch (A) {
|
|
case CudaArch::LAST:
|
|
break;
|
|
case CudaArch::UNKNOWN:
|
|
return CudaVirtualArch::UNKNOWN;
|
|
case CudaArch::SM_20:
|
|
case CudaArch::SM_21:
|
|
return CudaVirtualArch::COMPUTE_20;
|
|
case CudaArch::SM_30:
|
|
return CudaVirtualArch::COMPUTE_30;
|
|
case CudaArch::SM_32:
|
|
return CudaVirtualArch::COMPUTE_32;
|
|
case CudaArch::SM_35:
|
|
return CudaVirtualArch::COMPUTE_35;
|
|
case CudaArch::SM_37:
|
|
return CudaVirtualArch::COMPUTE_37;
|
|
case CudaArch::SM_50:
|
|
return CudaVirtualArch::COMPUTE_50;
|
|
case CudaArch::SM_52:
|
|
return CudaVirtualArch::COMPUTE_52;
|
|
case CudaArch::SM_53:
|
|
return CudaVirtualArch::COMPUTE_53;
|
|
case CudaArch::SM_60:
|
|
return CudaVirtualArch::COMPUTE_60;
|
|
case CudaArch::SM_61:
|
|
return CudaVirtualArch::COMPUTE_61;
|
|
case CudaArch::SM_62:
|
|
return CudaVirtualArch::COMPUTE_62;
|
|
case CudaArch::SM_70:
|
|
return CudaVirtualArch::COMPUTE_70;
|
|
case CudaArch::SM_72:
|
|
return CudaVirtualArch::COMPUTE_72;
|
|
case CudaArch::SM_75:
|
|
return CudaVirtualArch::COMPUTE_75;
|
|
case CudaArch::GFX600:
|
|
case CudaArch::GFX601:
|
|
case CudaArch::GFX700:
|
|
case CudaArch::GFX701:
|
|
case CudaArch::GFX702:
|
|
case CudaArch::GFX703:
|
|
case CudaArch::GFX704:
|
|
case CudaArch::GFX801:
|
|
case CudaArch::GFX802:
|
|
case CudaArch::GFX803:
|
|
case CudaArch::GFX810:
|
|
case CudaArch::GFX900:
|
|
case CudaArch::GFX902:
|
|
case CudaArch::GFX904:
|
|
case CudaArch::GFX906:
|
|
case CudaArch::GFX909:
|
|
return CudaVirtualArch::COMPUTE_AMDGCN;
|
|
}
|
|
llvm_unreachable("invalid enum");
|
|
}
|
|
|
|
CudaVersion MinVersionForCudaArch(CudaArch A) {
|
|
switch (A) {
|
|
case CudaArch::LAST:
|
|
break;
|
|
case CudaArch::UNKNOWN:
|
|
return CudaVersion::UNKNOWN;
|
|
case CudaArch::SM_20:
|
|
case CudaArch::SM_21:
|
|
case CudaArch::SM_30:
|
|
case CudaArch::SM_32:
|
|
case CudaArch::SM_35:
|
|
case CudaArch::SM_37:
|
|
case CudaArch::SM_50:
|
|
case CudaArch::SM_52:
|
|
case CudaArch::SM_53:
|
|
return CudaVersion::CUDA_70;
|
|
case CudaArch::SM_60:
|
|
case CudaArch::SM_61:
|
|
case CudaArch::SM_62:
|
|
return CudaVersion::CUDA_80;
|
|
case CudaArch::SM_70:
|
|
return CudaVersion::CUDA_90;
|
|
case CudaArch::SM_72:
|
|
return CudaVersion::CUDA_91;
|
|
case CudaArch::SM_75:
|
|
return CudaVersion::CUDA_100;
|
|
case CudaArch::GFX600:
|
|
case CudaArch::GFX601:
|
|
case CudaArch::GFX700:
|
|
case CudaArch::GFX701:
|
|
case CudaArch::GFX702:
|
|
case CudaArch::GFX703:
|
|
case CudaArch::GFX704:
|
|
case CudaArch::GFX801:
|
|
case CudaArch::GFX802:
|
|
case CudaArch::GFX803:
|
|
case CudaArch::GFX810:
|
|
case CudaArch::GFX900:
|
|
case CudaArch::GFX902:
|
|
case CudaArch::GFX904:
|
|
case CudaArch::GFX906:
|
|
case CudaArch::GFX909:
|
|
return CudaVersion::CUDA_70;
|
|
}
|
|
llvm_unreachable("invalid enum");
|
|
}
|
|
|
|
CudaVersion MaxVersionForCudaArch(CudaArch A) {
|
|
switch (A) {
|
|
case CudaArch::UNKNOWN:
|
|
return CudaVersion::UNKNOWN;
|
|
case CudaArch::SM_20:
|
|
case CudaArch::SM_21:
|
|
case CudaArch::GFX600:
|
|
case CudaArch::GFX601:
|
|
case CudaArch::GFX700:
|
|
case CudaArch::GFX701:
|
|
case CudaArch::GFX702:
|
|
case CudaArch::GFX703:
|
|
case CudaArch::GFX704:
|
|
case CudaArch::GFX801:
|
|
case CudaArch::GFX802:
|
|
case CudaArch::GFX803:
|
|
case CudaArch::GFX810:
|
|
case CudaArch::GFX900:
|
|
case CudaArch::GFX902:
|
|
return CudaVersion::CUDA_80;
|
|
default:
|
|
return CudaVersion::LATEST;
|
|
}
|
|
}
|
|
|
|
static CudaVersion ToCudaVersion(llvm::VersionTuple Version) {
|
|
int IVer =
|
|
Version.getMajor() * 10 + Version.getMinor().getValueOr(0);
|
|
switch(IVer) {
|
|
case 70:
|
|
return CudaVersion::CUDA_70;
|
|
case 75:
|
|
return CudaVersion::CUDA_75;
|
|
case 80:
|
|
return CudaVersion::CUDA_80;
|
|
case 90:
|
|
return CudaVersion::CUDA_90;
|
|
case 91:
|
|
return CudaVersion::CUDA_91;
|
|
case 92:
|
|
return CudaVersion::CUDA_92;
|
|
case 100:
|
|
return CudaVersion::CUDA_100;
|
|
case 101:
|
|
return CudaVersion::CUDA_101;
|
|
default:
|
|
return CudaVersion::UNKNOWN;
|
|
}
|
|
}
|
|
|
|
bool CudaFeatureEnabled(llvm::VersionTuple Version, CudaFeature Feature) {
|
|
return CudaFeatureEnabled(ToCudaVersion(Version), Feature);
|
|
}
|
|
|
|
bool CudaFeatureEnabled(CudaVersion Version, CudaFeature Feature) {
|
|
switch (Feature) {
|
|
case CudaFeature::CUDA_USES_NEW_LAUNCH:
|
|
return Version >= CudaVersion::CUDA_92;
|
|
case CudaFeature::CUDA_USES_FATBIN_REGISTER_END:
|
|
return Version >= CudaVersion::CUDA_101;
|
|
}
|
|
llvm_unreachable("Unknown CUDA feature.");
|
|
}
|
|
} // namespace clang
|