llvm-project/llvm/lib/Target/AMDGPU/AMDGPUSubtarget.cpp

//===-- AMDGPUSubtarget.cpp - AMDGPU Subtarget Information ----------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
/// \file
/// \brief Implements the AMDGPU specific subclass of TargetSubtarget.
//
//===----------------------------------------------------------------------===//

#include "AMDGPUSubtarget.h"
#include "R600ISelLowering.h"
#include "R600InstrInfo.h"
#include "R600MachineScheduler.h"
#include "SIISelLowering.h"
#include "SIInstrInfo.h"
#include "SIMachineFunctionInfo.h"
#include "llvm/ADT/SmallString.h"
#include "llvm/CodeGen/MachineScheduler.h"

using namespace llvm;

#define DEBUG_TYPE "amdgpu-subtarget"

#define GET_SUBTARGETINFO_ENUM
#define GET_SUBTARGETINFO_TARGET_DESC
#define GET_SUBTARGETINFO_CTOR
#include "AMDGPUGenSubtargetInfo.inc"

/// Parse the subtarget feature string for \p GPU and apply the
/// generation-dependent denormal fixup.
///
/// \param TT  Target triple; only its architecture is inspected here.
/// \param GPU Processor name. When empty on the amdgcn architecture it is
///            replaced by "SI" before parsing.
/// \param FS  Caller-supplied feature string, appended after the built-in
///            default features.
/// \returns   A reference to this subtarget.
AMDGPUSubtarget &
AMDGPUSubtarget::initializeSubtargetDependencies(const Triple &TT,
                                                 StringRef GPU, StringRef FS) {
  // Default characteristics are listed first, followed by whatever the user
  // specified.
  //
  // On SI+, FP64 denormals should be on by default. FP32 denormals can be
  // enabled too, but some instructions do not respect them and they run at
  // the double precision rate, so they are left off by default.
  //
  // These need to stay switchable, but expressing this as a subtarget
  // feature for SI has the unhelpful behavior of unsetting everything else
  // when it is disabled.
  SmallString<256> FullFS("+promote-alloca,+fp64-denormals,");
  FullFS += FS;

  // No processor was named: fall back to "SI" for the amdgcn architecture.
  if (GPU.empty() && TT.getArch() == Triple::amdgcn)
    GPU = "SI";

  ParseSubtargetFeatures(GPU, FullFS);

  // FIXME: I don't think Evergreen has any useful support for denormals, but
  // this should be checked. Should we issue a warning somewhere if someone
  // tries to enable these?
  const bool UpToNorthernIslands =
      getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS;
  if (UpToNorthernIslands) {
    FP32Denormals = false;
    FP64Denormals = false;
  }

  return *this;
}

/// Construct the subtarget for processor \p GPU on triple \p TT using the
/// feature string \p FS.
///
/// All members receive fixed defaults in the initializer list. After that,
/// initializeSubtargetDependencies() parses the feature string, and the
/// instruction info / target lowering objects are created: the R600 variants
/// for generations up to NORTHERN_ISLANDS, the SI variants otherwise.
AMDGPUSubtarget::AMDGPUSubtarget(const Triple &TT, StringRef GPU, StringRef FS,
                                 TargetMachine &TM)
    : AMDGPUGenSubtargetInfo(TT, GPU, FS),
      DevName(GPU),
      Is64bit(false),
      DumpCode(false),
      R600ALUInst(false),
      HasVertexCache(false),
      TexVTXClauseSize(0),
      Gen(AMDGPUSubtarget::R600),
      FP64(false),
      FP64Denormals(false),
      FP32Denormals(false),
      FastFMAF32(false),
      CaymanISA(false),
      FlatAddressSpace(false),
      EnableIRStructurizer(true),
      EnablePromoteAlloca(false),
      EnableIfCvt(true),
      EnableLoadStoreOpt(false),
      EnableUnsafeDSOffsetFolding(false),
      WavefrontSize(0),
      CFALUBug(false),
      LocalMemorySize(0),
      EnableVGPRSpilling(false),
      SGPRInitBug(false),
      IsGCN(false),
      GCN1Encoding(false),
      GCN3Encoding(false),
      CIInsts(false),
      LDSBankCount(0),
      IsaVersion(ISAVersion0_0_0),
      EnableHugeScratchBuffer(false),
      FrameLowering(TargetFrameLowering::StackGrowsUp,
                    64 * 16, // Maximum stack alignment (long16)
                    0),
      InstrItins(getInstrItineraryForCPU(GPU)),
      TargetTriple(TT) {

  // Parse the feature string before anything queries the generation.
  initializeSubtargetDependencies(TT, GPU, FS);

  // Generations past NORTHERN_ISLANDS get the SI implementations.
  const bool PastNorthernIslands =
      !(getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS);
  if (PastNorthernIslands) {
    InstrInfo.reset(new SIInstrInfo(*this));
    TLInfo.reset(new SITargetLowering(TM, *this));
    return;
  }

  // Everything else uses the R600 implementations.
  InstrInfo.reset(new R600InstrInfo(*this));
  TLInfo.reset(new R600TargetLowering(TM, *this));
}

/// Return the stack entry size that corresponds to the current wavefront
/// size.
///
/// Asserts that the generation is at most NORTHERN_ISLANDS. Wavefront sizes
/// other than 16, 32 and 64 are treated as unreachable.
unsigned AMDGPUSubtarget::getStackEntrySize() const {
  assert(getGeneration() <= NORTHERN_ISLANDS);

  const auto WaveSize = getWavefrontSize();

  if (WaveSize == 16)
    return 8;

  if (WaveSize == 32) {
    // For 32-wide wavefronts the answer depends on the Cayman ISA flag.
    if (hasCaymanISA())
      return 4;
    return 8;
  }

  if (WaveSize == 64)
    return 4;

  llvm_unreachable("Illegal wavefront size.");
}

/// Return the chip ID value for the current generation.
///
/// Only SEA_ISLANDS is handled (value 12); reaching this function with any
/// other generation is treated as unreachable.
unsigned AMDGPUSubtarget::getAmdKernelCodeChipID() const {
  if (getGeneration() == SEA_ISLANDS)
    return 12;

  llvm_unreachable("ChipID unknown");
}

/// Return the ISA version that AMDGPU::getIsaVersion() derives from this
/// subtarget's feature bits.
AMDGPU::IsaVersion AMDGPUSubtarget::getIsaVersion() const {
  const auto &Features = getFeatureBits();
  return AMDGPU::getIsaVersion(Features);
}

/// Return true when VGPR spilling is enabled for the function described by
/// \p MFI: always for compute shaders, otherwise only when the
/// EnableVGPRSpilling flag is set.
///
/// \p MFI is dereferenced unconditionally.
bool AMDGPUSubtarget::isVGPRSpillingEnabled(
    const SIMachineFunctionInfo *MFI) const {
  // The shader type is checked first, before the subtarget flag.
  if (MFI->getShaderType() == ShaderType::COMPUTE)
    return true;

  return EnableVGPRSpilling;
}

/// Adjust the machine scheduling policy for this subtarget.
///
/// For generations from SOUTHERN_ISLANDS onwards, register pressure tracking
/// is switched on and both scheduling directions are allowed. \p Policy is
/// left untouched for earlier generations. The region arguments \p begin,
/// \p end and \p NumRegionInstrs are not consulted.
void AMDGPUSubtarget::overrideSchedPolicy(MachineSchedPolicy &Policy,
                                          MachineInstr *begin,
                                          MachineInstr *end,
                                          unsigned NumRegionInstrs) const {
  // Nothing to override before SOUTHERN_ISLANDS.
  if (getGeneration() < SOUTHERN_ISLANDS)
    return;

  // Using top-down and bottom-up scheduling together seems to produce fewer
  // register spills than either approach on its own.
  Policy.OnlyTopDown = false;
  Policy.OnlyBottomUp = false;

  // Pressure tracking lets the scheduler try to reduce pressure once
  // register usage exceeds the threshold defined by
  // SIRegisterInfo::getRegPressureSetLimit().
  Policy.ShouldTrackPressure = true;
}
Add R600 backend A new backend supporting AMD GPUs: Radeon HD2XXX - HD7XXX llvm-svn: 169915 2012-12-12 05:25:42 +08:00			`//===-- AMDGPUSubtarget.cpp - AMDGPU Subtarget Information ----------------===//`
			`//`
			`// The LLVM Compiler Infrastructure`
			`//`
			`// This file is distributed under the University of Illinois Open Source`
			`// License. See LICENSE.TXT for details.`
			`//`
			`//===----------------------------------------------------------------------===//`
			`//`
			`/// \file`
			`/// \brief Implements the AMDGPU specific subclass of TargetSubtarget.`
			`//`
			`//===----------------------------------------------------------------------===//`

			`#include "AMDGPUSubtarget.h"`
Move R600 subtarget dependent variables onto the subtarget. No functional change. llvm-svn: 213982 2014-07-26 06:22:39 +08:00			`#include "R600ISelLowering.h"`
R600: Move AMDGPUInstrInfo from AMDGPUTargetMachine into AMDGPUSubtarget llvm-svn: 210869 2014-06-13 09:32:00 +08:00			`#include "R600InstrInfo.h"`
Move R600 subtarget dependent variables onto the subtarget. No functional change. llvm-svn: 213982 2014-07-26 06:22:39 +08:00			`#include "R600MachineScheduler.h"`
			`#include "SIISelLowering.h"`
[cleanup] Re-sort all the #include lines in LLVM using utils/sort_includes.py. I clearly haven't done this in a while, so more changed than usual. This even uncovered a missing include from the InstrProf library that I've added. No functionality changed here, just mechanical cleanup of the include order. llvm-svn: 225974 2015-01-14 19:23:27 +08:00			`#include "SIInstrInfo.h"`
R600/SI: Add subtarget feature to enable VGPR spilling for all shader types This is disabled by default, but can be enabled with the subtarget feature: 'vgpr-spilling' llvm-svn: 226597 2015-01-21 03:33:04 +08:00			`#include "SIMachineFunctionInfo.h"`
R600: Add option to disable promote alloca This can make writing some tests harder, so add a flag to disable it. llvm-svn: 212893 2014-07-13 10:08:26 +08:00			`#include "llvm/ADT/SmallString.h"`
R600/SI: Define a schedule model and enable the generic machine scheduler The schedule model is not complete yet, and could be improved. llvm-svn: 227461 2015-01-30 00:55:25 +08:00			`#include "llvm/CodeGen/MachineScheduler.h"`
R600: Add option to disable promote alloca This can make writing some tests harder, so add a flag to disable it. llvm-svn: 212893 2014-07-13 10:08:26 +08:00
Add R600 backend A new backend supporting AMD GPUs: Radeon HD2XXX - HD7XXX llvm-svn: 169915 2012-12-12 05:25:42 +08:00			`using namespace llvm;`

[Modules] Make Support/Debug.h modular. This requires it to not change behavior based on other files defining DEBUG_TYPE, which means it cannot define DEBUG_TYPE at all. This is actually better IMO as it forces folks to define relevant DEBUG_TYPEs for their files. However, it requires all files that currently use DEBUG(...) to define a DEBUG_TYPE if they don't already. I've updated all such files in LLVM and will do the same for other upstream projects. This still leaves one important change in how LLVM uses the DEBUG_TYPE macro going forward: we need to only define the macro after header files have been #include-ed. Previously, this wasn't possible because Debug.h required the macro to be pre-defined. This commit removes that. By defining DEBUG_TYPE after the includes two things are fixed: - Header files that need to provide a DEBUG_TYPE for some inline code can do so by defining the macro before their inline code and undef-ing it afterward so the macro does not escape. - We no longer have rampant ODR violations due to including headers with different DEBUG_TYPE definitions. This may be mostly an academic violation today, but with modules these types of violations are easy to check for and potentially very relevant. Where necessary to suppor headers with DEBUG_TYPE, I have moved the definitions below the includes in this commit. I plan to move the rest of the DEBUG_TYPE macros in LLVM in subsequent commits; this one is big enough. The comments in Debug.h, which were hilariously out of date already, have been updated to reflect the recommended practice going forward. llvm-svn: 206822 2014-04-22 06:55:11 +08:00			`#define DEBUG_TYPE "amdgpu-subtarget"`

Add R600 backend A new backend supporting AMD GPUs: Radeon HD2XXX - HD7XXX llvm-svn: 169915 2012-12-12 05:25:42 +08:00			`#define GET_SUBTARGETINFO_ENUM`
			`#define GET_SUBTARGETINFO_TARGET_DESC`
			`#define GET_SUBTARGETINFO_CTOR`
			`#include "AMDGPUGenSubtargetInfo.inc"`

Move R600 subtarget dependent variables onto the subtarget. No functional change. llvm-svn: 213982 2014-07-26 06:22:39 +08:00			`AMDGPUSubtarget &`
Replace string GNU Triples with llvm::Triple in MCSubtargetInfo and create*MCSubtargetInfo(). NFC. Summary: This continues the patch series to eliminate StringRef forms of GNU triples from the internals of LLVM that began in r239036. Reviewers: rafael Reviewed By: rafael Subscribers: rafael, ted, jfb, llvm-commits, rengolin, jholewinski Differential Revision: http://reviews.llvm.org/D10311 llvm-svn: 239467 2015-06-10 20:11:26 +08:00			`AMDGPUSubtarget::initializeSubtargetDependencies(const Triple &TT,`
			`StringRef GPU, StringRef FS) {`
Move R600 subtarget dependent variables onto the subtarget. No functional change. llvm-svn: 213982 2014-07-26 06:22:39 +08:00			`// Determine default and user-specified characteristics`
R600: Add denormal handling subtarget features. llvm-svn: 213018 2014-07-15 07:40:49 +08:00			`// On SI+, we want FP64 denormals to be on by default. FP32 denormals can be`
			`// enabled, but some instructions do not respect them and they run at the`
			`// double precision rate, so don't enable by default.`
			`//`
			`// We want to be able to turn these off, but making this a subtarget feature`
			`// for SI has the unhelpful behavior that it unsets everything else if you`
			`// disable it.`
R600: Add option to disable promote alloca This can make writing some tests harder, so add a flag to disable it. llvm-svn: 212893 2014-07-13 10:08:26 +08:00
R600: Add denormal handling subtarget features. llvm-svn: 213018 2014-07-15 07:40:49 +08:00			`SmallString<256> FullFS("+promote-alloca,+fp64-denormals,");`
R600: Add option to disable promote alloca This can make writing some tests harder, so add a flag to disable it. llvm-svn: 212893 2014-07-13 10:08:26 +08:00			`FullFS += FS;`

Replace string GNU Triples with llvm::Triple in MCSubtargetInfo and create*MCSubtargetInfo(). NFC. Summary: This continues the patch series to eliminate StringRef forms of GNU triples from the internals of LLVM that began in r239036. Reviewers: rafael Reviewed By: rafael Subscribers: rafael, ted, jfb, llvm-commits, rengolin, jholewinski Differential Revision: http://reviews.llvm.org/D10311 llvm-svn: 239467 2015-06-10 20:11:26 +08:00			`if (GPU == "" && TT.getArch() == Triple::amdgcn)`
R600: Use a Southern Islands GPU as the default for the amdgcn target llvm-svn: 227314 2015-01-28 23:38:42 +08:00			`GPU = "SI";`

R600: Add option to disable promote alloca This can make writing some tests harder, so add a flag to disable it. llvm-svn: 212893 2014-07-13 10:08:26 +08:00			`ParseSubtargetFeatures(GPU, FullFS);`
R600: Move AMDGPUInstrInfo from AMDGPUTargetMachine into AMDGPUSubtarget llvm-svn: 210869 2014-06-13 09:32:00 +08:00
Move R600 subtarget dependent variables onto the subtarget. No functional change. llvm-svn: 213982 2014-07-26 06:22:39 +08:00			`// FIXME: I don't think Evergreen has any useful support for`
			`// denormals, but should be checked. Should we issue a warning somewhere`
			`// if someone tries to enable these?`
R600: Move AMDGPUInstrInfo from AMDGPUTargetMachine into AMDGPUSubtarget llvm-svn: 210869 2014-06-13 09:32:00 +08:00			`if (getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {`
R600: Add denormal handling subtarget features. llvm-svn: 213018 2014-07-15 07:40:49 +08:00			`FP32Denormals = false;`
			`FP64Denormals = false;`
Move R600 subtarget dependent variables onto the subtarget. No functional change. llvm-svn: 213982 2014-07-26 06:22:39 +08:00			`}`
			`return *this;`
			`}`

Replace string GNU Triples with llvm::Triple in MCSubtargetInfo and create*MCSubtargetInfo(). NFC. Summary: This continues the patch series to eliminate StringRef forms of GNU triples from the internals of LLVM that began in r239036. Reviewers: rafael Reviewed By: rafael Subscribers: rafael, ted, jfb, llvm-commits, rengolin, jholewinski Differential Revision: http://reviews.llvm.org/D10311 llvm-svn: 239467 2015-06-10 20:11:26 +08:00			`AMDGPUSubtarget::AMDGPUSubtarget(const Triple &TT, StringRef GPU, StringRef FS,`
Move R600 subtarget dependent variables onto the subtarget. No functional change. llvm-svn: 213982 2014-07-26 06:22:39 +08:00			`TargetMachine &TM)`
Revert r247692: Replace Triple with a new TargetTuple in MCTargetDesc/* and related. NFC. Eric has replied and has demanded the patch be reverted. llvm-svn: 247702 2015-09-16 00:17:27 +08:00			`: AMDGPUGenSubtargetInfo(TT, GPU, FS), DevName(GPU), Is64bit(false),`
			`DumpCode(false), R600ALUInst(false), HasVertexCache(false),`
			`TexVTXClauseSize(0), Gen(AMDGPUSubtarget::R600), FP64(false),`
			`FP64Denormals(false), FP32Denormals(false), FastFMAF32(false),`
			`CaymanISA(false), FlatAddressSpace(false), EnableIRStructurizer(true),`
			`EnablePromoteAlloca(false), EnableIfCvt(true), EnableLoadStoreOpt(false),`
			`EnableUnsafeDSOffsetFolding(false),`
80-column fixups. llvm-svn: 229789 2015-02-19 08:15:33 +08:00			`WavefrontSize(0), CFALUBug(false), LocalMemorySize(0),`
Replace string GNU Triples with llvm::Triple in MCSubtargetInfo and create*MCSubtargetInfo(). NFC. Summary: This continues the patch series to eliminate StringRef forms of GNU triples from the internals of LLVM that began in r239036. Reviewers: rafael Reviewed By: rafael Subscribers: rafael, ted, jfb, llvm-commits, rengolin, jholewinski Differential Revision: http://reviews.llvm.org/D10311 llvm-svn: 239467 2015-06-10 20:11:26 +08:00			`EnableVGPRSpilling(false), SGPRInitBug(false), IsGCN(false),`
			`GCN1Encoding(false), GCN3Encoding(false), CIInsts(false), LDSBankCount(0),`
AMDPGU/SI: Use AssertZext node to mask high bit for scratch offsets Summary: We can safely assume that the high bit of scratch offsets will never be set, because this would require at least 128 GB of GPU memory. Reviewers: arsenm Subscribers: llvm-commits Differential Revision: http://reviews.llvm.org/D11225 llvm-svn: 242433 2015-07-17 03:40:07 +08:00			`IsaVersion(ISAVersion0_0_0), EnableHugeScratchBuffer(false),`
Move R600 subtarget dependent variables onto the subtarget. No functional change. llvm-svn: 213982 2014-07-26 06:22:39 +08:00			`FrameLowering(TargetFrameLowering::StackGrowsUp,`
			`64 * 16, // Maximum stack alignment (long16)`
			`0),`
80-column fixups. llvm-svn: 229789 2015-02-19 08:15:33 +08:00			`InstrItins(getInstrItineraryForCPU(GPU)), TargetTriple(TT) {`
R600: Move DataLayout to AMDGPUTargetMachine This is a follow up to r227113. It is now required to use the amdgcn target for SI and newer GPUs. llvm-svn: 227316 2015-01-29 00:04:26 +08:00
			`initializeSubtargetDependencies(TT, GPU, FS);`

Move R600 subtarget dependent variables onto the subtarget. No functional change. llvm-svn: 213982 2014-07-26 06:22:39 +08:00			`if (getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {`
			`InstrInfo.reset(new R600InstrInfo(*this));`
Reuse a bunch of cached subtargets and remove getSubtarget calls without a Function argument. llvm-svn: 227638 2015-01-31 07:24:40 +08:00			`TLInfo.reset(new R600TargetLowering(TM, *this));`
R600: Move AMDGPUInstrInfo from AMDGPUTargetMachine into AMDGPUSubtarget llvm-svn: 210869 2014-06-13 09:32:00 +08:00			`} else {`
			`InstrInfo.reset(new SIInstrInfo(*this));`
Reuse a bunch of cached subtargets and remove getSubtarget calls without a Function argument. llvm-svn: 227638 2015-01-31 07:24:40 +08:00			`TLInfo.reset(new SITargetLowering(TM, *this));`
R600: Move AMDGPUInstrInfo from AMDGPUTargetMachine into AMDGPUSubtarget llvm-svn: 210869 2014-06-13 09:32:00 +08:00			`}`
Add R600 backend A new backend supporting AMD GPUs: Radeon HD2XXX - HD7XXX llvm-svn: 169915 2012-12-12 05:25:42 +08:00			`}`

R600: Move trivial getters into header, use initializer list llvm-svn: 211917 2014-06-28 01:57:00 +08:00			`unsigned AMDGPUSubtarget::getStackEntrySize() const {`
R600: Refactor stack size calculation reviewed-by: Vincent Lejeune <vljn at ovi.com> llvm-svn: 199840 2014-01-23 05:55:43 +08:00			`assert(getGeneration() <= NORTHERN_ISLANDS);`
			`switch(getWavefrontSize()) {`
			`case 16:`
			`return 8;`
			`case 32:`
R600: Move trivial getters into header, use initializer list llvm-svn: 211917 2014-06-28 01:57:00 +08:00			`return hasCaymanISA() ? 4 : 8;`
R600: Refactor stack size calculation reviewed-by: Vincent Lejeune <vljn at ovi.com> llvm-svn: 199840 2014-01-23 05:55:43 +08:00			`case 64:`
			`return 4;`
			`default:`
			`llvm_unreachable("Illegal wavefront size.");`
			`}`
			`}`
R600/SI: Emit amd_kernel_code_t header for AMDGPU environment llvm-svn: 223160 2014-12-03 06:00:07 +08:00
			`unsigned AMDGPUSubtarget::getAmdKernelCodeChipID() const {`
			`switch(getGeneration()) {`
			`default: llvm_unreachable("ChipID unknown");`
			`case SEA_ISLANDS: return 12;`
			`}`
			`}`
R600/SI: Add subtarget feature to enable VGPR spilling for all shader types This is disabled by default, but can be enabled with the subtarget feature: 'vgpr-spilling' llvm-svn: 226597 2015-01-21 03:33:04 +08:00
AMDGPU/SI: Add hsa code object directives Reviewers: arsenm Subscribers: llvm-commits Differential Revision: http://reviews.llvm.org/D10757 llvm-svn: 240831 2015-06-27 05:15:07 +08:00			`AMDGPU::IsaVersion AMDGPUSubtarget::getIsaVersion() const {`
			`return AMDGPU::getIsaVersion(getFeatureBits());`
			`}`

R600/SI: Add subtarget feature to enable VGPR spilling for all shader types This is disabled by default, but can be enabled with the subtarget feature: 'vgpr-spilling' llvm-svn: 226597 2015-01-21 03:33:04 +08:00			`bool AMDGPUSubtarget::isVGPRSpillingEnabled(`
			`const SIMachineFunctionInfo *MFI) const {`
			`return MFI->getShaderType() == ShaderType::COMPUTE \|\| EnableVGPRSpilling;`
			`}`
R600/SI: Define a schedule model and enable the generic machine scheduler The schedule model is not complete yet, and could be improved. llvm-svn: 227461 2015-01-30 00:55:25 +08:00
			`void AMDGPUSubtarget::overrideSchedPolicy(MachineSchedPolicy &Policy,`
			`MachineInstr *begin,`
			`MachineInstr *end,`
			`unsigned NumRegionInstrs) const {`
			`if (getGeneration() >= SOUTHERN_ISLANDS) {`

			`// Track register pressure so the scheduler can try to decrease`
			`// pressure once register usage is above the threshold defined by`
			`// SIRegisterInfo::getRegPressureSetLimit()`
			`Policy.ShouldTrackPressure = true;`

			`// Enabling both top down and bottom up scheduling seems to give us less`
			`// register spills than just using one of these approaches on its own.`
			`Policy.OnlyTopDown = false;`
			`Policy.OnlyBottomUp = false;`
			`}`
			`}`
AMDGPU/SI: Add hsa code object directives Reviewers: arsenm Subscribers: llvm-commits Differential Revision: http://reviews.llvm.org/D10757 llvm-svn: 240831 2015-06-27 05:15:07 +08:00