llvm-6502/lib/Target/R600/AMDGPUSubtarget.cpp

//===-- AMDGPUSubtarget.cpp - AMDGPU Subtarget Information ----------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
/// \file
/// \brief Implements the AMDGPU specific subclass of TargetSubtarget.
//
//===----------------------------------------------------------------------===//

#include "AMDGPUSubtarget.h"
#include "R600ISelLowering.h"
#include "R600InstrInfo.h"
#include "R600MachineScheduler.h"
#include "SIISelLowering.h"
#include "SIInstrInfo.h"
#include "SIMachineFunctionInfo.h"
#include "llvm/ADT/SmallString.h"
#include "llvm/CodeGen/MachineScheduler.h"

using namespace llvm;

#define DEBUG_TYPE "amdgpu-subtarget"

#define GET_SUBTARGETINFO_ENUM
#define GET_SUBTARGETINFO_TARGET_DESC
#define GET_SUBTARGETINFO_CTOR
#include "AMDGPUGenSubtargetInfo.inc"

/// \brief Assemble the effective feature string and parse it for this
/// subtarget.
///
/// The prefix "+promote-alloca,+fp64-denormals," is placed in front of \p FS
/// before the combined string is passed to ParseSubtargetFeatures(). If \p GPU
/// is empty and \p TT names the amdgcn architecture, "SI" is used as the GPU
/// name. For generations up to and including NORTHERN_ISLANDS both denormal
/// flags are cleared after parsing.
///
/// \returns a reference to this subtarget.
AMDGPUSubtarget &
AMDGPUSubtarget::initializeSubtargetDependencies(StringRef TT, StringRef GPU,
                                                 StringRef FS) {
  // Defaults come first and the user-specified features follow them.
  //
  // FP64 denormals are wanted on by default for SI+. FP32 denormals may be
  // enabled too, but they are left off by default: some instructions do not
  // respect them and they run at the double precision rate.
  //
  // These need to stay switchable, yet expressing this as a subtarget feature
  // for SI has the unhelpful behavior of unsetting everything else whenever
  // it is disabled.
  SmallString<256> Features("+promote-alloca,+fp64-denormals,");
  Features += FS;

  // No GPU name given: fall back to "SI" on the amdgcn architecture.
  if (GPU.empty()) {
    if (Triple(TT).getArch() == Triple::amdgcn)
      GPU = "SI";
  }

  ParseSubtargetFeatures(GPU, Features);

  if (getGeneration() > AMDGPUSubtarget::NORTHERN_ISLANDS)
    return *this;

  // FIXME: Evergreen probably has no useful support for denormals, but this
  // should be checked. Should a warning be issued somewhere if someone tries
  // to enable these?
  FP64Denormals = false;
  FP32Denormals = false;
  return *this;
}

/// \brief Construct the subtarget for the given triple, GPU name and feature
/// string.
///
/// Every member is first given a fixed default in the initializer list, then
/// initializeSubtargetDependencies() is run with \p TT, \p GPU and \p FS.
/// Finally the instruction info and target lowering objects are created:
/// the R600 variants for generations up to and including NORTHERN_ISLANDS,
/// the SI variants for everything newer.
AMDGPUSubtarget::AMDGPUSubtarget(StringRef TT, StringRef GPU, StringRef FS,
                                 TargetMachine &TM)
    : AMDGPUGenSubtargetInfo(TT, GPU, FS),
      DevName(GPU),
      Is64bit(false),
      DumpCode(false),
      R600ALUInst(false),
      HasVertexCache(false),
      TexVTXClauseSize(0),
      Gen(AMDGPUSubtarget::R600),
      FP64(false),
      FP64Denormals(false),
      FP32Denormals(false),
      FastFMAF32(false),
      CaymanISA(false),
      FlatAddressSpace(false),
      EnableIRStructurizer(true),
      EnablePromoteAlloca(false),
      EnableIfCvt(true),
      EnableLoadStoreOpt(false),
      WavefrontSize(0),
      CFALUBug(false),
      LocalMemorySize(0),
      EnableVGPRSpilling(false),
      FrameLowering(TargetFrameLowering::StackGrowsUp,
                    64 * 16, // Maximum stack alignment (long16)
                    0),
      InstrItins(getInstrItineraryForCPU(GPU)),
      TargetTriple(TT) {

  // Gen starts out as R600 above; the feature parsing performed here is
  // presumably what moves it to the real generation, so this has to run
  // before the generation is inspected below.
  initializeSubtargetDependencies(TT, GPU, FS);

  // Anything newer than Northern Islands gets the SI implementations.
  if (getGeneration() > AMDGPUSubtarget::NORTHERN_ISLANDS) {
    InstrInfo.reset(new SIInstrInfo(*this));
    TLInfo.reset(new SITargetLowering(TM, *this));
    return;
  }

  // Northern Islands and older use the R600 implementations.
  InstrInfo.reset(new R600InstrInfo(*this));
  TLInfo.reset(new R600TargetLowering(TM, *this));
}

/// \brief Map the wavefront size to the stack entry size.
///
/// Asserts that the generation is NORTHERN_ISLANDS or older. A wavefront size
/// of 16 yields 8, 64 yields 4, and 32 yields 4 when hasCaymanISA() is true
/// and 8 otherwise. Any other wavefront size is treated as unreachable.
unsigned AMDGPUSubtarget::getStackEntrySize() const {
  assert(getGeneration() <= NORTHERN_ISLANDS);

  const auto WaveSize = getWavefrontSize();

  if (WaveSize == 16)
    return 8;

  if (WaveSize == 32) {
    // Only this wavefront size depends on the Cayman ISA flag.
    if (hasCaymanISA())
      return 4;
    return 8;
  }

  if (WaveSize == 64)
    return 4;

  llvm_unreachable("Illegal wavefront size.");
}

/// \brief Return the chip ID for the current generation.
///
/// Only SEA_ISLANDS is handled, for which 12 is returned; every other
/// generation is treated as unreachable.
unsigned AMDGPUSubtarget::getAmdKernelCodeChipID() const {
  if (getGeneration() == SEA_ISLANDS)
    return 12;

  llvm_unreachable("ChipID unknown");
}

/// \brief Report whether VGPR spilling is enabled for the given function.
///
/// \param MFI function info whose shader type is queried; it is dereferenced
/// unconditionally.
/// \returns true when the shader type is ShaderType::COMPUTE, otherwise the
/// value of the EnableVGPRSpilling flag.
bool AMDGPUSubtarget::isVGPRSpillingEnabled(
                                       const SIMachineFunctionInfo *MFI) const {
  // The shader type is checked first, exactly as in a short-circuit "||".
  if (MFI->getShaderType() == ShaderType::COMPUTE)
    return true;

  return EnableVGPRSpilling;
}

/// \brief Adjust the machine scheduling policy for this subtarget.
///
/// For generations older than SOUTHERN_ISLANDS \p Policy is left untouched.
/// Otherwise register pressure tracking is switched on and both the
/// top-down-only and bottom-up-only restrictions are switched off.
/// \p begin, \p end and \p NumRegionInstrs are not read by this function.
void AMDGPUSubtarget::overrideSchedPolicy(MachineSchedPolicy &Policy,
                                          MachineInstr *begin,
                                          MachineInstr *end,
                                          unsigned NumRegionInstrs) const {
  if (getGeneration() < SOUTHERN_ISLANDS)
    return;

  // With pressure tracking on, the scheduler can try to reduce pressure once
  // register usage exceeds the threshold defined by
  // SIRegisterInfo::getRegPressureSetLimit()
  Policy.ShouldTrackPressure = true;

  // Allowing both top down and bottom up scheduling seems to produce fewer
  // register spills than restricting the scheduler to a single direction.
  Policy.OnlyTopDown = false;
  Policy.OnlyBottomUp = false;
}
Add R600 backend A new backend supporting AMD GPUs: Radeon HD2XXX - HD7XXX git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@169915 91177308-0d34-0410-b5e6-96231b3b80d8 2012-12-11 21:25:42 +00:00			`//===-- AMDGPUSubtarget.cpp - AMDGPU Subtarget Information ----------------===//`
			`//`
			`// The LLVM Compiler Infrastructure`
			`//`
			`// This file is distributed under the University of Illinois Open Source`
			`// License. See LICENSE.TXT for details.`
			`//`
			`//===----------------------------------------------------------------------===//`
			`//`
			`/// \file`
			`/// \brief Implements the AMDGPU specific subclass of TargetSubtarget.`
			`//`
			`//===----------------------------------------------------------------------===//`

			`#include "AMDGPUSubtarget.h"`
Move R600 subtarget dependent variables onto the subtarget. No functional change. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@213982 91177308-0d34-0410-b5e6-96231b3b80d8 2014-07-25 22:22:39 +00:00			`#include "R600ISelLowering.h"`
R600: Move AMDGPUInstrInfo from AMDGPUTargetMachine into AMDGPUSubtarget git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@210869 91177308-0d34-0410-b5e6-96231b3b80d8 2014-06-13 01:32:00 +00:00			`#include "R600InstrInfo.h"`
Move R600 subtarget dependent variables onto the subtarget. No functional change. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@213982 91177308-0d34-0410-b5e6-96231b3b80d8 2014-07-25 22:22:39 +00:00			`#include "R600MachineScheduler.h"`
			`#include "SIISelLowering.h"`
[cleanup] Re-sort all the #include lines in LLVM using utils/sort_includes.py. I clearly haven't done this in a while, so more changed than usual. This even uncovered a missing include from the InstrProf library that I've added. No functionality changed here, just mechanical cleanup of the include order. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@225974 91177308-0d34-0410-b5e6-96231b3b80d8 2015-01-14 11:23:27 +00:00			`#include "SIInstrInfo.h"`
R600/SI: Add subtarget feature to enable VGPR spilling for all shader types This is disabled by default, but can be enabled with the subtarget feature: 'vgpr-spilling' git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@226597 91177308-0d34-0410-b5e6-96231b3b80d8 2015-01-20 19:33:04 +00:00			`#include "SIMachineFunctionInfo.h"`
R600: Add option to disable promote alloca This can make writing some tests harder, so add a flag to disable it. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@212893 91177308-0d34-0410-b5e6-96231b3b80d8 2014-07-13 02:08:26 +00:00			`#include "llvm/ADT/SmallString.h"`
R600/SI: Define a schedule model and enable the generic machine scheduler The schedule model is not complete yet, and could be improved. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@227461 91177308-0d34-0410-b5e6-96231b3b80d8 2015-01-29 16:55:25 +00:00			`#include "llvm/CodeGen/MachineScheduler.h"`
R600: Add option to disable promote alloca This can make writing some tests harder, so add a flag to disable it. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@212893 91177308-0d34-0410-b5e6-96231b3b80d8 2014-07-13 02:08:26 +00:00
Add R600 backend A new backend supporting AMD GPUs: Radeon HD2XXX - HD7XXX git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@169915 91177308-0d34-0410-b5e6-96231b3b80d8 2012-12-11 21:25:42 +00:00			`using namespace llvm;`

[Modules] Make Support/Debug.h modular. This requires it to not change behavior based on other files defining DEBUG_TYPE, which means it cannot define DEBUG_TYPE at all. This is actually better IMO as it forces folks to define relevant DEBUG_TYPEs for their files. However, it requires all files that currently use DEBUG(...) to define a DEBUG_TYPE if they don't already. I've updated all such files in LLVM and will do the same for other upstream projects. This still leaves one important change in how LLVM uses the DEBUG_TYPE macro going forward: we need to only define the macro after header files have been #include-ed. Previously, this wasn't possible because Debug.h required the macro to be pre-defined. This commit removes that. By defining DEBUG_TYPE after the includes two things are fixed: - Header files that need to provide a DEBUG_TYPE for some inline code can do so by defining the macro before their inline code and undef-ing it afterward so the macro does not escape. - We no longer have rampant ODR violations due to including headers with different DEBUG_TYPE definitions. This may be mostly an academic violation today, but with modules these types of violations are easy to check for and potentially very relevant. Where necessary to suppor headers with DEBUG_TYPE, I have moved the definitions below the includes in this commit. I plan to move the rest of the DEBUG_TYPE macros in LLVM in subsequent commits; this one is big enough. The comments in Debug.h, which were hilariously out of date already, have been updated to reflect the recommended practice going forward. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@206822 91177308-0d34-0410-b5e6-96231b3b80d8 2014-04-21 22:55:11 +00:00			`#define DEBUG_TYPE "amdgpu-subtarget"`

Add R600 backend A new backend supporting AMD GPUs: Radeon HD2XXX - HD7XXX git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@169915 91177308-0d34-0410-b5e6-96231b3b80d8 2012-12-11 21:25:42 +00:00			`#define GET_SUBTARGETINFO_ENUM`
			`#define GET_SUBTARGETINFO_TARGET_DESC`
			`#define GET_SUBTARGETINFO_CTOR`
			`#include "AMDGPUGenSubtargetInfo.inc"`

Move R600 subtarget dependent variables onto the subtarget. No functional change. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@213982 91177308-0d34-0410-b5e6-96231b3b80d8 2014-07-25 22:22:39 +00:00			`AMDGPUSubtarget &`
80-column fixups. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@229789 91177308-0d34-0410-b5e6-96231b3b80d8 2015-02-19 00:15:33 +00:00			`AMDGPUSubtarget::initializeSubtargetDependencies(StringRef TT, StringRef GPU,`
			`StringRef FS) {`
Move R600 subtarget dependent variables onto the subtarget. No functional change. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@213982 91177308-0d34-0410-b5e6-96231b3b80d8 2014-07-25 22:22:39 +00:00			`// Determine default and user-specified characteristics`
R600: Add denormal handling subtarget features. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@213018 91177308-0d34-0410-b5e6-96231b3b80d8 2014-07-14 23:40:49 +00:00			`// On SI+, we want FP64 denormals to be on by default. FP32 denormals can be`
			`// enabled, but some instructions do not respect them and they run at the`
			`// double precision rate, so don't enable by default.`
			`//`
			`// We want to be able to turn these off, but making this a subtarget feature`
			`// for SI has the unhelpful behavior that it unsets everything else if you`
			`// disable it.`
R600: Add option to disable promote alloca This can make writing some tests harder, so add a flag to disable it. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@212893 91177308-0d34-0410-b5e6-96231b3b80d8 2014-07-13 02:08:26 +00:00
R600: Add denormal handling subtarget features. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@213018 91177308-0d34-0410-b5e6-96231b3b80d8 2014-07-14 23:40:49 +00:00			`SmallString<256> FullFS("+promote-alloca,+fp64-denormals,");`
R600: Add option to disable promote alloca This can make writing some tests harder, so add a flag to disable it. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@212893 91177308-0d34-0410-b5e6-96231b3b80d8 2014-07-13 02:08:26 +00:00			`FullFS += FS;`

R600: Use a Southern Islands GPU as the default for the amdgcn target git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@227314 91177308-0d34-0410-b5e6-96231b3b80d8 2015-01-28 15:38:42 +00:00			`if (GPU == "" && Triple(TT).getArch() == Triple::amdgcn)`
			`GPU = "SI";`

R600: Add option to disable promote alloca This can make writing some tests harder, so add a flag to disable it. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@212893 91177308-0d34-0410-b5e6-96231b3b80d8 2014-07-13 02:08:26 +00:00			`ParseSubtargetFeatures(GPU, FullFS);`
R600: Move AMDGPUInstrInfo from AMDGPUTargetMachine into AMDGPUSubtarget git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@210869 91177308-0d34-0410-b5e6-96231b3b80d8 2014-06-13 01:32:00 +00:00
Move R600 subtarget dependent variables onto the subtarget. No functional change. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@213982 91177308-0d34-0410-b5e6-96231b3b80d8 2014-07-25 22:22:39 +00:00			`// FIXME: I don't think think Evergreen has any useful support for`
			`// denormals, but should be checked. Should we issue a warning somewhere`
			`// if someone tries to enable these?`
R600: Move AMDGPUInstrInfo from AMDGPUTargetMachine into AMDGPUSubtarget git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@210869 91177308-0d34-0410-b5e6-96231b3b80d8 2014-06-13 01:32:00 +00:00			`if (getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {`
R600: Add denormal handling subtarget features. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@213018 91177308-0d34-0410-b5e6-96231b3b80d8 2014-07-14 23:40:49 +00:00			`FP32Denormals = false;`
			`FP64Denormals = false;`
Move R600 subtarget dependent variables onto the subtarget. No functional change. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@213982 91177308-0d34-0410-b5e6-96231b3b80d8 2014-07-25 22:22:39 +00:00			`}`
			`return *this;`
			`}`

			`AMDGPUSubtarget::AMDGPUSubtarget(StringRef TT, StringRef GPU, StringRef FS,`
			`TargetMachine &TM)`
			`: AMDGPUGenSubtargetInfo(TT, GPU, FS), DevName(GPU), Is64bit(false),`
			`DumpCode(false), R600ALUInst(false), HasVertexCache(false),`
			`TexVTXClauseSize(0), Gen(AMDGPUSubtarget::R600), FP64(false),`
80-column fixups. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@229789 91177308-0d34-0410-b5e6-96231b3b80d8 2015-02-19 00:15:33 +00:00			`FP64Denormals(false), FP32Denormals(false), FastFMAF32(false),`
			`CaymanISA(false), FlatAddressSpace(false), EnableIRStructurizer(true),`
			`EnablePromoteAlloca(false), EnableIfCvt(true), EnableLoadStoreOpt(false),`
			`WavefrontSize(0), CFALUBug(false), LocalMemorySize(0),`
R600/SI: Add subtarget feature to enable VGPR spilling for all shader types This is disabled by default, but can be enabled with the subtarget feature: 'vgpr-spilling' git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@226597 91177308-0d34-0410-b5e6-96231b3b80d8 2015-01-20 19:33:04 +00:00			`EnableVGPRSpilling(false),`
Move R600 subtarget dependent variables onto the subtarget. No functional change. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@213982 91177308-0d34-0410-b5e6-96231b3b80d8 2014-07-25 22:22:39 +00:00			`FrameLowering(TargetFrameLowering::StackGrowsUp,`
			`64 * 16, // Maximum stack alignment (long16)`
			`0),`
80-column fixups. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@229789 91177308-0d34-0410-b5e6-96231b3b80d8 2015-02-19 00:15:33 +00:00			`InstrItins(getInstrItineraryForCPU(GPU)), TargetTriple(TT) {`
R600: Move DataLayout to AMDGPUTargetMachine This is a follow up to r227113. It is now required to use the amdgcn target for SI and newer GPUs. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@227316 91177308-0d34-0410-b5e6-96231b3b80d8 2015-01-28 16:04:26 +00:00
			`initializeSubtargetDependencies(TT, GPU, FS);`

Move R600 subtarget dependent variables onto the subtarget. No functional change. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@213982 91177308-0d34-0410-b5e6-96231b3b80d8 2014-07-25 22:22:39 +00:00			`if (getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {`
			`InstrInfo.reset(new R600InstrInfo(*this));`
Reuse a bunch of cached subtargets and remove getSubtarget calls without a Function argument. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@227638 91177308-0d34-0410-b5e6-96231b3b80d8 2015-01-30 23:24:40 +00:00			`TLInfo.reset(new R600TargetLowering(TM, *this));`
R600: Move AMDGPUInstrInfo from AMDGPUTargetMachine into AMDGPUSubtarget git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@210869 91177308-0d34-0410-b5e6-96231b3b80d8 2014-06-13 01:32:00 +00:00			`} else {`
			`InstrInfo.reset(new SIInstrInfo(*this));`
Reuse a bunch of cached subtargets and remove getSubtarget calls without a Function argument. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@227638 91177308-0d34-0410-b5e6-96231b3b80d8 2015-01-30 23:24:40 +00:00			`TLInfo.reset(new SITargetLowering(TM, *this));`
R600: Move AMDGPUInstrInfo from AMDGPUTargetMachine into AMDGPUSubtarget git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@210869 91177308-0d34-0410-b5e6-96231b3b80d8 2014-06-13 01:32:00 +00:00			`}`
Add R600 backend A new backend supporting AMD GPUs: Radeon HD2XXX - HD7XXX git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@169915 91177308-0d34-0410-b5e6-96231b3b80d8 2012-12-11 21:25:42 +00:00			`}`

R600: Move trivial getters into header, use initializer list git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@211917 91177308-0d34-0410-b5e6-96231b3b80d8 2014-06-27 17:57:00 +00:00			`unsigned AMDGPUSubtarget::getStackEntrySize() const {`
R600: Refactor stack size calculation reviewed-by: Vincent Lejeune <vljn at ovi.com> git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@199840 91177308-0d34-0410-b5e6-96231b3b80d8 2014-01-22 21:55:43 +00:00			`assert(getGeneration() <= NORTHERN_ISLANDS);`
			`switch(getWavefrontSize()) {`
			`case 16:`
			`return 8;`
			`case 32:`
R600: Move trivial getters into header, use initializer list git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@211917 91177308-0d34-0410-b5e6-96231b3b80d8 2014-06-27 17:57:00 +00:00			`return hasCaymanISA() ? 4 : 8;`
R600: Refactor stack size calculation reviewed-by: Vincent Lejeune <vljn at ovi.com> git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@199840 91177308-0d34-0410-b5e6-96231b3b80d8 2014-01-22 21:55:43 +00:00			`case 64:`
			`return 4;`
			`default:`
			`llvm_unreachable("Illegal wavefront size.");`
			`}`
			`}`
R600/SI: Emit amd_kernel_code_t header for AMDGPU environment git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@223160 91177308-0d34-0410-b5e6-96231b3b80d8 2014-12-02 22:00:07 +00:00
			`unsigned AMDGPUSubtarget::getAmdKernelCodeChipID() const {`
			`switch(getGeneration()) {`
			`default: llvm_unreachable("ChipID unknown");`
			`case SEA_ISLANDS: return 12;`
			`}`
			`}`
R600/SI: Add subtarget feature to enable VGPR spilling for all shader types This is disabled by default, but can be enabled with the subtarget feature: 'vgpr-spilling' git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@226597 91177308-0d34-0410-b5e6-96231b3b80d8 2015-01-20 19:33:04 +00:00
			`bool AMDGPUSubtarget::isVGPRSpillingEnabled(`
			`const SIMachineFunctionInfo *MFI) const {`
			`return MFI->getShaderType() == ShaderType::COMPUTE \|\| EnableVGPRSpilling;`
			`}`
R600/SI: Define a schedule model and enable the generic machine scheduler The schedule model is not complete yet, and could be improved. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@227461 91177308-0d34-0410-b5e6-96231b3b80d8 2015-01-29 16:55:25 +00:00
			`void AMDGPUSubtarget::overrideSchedPolicy(MachineSchedPolicy &Policy,`
			`MachineInstr *begin,`
			`MachineInstr *end,`
			`unsigned NumRegionInstrs) const {`
			`if (getGeneration() >= SOUTHERN_ISLANDS) {`

			`// Track register pressure so the scheduler can try to decrease`
			`// pressure once register usage is above the threshold defined by`
			`// SIRegisterInfo::getRegPressureSetLimit()`
			`Policy.ShouldTrackPressure = true;`

			`// Enabling both top down and bottom up scheduling seems to give us less`
			`// register spills than just using one of these approaches on its own.`
			`Policy.OnlyTopDown = false;`
			`Policy.OnlyBottomUp = false;`
			`}`
			`}`