forked from OSchip/llvm-project
101 lines
2.3 KiB
C++
101 lines
2.3 KiB
C++
//===-- AMDGPUMachineFunctionInfo.h -------------------------------*- C++ -*-=//
//
// The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
|
|
|
|
#ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPUMACHINEFUNCTION_H
|
|
#define LLVM_LIB_TARGET_AMDGPU_AMDGPUMACHINEFUNCTION_H
|
|
|
|
#include "llvm/ADT/DenseMap.h"
|
|
#include "llvm/CodeGen/MachineFunction.h"
|
|
|
|
namespace llvm {
|
|
|
|
class AMDGPUMachineFunction : public MachineFunctionInfo {
|
|
/// A map to keep track of local memory objects and their offsets within the
|
|
/// local memory space.
|
|
SmallDenseMap<const GlobalValue *, unsigned, 4> LocalMemoryObjects;
|
|
|
|
protected:
|
|
uint64_t KernArgSize;
|
|
unsigned MaxKernArgAlign;
|
|
|
|
/// Number of bytes in the LDS that are being used.
|
|
unsigned LDSSize;
|
|
|
|
// FIXME: This should probably be removed.
|
|
/// Start of implicit kernel args
|
|
unsigned ABIArgOffset;
|
|
|
|
// Kernels + shaders. i.e. functions called by the driver and not called
|
|
// by other functions.
|
|
bool IsEntryFunction;
|
|
|
|
bool NoSignedZerosFPMath;
|
|
|
|
// Function may be memory bound.
|
|
bool MemoryBound;
|
|
|
|
// Kernel may need limited waves per EU for better performance.
|
|
bool WaveLimiter;
|
|
|
|
public:
|
|
AMDGPUMachineFunction(const MachineFunction &MF);
|
|
|
|
uint64_t allocateKernArg(uint64_t Size, unsigned Align) {
|
|
assert(isPowerOf2_32(Align));
|
|
KernArgSize = alignTo(KernArgSize, Align);
|
|
|
|
uint64_t Result = KernArgSize;
|
|
KernArgSize += Size;
|
|
|
|
MaxKernArgAlign = std::max(Align, MaxKernArgAlign);
|
|
return Result;
|
|
}
|
|
|
|
uint64_t getKernArgSize() const {
|
|
return KernArgSize;
|
|
}
|
|
|
|
unsigned getMaxKernArgAlign() const {
|
|
return MaxKernArgAlign;
|
|
}
|
|
|
|
void setABIArgOffset(unsigned NewOffset) {
|
|
ABIArgOffset = NewOffset;
|
|
}
|
|
|
|
unsigned getABIArgOffset() const {
|
|
return ABIArgOffset;
|
|
}
|
|
|
|
unsigned getLDSSize() const {
|
|
return LDSSize;
|
|
}
|
|
|
|
bool isEntryFunction() const {
|
|
return IsEntryFunction;
|
|
}
|
|
|
|
bool hasNoSignedZerosFPMath() const {
|
|
return NoSignedZerosFPMath;
|
|
}
|
|
|
|
bool isMemoryBound() const {
|
|
return MemoryBound;
|
|
}
|
|
|
|
bool needsWaveLimiter() const {
|
|
return WaveLimiter;
|
|
}
|
|
|
|
unsigned allocateLDSGlobal(const DataLayout &DL, const GlobalValue &GV);
|
|
};
|
|
|
|
}
|
|
#endif
|