2016-12-22 03:06:24 +08:00
|
|
|
//===-- llvm/lib/Target/AMDGPU/AMDGPUCallLowering.cpp - Call lowering -----===//
|
2016-04-15 03:09:28 +08:00
|
|
|
//
|
2019-01-19 16:50:56 +08:00
|
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
2016-04-15 03:09:28 +08:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
///
|
|
|
|
/// \file
|
|
|
|
/// This file implements the lowering of LLVM calls to machine code calls for
|
|
|
|
/// GlobalISel.
|
|
|
|
///
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#include "AMDGPUCallLowering.h"
|
Re-commit AMDGPU/GlobalISel: Add support for simple shaders
Fix build when global-isel is disabled and fix a warning.
Summary: We can select constant/global G_LOAD, global G_STORE, and G_GEP.
Reviewers: qcolombet, MatzeB, t.p.northover, ab, arsenm
Subscribers: mehdi_amini, vkalintiris, kzhuravl, wdng, nhaehnle, mgorny, yaxunl, tony-tye, modocache, llvm-commits, dberris
Differential Revision: https://reviews.llvm.org/D26730
llvm-svn: 293551
2017-01-31 05:56:46 +08:00
|
|
|
#include "AMDGPU.h"
|
2016-04-15 03:09:28 +08:00
|
|
|
#include "AMDGPUISelLowering.h"
|
Re-commit AMDGPU/GlobalISel: Add support for simple shaders
Fix build when global-isel is disabled and fix a warning.
Summary: We can select constant/global G_LOAD, global G_STORE, and G_GEP.
Reviewers: qcolombet, MatzeB, t.p.northover, ab, arsenm
Subscribers: mehdi_amini, vkalintiris, kzhuravl, wdng, nhaehnle, mgorny, yaxunl, tony-tye, modocache, llvm-commits, dberris
Differential Revision: https://reviews.llvm.org/D26730
llvm-svn: 293551
2017-01-31 05:56:46 +08:00
|
|
|
#include "AMDGPUSubtarget.h"
|
|
|
|
#include "SIISelLowering.h"
|
|
|
|
#include "SIMachineFunctionInfo.h"
|
2017-06-06 19:49:48 +08:00
|
|
|
#include "SIRegisterInfo.h"
|
AMDGPU: Remove #include "MCTargetDesc/AMDGPUMCTargetDesc.h" from common headers
Summary:
MCTargetDesc/AMDGPUMCTargetDesc.h contains enums for all the instuction
and register defintions, which are huge so we only want to include
them where needed.
This will also make it easier if we want to split the R600 and GCN
definitions into separate tablegenerated files.
I was unable to remove AMDGPUMCTargetDesc.h from SIMachineFunctionInfo.h
because it uses some enums from the header to initialize default values
for the SIMachineFunction class, so I ended up having to remove includes of
SIMachineFunctionInfo.h from headers too.
Reviewers: arsenm, nhaehnle
Reviewed By: nhaehnle
Subscribers: MatzeB, kzhuravl, wdng, yaxunl, dstuttard, tpr, t-tye, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D46272
llvm-svn: 332930
2018-05-22 10:03:23 +08:00
|
|
|
#include "MCTargetDesc/AMDGPUMCTargetDesc.h"
|
AMDGPU/GlobalISel: Implement call lowering for shaders returning values
Reviewers: arsenm, nhaehnle
Subscribers: kzhuravl, jvesely, wdng, yaxunl, rovka, kristof.beyls, dstuttard, tpr, t-tye, volkan, llvm-commits
Differential Revision: https://reviews.llvm.org/D57166
llvm-svn: 357964
2019-04-09 10:26:03 +08:00
|
|
|
#include "llvm/CodeGen/Analysis.h"
|
Re-commit AMDGPU/GlobalISel: Add support for simple shaders
Fix build when global-isel is disabled and fix a warning.
Summary: We can select constant/global G_LOAD, global G_STORE, and G_GEP.
Reviewers: qcolombet, MatzeB, t.p.northover, ab, arsenm
Subscribers: mehdi_amini, vkalintiris, kzhuravl, wdng, nhaehnle, mgorny, yaxunl, tony-tye, modocache, llvm-commits, dberris
Differential Revision: https://reviews.llvm.org/D26730
llvm-svn: 293551
2017-01-31 05:56:46 +08:00
|
|
|
#include "llvm/CodeGen/CallingConvLower.h"
|
2016-04-15 03:09:28 +08:00
|
|
|
#include "llvm/CodeGen/GlobalISel/MachineIRBuilder.h"
|
|
|
|
#include "llvm/CodeGen/MachineInstrBuilder.h"
|
AMDGPU/GlobalISel: Implement call lowering for shaders returning values
Reviewers: arsenm, nhaehnle
Subscribers: kzhuravl, jvesely, wdng, yaxunl, rovka, kristof.beyls, dstuttard, tpr, t-tye, volkan, llvm-commits
Differential Revision: https://reviews.llvm.org/D57166
llvm-svn: 357964
2019-04-09 10:26:03 +08:00
|
|
|
#include "llvm/Support/LowLevelTypeImpl.h"
|
2016-04-15 03:09:28 +08:00
|
|
|
|
|
|
|
using namespace llvm;
|
|
|
|
|
AMDGPU/GlobalISel: Implement call lowering for shaders returning values
Reviewers: arsenm, nhaehnle
Subscribers: kzhuravl, jvesely, wdng, yaxunl, rovka, kristof.beyls, dstuttard, tpr, t-tye, volkan, llvm-commits
Differential Revision: https://reviews.llvm.org/D57166
llvm-svn: 357964
2019-04-09 10:26:03 +08:00
|
|
|
namespace {
|
|
|
|
|
|
|
|
struct OutgoingArgHandler : public CallLowering::ValueHandler {
|
|
|
|
OutgoingArgHandler(MachineIRBuilder &MIRBuilder, MachineRegisterInfo &MRI,
|
|
|
|
MachineInstrBuilder MIB, CCAssignFn *AssignFn)
|
|
|
|
: ValueHandler(MIRBuilder, MRI, AssignFn), MIB(MIB) {}
|
|
|
|
|
|
|
|
MachineInstrBuilder MIB;
|
|
|
|
|
2019-06-25 00:16:12 +08:00
|
|
|
Register getStackAddress(uint64_t Size, int64_t Offset,
|
AMDGPU/GlobalISel: Implement call lowering for shaders returning values
Reviewers: arsenm, nhaehnle
Subscribers: kzhuravl, jvesely, wdng, yaxunl, rovka, kristof.beyls, dstuttard, tpr, t-tye, volkan, llvm-commits
Differential Revision: https://reviews.llvm.org/D57166
llvm-svn: 357964
2019-04-09 10:26:03 +08:00
|
|
|
MachinePointerInfo &MPO) override {
|
|
|
|
llvm_unreachable("not implemented");
|
|
|
|
}
|
|
|
|
|
2019-06-25 00:16:12 +08:00
|
|
|
void assignValueToAddress(Register ValVReg, Register Addr, uint64_t Size,
|
AMDGPU/GlobalISel: Implement call lowering for shaders returning values
Reviewers: arsenm, nhaehnle
Subscribers: kzhuravl, jvesely, wdng, yaxunl, rovka, kristof.beyls, dstuttard, tpr, t-tye, volkan, llvm-commits
Differential Revision: https://reviews.llvm.org/D57166
llvm-svn: 357964
2019-04-09 10:26:03 +08:00
|
|
|
MachinePointerInfo &MPO, CCValAssign &VA) override {
|
|
|
|
llvm_unreachable("not implemented");
|
|
|
|
}
|
|
|
|
|
2019-06-25 00:16:12 +08:00
|
|
|
void assignValueToReg(Register ValVReg, Register PhysReg,
|
AMDGPU/GlobalISel: Implement call lowering for shaders returning values
Reviewers: arsenm, nhaehnle
Subscribers: kzhuravl, jvesely, wdng, yaxunl, rovka, kristof.beyls, dstuttard, tpr, t-tye, volkan, llvm-commits
Differential Revision: https://reviews.llvm.org/D57166
llvm-svn: 357964
2019-04-09 10:26:03 +08:00
|
|
|
CCValAssign &VA) override {
|
|
|
|
MIB.addUse(PhysReg);
|
|
|
|
MIRBuilder.buildCopy(PhysReg, ValVReg);
|
|
|
|
}
|
|
|
|
|
|
|
|
bool assignArg(unsigned ValNo, MVT ValVT, MVT LocVT,
|
|
|
|
CCValAssign::LocInfo LocInfo,
|
|
|
|
const CallLowering::ArgInfo &Info,
|
|
|
|
CCState &State) override {
|
|
|
|
return AssignFn(ValNo, ValVT, LocVT, LocInfo, Info.Flags, State);
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2019-07-19 22:15:18 +08:00
|
|
|
struct IncomingArgHandler : public CallLowering::ValueHandler {
|
|
|
|
uint64_t StackUsed = 0;
|
|
|
|
|
|
|
|
IncomingArgHandler(MachineIRBuilder &MIRBuilder, MachineRegisterInfo &MRI,
|
|
|
|
CCAssignFn *AssignFn)
|
|
|
|
: ValueHandler(MIRBuilder, MRI, AssignFn) {}
|
|
|
|
|
|
|
|
Register getStackAddress(uint64_t Size, int64_t Offset,
|
|
|
|
MachinePointerInfo &MPO) override {
|
|
|
|
auto &MFI = MIRBuilder.getMF().getFrameInfo();
|
|
|
|
int FI = MFI.CreateFixedObject(Size, Offset, true);
|
|
|
|
MPO = MachinePointerInfo::getFixedStack(MIRBuilder.getMF(), FI);
|
|
|
|
Register AddrReg = MRI.createGenericVirtualRegister(
|
|
|
|
LLT::pointer(AMDGPUAS::PRIVATE_ADDRESS, 32));
|
|
|
|
MIRBuilder.buildFrameIndex(AddrReg, FI);
|
|
|
|
StackUsed = std::max(StackUsed, Size + Offset);
|
|
|
|
return AddrReg;
|
|
|
|
}
|
|
|
|
|
|
|
|
void assignValueToReg(Register ValVReg, Register PhysReg,
|
|
|
|
CCValAssign &VA) override {
|
|
|
|
markPhysRegUsed(PhysReg);
|
|
|
|
|
|
|
|
if (VA.getLocVT().getSizeInBits() < 32) {
|
|
|
|
// 16-bit types are reported as legal for 32-bit registers. We need to do
|
|
|
|
// a 32-bit copy, and truncate to avoid the verifier complaining about it.
|
|
|
|
auto Copy = MIRBuilder.buildCopy(LLT::scalar(32), PhysReg);
|
|
|
|
MIRBuilder.buildTrunc(ValVReg, Copy);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
switch (VA.getLocInfo()) {
|
|
|
|
case CCValAssign::LocInfo::SExt:
|
|
|
|
case CCValAssign::LocInfo::ZExt:
|
|
|
|
case CCValAssign::LocInfo::AExt: {
|
|
|
|
auto Copy = MIRBuilder.buildCopy(LLT{VA.getLocVT()}, PhysReg);
|
|
|
|
MIRBuilder.buildTrunc(ValVReg, Copy);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default:
|
|
|
|
MIRBuilder.buildCopy(ValVReg, PhysReg);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void assignValueToAddress(Register ValVReg, Register Addr, uint64_t Size,
|
|
|
|
MachinePointerInfo &MPO, CCValAssign &VA) override {
|
|
|
|
// FIXME: Get alignment
|
|
|
|
auto MMO = MIRBuilder.getMF().getMachineMemOperand(
|
|
|
|
MPO, MachineMemOperand::MOLoad | MachineMemOperand::MOInvariant, Size, 1);
|
|
|
|
MIRBuilder.buildLoad(ValVReg, Addr, *MMO);
|
|
|
|
}
|
|
|
|
|
|
|
|
/// How the physical register gets marked varies between formal
|
|
|
|
/// parameters (it's a basic-block live-in), and a call instruction
|
|
|
|
/// (it's an implicit-def of the BL).
|
|
|
|
virtual void markPhysRegUsed(unsigned PhysReg) = 0;
|
|
|
|
|
|
|
|
// FIXME: What is the point of this being a callback?
|
|
|
|
bool isArgumentHandler() const override { return true; }
|
|
|
|
};
|
|
|
|
|
|
|
|
struct FormalArgHandler : public IncomingArgHandler {
|
|
|
|
FormalArgHandler(MachineIRBuilder &MIRBuilder, MachineRegisterInfo &MRI,
|
|
|
|
CCAssignFn *AssignFn)
|
|
|
|
: IncomingArgHandler(MIRBuilder, MRI, AssignFn) {}
|
|
|
|
|
|
|
|
void markPhysRegUsed(unsigned PhysReg) override {
|
|
|
|
MIRBuilder.getMBB().addLiveIn(PhysReg);
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
AMDGPU/GlobalISel: Implement call lowering for shaders returning values
Reviewers: arsenm, nhaehnle
Subscribers: kzhuravl, jvesely, wdng, yaxunl, rovka, kristof.beyls, dstuttard, tpr, t-tye, volkan, llvm-commits
Differential Revision: https://reviews.llvm.org/D57166
llvm-svn: 357964
2019-04-09 10:26:03 +08:00
|
|
|
}
|
|
|
|
|
2016-04-15 03:09:28 +08:00
|
|
|
AMDGPUCallLowering::AMDGPUCallLowering(const AMDGPUTargetLowering &TLI)
|
2018-08-31 13:49:54 +08:00
|
|
|
: CallLowering(&TLI) {
|
2016-04-15 03:09:28 +08:00
|
|
|
}
|
|
|
|
|
2019-07-19 22:15:18 +08:00
|
|
|
void AMDGPUCallLowering::splitToValueTypes(
|
|
|
|
const ArgInfo &OrigArg, SmallVectorImpl<ArgInfo> &SplitArgs,
|
|
|
|
const DataLayout &DL, MachineRegisterInfo &MRI, CallingConv::ID CallConv,
|
|
|
|
SplitArgTy PerformArgSplit) const {
|
|
|
|
const SITargetLowering &TLI = *getTLI<SITargetLowering>();
|
|
|
|
LLVMContext &Ctx = OrigArg.Ty->getContext();
|
|
|
|
|
|
|
|
if (OrigArg.Ty->isVoidTy())
|
|
|
|
return;
|
|
|
|
|
|
|
|
SmallVector<EVT, 4> SplitVTs;
|
|
|
|
ComputeValueVTs(TLI, DL, OrigArg.Ty, SplitVTs);
|
|
|
|
|
2019-07-19 22:29:30 +08:00
|
|
|
assert(OrigArg.Regs.size() == SplitVTs.size());
|
2019-07-19 22:15:18 +08:00
|
|
|
|
2019-07-19 22:29:30 +08:00
|
|
|
int SplitIdx = 0;
|
|
|
|
for (EVT VT : SplitVTs) {
|
|
|
|
unsigned NumParts = TLI.getNumRegistersForCallingConv(Ctx, CallConv, VT);
|
|
|
|
Type *Ty = VT.getTypeForEVT(Ctx);
|
2019-07-19 22:15:18 +08:00
|
|
|
|
|
|
|
|
|
|
|
|
2019-07-19 22:29:30 +08:00
|
|
|
if (NumParts == 1) {
|
|
|
|
// No splitting to do, but we want to replace the original type (e.g. [1 x
|
|
|
|
// double] -> double).
|
|
|
|
SplitArgs.emplace_back(OrigArg.Regs[SplitIdx], Ty,
|
|
|
|
OrigArg.Flags, OrigArg.IsFixed);
|
|
|
|
|
|
|
|
++SplitIdx;
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
LLT LLTy = getLLTForType(*Ty, DL);
|
|
|
|
|
|
|
|
SmallVector<Register, 8> SplitRegs;
|
|
|
|
|
|
|
|
EVT PartVT = TLI.getRegisterTypeForCallingConv(Ctx, CallConv, VT);
|
|
|
|
Type *PartTy = PartVT.getTypeForEVT(Ctx);
|
|
|
|
LLT PartLLT = getLLTForType(*PartTy, DL);
|
|
|
|
|
|
|
|
// FIXME: Should we be reporting all of the part registers for a single
|
|
|
|
// argument, and let handleAssignments take care of the repacking?
|
|
|
|
for (unsigned i = 0; i < NumParts; ++i) {
|
|
|
|
Register PartReg = MRI.createGenericVirtualRegister(PartLLT);
|
|
|
|
SplitRegs.push_back(PartReg);
|
|
|
|
SplitArgs.emplace_back(ArrayRef<Register>(PartReg), PartTy, OrigArg.Flags);
|
|
|
|
}
|
|
|
|
|
|
|
|
PerformArgSplit(SplitRegs, LLTy, PartLLT, SplitIdx);
|
|
|
|
|
|
|
|
++SplitIdx;
|
|
|
|
}
|
2019-07-19 22:15:18 +08:00
|
|
|
}
|
|
|
|
|
2016-04-15 03:09:28 +08:00
|
|
|
bool AMDGPUCallLowering::lowerReturn(MachineIRBuilder &MIRBuilder,
|
2018-08-02 16:33:31 +08:00
|
|
|
const Value *Val,
|
2019-06-24 23:50:29 +08:00
|
|
|
ArrayRef<Register> VRegs) const {
|
AMDGPU/GlobalISel: Implement call lowering for shaders returning values
Reviewers: arsenm, nhaehnle
Subscribers: kzhuravl, jvesely, wdng, yaxunl, rovka, kristof.beyls, dstuttard, tpr, t-tye, volkan, llvm-commits
Differential Revision: https://reviews.llvm.org/D57166
llvm-svn: 357964
2019-04-09 10:26:03 +08:00
|
|
|
|
|
|
|
MachineFunction &MF = MIRBuilder.getMF();
|
|
|
|
MachineRegisterInfo &MRI = MF.getRegInfo();
|
|
|
|
SIMachineFunctionInfo *MFI = MF.getInfo<SIMachineFunctionInfo>();
|
|
|
|
MFI->setIfReturnsVoid(!Val);
|
|
|
|
|
|
|
|
if (!Val) {
|
|
|
|
MIRBuilder.buildInstr(AMDGPU::S_ENDPGM).addImm(0);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2019-06-24 23:50:29 +08:00
|
|
|
Register VReg = VRegs[0];
|
AMDGPU/GlobalISel: Implement call lowering for shaders returning values
Reviewers: arsenm, nhaehnle
Subscribers: kzhuravl, jvesely, wdng, yaxunl, rovka, kristof.beyls, dstuttard, tpr, t-tye, volkan, llvm-commits
Differential Revision: https://reviews.llvm.org/D57166
llvm-svn: 357964
2019-04-09 10:26:03 +08:00
|
|
|
|
|
|
|
const Function &F = MF.getFunction();
|
|
|
|
auto &DL = F.getParent()->getDataLayout();
|
|
|
|
if (!AMDGPU::isShader(F.getCallingConv()))
|
|
|
|
return false;
|
|
|
|
|
|
|
|
|
|
|
|
const AMDGPUTargetLowering &TLI = *getTLI<AMDGPUTargetLowering>();
|
|
|
|
SmallVector<EVT, 4> SplitVTs;
|
|
|
|
SmallVector<uint64_t, 4> Offsets;
|
|
|
|
ArgInfo OrigArg{VReg, Val->getType()};
|
|
|
|
setArgFlags(OrigArg, AttributeList::ReturnIndex, DL, F);
|
|
|
|
ComputeValueVTs(TLI, DL, OrigArg.Ty, SplitVTs, &Offsets, 0);
|
|
|
|
|
|
|
|
SmallVector<ArgInfo, 8> SplitArgs;
|
|
|
|
CCAssignFn *AssignFn = CCAssignFnForReturn(F.getCallingConv(), false);
|
|
|
|
for (unsigned i = 0, e = Offsets.size(); i != e; ++i) {
|
|
|
|
Type *SplitTy = SplitVTs[i].getTypeForEVT(F.getContext());
|
|
|
|
SplitArgs.push_back({VRegs[i], SplitTy, OrigArg.Flags, OrigArg.IsFixed});
|
|
|
|
}
|
|
|
|
auto RetInstr = MIRBuilder.buildInstrNoInsert(AMDGPU::SI_RETURN_TO_EPILOG);
|
|
|
|
OutgoingArgHandler Handler(MIRBuilder, MRI, RetInstr, AssignFn);
|
|
|
|
if (!handleAssignments(MIRBuilder, SplitArgs, Handler))
|
AMDGPU/GlobalISel: Fall-back to SelectionDAG for non-void functions
Reviewers: arsenm, nhaehnle
Reviewed By: nhaehnle
Subscribers: kzhuravl, wdng, nhaehnle, yaxunl, rovka, kristof.beyls, dstuttard, tpr, t-tye, llvm-commits
Differential Revision: https://reviews.llvm.org/D45843
llvm-svn: 330774
2018-04-25 05:29:36 +08:00
|
|
|
return false;
|
AMDGPU/GlobalISel: Implement call lowering for shaders returning values
Reviewers: arsenm, nhaehnle
Subscribers: kzhuravl, jvesely, wdng, yaxunl, rovka, kristof.beyls, dstuttard, tpr, t-tye, volkan, llvm-commits
Differential Revision: https://reviews.llvm.org/D57166
llvm-svn: 357964
2019-04-09 10:26:03 +08:00
|
|
|
MIRBuilder.insertInstr(RetInstr);
|
AMDGPU/GlobalISel: Fall-back to SelectionDAG for non-void functions
Reviewers: arsenm, nhaehnle
Reviewed By: nhaehnle
Subscribers: kzhuravl, wdng, nhaehnle, yaxunl, rovka, kristof.beyls, dstuttard, tpr, t-tye, llvm-commits
Differential Revision: https://reviews.llvm.org/D45843
llvm-svn: 330774
2018-04-25 05:29:36 +08:00
|
|
|
|
2016-04-15 03:09:28 +08:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2019-06-25 00:16:12 +08:00
|
|
|
Register AMDGPUCallLowering::lowerParameterPtr(MachineIRBuilder &MIRBuilder,
|
Re-commit AMDGPU/GlobalISel: Add support for simple shaders
Fix build when global-isel is disabled and fix a warning.
Summary: We can select constant/global G_LOAD, global G_STORE, and G_GEP.
Reviewers: qcolombet, MatzeB, t.p.northover, ab, arsenm
Subscribers: mehdi_amini, vkalintiris, kzhuravl, wdng, nhaehnle, mgorny, yaxunl, tony-tye, modocache, llvm-commits, dberris
Differential Revision: https://reviews.llvm.org/D26730
llvm-svn: 293551
2017-01-31 05:56:46 +08:00
|
|
|
Type *ParamTy,
|
2018-07-06 01:01:20 +08:00
|
|
|
uint64_t Offset) const {
|
Re-commit AMDGPU/GlobalISel: Add support for simple shaders
Fix build when global-isel is disabled and fix a warning.
Summary: We can select constant/global G_LOAD, global G_STORE, and G_GEP.
Reviewers: qcolombet, MatzeB, t.p.northover, ab, arsenm
Subscribers: mehdi_amini, vkalintiris, kzhuravl, wdng, nhaehnle, mgorny, yaxunl, tony-tye, modocache, llvm-commits, dberris
Differential Revision: https://reviews.llvm.org/D26730
llvm-svn: 293551
2017-01-31 05:56:46 +08:00
|
|
|
|
|
|
|
MachineFunction &MF = MIRBuilder.getMF();
|
2017-08-04 07:00:29 +08:00
|
|
|
const SIMachineFunctionInfo *MFI = MF.getInfo<SIMachineFunctionInfo>();
|
Re-commit AMDGPU/GlobalISel: Add support for simple shaders
Fix build when global-isel is disabled and fix a warning.
Summary: We can select constant/global G_LOAD, global G_STORE, and G_GEP.
Reviewers: qcolombet, MatzeB, t.p.northover, ab, arsenm
Subscribers: mehdi_amini, vkalintiris, kzhuravl, wdng, nhaehnle, mgorny, yaxunl, tony-tye, modocache, llvm-commits, dberris
Differential Revision: https://reviews.llvm.org/D26730
llvm-svn: 293551
2017-01-31 05:56:46 +08:00
|
|
|
MachineRegisterInfo &MRI = MF.getRegInfo();
|
2017-12-16 06:22:58 +08:00
|
|
|
const Function &F = MF.getFunction();
|
Re-commit AMDGPU/GlobalISel: Add support for simple shaders
Fix build when global-isel is disabled and fix a warning.
Summary: We can select constant/global G_LOAD, global G_STORE, and G_GEP.
Reviewers: qcolombet, MatzeB, t.p.northover, ab, arsenm
Subscribers: mehdi_amini, vkalintiris, kzhuravl, wdng, nhaehnle, mgorny, yaxunl, tony-tye, modocache, llvm-commits, dberris
Differential Revision: https://reviews.llvm.org/D26730
llvm-svn: 293551
2017-01-31 05:56:46 +08:00
|
|
|
const DataLayout &DL = F.getParent()->getDataLayout();
|
2018-08-31 13:49:54 +08:00
|
|
|
PointerType *PtrTy = PointerType::get(ParamTy, AMDGPUAS::CONSTANT_ADDRESS);
|
Recommit: [globalisel] Change LLT constructor string into an LLT-based object that knows how to generate it.
Summary:
This will allow future patches to inspect the details of the LLT. The implementation is now split between
the Support and CodeGen libraries to allow TableGen to use this class without introducing layering concerns.
Thanks to Ahmed Bougacha for finding a reasonable way to avoid the layering issue and providing the version of this patch without that problem.
The problem with the previous commit appears to have been that TableGen was including CodeGen/LowLevelType.h instead of Support/LowLevelTypeImpl.h.
Reviewers: t.p.northover, qcolombet, rovka, aditya_nandakumar, ab, javed.absar
Subscribers: arsenm, nhaehnle, mgorny, dberris, llvm-commits, kristof.beyls
Differential Revision: https://reviews.llvm.org/D30046
llvm-svn: 297241
2017-03-08 07:20:35 +08:00
|
|
|
LLT PtrType = getLLTForType(*PtrTy, DL);
|
2019-06-25 00:16:12 +08:00
|
|
|
Register DstReg = MRI.createGenericVirtualRegister(PtrType);
|
|
|
|
Register KernArgSegmentPtr =
|
2017-08-04 07:00:29 +08:00
|
|
|
MFI->getPreloadedReg(AMDGPUFunctionArgInfo::KERNARG_SEGMENT_PTR);
|
2019-06-25 00:16:12 +08:00
|
|
|
Register KernArgSegmentVReg = MRI.getLiveInVirtReg(KernArgSegmentPtr);
|
Re-commit AMDGPU/GlobalISel: Add support for simple shaders
Fix build when global-isel is disabled and fix a warning.
Summary: We can select constant/global G_LOAD, global G_STORE, and G_GEP.
Reviewers: qcolombet, MatzeB, t.p.northover, ab, arsenm
Subscribers: mehdi_amini, vkalintiris, kzhuravl, wdng, nhaehnle, mgorny, yaxunl, tony-tye, modocache, llvm-commits, dberris
Differential Revision: https://reviews.llvm.org/D26730
llvm-svn: 293551
2017-01-31 05:56:46 +08:00
|
|
|
|
2019-06-25 00:16:12 +08:00
|
|
|
Register OffsetReg = MRI.createGenericVirtualRegister(LLT::scalar(64));
|
Re-commit AMDGPU/GlobalISel: Add support for simple shaders
Fix build when global-isel is disabled and fix a warning.
Summary: We can select constant/global G_LOAD, global G_STORE, and G_GEP.
Reviewers: qcolombet, MatzeB, t.p.northover, ab, arsenm
Subscribers: mehdi_amini, vkalintiris, kzhuravl, wdng, nhaehnle, mgorny, yaxunl, tony-tye, modocache, llvm-commits, dberris
Differential Revision: https://reviews.llvm.org/D26730
llvm-svn: 293551
2017-01-31 05:56:46 +08:00
|
|
|
MIRBuilder.buildConstant(OffsetReg, Offset);
|
|
|
|
|
|
|
|
MIRBuilder.buildGEP(DstReg, KernArgSegmentVReg, OffsetReg);
|
|
|
|
|
|
|
|
return DstReg;
|
|
|
|
}
|
|
|
|
|
|
|
|
void AMDGPUCallLowering::lowerParameter(MachineIRBuilder &MIRBuilder,
|
2018-07-06 01:01:20 +08:00
|
|
|
Type *ParamTy, uint64_t Offset,
|
|
|
|
unsigned Align,
|
2019-06-24 23:50:29 +08:00
|
|
|
Register DstReg) const {
|
Re-commit AMDGPU/GlobalISel: Add support for simple shaders
Fix build when global-isel is disabled and fix a warning.
Summary: We can select constant/global G_LOAD, global G_STORE, and G_GEP.
Reviewers: qcolombet, MatzeB, t.p.northover, ab, arsenm
Subscribers: mehdi_amini, vkalintiris, kzhuravl, wdng, nhaehnle, mgorny, yaxunl, tony-tye, modocache, llvm-commits, dberris
Differential Revision: https://reviews.llvm.org/D26730
llvm-svn: 293551
2017-01-31 05:56:46 +08:00
|
|
|
MachineFunction &MF = MIRBuilder.getMF();
|
2017-12-16 06:22:58 +08:00
|
|
|
const Function &F = MF.getFunction();
|
Re-commit AMDGPU/GlobalISel: Add support for simple shaders
Fix build when global-isel is disabled and fix a warning.
Summary: We can select constant/global G_LOAD, global G_STORE, and G_GEP.
Reviewers: qcolombet, MatzeB, t.p.northover, ab, arsenm
Subscribers: mehdi_amini, vkalintiris, kzhuravl, wdng, nhaehnle, mgorny, yaxunl, tony-tye, modocache, llvm-commits, dberris
Differential Revision: https://reviews.llvm.org/D26730
llvm-svn: 293551
2017-01-31 05:56:46 +08:00
|
|
|
const DataLayout &DL = F.getParent()->getDataLayout();
|
2018-08-31 13:49:54 +08:00
|
|
|
PointerType *PtrTy = PointerType::get(ParamTy, AMDGPUAS::CONSTANT_ADDRESS);
|
Re-commit AMDGPU/GlobalISel: Add support for simple shaders
Fix build when global-isel is disabled and fix a warning.
Summary: We can select constant/global G_LOAD, global G_STORE, and G_GEP.
Reviewers: qcolombet, MatzeB, t.p.northover, ab, arsenm
Subscribers: mehdi_amini, vkalintiris, kzhuravl, wdng, nhaehnle, mgorny, yaxunl, tony-tye, modocache, llvm-commits, dberris
Differential Revision: https://reviews.llvm.org/D26730
llvm-svn: 293551
2017-01-31 05:56:46 +08:00
|
|
|
MachinePointerInfo PtrInfo(UndefValue::get(PtrTy));
|
|
|
|
unsigned TypeSize = DL.getTypeStoreSize(ParamTy);
|
2019-06-24 23:50:29 +08:00
|
|
|
Register PtrReg = lowerParameterPtr(MIRBuilder, ParamTy, Offset);
|
Re-commit AMDGPU/GlobalISel: Add support for simple shaders
Fix build when global-isel is disabled and fix a warning.
Summary: We can select constant/global G_LOAD, global G_STORE, and G_GEP.
Reviewers: qcolombet, MatzeB, t.p.northover, ab, arsenm
Subscribers: mehdi_amini, vkalintiris, kzhuravl, wdng, nhaehnle, mgorny, yaxunl, tony-tye, modocache, llvm-commits, dberris
Differential Revision: https://reviews.llvm.org/D26730
llvm-svn: 293551
2017-01-31 05:56:46 +08:00
|
|
|
|
|
|
|
MachineMemOperand *MMO =
|
|
|
|
MF.getMachineMemOperand(PtrInfo, MachineMemOperand::MOLoad |
|
|
|
|
MachineMemOperand::MONonTemporal |
|
|
|
|
MachineMemOperand::MOInvariant,
|
|
|
|
TypeSize, Align);
|
|
|
|
|
|
|
|
MIRBuilder.buildLoad(DstReg, PtrReg, *MMO);
|
|
|
|
}
|
|
|
|
|
2019-07-02 02:50:50 +08:00
|
|
|
// Allocate special inputs passed in user SGPRs.
|
|
|
|
static void allocateHSAUserSGPRs(CCState &CCInfo,
|
|
|
|
MachineIRBuilder &MIRBuilder,
|
|
|
|
MachineFunction &MF,
|
|
|
|
const SIRegisterInfo &TRI,
|
|
|
|
SIMachineFunctionInfo &Info) {
|
|
|
|
// FIXME: How should these inputs interact with inreg / custom SGPR inputs?
|
|
|
|
if (Info.hasPrivateSegmentBuffer()) {
|
|
|
|
unsigned PrivateSegmentBufferReg = Info.addPrivateSegmentBuffer(TRI);
|
|
|
|
MF.addLiveIn(PrivateSegmentBufferReg, &AMDGPU::SGPR_128RegClass);
|
|
|
|
CCInfo.AllocateReg(PrivateSegmentBufferReg);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (Info.hasDispatchPtr()) {
|
|
|
|
unsigned DispatchPtrReg = Info.addDispatchPtr(TRI);
|
|
|
|
MF.addLiveIn(DispatchPtrReg, &AMDGPU::SGPR_64RegClass);
|
|
|
|
CCInfo.AllocateReg(DispatchPtrReg);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (Info.hasQueuePtr()) {
|
|
|
|
unsigned QueuePtrReg = Info.addQueuePtr(TRI);
|
|
|
|
MF.addLiveIn(QueuePtrReg, &AMDGPU::SGPR_64RegClass);
|
|
|
|
CCInfo.AllocateReg(QueuePtrReg);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (Info.hasKernargSegmentPtr()) {
|
|
|
|
MachineRegisterInfo &MRI = MF.getRegInfo();
|
|
|
|
Register InputPtrReg = Info.addKernargSegmentPtr(TRI);
|
|
|
|
const LLT P4 = LLT::pointer(AMDGPUAS::CONSTANT_ADDRESS, 64);
|
|
|
|
Register VReg = MRI.createGenericVirtualRegister(P4);
|
|
|
|
MRI.addLiveIn(InputPtrReg, VReg);
|
|
|
|
MIRBuilder.getMBB().addLiveIn(InputPtrReg);
|
|
|
|
MIRBuilder.buildCopy(VReg, InputPtrReg);
|
|
|
|
CCInfo.AllocateReg(InputPtrReg);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (Info.hasDispatchID()) {
|
|
|
|
unsigned DispatchIDReg = Info.addDispatchID(TRI);
|
|
|
|
MF.addLiveIn(DispatchIDReg, &AMDGPU::SGPR_64RegClass);
|
|
|
|
CCInfo.AllocateReg(DispatchIDReg);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (Info.hasFlatScratchInit()) {
|
|
|
|
unsigned FlatScratchInitReg = Info.addFlatScratchInit(TRI);
|
|
|
|
MF.addLiveIn(FlatScratchInitReg, &AMDGPU::SGPR_64RegClass);
|
|
|
|
CCInfo.AllocateReg(FlatScratchInitReg);
|
|
|
|
}
|
|
|
|
|
|
|
|
// TODO: Add GridWorkGroupCount user SGPRs when used. For now with HSA we read
|
|
|
|
// these from the dispatch pointer.
|
|
|
|
}
|
|
|
|
|
2019-07-11 22:18:25 +08:00
|
|
|
bool AMDGPUCallLowering::lowerFormalArgumentsKernel(
|
|
|
|
MachineIRBuilder &MIRBuilder, const Function &F,
|
|
|
|
ArrayRef<ArrayRef<Register>> VRegs) const {
|
|
|
|
MachineFunction &MF = MIRBuilder.getMF();
|
|
|
|
const GCNSubtarget *Subtarget = &MF.getSubtarget<GCNSubtarget>();
|
|
|
|
MachineRegisterInfo &MRI = MF.getRegInfo();
|
|
|
|
SIMachineFunctionInfo *Info = MF.getInfo<SIMachineFunctionInfo>();
|
2019-07-19 22:15:18 +08:00
|
|
|
const SIRegisterInfo *TRI = Subtarget->getRegisterInfo();
|
|
|
|
const SITargetLowering &TLI = *getTLI<SITargetLowering>();
|
|
|
|
|
2019-07-11 22:18:25 +08:00
|
|
|
const DataLayout &DL = F.getParent()->getDataLayout();
|
|
|
|
|
|
|
|
SmallVector<CCValAssign, 16> ArgLocs;
|
|
|
|
CCState CCInfo(F.getCallingConv(), F.isVarArg(), MF, ArgLocs, F.getContext());
|
|
|
|
|
|
|
|
allocateHSAUserSGPRs(CCInfo, MIRBuilder, MF, *TRI, *Info);
|
|
|
|
|
|
|
|
unsigned i = 0;
|
|
|
|
const unsigned KernArgBaseAlign = 16;
|
|
|
|
const unsigned BaseOffset = Subtarget->getExplicitKernelArgOffset(F);
|
|
|
|
uint64_t ExplicitArgOffset = 0;
|
|
|
|
|
|
|
|
// TODO: Align down to dword alignment and extract bits for extending loads.
|
|
|
|
for (auto &Arg : F.args()) {
|
|
|
|
Type *ArgTy = Arg.getType();
|
|
|
|
unsigned AllocSize = DL.getTypeAllocSize(ArgTy);
|
|
|
|
if (AllocSize == 0)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
unsigned ABIAlign = DL.getABITypeAlignment(ArgTy);
|
|
|
|
|
|
|
|
uint64_t ArgOffset = alignTo(ExplicitArgOffset, ABIAlign) + BaseOffset;
|
|
|
|
ExplicitArgOffset = alignTo(ExplicitArgOffset, ABIAlign) + AllocSize;
|
|
|
|
|
|
|
|
ArrayRef<Register> OrigArgRegs = VRegs[i];
|
|
|
|
Register ArgReg =
|
|
|
|
OrigArgRegs.size() == 1
|
|
|
|
? OrigArgRegs[0]
|
|
|
|
: MRI.createGenericVirtualRegister(getLLTForType(*ArgTy, DL));
|
|
|
|
unsigned Align = MinAlign(KernArgBaseAlign, ArgOffset);
|
|
|
|
ArgOffset = alignTo(ArgOffset, DL.getABITypeAlignment(ArgTy));
|
|
|
|
lowerParameter(MIRBuilder, ArgTy, ArgOffset, Align, ArgReg);
|
|
|
|
if (OrigArgRegs.size() > 1)
|
|
|
|
unpackRegs(OrigArgRegs, ArgReg, ArgTy, MIRBuilder);
|
|
|
|
++i;
|
|
|
|
}
|
|
|
|
|
2019-07-19 22:15:18 +08:00
|
|
|
TLI.allocateSpecialEntryInputVGPRs(CCInfo, MF, *TRI, *Info);
|
|
|
|
TLI.allocateSystemSGPRs(CCInfo, MF, *Info, F.getCallingConv(), false);
|
2019-07-11 22:18:25 +08:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2019-07-19 22:15:18 +08:00
|
|
|
static void packSplitRegsToOrigType(MachineIRBuilder &MIRBuilder,
|
|
|
|
ArrayRef<Register> OrigRegs,
|
|
|
|
ArrayRef<Register> Regs,
|
|
|
|
LLT LLTy,
|
|
|
|
LLT PartLLT) {
|
|
|
|
if (!LLTy.isVector() && !PartLLT.isVector()) {
|
|
|
|
MIRBuilder.buildMerge(OrigRegs[0], Regs);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (LLTy.isVector() && PartLLT.isVector()) {
|
|
|
|
assert(LLTy.getElementType() == PartLLT.getElementType());
|
|
|
|
|
|
|
|
int DstElts = LLTy.getNumElements();
|
|
|
|
int PartElts = PartLLT.getNumElements();
|
|
|
|
if (DstElts % PartElts == 0)
|
|
|
|
MIRBuilder.buildConcatVectors(OrigRegs[0], Regs);
|
|
|
|
else {
|
|
|
|
// Deal with v3s16 split into v2s16
|
|
|
|
assert(PartElts == 2 && DstElts % 2 != 0);
|
|
|
|
int RoundedElts = PartElts * ((DstElts + PartElts - 1) / PartElts);
|
|
|
|
|
|
|
|
LLT RoundedDestTy = LLT::vector(RoundedElts, PartLLT.getElementType());
|
|
|
|
auto RoundedConcat = MIRBuilder.buildConcatVectors(RoundedDestTy, Regs);
|
|
|
|
MIRBuilder.buildExtract(OrigRegs[0], RoundedConcat, 0);
|
|
|
|
}
|
|
|
|
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
assert(LLTy.isVector() && !PartLLT.isVector());
|
|
|
|
|
|
|
|
LLT DstEltTy = LLTy.getElementType();
|
|
|
|
if (DstEltTy == PartLLT) {
|
|
|
|
// Vector was trivially scalarized.
|
|
|
|
MIRBuilder.buildBuildVector(OrigRegs[0], Regs);
|
|
|
|
} else if (DstEltTy.getSizeInBits() > PartLLT.getSizeInBits()) {
|
|
|
|
// Deal with vector with 64-bit elements decomposed to 32-bit
|
|
|
|
// registers. Need to create intermediate 64-bit elements.
|
|
|
|
SmallVector<Register, 8> EltMerges;
|
|
|
|
int PartsPerElt = DstEltTy.getSizeInBits() / PartLLT.getSizeInBits();
|
|
|
|
|
|
|
|
assert(DstEltTy.getSizeInBits() % PartLLT.getSizeInBits() == 0);
|
|
|
|
|
|
|
|
for (int I = 0, NumElts = LLTy.getNumElements(); I != NumElts; ++I) {
|
|
|
|
auto Merge = MIRBuilder.buildMerge(DstEltTy,
|
|
|
|
Regs.take_front(PartsPerElt));
|
|
|
|
EltMerges.push_back(Merge.getReg(0));
|
|
|
|
Regs = Regs.drop_front(PartsPerElt);
|
|
|
|
}
|
|
|
|
|
|
|
|
MIRBuilder.buildBuildVector(OrigRegs[0], EltMerges);
|
|
|
|
} else {
|
|
|
|
// Vector was split, and elements promoted to a wider type.
|
|
|
|
LLT BVType = LLT::vector(LLTy.getNumElements(), PartLLT);
|
|
|
|
auto BV = MIRBuilder.buildBuildVector(BVType, Regs);
|
|
|
|
MIRBuilder.buildTrunc(OrigRegs[0], BV);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-06-27 16:54:17 +08:00
|
|
|
bool AMDGPUCallLowering::lowerFormalArguments(
|
|
|
|
MachineIRBuilder &MIRBuilder, const Function &F,
|
|
|
|
ArrayRef<ArrayRef<Register>> VRegs) const {
|
2019-07-19 22:15:18 +08:00
|
|
|
CallingConv::ID CC = F.getCallingConv();
|
|
|
|
|
2019-07-11 22:18:25 +08:00
|
|
|
// The infrastructure for normal calling convention lowering is essentially
|
|
|
|
// useless for kernels. We want to avoid any kind of legalization or argument
|
|
|
|
// splitting.
|
2019-07-19 22:15:18 +08:00
|
|
|
if (CC == CallingConv::AMDGPU_KERNEL)
|
2019-07-11 22:18:25 +08:00
|
|
|
return lowerFormalArgumentsKernel(MIRBuilder, F, VRegs);
|
|
|
|
|
2018-05-08 06:17:54 +08:00
|
|
|
// AMDGPU_GS and AMDGP_HS are not supported yet.
|
2019-07-19 22:15:18 +08:00
|
|
|
if (CC == CallingConv::AMDGPU_GS || CC == CallingConv::AMDGPU_HS)
|
2018-04-30 23:15:23 +08:00
|
|
|
return false;
|
Re-commit AMDGPU/GlobalISel: Add support for simple shaders
Fix build when global-isel is disabled and fix a warning.
Summary: We can select constant/global G_LOAD, global G_STORE, and G_GEP.
Reviewers: qcolombet, MatzeB, t.p.northover, ab, arsenm
Subscribers: mehdi_amini, vkalintiris, kzhuravl, wdng, nhaehnle, mgorny, yaxunl, tony-tye, modocache, llvm-commits, dberris
Differential Revision: https://reviews.llvm.org/D26730
llvm-svn: 293551
2017-01-31 05:56:46 +08:00
|
|
|
|
2019-07-19 22:15:18 +08:00
|
|
|
const bool IsShader = AMDGPU::isShader(CC);
|
|
|
|
const bool IsEntryFunc = AMDGPU::isEntryFunctionCC(CC);
|
|
|
|
|
Re-commit AMDGPU/GlobalISel: Add support for simple shaders
Fix build when global-isel is disabled and fix a warning.
Summary: We can select constant/global G_LOAD, global G_STORE, and G_GEP.
Reviewers: qcolombet, MatzeB, t.p.northover, ab, arsenm
Subscribers: mehdi_amini, vkalintiris, kzhuravl, wdng, nhaehnle, mgorny, yaxunl, tony-tye, modocache, llvm-commits, dberris
Differential Revision: https://reviews.llvm.org/D26730
llvm-svn: 293551
2017-01-31 05:56:46 +08:00
|
|
|
MachineFunction &MF = MIRBuilder.getMF();
|
2019-07-19 22:15:18 +08:00
|
|
|
MachineBasicBlock &MBB = MIRBuilder.getMBB();
|
Re-commit AMDGPU/GlobalISel: Add support for simple shaders
Fix build when global-isel is disabled and fix a warning.
Summary: We can select constant/global G_LOAD, global G_STORE, and G_GEP.
Reviewers: qcolombet, MatzeB, t.p.northover, ab, arsenm
Subscribers: mehdi_amini, vkalintiris, kzhuravl, wdng, nhaehnle, mgorny, yaxunl, tony-tye, modocache, llvm-commits, dberris
Differential Revision: https://reviews.llvm.org/D26730
llvm-svn: 293551
2017-01-31 05:56:46 +08:00
|
|
|
MachineRegisterInfo &MRI = MF.getRegInfo();
|
|
|
|
SIMachineFunctionInfo *Info = MF.getInfo<SIMachineFunctionInfo>();
|
2019-07-19 22:15:18 +08:00
|
|
|
const GCNSubtarget &Subtarget = MF.getSubtarget<GCNSubtarget>();
|
|
|
|
const SIRegisterInfo *TRI = Subtarget.getRegisterInfo();
|
Re-commit AMDGPU/GlobalISel: Add support for simple shaders
Fix build when global-isel is disabled and fix a warning.
Summary: We can select constant/global G_LOAD, global G_STORE, and G_GEP.
Reviewers: qcolombet, MatzeB, t.p.northover, ab, arsenm
Subscribers: mehdi_amini, vkalintiris, kzhuravl, wdng, nhaehnle, mgorny, yaxunl, tony-tye, modocache, llvm-commits, dberris
Differential Revision: https://reviews.llvm.org/D26730
llvm-svn: 293551
2017-01-31 05:56:46 +08:00
|
|
|
const DataLayout &DL = F.getParent()->getDataLayout();
|
|
|
|
|
2019-05-31 03:33:18 +08:00
|
|
|
|
Re-commit AMDGPU/GlobalISel: Add support for simple shaders
Fix build when global-isel is disabled and fix a warning.
Summary: We can select constant/global G_LOAD, global G_STORE, and G_GEP.
Reviewers: qcolombet, MatzeB, t.p.northover, ab, arsenm
Subscribers: mehdi_amini, vkalintiris, kzhuravl, wdng, nhaehnle, mgorny, yaxunl, tony-tye, modocache, llvm-commits, dberris
Differential Revision: https://reviews.llvm.org/D26730
llvm-svn: 293551
2017-01-31 05:56:46 +08:00
|
|
|
SmallVector<CCValAssign, 16> ArgLocs;
|
2019-07-19 22:15:18 +08:00
|
|
|
CCState CCInfo(CC, F.isVarArg(), MF, ArgLocs, F.getContext());
|
Re-commit AMDGPU/GlobalISel: Add support for simple shaders
Fix build when global-isel is disabled and fix a warning.
Summary: We can select constant/global G_LOAD, global G_STORE, and G_GEP.
Reviewers: qcolombet, MatzeB, t.p.northover, ab, arsenm
Subscribers: mehdi_amini, vkalintiris, kzhuravl, wdng, nhaehnle, mgorny, yaxunl, tony-tye, modocache, llvm-commits, dberris
Differential Revision: https://reviews.llvm.org/D26730
llvm-svn: 293551
2017-01-31 05:56:46 +08:00
|
|
|
|
2019-07-02 02:50:50 +08:00
|
|
|
if (Info->hasImplicitBufferPtr()) {
|
2019-07-19 22:15:18 +08:00
|
|
|
Register ImplicitBufferPtrReg = Info->addImplicitBufferPtr(*TRI);
|
2019-07-02 02:50:50 +08:00
|
|
|
MF.addLiveIn(ImplicitBufferPtrReg, &AMDGPU::SGPR_64RegClass);
|
|
|
|
CCInfo.AllocateReg(ImplicitBufferPtrReg);
|
|
|
|
}
|
|
|
|
|
2019-07-19 22:15:18 +08:00
|
|
|
|
|
|
|
SmallVector<ArgInfo, 32> SplitArgs;
|
|
|
|
unsigned Idx = 0;
|
2018-04-25 04:51:28 +08:00
|
|
|
unsigned PSInputNum = 0;
|
2019-07-19 22:15:18 +08:00
|
|
|
|
|
|
|
for (auto &Arg : F.args()) {
|
|
|
|
if (DL.getTypeStoreSize(Arg.getType()) == 0)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
const bool InReg = Arg.hasAttribute(Attribute::InReg);
|
|
|
|
|
|
|
|
// SGPR arguments to functions not implemented.
|
|
|
|
if (!IsShader && InReg)
|
|
|
|
return false;
|
|
|
|
|
2019-07-19 22:29:30 +08:00
|
|
|
// TODO: Handle sret.
|
2019-07-19 22:15:18 +08:00
|
|
|
if (Arg.hasAttribute(Attribute::StructRet) ||
|
|
|
|
Arg.hasAttribute(Attribute::SwiftSelf) ||
|
|
|
|
Arg.hasAttribute(Attribute::SwiftError) ||
|
2019-07-19 22:29:30 +08:00
|
|
|
Arg.hasAttribute(Attribute::Nest))
|
2019-07-19 22:15:18 +08:00
|
|
|
return false;
|
|
|
|
|
|
|
|
if (CC == CallingConv::AMDGPU_PS && !InReg && PSInputNum <= 15) {
|
|
|
|
const bool ArgUsed = !Arg.use_empty();
|
|
|
|
bool SkipArg = !ArgUsed && !Info->isPSInputAllocated(PSInputNum);
|
|
|
|
|
|
|
|
if (!SkipArg) {
|
|
|
|
Info->markPSInputAllocated(PSInputNum);
|
|
|
|
if (ArgUsed)
|
|
|
|
Info->markPSInputEnabled(PSInputNum);
|
|
|
|
}
|
|
|
|
|
|
|
|
++PSInputNum;
|
|
|
|
|
|
|
|
if (SkipArg) {
|
2019-07-19 22:29:30 +08:00
|
|
|
for (int I = 0, E = VRegs[Idx].size(); I != E; ++I)
|
|
|
|
MIRBuilder.buildUndef(VRegs[Idx][I]);
|
|
|
|
|
2019-07-19 22:15:18 +08:00
|
|
|
++Idx;
|
2018-04-25 04:51:28 +08:00
|
|
|
continue;
|
|
|
|
}
|
2019-07-19 22:15:18 +08:00
|
|
|
}
|
2018-04-25 04:51:28 +08:00
|
|
|
|
2019-07-19 22:15:18 +08:00
|
|
|
ArgInfo OrigArg(VRegs[Idx], Arg.getType());
|
|
|
|
setArgFlags(OrigArg, Idx + AttributeList::FirstArgIndex, DL, F);
|
2019-07-19 22:29:30 +08:00
|
|
|
|
|
|
|
splitToValueTypes(
|
|
|
|
OrigArg, SplitArgs, DL, MRI, CC,
|
2019-07-19 22:15:18 +08:00
|
|
|
// FIXME: We should probably be passing multiple registers to
|
|
|
|
// handleAssignments to do this
|
2019-07-19 22:29:30 +08:00
|
|
|
[&](ArrayRef<Register> Regs, LLT LLTy, LLT PartLLT, int VTSplitIdx) {
|
|
|
|
packSplitRegsToOrigType(MIRBuilder, VRegs[Idx][VTSplitIdx], Regs,
|
|
|
|
LLTy, PartLLT);
|
2019-07-19 22:15:18 +08:00
|
|
|
});
|
2018-04-25 04:51:28 +08:00
|
|
|
|
2019-07-19 22:15:18 +08:00
|
|
|
++Idx;
|
|
|
|
}
|
|
|
|
|
|
|
|
// At least one interpolation mode must be enabled or else the GPU will
|
|
|
|
// hang.
|
|
|
|
//
|
|
|
|
// Check PSInputAddr instead of PSInputEnable. The idea is that if the user
|
|
|
|
// set PSInputAddr, the user wants to enable some bits after the compilation
|
|
|
|
// based on run-time states. Since we can't know what the final PSInputEna
|
|
|
|
// will look like, so we shouldn't do anything here and the user should take
|
|
|
|
// responsibility for the correct programming.
|
|
|
|
//
|
|
|
|
// Otherwise, the following restrictions apply:
|
|
|
|
// - At least one of PERSP_* (0xF) or LINEAR_* (0x70) must be enabled.
|
|
|
|
// - If POS_W_FLOAT (11) is enabled, at least one of PERSP_* must be
|
|
|
|
// enabled too.
|
|
|
|
if (CC == CallingConv::AMDGPU_PS) {
|
|
|
|
if ((Info->getPSInputAddr() & 0x7F) == 0 ||
|
|
|
|
((Info->getPSInputAddr() & 0xF) == 0 &&
|
|
|
|
Info->isPSInputAllocated(11))) {
|
|
|
|
CCInfo.AllocateReg(AMDGPU::VGPR0);
|
|
|
|
CCInfo.AllocateReg(AMDGPU::VGPR1);
|
|
|
|
Info->markPSInputAllocated(0);
|
|
|
|
Info->markPSInputEnabled(0);
|
2018-04-25 04:51:28 +08:00
|
|
|
}
|
|
|
|
|
2019-07-19 22:15:18 +08:00
|
|
|
if (Subtarget.isAmdPalOS()) {
|
|
|
|
// For isAmdPalOS, the user does not enable some bits after compilation
|
|
|
|
// based on run-time states; the register values being generated here are
|
|
|
|
// the final ones set in hardware. Therefore we need to apply the
|
|
|
|
// workaround to PSInputAddr and PSInputEnable together. (The case where
|
|
|
|
// a bit is set in PSInputAddr but not PSInputEnable is where the frontend
|
|
|
|
// set up an input arg for a particular interpolation mode, but nothing
|
|
|
|
// uses that input arg. Really we should have an earlier pass that removes
|
|
|
|
// such an arg.)
|
|
|
|
unsigned PsInputBits = Info->getPSInputAddr() & Info->getPSInputEnable();
|
|
|
|
if ((PsInputBits & 0x7F) == 0 ||
|
|
|
|
((PsInputBits & 0xF) == 0 &&
|
|
|
|
(PsInputBits >> 11 & 1)))
|
|
|
|
Info->markPSInputEnabled(
|
|
|
|
countTrailingZeros(Info->getPSInputAddr(), ZB_Undefined));
|
2018-04-25 04:51:28 +08:00
|
|
|
}
|
Re-commit AMDGPU/GlobalISel: Add support for simple shaders
Fix build when global-isel is disabled and fix a warning.
Summary: We can select constant/global G_LOAD, global G_STORE, and G_GEP.
Reviewers: qcolombet, MatzeB, t.p.northover, ab, arsenm
Subscribers: mehdi_amini, vkalintiris, kzhuravl, wdng, nhaehnle, mgorny, yaxunl, tony-tye, modocache, llvm-commits, dberris
Differential Revision: https://reviews.llvm.org/D26730
llvm-svn: 293551
2017-01-31 05:56:46 +08:00
|
|
|
}
|
|
|
|
|
2019-07-19 22:15:18 +08:00
|
|
|
const SITargetLowering &TLI = *getTLI<SITargetLowering>();
|
|
|
|
CCAssignFn *AssignFn = TLI.CCAssignFnForCall(CC, F.isVarArg());
|
2019-05-31 03:33:18 +08:00
|
|
|
|
2019-07-19 22:15:18 +08:00
|
|
|
if (!MBB.empty())
|
|
|
|
MIRBuilder.setInstr(*MBB.begin());
|
|
|
|
|
|
|
|
FormalArgHandler Handler(MIRBuilder, MRI, AssignFn);
|
|
|
|
if (!handleAssignments(CCInfo, ArgLocs, MIRBuilder, SplitArgs, Handler))
|
|
|
|
return false;
|
|
|
|
|
|
|
|
if (!IsEntryFunc) {
|
|
|
|
// Special inputs come after user arguments.
|
|
|
|
TLI.allocateSpecialInputVGPRs(CCInfo, MF, *TRI, *Info);
|
AMDGPU/GlobalISel: Add support for amdgpu_vs calling convention
Reviewers: arsenm
Reviewed By: arsenm
Subscribers: kzhuravl, wdng, nhaehnle, yaxunl, rovka, kristof.beyls, igorb, dstuttard, tpr, llvm-commits, t-tye
Differential Revision: https://reviews.llvm.org/D35916
llvm-svn: 309675
2017-08-01 20:38:33 +08:00
|
|
|
}
|
|
|
|
|
2019-07-19 22:15:18 +08:00
|
|
|
// Start adding system SGPRs.
|
|
|
|
if (IsEntryFunc) {
|
|
|
|
TLI.allocateSystemSGPRs(CCInfo, MF, *Info, CC, IsShader);
|
|
|
|
} else {
|
|
|
|
CCInfo.AllocateReg(Info->getScratchRSrcReg());
|
|
|
|
CCInfo.AllocateReg(Info->getScratchWaveOffsetReg());
|
|
|
|
CCInfo.AllocateReg(Info->getFrameOffsetReg());
|
|
|
|
TLI.allocateSpecialInputSGPRs(CCInfo, MF, *TRI, *Info);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Move back to the end of the basic block.
|
|
|
|
MIRBuilder.setMBB(MBB);
|
|
|
|
|
|
|
|
return true;
|
2016-04-15 03:09:28 +08:00
|
|
|
}
|