2020-04-09 19:40:53 +08:00
|
|
|
//===-- FixupStatepointCallerSaved.cpp - Fixup caller saved registers ----===//
|
|
|
|
//
|
2021-08-05 11:16:17 +08:00
|
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
2020-04-09 19:40:53 +08:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
///
|
|
|
|
/// \file
|
|
|
|
/// Statepoint instruction in deopt parameters contains values which are
|
|
|
|
/// meaningful to the runtime and should be able to be read at the moment the
|
|
|
|
/// call returns. So we can say that we need to encode the fact that these
|
|
|
|
/// values are "late read" by runtime. If we could express this notion for
|
|
|
|
/// register allocator it would produce the right form for us.
|
|
|
|
/// The need to fixup (i.e this pass) is specifically handling the fact that
|
|
|
|
/// we cannot describe such a late read for the register allocator.
|
|
|
|
/// Register allocator may put the value on a register clobbered by the call.
|
|
|
|
/// This pass forces the spill of such registers and replaces corresponding
|
|
|
|
/// statepoint operands to added spill slots.
|
|
|
|
///
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#include "llvm/ADT/SmallSet.h"
|
|
|
|
#include "llvm/ADT/Statistic.h"
|
|
|
|
#include "llvm/CodeGen/MachineFrameInfo.h"
|
|
|
|
#include "llvm/CodeGen/MachineFunctionPass.h"
|
2022-03-10 20:54:41 +08:00
|
|
|
#include "llvm/CodeGen/MachineRegisterInfo.h"
|
|
|
|
#include "llvm/CodeGen/Passes.h"
|
2020-04-09 19:40:53 +08:00
|
|
|
#include "llvm/CodeGen/StackMaps.h"
|
2022-03-10 20:54:41 +08:00
|
|
|
#include "llvm/CodeGen/TargetFrameLowering.h"
|
2020-04-09 19:40:53 +08:00
|
|
|
#include "llvm/CodeGen/TargetInstrInfo.h"
|
|
|
|
#include "llvm/IR/Statepoint.h"
|
|
|
|
#include "llvm/InitializePasses.h"
|
|
|
|
#include "llvm/Support/Debug.h"
|
|
|
|
|
|
|
|
using namespace llvm;
|
|
|
|
|
|
|
|
#define DEBUG_TYPE "fixup-statepoint-caller-saved"
|
|
|
|
STATISTIC(NumSpilledRegisters, "Number of spilled register");
|
|
|
|
STATISTIC(NumSpillSlotsAllocated, "Number of spill slots allocated");
|
|
|
|
STATISTIC(NumSpillSlotsExtended, "Number of spill slots extended");
|
|
|
|
|
|
|
|
static cl::opt<bool> FixupSCSExtendSlotSize(
|
|
|
|
"fixup-scs-extend-slot-size", cl::Hidden, cl::init(false),
|
|
|
|
cl::desc("Allow spill in spill slot of greater size than register size"),
|
|
|
|
cl::Hidden);
|
|
|
|
|
2020-06-10 21:52:25 +08:00
|
|
|
static cl::opt<bool> PassGCPtrInCSR(
|
|
|
|
"fixup-allow-gcptr-in-csr", cl::Hidden, cl::init(false),
|
|
|
|
cl::desc("Allow passing GC Pointer arguments in callee saved registers"));
|
|
|
|
|
|
|
|
static cl::opt<bool> EnableCopyProp(
|
|
|
|
"fixup-scs-enable-copy-propagation", cl::Hidden, cl::init(true),
|
|
|
|
cl::desc("Enable simple copy propagation during register reloading"));
|
|
|
|
|
|
|
|
// This is purely debugging option.
|
|
|
|
// It may be handy for investigating statepoint spilling issues.
|
|
|
|
static cl::opt<unsigned> MaxStatepointsWithRegs(
|
|
|
|
"fixup-max-csr-statepoints", cl::Hidden,
|
|
|
|
cl::desc("Max number of statepoints allowed to pass GC Ptrs in registers"));
|
|
|
|
|
2020-04-09 19:40:53 +08:00
|
|
|
namespace {
|
|
|
|
|
|
|
|
class FixupStatepointCallerSaved : public MachineFunctionPass {
|
|
|
|
public:
|
|
|
|
static char ID;
|
|
|
|
|
|
|
|
FixupStatepointCallerSaved() : MachineFunctionPass(ID) {
|
|
|
|
initializeFixupStatepointCallerSavedPass(*PassRegistry::getPassRegistry());
|
|
|
|
}
|
|
|
|
|
|
|
|
void getAnalysisUsage(AnalysisUsage &AU) const override {
|
2020-05-14 01:29:04 +08:00
|
|
|
AU.setPreservesCFG();
|
2020-04-09 19:40:53 +08:00
|
|
|
MachineFunctionPass::getAnalysisUsage(AU);
|
|
|
|
}
|
|
|
|
|
|
|
|
StringRef getPassName() const override {
|
|
|
|
return "Fixup Statepoint Caller Saved";
|
|
|
|
}
|
|
|
|
|
|
|
|
bool runOnMachineFunction(MachineFunction &MF) override;
|
|
|
|
};
|
2020-06-10 21:52:25 +08:00
|
|
|
|
2020-04-09 19:40:53 +08:00
|
|
|
} // End anonymous namespace.
|
|
|
|
|
|
|
|
char FixupStatepointCallerSaved::ID = 0;
|
|
|
|
char &llvm::FixupStatepointCallerSavedID = FixupStatepointCallerSaved::ID;
|
|
|
|
|
|
|
|
INITIALIZE_PASS_BEGIN(FixupStatepointCallerSaved, DEBUG_TYPE,
|
|
|
|
"Fixup Statepoint Caller Saved", false, false)
|
|
|
|
INITIALIZE_PASS_END(FixupStatepointCallerSaved, DEBUG_TYPE,
|
|
|
|
"Fixup Statepoint Caller Saved", false, false)
|
|
|
|
|
|
|
|
// Utility function to get size of the register.
|
|
|
|
static unsigned getRegisterSize(const TargetRegisterInfo &TRI, Register Reg) {
|
|
|
|
const TargetRegisterClass *RC = TRI.getMinimalPhysRegClass(Reg);
|
|
|
|
return TRI.getSpillSize(*RC);
|
|
|
|
}
|
|
|
|
|
2020-06-10 21:52:25 +08:00
|
|
|
// Try to eliminate redundant copy to register which we're going to
|
|
|
|
// spill, i.e. try to change:
|
|
|
|
// X = COPY Y
|
|
|
|
// SPILL X
|
|
|
|
// to
|
|
|
|
// SPILL Y
|
|
|
|
// If there are no uses of X between copy and STATEPOINT, that COPY
|
|
|
|
// may be eliminated.
|
|
|
|
// Reg - register we're about to spill
|
|
|
|
// RI - On entry points to statepoint.
|
|
|
|
// On successful copy propagation set to new spill point.
|
|
|
|
// IsKill - set to true if COPY is Kill (there are no uses of Y)
|
|
|
|
// Returns either found source copy register or original one.
|
|
|
|
static Register performCopyPropagation(Register Reg,
|
|
|
|
MachineBasicBlock::iterator &RI,
|
|
|
|
bool &IsKill, const TargetInstrInfo &TII,
|
|
|
|
const TargetRegisterInfo &TRI) {
|
|
|
|
// First check if statepoint itself uses Reg in non-meta operands.
|
|
|
|
int Idx = RI->findRegisterUseOperandIdx(Reg, false, &TRI);
|
2020-08-14 23:08:54 +08:00
|
|
|
if (Idx >= 0 && (unsigned)Idx < StatepointOpers(&*RI).getNumDeoptArgsIdx()) {
|
|
|
|
IsKill = false;
|
|
|
|
return Reg;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!EnableCopyProp)
|
2020-06-10 21:52:25 +08:00
|
|
|
return Reg;
|
|
|
|
|
|
|
|
MachineBasicBlock *MBB = RI->getParent();
|
|
|
|
MachineBasicBlock::reverse_iterator E = MBB->rend();
|
|
|
|
MachineInstr *Def = nullptr, *Use = nullptr;
|
|
|
|
for (auto It = ++(RI.getReverse()); It != E; ++It) {
|
|
|
|
if (It->readsRegister(Reg, &TRI) && !Use)
|
|
|
|
Use = &*It;
|
|
|
|
if (It->modifiesRegister(Reg, &TRI)) {
|
|
|
|
Def = &*It;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!Def)
|
|
|
|
return Reg;
|
|
|
|
|
|
|
|
auto DestSrc = TII.isCopyInstr(*Def);
|
|
|
|
if (!DestSrc || DestSrc->Destination->getReg() != Reg)
|
|
|
|
return Reg;
|
|
|
|
|
|
|
|
Register SrcReg = DestSrc->Source->getReg();
|
|
|
|
|
|
|
|
if (getRegisterSize(TRI, Reg) != getRegisterSize(TRI, SrcReg))
|
|
|
|
return Reg;
|
|
|
|
|
|
|
|
LLVM_DEBUG(dbgs() << "spillRegisters: perform copy propagation "
|
|
|
|
<< printReg(Reg, &TRI) << " -> " << printReg(SrcReg, &TRI)
|
|
|
|
<< "\n");
|
|
|
|
|
|
|
|
// Insert spill immediately after Def
|
|
|
|
RI = ++MachineBasicBlock::iterator(Def);
|
|
|
|
IsKill = DestSrc->Source->isKill();
|
|
|
|
|
|
|
|
// There are no uses of original register between COPY and STATEPOINT.
|
|
|
|
// There can't be any after STATEPOINT, so we can eliminate Def.
|
|
|
|
if (!Use) {
|
|
|
|
LLVM_DEBUG(dbgs() << "spillRegisters: removing dead copy " << *Def);
|
|
|
|
Def->eraseFromParent();
|
|
|
|
}
|
|
|
|
return SrcReg;
|
|
|
|
}
|
|
|
|
|
2020-04-25 17:50:52 +08:00
|
|
|
namespace {
|
2020-06-10 21:52:25 +08:00
|
|
|
// Pair {Register, FrameIndex}
|
|
|
|
using RegSlotPair = std::pair<Register, int>;
|
|
|
|
|
|
|
|
// Keeps track of what reloads were inserted in MBB.
|
|
|
|
class RegReloadCache {
|
|
|
|
using ReloadSet = SmallSet<RegSlotPair, 8>;
|
|
|
|
DenseMap<const MachineBasicBlock *, ReloadSet> Reloads;
|
|
|
|
|
|
|
|
public:
|
|
|
|
RegReloadCache() = default;
|
|
|
|
|
|
|
|
// Record reload of Reg from FI in block MBB
|
|
|
|
void recordReload(Register Reg, int FI, const MachineBasicBlock *MBB) {
|
|
|
|
RegSlotPair RSP(Reg, FI);
|
|
|
|
auto Res = Reloads[MBB].insert(RSP);
|
2020-08-14 23:35:58 +08:00
|
|
|
(void)Res;
|
2020-06-10 21:52:25 +08:00
|
|
|
assert(Res.second && "reload already exists");
|
|
|
|
}
|
|
|
|
|
|
|
|
// Does basic block MBB contains reload of Reg from FI?
|
|
|
|
bool hasReload(Register Reg, int FI, const MachineBasicBlock *MBB) {
|
|
|
|
RegSlotPair RSP(Reg, FI);
|
|
|
|
return Reloads.count(MBB) && Reloads[MBB].count(RSP);
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2020-04-09 19:40:53 +08:00
|
|
|
// Cache used frame indexes during statepoint re-write to re-use them in
|
|
|
|
// processing next statepoint instruction.
|
|
|
|
// Two strategies. One is to preserve the size of spill slot while another one
|
|
|
|
// extends the size of spill slots to reduce the number of them, causing
|
|
|
|
// the less total frame size. But unspill will have "implicit" any extend.
|
|
|
|
class FrameIndexesCache {
|
|
|
|
private:
|
|
|
|
struct FrameIndexesPerSize {
|
|
|
|
// List of used frame indexes during processing previous statepoints.
|
|
|
|
SmallVector<int, 8> Slots;
|
|
|
|
// Current index of un-used yet frame index.
|
|
|
|
unsigned Index = 0;
|
|
|
|
};
|
|
|
|
MachineFrameInfo &MFI;
|
|
|
|
const TargetRegisterInfo &TRI;
|
|
|
|
// Map size to list of frame indexes of this size. If the mode is
|
|
|
|
// FixupSCSExtendSlotSize then the key 0 is used to keep all frame indexes.
|
|
|
|
// If the size of required spill slot is greater than in a cache then the
|
|
|
|
// size will be increased.
|
|
|
|
DenseMap<unsigned, FrameIndexesPerSize> Cache;
|
|
|
|
|
2020-06-10 21:52:25 +08:00
|
|
|
// Keeps track of slots reserved for the shared landing pad processing.
|
|
|
|
// Initialized from GlobalIndices for the current EHPad.
|
|
|
|
SmallSet<int, 8> ReservedSlots;
|
|
|
|
|
|
|
|
// Landing pad can be destination of several statepoints. Every register
|
|
|
|
// defined by such statepoints must be spilled to the same stack slot.
|
|
|
|
// This map keeps that information.
|
|
|
|
DenseMap<const MachineBasicBlock *, SmallVector<RegSlotPair, 8>>
|
|
|
|
GlobalIndices;
|
|
|
|
|
|
|
|
FrameIndexesPerSize &getCacheBucket(unsigned Size) {
|
|
|
|
// In FixupSCSExtendSlotSize mode the bucket with 0 index is used
|
|
|
|
// for all sizes.
|
|
|
|
return Cache[FixupSCSExtendSlotSize ? 0 : Size];
|
|
|
|
}
|
|
|
|
|
2020-04-09 19:40:53 +08:00
|
|
|
public:
|
|
|
|
FrameIndexesCache(MachineFrameInfo &MFI, const TargetRegisterInfo &TRI)
|
|
|
|
: MFI(MFI), TRI(TRI) {}
|
|
|
|
// Reset the current state of used frame indexes. After invocation of
|
2020-06-10 21:52:25 +08:00
|
|
|
// this function all frame indexes are available for allocation with
|
|
|
|
// the exception of slots reserved for landing pad processing (if any).
|
|
|
|
void reset(const MachineBasicBlock *EHPad) {
|
2020-04-09 19:40:53 +08:00
|
|
|
for (auto &It : Cache)
|
|
|
|
It.second.Index = 0;
|
2020-06-10 21:52:25 +08:00
|
|
|
|
|
|
|
ReservedSlots.clear();
|
|
|
|
if (EHPad && GlobalIndices.count(EHPad))
|
|
|
|
for (auto &RSP : GlobalIndices[EHPad])
|
|
|
|
ReservedSlots.insert(RSP.second);
|
2020-04-09 19:40:53 +08:00
|
|
|
}
|
2020-06-10 21:52:25 +08:00
|
|
|
|
2020-04-09 19:40:53 +08:00
|
|
|
// Get frame index to spill the register.
|
2020-06-10 21:52:25 +08:00
|
|
|
int getFrameIndex(Register Reg, MachineBasicBlock *EHPad) {
|
|
|
|
// Check if slot for Reg is already reserved at EHPad.
|
|
|
|
auto It = GlobalIndices.find(EHPad);
|
|
|
|
if (It != GlobalIndices.end()) {
|
|
|
|
auto &Vec = It->second;
|
|
|
|
auto Idx = llvm::find_if(
|
|
|
|
Vec, [Reg](RegSlotPair &RSP) { return Reg == RSP.first; });
|
|
|
|
if (Idx != Vec.end()) {
|
|
|
|
int FI = Idx->second;
|
|
|
|
LLVM_DEBUG(dbgs() << "Found global FI " << FI << " for register "
|
|
|
|
<< printReg(Reg, &TRI) << " at "
|
|
|
|
<< printMBBReference(*EHPad) << "\n");
|
|
|
|
assert(ReservedSlots.count(FI) && "using unreserved slot");
|
|
|
|
return FI;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-04-09 19:40:53 +08:00
|
|
|
unsigned Size = getRegisterSize(TRI, Reg);
|
2020-06-10 21:52:25 +08:00
|
|
|
FrameIndexesPerSize &Line = getCacheBucket(Size);
|
|
|
|
while (Line.Index < Line.Slots.size()) {
|
2020-04-09 19:40:53 +08:00
|
|
|
int FI = Line.Slots[Line.Index++];
|
2020-06-10 21:52:25 +08:00
|
|
|
if (ReservedSlots.count(FI))
|
|
|
|
continue;
|
2020-04-09 19:40:53 +08:00
|
|
|
// If all sizes are kept together we probably need to extend the
|
|
|
|
// spill slot size.
|
|
|
|
if (MFI.getObjectSize(FI) < Size) {
|
|
|
|
MFI.setObjectSize(FI, Size);
|
|
|
|
MFI.setObjectAlignment(FI, Align(Size));
|
|
|
|
NumSpillSlotsExtended++;
|
|
|
|
}
|
|
|
|
return FI;
|
|
|
|
}
|
2020-07-01 16:49:28 +08:00
|
|
|
int FI = MFI.CreateSpillStackObject(Size, Align(Size));
|
2020-04-09 19:40:53 +08:00
|
|
|
NumSpillSlotsAllocated++;
|
|
|
|
Line.Slots.push_back(FI);
|
|
|
|
++Line.Index;
|
2020-06-10 21:52:25 +08:00
|
|
|
|
|
|
|
// Remember assignment {Reg, FI} for EHPad
|
|
|
|
if (EHPad) {
|
|
|
|
GlobalIndices[EHPad].push_back(std::make_pair(Reg, FI));
|
|
|
|
LLVM_DEBUG(dbgs() << "Reserved FI " << FI << " for spilling reg "
|
|
|
|
<< printReg(Reg, &TRI) << " at landing pad "
|
|
|
|
<< printMBBReference(*EHPad) << "\n");
|
|
|
|
}
|
|
|
|
|
2020-04-09 19:40:53 +08:00
|
|
|
return FI;
|
|
|
|
}
|
2020-06-10 21:52:25 +08:00
|
|
|
|
2020-04-09 19:40:53 +08:00
|
|
|
// Sort all registers to spill in descendent order. In the
|
|
|
|
// FixupSCSExtendSlotSize mode it will minimize the total frame size.
|
|
|
|
// In non FixupSCSExtendSlotSize mode we can skip this step.
|
|
|
|
void sortRegisters(SmallVectorImpl<Register> &Regs) {
|
|
|
|
if (!FixupSCSExtendSlotSize)
|
|
|
|
return;
|
2021-01-15 12:30:31 +08:00
|
|
|
llvm::sort(Regs, [&](Register &A, Register &B) {
|
2020-04-09 19:40:53 +08:00
|
|
|
return getRegisterSize(TRI, A) > getRegisterSize(TRI, B);
|
|
|
|
});
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
// Describes the state of the current processing statepoint instruction.
|
|
|
|
class StatepointState {
|
|
|
|
private:
|
|
|
|
// statepoint instruction.
|
|
|
|
MachineInstr &MI;
|
|
|
|
MachineFunction &MF;
|
2020-06-10 21:52:25 +08:00
|
|
|
// If non-null then statepoint is invoke, and this points to the landing pad.
|
|
|
|
MachineBasicBlock *EHPad;
|
2020-04-09 19:40:53 +08:00
|
|
|
const TargetRegisterInfo &TRI;
|
|
|
|
const TargetInstrInfo &TII;
|
|
|
|
MachineFrameInfo &MFI;
|
|
|
|
// Mask with callee saved registers.
|
|
|
|
const uint32_t *Mask;
|
|
|
|
// Cache of frame indexes used on previous instruction processing.
|
|
|
|
FrameIndexesCache &CacheFI;
|
2020-06-10 21:52:25 +08:00
|
|
|
bool AllowGCPtrInCSR;
|
2020-04-09 19:40:53 +08:00
|
|
|
// Operands with physical registers requiring spilling.
|
|
|
|
SmallVector<unsigned, 8> OpsToSpill;
|
|
|
|
// Set of register to spill.
|
|
|
|
SmallVector<Register, 8> RegsToSpill;
|
2020-06-10 21:52:25 +08:00
|
|
|
// Set of registers to reload after statepoint.
|
|
|
|
SmallVector<Register, 8> RegsToReload;
|
2020-04-09 19:40:53 +08:00
|
|
|
// Map Register to Frame Slot index.
|
|
|
|
DenseMap<Register, int> RegToSlotIdx;
|
|
|
|
|
|
|
|
public:
|
|
|
|
StatepointState(MachineInstr &MI, const uint32_t *Mask,
|
2020-06-10 21:52:25 +08:00
|
|
|
FrameIndexesCache &CacheFI, bool AllowGCPtrInCSR)
|
2020-04-09 19:40:53 +08:00
|
|
|
: MI(MI), MF(*MI.getMF()), TRI(*MF.getSubtarget().getRegisterInfo()),
|
|
|
|
TII(*MF.getSubtarget().getInstrInfo()), MFI(MF.getFrameInfo()),
|
2020-06-10 21:52:25 +08:00
|
|
|
Mask(Mask), CacheFI(CacheFI), AllowGCPtrInCSR(AllowGCPtrInCSR) {
|
|
|
|
|
|
|
|
// Find statepoint's landing pad, if any.
|
|
|
|
EHPad = nullptr;
|
|
|
|
MachineBasicBlock *MBB = MI.getParent();
|
|
|
|
// Invoke statepoint must be last one in block.
|
|
|
|
bool Last = std::none_of(++MI.getIterator(), MBB->end().getInstrIterator(),
|
|
|
|
[](MachineInstr &I) {
|
|
|
|
return I.getOpcode() == TargetOpcode::STATEPOINT;
|
|
|
|
});
|
|
|
|
|
|
|
|
if (!Last)
|
|
|
|
return;
|
|
|
|
|
|
|
|
auto IsEHPad = [](MachineBasicBlock *B) { return B->isEHPad(); };
|
|
|
|
|
|
|
|
assert(llvm::count_if(MBB->successors(), IsEHPad) < 2 && "multiple EHPads");
|
|
|
|
|
|
|
|
auto It = llvm::find_if(MBB->successors(), IsEHPad);
|
|
|
|
if (It != MBB->succ_end())
|
|
|
|
EHPad = *It;
|
|
|
|
}
|
|
|
|
|
|
|
|
MachineBasicBlock *getEHPad() const { return EHPad; }
|
|
|
|
|
2020-04-09 19:40:53 +08:00
|
|
|
// Return true if register is callee saved.
|
|
|
|
bool isCalleeSaved(Register Reg) { return (Mask[Reg / 32] >> Reg % 32) & 1; }
|
2020-06-10 21:52:25 +08:00
|
|
|
|
2020-04-09 19:40:53 +08:00
|
|
|
// Iterates over statepoint meta args to find caller saver registers.
|
|
|
|
// Also cache the size of found registers.
|
|
|
|
// Returns true if caller save registers found.
|
|
|
|
bool findRegistersToSpill() {
|
[Statepoints] Change statepoint machine instr format to better suit VReg lowering.
Current Statepoint MI format is this:
STATEPOINT
<id>, <num patch bytes >, <num call arguments>, <call target>,
[call arguments...],
<StackMaps::ConstantOp>, <calling convention>,
<StackMaps::ConstantOp>, <statepoint flags>,
<StackMaps::ConstantOp>, <num deopt args>, [deopt args...],
<gc base/derived pairs...> <gc allocas...>
Note that GC pointers are listed in pairs <base,derived>.
This causes base pointers to appear many times (at least twice) in
instruction, which is bad for us when VReg lowering is ON.
The problem is that machine operand tiedness is 1-1 relation, so
it might look like this:
%vr2 = STATEPOINT ... %vr1, %vr1(tied-def0)
Since only one instance of %vr1 is tied, that may lead to incorrect
codegen (see PR46917 for more details), so we have to always spill
base pointers. This mostly defeats new VReg lowering scheme.
This patch changes statepoint instruction format so that every
gc pointer appears only once in operand list. That way they all can
be tied. Additional set of operands is added to preserve base-derived
relation required to build stackmap.
New statepoint has following format:
STATEPOINT
<id>, <num patch bytes>, <num call arguments>, <call target>,
[call arguments...],
<StackMaps::ConstantOp>, <calling convention>,
<StackMaps::ConstantOp>, <statepoint flags>,
<StackMaps::ConstantOp>, <num deopt args>, [deopt args...],
<StackMaps::ConstantOp>, <num gc pointers>, [gc pointers...],
<StackMaps::ConstantOp>, <num gc allocas>, [gc allocas...]
<StackMaps::ConstantOp>, <num entries in gc map>, [base/derived indices...]
Changes are:
- every gc pointer is listed only once in a flat length-prefixed list;
- alloca list is prefixed with its length too;
- following alloca list is length-prefixed list of base-derived
indices of pointers from gc pointer list. Note that indices are
logical (number of pointer), not absolute (index of machine operand).
Differential Revision: https://reviews.llvm.org/D87154
2020-09-05 01:45:41 +08:00
|
|
|
SmallSet<Register, 8> GCRegs;
|
|
|
|
// All GC pointer operands assigned to registers produce new value.
|
|
|
|
// Since they're tied to their defs, it is enough to collect def registers.
|
|
|
|
for (const auto &Def : MI.defs())
|
|
|
|
GCRegs.insert(Def.getReg());
|
|
|
|
|
2020-04-09 19:40:53 +08:00
|
|
|
SmallSet<Register, 8> VisitedRegs;
|
|
|
|
for (unsigned Idx = StatepointOpers(&MI).getVarIdx(),
|
|
|
|
EndIdx = MI.getNumOperands();
|
|
|
|
Idx < EndIdx; ++Idx) {
|
|
|
|
MachineOperand &MO = MI.getOperand(Idx);
|
2021-01-15 03:35:18 +08:00
|
|
|
// Leave `undef` operands as is, StackMaps will rewrite them
|
|
|
|
// into a constant.
|
|
|
|
if (!MO.isReg() || MO.isImplicit() || MO.isUndef())
|
2020-04-09 19:40:53 +08:00
|
|
|
continue;
|
|
|
|
Register Reg = MO.getReg();
|
|
|
|
assert(Reg.isPhysical() && "Only physical regs are expected");
|
2020-06-10 21:52:25 +08:00
|
|
|
|
|
|
|
if (isCalleeSaved(Reg) && (AllowGCPtrInCSR || !is_contained(GCRegs, Reg)))
|
2020-04-09 19:40:53 +08:00
|
|
|
continue;
|
2020-06-10 21:52:25 +08:00
|
|
|
|
|
|
|
LLVM_DEBUG(dbgs() << "Will spill " << printReg(Reg, &TRI) << " at index "
|
|
|
|
<< Idx << "\n");
|
|
|
|
|
2020-04-09 19:40:53 +08:00
|
|
|
if (VisitedRegs.insert(Reg).second)
|
|
|
|
RegsToSpill.push_back(Reg);
|
|
|
|
OpsToSpill.push_back(Idx);
|
|
|
|
}
|
|
|
|
CacheFI.sortRegisters(RegsToSpill);
|
|
|
|
return !RegsToSpill.empty();
|
|
|
|
}
|
2020-06-10 21:52:25 +08:00
|
|
|
|
2020-04-09 19:40:53 +08:00
|
|
|
// Spill all caller saved registers right before statepoint instruction.
|
|
|
|
// Remember frame index where register is spilled.
|
|
|
|
void spillRegisters() {
|
|
|
|
for (Register Reg : RegsToSpill) {
|
2020-06-10 21:52:25 +08:00
|
|
|
int FI = CacheFI.getFrameIndex(Reg, EHPad);
|
2020-04-09 19:40:53 +08:00
|
|
|
const TargetRegisterClass *RC = TRI.getMinimalPhysRegClass(Reg);
|
2020-06-10 21:52:25 +08:00
|
|
|
|
2020-04-09 19:40:53 +08:00
|
|
|
NumSpilledRegisters++;
|
|
|
|
RegToSlotIdx[Reg] = FI;
|
2020-06-10 21:52:25 +08:00
|
|
|
|
|
|
|
LLVM_DEBUG(dbgs() << "Spilling " << printReg(Reg, &TRI) << " to FI " << FI
|
|
|
|
<< "\n");
|
|
|
|
|
|
|
|
// Perform trivial copy propagation
|
|
|
|
bool IsKill = true;
|
|
|
|
MachineBasicBlock::iterator InsertBefore(MI);
|
|
|
|
Reg = performCopyPropagation(Reg, InsertBefore, IsKill, TII, TRI);
|
|
|
|
|
|
|
|
LLVM_DEBUG(dbgs() << "Insert spill before " << *InsertBefore);
|
|
|
|
TII.storeRegToStackSlot(*MI.getParent(), InsertBefore, Reg, IsKill, FI,
|
|
|
|
RC, &TRI);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void insertReloadBefore(unsigned Reg, MachineBasicBlock::iterator It,
|
|
|
|
MachineBasicBlock *MBB) {
|
|
|
|
const TargetRegisterClass *RC = TRI.getMinimalPhysRegClass(Reg);
|
|
|
|
int FI = RegToSlotIdx[Reg];
|
|
|
|
if (It != MBB->end()) {
|
|
|
|
TII.loadRegFromStackSlot(*MBB, It, Reg, FI, RC, &TRI);
|
|
|
|
return;
|
2020-04-09 19:40:53 +08:00
|
|
|
}
|
2020-06-10 21:52:25 +08:00
|
|
|
|
|
|
|
// To insert reload at the end of MBB, insert it before last instruction
|
|
|
|
// and then swap them.
|
2021-01-17 01:40:54 +08:00
|
|
|
assert(!MBB->empty() && "Empty block");
|
2020-06-10 21:52:25 +08:00
|
|
|
--It;
|
|
|
|
TII.loadRegFromStackSlot(*MBB, It, Reg, FI, RC, &TRI);
|
|
|
|
MachineInstr *Reload = It->getPrevNode();
|
|
|
|
int Dummy = 0;
|
2020-08-14 23:35:58 +08:00
|
|
|
(void)Dummy;
|
2020-06-10 21:52:25 +08:00
|
|
|
assert(TII.isLoadFromStackSlot(*Reload, Dummy) == Reg);
|
|
|
|
assert(Dummy == FI);
|
|
|
|
MBB->remove(Reload);
|
|
|
|
MBB->insertAfter(It, Reload);
|
2020-04-09 19:40:53 +08:00
|
|
|
}
|
2020-06-10 21:52:25 +08:00
|
|
|
|
|
|
|
// Insert reloads of (relocated) registers spilled in statepoint.
|
|
|
|
void insertReloads(MachineInstr *NewStatepoint, RegReloadCache &RC) {
|
|
|
|
MachineBasicBlock *MBB = NewStatepoint->getParent();
|
|
|
|
auto InsertPoint = std::next(NewStatepoint->getIterator());
|
|
|
|
|
|
|
|
for (auto Reg : RegsToReload) {
|
|
|
|
insertReloadBefore(Reg, InsertPoint, MBB);
|
|
|
|
LLVM_DEBUG(dbgs() << "Reloading " << printReg(Reg, &TRI) << " from FI "
|
|
|
|
<< RegToSlotIdx[Reg] << " after statepoint\n");
|
|
|
|
|
|
|
|
if (EHPad && !RC.hasReload(Reg, RegToSlotIdx[Reg], EHPad)) {
|
|
|
|
RC.recordReload(Reg, RegToSlotIdx[Reg], EHPad);
|
|
|
|
auto EHPadInsertPoint = EHPad->SkipPHIsLabelsAndDebug(EHPad->begin());
|
|
|
|
insertReloadBefore(Reg, EHPadInsertPoint, EHPad);
|
|
|
|
LLVM_DEBUG(dbgs() << "...also reload at EHPad "
|
|
|
|
<< printMBBReference(*EHPad) << "\n");
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-04-09 19:40:53 +08:00
|
|
|
// Re-write statepoint machine instruction to replace caller saved operands
|
|
|
|
// with indirect memory location (frame index).
|
2020-06-10 21:52:25 +08:00
|
|
|
MachineInstr *rewriteStatepoint() {
|
2020-04-09 19:40:53 +08:00
|
|
|
MachineInstr *NewMI =
|
|
|
|
MF.CreateMachineInstr(TII.get(MI.getOpcode()), MI.getDebugLoc(), true);
|
|
|
|
MachineInstrBuilder MIB(MF, NewMI);
|
|
|
|
|
2020-06-10 21:52:25 +08:00
|
|
|
unsigned NumOps = MI.getNumOperands();
|
|
|
|
|
|
|
|
// New indices for the remaining defs.
|
|
|
|
SmallVector<unsigned, 8> NewIndices;
|
|
|
|
unsigned NumDefs = MI.getNumDefs();
|
|
|
|
for (unsigned I = 0; I < NumDefs; ++I) {
|
|
|
|
MachineOperand &DefMO = MI.getOperand(I);
|
|
|
|
assert(DefMO.isReg() && DefMO.isDef() && "Expected Reg Def operand");
|
|
|
|
Register Reg = DefMO.getReg();
|
2021-02-02 17:25:11 +08:00
|
|
|
assert(DefMO.isTied() && "Def is expected to be tied");
|
|
|
|
// We skipped undef uses and did not spill them, so we should not
|
|
|
|
// proceed with defs here.
|
|
|
|
if (MI.getOperand(MI.findTiedOperandIdx(I)).isUndef()) {
|
|
|
|
if (AllowGCPtrInCSR) {
|
|
|
|
NewIndices.push_back(NewMI->getNumOperands());
|
|
|
|
MIB.addReg(Reg, RegState::Define);
|
|
|
|
}
|
|
|
|
continue;
|
|
|
|
}
|
2020-06-10 21:52:25 +08:00
|
|
|
if (!AllowGCPtrInCSR) {
|
|
|
|
assert(is_contained(RegsToSpill, Reg));
|
|
|
|
RegsToReload.push_back(Reg);
|
|
|
|
} else {
|
|
|
|
if (isCalleeSaved(Reg)) {
|
|
|
|
NewIndices.push_back(NewMI->getNumOperands());
|
|
|
|
MIB.addReg(Reg, RegState::Define);
|
|
|
|
} else {
|
|
|
|
NewIndices.push_back(NumOps);
|
|
|
|
RegsToReload.push_back(Reg);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-04-09 19:40:53 +08:00
|
|
|
// Add End marker.
|
|
|
|
OpsToSpill.push_back(MI.getNumOperands());
|
|
|
|
unsigned CurOpIdx = 0;
|
|
|
|
|
2020-06-10 21:52:25 +08:00
|
|
|
for (unsigned I = NumDefs; I < MI.getNumOperands(); ++I) {
|
2020-04-09 19:40:53 +08:00
|
|
|
MachineOperand &MO = MI.getOperand(I);
|
|
|
|
if (I == OpsToSpill[CurOpIdx]) {
|
|
|
|
int FI = RegToSlotIdx[MO.getReg()];
|
|
|
|
MIB.addImm(StackMaps::IndirectMemRefOp);
|
|
|
|
MIB.addImm(getRegisterSize(TRI, MO.getReg()));
|
|
|
|
assert(MO.isReg() && "Should be register");
|
|
|
|
assert(MO.getReg().isPhysical() && "Should be physical register");
|
|
|
|
MIB.addFrameIndex(FI);
|
|
|
|
MIB.addImm(0);
|
|
|
|
++CurOpIdx;
|
2020-06-10 21:52:25 +08:00
|
|
|
} else {
|
2020-04-09 19:40:53 +08:00
|
|
|
MIB.add(MO);
|
2020-06-10 21:52:25 +08:00
|
|
|
unsigned OldDef;
|
|
|
|
if (AllowGCPtrInCSR && MI.isRegTiedToDefOperand(I, &OldDef)) {
|
|
|
|
assert(OldDef < NumDefs);
|
|
|
|
assert(NewIndices[OldDef] < NumOps);
|
|
|
|
MIB->tieOperands(NewIndices[OldDef], MIB->getNumOperands() - 1);
|
|
|
|
}
|
|
|
|
}
|
2020-04-09 19:40:53 +08:00
|
|
|
}
|
|
|
|
assert(CurOpIdx == (OpsToSpill.size() - 1) && "Not all operands processed");
|
|
|
|
// Add mem operands.
|
|
|
|
NewMI->setMemRefs(MF, MI.memoperands());
|
|
|
|
for (auto It : RegToSlotIdx) {
|
2020-06-10 21:52:25 +08:00
|
|
|
Register R = It.first;
|
2020-04-09 19:40:53 +08:00
|
|
|
int FrameIndex = It.second;
|
|
|
|
auto PtrInfo = MachinePointerInfo::getFixedStack(MF, FrameIndex);
|
2020-06-10 21:52:25 +08:00
|
|
|
MachineMemOperand::Flags Flags = MachineMemOperand::MOLoad;
|
|
|
|
if (is_contained(RegsToReload, R))
|
|
|
|
Flags |= MachineMemOperand::MOStore;
|
|
|
|
auto *MMO =
|
|
|
|
MF.getMachineMemOperand(PtrInfo, Flags, getRegisterSize(TRI, R),
|
|
|
|
MFI.getObjectAlign(FrameIndex));
|
2020-04-09 19:40:53 +08:00
|
|
|
NewMI->addMemOperand(MF, MMO);
|
|
|
|
}
|
2020-06-10 21:52:25 +08:00
|
|
|
|
2020-04-09 19:40:53 +08:00
|
|
|
// Insert new statepoint and erase old one.
|
|
|
|
MI.getParent()->insert(MI, NewMI);
|
2020-06-10 21:52:25 +08:00
|
|
|
|
|
|
|
LLVM_DEBUG(dbgs() << "rewritten statepoint to : " << *NewMI << "\n");
|
2020-04-09 19:40:53 +08:00
|
|
|
MI.eraseFromParent();
|
2020-06-10 21:52:25 +08:00
|
|
|
return NewMI;
|
2020-04-09 19:40:53 +08:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
class StatepointProcessor {
|
|
|
|
private:
|
|
|
|
MachineFunction &MF;
|
|
|
|
const TargetRegisterInfo &TRI;
|
|
|
|
FrameIndexesCache CacheFI;
|
2020-06-10 21:52:25 +08:00
|
|
|
RegReloadCache ReloadCache;
|
2020-04-09 19:40:53 +08:00
|
|
|
|
|
|
|
public:
|
|
|
|
StatepointProcessor(MachineFunction &MF)
|
|
|
|
: MF(MF), TRI(*MF.getSubtarget().getRegisterInfo()),
|
|
|
|
CacheFI(MF.getFrameInfo(), TRI) {}
|
|
|
|
|
2020-06-10 21:52:25 +08:00
|
|
|
bool process(MachineInstr &MI, bool AllowGCPtrInCSR) {
|
2020-04-14 23:30:51 +08:00
|
|
|
StatepointOpers SO(&MI);
|
|
|
|
uint64_t Flags = SO.getFlags();
|
2020-04-09 19:40:53 +08:00
|
|
|
// Do nothing for LiveIn, it supports all registers.
|
|
|
|
if (Flags & (uint64_t)StatepointFlags::DeoptLiveIn)
|
|
|
|
return false;
|
2020-06-10 21:52:25 +08:00
|
|
|
LLVM_DEBUG(dbgs() << "\nMBB " << MI.getParent()->getNumber() << " "
|
|
|
|
<< MI.getParent()->getName() << " : process statepoint "
|
|
|
|
<< MI);
|
2020-04-14 23:30:51 +08:00
|
|
|
CallingConv::ID CC = SO.getCallingConv();
|
2020-04-09 19:40:53 +08:00
|
|
|
const uint32_t *Mask = TRI.getCallPreservedMask(MF, CC);
|
2020-06-10 21:52:25 +08:00
|
|
|
StatepointState SS(MI, Mask, CacheFI, AllowGCPtrInCSR);
|
|
|
|
CacheFI.reset(SS.getEHPad());
|
2020-04-09 19:40:53 +08:00
|
|
|
|
|
|
|
if (!SS.findRegistersToSpill())
|
|
|
|
return false;
|
|
|
|
|
|
|
|
SS.spillRegisters();
|
2020-06-10 21:52:25 +08:00
|
|
|
auto *NewStatepoint = SS.rewriteStatepoint();
|
|
|
|
SS.insertReloads(NewStatepoint, ReloadCache);
|
2020-04-09 19:40:53 +08:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
};
|
2020-04-25 17:50:52 +08:00
|
|
|
} // namespace
|
2020-04-09 19:40:53 +08:00
|
|
|
|
|
|
|
bool FixupStatepointCallerSaved::runOnMachineFunction(MachineFunction &MF) {
|
|
|
|
if (skipFunction(MF.getFunction()))
|
|
|
|
return false;
|
|
|
|
|
|
|
|
const Function &F = MF.getFunction();
|
|
|
|
if (!F.hasGC())
|
|
|
|
return false;
|
|
|
|
|
|
|
|
SmallVector<MachineInstr *, 16> Statepoints;
|
|
|
|
for (MachineBasicBlock &BB : MF)
|
|
|
|
for (MachineInstr &I : BB)
|
|
|
|
if (I.getOpcode() == TargetOpcode::STATEPOINT)
|
|
|
|
Statepoints.push_back(&I);
|
|
|
|
|
|
|
|
if (Statepoints.empty())
|
|
|
|
return false;
|
|
|
|
|
|
|
|
bool Changed = false;
|
|
|
|
StatepointProcessor SPP(MF);
|
2020-06-10 21:52:25 +08:00
|
|
|
unsigned NumStatepoints = 0;
|
|
|
|
bool AllowGCPtrInCSR = PassGCPtrInCSR;
|
|
|
|
for (MachineInstr *I : Statepoints) {
|
|
|
|
++NumStatepoints;
|
|
|
|
if (MaxStatepointsWithRegs.getNumOccurrences() &&
|
|
|
|
NumStatepoints >= MaxStatepointsWithRegs)
|
|
|
|
AllowGCPtrInCSR = false;
|
|
|
|
Changed |= SPP.process(*I, AllowGCPtrInCSR);
|
|
|
|
}
|
2020-04-09 19:40:53 +08:00
|
|
|
return Changed;
|
|
|
|
}
|