forked from OSchip/llvm-project
[LiveDebugValues] Speed up collectIDsForRegs, NFC
Use the advanceToLowerBound operation available on CoalescingBitVector iterators to speed up collection of variables which reside within some set of registers. The speedup comes from avoiding repeated top-down traversals in IntervalMap::find. The linear scan forward from one register interval to the next is unlikely to be as expensive as a full IntervalMap search starting from the root. This reduces time spent in LiveDebugValues when compiling sqlite3 by 200ms (about 0.1% - 0.2% of the total User Time). Depends on D76466. rdar://60046261 Differential Revision: https://reviews.llvm.org/D76467
This commit is contained in:
parent
a3fd1a1c74
commit
a245943355
|
@ -110,7 +110,10 @@ static bool isRegOtherThanSPAndFP(const MachineOperand &Op,
|
||||||
|
|
||||||
namespace {
|
namespace {
|
||||||
|
|
||||||
|
// Max out the number of statically allocated elements in DefinedRegsSet, as
|
||||||
|
// this prevents fallback to std::set::count() operations.
|
||||||
using DefinedRegsSet = SmallSet<Register, 32>;
|
using DefinedRegsSet = SmallSet<Register, 32>;
|
||||||
|
|
||||||
using VarLocSet = CoalescingBitVector<uint64_t>;
|
using VarLocSet = CoalescingBitVector<uint64_t>;
|
||||||
|
|
||||||
/// A type-checked pair of {Register Location (or 0), Index}, used to index
|
/// A type-checked pair of {Register Location (or 0), Index}, used to index
|
||||||
|
@ -563,10 +566,11 @@ private:
|
||||||
}
|
}
|
||||||
};
|
};
|
||||||
|
|
||||||
/// Collect all VarLoc IDs from \p CollectFrom for VarLocs which are located
|
/// Collect all VarLoc IDs from \p CollectFrom for VarLocs of kind
|
||||||
/// in \p Reg, of kind RegisterKind. Insert collected IDs in \p Collected.
|
/// RegisterKind which are located in any reg in \p Regs. Insert collected IDs
|
||||||
void collectIDsForReg(VarLocSet &Collected, uint32_t Reg,
|
/// into \p Collected.
|
||||||
const VarLocSet &CollectFrom) const;
|
void collectIDsForRegs(VarLocSet &Collected, const DefinedRegsSet &Regs,
|
||||||
|
const VarLocSet &CollectFrom) const;
|
||||||
|
|
||||||
/// Get the registers which are used by VarLocs of kind RegisterKind tracked
|
/// Get the registers which are used by VarLocs of kind RegisterKind tracked
|
||||||
/// by \p CollectFrom.
|
/// by \p CollectFrom.
|
||||||
|
@ -773,16 +777,30 @@ LiveDebugValues::OpenRangesSet::getEntryValueBackup(DebugVariable Var) {
|
||||||
return llvm::None;
|
return llvm::None;
|
||||||
}
|
}
|
||||||
|
|
||||||
void LiveDebugValues::collectIDsForReg(VarLocSet &Collected, uint32_t Reg,
|
void LiveDebugValues::collectIDsForRegs(VarLocSet &Collected,
|
||||||
const VarLocSet &CollectFrom) const {
|
const DefinedRegsSet &Regs,
|
||||||
// The half-open interval [FirstIndexForReg, FirstInvalidIndex) contains all
|
const VarLocSet &CollectFrom) const {
|
||||||
// possible VarLoc IDs for VarLocs of kind RegisterKind which live in Reg.
|
assert(!Regs.empty() && "Nothing to collect");
|
||||||
uint64_t FirstIndexForReg = LocIndex::rawIndexForReg(Reg);
|
SmallVector<uint32_t, 32> SortedRegs;
|
||||||
uint64_t FirstInvalidIndex = LocIndex::rawIndexForReg(Reg + 1);
|
for (Register Reg : Regs)
|
||||||
// Iterate through that half-open interval and collect all the set IDs.
|
SortedRegs.push_back(Reg);
|
||||||
for (auto It = CollectFrom.find(FirstIndexForReg), End = CollectFrom.end();
|
array_pod_sort(SortedRegs.begin(), SortedRegs.end());
|
||||||
It != End && *It < FirstInvalidIndex; ++It)
|
auto It = CollectFrom.find(LocIndex::rawIndexForReg(SortedRegs.front()));
|
||||||
Collected.set(*It);
|
auto End = CollectFrom.end();
|
||||||
|
for (uint32_t Reg : SortedRegs) {
|
||||||
|
// The half-open interval [FirstIndexForReg, FirstInvalidIndex) contains all
|
||||||
|
// possible VarLoc IDs for VarLocs of kind RegisterKind which live in Reg.
|
||||||
|
uint64_t FirstIndexForReg = LocIndex::rawIndexForReg(Reg);
|
||||||
|
uint64_t FirstInvalidIndex = LocIndex::rawIndexForReg(Reg + 1);
|
||||||
|
It.advanceToLowerBound(FirstIndexForReg);
|
||||||
|
|
||||||
|
// Iterate through that half-open interval and collect all the set IDs.
|
||||||
|
for (; It != End && *It < FirstInvalidIndex; ++It)
|
||||||
|
Collected.set(*It);
|
||||||
|
|
||||||
|
if (It == End)
|
||||||
|
return;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void LiveDebugValues::getUsedRegs(const VarLocSet &CollectFrom,
|
void LiveDebugValues::getUsedRegs(const VarLocSet &CollectFrom,
|
||||||
|
@ -803,7 +821,7 @@ void LiveDebugValues::getUsedRegs(const VarLocSet &CollectFrom,
|
||||||
// even if there aren't any VarLocs living in `FoundReg+1`, we're still
|
// even if there aren't any VarLocs living in `FoundReg+1`, we're still
|
||||||
// guaranteed to move on to the next register (or to end()).
|
// guaranteed to move on to the next register (or to end()).
|
||||||
uint64_t NextRegIndex = LocIndex::rawIndexForReg(FoundReg + 1);
|
uint64_t NextRegIndex = LocIndex::rawIndexForReg(FoundReg + 1);
|
||||||
It = CollectFrom.find(NextRegIndex);
|
It.advanceToLowerBound(NextRegIndex);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -1076,9 +1094,7 @@ void LiveDebugValues::transferRegisterDef(
|
||||||
unsigned SP = TLI->getStackPointerRegisterToSaveRestore();
|
unsigned SP = TLI->getStackPointerRegisterToSaveRestore();
|
||||||
|
|
||||||
// Find the regs killed by MI, and find regmasks of preserved regs.
|
// Find the regs killed by MI, and find regmasks of preserved regs.
|
||||||
// Max out the number of statically allocated elements in `DeadRegs`, as this
|
DefinedRegsSet DeadRegs;
|
||||||
// prevents fallback to std::set::count() operations.
|
|
||||||
SmallSet<uint32_t, 32> DeadRegs;
|
|
||||||
SmallVector<const uint32_t *, 4> RegMasks;
|
SmallVector<const uint32_t *, 4> RegMasks;
|
||||||
for (const MachineOperand &MO : MI.operands()) {
|
for (const MachineOperand &MO : MI.operands()) {
|
||||||
// Determine whether the operand is a register def.
|
// Determine whether the operand is a register def.
|
||||||
|
@ -1097,9 +1113,6 @@ void LiveDebugValues::transferRegisterDef(
|
||||||
// Erase VarLocs which reside in one of the dead registers. For performance
|
// Erase VarLocs which reside in one of the dead registers. For performance
|
||||||
// reasons, it's critical to not iterate over the full set of open VarLocs.
|
// reasons, it's critical to not iterate over the full set of open VarLocs.
|
||||||
// Iterate over the set of dying/used regs instead.
|
// Iterate over the set of dying/used regs instead.
|
||||||
VarLocSet KillSet(Alloc);
|
|
||||||
for (uint32_t DeadReg : DeadRegs)
|
|
||||||
collectIDsForReg(KillSet, DeadReg, OpenRanges.getVarLocs());
|
|
||||||
if (!RegMasks.empty()) {
|
if (!RegMasks.empty()) {
|
||||||
SmallVector<uint32_t, 32> UsedRegs;
|
SmallVector<uint32_t, 32> UsedRegs;
|
||||||
getUsedRegs(OpenRanges.getVarLocs(), UsedRegs);
|
getUsedRegs(OpenRanges.getVarLocs(), UsedRegs);
|
||||||
|
@ -1121,9 +1134,15 @@ void LiveDebugValues::transferRegisterDef(
|
||||||
return MachineOperand::clobbersPhysReg(RegMask, Reg);
|
return MachineOperand::clobbersPhysReg(RegMask, Reg);
|
||||||
});
|
});
|
||||||
if (AnyRegMaskKillsReg)
|
if (AnyRegMaskKillsReg)
|
||||||
collectIDsForReg(KillSet, Reg, OpenRanges.getVarLocs());
|
DeadRegs.insert(Reg);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
if (DeadRegs.empty())
|
||||||
|
return;
|
||||||
|
|
||||||
|
VarLocSet KillSet(Alloc);
|
||||||
|
collectIDsForRegs(KillSet, DeadRegs, OpenRanges.getVarLocs());
|
||||||
OpenRanges.erase(KillSet, VarLocIDs);
|
OpenRanges.erase(KillSet, VarLocIDs);
|
||||||
|
|
||||||
if (auto *TPC = getAnalysisIfAvailable<TargetPassConfig>()) {
|
if (auto *TPC = getAnalysisIfAvailable<TargetPassConfig>()) {
|
||||||
|
|
Loading…
Reference in New Issue