forked from OSchip/llvm-project
[DSE,MemorySSA] Skip access already dominated by a killing def.
If we already found a killing def (= a def that completely overwrites the location) that dominates an access, we can skip processing it further. This does not help with compile-time, but increases the number of memory accesses we can process with the same scan budget, leading to more stores being eliminated. Improvements with this change Same hash: 203 (filtered out) Remaining: 34 Metric: dse.NumFastStores Program base dom diff test-suite...rolangs-C++/family/family.test 2.00 4.00 100.0% test-suite...ProxyApps-C++/CLAMR/CLAMR.test 172.00 229.00 33.1% test-suite...ks/Prolangs-C/agrep/agrep.test 10.00 12.00 20.0% test-suite...oxyApps-C++/miniFE/miniFE.test 44.00 51.00 15.9% test-suite...marks/7zip/7zip-benchmark.test 1285.00 1474.00 14.7% test-suite...006/450.soplex/450.soplex.test 254.00 289.00 13.8% test-suite...006/447.dealII/447.dealII.test 2466.00 2798.00 13.5% test-suite...000/197.parser/197.parser.test 9.00 10.00 11.1% test-suite.../Benchmarks/nbench/nbench.test 85.00 91.00 7.1% test-suite...ce/Applications/siod/siod.test 68.00 72.00 5.9% test-suite...ications/JM/lencod/lencod.test 786.00 824.00 4.8% test-suite...6/464.h264ref/464.h264ref.test 765.00 798.00 4.3% test-suite.../Benchmarks/Ptrdist/bc/bc.test 105.00 109.00 3.8% test-suite...lications/obsequi/Obsequi.test 29.00 28.00 -3.4% test-suite...3.xalancbmk/483.xalancbmk.test 1322.00 1367.00 3.4% test-suite...chmarks/MallocBench/gs/gs.test 118.00 122.00 3.4% test-suite...T2006/401.bzip2/401.bzip2.test 60.00 62.00 3.3% test-suite...6/482.sphinx3/482.sphinx3.test 30.00 31.00 3.3% test-suite...rks/tramp3d-v4/tramp3d-v4.test 862.00 887.00 2.9% test-suite...telecomm-gsm/telecomm-gsm.test 78.00 80.00 2.6% test-suite...ediabench/gsm/toast/toast.test 78.00 80.00 2.6% test-suite.../Applications/SPASS/SPASS.test 163.00 167.00 2.5% test-suite...lications/ClamAV/clamscan.test 240.00 245.00 2.1% test-suite...006/453.povray/453.povray.test 1392.00 1419.00 1.9% test-suite...000/255.vortex/255.vortex.test 211.00 215.00 1.9% test-suite...:: External/Povray/povray.test 1295.00 1317.00 1.7% test-suite...lications/sqlite3/sqlite3.test 175.00 177.00 1.1% test-suite...T2000/256.bzip2/256.bzip2.test 99.00 100.00 1.0% test-suite...0/253.perlbmk/253.perlbmk.test 629.00 635.00 1.0% test-suite.../CINT2006/403.gcc/403.gcc.test 1183.00 1194.00 0.9% test-suite.../CINT2000/176.gcc/176.gcc.test 647.00 653.00 0.9% test-suite...ications/JM/ldecod/ldecod.test 512.00 516.00 0.8% test-suite...0.perlbench/400.perlbench.test 1026.00 1034.00 0.8% test-suite...-typeset/consumer-typeset.test 1876.00 1877.00 0.1% Geomean difference 7.3%
This commit is contained in:
parent
98e01f56b0
commit
4cc20aa743
|
@ -1787,7 +1787,8 @@ struct DSEState {
|
||||||
// eliminated if the access is killed along all paths to the exit. Collect
|
// eliminated if the access is killed along all paths to the exit. Collect
|
||||||
// the blocks with killing (=completely overwriting MemoryDefs) and check if
|
// the blocks with killing (=completely overwriting MemoryDefs) and check if
|
||||||
// they cover all paths from DomAccess to any function exit.
|
// they cover all paths from DomAccess to any function exit.
|
||||||
SmallPtrSet<BasicBlock *, 16> KillingBlocks = {KillingDef->getBlock()};
|
SmallPtrSet<Instruction *, 16> KillingDefs;
|
||||||
|
KillingDefs.insert(KillingDef->getMemoryInst());
|
||||||
LLVM_DEBUG({
|
LLVM_DEBUG({
|
||||||
dbgs() << " Checking for reads of " << *DomAccess;
|
dbgs() << " Checking for reads of " << *DomAccess;
|
||||||
if (isa<MemoryDef>(DomAccess))
|
if (isa<MemoryDef>(DomAccess))
|
||||||
|
@ -1816,6 +1817,13 @@ struct DSEState {
|
||||||
--ScanLimit;
|
--ScanLimit;
|
||||||
|
|
||||||
if (isa<MemoryPhi>(UseAccess)) {
|
if (isa<MemoryPhi>(UseAccess)) {
|
||||||
|
if (any_of(KillingDefs, [this, UseAccess](Instruction *KI) {
|
||||||
|
return DT.properlyDominates(KI->getParent(),
|
||||||
|
UseAccess->getBlock());
|
||||||
|
})) {
|
||||||
|
LLVM_DEBUG(dbgs() << " ... skipping, dominated by killing block\n");
|
||||||
|
continue;
|
||||||
|
}
|
||||||
LLVM_DEBUG(dbgs() << "\n ... adding PHI uses\n");
|
LLVM_DEBUG(dbgs() << "\n ... adding PHI uses\n");
|
||||||
PushMemUses(UseAccess);
|
PushMemUses(UseAccess);
|
||||||
continue;
|
continue;
|
||||||
|
@ -1824,6 +1832,13 @@ struct DSEState {
|
||||||
Instruction *UseInst = cast<MemoryUseOrDef>(UseAccess)->getMemoryInst();
|
Instruction *UseInst = cast<MemoryUseOrDef>(UseAccess)->getMemoryInst();
|
||||||
LLVM_DEBUG(dbgs() << " (" << *UseInst << ")\n");
|
LLVM_DEBUG(dbgs() << " (" << *UseInst << ")\n");
|
||||||
|
|
||||||
|
if (any_of(KillingDefs, [this, UseInst](Instruction *KI) {
|
||||||
|
return DT.dominates(KI, UseInst);
|
||||||
|
})) {
|
||||||
|
LLVM_DEBUG(dbgs() << " ... skipping, dominated by killing def\n");
|
||||||
|
continue;
|
||||||
|
}
|
||||||
|
|
||||||
if (isNoopIntrinsic(cast<MemoryUseOrDef>(UseAccess))) {
|
if (isNoopIntrinsic(cast<MemoryUseOrDef>(UseAccess))) {
|
||||||
LLVM_DEBUG(dbgs() << " ... adding uses of intrinsic\n");
|
LLVM_DEBUG(dbgs() << " ... adding uses of intrinsic\n");
|
||||||
PushMemUses(UseAccess);
|
PushMemUses(UseAccess);
|
||||||
|
@ -1868,9 +1883,9 @@ struct DSEState {
|
||||||
if (PostOrderNumbers.find(MaybeKillingBlock)->second <
|
if (PostOrderNumbers.find(MaybeKillingBlock)->second <
|
||||||
PostOrderNumbers.find(DomAccess->getBlock())->second) {
|
PostOrderNumbers.find(DomAccess->getBlock())->second) {
|
||||||
|
|
||||||
LLVM_DEBUG(dbgs() << " ... found killing block "
|
LLVM_DEBUG(dbgs()
|
||||||
<< MaybeKillingBlock->getName() << "\n");
|
<< " ... found killing def " << *UseInst << "\n");
|
||||||
KillingBlocks.insert(MaybeKillingBlock);
|
KillingDefs.insert(UseInst);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
} else
|
} else
|
||||||
|
@ -1882,8 +1897,12 @@ struct DSEState {
|
||||||
// that the location is killed (=overwritten) along all paths from DomAccess
|
// that the location is killed (=overwritten) along all paths from DomAccess
|
||||||
// to the exit.
|
// to the exit.
|
||||||
if (DefVisibleToCallerAfterRet) {
|
if (DefVisibleToCallerAfterRet) {
|
||||||
|
SmallPtrSet<BasicBlock *, 16> KillingBlocks;
|
||||||
|
for (Instruction *KD : KillingDefs)
|
||||||
|
KillingBlocks.insert(KD->getParent());
|
||||||
assert(!KillingBlocks.empty() &&
|
assert(!KillingBlocks.empty() &&
|
||||||
"Expected at least a single killing block");
|
"Expected at least a single killing block");
|
||||||
|
|
||||||
// Find the common post-dominator of all killing blocks.
|
// Find the common post-dominator of all killing blocks.
|
||||||
BasicBlock *CommonPred = *KillingBlocks.begin();
|
BasicBlock *CommonPred = *KillingBlocks.begin();
|
||||||
for (auto I = std::next(KillingBlocks.begin()), E = KillingBlocks.end();
|
for (auto I = std::next(KillingBlocks.begin()), E = KillingBlocks.end();
|
||||||
|
|
Loading…
Reference in New Issue