2007-10-31 11:30:14 +08:00
|
|
|
//===- MachineDominators.cpp - Machine Dominator Calculation --------------===//
|
|
|
|
//
|
2019-01-19 16:50:56 +08:00
|
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
2007-10-31 11:30:14 +08:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
//
|
|
|
|
// This file implements simple dominator construction algorithms for finding
|
|
|
|
// forward dominators on machine functions.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#include "llvm/CodeGen/MachineDominators.h"
|
2015-02-28 07:13:13 +08:00
|
|
|
#include "llvm/ADT/SmallBitVector.h"
|
2017-06-06 19:49:48 +08:00
|
|
|
#include "llvm/CodeGen/Passes.h"
|
Sink all InitializePasses.h includes
This file lists every pass in LLVM, and is included by Pass.h, which is
very popular. Every time we add, remove, or rename a pass in LLVM, it
caused lots of recompilation.
I found this fact by looking at this table, which is sorted by the
number of times a file was changed over the last 100,000 git commits
multiplied by the number of object files that depend on it in the
current checkout:
recompiles touches affected_files header
342380 95 3604 llvm/include/llvm/ADT/STLExtras.h
314730 234 1345 llvm/include/llvm/InitializePasses.h
307036 118 2602 llvm/include/llvm/ADT/APInt.h
213049 59 3611 llvm/include/llvm/Support/MathExtras.h
170422 47 3626 llvm/include/llvm/Support/Compiler.h
162225 45 3605 llvm/include/llvm/ADT/Optional.h
158319 63 2513 llvm/include/llvm/ADT/Triple.h
140322 39 3598 llvm/include/llvm/ADT/StringRef.h
137647 59 2333 llvm/include/llvm/Support/Error.h
131619 73 1803 llvm/include/llvm/Support/FileSystem.h
Before this change, touching InitializePasses.h would cause 1345 files
to recompile. After this change, touching it only causes 550 compiles in
an incremental rebuild.
Reviewers: bkramer, asbirlea, bollu, jdoerfert
Differential Revision: https://reviews.llvm.org/D70211
2019-11-14 05:15:01 +08:00
|
|
|
#include "llvm/InitializePasses.h"
|
2022-03-15 17:54:19 +08:00
|
|
|
#include "llvm/Pass.h"
|
|
|
|
#include "llvm/PassRegistry.h"
|
2016-06-24 21:32:22 +08:00
|
|
|
#include "llvm/Support/CommandLine.h"
|
2007-10-31 11:30:14 +08:00
|
|
|
|
|
|
|
using namespace llvm;
|
|
|
|
|
2019-10-01 23:23:27 +08:00
|
|
|
namespace llvm {
/// Global switch consulted by MachineDominatorTree::verifyAnalysis().
///
/// It defaults to on when the build defines EXPENSIVE_CHECKS and to off
/// otherwise; the "verify-machine-dom-info" command-line option is bound to
/// this variable and can override the default.
#if defined(EXPENSIVE_CHECKS)
bool VerifyMachineDomInfo = true;
#else
bool VerifyMachineDomInfo = false;
#endif
} // namespace llvm
|
|
|
|
|
2016-06-24 21:32:22 +08:00
|
|
|
/// Hidden command-line flag whose value is stored externally, in
/// llvm::VerifyMachineDomInfo, rather than inside the option object.
static cl::opt<bool, true>
    VerifyMachineDomInfoX("verify-machine-dom-info",
                          cl::location(VerifyMachineDomInfo), cl::Hidden,
                          cl::desc("Verify machine dominator info (time "
                                   "consuming)"));
|
|
|
|
|
2009-12-16 08:13:24 +08:00
|
|
|
namespace llvm {
|
2015-07-14 01:21:31 +08:00
|
|
|
template class DomTreeNodeBase<MachineBasicBlock>;
|
2017-07-15 02:26:09 +08:00
|
|
|
template class DominatorTreeBase<MachineBasicBlock, false>; // DomTreeBase
|
2009-12-16 08:13:24 +08:00
|
|
|
}
|
2007-10-31 11:30:14 +08:00
|
|
|
|
2008-01-06 04:15:42 +08:00
|
|
|
// Static pass identifier: handed to the MachineFunctionPass base-class
// constructor and aliased by llvm::MachineDominatorsID further down.
char MachineDominatorTree::ID = 0;
|
|
|
|
|
2010-08-24 01:52:01 +08:00
|
|
|
// Register the pass under the command-line name "machinedomtree". This macro
// expands to the initializeMachineDominatorTreePass() routine invoked from the
// constructor.
INITIALIZE_PASS(MachineDominatorTree,
                "machinedomtree",
                "MachineDominator Tree Construction",
                true,
                true)
|
2008-01-05 04:54:55 +08:00
|
|
|
|
2010-08-07 02:33:48 +08:00
|
|
|
// Publish the pass identifier under the llvm::MachineDominatorsID name; it is
// a reference to MachineDominatorTree::ID, not a separate object.
char &llvm::MachineDominatorsID = MachineDominatorTree::ID;
|
2009-01-06 01:59:02 +08:00
|
|
|
|
|
|
|
/// Describe this pass's analysis requirements in \p AU.
///
/// The pass marks every analysis as preserved and then lets the
/// MachineFunctionPass base class add its own entries.
void MachineDominatorTree::getAnalysisUsage(AnalysisUsage &AU) const {
  // Declare all analyses preserved before delegating to the base class.
  AU.setPreservesAll();

  MachineFunctionPass::getAnalysisUsage(AU);
}
|
|
|
|
|
|
|
|
/// Pass entry point: (re)compute the dominator tree of \p F.
///
/// \returns always false.
bool MachineDominatorTree::runOnMachineFunction(MachineFunction &F) {
  // All the real work lives in calculate().
  calculate(F);

  return false;
}
|
|
|
|
|
|
|
|
/// Rebuild the dominator tree of \p F from scratch.
///
/// Critical-edge splits that were recorded but not yet applied are discarded
/// first, together with the set of blocks those splits introduced; a fresh
/// tree object then replaces the old one and is recalculated over \p F.
void MachineDominatorTree::calculate(MachineFunction &F) {
  // Drop the lazy-update bookkeeping; the tree is recomputed wholesale below,
  // so there is nothing left to patch incrementally.
  NewBBs.clear();
  CriticalEdgesToSplit.clear();

  // Replace (or create) the underlying tree and compute it for this function.
  DT.reset(new DomTreeBase<MachineBasicBlock>());
  DT->recalculate(F);
}
|
|
|
|
|
|
|
|
/// Construct the pass and make sure it is registered with the global
/// PassRegistry.
MachineDominatorTree::MachineDominatorTree() : MachineFunctionPass(ID) {
  PassRegistry &Registry = *PassRegistry::getPassRegistry();
  initializeMachineDominatorTreePass(Registry);
}
|
|
|
|
|
|
|
|
void MachineDominatorTree::releaseMemory() {
|
2017-03-02 20:00:10 +08:00
|
|
|
CriticalEdgesToSplit.clear();
|
|
|
|
DT.reset(nullptr);
|
2009-01-06 01:59:02 +08:00
|
|
|
}
|
2009-08-23 13:17:37 +08:00
|
|
|
|
2016-06-24 21:32:22 +08:00
|
|
|
void MachineDominatorTree::verifyAnalysis() const {
|
2019-10-02 02:27:14 +08:00
|
|
|
if (DT && VerifyMachineDomInfo)
|
2021-10-28 13:19:34 +08:00
|
|
|
if (!DT->verify(MachineDomTree::VerificationLevel::Basic)) {
|
2019-10-02 02:27:14 +08:00
|
|
|
errs() << "MachineDominatorTree verification failed\n";
|
2018-02-28 19:00:08 +08:00
|
|
|
abort();
|
|
|
|
}
|
2016-06-24 21:32:22 +08:00
|
|
|
}
|
|
|
|
|
2009-08-23 14:03:38 +08:00
|
|
|
/// Print the dominator tree to \p OS. Nothing is written when no tree has
/// been computed. The Module argument is unused.
void MachineDominatorTree::print(raw_ostream &OS, const Module *) const {
  if (!DT)
    return;

  DT->print(OS);
}
|
2015-02-28 07:13:13 +08:00
|
|
|
|
|
|
|
void MachineDominatorTree::applySplitCriticalEdges() const {
|
|
|
|
// Bail out early if there is nothing to do.
|
|
|
|
if (CriticalEdgesToSplit.empty())
|
|
|
|
return;
|
|
|
|
|
|
|
|
// For each element in CriticalEdgesToSplit, remember whether or not element
|
|
|
|
// is the new immediate domminator of its successor. The mapping is done by
|
|
|
|
// index, i.e., the information for the ith element of CriticalEdgesToSplit is
|
|
|
|
// the ith element of IsNewIDom.
|
|
|
|
SmallBitVector IsNewIDom(CriticalEdgesToSplit.size(), true);
|
|
|
|
size_t Idx = 0;
|
|
|
|
|
|
|
|
// Collect all the dominance properties info, before invalidating
|
|
|
|
// the underlying DT.
|
|
|
|
for (CriticalEdge &Edge : CriticalEdgesToSplit) {
|
|
|
|
// Update dominator information.
|
|
|
|
MachineBasicBlock *Succ = Edge.ToBB;
|
|
|
|
MachineDomTreeNode *SuccDTNode = DT->getNode(Succ);
|
|
|
|
|
|
|
|
for (MachineBasicBlock *PredBB : Succ->predecessors()) {
|
|
|
|
if (PredBB == Edge.NewBB)
|
|
|
|
continue;
|
|
|
|
// If we are in this situation:
|
|
|
|
// FromBB1 FromBB2
|
|
|
|
// + +
|
|
|
|
// + + + +
|
|
|
|
// + + + +
|
|
|
|
// ... Split1 Split2 ...
|
|
|
|
// + +
|
|
|
|
// + +
|
|
|
|
// +
|
|
|
|
// Succ
|
|
|
|
// Instead of checking the domiance property with Split2, we check it with
|
|
|
|
// FromBB2 since Split2 is still unknown of the underlying DT structure.
|
|
|
|
if (NewBBs.count(PredBB)) {
|
|
|
|
assert(PredBB->pred_size() == 1 && "A basic block resulting from a "
|
|
|
|
"critical edge split has more "
|
|
|
|
"than one predecessor!");
|
|
|
|
PredBB = *PredBB->pred_begin();
|
|
|
|
}
|
|
|
|
if (!DT->dominates(SuccDTNode, DT->getNode(PredBB))) {
|
|
|
|
IsNewIDom[Idx] = false;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
++Idx;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Now, update DT with the collected dominance properties info.
|
|
|
|
Idx = 0;
|
|
|
|
for (CriticalEdge &Edge : CriticalEdgesToSplit) {
|
|
|
|
// We know FromBB dominates NewBB.
|
|
|
|
MachineDomTreeNode *NewDTNode = DT->addNewBlock(Edge.NewBB, Edge.FromBB);
|
|
|
|
|
|
|
|
// If all the other predecessors of "Succ" are dominated by "Succ" itself
|
|
|
|
// then the new block is the new immediate dominator of "Succ". Otherwise,
|
|
|
|
// the new block doesn't dominate anything.
|
|
|
|
if (IsNewIDom[Idx])
|
|
|
|
DT->changeImmediateDominator(DT->getNode(Edge.ToBB), NewDTNode);
|
|
|
|
++Idx;
|
|
|
|
}
|
|
|
|
NewBBs.clear();
|
|
|
|
CriticalEdgesToSplit.clear();
|
|
|
|
}
|