forked from OSchip/llvm-project
[JumpThreading] Unfold selects that depend on the same condition
Summary:
These are good candidates for jump threading. This enables later opts (such as InstCombine) to combine instructions from the selects with instructions outside of the selects. SimplifyCFG will fold the select again if unfolding wasn't worth it.

Patch by James Molloy and Pablo Barrio.

Reviewers: reames, bkramer, mcrosier, gberry, haicheng, jmolloy, sebpop
Subscribers: jojo, rengolin, llvm-commits
Differential Revision: https://reviews.llvm.org/D25477
llvm-svn: 284971
This commit is contained in:
parent
16706dcbd4
commit
f9e0d0b7d0
|
@ -129,6 +129,8 @@ private:
|
|||
BasicBlock *NewBB, BasicBlock *SuccBB);
|
||||
/// Check if the block has profile metadata for its outgoing edges.
|
||||
bool doesBlockHaveProfileData(BasicBlock *BB);
|
||||
SelectInst *getSelectFedByPhi(PHINode *PN);
|
||||
void expandSelect(SelectInst *SI);
|
||||
};
|
||||
|
||||
} // end namespace llvm
|
||||
|
|
|
@ -1963,51 +1963,45 @@ bool JumpThreadingPass::TryToUnfoldSelect(CmpInst *CondCmp, BasicBlock *BB) {
|
|||
return false;
|
||||
}
|
||||
|
||||
/// TryToUnfoldSelectInCurrBB - Look for PHI/Select in the same BB of the form
|
||||
/// getSelectFedByPhi - Look for PHI/Select in the same BB of the form
|
||||
/// bb:
|
||||
/// %p = phi [false, %bb1], [true, %bb2], [false, %bb3], [true, %bb4], ...
|
||||
/// %s = select p, trueval, falseval
|
||||
///
|
||||
/// And expand the select into a branch structure. This later enables
|
||||
/// And return the select. Unfolding it into a branch structure later enables
|
||||
/// jump-threading over bb in this pass.
|
||||
///
|
||||
/// Using the similar approach of SimplifyCFG::FoldCondBranchOnPHI(), unfold
|
||||
/// select if the associated PHI has at least one constant. If the unfolded
|
||||
/// select is not jump-threaded, it will be folded again in the later
|
||||
/// optimizations.
|
||||
bool JumpThreadingPass::TryToUnfoldSelectInCurrBB(BasicBlock *BB) {
|
||||
// If threading this would thread across a loop header, don't thread the edge.
|
||||
// See the comments above FindLoopHeaders for justifications and caveats.
|
||||
if (LoopHeaders.count(BB))
|
||||
return false;
|
||||
/// Using an approach similar to SimplifyCFG::FoldCondBranchOnPHI(), return
|
||||
/// select if the associated PHI has at least one constant.
|
||||
SelectInst *JumpThreadingPass::getSelectFedByPhi(PHINode *PN) {
|
||||
|
||||
// Look for a Phi/Select pair in the same basic block. The Phi feeds the
|
||||
// condition of the Select and at least one of the incoming values is a
|
||||
// constant.
|
||||
for (BasicBlock::iterator BI = BB->begin();
|
||||
PHINode *PN = dyn_cast<PHINode>(BI); ++BI) {
|
||||
unsigned NumPHIValues = PN->getNumIncomingValues();
|
||||
if (NumPHIValues == 0 || !PN->hasOneUse())
|
||||
continue;
|
||||
return nullptr;
|
||||
|
||||
SelectInst *SI = dyn_cast<SelectInst>(PN->user_back());
|
||||
BasicBlock *BB = PN->getParent();
|
||||
if (!SI || SI->getParent() != BB)
|
||||
continue;
|
||||
return nullptr;
|
||||
|
||||
Value *Cond = SI->getCondition();
|
||||
if (!Cond || Cond != PN || !Cond->getType()->isIntegerTy(1))
|
||||
continue;
|
||||
return nullptr;
|
||||
|
||||
bool HasConst = false;
|
||||
for (unsigned i = 0; i != NumPHIValues; ++i) {
|
||||
if (PN->getIncomingBlock(i) == BB)
|
||||
return false;
|
||||
return nullptr;
|
||||
if (isa<ConstantInt>(PN->getIncomingValue(i)))
|
||||
HasConst = true;
|
||||
return SI;
|
||||
}
|
||||
|
||||
if (HasConst) {
|
||||
// Expand the select.
|
||||
return nullptr;
|
||||
}
|
||||
|
||||
/// expandSelect - Expand a select into an if-then-else construct.
|
||||
void JumpThreadingPass::expandSelect(SelectInst *SI) {
|
||||
|
||||
BasicBlock *BB = SI->getParent();
|
||||
TerminatorInst *Term =
|
||||
SplitBlockAndInsertIfThen(SI->getCondition(), SI, false);
|
||||
PHINode *NewPN = PHINode::Create(SI->getType(), 2, "", SI);
|
||||
|
@ -2015,9 +2009,50 @@ bool JumpThreadingPass::TryToUnfoldSelectInCurrBB(BasicBlock *BB) {
|
|||
NewPN->addIncoming(SI->getFalseValue(), BB);
|
||||
SI->replaceAllUsesWith(NewPN);
|
||||
SI->eraseFromParent();
|
||||
return true;
|
||||
}
|
||||
|
||||
/// TryToUnfoldSelectInCurrBB - Unfold selects that could be jump-threaded were
|
||||
/// they if-then-elses. If the unfolded selects are not jump-threaded, they will
|
||||
/// be folded again in the later optimizations.
|
||||
bool JumpThreadingPass::TryToUnfoldSelectInCurrBB(BasicBlock *BB) {
|
||||
|
||||
// If threading this would thread across a loop header, don't thread the edge.
|
||||
// See the comments above FindLoopHeaders for justifications and caveats.
|
||||
if (LoopHeaders.count(BB))
|
||||
return false;
|
||||
|
||||
bool Changed = false;
|
||||
for (auto &I : *BB) {
|
||||
|
||||
// Look for a Phi/Select pair in the same basic block. The Phi feeds the
|
||||
// condition of the Select and at least one of the incoming values is a
|
||||
// constant.
|
||||
PHINode *PN;
|
||||
SelectInst *SI;
|
||||
if ((PN = dyn_cast<PHINode>(&I)) && (SI = getSelectFedByPhi(PN))) {
|
||||
expandSelect(SI);
|
||||
Changed = true;
|
||||
continue;
|
||||
}
|
||||
|
||||
if (I.getType()->isIntegerTy(1)) {
|
||||
|
||||
SmallVector<SelectInst *, 4> Selects;
|
||||
|
||||
// Look for scalar booleans used in selects as conditions. If there are
|
||||
// several selects that use the same boolean, they are candidates for jump
|
||||
// threading and therefore we should unfold them.
|
||||
for (Value *U : I.users())
|
||||
if (auto *SI = dyn_cast<SelectInst>(U))
|
||||
Selects.push_back(SI);
|
||||
if (Selects.size() <= 1)
|
||||
continue;
|
||||
|
||||
Changed = true;
|
||||
for (auto *SI : Selects)
|
||||
expandSelect(SI);
|
||||
}
|
||||
}
|
||||
|
||||
return false;
|
||||
return Changed;
|
||||
}
|
||||
|
|
|
@ -0,0 +1,23 @@
|
|||
; RUN: opt < %s -jump-threading -instcombine -simplifycfg -S | FileCheck %s
|
||||
|
||||
; The three selects are jump-threaded so that instcombine can optimize, and
|
||||
; simplifycfg should turn the result into a single select.
|
||||
define i32 @f(i32 %a, i32 %b) {
|
||||
; CHECK: select
|
||||
; CHECK-NOT: select
|
||||
entry:
|
||||
%0 = and i32 %a, 1
|
||||
%1 = and i32 %b, 1
|
||||
%xor = xor i32 %1, %a
|
||||
%shr32 = lshr i32 %a, 1
|
||||
%cmp10 = icmp eq i32 %xor, 1
|
||||
%2 = xor i32 %b, 12345
|
||||
%b.addr.1 = select i1 %cmp10, i32 %2, i32 %b
|
||||
%shr1633 = lshr i32 %b.addr.1, 1
|
||||
%3 = or i32 %shr1633, 54321
|
||||
%b.addr.2 = select i1 %cmp10, i32 %3, i32 %shr1633
|
||||
%shr1634 = lshr i32 %b.addr.2, 2
|
||||
%4 = or i32 %shr1634, 54320
|
||||
%b.addr.3 = select i1 %cmp10, i32 %4, i32 %shr1634
|
||||
ret i32 %b.addr.3
|
||||
}
|
Loading…
Reference in New Issue