2012-12-20 06:10:31 +08:00
|
|
|
//===-- SIAnnotateControlFlow.cpp - ------------------===//
|
|
|
|
//
|
|
|
|
// The LLVM Compiler Infrastructure
|
|
|
|
//
|
|
|
|
// This file is distributed under the University of Illinois Open Source
|
|
|
|
// License. See LICENSE.TXT for details.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
//
|
|
|
|
/// \file
|
|
|
|
/// Annotates the control flow with hardware-specific intrinsics.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#include "AMDGPU.h"
|
2013-01-02 18:22:59 +08:00
|
|
|
#include "llvm/ADT/DepthFirstIterator.h"
|
2016-02-13 07:45:29 +08:00
|
|
|
#include "llvm/Analysis/DivergenceAnalysis.h"
|
R600/SI: Fix bug from insertion of llvm.SI.end.cf into loop headers
The llvm.SI.end.cf intrinsic is used to mark the end of if-then blocks,
if-then-else blocks, and loops. It is responsible for updating the
exec mask to re-enable threads that had been masked during the preceding
control flow block. For example:
s_mov_b64 exec, 0x3 ; Initial exec mask
s_mov_b64 s[0:1], exec ; Saved exec mask
v_cmpx_gt_u32 exec, s[2:3], v0, 0 ; llvm.SI.if
do_stuff()
s_or_b64 exec, exec, s[0:1] ; llvm.SI.end.cf
The bug fixed by this patch was one where the llvm.SI.end.cf intrinsic
was being inserted into the header of loops. This would happen when
an if block terminated in a loop header and we would end up with
code like this:
s_mov_b64 exec, 0x3 ; Initial exec mask
s_mov_b64 s[0:1], exec ; Saved exec mask
v_cmpx_gt_u32 exec, s[2:3], v0, 0 ; llvm.SI.if
do_stuff()
LOOP: ; Start of loop header
s_or_b64 exec, exec, s[0:1] ; llvm.SI.end.cf <-BUG: The exec mask has the
same value at the beginning of each loop
iteration.
do_stuff();
s_cbranch_execnz LOOP
The fix is to create a new basic block before the loop and insert the
llvm.SI.end.cf there. This way the exec mask is restored before the
start of the loop instead of at the beginning of each iteration.
llvm-svn: 228302
2015-02-05 23:32:15 +08:00
|
|
|
#include "llvm/Analysis/LoopInfo.h"
|
2013-06-08 04:28:43 +08:00
|
|
|
#include "llvm/IR/Constants.h"
|
2014-01-13 17:26:24 +08:00
|
|
|
#include "llvm/IR/Dominators.h"
|
2013-06-08 04:28:43 +08:00
|
|
|
#include "llvm/IR/Instructions.h"
|
2013-01-02 19:36:10 +08:00
|
|
|
#include "llvm/IR/Module.h"
|
2013-01-02 18:22:59 +08:00
|
|
|
#include "llvm/Pass.h"
|
2012-12-20 06:10:31 +08:00
|
|
|
#include "llvm/Transforms/Utils/BasicBlockUtils.h"
|
|
|
|
#include "llvm/Transforms/Utils/SSAUpdater.h"
|
|
|
|
|
|
|
|
using namespace llvm;
|
|
|
|
|
2014-04-22 10:41:26 +08:00
|
|
|
#define DEBUG_TYPE "si-annotate-control-flow"
|
|
|
|
|
2012-12-20 06:10:31 +08:00
|
|
|
namespace {
|
|
|
|
|
|
|
|
// Complex types used in this pass
|
|
|
|
typedef std::pair<BasicBlock *, Value *> StackEntry;
|
|
|
|
typedef SmallVector<StackEntry, 16> StackVector;
|
|
|
|
|
|
|
|
// Names of the intrinsics that this pass inserts to annotate control flow.
static const char IfIntrinsic[] = "llvm.amdgcn.if";
static const char ElseIntrinsic[] = "llvm.amdgcn.else";
static const char BreakIntrinsic[] = "llvm.amdgcn.break";
static const char IfBreakIntrinsic[] = "llvm.amdgcn.if.break";
static const char ElseBreakIntrinsic[] = "llvm.amdgcn.else.break";
static const char LoopIntrinsic[] = "llvm.amdgcn.loop";
static const char EndCfIntrinsic[] = "llvm.amdgcn.end.cf";
|
2012-12-20 06:10:31 +08:00
|
|
|
|
|
|
|
class SIAnnotateControlFlow : public FunctionPass {
|
2016-02-13 07:45:29 +08:00
|
|
|
DivergenceAnalysis *DA;
|
2012-12-20 06:10:31 +08:00
|
|
|
|
|
|
|
Type *Boolean;
|
|
|
|
Type *Void;
|
|
|
|
Type *Int64;
|
|
|
|
Type *ReturnStruct;
|
|
|
|
|
|
|
|
ConstantInt *BoolTrue;
|
|
|
|
ConstantInt *BoolFalse;
|
|
|
|
UndefValue *BoolUndef;
|
|
|
|
Constant *Int64Zero;
|
|
|
|
|
|
|
|
Constant *If;
|
|
|
|
Constant *Else;
|
|
|
|
Constant *Break;
|
|
|
|
Constant *IfBreak;
|
|
|
|
Constant *ElseBreak;
|
|
|
|
Constant *Loop;
|
|
|
|
Constant *EndCf;
|
|
|
|
|
|
|
|
DominatorTree *DT;
|
|
|
|
StackVector Stack;
|
|
|
|
|
R600/SI: Fix bug from insertion of llvm.SI.end.cf into loop headers
The llvm.SI.end.cf intrinsic is used to mark the end of if-then blocks,
if-then-else blocks, and loops. It is responsible for updating the
exec mask to re-enable threads that had been masked during the preceding
control flow block. For example:
s_mov_b64 exec, 0x3 ; Initial exec mask
s_mov_b64 s[0:1], exec ; Saved exec mask
v_cmpx_gt_u32 exec, s[2:3], v0, 0 ; llvm.SI.if
do_stuff()
s_or_b64 exec, exec, s[0:1] ; llvm.SI.end.cf
The bug fixed by this patch was one where the llvm.SI.end.cf intrinsic
was being inserted into the header of loops. This would happen when
an if block terminated in a loop header and we would end up with
code like this:
s_mov_b64 exec, 0x3 ; Initial exec mask
s_mov_b64 s[0:1], exec ; Saved exec mask
v_cmpx_gt_u32 exec, s[2:3], v0, 0 ; llvm.SI.if
do_stuff()
LOOP: ; Start of loop header
s_or_b64 exec, exec, s[0:1] ; llvm.SI.end.cf <-BUG: The exec mask has the
same value at the beginning of each loop
iteration.
do_stuff();
s_cbranch_execnz LOOP
The fix is to create a new basic block before the loop and insert the
llvm.SI.end.cf there. This way the exec mask is restored before the
start of the loop instead of at the beginning of each iteration.
llvm-svn: 228302
2015-02-05 23:32:15 +08:00
|
|
|
LoopInfo *LI;
|
|
|
|
|
2016-04-15 01:42:35 +08:00
|
|
|
bool isUniform(BranchInst *T);
|
|
|
|
|
2012-12-20 06:10:31 +08:00
|
|
|
bool isTopOfStack(BasicBlock *BB);
|
|
|
|
|
|
|
|
Value *popSaved();
|
|
|
|
|
|
|
|
void push(BasicBlock *BB, Value *Saved);
|
|
|
|
|
|
|
|
bool isElse(PHINode *Phi);
|
|
|
|
|
|
|
|
void eraseIfUnused(PHINode *Phi);
|
|
|
|
|
|
|
|
void openIf(BranchInst *Term);
|
|
|
|
|
|
|
|
void insertElse(BranchInst *Term);
|
|
|
|
|
2016-02-13 01:11:04 +08:00
|
|
|
Value *handleLoopCondition(Value *Cond, PHINode *Broken,
|
|
|
|
llvm::Loop *L, BranchInst *Term);
|
2012-12-20 06:10:31 +08:00
|
|
|
|
|
|
|
void handleLoop(BranchInst *Term);
|
|
|
|
|
|
|
|
void closeControlFlow(BasicBlock *BB);
|
|
|
|
|
|
|
|
public:
|
2016-01-20 23:48:27 +08:00
|
|
|
static char ID;
|
|
|
|
|
2012-12-20 06:10:31 +08:00
|
|
|
SIAnnotateControlFlow():
|
|
|
|
FunctionPass(ID) { }
|
|
|
|
|
2014-04-29 15:57:24 +08:00
|
|
|
bool doInitialization(Module &M) override;
|
2012-12-20 06:10:31 +08:00
|
|
|
|
2014-04-29 15:57:24 +08:00
|
|
|
bool runOnFunction(Function &F) override;
|
2012-12-20 06:10:31 +08:00
|
|
|
|
2014-04-29 15:57:24 +08:00
|
|
|
const char *getPassName() const override {
|
2012-12-20 06:10:31 +08:00
|
|
|
return "SI annotate control flow";
|
|
|
|
}
|
|
|
|
|
2014-04-29 15:57:24 +08:00
|
|
|
void getAnalysisUsage(AnalysisUsage &AU) const override {
|
R600/SI: Fix bug from insertion of llvm.SI.end.cf into loop headers
The llvm.SI.end.cf intrinsic is used to mark the end of if-then blocks,
if-then-else blocks, and loops. It is responsible for updating the
exec mask to re-enable threads that had been masked during the preceding
control flow block. For example:
s_mov_b64 exec, 0x3 ; Initial exec mask
s_mov_b64 s[0:1], exec ; Saved exec mask
v_cmpx_gt_u32 exec, s[2:3], v0, 0 ; llvm.SI.if
do_stuff()
s_or_b64 exec, exec, s[0:1] ; llvm.SI.end.cf
The bug fixed by this patch was one where the llvm.SI.end.cf intrinsic
was being inserted into the header of loops. This would happen when
an if block terminated in a loop header and we would end up with
code like this:
s_mov_b64 exec, 0x3 ; Initial exec mask
s_mov_b64 s[0:1], exec ; Saved exec mask
v_cmpx_gt_u32 exec, s[2:3], v0, 0 ; llvm.SI.if
do_stuff()
LOOP: ; Start of loop header
s_or_b64 exec, exec, s[0:1] ; llvm.SI.end.cf <-BUG: The exec mask has the
same value at the beginning of each loop
iteration.
do_stuff();
s_cbranch_execnz LOOP
The fix is to create a new basic block before the loop and insert the
llvm.SI.end.cf there. This way the exec mask is restored before the
start of the loop instead of at the beginning of each iteration.
llvm-svn: 228302
2015-02-05 23:32:15 +08:00
|
|
|
AU.addRequired<LoopInfoWrapperPass>();
|
2014-01-13 21:07:17 +08:00
|
|
|
AU.addRequired<DominatorTreeWrapperPass>();
|
2016-02-13 07:45:29 +08:00
|
|
|
AU.addRequired<DivergenceAnalysis>();
|
2014-01-13 21:07:17 +08:00
|
|
|
AU.addPreserved<DominatorTreeWrapperPass>();
|
2012-12-20 06:10:31 +08:00
|
|
|
FunctionPass::getAnalysisUsage(AU);
|
|
|
|
}
|
|
|
|
|
|
|
|
};
|
|
|
|
|
|
|
|
} // end anonymous namespace
|
|
|
|
|
2016-01-20 23:48:27 +08:00
|
|
|
// Pass registration. Every analysis that getAnalysisUsage() marks as required
// is listed as a dependency so that it is initialized together with this
// pass. The initialize*Pass declarations used by these macros are expected to
// come from the same header that already provides the one for
// DivergenceAnalysis.
INITIALIZE_PASS_BEGIN(SIAnnotateControlFlow, DEBUG_TYPE,
                      "Annotate SI Control Flow", false, false)
INITIALIZE_PASS_DEPENDENCY(LoopInfoWrapperPass)
INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass)
INITIALIZE_PASS_DEPENDENCY(DivergenceAnalysis)
INITIALIZE_PASS_END(SIAnnotateControlFlow, DEBUG_TYPE,
                    "Annotate SI Control Flow", false, false)
|
|
|
|
|
2012-12-20 06:10:31 +08:00
|
|
|
// Definition of the pass identifier that the constructor passes to
// FunctionPass.
char SIAnnotateControlFlow::ID = 0;
|
|
|
|
|
|
|
|
/// \brief Initialize all the types and constants used in the pass
|
|
|
|
bool SIAnnotateControlFlow::doInitialization(Module &M) {
|
|
|
|
LLVMContext &Context = M.getContext();
|
|
|
|
|
|
|
|
Void = Type::getVoidTy(Context);
|
|
|
|
Boolean = Type::getInt1Ty(Context);
|
|
|
|
Int64 = Type::getInt64Ty(Context);
|
2014-04-25 13:30:21 +08:00
|
|
|
ReturnStruct = StructType::get(Boolean, Int64, (Type *)nullptr);
|
2012-12-20 06:10:31 +08:00
|
|
|
|
|
|
|
BoolTrue = ConstantInt::getTrue(Context);
|
|
|
|
BoolFalse = ConstantInt::getFalse(Context);
|
|
|
|
BoolUndef = UndefValue::get(Boolean);
|
|
|
|
Int64Zero = ConstantInt::get(Int64, 0);
|
|
|
|
|
|
|
|
If = M.getOrInsertFunction(
|
2014-04-25 13:30:21 +08:00
|
|
|
IfIntrinsic, ReturnStruct, Boolean, (Type *)nullptr);
|
2012-12-20 06:10:31 +08:00
|
|
|
|
|
|
|
Else = M.getOrInsertFunction(
|
2014-04-25 13:30:21 +08:00
|
|
|
ElseIntrinsic, ReturnStruct, Int64, (Type *)nullptr);
|
2012-12-20 06:10:31 +08:00
|
|
|
|
|
|
|
Break = M.getOrInsertFunction(
|
2014-04-25 13:30:21 +08:00
|
|
|
BreakIntrinsic, Int64, Int64, (Type *)nullptr);
|
2012-12-20 06:10:31 +08:00
|
|
|
|
|
|
|
IfBreak = M.getOrInsertFunction(
|
2014-04-25 13:30:21 +08:00
|
|
|
IfBreakIntrinsic, Int64, Boolean, Int64, (Type *)nullptr);
|
2012-12-20 06:10:31 +08:00
|
|
|
|
|
|
|
ElseBreak = M.getOrInsertFunction(
|
2014-04-25 13:30:21 +08:00
|
|
|
ElseBreakIntrinsic, Int64, Int64, Int64, (Type *)nullptr);
|
2012-12-20 06:10:31 +08:00
|
|
|
|
|
|
|
Loop = M.getOrInsertFunction(
|
2014-04-25 13:30:21 +08:00
|
|
|
LoopIntrinsic, Boolean, Int64, (Type *)nullptr);
|
2012-12-20 06:10:31 +08:00
|
|
|
|
|
|
|
EndCf = M.getOrInsertFunction(
|
2014-04-25 13:30:21 +08:00
|
|
|
EndCfIntrinsic, Void, Int64, (Type *)nullptr);
|
2012-12-20 06:10:31 +08:00
|
|
|
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2016-04-15 01:42:35 +08:00
|
|
|
/// \brief Is the branch condition uniform or did the StructurizeCFG pass
|
|
|
|
/// consider it as such?
|
|
|
|
bool SIAnnotateControlFlow::isUniform(BranchInst *T) {
|
|
|
|
return DA->isUniform(T->getCondition()) ||
|
|
|
|
T->getMetadata("structurizecfg.uniform") != nullptr;
|
|
|
|
}
|
|
|
|
|
2012-12-20 06:10:31 +08:00
|
|
|
/// \brief Is BB the last block saved on the stack ?
|
|
|
|
bool SIAnnotateControlFlow::isTopOfStack(BasicBlock *BB) {
|
2013-02-14 16:00:33 +08:00
|
|
|
return !Stack.empty() && Stack.back().first == BB;
|
2012-12-20 06:10:31 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/// \brief Pop the last saved value from the control flow stack
|
|
|
|
Value *SIAnnotateControlFlow::popSaved() {
|
|
|
|
return Stack.pop_back_val().second;
|
|
|
|
}
|
|
|
|
|
|
|
|
/// \brief Push a BB and saved value to the control flow stack
|
|
|
|
void SIAnnotateControlFlow::push(BasicBlock *BB, Value *Saved) {
|
|
|
|
Stack.push_back(std::make_pair(BB, Saved));
|
|
|
|
}
|
|
|
|
|
|
|
|
/// \brief Can the condition represented by this PHI node treated like
|
|
|
|
/// an "Else" block?
|
|
|
|
bool SIAnnotateControlFlow::isElse(PHINode *Phi) {
|
|
|
|
BasicBlock *IDom = DT->getNode(Phi->getParent())->getIDom()->getBlock();
|
|
|
|
for (unsigned i = 0, e = Phi->getNumIncomingValues(); i != e; ++i) {
|
|
|
|
if (Phi->getIncomingBlock(i) == IDom) {
|
|
|
|
|
|
|
|
if (Phi->getIncomingValue(i) != BoolTrue)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
} else {
|
|
|
|
if (Phi->getIncomingValue(i) != BoolFalse)
|
|
|
|
return false;
|
2014-06-21 01:06:02 +08:00
|
|
|
|
2012-12-20 06:10:31 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
// \brief Erase "Phi" if it is not used any more
|
|
|
|
void SIAnnotateControlFlow::eraseIfUnused(PHINode *Phi) {
|
|
|
|
if (!Phi->hasNUsesOrMore(1))
|
|
|
|
Phi->eraseFromParent();
|
|
|
|
}
|
|
|
|
|
|
|
|
/// \brief Open a new "If" block
|
|
|
|
void SIAnnotateControlFlow::openIf(BranchInst *Term) {
|
2016-04-15 01:42:35 +08:00
|
|
|
if (isUniform(Term)) {
|
2016-02-13 07:45:29 +08:00
|
|
|
return;
|
|
|
|
}
|
2012-12-20 06:10:31 +08:00
|
|
|
Value *Ret = CallInst::Create(If, Term->getCondition(), "", Term);
|
|
|
|
Term->setCondition(ExtractValueInst::Create(Ret, 0, "", Term));
|
|
|
|
push(Term->getSuccessor(1), ExtractValueInst::Create(Ret, 1, "", Term));
|
|
|
|
}
|
|
|
|
|
|
|
|
/// \brief Close the last "If" block and open a new "Else" block
|
|
|
|
void SIAnnotateControlFlow::insertElse(BranchInst *Term) {
|
2016-04-15 01:42:35 +08:00
|
|
|
if (isUniform(Term)) {
|
2016-02-13 07:45:29 +08:00
|
|
|
return;
|
|
|
|
}
|
2012-12-20 06:10:31 +08:00
|
|
|
Value *Ret = CallInst::Create(Else, popSaved(), "", Term);
|
|
|
|
Term->setCondition(ExtractValueInst::Create(Ret, 0, "", Term));
|
|
|
|
push(Term->getSuccessor(1), ExtractValueInst::Create(Ret, 1, "", Term));
|
|
|
|
}
|
|
|
|
|
|
|
|
/// \brief Recursively handle the condition leading to a loop
|
2015-04-14 22:36:45 +08:00
|
|
|
Value *SIAnnotateControlFlow::handleLoopCondition(Value *Cond, PHINode *Broken,
|
2016-02-13 01:11:04 +08:00
|
|
|
llvm::Loop *L, BranchInst *Term) {
|
2015-05-01 11:44:08 +08:00
|
|
|
|
|
|
|
// Only search through PHI nodes which are inside the loop. If we try this
|
|
|
|
// with PHI nodes that are outside of the loop, we end up inserting new PHI
|
|
|
|
// nodes outside of the loop which depend on values defined inside the loop.
|
|
|
|
// This will break the module with
|
|
|
|
// 'Instruction does not dominate all users!' errors.
|
|
|
|
PHINode *Phi = nullptr;
|
|
|
|
if ((Phi = dyn_cast<PHINode>(Cond)) && L->contains(Phi)) {
|
|
|
|
|
2014-06-21 01:06:02 +08:00
|
|
|
BasicBlock *Parent = Phi->getParent();
|
|
|
|
PHINode *NewPhi = PHINode::Create(Int64, 0, "", &Parent->front());
|
|
|
|
Value *Ret = NewPhi;
|
2012-12-20 06:10:31 +08:00
|
|
|
|
2013-12-05 13:44:44 +08:00
|
|
|
// Handle all non-constant incoming values first
|
2012-12-20 06:10:31 +08:00
|
|
|
for (unsigned i = 0, e = Phi->getNumIncomingValues(); i != e; ++i) {
|
|
|
|
Value *Incoming = Phi->getIncomingValue(i);
|
2014-06-21 01:06:02 +08:00
|
|
|
BasicBlock *From = Phi->getIncomingBlock(i);
|
|
|
|
if (isa<ConstantInt>(Incoming)) {
|
|
|
|
NewPhi->addIncoming(Broken, From);
|
2012-12-20 06:10:31 +08:00
|
|
|
continue;
|
2014-06-21 01:06:02 +08:00
|
|
|
}
|
2012-12-20 06:10:31 +08:00
|
|
|
|
|
|
|
Phi->setIncomingValue(i, BoolFalse);
|
2016-02-13 01:11:04 +08:00
|
|
|
Value *PhiArg = handleLoopCondition(Incoming, Broken, L, Term);
|
2014-06-21 01:06:02 +08:00
|
|
|
NewPhi->addIncoming(PhiArg, From);
|
2012-12-20 06:10:31 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
BasicBlock *IDom = DT->getNode(Parent)->getIDom()->getBlock();
|
|
|
|
|
|
|
|
for (unsigned i = 0, e = Phi->getNumIncomingValues(); i != e; ++i) {
|
|
|
|
|
|
|
|
Value *Incoming = Phi->getIncomingValue(i);
|
|
|
|
if (Incoming != BoolTrue)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
BasicBlock *From = Phi->getIncomingBlock(i);
|
|
|
|
if (From == IDom) {
|
2016-04-13 00:10:38 +08:00
|
|
|
// We're in the following situation:
|
|
|
|
// IDom/From
|
|
|
|
// | \
|
|
|
|
// | If-block
|
|
|
|
// | /
|
|
|
|
// Parent
|
|
|
|
// where we want to break out of the loop if the If-block is not taken.
|
|
|
|
// Due to the depth-first traversal, there should be an end.cf
|
|
|
|
// intrinsic in Parent, and we insert an else.break before it.
|
|
|
|
//
|
|
|
|
// Note that the end.cf need not be the first non-phi instruction
|
|
|
|
// of parent, particularly when we're dealing with a multi-level
|
|
|
|
// break, but it should occur within a group of intrinsic calls
|
|
|
|
// at the beginning of the block.
|
2012-12-20 06:10:31 +08:00
|
|
|
CallInst *OldEnd = dyn_cast<CallInst>(Parent->getFirstInsertionPt());
|
2016-04-13 00:10:38 +08:00
|
|
|
while (OldEnd && OldEnd->getCalledFunction() != EndCf)
|
|
|
|
OldEnd = dyn_cast<CallInst>(OldEnd->getNextNode());
|
2012-12-20 06:10:31 +08:00
|
|
|
if (OldEnd && OldEnd->getCalledFunction() == EndCf) {
|
2014-06-21 01:06:02 +08:00
|
|
|
Value *Args[] = { OldEnd->getArgOperand(0), NewPhi };
|
|
|
|
Ret = CallInst::Create(ElseBreak, Args, "", OldEnd);
|
2012-12-20 06:10:31 +08:00
|
|
|
continue;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
TerminatorInst *Insert = From->getTerminator();
|
2014-06-21 01:06:02 +08:00
|
|
|
Value *PhiArg = CallInst::Create(Break, Broken, "", Insert);
|
|
|
|
NewPhi->setIncomingValue(i, PhiArg);
|
2012-12-20 06:10:31 +08:00
|
|
|
}
|
|
|
|
eraseIfUnused(Phi);
|
2014-06-21 01:06:02 +08:00
|
|
|
return Ret;
|
2012-12-20 06:10:31 +08:00
|
|
|
|
|
|
|
} else if (Instruction *Inst = dyn_cast<Instruction>(Cond)) {
|
|
|
|
BasicBlock *Parent = Inst->getParent();
|
2015-04-14 22:36:45 +08:00
|
|
|
Instruction *Insert;
|
|
|
|
if (L->contains(Inst)) {
|
|
|
|
Insert = Parent->getTerminator();
|
|
|
|
} else {
|
|
|
|
Insert = L->getHeader()->getFirstNonPHIOrDbgOrLifetime();
|
|
|
|
}
|
2014-06-21 01:06:02 +08:00
|
|
|
Value *Args[] = { Cond, Broken };
|
|
|
|
return CallInst::Create(IfBreak, Args, "", Insert);
|
2012-12-20 06:10:31 +08:00
|
|
|
|
2016-02-13 01:11:04 +08:00
|
|
|
// Insert IfBreak before TERM for constant COND.
|
|
|
|
} else if (isa<ConstantInt>(Cond)) {
|
|
|
|
Value *Args[] = { Cond, Broken };
|
|
|
|
return CallInst::Create(IfBreak, Args, "", Term);
|
|
|
|
|
2012-12-20 06:10:31 +08:00
|
|
|
} else {
|
2013-12-11 05:37:42 +08:00
|
|
|
llvm_unreachable("Unhandled loop condition!");
|
2012-12-20 06:10:31 +08:00
|
|
|
}
|
2014-06-21 01:06:02 +08:00
|
|
|
return 0;
|
2012-12-20 06:10:31 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/// \brief Handle a back edge (loop)
|
|
|
|
void SIAnnotateControlFlow::handleLoop(BranchInst *Term) {
|
2016-04-15 01:42:35 +08:00
|
|
|
if (isUniform(Term)) {
|
2016-02-13 07:45:29 +08:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2015-04-14 22:36:45 +08:00
|
|
|
BasicBlock *BB = Term->getParent();
|
|
|
|
llvm::Loop *L = LI->getLoopFor(BB);
|
2012-12-20 06:10:31 +08:00
|
|
|
BasicBlock *Target = Term->getSuccessor(1);
|
|
|
|
PHINode *Broken = PHINode::Create(Int64, 0, "", &Target->front());
|
|
|
|
|
|
|
|
Value *Cond = Term->getCondition();
|
|
|
|
Term->setCondition(BoolTrue);
|
2016-02-13 01:11:04 +08:00
|
|
|
Value *Arg = handleLoopCondition(Cond, Broken, L, Term);
|
2012-12-20 06:10:31 +08:00
|
|
|
|
|
|
|
for (pred_iterator PI = pred_begin(Target), PE = pred_end(Target);
|
|
|
|
PI != PE; ++PI) {
|
|
|
|
|
|
|
|
Broken->addIncoming(*PI == BB ? Arg : Int64Zero, *PI);
|
|
|
|
}
|
|
|
|
|
|
|
|
Term->setCondition(CallInst::Create(Loop, Arg, "", Term));
|
|
|
|
push(Term->getSuccessor(0), Arg);
|
R600/SI: Fix bug from insertion of llvm.SI.end.cf into loop headers
The llvm.SI.end.cf intrinsic is used to mark the end of if-then blocks,
if-then-else blocks, and loops. It is responsible for updating the
exec mask to re-enable threads that had been masked during the preceding
control flow block. For example:
s_mov_b64 exec, 0x3 ; Initial exec mask
s_mov_b64 s[0:1], exec ; Saved exec mask
v_cmpx_gt_u32 exec, s[2:3], v0, 0 ; llvm.SI.if
do_stuff()
s_or_b64 exec, exec, s[0:1] ; llvm.SI.end.cf
The bug fixed by this patch was one where the llvm.SI.end.cf intrinsic
was being inserted into the header of loops. This would happen when
an if block terminated in a loop header and we would end up with
code like this:
s_mov_b64 exec, 0x3 ; Initial exec mask
s_mov_b64 s[0:1], exec ; Saved exec mask
v_cmpx_gt_u32 exec, s[2:3], v0, 0 ; llvm.SI.if
do_stuff()
LOOP: ; Start of loop header
s_or_b64 exec, exec, s[0:1] ; llvm.SI.end.cf <-BUG: The exec mask has the
same value at the beginning of each loop
iteration.
do_stuff();
s_cbranch_execnz LOOP
The fix is to create a new basic block before the loop and insert the
llvm.SI.end.cf there. This way the exec mask is restored before the
start of the loop instead of at the beginning of each iteration.
llvm-svn: 228302
2015-02-05 23:32:15 +08:00
|
|
|
}/// \brief Close the last opened control flow
|
2012-12-20 06:10:31 +08:00
|
|
|
/// Pops the top entry of the control flow stack, which must belong to \p BB,
/// and, unless the popped value is undef, inserts an end.cf call on it at the
/// first insertion point of the block. If \p BB is a loop header, its
/// non-latch predecessors are first split off into a new "endcf.split" block
/// and the call is placed in that block instead.
void SIAnnotateControlFlow::closeControlFlow(BasicBlock *BB) {
  llvm::Loop *L = LI->getLoopFor(BB);

  assert(Stack.back().first == BB);

  const bool IsLoopHeader = L && L->getHeader() == BB;
  if (IsLoopHeader) {
    // We can't insert an EndCF call into a loop header, because it will
    // get executed on every iteration of the loop, when it should be
    // executed only once before the loop.
    SmallVector<BasicBlock *, 8> Latches;
    L->getLoopLatches(Latches);

    // Collect every predecessor that is not a latch of the loop.
    std::vector<BasicBlock *> Preds;
    for (BasicBlock *Pred : predecessors(BB)) {
      const bool IsLatch =
          std::find(Latches.begin(), Latches.end(), Pred) != Latches.end();
      if (!IsLatch)
        Preds.push_back(Pred);
    }

    BB = llvm::SplitBlockPredecessors(BB, Preds, "endcf.split", DT, LI, false);
  }

  Value *Exec = popSaved();
  if (isa<UndefValue>(Exec))
    return;

  CallInst::Create(EndCf, Exec, "", &*BB->getFirstInsertionPt());
}
|
|
|
|
|
|
|
|
/// \brief Annotate the control flow with intrinsics so the backend can
|
|
|
|
/// recognize if/then/else and loops.
|
|
|
|
bool SIAnnotateControlFlow::runOnFunction(Function &F) {
|
2016-02-13 07:45:29 +08:00
|
|
|
|
2014-01-13 21:07:17 +08:00
|
|
|
DT = &getAnalysis<DominatorTreeWrapperPass>().getDomTree();
|
R600/SI: Fix bug from insertion of llvm.SI.end.cf into loop headers
The llvm.SI.end.cf intrinsic is used to mark the end of if-then blocks,
if-then-else blocks, and loops. It is responsible for updating the
exec mask to re-enable threads that had been masked during the preceding
control flow block. For example:
s_mov_b64 exec, 0x3 ; Initial exec mask
s_mov_b64 s[0:1], exec ; Saved exec mask
v_cmpx_gt_u32 exec, s[2:3], v0, 0 ; llvm.SI.if
do_stuff()
s_or_b64 exec, exec, s[0:1] ; llvm.SI.end.cf
The bug fixed by this patch was one where the llvm.SI.end.cf intrinsic
was being inserted into the header of loops. This would happen when
an if block terminated in a loop header and we would end up with
code like this:
s_mov_b64 exec, 0x3 ; Initial exec mask
s_mov_b64 s[0:1], exec ; Saved exec mask
v_cmpx_gt_u32 exec, s[2:3], v0, 0 ; llvm.SI.if
do_stuff()
LOOP: ; Start of loop header
s_or_b64 exec, exec, s[0:1] ; llvm.SI.end.cf <-BUG: The exec mask has the
same value at the beginning of each loop
iteration.
do_stuff();
s_cbranch_execnz LOOP
The fix is to create a new basic block before the loop and insert the
llvm.SI.end.cf there. This way the exec mask is restored before the
start of the loop instead of at the beginning of each iteration.
llvm-svn: 228302
2015-02-05 23:32:15 +08:00
|
|
|
LI = &getAnalysis<LoopInfoWrapperPass>().getLoopInfo();
|
2016-02-13 07:45:29 +08:00
|
|
|
DA = &getAnalysis<DivergenceAnalysis>();
|
2012-12-20 06:10:31 +08:00
|
|
|
|
|
|
|
for (df_iterator<BasicBlock *> I = df_begin(&F.getEntryBlock()),
|
|
|
|
E = df_end(&F.getEntryBlock()); I != E; ++I) {
|
|
|
|
|
|
|
|
BranchInst *Term = dyn_cast<BranchInst>((*I)->getTerminator());
|
|
|
|
|
|
|
|
if (!Term || Term->isUnconditional()) {
|
|
|
|
if (isTopOfStack(*I))
|
|
|
|
closeControlFlow(*I);
|
2016-02-13 07:45:29 +08:00
|
|
|
|
2012-12-20 06:10:31 +08:00
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (I.nodeVisited(Term->getSuccessor(1))) {
|
|
|
|
if (isTopOfStack(*I))
|
|
|
|
closeControlFlow(*I);
|
2016-02-13 07:45:29 +08:00
|
|
|
|
2012-12-20 06:10:31 +08:00
|
|
|
handleLoop(Term);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (isTopOfStack(*I)) {
|
|
|
|
PHINode *Phi = dyn_cast<PHINode>(Term->getCondition());
|
|
|
|
if (Phi && Phi->getParent() == *I && isElse(Phi)) {
|
|
|
|
insertElse(Term);
|
|
|
|
eraseIfUnused(Phi);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
closeControlFlow(*I);
|
|
|
|
}
|
|
|
|
openIf(Term);
|
|
|
|
}
|
|
|
|
|
|
|
|
assert(Stack.empty());
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
/// \brief Create the annotation pass
|
|
|
|
FunctionPass *llvm::createSIAnnotateControlFlowPass() {
|
|
|
|
return new SIAnnotateControlFlow();
|
|
|
|
}
|