[FlattenCFG] Fix `MergeIfRegion` in case then-path is empty

In case the then-path of an if-region is empty, then merging with the
else-path should be handled with the inverse of the condition (leading
to that path).

Fix PR37662

Differential Revision: https://reviews.llvm.org/D78881
This commit is contained in:
Ehud Katz 2020-05-21 14:06:44 +03:00
parent eeff1a970a
commit 111ddc57d3
2 changed files with 210 additions and 35 deletions

View File

@ -45,12 +45,12 @@ class FlattenCFGOpt {
bool MergeIfRegion(BasicBlock *BB, IRBuilder<> &Builder); bool MergeIfRegion(BasicBlock *BB, IRBuilder<> &Builder);
/// Compare a pair of blocks: \p Block1 and \p Block2, which /// Compare a pair of blocks: \p Block1 and \p Block2, which
/// are from two if-regions whose entry blocks are \p Head1 and \p /// are from two if-regions, where \p Head2 is the entry block of the 2nd
/// Head2. \returns true if \p Block1 and \p Block2 contain identical /// if-region. \returns true if \p Block1 and \p Block2 contain identical
/// instructions, and have no memory reference alias with \p Head2. /// instructions, and have no memory reference alias with \p Head2.
/// This is used as a legality check for merging if-regions. /// This is used as a legality check for merging if-regions.
bool CompareIfRegionBlock(BasicBlock *Head1, BasicBlock *Head2, bool CompareIfRegionBlock(BasicBlock *Block1, BasicBlock *Block2,
BasicBlock *Block1, BasicBlock *Block2); BasicBlock *Head2);
public: public:
FlattenCFGOpt(AliasAnalysis *AA) : AA(AA) {} FlattenCFGOpt(AliasAnalysis *AA) : AA(AA) {}
@ -315,25 +315,16 @@ bool FlattenCFGOpt::FlattenParallelAndOr(BasicBlock *BB, IRBuilder<> &Builder) {
return true; return true;
} }
/// Compare blocks from two if-regions, where \param Head1 is the entry of the /// Compare blocks from two if-regions, where \param Head2 is the entry of the
/// 1st if-region. \param Head2 is the entry of the 2nd if-region. \param /// 2nd if-region. \param Block1 is a block in the 1st if-region to compare.
/// Block1 is a block in the 1st if-region to compare. \param Block2 is a block /// \param Block2 is a block in the 2nd if-region to compare. \returns true if
// in the 2nd if-region to compare. \returns true if \param Block1 and \param /// \param Block1 and \param Block2 have identical instructions and do not have
/// Block2 have identical instructions and do not have memory reference alias /// memory reference alias with \param Head2.
/// with \param Head2. bool FlattenCFGOpt::CompareIfRegionBlock(BasicBlock *Block1, BasicBlock *Block2,
bool FlattenCFGOpt::CompareIfRegionBlock(BasicBlock *Head1, BasicBlock *Head2, BasicBlock *Head2) {
BasicBlock *Block1,
BasicBlock *Block2) {
Instruction *PTI2 = Head2->getTerminator(); Instruction *PTI2 = Head2->getTerminator();
Instruction *PBI2 = &Head2->front(); Instruction *PBI2 = &Head2->front();
bool eq1 = (Block1 == Head1);
bool eq2 = (Block2 == Head2);
if (eq1 || eq2) {
// An empty then-path or else-path.
return (eq1 == eq2);
}
// Check whether instructions in Block1 and Block2 are identical // Check whether instructions in Block1 and Block2 are identical
// and do not alias with instructions in Head2. // and do not alias with instructions in Head2.
BasicBlock::iterator iter1 = Block1->begin(); BasicBlock::iterator iter1 = Block1->begin();
@ -395,6 +386,29 @@ bool FlattenCFGOpt::CompareIfRegionBlock(BasicBlock *Head1, BasicBlock *Head2,
/// To: /// To:
/// if (a || b) /// if (a || b)
/// statement; /// statement;
///
///
/// And from:
/// if (a)
/// ;
/// else
/// statement;
/// if (b)
/// ;
/// else
/// statement;
///
/// To:
/// if (a && b)
/// ;
/// else
/// statement;
///
/// We always take the form of the first if-region. This means that if the
/// statement in the first if-region, is in the "then-path", while in the second
/// if-region it is in the "else-path", then we convert the second to the first
/// form, by inverting the condition and the branch successors. The same
/// approach goes for the opposite case.
bool FlattenCFGOpt::MergeIfRegion(BasicBlock *BB, IRBuilder<> &Builder) { bool FlattenCFGOpt::MergeIfRegion(BasicBlock *BB, IRBuilder<> &Builder) {
BasicBlock *IfTrue2, *IfFalse2; BasicBlock *IfTrue2, *IfFalse2;
Value *IfCond2 = GetIfCondition(BB, IfTrue2, IfFalse2); Value *IfCond2 = GetIfCondition(BB, IfTrue2, IfFalse2);
@ -415,22 +429,42 @@ bool FlattenCFGOpt::MergeIfRegion(BasicBlock *BB, IRBuilder<> &Builder) {
BasicBlock *FirstEntryBlock = CInst1->getParent(); BasicBlock *FirstEntryBlock = CInst1->getParent();
// Either then-path or else-path should be empty. // Either then-path or else-path should be empty.
if ((IfTrue1 != FirstEntryBlock) && (IfFalse1 != FirstEntryBlock)) bool InvertCond2 = false;
BinaryOperator::BinaryOps CombineOp;
if (IfFalse1 == FirstEntryBlock) {
// The else-path is empty, so we must use "or" operation to combine the
// conditions.
CombineOp = BinaryOperator::Or;
if (IfFalse2 != SecondEntryBlock) {
if (IfTrue2 != SecondEntryBlock)
return false; return false;
if ((IfTrue2 != SecondEntryBlock) && (IfFalse2 != SecondEntryBlock))
InvertCond2 = true;
std::swap(IfTrue2, IfFalse2);
}
if (!CompareIfRegionBlock(IfTrue1, IfTrue2, SecondEntryBlock))
return false;
} else if (IfTrue1 == FirstEntryBlock) {
// The then-path is empty, so we must use "and" operation to combine the
// conditions.
CombineOp = BinaryOperator::And;
if (IfTrue2 != SecondEntryBlock) {
if (IfFalse2 != SecondEntryBlock)
return false;
InvertCond2 = true;
std::swap(IfTrue2, IfFalse2);
}
if (!CompareIfRegionBlock(IfFalse1, IfFalse2, SecondEntryBlock))
return false;
} else
return false; return false;
Instruction *PTI2 = SecondEntryBlock->getTerminator(); Instruction *PTI2 = SecondEntryBlock->getTerminator();
Instruction *PBI2 = &SecondEntryBlock->front(); Instruction *PBI2 = &SecondEntryBlock->front();
if (!CompareIfRegionBlock(FirstEntryBlock, SecondEntryBlock, IfTrue1,
IfTrue2))
return false;
if (!CompareIfRegionBlock(FirstEntryBlock, SecondEntryBlock, IfFalse1,
IfFalse2))
return false;
// Check whether \param SecondEntryBlock has side-effect and is safe to // Check whether \param SecondEntryBlock has side-effect and is safe to
// speculate. // speculate.
for (BasicBlock::iterator BI(PBI2), BE(PTI2); BI != BE; ++BI) { for (BasicBlock::iterator BI(PBI2), BE(PTI2); BI != BE; ++BI) {
@ -445,12 +479,22 @@ bool FlattenCFGOpt::MergeIfRegion(BasicBlock *BB, IRBuilder<> &Builder) {
FirstEntryBlock->getInstList() FirstEntryBlock->getInstList()
.splice(FirstEntryBlock->end(), SecondEntryBlock->getInstList()); .splice(FirstEntryBlock->end(), SecondEntryBlock->getInstList());
BranchInst *PBI = cast<BranchInst>(FirstEntryBlock->getTerminator()); BranchInst *PBI = cast<BranchInst>(FirstEntryBlock->getTerminator());
Value *CC = PBI->getCondition(); assert(PBI->getCondition() == IfCond2);
BasicBlock *SaveInsertBB = Builder.GetInsertBlock(); BasicBlock *SaveInsertBB = Builder.GetInsertBlock();
BasicBlock::iterator SaveInsertPt = Builder.GetInsertPoint(); BasicBlock::iterator SaveInsertPt = Builder.GetInsertPoint();
Builder.SetInsertPoint(PBI); Builder.SetInsertPoint(PBI);
Value *NC = Builder.CreateOr(CInst1, CC); if (InvertCond2) {
PBI->replaceUsesOfWith(CC, NC); // If this is a "cmp" instruction, only used for branching (and nowhere
// else), then we can simply invert the predicate.
auto Cmp2 = dyn_cast<CmpInst>(CInst2);
if (Cmp2 && Cmp2->hasOneUse())
Cmp2->setPredicate(Cmp2->getInversePredicate());
else
CInst2 = cast<Instruction>(Builder.CreateNot(CInst2));
PBI->swapSuccessors();
}
Value *NC = Builder.CreateBinOp(CombineOp, CInst1, CInst2);
PBI->replaceUsesOfWith(IfCond2, NC);
Builder.SetInsertPoint(SaveInsertBB, SaveInsertPt); Builder.SetInsertPoint(SaveInsertBB, SaveInsertPt);
// Handle PHI node to replace its predecessors to FirstEntryBlock. // Handle PHI node to replace its predecessors to FirstEntryBlock.

View File

@ -29,7 +29,7 @@ exit: ; preds = %entry, %b0, %b1
; CHECK-NEXT: entry: ; CHECK-NEXT: entry:
; CHECK-NEXT: %0 = fcmp ult float %a ; CHECK-NEXT: %0 = fcmp ult float %a
; CHECK-NEXT: %1 = fcmp ult float %b ; CHECK-NEXT: %1 = fcmp ult float %b
; CHECK-NEXT: [[COND:%[a-z0-9]+]] = or i1 %0, %1 ; CHECK-NEXT: [[COND:%[a-z0-9]+]] = and i1 %0, %1
; CHECK-NEXT: br i1 [[COND]], label %bb4, label %bb3 ; CHECK-NEXT: br i1 [[COND]], label %bb4, label %bb3
; CHECK: bb3: ; CHECK: bb3:
; CHECK-NEXT: br label %bb4 ; CHECK-NEXT: br label %bb4
@ -84,3 +84,134 @@ bb3: ; preds = %bb2, %bb1
%check_badref = phi i32 [ 17, %bb1 ], [ 11, %bb2 ] %check_badref = phi i32 [ 17, %bb1 ], [ 11, %bb2 ]
ret void ret void
} }
@g = global i32 0, align 4
; CHECK-LABEL: @test_then
; CHECK-NEXT: entry.x:
; CHECK-NEXT: %cmp.x = icmp ne i32 %x, 0
; CHECK-NEXT: %cmp.y = icmp ne i32 %y, 0
; CHECK-NEXT: [[COND:%[a-z0-9]+]] = or i1 %cmp.x, %cmp.y
; CHECK-NEXT: br i1 [[COND]], label %if.then.y, label %exit
; CHECK: if.then.y:
; CHECK-NEXT: store i32 %z, i32* @g, align 4
; CHECK-NEXT: br label %exit
; CHECK: exit:
; CHECK-NEXT: ret void
define void @test_then(i32 %x, i32 %y, i32 %z) {
entry.x:
%cmp.x = icmp ne i32 %x, 0
br i1 %cmp.x, label %if.then.x, label %entry.y
if.then.x:
store i32 %z, i32* @g, align 4
br label %entry.y
entry.y:
%cmp.y = icmp ne i32 %y, 0
br i1 %cmp.y, label %if.then.y, label %exit
if.then.y:
store i32 %z, i32* @g, align 4
br label %exit
exit:
ret void
}
; CHECK-LABEL: @test_else
; CHECK-NEXT: entry.x:
; CHECK-NEXT: %cmp.x = icmp eq i32 %x, 0
; CHECK-NEXT: %cmp.y = icmp eq i32 %y, 0
; CHECK-NEXT: [[COND:%[a-z0-9]+]] = and i1 %cmp.x, %cmp.y
; CHECK-NEXT: br i1 [[COND]], label %exit, label %if.else.y
; CHECK: if.else.y:
; CHECK-NEXT: store i32 %z, i32* @g, align 4
; CHECK-NEXT: br label %exit
; CHECK: exit:
; CHECK-NEXT: ret void
define void @test_else(i32 %x, i32 %y, i32 %z) {
entry.x:
%cmp.x = icmp eq i32 %x, 0
br i1 %cmp.x, label %entry.y, label %if.else.x
if.else.x:
store i32 %z, i32* @g, align 4
br label %entry.y
entry.y:
%cmp.y = icmp eq i32 %y, 0
br i1 %cmp.y, label %exit, label %if.else.y
if.else.y:
store i32 %z, i32* @g, align 4
br label %exit
exit:
ret void
}
; CHECK-LABEL: @test_combine_and
; CHECK-NEXT: entry.x:
; CHECK-NEXT: %cmp.x = icmp eq i32 %x, 0
; CHECK-NEXT: %cmp.y = icmp eq i32 %y, 0
; CHECK-NEXT: [[COND:%[a-z0-9]+]] = and i1 %cmp.x, %cmp.y
; CHECK-NEXT: br i1 [[COND]], label %exit, label %if.then.y
; CHECK: if.then.y:
; CHECK-NEXT: store i32 %z, i32* @g, align 4
; CHECK-NEXT: br label %exit
; CHECK: exit:
; CHECK-NEXT: ret void
define void @test_combine_and(i32 %x, i32 %y, i32 %z) {
entry.x:
%cmp.x = icmp eq i32 %x, 0
br i1 %cmp.x, label %entry.y, label %if.else.x
if.else.x:
store i32 %z, i32* @g, align 4
br label %entry.y
entry.y:
%cmp.y = icmp ne i32 %y, 0
br i1 %cmp.y, label %if.then.y, label %exit
if.then.y:
store i32 %z, i32* @g, align 4
br label %exit
exit:
ret void
}
; CHECK-LABEL: @test_combine_or
; CHECK-NEXT: entry.x:
; CHECK-NEXT: %cmp.x = icmp ne i32 %x, 0
; CHECK-NEXT: %cmp.y = icmp ne i32 %y, 0
; CHECK-NEXT: [[COND:%[a-z0-9]+]] = or i1 %cmp.x, %cmp.y
; CHECK-NEXT: br i1 [[COND]], label %if.else.y, label %exit
; CHECK: if.else.y:
; CHECK-NEXT: store i32 %z, i32* @g, align 4
; CHECK-NEXT: br label %exit
; CHECK: exit:
; CHECK-NEXT: ret void
define void @test_combine_or(i32 %x, i32 %y, i32 %z) {
entry.x:
%cmp.x = icmp ne i32 %x, 0
br i1 %cmp.x, label %if.then.x, label %entry.y
if.then.x:
store i32 %z, i32* @g, align 4
br label %entry.y
entry.y:
%cmp.y = icmp eq i32 %y, 0
br i1 %cmp.y, label %exit, label %if.else.y
if.else.y:
store i32 %z, i32* @g, align 4
br label %exit
exit:
ret void
}