forked from OSchip/llvm-project
301 lines
9.4 KiB
LLVM
301 lines
9.4 KiB
LLVM
; REQUIRES: asserts
|
|
; RUN: opt < %s -loop-vectorize -force-vector-width=2 -force-vector-interleave=1 -debug-only=loop-vectorize 2>&1 | FileCheck %s
|
|
|
|
target datalayout = "e-m:e-i64:64-i128:128-n32:64-S128"
|
|
|
|
; Test cases for PR50009, which require sinking a replicate-region due to a
|
|
; first-order recurrence.
|
|
|
|
define void @sink_replicate_region_1(i32 %x, i8* %ptr) optsize {
|
|
; CHECK-LABEL: sink_replicate_region_1
|
|
; CHECK: VPlan 'Initial VPlan for VF={2},UF>=1' {
|
|
; CHECK-NEXT: loop:
|
|
; CHECK-NEXT: WIDEN-PHI %0 = phi 0, %conv
|
|
; CHECK-NEXT: WIDEN-INDUCTION %iv = phi 0, %iv.next
|
|
; CHECK-NEXT: EMIT vp<%3> = icmp ule ir<%iv> vp<%0>
|
|
; CHECK-NEXT: Successor(s): loop.0
|
|
|
|
; CHECK: loop.0:
|
|
; CHECK-NEXT: REPLICATE ir<%gep> = getelementptr ir<%ptr>, ir<%iv>
|
|
; CHECK-NEXT: Successor(s): pred.load
|
|
|
|
; CHECK: <xVFxUF> pred.load: {
|
|
; CHECK-NEXT: pred.load.entry:
|
|
; CHECK-NEXT: BRANCH-ON-MASK vp<%3>
|
|
; CHECK-NEXT: Successor(s): pred.load.if, pred.load.continue
|
|
; CHECK-NEXT: CondBit: vp<%3> (loop)
|
|
|
|
; CHECK: pred.load.if:
|
|
; CHECK-NEXT: REPLICATE ir<%lv> = load ir<%gep> (S->V)
|
|
; CHECK-NEXT: Successor(s): pred.load.continue
|
|
|
|
; CHECK: pred.load.continue:
|
|
; CHECK-NEXT: PHI-PREDICATED-INSTRUCTION vp<%6> = ir<%lv>
|
|
; CHECK-NEXT: No successors
|
|
; CHECK-NEXT: }
|
|
|
|
; CHECK: loop.1:
|
|
; CHECK-NEXT: WIDEN ir<%conv> = sext vp<%6>
|
|
; CHECK-NEXT: Successor(s): pred.srem
|
|
|
|
; CHECK: <xVFxUF> pred.srem: {
|
|
; CHECK-NEXT: pred.srem.entry:
|
|
; CHECK-NEXT: BRANCH-ON-MASK vp<%3>
|
|
; CHECK-NEXT: Successor(s): pred.srem.if, pred.srem.continue
|
|
; CHECK-NEXT: CondBit: vp<%3> (loop)
|
|
|
|
; CHECK: pred.srem.if:
|
|
; CHECK-NEXT: REPLICATE ir<%rem> = srem ir<%0>, ir<%x> (S->V)
|
|
; CHECK-NEXT: Successor(s): pred.srem.continue
|
|
|
|
; CHECK: pred.srem.continue:
|
|
; CHECK-NEXT: PHI-PREDICATED-INSTRUCTION vp<%9> = ir<%rem>
|
|
; CHECK-NEXT: No successors
|
|
; CHECK-NEXT: }
|
|
|
|
; CHECK: loop.1.split:
|
|
; CHECK-NEXT: WIDEN ir<%add> = add ir<%conv>, vp<%9>
|
|
; CHECK-NEXT: No successors
|
|
; CHECK-NEXT: }
|
|
;
|
|
entry:
|
|
br label %loop
|
|
|
|
loop:
|
|
%0 = phi i32 [ 0, %entry ], [ %conv, %loop ]
|
|
%iv = phi i32 [ 0, %entry ], [ %iv.next, %loop ]
|
|
%rem = srem i32 %0, %x
|
|
%gep = getelementptr i8, i8* %ptr, i32 %iv
|
|
%lv = load i8, i8* %gep
|
|
%conv = sext i8 %lv to i32
|
|
%add = add i32 %conv, %rem
|
|
%iv.next = add nsw i32 %iv, 1
|
|
%ec = icmp eq i32 %iv.next, 20001
|
|
br i1 %ec, label %exit, label %loop
|
|
|
|
exit:
|
|
ret void
|
|
}
|
|
|
|
define void @sink_replicate_region_2(i32 %x, i8 %y, i32* %ptr) optsize {
|
|
; CHECK-LABEL: sink_replicate_region_2
|
|
; CHECK: VPlan 'Initial VPlan for VF={2},UF>=1' {
|
|
; CHECK-NEXT: loop:
|
|
; CHECK-NEXT: WIDEN-PHI %recur = phi 0, %recur.next
|
|
; CHECK-NEXT: WIDEN-INDUCTION %iv = phi 0, %iv.next
|
|
; CHECK-NEXT: EMIT vp<%3> = icmp ule ir<%iv> vp<%0>
|
|
; CHECK-NEXT: Successor(s): loop.0
|
|
|
|
; CHECK: loop.0:
|
|
; CHECK-NEXT: WIDEN ir<%recur.next> = sext ir<%y>
|
|
; CHECK-NEXT: Successor(s): pred.srem
|
|
|
|
; CHECK: <xVFxUF> pred.srem: {
|
|
; CHECK-NEXT: pred.srem.entry:
|
|
; CHECK-NEXT: BRANCH-ON-MASK vp<%3>
|
|
; CHECK-NEXT: Successor(s): pred.srem.if, pred.srem.continue
|
|
; CHECK-NEXT: CondBit: vp<%3> (loop)
|
|
|
|
; CHECK: pred.srem.if:
|
|
; CHECK-NEXT: REPLICATE ir<%rem> = srem ir<%recur>, ir<%x>
|
|
; CHECK-NEXT: Successor(s): pred.srem.continue
|
|
|
|
; CHECK: pred.srem.continue:
|
|
; CHECK-NEXT: PHI-PREDICATED-INSTRUCTION vp<%6> = ir<%rem>
|
|
; CHECK-NEXT: No successors
|
|
; CHECK-NEXT: }
|
|
|
|
; CHECK: loop.0.split:
|
|
; CHECK-NEXT: REPLICATE ir<%add> = add vp<%6>, ir<%recur.next>
|
|
; CHECK-NEXT: REPLICATE ir<%gep> = getelementptr ir<%ptr>, ir<%iv>
|
|
; CHECK-NEXT: Successor(s): pred.store
|
|
|
|
; CHECK: <xVFxUF> pred.store: {
|
|
; CHECK-NEXT: pred.store.entry:
|
|
; CHECK-NEXT: BRANCH-ON-MASK vp<%3>
|
|
; CHECK-NEXT: Successor(s): pred.store.if, pred.store.continue
|
|
; CHECK-NEXT: CondBit: vp<%3> (loop)
|
|
|
|
; CHECK: pred.store.if:
|
|
; CHECK-NEXT: REPLICATE store ir<%add>, ir<%gep>
|
|
; CHECK-NEXT: Successor(s): pred.store.continue
|
|
|
|
; CHECK: pred.store.continue:
|
|
; CHECK-NEXT: No successors
|
|
; CHECK-NEXT: }
|
|
|
|
; CHECK: loop.1:
|
|
; CHECK-NEXT: No successors
|
|
; CHECK-NEXT: }
|
|
;
|
|
entry:
|
|
br label %loop
|
|
|
|
loop:
|
|
%recur = phi i32 [ 0, %entry ], [ %recur.next, %loop ]
|
|
%iv = phi i32 [ 0, %entry ], [ %iv.next, %loop ]
|
|
%rem = srem i32 %recur, %x
|
|
%recur.next = sext i8 %y to i32
|
|
%add = add i32 %rem, %recur.next
|
|
%gep = getelementptr i32, i32* %ptr, i32 %iv
|
|
store i32 %add, i32* %gep
|
|
%iv.next = add nsw i32 %iv, 1
|
|
%ec = icmp eq i32 %iv.next, 20001
|
|
br i1 %ec, label %exit, label %loop
|
|
|
|
exit:
|
|
ret void
|
|
}
|
|
|
|
define i32 @sink_replicate_region_3_reduction(i32 %x, i8 %y, i32* %ptr) optsize {
|
|
; CHECK-LABEL: sink_replicate_region_3_reduction
|
|
; CHECK: VPlan 'Initial VPlan for VF={2},UF>=1' {
|
|
; CHECK-NEXT: loop:
|
|
; CHECK-NEXT: WIDEN-PHI %recur = phi 0, %recur.next
|
|
; CHECK-NEXT: WIDEN-INDUCTION %iv = phi 0, %iv.next
|
|
; CHECK-NEXT: WIDEN-PHI ir<%and.red> = phi ir<1234>, ir<%and.red.next>
|
|
; CHECK-NEXT: EMIT vp<%4> = icmp ule ir<%iv> vp<%0>
|
|
; CHECK-NEXT: Successor(s): loop.0
|
|
|
|
; CHECK: loop.0:
|
|
; CHECK-NEXT: WIDEN ir<%recur.next> = sext ir<%y>
|
|
; CHECK-NEXT: Successor(s): pred.srem
|
|
|
|
; CHECK: <xVFxUF> pred.srem: {
|
|
; CHECK-NEXT: pred.srem.entry:
|
|
; CHECK-NEXT: BRANCH-ON-MASK vp<%4>
|
|
; CHECK-NEXT: Successor(s): pred.srem.if, pred.srem.continue
|
|
; CHECK-NEXT: CondBit: vp<%4> (loop)
|
|
|
|
; CHECK: pred.srem.if:
|
|
; CHECK-NEXT: REPLICATE ir<%rem> = srem ir<%recur>, ir<%x> (S->V)
|
|
; CHECK-NEXT: Successor(s): pred.srem.continue
|
|
|
|
; CHECK: pred.srem.continue:
|
|
; CHECK-NEXT: PHI-PREDICATED-INSTRUCTION vp<%7> = ir<%rem>
|
|
; CHECK-NEXT: No successors
|
|
; CHECK-NEXT: }
|
|
|
|
; CHECK: loop.0.split:
|
|
; CHECK-NEXT: WIDEN ir<%add> = add vp<%7>, ir<%recur.next>
|
|
; CHECK-NEXT: WIDEN ir<%and.red.next> = and ir<%and.red>, ir<%add>
|
|
; CHECK-NEXT: EMIT vp<%10> = select vp<%4> ir<%and.red.next> ir<%and.red>
|
|
; CHECK-NEXT: No successors
|
|
; CHECK-NEXT: }
|
|
;
|
|
entry:
|
|
br label %loop
|
|
|
|
loop:
|
|
%recur = phi i32 [ 0, %entry ], [ %recur.next, %loop ]
|
|
%iv = phi i32 [ 0, %entry ], [ %iv.next, %loop ]
|
|
%and.red = phi i32 [ 1234, %entry ], [ %and.red.next, %loop ]
|
|
%rem = srem i32 %recur, %x
|
|
%recur.next = sext i8 %y to i32
|
|
%add = add i32 %rem, %recur.next
|
|
%and.red.next = and i32 %and.red, %add
|
|
%iv.next = add nsw i32 %iv, 1
|
|
%ec = icmp eq i32 %iv.next, 20001
|
|
br i1 %ec, label %exit, label %loop
|
|
|
|
exit:
|
|
%res = phi i32 [ %and.red.next, %loop ]
|
|
ret i32 %res
|
|
}
|
|
|
|
; To sink the replicate region containing %rem, we need to split the block
|
|
; containing %conv at the end, because %conv is the last recipe in the block.
|
|
define void @sink_replicate_region_4_requires_split_at_end_of_block(i32 %x, i8* %ptr) optsize {
|
|
; CHECK-LABEL: sink_replicate_region_4_requires_split_at_end_of_block
|
|
; CHECK: VPlan 'Initial VPlan for VF={2},UF>=1' {
|
|
; CHECK-NEXT: loop:
|
|
; CHECK-NEXT: WIDEN-PHI %0 = phi 0, %conv
|
|
; CHECK-NEXT: WIDEN-INDUCTION %iv = phi 0, %iv.next
|
|
; CHECK-NEXT: EMIT vp<%3> = icmp ule ir<%iv> vp<%0>
|
|
; CHECK-NEXT: REPLICATE ir<%gep> = getelementptr ir<%ptr>, ir<%iv>
|
|
; CHECK-NEXT: Successor(s): loop.0
|
|
|
|
; CHECK: loop.0:
|
|
; CHECK-NEXT: Successor(s): pred.load
|
|
|
|
; CHECK: <xVFxUF> pred.load: {
|
|
; CHECK-NEXT: pred.load.entry:
|
|
; CHECK-NEXT: BRANCH-ON-MASK vp<%3>
|
|
; CHECK-NEXT: Successor(s): pred.load.if, pred.load.continue
|
|
; CHECK-NEXT: CondBit: vp<%3> (loop)
|
|
|
|
; CHECK: pred.load.if:
|
|
; CHECK-NEXT: REPLICATE ir<%lv> = load ir<%gep> (S->V)
|
|
; CHECK-NEXT: Successor(s): pred.load.continue
|
|
|
|
; CHECK: pred.load.continue:
|
|
; CHECK-NEXT: PHI-PREDICATED-INSTRUCTION vp<%6> = ir<%lv>
|
|
; CHECK-NEXT: No successors
|
|
; CHECK-NEXT: }
|
|
|
|
; CHECK: loop.1:
|
|
; CHECK-NEXT: WIDEN ir<%conv> = sext vp<%6>
|
|
; CHECK-NEXT: Successor(s): pred.srem
|
|
|
|
; CHECK: <xVFxUF> pred.srem: {
|
|
; CHECK-NEXT: pred.srem.entry:
|
|
; CHECK-NEXT: BRANCH-ON-MASK vp<%3>
|
|
; CHECK-NEXT: Successor(s): pred.srem.if, pred.srem.continue
|
|
; CHECK-NEXT: CondBit: vp<%3> (loop)
|
|
|
|
; CHECK: pred.srem.if:
|
|
; CHECK-NEXT: REPLICATE ir<%rem> = srem ir<%0>, ir<%x> (S->V)
|
|
; CHECK-NEXT: Successor(s): pred.srem.continue
|
|
|
|
; CHECK: pred.srem.continue:
|
|
; CHECK-NEXT: PHI-PREDICATED-INSTRUCTION vp<%9> = ir<%rem>
|
|
; CHECK-NEXT: No successors
|
|
; CHECK-NEXT: }
|
|
|
|
; CHECK: loop.1.split:
|
|
; CHECK-NEXT: Successor(s): pred.load
|
|
|
|
; CHECK: <xVFxUF> pred.load: {
|
|
; CHECK-NEXT: pred.load.entry:
|
|
; CHECK-NEXT: BRANCH-ON-MASK vp<%3>
|
|
; CHECK-NEXT: Successor(s): pred.load.if, pred.load.continue
|
|
; CHECK-NEXT: CondBit: vp<%3> (loop)
|
|
|
|
; CHECK: pred.load.if:
|
|
; CHECK-NEXT: REPLICATE ir<%lv.2> = load ir<%gep> (S->V)
|
|
; CHECK-NEXT: Successor(s): pred.load.continue
|
|
|
|
; CHECK: pred.load.continue:
|
|
; CHECK-NEXT: PHI-PREDICATED-INSTRUCTION vp<%11> = ir<%lv.2>
|
|
; CHECK-NEXT: No successors
|
|
; CHECK-NEXT: }
|
|
|
|
; CHECK: loop.2:
|
|
; CHECK-NEXT: WIDEN ir<%add.1> = add ir<%conv>, vp<%9>
|
|
; CHECK-NEXT: WIDEN ir<%conv.lv.2> = sext vp<%11>
|
|
; CHECK-NEXT: WIDEN ir<%add> = add ir<%add.1>, ir<%conv.lv.2>
|
|
; CHECK-NEXT: No successors
|
|
; CHECK-NEXT: }
|
|
;
|
|
entry:
|
|
br label %loop
|
|
|
|
loop:
|
|
%0 = phi i32 [ 0, %entry ], [ %conv, %loop ]
|
|
%iv = phi i32 [ 0, %entry ], [ %iv.next, %loop ]
|
|
%gep = getelementptr i8, i8* %ptr, i32 %iv
|
|
%rem = srem i32 %0, %x
|
|
%lv = load i8, i8* %gep
|
|
%conv = sext i8 %lv to i32
|
|
%lv.2 = load i8, i8* %gep
|
|
%add.1 = add i32 %conv, %rem
|
|
%conv.lv.2 = sext i8 %lv.2 to i32
|
|
%add = add i32 %add.1, %conv.lv.2
|
|
%iv.next = add nsw i32 %iv, 1
|
|
%ec = icmp eq i32 %iv.next, 20001
|
|
br i1 %ec, label %exit, label %loop
|
|
|
|
exit:
|
|
ret void
|
|
}
|