forked from OSchip/llvm-project
43 lines
1.5 KiB
LLVM
43 lines
1.5 KiB
LLVM
|
; RUN: opt -passes='loop-vectorize' -force-vector-width=2 -S < %s | FileCheck %s
|
||
|
;
|
||
|
; Forcing VF=2 to trigger vector code gen
|
||
|
;
|
||
|
; This is a test case that causes the vectorizer's code gen to generate
|
||
|
; more than one BasicBlock in the loop body (emulated masked scatter)
|
||
|
; for those targets that do not support masked scatter. Broadcast
|
||
|
; code generation was previously dependent on loop body being
|
||
|
; a single basic block and this test case exposed incorrect code gen
|
||
|
; resulting in an assert in IL verification. Test passes if IL verification
|
||
|
; does not fail.
|
||
|
;
|
||
|
; Performing minimal check in the output to ensure the loop is actually
|
||
|
; vectorized.
|
||
|
;
|
||
|
; CHECK: vector.body
|
||
|
|
||
|
; Externally defined two-element i16 array; @f1 stores into it through a GEP.
@a = external global [2 x i16], align 1
|
||
|
|
||
|
; @f1: reduced reproducer containing a single loop whose body spans more than
; one basic block (for.body -> [land.rhs] -> land.end).
;
; Takes no arguments and returns nothing. Several operands (the initial
; induction value, the branch condition, the load address and the stored
; value) are undef -- presumably left over from test-case reduction; they are
; kept as-is so the IR shape stays exactly what the RUN line feeds to the
; loop vectorizer.
define void @f1() {
entry:
  br label %for.body

for.body:                                         ; preds = %land.end, %entry
  ; %0 is the loop-carried counter: undef on entry, %dec on the back edge.
  %0 = phi i32 [ undef, %entry ], [ %dec, %land.end ]
  ; This conditional edge is what makes the loop body multi-block.
  br i1 undef, label %land.end, label %land.rhs

land.rhs:                                         ; preds = %for.body
  ; The loaded value %1 has no users in this function.
  %1 = load i32, i32* undef, align 1
  br label %land.end

land.end:                                         ; preds = %land.rhs, %for.body
  ; Index @a with the counter truncated to i16 and store through that address.
  %2 = trunc i32 %0 to i16
  %arrayidx = getelementptr inbounds [2 x i16], [2 x i16]* @a, i16 0, i16 %2
  store i16 undef, i16* %arrayidx, align 1
  ; Count down by one; take the back edge while the pre-decrement value of %0
  ; is greater than 1 (signed compare).
  %dec = add nsw i32 %0, -1
  %cmp = icmp sgt i32 %0, 1
  br i1 %cmp, label %for.body, label %for.cond.for.end_crit_edge

for.cond.for.end_crit_edge:                       ; preds = %land.end
  ; The loop exit is marked unreachable; the function never returns normally.
  unreachable
}
|