; forked from OSchip/llvm-project (58 lines, 2.2 KiB, LLVM)
; RUN: opt -disable-verify -debug-pass-manager -passes='default<O1>' -force-vector-width=4 -S %s 2>&1 | FileCheck %s --check-prefixes=O1
; RUN: opt -disable-verify -debug-pass-manager -passes='default<O2>' -force-vector-width=4 -S %s 2>&1 | FileCheck %s --check-prefixes=O2
; RUN: opt -disable-verify -debug-pass-manager -passes='default<O2>' -force-vector-width=4 -extra-vectorizer-passes -S %s 2>&1 | FileCheck %s --check-prefixes=O2_EXTRA

; When the loop does not get vectorized, none of the extra vectorizer passes should run.
; RUN: opt -disable-verify -debug-pass-manager -passes='default<O2>' -force-vector-width=0 -extra-vectorizer-passes -S %s 2>&1 | FileCheck %s --check-prefixes=O2

; REQUIRES: asserts

; The loop vectorizer still runs at both -O1/-O2 even with the debug flag, but
; it only works on loops explicitly annotated with pragmas.

; SLP does not run at -O1. Loop vectorization runs, but it only works on loops
; explicitly annotated with pragmas.
; O1-LABEL: Running pass: LoopVectorizePass
; O1-NOT: Running pass: SLPVectorizerPass
; O1: Running pass: VectorCombinePass

; At -O2 both vectorizers and VectorCombine run, but the extra cleanup passes
; (EarlyCSE, LICM) must not run between LoopVectorize and SLP.
; O2-LABEL: Running pass: LoopVectorizePass
; O2-NOT: Running pass: EarlyCSEPass
; O2-NOT: Running pass: LICMPass
; O2: Running pass: SLPVectorizerPass
; O2: Running pass: VectorCombinePass

; With -extra-vectorizer-passes, additional cleanup passes run after the loop
; vectorizer.
; O2_EXTRA-LABEL: Running pass: LoopVectorizePass
; O2_EXTRA: Running pass: EarlyCSEPass
; O2_EXTRA: Running pass: CorrelatedValuePropagationPass
; O2_EXTRA: Running pass: InstCombinePass
; O2_EXTRA: Running pass: LICMPass
; O2_EXTRA: Running pass: SimpleLoopUnswitchPass
; O2_EXTRA: Running pass: SimplifyCFGPass
; O2_EXTRA: Running pass: InstCombinePass
; O2_EXTRA: Running pass: SLPVectorizerPass
; O2_EXTRA: Running pass: EarlyCSEPass
; O2_EXTRA: Running pass: VectorCombinePass

; Test input: a single counted loop that, for i = 0 .. 999, loads src[i],
; adds 10 and stores the result to dst[i]. The function returns the value of
; the induction variable in the final iteration (%i, not %inc). %cond is not
; used by the body.
define i64 @f(i1 %cond, i32* %src, i32* %dst) {
entry:
  br label %loop

loop:
  ; %i is the induction variable: 0 on entry, %inc on the back edge.
  %i = phi i64 [ 0, %entry ], [ %inc, %loop ]
  %src.i = getelementptr i32, i32* %src, i64 %i
  %src.v = load i32, i32* %src.i
  %add = add i32 %src.v, 10
  %dst.i = getelementptr i32, i32* %dst, i64 %i
  store i32 %add, i32* %dst.i
  %inc = add nuw nsw i64 %i, 1
  ; Stay in the loop until the incremented counter reaches 1000.
  %ec = icmp ne i64 %inc, 1000
  br i1 %ec, label %loop, label %exit

exit:
  ret i64 %i
}