forked from OSchip/llvm-project
72 lines
2.1 KiB
LLVM
72 lines
2.1 KiB
LLVM
; RUN: opt %loadPolly -analyze -polly-ast -polly-vectorizer=polly < %s | \
|
|
; RUN: FileCheck %s -check-prefix=AST
|
|
|
|
; RUN: opt %loadPolly -polly-codegen -polly-vectorizer=polly -S < %s | \
|
|
; RUN: FileCheck %s
|
|
;
|
|
; void foo(float *A) {
|
|
; for (long i = 0; i < 16; i++) {
|
|
; if (i % 2)
|
|
; A[i] += 2;
|
|
; if (i % 3)
|
|
; A[i] += 3;
|
|
; }
|
|
; }
|
|
;
|
|
target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
|
|
|
|
; AST: #pragma simd
|
|
; AST: #pragma known-parallel
|
|
; AST: for (int c0 = 0; c0 <= 15; c0 += 1) {
|
|
; AST: if ((c0 - 1) % 2 == 0)
|
|
; AST: Stmt_bb4(c0);
|
|
; AST: if (c0 % 3 >= 1)
|
|
; AST: Stmt_bb11(c0);
|
|
; AST: }
|
|
|
|
; CHECK: polly.split_new_and_old
|
|
|
|
define void @foo(float* %A) {
|
|
bb:
|
|
br label %bb1
|
|
|
|
bb1: ; preds = %bb16, %bb
|
|
%i.0 = phi i64 [ 0, %bb ], [ %tmp17, %bb16 ]
|
|
%exitcond = icmp ne i64 %i.0, 16
|
|
br i1 %exitcond, label %bb2, label %bb18
|
|
|
|
bb2: ; preds = %bb1
|
|
%tmp = srem i64 %i.0, 2
|
|
%tmp3 = icmp eq i64 %tmp, 0
|
|
br i1 %tmp3, label %bb8, label %bb4
|
|
|
|
bb4: ; preds = %bb2
|
|
%tmp5 = getelementptr inbounds float, float* %A, i64 %i.0
|
|
%tmp6 = load float, float* %tmp5, align 4
|
|
%tmp7 = fadd float %tmp6, 2.000000e+00
|
|
store float %tmp7, float* %tmp5, align 4
|
|
br label %bb8
|
|
|
|
bb8: ; preds = %bb2, %bb4
|
|
%tmp9 = srem i64 %i.0, 3
|
|
%tmp10 = icmp eq i64 %tmp9, 0
|
|
br i1 %tmp10, label %bb15, label %bb11
|
|
|
|
bb11: ; preds = %bb8
|
|
%tmp12 = getelementptr inbounds float, float* %A, i64 %i.0
|
|
%tmp13 = load float, float* %tmp12, align 4
|
|
%tmp14 = fadd float %tmp13, 3.000000e+00
|
|
store float %tmp14, float* %tmp12, align 4
|
|
br label %bb15
|
|
|
|
bb15: ; preds = %bb8, %bb11
|
|
br label %bb16
|
|
|
|
bb16: ; preds = %bb15
|
|
%tmp17 = add nsw i64 %i.0, 1
|
|
br label %bb1
|
|
|
|
bb18: ; preds = %bb1
|
|
ret void
|
|
}
|