forked from OSchip/llvm-project
163 lines
6.9 KiB
LLVM
163 lines
6.9 KiB
LLVM
; RUN: opt %loadPolly -polly-scops \
|
|
; RUN: -polly-allow-nonaffine -polly-allow-nonaffine-branches \
|
|
; RUN: -polly-allow-nonaffine-loops -analyze < %s | FileCheck %s
|
|
; RUN: opt %loadPolly -polly-scops -polly-allow-nonaffine \
|
|
; RUN: -polly-unprofitable-scalar-accs=true \
|
|
; RUN: -polly-process-unprofitable=false \
|
|
; RUN: -polly-allow-nonaffine-branches -polly-allow-nonaffine-loops \
|
|
; RUN: -analyze < %s | FileCheck %s --check-prefix=PROFIT
|
|
;
|
|
; Verify that we over-approximate the read access of A[j] in the last statement, as j is
; computed in a non-affine loop that we do not model.
|
|
;
|
|
; CHECK: Function: f
|
|
; CHECK-NEXT: Region: %bb2---%bb24
|
|
; CHECK-NEXT: Max Loop Depth: 1
|
|
; CHECK-NEXT: Invariant Accesses: {
|
|
; CHECK-NEXT: }
|
|
; CHECK-NEXT: Context:
|
|
; CHECK-NEXT: [N] -> { : -2147483648 <= N <= 2147483647 }
|
|
; CHECK-NEXT: Assumed Context:
|
|
; CHECK-NEXT: [N] -> { : }
|
|
; CHECK-NEXT: Invalid Context:
|
|
; CHECK-NEXT: [N] -> { : false }
|
|
; CHECK: p0: %N
|
|
; CHECK-NEXT: Arrays {
|
|
; CHECK-NEXT: i32 MemRef_j_0__phi; // Element size 4
|
|
; CHECK-NEXT: i32 MemRef_j_0; // Element size 4
|
|
; CHECK-NEXT: i32 MemRef_A[*]; // Element size 4
|
|
; CHECK-NEXT: i32 MemRef_j_2__phi; // Element size 4
|
|
; CHECK-NEXT: i32 MemRef_j_2; // Element size 4
|
|
; CHECK-NEXT: }
|
|
; CHECK-NEXT: Arrays (Bounds as pw_affs) {
|
|
; CHECK-NEXT: i32 MemRef_j_0__phi; // Element size 4
|
|
; CHECK-NEXT: i32 MemRef_j_0; // Element size 4
|
|
; CHECK-NEXT: i32 MemRef_A[*]; // Element size 4
|
|
; CHECK-NEXT: i32 MemRef_j_2__phi; // Element size 4
|
|
; CHECK-NEXT: i32 MemRef_j_2; // Element size 4
|
|
; CHECK-NEXT: }
|
|
; CHECK-NEXT: Alias Groups (0):
|
|
; CHECK-NEXT: n/a
|
|
; CHECK-NEXT: Statements {
|
|
; CHECK-NEXT: Stmt_bb2
|
|
; CHECK-NEXT: Domain :=
|
|
; CHECK-NEXT: [N] -> { Stmt_bb2[i0] : 0 <= i0 <= N; Stmt_bb2[0] : N < 0 };
|
|
; CHECK-NEXT: Schedule :=
|
|
; CHECK-NEXT: [N] -> { Stmt_bb2[i0] -> [i0, 0] : i0 <= N; Stmt_bb2[0] -> [0, 0] : N < 0 };
|
|
; CHECK-NEXT: ReadAccess := [Reduction Type: NONE] [Scalar: 1]
|
|
; CHECK-NEXT: [N] -> { Stmt_bb2[i0] -> MemRef_j_0__phi[] };
|
|
; CHECK-NEXT: MustWriteAccess := [Reduction Type: NONE] [Scalar: 1]
|
|
; CHECK-NEXT: [N] -> { Stmt_bb2[i0] -> MemRef_j_0[] };
|
|
; CHECK-NEXT: Stmt_bb4__TO__bb18
|
|
; CHECK-NEXT: Domain :=
|
|
; CHECK-NEXT: [N] -> { Stmt_bb4__TO__bb18[i0] : 0 <= i0 < N };
|
|
; CHECK-NEXT: Schedule :=
|
|
; CHECK-NEXT: [N] -> { Stmt_bb4__TO__bb18[i0] -> [i0, 1] };
|
|
; CHECK-NEXT: ReadAccess := [Reduction Type: NONE] [Scalar: 0]
|
|
; CHECK-NEXT: [N] -> { Stmt_bb4__TO__bb18[i0] -> MemRef_A[i0] };
|
|
; CHECK-NEXT: ReadAccess := [Reduction Type: NONE] [Scalar: 0]
|
|
; CHECK-NEXT: [N] -> { Stmt_bb4__TO__bb18[i0] -> MemRef_A[i0] };
|
|
; CHECK-NEXT: MayWriteAccess := [Reduction Type: NONE] [Scalar: 0]
|
|
; CHECK-NEXT: [N] -> { Stmt_bb4__TO__bb18[i0] -> MemRef_A[i0] };
|
|
; CHECK-NEXT: MustWriteAccess := [Reduction Type: NONE] [Scalar: 1]
|
|
; CHECK-NEXT: [N] -> { Stmt_bb4__TO__bb18[i0] -> MemRef_j_2__phi[] };
|
|
; CHECK-NEXT: ReadAccess := [Reduction Type: NONE] [Scalar: 1]
|
|
; CHECK-NEXT: [N] -> { Stmt_bb4__TO__bb18[i0] -> MemRef_j_0[] };
|
|
; CHECK-NEXT: Stmt_bb18
|
|
; CHECK-NEXT: Domain :=
|
|
; CHECK-NEXT: [N] -> { Stmt_bb18[i0] : 0 <= i0 < N };
|
|
; CHECK-NEXT: Schedule :=
|
|
; CHECK-NEXT: [N] -> { Stmt_bb18[i0] -> [i0, 2] };
|
|
; CHECK-NEXT: MustWriteAccess := [Reduction Type: NONE] [Scalar: 1]
|
|
; CHECK-NEXT: [N] -> { Stmt_bb18[i0] -> MemRef_j_2[] };
|
|
; CHECK-NEXT: ReadAccess := [Reduction Type: NONE] [Scalar: 1]
|
|
; CHECK-NEXT: [N] -> { Stmt_bb18[i0] -> MemRef_j_2__phi[] };
|
|
; CHECK-NEXT: ReadAccess := [Reduction Type: NONE] [Scalar: 0]
|
|
; CHECK-NEXT: [N] -> { Stmt_bb18[i0] -> MemRef_A[o0] };
|
|
; CHECK-NEXT: MustWriteAccess := [Reduction Type: NONE] [Scalar: 0]
|
|
; CHECK-NEXT: [N] -> { Stmt_bb18[i0] -> MemRef_A[i0] };
|
|
; CHECK-NEXT: Stmt_bb23
|
|
; CHECK-NEXT: Domain :=
|
|
; CHECK-NEXT: [N] -> { Stmt_bb23[i0] : 0 <= i0 < N };
|
|
; CHECK-NEXT: Schedule :=
|
|
; CHECK-NEXT: [N] -> { Stmt_bb23[i0] -> [i0, 3] };
|
|
; CHECK-NEXT: ReadAccess := [Reduction Type: NONE] [Scalar: 1]
|
|
; CHECK-NEXT: [N] -> { Stmt_bb23[i0] -> MemRef_j_2[] };
|
|
; CHECK-NEXT: MustWriteAccess := [Reduction Type: NONE] [Scalar: 1]
|
|
; CHECK-NEXT: [N] -> { Stmt_bb23[i0] -> MemRef_j_0__phi[] };
|
|
; CHECK-NEXT: }
|
|
;
|
|
; Due to the scalar accesses we are not able to distribute the outer loop; thus, we do not consider the region profitable.
|
|
;
|
|
; PROFIT-NOT: Statements
|
|
;
|
|
; void f(int *A, int N, int M) {
|
|
; int i = 0, j = 0;
|
|
; for (i = 0; i < N; i++) {
|
|
; if (A[i])
|
|
; for (j = 0; j < M; j++)
|
|
; A[i]++;
|
|
; A[i] = A[j];
|
|
; }
|
|
; }
|
|
;
|
|
target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"

; IR for the C function f(int *A, int N, int M) sketched in the header comment:
; an outer loop over i that conditionally runs an inner loop over j and then
; executes A[i] = A[j]. Value and block names are referenced by the FileCheck
; expectations above (Stmt_bb2, MemRef_j_0, MemRef_j_2, ...), so they must not
; be renamed.
define void @f(i32* %A, i32 %N, i32 %M) {
bb:
  ; %smax = max(M, 0); it is the value %j.2 receives when the inner loop has run.
  %tmp = icmp sgt i32 %M, 0
  %smax = select i1 %tmp, i32 %M, i32 0
  %tmp1 = sext i32 %N to i64
  br label %bb2

; Outer loop header: i in %indvars.iv, j carried across iterations in %j.0.
bb2:                                              ; preds = %bb23, %bb
  %indvars.iv = phi i64 [ %indvars.iv.next, %bb23 ], [ 0, %bb ]
  %j.0 = phi i32 [ 0, %bb ], [ %j.2, %bb23 ]
  %tmp3 = icmp slt i64 %indvars.iv, %tmp1
  br i1 %tmp3, label %bb4, label %bb24

; if (A[i]) -- the inner loop is skipped when A[i] == 0.
bb4:                                              ; preds = %bb2
  %tmp5 = getelementptr inbounds i32, i32* %A, i64 %indvars.iv
  %tmp6 = load i32, i32* %tmp5, align 4
  %tmp7 = icmp eq i32 %tmp6, 0
  br i1 %tmp7, label %bb18, label %bb8

bb8:                                              ; preds = %bb4
  br label %bb9

; Inner loop header: for (j = 0; j < M; j++)
bb9:                                              ; preds = %bb15, %bb8
  %j.1 = phi i32 [ 0, %bb8 ], [ %tmp16, %bb15 ]
  %tmp10 = icmp slt i32 %j.1, %M
  br i1 %tmp10, label %bb11, label %bb17

; Inner loop body: A[i]++
bb11:                                             ; preds = %bb9
  %tmp12 = getelementptr inbounds i32, i32* %A, i64 %indvars.iv
  %tmp13 = load i32, i32* %tmp12, align 4
  %tmp14 = add nsw i32 %tmp13, 1
  store i32 %tmp14, i32* %tmp12, align 4
  br label %bb15

; Inner loop latch: j++
bb15:                                             ; preds = %bb11
  %tmp16 = add nuw nsw i32 %j.1, 1
  br label %bb9

bb17:                                             ; preds = %bb9
  br label %bb18

; A[i] = A[j]; %j.2 is %smax if the inner loop ran, otherwise the previous j.
; The load through %tmp20 is the read of A[j] that the test expects to be
; over-approximated (MemRef_A[o0] in the CHECK lines).
bb18:                                             ; preds = %bb4, %bb17
  %j.2 = phi i32 [ %smax, %bb17 ], [ %j.0, %bb4 ]
  %tmp19 = sext i32 %j.2 to i64
  %tmp20 = getelementptr inbounds i32, i32* %A, i64 %tmp19
  %tmp21 = load i32, i32* %tmp20, align 4
  %tmp22 = getelementptr inbounds i32, i32* %A, i64 %indvars.iv
  store i32 %tmp21, i32* %tmp22, align 4
  br label %bb23

; Outer loop latch: i++
bb23:                                             ; preds = %bb18
  %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
  br label %bb2

bb24:                                             ; preds = %bb2
  ret void
}
|