llvm-project/polly/test/Isl/Ast/alias_simple_3.ll

; RUN: opt %loadPolly -polly-code-generator=isl -polly-ast -analyze < %s | FileCheck %s --check-prefix=NOAA
; RUN: opt %loadPolly -polly-code-generator=isl -polly-ast -analyze -basicaa < %s | FileCheck %s --check-prefix=BASI
; RUN: opt %loadPolly -polly-code-generator=isl -polly-ast -analyze -tbaa < %s | FileCheck %s --check-prefix=TBAA
; RUN: opt %loadPolly -polly-code-generator=isl -polly-ast -analyze -scev-aa < %s | FileCheck %s --check-prefix=SCEV
; RUN: opt %loadPolly -polly-code-generator=isl -polly-ast -analyze -globalsmodref-aa < %s | FileCheck %s --check-prefix=GLOB
;
;    int A[1024];
;    float B[1024];
;
;    void jd(int N) {
;      for (int i = 0; i < N; i++)
;        A[i] = B[i];
;    }
;
; NOAA: if ((N <= 1024 ? 1 : 0) && (&MemRef_A[N] <= &MemRef_B[0] || &MemRef_B[N] <= &MemRef_A[0]))
; BASI: if (N <= 1024 ? 1 : 0)
; TBAA: if (N <= 1024 ? 1 : 0)
; SCEV: if ((N <= 1024 ? 1 : 0) && (&MemRef_A[N] <= &MemRef_B[0] || &MemRef_B[N] <= &MemRef_A[0]))
; GLOB: if ((N <= 1024 ? 1 : 0) && (&MemRef_A[N] <= &MemRef_B[0] || &MemRef_B[N] <= &MemRef_A[0]))
;
; Data layout string for this test module.
target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"

; The two arrays accessed by @jd: @A holds 1024 i32 elements and @B holds
; 1024 float elements. Both are zero-initialized common globals aligned to 16.
@A = common global [1024 x i32] zeroinitializer, align 16
@B = common global [1024 x float] zeroinitializer, align 16

; jd(N): for every i in [0, N), load B[i] as a float, convert it to a signed
; i32 and store the result to A[i]. The load and the store carry different
; !tbaa access tags (!1 and !5 respectively).
define void @jd(i32 %N) {
entry:
  ; Guard: the loop is skipped entirely unless N > 0 (signed compare).
  %cmp6 = icmp sgt i32 %N, 0
  br i1 %cmp6, label %for.body.preheader, label %for.end

for.body.preheader:                               ; preds = %entry
  br label %for.body

for.body:                                         ; preds = %for.body.preheader, %for.body
  ; 64-bit induction variable: 0 on entry, %indvars.iv.next on the back edge.
  %indvars.iv = phi i64 [ %indvars.iv.next, %for.body ], [ 0, %for.body.preheader ]
  ; Read B[i].
  %arrayidx = getelementptr inbounds  [1024 x float]* @B, i64 0, i64 %indvars.iv
  %tmp = load float* %arrayidx, align 4, !tbaa !1
  ; Convert the loaded float to a signed 32-bit integer.
  %conv = fptosi float %tmp to i32
  ; Write the converted value to A[i].
  %arrayidx2 = getelementptr inbounds [1024 x i32]* @A, i64 0, i64 %indvars.iv
  store i32 %conv, i32* %arrayidx2, align 4, !tbaa !5
  ; Advance i by one; the loop exits once the truncated next index equals N.
  %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
  %lftr.wideiv1 = trunc i64 %indvars.iv.next to i32
  %exitcond2 = icmp eq i32 %lftr.wideiv1, %N
  br i1 %exitcond2, label %for.end.loopexit, label %for.body

for.end.loopexit:                                 ; preds = %for.body
  br label %for.end

for.end:                                          ; preds = %for.end.loopexit, %entry
  ret void
}

; Type-based alias analysis metadata referenced by the load (!1) and the
; store (!5) in @jd.
; !0 is not referenced by any instruction or by any other node shown here.
!0 = metadata !{metadata !""}
; Access tag on the load from @B: base type !2, access type !2, offset 0.
!1 = metadata !{metadata !2, metadata !2, i64 0}
; Type node "float"; its parent is !3.
!2 = metadata !{metadata !"float", metadata !3, i64 0}
; Type node "omnipotent char"; its parent is the root node !4.
!3 = metadata !{metadata !"omnipotent char", metadata !4, i64 0}
; Root node of the type tree.
!4 = metadata !{metadata !"Simple C/C++ TBAA"}
; Access tag on the store to @A: base type !6, access type !6, offset 0.
!5 = metadata !{metadata !6, metadata !6, i64 0}
; Type node "int"; its parent is !3, the same parent as "float".
!6 = metadata !{metadata !"int", metadata !3, i64 0}
[RTC] Runtime Alias Checks for the ISL backend (missing tests) Test files missing in r218046. llvm-svn: 218047 2014-09-18 19:20:36 +08:00			`; RUN: opt %loadPolly -polly-code-generator=isl -polly-ast -analyze < %s \| FileCheck %s --check-prefix=NOAA`
			`; RUN: opt %loadPolly -polly-code-generator=isl -polly-ast -analyze -basicaa < %s \| FileCheck %s --check-prefix=BASI`
			`; RUN: opt %loadPolly -polly-code-generator=isl -polly-ast -analyze -tbaa < %s \| FileCheck %s --check-prefix=TBAA`
			`; RUN: opt %loadPolly -polly-code-generator=isl -polly-ast -analyze -scev-aa < %s \| FileCheck %s --check-prefix=SCEV`
			`; RUN: opt %loadPolly -polly-code-generator=isl -polly-ast -analyze -globalsmodref-aa < %s \| FileCheck %s --check-prefix=GLOB`
			`;`
			`; int A[1024];`
			`; float B[1024];`
			`;`
			`; void jd(int N) {`
			`; for (int i = 0; i < N; i++)`
			`; A[i] = B[i];`
			`; }`
			`;`
Assume GetElementPtr offsets to be inbounds In case a GEP instruction references into a fixed size array e.g., an access A[i][j] into an array A[100x100], LLVM-IR does not guarantee that the subscripts always compute values that are within array bounds. We now derive the set of parameter values for which all accesses are within bounds and add the assumption that the scop is only ever executed with this set of parameter values. Example: void foo(float A[][20], long n, long m) { for (long i = 0; i < n; i++) for (long j = 0; j < m; j++) A[i][j] = ... This loop yields out-of-bound accesses if m is greater than 20 and at the same time at least one iteration of the outer loop is executed. Hence, we assume: n <= 0 or m <= 20. Doing so simplifies the dependence analysis problem, allows us to perform more optimizations and generate better code. TODO: The location where the GEP instruction is executed is not necessarily the location where the memory is actually accessed. As a result scanning for GEP[s] is imprecise. Even though this is not a correctness problem, this imprecision may result in missed optimizations or non-optimal run-time checks. In polybench where this mismatch between parametric loop bounds and fixed size arrays is common, we see with this patch significant reductions in compile time (up to 50%) and execution time (up to 70%). We see two significant compile time regressions (fdtd-2d, jacobi-2d-imper), and one execution time regression (trmm). Both regressions arise due to additional optimizations that have been enabled by this patch. They can be addressed in subsequent commits. http://reviews.llvm.org/D6369 llvm-svn: 222754 2014-11-25 18:51:12 +08:00			`; NOAA: if ((N <= 1024 ? 1 : 0) && (&MemRef_A[N] <= &MemRef_B[0] \|\| &MemRef_B[N] <= &MemRef_A[0]))`
			`; BASI: if (N <= 1024 ? 1 : 0)`
			`; TBAA: if (N <= 1024 ? 1 : 0)`
			`; SCEV: if ((N <= 1024 ? 1 : 0) && (&MemRef_A[N] <= &MemRef_B[0] \|\| &MemRef_B[N] <= &MemRef_A[0]))`
			`; GLOB: if ((N <= 1024 ? 1 : 0) && (&MemRef_A[N] <= &MemRef_B[0] \|\| &MemRef_B[N] <= &MemRef_A[0]))`
[RTC] Runtime Alias Checks for the ISL backend (missing tests) Test files missing in r218046. llvm-svn: 218047 2014-09-18 19:20:36 +08:00			`;`
			`target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"`

			`@A = common global [1024 x i32] zeroinitializer, align 16`
			`@B = common global [1024 x float] zeroinitializer, align 16`

			`define void @jd(i32 %N) {`
			`entry:`
			`%cmp6 = icmp sgt i32 %N, 0`
			`br i1 %cmp6, label %for.body.preheader, label %for.end`

			`for.body.preheader: ; preds = %entry`
			`br label %for.body`

			`for.body: ; preds = %for.body.preheader, %for.body`
			`%indvars.iv = phi i64 [ %indvars.iv.next, %for.body ], [ 0, %for.body.preheader ]`
			`%arrayidx = getelementptr inbounds [1024 x float]* @B, i64 0, i64 %indvars.iv`
			`%tmp = load float* %arrayidx, align 4, !tbaa !1`
			`%conv = fptosi float %tmp to i32`
			`%arrayidx2 = getelementptr inbounds [1024 x i32]* @A, i64 0, i64 %indvars.iv`
			`store i32 %conv, i32* %arrayidx2, align 4, !tbaa !5`
			`%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1`
			`%lftr.wideiv1 = trunc i64 %indvars.iv.next to i32`
			`%exitcond2 = icmp eq i32 %lftr.wideiv1, %N`
			`br i1 %exitcond2, label %for.end.loopexit, label %for.body`

			`for.end.loopexit: ; preds = %for.body`
			`br label %for.end`

			`for.end: ; preds = %for.end.loopexit, %entry`
			`ret void`
			`}`

			`!0 = metadata !{metadata !""}`
			`!1 = metadata !{metadata !2, metadata !2, i64 0}`
			`!2 = metadata !{metadata !"float", metadata !3, i64 0}`
			`!3 = metadata !{metadata !"omnipotent char", metadata !4, i64 0}`
			`!4 = metadata !{metadata !"Simple C/C++ TBAA"}`
			`!5 = metadata !{metadata !6, metadata !6, i64 0}`
			`!6 = metadata !{metadata !"int", metadata !3, i64 0}`