2016-08-15 23:56:24 +08:00
|
|
|
; RUN: opt %loadPolly -polly-scops -analyze \
|
|
|
|
; RUN: -polly-invariant-load-hoisting=true < %s | FileCheck %s
|
2016-05-12 23:13:49 +08:00
|
|
|
;
|
|
|
|
; void f(unsigned *restrict I, unsigned *restrict A, unsigned N, unsigned M) {
|
|
|
|
; for (unsigned i = 0; i < N; i++) {
|
|
|
|
; unsigned char V = *I;
|
|
|
|
; if (V < M)
|
|
|
|
; A[i]++;
|
|
|
|
; }
|
|
|
|
; }
|
|
|
|
;
|
[SCEVAffinator] Make precise modular math more correct.
Integer math in LLVM IR is modular. Integer math in isl is
arbitrary-precision. Modeling LLVM IR math correctly in isl requires
either adding assumptions that math doesn't actually overflow, or
explicitly wrapping the math. However, expressions with the "nsw" flag
are special; we can pretend they're arbitrary-precision because it's
undefined behavior if the result wraps. SCEV expressions based on IR
instructions with an nsw flag also carry an nsw flag (roughly; actually,
the real rule is a bit more complicated, but the details don't matter
here).
Before this patch, SCEV flags were also overloaded with an additional
function: the ZExt code was mutating SCEV expressions as a hack to
indicate to checkForWrapping that we don't need to add assumptions to
the operand of a ZExt; it'll add explicit wrapping itself. This kind of
works... the problem is that if anything else ever touches that SCEV
expression, it'll get confused by the incorrect flags.
Instead, with this patch, we make the decision about whether to
explicitly wrap the math a bit earlier, basing the decision purely on
the SCEV expression itself, and not its users.
Differential Revision: https://reviews.llvm.org/D25287
llvm-svn: 284848
2016-10-22 02:08:02 +08:00
|
|
|
; FIXME: The truncated value should be a paramter.
|
2016-05-12 23:13:49 +08:00
|
|
|
; CHECK: Assumed Context:
|
|
|
|
; CHECK-NEXT: [N, tmp, M] -> { : }
|
|
|
|
; CHECK-NEXT: Invalid Context:
|
[SCEVAffinator] Make precise modular math more correct.
Integer math in LLVM IR is modular. Integer math in isl is
arbitrary-precision. Modeling LLVM IR math correctly in isl requires
either adding assumptions that math doesn't actually overflow, or
explicitly wrapping the math. However, expressions with the "nsw" flag
are special; we can pretend they're arbitrary-precision because it's
undefined behavior if the result wraps. SCEV expressions based on IR
instructions with an nsw flag also carry an nsw flag (roughly; actually,
the real rule is a bit more complicated, but the details don't matter
here).
Before this patch, SCEV flags were also overloaded with an additional
function: the ZExt code was mutating SCEV expressions as a hack to
indicate to checkForWrapping that we don't need to add assumptions to
the operand of a ZExt; it'll add explicit wrapping itself. This kind of
works... the problem is that if anything else ever touches that SCEV
expression, it'll get confused by the incorrect flags.
Instead, with this patch, we make the decision about whether to
explicitly wrap the math a bit earlier, basing the decision purely on
the SCEV expression itself, and not its users.
Differential Revision: https://reviews.llvm.org/D25287
llvm-svn: 284848
2016-10-22 02:08:02 +08:00
|
|
|
; CHECK-NEXT: [N, tmp, M] -> { : N < 0 or (N > 0 and tmp >= 128) or (N > 0 and tmp < 0) or (N > 0 and M < 0) }
|
2016-05-12 23:13:49 +08:00
|
|
|
;
|
|
|
|
; CHECK: Domain :=
|
2017-07-20 20:37:02 +08:00
|
|
|
; CHECK-NEXT: [N, tmp, M] -> { Stmt_if_then[i0] : tmp >= 0 and M > tmp and 0 <= i0 < N };
|
2016-05-12 23:13:49 +08:00
|
|
|
;
|
|
|
|
target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
|
|
|
|
|
|
|
|
define void @f(i32* noalias %I, i32* noalias %A, i32 %N, i32 %M) {
|
|
|
|
entry:
|
|
|
|
br label %for.cond
|
|
|
|
|
|
|
|
for.cond: ; preds = %for.inc, %entry
|
|
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %for.inc ], [ 0, %entry ]
|
|
|
|
%lftr.wideiv = trunc i64 %indvars.iv to i32
|
|
|
|
%exitcond = icmp ne i32 %lftr.wideiv, %N
|
|
|
|
br i1 %exitcond, label %for.body, label %for.end
|
|
|
|
|
|
|
|
for.body: ; preds = %for.cond
|
|
|
|
%tmp = load i32, i32* %I, align 4
|
|
|
|
%conv1 = and i32 %tmp, 255
|
|
|
|
%cmp2 = icmp ult i32 %conv1, %M
|
|
|
|
br i1 %cmp2, label %if.then, label %if.end
|
|
|
|
|
|
|
|
if.then: ; preds = %for.body
|
|
|
|
%arrayidx = getelementptr inbounds i32, i32* %A, i64 %indvars.iv
|
|
|
|
%tmp1 = load i32, i32* %arrayidx, align 4
|
|
|
|
%inc = add i32 %tmp1, 1
|
|
|
|
store i32 %inc, i32* %arrayidx, align 4
|
|
|
|
br label %if.end
|
|
|
|
|
|
|
|
if.end: ; preds = %if.then, %for.body
|
|
|
|
br label %for.inc
|
|
|
|
|
|
|
|
for.inc: ; preds = %if.end
|
|
|
|
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
|
|
br label %for.cond
|
|
|
|
|
|
|
|
for.end: ; preds = %for.cond
|
|
|
|
ret void
|
|
|
|
}
|