2020-06-27 11:41:37 +08:00
|
|
|
; RUN: opt -S -basic-aa -licm < %s | FileCheck %s
|
2020-09-19 05:43:36 +08:00
|
|
|
; RUN: opt -aa-pipeline=basic-aa -passes='require<opt-remark-emit>,loop(loop-simplifycfg,licm)' -S < %s | FileCheck %s
|
2020-06-27 11:41:37 +08:00
|
|
|
; RUN: opt -S -basic-aa -licm -enable-mssa-loop-dependency=true -verify-memoryssa < %s | FileCheck %s
|
2020-09-19 05:43:36 +08:00
|
|
|
; RUN: opt -aa-pipeline=basic-aa -passes='require<opt-remark-emit>,loop-mssa(loop-simplifycfg,licm)' -verify-memoryssa -S < %s | FileCheck %s
|
2019-04-17 12:52:47 +08:00
|
|
|
|
|
|
|
target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
|
|
|
|
target triple = "x86_64-unknown-linux-gnu"
|
|
|
|
|
|
|
|
; This test represents the following function:
|
|
|
|
; void test1(int * __restrict__ a, int * __restrict__ b, int &c, int n) {
|
|
|
|
; for (int i = 0; i < n; ++i)
|
|
|
|
; if (a[i] > 0)
|
|
|
|
; a[i] = c*b[i];
|
|
|
|
; }
|
|
|
|
; and we want to hoist the load of %c out of the loop. This can be done only
|
|
|
|
; because the dereferenceable attribute is on %c.
|
|
|
|
|
|
|
|
; CHECK-LABEL: @test1
|
|
|
|
; CHECK: load i32, i32* %c, align 4
|
|
|
|
; CHECK: for.body:
|
|
|
|
|
2020-05-17 08:55:18 +08:00
|
|
|
define void @test1(i32* noalias nocapture %a, i32* noalias nocapture readonly %b, i32* nocapture readonly nonnull dereferenceable(4) align 4 %c, i32 %n) #0 {
|
2019-04-17 12:52:47 +08:00
|
|
|
entry:
|
|
|
|
%cmp11 = icmp sgt i32 %n, 0
|
|
|
|
br i1 %cmp11, label %for.body, label %for.end
|
|
|
|
|
|
|
|
for.body: ; preds = %entry, %for.inc
|
|
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %for.inc ], [ 0, %entry ]
|
|
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
|
|
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
|
|
%cmp1 = icmp sgt i32 %0, 0
|
|
|
|
br i1 %cmp1, label %if.then, label %for.inc
|
|
|
|
|
|
|
|
if.then: ; preds = %for.body
|
|
|
|
%1 = load i32, i32* %c, align 4
|
|
|
|
%arrayidx3 = getelementptr inbounds i32, i32* %b, i64 %indvars.iv
|
|
|
|
%2 = load i32, i32* %arrayidx3, align 4
|
|
|
|
%mul = mul nsw i32 %2, %1
|
|
|
|
store i32 %mul, i32* %arrayidx, align 4
|
|
|
|
br label %for.inc
|
|
|
|
|
|
|
|
for.inc: ; preds = %for.body, %if.then
|
|
|
|
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
|
|
%lftr.wideiv = trunc i64 %indvars.iv.next to i32
|
|
|
|
%exitcond = icmp eq i32 %lftr.wideiv, %n
|
|
|
|
br i1 %exitcond, label %for.end, label %for.body
|
|
|
|
|
|
|
|
for.end: ; preds = %for.inc, %entry
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; This is the same as @test1, but without the dereferenceable attribute on %c.
|
|
|
|
; Without this attribute, we should not hoist the load of %c.
|
|
|
|
|
|
|
|
; CHECK-LABEL: @test2
|
|
|
|
; CHECK: if.then:
|
|
|
|
; CHECK: load i32, i32* %c, align 4
|
|
|
|
|
|
|
|
define void @test2(i32* noalias nocapture %a, i32* noalias nocapture readonly %b, i32* nocapture readonly nonnull %c, i32 %n) #0 {
|
|
|
|
entry:
|
|
|
|
%cmp11 = icmp sgt i32 %n, 0
|
|
|
|
br i1 %cmp11, label %for.body, label %for.end
|
|
|
|
|
|
|
|
for.body: ; preds = %entry, %for.inc
|
|
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %for.inc ], [ 0, %entry ]
|
|
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
|
|
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
|
|
%cmp1 = icmp sgt i32 %0, 0
|
|
|
|
br i1 %cmp1, label %if.then, label %for.inc
|
|
|
|
|
|
|
|
if.then: ; preds = %for.body
|
|
|
|
%1 = load i32, i32* %c, align 4
|
|
|
|
%arrayidx3 = getelementptr inbounds i32, i32* %b, i64 %indvars.iv
|
|
|
|
%2 = load i32, i32* %arrayidx3, align 4
|
|
|
|
%mul = mul nsw i32 %2, %1
|
|
|
|
store i32 %mul, i32* %arrayidx, align 4
|
|
|
|
br label %for.inc
|
|
|
|
|
|
|
|
for.inc: ; preds = %for.body, %if.then
|
|
|
|
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
|
|
%lftr.wideiv = trunc i64 %indvars.iv.next to i32
|
|
|
|
%exitcond = icmp eq i32 %lftr.wideiv, %n
|
|
|
|
br i1 %exitcond, label %for.end, label %for.body
|
|
|
|
|
|
|
|
for.end: ; preds = %for.inc, %entry
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; This test represents the following function:
|
|
|
|
; void test3(int * restrict a, int * restrict b, int c[static 3], int n) {
|
|
|
|
; for (int i = 0; i < n; ++i)
|
|
|
|
; if (a[i] > 0)
|
|
|
|
; a[i] = c[2]*b[i];
|
|
|
|
; }
|
|
|
|
; and we want to hoist the load of c[2] out of the loop. This can be done only
|
|
|
|
; because the dereferenceable attribute is on %c.
|
|
|
|
|
|
|
|
; CHECK-LABEL: @test3
|
|
|
|
; CHECK: load i32, i32* %c2, align 4
|
|
|
|
; CHECK: for.body:
|
|
|
|
|
2020-05-17 08:55:18 +08:00
|
|
|
define void @test3(i32* noalias nocapture %a, i32* noalias nocapture readonly %b, i32* nocapture readonly dereferenceable(12) align 4 %c, i32 %n) #0 {
|
2019-04-17 12:52:47 +08:00
|
|
|
entry:
|
|
|
|
%cmp11 = icmp sgt i32 %n, 0
|
|
|
|
br i1 %cmp11, label %for.body, label %for.end
|
|
|
|
|
|
|
|
for.body: ; preds = %entry, %for.inc
|
|
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %for.inc ], [ 0, %entry ]
|
|
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
|
|
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
|
|
%cmp1 = icmp sgt i32 %0, 0
|
|
|
|
br i1 %cmp1, label %if.then, label %for.inc
|
|
|
|
|
|
|
|
if.then: ; preds = %for.body
|
|
|
|
%c2 = getelementptr inbounds i32, i32* %c, i64 2
|
|
|
|
%1 = load i32, i32* %c2, align 4
|
|
|
|
%arrayidx3 = getelementptr inbounds i32, i32* %b, i64 %indvars.iv
|
|
|
|
%2 = load i32, i32* %arrayidx3, align 4
|
|
|
|
%mul = mul nsw i32 %2, %1
|
|
|
|
store i32 %mul, i32* %arrayidx, align 4
|
|
|
|
br label %for.inc
|
|
|
|
|
|
|
|
for.inc: ; preds = %for.body, %if.then
|
|
|
|
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
|
|
%lftr.wideiv = trunc i64 %indvars.iv.next to i32
|
|
|
|
%exitcond = icmp eq i32 %lftr.wideiv, %n
|
|
|
|
br i1 %exitcond, label %for.end, label %for.body
|
|
|
|
|
|
|
|
for.end: ; preds = %for.inc, %entry
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; This is the same as @test3, but with a dereferenceable attribute on %c with a
|
|
|
|
; size too small to cover c[2] (and so we should not hoist it).
|
|
|
|
|
|
|
|
; CHECK-LABEL: @test4
|
|
|
|
; CHECK: if.then:
|
|
|
|
; CHECK: load i32, i32* %c2, align 4
|
|
|
|
|
|
|
|
define void @test4(i32* noalias nocapture %a, i32* noalias nocapture readonly %b, i32* nocapture readonly dereferenceable(11) %c, i32 %n) #0 {
|
|
|
|
entry:
|
|
|
|
%cmp11 = icmp sgt i32 %n, 0
|
|
|
|
br i1 %cmp11, label %for.body, label %for.end
|
|
|
|
|
|
|
|
for.body: ; preds = %entry, %for.inc
|
|
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %for.inc ], [ 0, %entry ]
|
|
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
|
|
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
|
|
%cmp1 = icmp sgt i32 %0, 0
|
|
|
|
br i1 %cmp1, label %if.then, label %for.inc
|
|
|
|
|
|
|
|
if.then: ; preds = %for.body
|
|
|
|
%c2 = getelementptr inbounds i32, i32* %c, i64 2
|
|
|
|
%1 = load i32, i32* %c2, align 4
|
|
|
|
%arrayidx3 = getelementptr inbounds i32, i32* %b, i64 %indvars.iv
|
|
|
|
%2 = load i32, i32* %arrayidx3, align 4
|
|
|
|
%mul = mul nsw i32 %2, %1
|
|
|
|
store i32 %mul, i32* %arrayidx, align 4
|
|
|
|
br label %for.inc
|
|
|
|
|
|
|
|
for.inc: ; preds = %for.body, %if.then
|
|
|
|
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
|
|
%lftr.wideiv = trunc i64 %indvars.iv.next to i32
|
|
|
|
%exitcond = icmp eq i32 %lftr.wideiv, %n
|
|
|
|
br i1 %exitcond, label %for.end, label %for.body
|
|
|
|
|
|
|
|
for.end: ; preds = %for.inc, %entry
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; This test represents the following function:
|
|
|
|
; void test5(int * __restrict__ a, int *b, int &c, int n) {
|
|
|
|
; if (c != null)
|
|
|
|
; for (int i = 0; i < n; ++i)
|
|
|
|
; if (a[i] > 0)
|
|
|
|
; a[i] = c*b[i];
|
|
|
|
; }
|
|
|
|
; and we want to hoist the load of %c out of the loop. This can be done only
|
|
|
|
; because the dereferenceable_or_null attribute is on %c and there is a null
|
|
|
|
; check on %c.
|
|
|
|
|
|
|
|
; CHECK-LABEL: @test5
|
|
|
|
; CHECK: load i32, i32* %c, align 4
|
|
|
|
; CHECK: for.body:
|
|
|
|
|
2020-05-17 08:55:18 +08:00
|
|
|
define void @test5(i32* noalias %a, i32* %b, i32* dereferenceable_or_null(4) align 4 %c, i32 %n) #0 {
|
2019-04-17 12:52:47 +08:00
|
|
|
entry:
|
|
|
|
%not_null = icmp ne i32* %c, null
|
|
|
|
br i1 %not_null, label %not.null, label %for.end
|
|
|
|
|
|
|
|
not.null:
|
|
|
|
%cmp11 = icmp sgt i32 %n, 0
|
|
|
|
br i1 %cmp11, label %for.body, label %for.end
|
|
|
|
|
|
|
|
for.body: ; preds = %not.null, %for.inc
|
|
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %for.inc ], [ 0, %not.null ]
|
|
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
|
|
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
|
|
%cmp1 = icmp sgt i32 %0, 0
|
|
|
|
br i1 %cmp1, label %if.then, label %for.inc
|
|
|
|
|
|
|
|
if.then: ; preds = %for.body
|
|
|
|
%1 = load i32, i32* %c, align 4
|
|
|
|
%arrayidx3 = getelementptr inbounds i32, i32* %b, i64 %indvars.iv
|
|
|
|
%2 = load i32, i32* %arrayidx3, align 4
|
|
|
|
%mul = mul nsw i32 %2, %1
|
|
|
|
store i32 %mul, i32* %arrayidx, align 4
|
|
|
|
br label %for.inc
|
|
|
|
|
|
|
|
for.inc: ; preds = %for.body, %if.then
|
|
|
|
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
|
|
%lftr.wideiv = trunc i64 %indvars.iv.next to i32
|
|
|
|
%exitcond = icmp eq i32 %lftr.wideiv, %n
|
|
|
|
br i1 %exitcond, label %for.end, label %for.body
|
|
|
|
|
|
|
|
for.end: ; preds = %for.inc, %entry, %not.null
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; This is the same as @test5, but without the null check on %c.
|
|
|
|
; Without this check, we should not hoist the load of %c.
|
|
|
|
|
|
|
|
; This test case has an icmp on c but the use of this comparison is
|
|
|
|
; not a branch.
|
|
|
|
|
|
|
|
; CHECK-LABEL: @test6
|
|
|
|
; CHECK: if.then:
|
|
|
|
; CHECK: load i32, i32* %c, align 4
|
|
|
|
|
|
|
|
define i1 @test6(i32* noalias %a, i32* %b, i32* dereferenceable_or_null(4) %c, i32 %n) #0 {
|
|
|
|
entry:
|
|
|
|
%not_null = icmp ne i32* %c, null
|
|
|
|
%cmp11 = icmp sgt i32 %n, 0
|
|
|
|
br i1 %cmp11, label %for.body, label %for.end
|
|
|
|
|
|
|
|
for.body: ; preds = %entry, %for.inc
|
|
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %for.inc ], [ 0, %entry ]
|
|
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
|
|
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
|
|
%cmp1 = icmp sgt i32 %0, 0
|
|
|
|
br i1 %cmp1, label %if.then, label %for.inc
|
|
|
|
|
|
|
|
if.then: ; preds = %for.body
|
|
|
|
%1 = load i32, i32* %c, align 4
|
|
|
|
%arrayidx3 = getelementptr inbounds i32, i32* %b, i64 %indvars.iv
|
|
|
|
%2 = load i32, i32* %arrayidx3, align 4
|
|
|
|
%mul = mul nsw i32 %2, %1
|
|
|
|
store i32 %mul, i32* %arrayidx, align 4
|
|
|
|
br label %for.inc
|
|
|
|
|
|
|
|
for.inc: ; preds = %for.body, %if.then
|
|
|
|
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
|
|
%lftr.wideiv = trunc i64 %indvars.iv.next to i32
|
|
|
|
%exitcond = icmp eq i32 %lftr.wideiv, %n
|
|
|
|
br i1 %exitcond, label %for.end, label %for.body
|
|
|
|
|
|
|
|
for.end: ; preds = %for.inc, %entry
|
|
|
|
ret i1 %not_null
|
|
|
|
}
|
|
|
|
|
|
|
|
; This test represents the following function:
|
|
|
|
; void test7(int * __restrict__ a, int *b, int **cptr, int n) {
|
|
|
|
; c = *cptr;
|
|
|
|
; for (int i = 0; i < n; ++i)
|
|
|
|
; if (a[i] > 0)
|
|
|
|
; a[i] = (*c)*b[i];
|
|
|
|
; }
|
|
|
|
; and we want to hoist the load of %c out of the loop. This can be done only
|
|
|
|
; because of the dereferenceable metadata on the c = *cptr load.
|
|
|
|
|
|
|
|
; CHECK-LABEL: @test7
|
|
|
|
; CHECK: load i32, i32* %c, align 4
|
|
|
|
; CHECK: for.body:
|
|
|
|
|
|
|
|
define void @test7(i32* noalias %a, i32* %b, i32** %cptr, i32 %n) #0 {
|
|
|
|
entry:
|
2020-05-17 08:55:18 +08:00
|
|
|
%c = load i32*, i32** %cptr, !dereferenceable !0, !align !{i64 4}
|
2019-04-17 12:52:47 +08:00
|
|
|
%cmp11 = icmp sgt i32 %n, 0
|
|
|
|
br i1 %cmp11, label %for.body, label %for.end
|
|
|
|
|
|
|
|
for.body: ; preds = %entry, %for.inc
|
|
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %for.inc ], [ 0, %entry ]
|
|
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
|
|
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
|
|
%cmp1 = icmp sgt i32 %0, 0
|
|
|
|
br i1 %cmp1, label %if.then, label %for.inc
|
|
|
|
|
|
|
|
if.then: ; preds = %for.body
|
|
|
|
%1 = load i32, i32* %c, align 4
|
|
|
|
%arrayidx3 = getelementptr inbounds i32, i32* %b, i64 %indvars.iv
|
|
|
|
%2 = load i32, i32* %arrayidx3, align 4
|
|
|
|
%mul = mul nsw i32 %2, %1
|
|
|
|
store i32 %mul, i32* %arrayidx, align 4
|
|
|
|
br label %for.inc
|
|
|
|
|
|
|
|
for.inc: ; preds = %for.body, %if.then
|
|
|
|
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
|
|
%lftr.wideiv = trunc i64 %indvars.iv.next to i32
|
|
|
|
%exitcond = icmp eq i32 %lftr.wideiv, %n
|
|
|
|
br i1 %exitcond, label %for.end, label %for.body
|
|
|
|
|
|
|
|
for.end: ; preds = %for.inc, %entry
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; This test represents the following function:
|
|
|
|
; void test8(int * __restrict__ a, int *b, int **cptr, int n) {
|
|
|
|
; c = *cptr;
|
|
|
|
; if (c != null)
|
|
|
|
; for (int i = 0; i < n; ++i)
|
|
|
|
; if (a[i] > 0)
|
|
|
|
; a[i] = (*c)*b[i];
|
|
|
|
; }
|
|
|
|
; and we want to hoist the load of %c out of the loop. This can be done only
|
|
|
|
; because of the dereferenceable_or_null metadata on the c = *cptr load and there
|
|
|
|
; is a null check on %c.
|
|
|
|
|
|
|
|
; CHECK-LABEL: @test8
|
|
|
|
; CHECK: load i32, i32* %c, align 4
|
|
|
|
; CHECK: for.body:
|
|
|
|
|
|
|
|
define void @test8(i32* noalias %a, i32* %b, i32** %cptr, i32 %n) #0 {
|
|
|
|
entry:
|
2020-05-17 08:55:18 +08:00
|
|
|
%c = load i32*, i32** %cptr, !dereferenceable_or_null !0, !align !{i64 4}
|
2019-04-17 12:52:47 +08:00
|
|
|
%not_null = icmp ne i32* %c, null
|
|
|
|
br i1 %not_null, label %not.null, label %for.end
|
|
|
|
|
|
|
|
not.null:
|
|
|
|
%cmp11 = icmp sgt i32 %n, 0
|
|
|
|
br i1 %cmp11, label %for.body, label %for.end
|
|
|
|
|
|
|
|
for.body: ; preds = %not.null, %for.inc
|
|
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %for.inc ], [ 0, %not.null ]
|
|
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
|
|
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
|
|
%cmp1 = icmp sgt i32 %0, 0
|
|
|
|
br i1 %cmp1, label %if.then, label %for.inc
|
|
|
|
|
|
|
|
if.then: ; preds = %for.body
|
|
|
|
%1 = load i32, i32* %c, align 4
|
|
|
|
%arrayidx3 = getelementptr inbounds i32, i32* %b, i64 %indvars.iv
|
|
|
|
%2 = load i32, i32* %arrayidx3, align 4
|
|
|
|
%mul = mul nsw i32 %2, %1
|
|
|
|
store i32 %mul, i32* %arrayidx, align 4
|
|
|
|
br label %for.inc
|
|
|
|
|
|
|
|
for.inc: ; preds = %for.body, %if.then
|
|
|
|
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
|
|
%lftr.wideiv = trunc i64 %indvars.iv.next to i32
|
|
|
|
%exitcond = icmp eq i32 %lftr.wideiv, %n
|
|
|
|
br i1 %exitcond, label %for.end, label %for.body
|
|
|
|
|
|
|
|
for.end: ; preds = %for.inc, %entry, %not.null
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; This is the same as @test8, but without the null check on %c.
|
|
|
|
; Without this check, we should not hoist the load of %c.
|
|
|
|
|
|
|
|
; CHECK-LABEL: @test9
|
|
|
|
; CHECK: if.then:
|
|
|
|
; CHECK: load i32, i32* %c, align 4
|
|
|
|
|
|
|
|
define void @test9(i32* noalias %a, i32* %b, i32** %cptr, i32 %n) #0 {
|
|
|
|
entry:
|
|
|
|
%c = load i32*, i32** %cptr, !dereferenceable_or_null !0
|
|
|
|
%cmp11 = icmp sgt i32 %n, 0
|
|
|
|
br i1 %cmp11, label %for.body, label %for.end
|
|
|
|
|
|
|
|
for.body: ; preds = %entry, %for.inc
|
|
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %for.inc ], [ 0, %entry ]
|
|
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
|
|
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
|
|
%cmp1 = icmp sgt i32 %0, 0
|
|
|
|
br i1 %cmp1, label %if.then, label %for.inc
|
|
|
|
|
|
|
|
if.then: ; preds = %for.body
|
|
|
|
%1 = load i32, i32* %c, align 4
|
|
|
|
%arrayidx3 = getelementptr inbounds i32, i32* %b, i64 %indvars.iv
|
|
|
|
%2 = load i32, i32* %arrayidx3, align 4
|
|
|
|
%mul = mul nsw i32 %2, %1
|
|
|
|
store i32 %mul, i32* %arrayidx, align 4
|
|
|
|
br label %for.inc
|
|
|
|
|
|
|
|
for.inc: ; preds = %for.body, %if.then
|
|
|
|
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
|
|
%lftr.wideiv = trunc i64 %indvars.iv.next to i32
|
|
|
|
%exitcond = icmp eq i32 %lftr.wideiv, %n
|
|
|
|
br i1 %exitcond, label %for.end, label %for.body
|
|
|
|
|
|
|
|
for.end: ; preds = %for.inc, %entry
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; In this test we should be able to only hoist load from %cptr. We can't hoist
|
|
|
|
; the load from %c because its dereferenceability can depend on the %cmp1 condition.
|
|
|
|
; By moving it out of the loop we break this dependency and can not rely
|
|
|
|
; on the dereferenceability anymore.
|
|
|
|
; In other words this test checks that we strip dereferenceability metadata
|
|
|
|
; after hoisting an instruction.
|
|
|
|
|
|
|
|
; CHECK-LABEL: @test10
|
|
|
|
; CHECK: %c = load i32*, i32** %cptr
|
|
|
|
; CHECK-NOT: dereferenceable
|
|
|
|
; CHECK: if.then:
|
|
|
|
; CHECK: load i32, i32* %c, align 4
|
|
|
|
|
2020-05-17 08:55:18 +08:00
|
|
|
define void @test10(i32* noalias %a, i32* %b, i32** dereferenceable(8) align 8 %cptr, i32 %n) #0 {
|
2019-04-17 12:52:47 +08:00
|
|
|
entry:
|
|
|
|
%cmp11 = icmp sgt i32 %n, 0
|
|
|
|
br i1 %cmp11, label %for.body, label %for.end
|
|
|
|
|
|
|
|
for.body: ; preds = %entry, %for.inc
|
|
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %for.inc ], [ 0, %entry ]
|
|
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
|
|
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
|
|
%cmp1 = icmp sgt i32 %0, 0
|
|
|
|
br i1 %cmp1, label %if.then, label %for.inc
|
|
|
|
|
|
|
|
if.then: ; preds = %for.body
|
|
|
|
%c = load i32*, i32** %cptr, !dereferenceable !0
|
|
|
|
%1 = load i32, i32* %c, align 4
|
|
|
|
%arrayidx3 = getelementptr inbounds i32, i32* %b, i64 %indvars.iv
|
|
|
|
%2 = load i32, i32* %arrayidx3, align 4
|
|
|
|
%mul = mul nsw i32 %2, %1
|
|
|
|
store i32 %mul, i32* %arrayidx, align 4
|
|
|
|
br label %for.inc
|
|
|
|
|
|
|
|
for.inc: ; preds = %for.body, %if.then
|
|
|
|
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
|
|
%lftr.wideiv = trunc i64 %indvars.iv.next to i32
|
|
|
|
%exitcond = icmp eq i32 %lftr.wideiv, %n
|
|
|
|
br i1 %exitcond, label %for.end, label %for.body
|
|
|
|
|
|
|
|
for.end: ; preds = %for.inc, %entry
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @test11(i32* noalias %a, i32* %b, i32** dereferenceable(8) %cptr, i32 %n) #0 {
; In this test the load of %cptr sits in for.body ahead of the %cmp1 branch, so
; it runs on every iteration. The FileCheck directives below expect both that
; load (still carrying !dereferenceable) and the dependent load of %c to show
; up in the loop preheader.
|
|
|
|
; CHECK-LABEL: @test11(
|
|
|
|
entry:
|
|
|
|
; Skip the loop entirely unless n > 0.
%cmp11 = icmp sgt i32 %n, 0
|
|
|
|
br i1 %cmp11, label %for.body, label %for.end
|
|
|
|
|
|
|
|
; CHECK: for.body.preheader:
|
Infer alignment of unmarked loads in IR/bitcode parsing.
For IR generated by a compiler, this is really simple: you just take the
datalayout from the beginning of the file, and apply it to all the IR
later in the file. For optimization testcases that don't care about the
datalayout, this is also really simple: we just use the default
datalayout.
The complexity here comes from the fact that some LLVM tools allow
overriding the datalayout: some tools have an explicit flag for this,
some tools will infer a datalayout based on the code generation target.
Supporting this properly required plumbing through a bunch of new
machinery: we want to allow overriding the datalayout after the
datalayout is parsed from the file, but before we use any information
from it. Therefore, IR/bitcode parsing now has a callback to allow tools
to compute the datalayout at the appropriate time.
Not sure if I covered all the LLVM tools that want to use the callback.
(clang? lli? Misc IR manipulation tools like llvm-link?). But this is at
least enough for all the LLVM regression tests, and IR without a
datalayout is not something frontends should generate.
This change had some sort of weird effects for certain CodeGen
regression tests: if the datalayout is overridden with a datalayout with
a different program or stack address space, we now parse IR based on the
overridden datalayout, instead of the one written in the file (or the
default one, if none is specified). This broke a few AVR tests, and one
AMDGPU test.
Outside the CodeGen tests I mentioned, the test changes are all just
fixing CHECK lines and moving around datalayout lines in weird places.
Differential Revision: https://reviews.llvm.org/D78403
2020-05-15 03:59:45 +08:00
|
|
|
; CHECK: %c = load i32*, i32** %cptr, align 8, !dereferenceable !0
|
2019-04-17 12:52:47 +08:00
|
|
|
; CHECK: %d = load i32, i32* %c, align 4
|
|
|
|
|
|
|
|
|
|
|
|
|
|
for.body: ; preds = %entry, %for.inc
|
|
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %for.inc ], [ 0, %entry ]
|
|
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
|
|
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
|
|
%cmp1 = icmp sgt i32 %0, 0
|
|
|
|
; Unconditional within the loop body: this load is not guarded by %cmp1.
%c = load i32*, i32** %cptr, !dereferenceable !0
|
|
|
|
br i1 %cmp1, label %if.then, label %for.inc
|
|
|
|
|
|
|
|
if.then: ; preds = %for.body
|
|
|
|
; Conditional use of the pointer produced by the unconditional load above.
%d = load i32, i32* %c, align 4
|
|
|
|
%arrayidx3 = getelementptr inbounds i32, i32* %b, i64 %indvars.iv
|
|
|
|
%e = load i32, i32* %arrayidx3, align 4
|
|
|
|
%mul = mul nsw i32 %e, %d
|
|
|
|
store i32 %mul, i32* %arrayidx, align 4
|
|
|
|
br label %for.inc
|
|
|
|
|
|
|
|
for.inc: ; preds = %for.body, %if.then
|
|
|
|
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
|
|
%lftr.wideiv = trunc i64 %indvars.iv.next to i32
|
|
|
|
%exitcond = icmp eq i32 %lftr.wideiv, %n
|
|
|
|
br i1 %exitcond, label %for.end, label %for.body
|
|
|
|
|
|
|
|
for.end: ; preds = %for.inc, %entry
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
declare void @llvm.experimental.guard(i1, ...)
|
|
|
|
|
2020-05-17 08:55:18 +08:00
|
|
|
define void @test12(i32* noalias %a, i32* %b, i32* dereferenceable_or_null(4) align 4 %c, i32 %n) #0 {
|
2019-04-17 12:52:47 +08:00
|
|
|
; Prove non-nullness of %c via a guard, not a branch.
|
|
|
|
|
|
|
|
; CHECK-LABEL: @test12(
|
|
|
|
entry:
|
|
|
|
%not_null = icmp ne i32* %c, null
|
|
|
|
; The guard on %not_null is placed in entry, ahead of the loop; the directives
; below expect the load of %c to end up in the loop preheader.
call void(i1, ...) @llvm.experimental.guard(i1 %not_null) [ "deopt"() ]
|
|
|
|
%cmp11 = icmp sgt i32 %n, 0
|
|
|
|
br i1 %cmp11, label %for.body, label %for.end
|
|
|
|
|
|
|
|
; CHECK: for.body.preheader:
|
|
|
|
; CHECK-NEXT: [[VAL:%[^ ]]] = load i32, i32* %c, align 4
|
|
|
|
; CHECK-NEXT: br label %for.body
|
|
|
|
|
|
|
|
|
|
|
|
|
|
for.body: ; preds = %entry, %for.inc
|
|
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %for.inc ], [ 0, %entry ]
|
|
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
|
|
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
|
|
%cmp1 = icmp sgt i32 %0, 0
|
|
|
|
br i1 %cmp1, label %if.then, label %for.inc
|
|
|
|
|
|
|
|
if.then: ; preds = %for.body
|
|
|
|
; In the input this load only executes when a[i] > 0.
%1 = load i32, i32* %c, align 4
|
|
|
|
%arrayidx3 = getelementptr inbounds i32, i32* %b, i64 %indvars.iv
|
|
|
|
%2 = load i32, i32* %arrayidx3, align 4
|
|
|
|
%mul = mul nsw i32 %2, %1
|
|
|
|
store i32 %mul, i32* %arrayidx, align 4
|
|
|
|
br label %for.inc
|
|
|
|
|
|
|
|
for.inc: ; preds = %for.body, %if.then
|
|
|
|
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
|
|
%lftr.wideiv = trunc i64 %indvars.iv.next to i32
|
|
|
|
%exitcond = icmp eq i32 %lftr.wideiv, %n
|
|
|
|
br i1 %exitcond, label %for.end, label %for.body
|
|
|
|
|
|
|
|
for.end: ; preds = %for.inc, %entry
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @test13(i32* noalias %a, i32* %b, i32* dereferenceable_or_null(4) %c, i32 %n) #0 {
|
|
|
|
; Like @test12, but has a post-dominating guard, which cannot be used
|
|
|
|
; to prove %c is nonnull at the point of the load.
|
|
|
|
|
|
|
|
; CHECK-LABEL: @test13(
|
|
|
|
entry:
|
|
|
|
; The comparison is computed here, but its only use is the guard in for.end.
%not_null = icmp ne i32* %c, null
|
|
|
|
%cmp11 = icmp sgt i32 %n, 0
|
|
|
|
br i1 %cmp11, label %for.body, label %for.end
|
|
|
|
|
|
|
|
; CHECK: for.body.preheader:
|
|
|
|
; CHECK-NOT: load i32, i32* %c
|
|
|
|
; CHECK: br label %for.body
|
|
|
|
|
|
|
|
for.body: ; preds = %entry, %for.inc
|
|
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %for.inc ], [ 0, %entry ]
|
|
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
|
|
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
|
|
%cmp1 = icmp sgt i32 %0, 0
|
|
|
|
br i1 %cmp1, label %if.then, label %for.inc
|
|
|
|
|
|
|
|
if.then: ; preds = %for.body
|
|
|
|
; CHECK: if.then:
|
|
|
|
; CHECK: load i32, i32* %c
|
|
|
|
; CHECK: br label %for.inc
|
|
|
|
%1 = load i32, i32* %c, align 4
|
|
|
|
%arrayidx3 = getelementptr inbounds i32, i32* %b, i64 %indvars.iv
|
|
|
|
%2 = load i32, i32* %arrayidx3, align 4
|
|
|
|
%mul = mul nsw i32 %2, %1
|
|
|
|
store i32 %mul, i32* %arrayidx, align 4
|
|
|
|
br label %for.inc
|
|
|
|
|
|
|
|
for.inc: ; preds = %for.body, %if.then
|
|
|
|
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
|
|
%lftr.wideiv = trunc i64 %indvars.iv.next to i32
|
|
|
|
%exitcond = icmp eq i32 %lftr.wideiv, %n
|
|
|
|
br i1 %exitcond, label %for.end, label %for.body
|
|
|
|
|
|
|
|
for.end: ; preds = %for.inc, %entry
|
|
|
|
; The guard is only reached once the loop is done (or was skipped), i.e. after
; every execution of the load in if.then.
call void(i1, ...) @llvm.experimental.guard(i1 %not_null) [ "deopt"() ]
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; Check that a branch on the condition "null check AND something" allows hoisting the
|
|
|
|
; load.
|
2020-05-17 08:55:18 +08:00
|
|
|
define void @test14(i32* noalias %a, i32* %b, i32* dereferenceable_or_null(4) align 4 %c, i32 %n, i1 %dummy_cond) #0 {
|
2019-04-17 12:52:47 +08:00
|
|
|
|
|
|
|
; CHECK-LABEL: @test14
|
|
|
|
; CHECK: load i32, i32* %c, align 4
|
|
|
|
; CHECK: for.body:
|
|
|
|
|
|
|
|
entry:
|
|
|
|
%not_null = icmp ne i32* %c, null
|
|
|
|
%dummy_and = and i1 %not_null, %dummy_cond
|
|
|
|
br i1 %dummy_and, label %not.null, label %for.end
|
|
|
|
|
|
|
|
not.null:
|
|
|
|
%cmp11 = icmp sgt i32 %n, 0
|
|
|
|
br i1 %cmp11, label %for.body, label %for.end
|
|
|
|
|
|
|
|
for.body: ; preds = %not.null, %for.inc
|
|
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %for.inc ], [ 0, %not.null ]
|
|
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
|
|
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
|
|
%cmp1 = icmp sgt i32 %0, 0
|
|
|
|
br i1 %cmp1, label %if.then, label %for.inc
|
|
|
|
|
|
|
|
if.then: ; preds = %for.body
|
|
|
|
%1 = load i32, i32* %c, align 4
|
|
|
|
%arrayidx3 = getelementptr inbounds i32, i32* %b, i64 %indvars.iv
|
|
|
|
%2 = load i32, i32* %arrayidx3, align 4
|
|
|
|
%mul = mul nsw i32 %2, %1
|
|
|
|
store i32 %mul, i32* %arrayidx, align 4
|
|
|
|
br label %for.inc
|
|
|
|
|
|
|
|
for.inc: ; preds = %for.body, %if.then
|
|
|
|
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
|
|
%lftr.wideiv = trunc i64 %indvars.iv.next to i32
|
|
|
|
%exitcond = icmp eq i32 %lftr.wideiv, %n
|
|
|
|
br i1 %exitcond, label %for.end, label %for.body
|
|
|
|
|
|
|
|
for.end: ; preds = %for.inc, %entry, %not.null
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; Check that a guard on the condition "null check AND something" allows hoisting the
|
|
|
|
; load.
|
2020-05-17 08:55:18 +08:00
|
|
|
define void @test15(i32* noalias %a, i32* %b, i32* dereferenceable_or_null(4) align 4 %c, i32 %n, i1 %dummy_cond) #0 {
|
2019-04-17 12:52:47 +08:00
|
|
|
|
|
|
|
; CHECK-LABEL: @test15
|
|
|
|
; CHECK: load i32, i32* %c, align 4
|
|
|
|
; CHECK: for.body:
|
|
|
|
|
|
|
|
entry:
|
|
|
|
%not_null = icmp ne i32* %c, null
|
|
|
|
%dummy_and = and i1 %not_null, %dummy_cond
|
|
|
|
call void(i1, ...) @llvm.experimental.guard(i1 %dummy_and) [ "deopt"() ]
|
|
|
|
%cmp11 = icmp sgt i32 %n, 0
|
|
|
|
br i1 %cmp11, label %for.body, label %for.end
|
|
|
|
|
|
|
|
for.body: ; preds = %entry, %for.inc
|
|
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %for.inc ], [ 0, %entry ]
|
|
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
|
|
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
|
|
%cmp1 = icmp sgt i32 %0, 0
|
|
|
|
br i1 %cmp1, label %if.then, label %for.inc
|
|
|
|
|
|
|
|
if.then: ; preds = %for.body
|
|
|
|
%1 = load i32, i32* %c, align 4
|
|
|
|
%arrayidx3 = getelementptr inbounds i32, i32* %b, i64 %indvars.iv
|
|
|
|
%2 = load i32, i32* %arrayidx3, align 4
|
|
|
|
%mul = mul nsw i32 %2, %1
|
|
|
|
store i32 %mul, i32* %arrayidx, align 4
|
|
|
|
br label %for.inc
|
|
|
|
|
|
|
|
for.inc: ; preds = %for.body, %if.then
|
|
|
|
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
|
|
%lftr.wideiv = trunc i64 %indvars.iv.next to i32
|
|
|
|
%exitcond = icmp eq i32 %lftr.wideiv, %n
|
|
|
|
br i1 %exitcond, label %for.end, label %for.body
|
|
|
|
|
|
|
|
for.end: ; preds = %for.inc, %entry
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; Ensure that (c == null && other_cond) does not automatically mean that c is
|
|
|
|
; non-null in false branch. So the condition ((c == null && other_cond) == false)
|
|
|
|
; is not sufficient to conclude that c != null.
|
|
|
|
define void @test16(i32* noalias %a, i32* %b, i32* dereferenceable_or_null(4) %c, i32 %n, i1 %dummy_cond) #0 {
|
|
|
|
|
|
|
|
; CHECK-LABEL: @test16
|
|
|
|
; CHECK: for.body:
|
|
|
|
; CHECK: load i32, i32* %c, align 4
|
|
|
|
|
|
|
|
entry:
|
|
|
|
; NOTE: despite its name, %not_null is an "icmp eq" and is therefore true when
; %c IS null.
%not_null = icmp eq i32* %c, null
|
|
|
|
%dummy_and = and i1 %not_null, %dummy_cond
|
|
|
|
; The loop is only reachable through the false edge, i.e. when
; (c == null && dummy_cond) is false. That still permits c == null whenever
; %dummy_cond is false, so the edge does not establish c != null.
br i1 %dummy_and, label %for.end, label %not.null
|
|
|
|
|
|
|
|
not.null:
|
|
|
|
%cmp11 = icmp sgt i32 %n, 0
|
|
|
|
br i1 %cmp11, label %for.body, label %for.end
|
|
|
|
|
|
|
|
for.body: ; preds = %not.null, %for.inc
|
|
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %for.inc ], [ 0, %not.null ]
|
|
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
|
|
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
|
|
%cmp1 = icmp sgt i32 %0, 0
|
|
|
|
br i1 %cmp1, label %if.then, label %for.inc
|
|
|
|
|
|
|
|
if.then: ; preds = %for.body
|
|
|
|
; The directives at the top of this function expect this load to still follow
; the for.body label in the output.
%1 = load i32, i32* %c, align 4
|
|
|
|
%arrayidx3 = getelementptr inbounds i32, i32* %b, i64 %indvars.iv
|
|
|
|
%2 = load i32, i32* %arrayidx3, align 4
|
|
|
|
%mul = mul nsw i32 %2, %1
|
|
|
|
store i32 %mul, i32* %arrayidx, align 4
|
|
|
|
br label %for.inc
|
|
|
|
|
|
|
|
for.inc: ; preds = %for.body, %if.then
|
|
|
|
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
|
|
%lftr.wideiv = trunc i64 %indvars.iv.next to i32
|
|
|
|
%exitcond = icmp eq i32 %lftr.wideiv, %n
|
|
|
|
br i1 %exitcond, label %for.end, label %for.body
|
|
|
|
|
|
|
|
for.end: ; preds = %for.inc, %entry, %not.null
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; Ensure that (c == null && other_cond) does not automatically mean that c is
|
|
|
|
; non-null in false branch. So the condition ((c == null && other_cond) == false)
|
|
|
|
; is not sufficient to conclude that c != null.
|
|
|
|
define void @test17(i32* noalias %a, i32* %b, i32* dereferenceable_or_null(4) %c, i32 %n, i1 %dummy_cond) #0 {
|
|
|
|
|
|
|
|
; CHECK-LABEL: @test17
|
|
|
|
; CHECK: for.body:
|
|
|
|
; CHECK: load i32, i32* %c, align 4
|
|
|
|
|
|
|
|
entry:
|
|
|
|
; NOTE: despite its name, %not_null is an "icmp eq" and is therefore true when
; %c IS null.
%not_null = icmp eq i32* %c, null
|
|
|
|
%dummy_and = and i1 %not_null, %dummy_cond
|
|
|
|
; The guarded condition is (c == null && dummy_cond). Per the documented
; semantics of llvm.experimental.guard, execution only continues past the call
; when that condition is true, so the guard gives no evidence that %c is
; non-null.
call void(i1, ...) @llvm.experimental.guard(i1 %dummy_and) [ "deopt"() ]
|
|
|
|
%cmp11 = icmp sgt i32 %n, 0
|
|
|
|
; NOTE(review): the successors are swapped relative to the sibling tests, so
; for.body is entered when %cmp11 is false (n <= 0) -- confirm this is
; intentional.
br i1 %cmp11, label %for.end, label %for.body
|
|
|
|
|
|
|
|
for.body: ; preds = %entry, %for.inc
|
|
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %for.inc ], [ 0, %entry ]
|
|
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
|
|
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
|
|
%cmp1 = icmp sgt i32 %0, 0
|
|
|
|
br i1 %cmp1, label %if.then, label %for.inc
|
|
|
|
|
|
|
|
if.then: ; preds = %for.body
|
|
|
|
; The directives at the top of this function expect this load to still follow
; the for.body label in the output.
%1 = load i32, i32* %c, align 4
|
|
|
|
%arrayidx3 = getelementptr inbounds i32, i32* %b, i64 %indvars.iv
|
|
|
|
%2 = load i32, i32* %arrayidx3, align 4
|
|
|
|
%mul = mul nsw i32 %2, %1
|
|
|
|
store i32 %mul, i32* %arrayidx, align 4
|
|
|
|
br label %for.inc
|
|
|
|
|
|
|
|
for.inc: ; preds = %for.body, %if.then
|
|
|
|
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
|
|
%lftr.wideiv = trunc i64 %indvars.iv.next to i32
|
|
|
|
%exitcond = icmp eq i32 %lftr.wideiv, %n
|
|
|
|
br i1 %exitcond, label %for.end, label %for.body
|
|
|
|
|
|
|
|
for.end: ; preds = %for.inc, %entry
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
attributes #0 = { nounwind uwtable }
|
|
|
|
!0 = !{i64 4}
|