; Source: forked from OSchip/llvm-project (LLVM IR test file, 172 lines, 5.4 KiB).
; RUN: opt < %s -basicaa -loop-interchange -pass-remarks-missed='loop-interchange' -pass-remarks-output=%t
; RUN: cat %t | FileCheck --check-prefix REMARK %s

; This test runs the loop-interchange pass over several two-level loop nests
; whose values are used after the nest, and checks the optimization remarks
; that opt records in its remarks output file. The expected remark for each
; nest is given by the check lines placed directly before the function.

target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
target triple = "x86_64-unknown-linux-gnu"

; 100x100 i32 matrices. The inner loop of each function in this file loads an
; element from both and stores the sum back into @A.
@A = common global [100 x [100 x i32]] zeroinitializer
@C = common global [100 x [100 x i32]] zeroinitializer

; Not referenced by any function in the visible portion of this file.
@X = common global i32 0

; Sinks written from the exit block of each function, so that a value produced
; inside the loop nest has a use after it (i64 values go to @Y, the float value
; goes to @F).
@Y = common global i64 0
@F = common global float 0.0

; We cannot interchange this loop at the moment, because iv.outer.next is
; produced in the outer loop latch and used in the loop exit block. If the inner
; loop body is not executed, the outer loop latch won't be executed either
; after interchanging.
; REMARK: UnsupportedExitPHI
; REMARK-NEXT: lcssa_01

define void @lcssa_01(){
entry:
  ; Constant comparison (100 > 1) guarding entry into the whole loop nest.
  %cmp21 = icmp sgt i64 100, 1
  br i1 %cmp21, label %outer.ph, label %for.end16

outer.ph:
  ; The same constant comparison, computed once in the outer preheader and
  ; used by outer.header to decide whether the inner loop is entered.
  %cmp218 = icmp sgt i64 100, 1
  br label %outer.header

outer.header:
  ; Outer induction variable, starting at 1.
  %iv.outer = phi i64 [ 1, %outer.ph ], [ %iv.outer.next, %outer.inc ]
  ; If %cmp218 is false, the inner loop is bypassed and control goes straight
  ; to the outer latch.
  br i1 %cmp218, label %for.body3, label %outer.inc

for.body3:
  ; Single-block inner loop: A[iv.inner][iv.outer] += C[iv.inner][iv.outer].
  ; The inner induction variable starts at 1.
  %iv.inner = phi i64 [ %iv.inner.next, %for.body3 ], [ 1, %outer.header ]
  %arrayidx5 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %iv.inner, i64 %iv.outer
  %vA = load i32, i32* %arrayidx5
  %arrayidx9 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @C, i64 0, i64 %iv.inner, i64 %iv.outer
  %vC = load i32, i32* %arrayidx9
  %add = add nsw i32 %vA, %vC
  store i32 %add, i32* %arrayidx5
  %iv.inner.next = add nuw nsw i64 %iv.inner, 1
  ; The inner loop is left once the incremented index reaches 100.
  %exitcond = icmp eq i64 %iv.inner.next, 100
  br i1 %exitcond, label %outer.inc, label %for.body3

outer.inc:
  ; Outer latch: produces the value that is later used outside the loop.
  %iv.outer.next = add nsw i64 %iv.outer, 1
  %cmp = icmp eq i64 %iv.outer.next, 100
  ; NOTE(review): the back edge is taken when %iv.outer.next == 100 and the
  ; loop is left otherwise, the opposite polarity of the inner latch. Kept as
  ; written, since changing the branch could change what the pass reports.
  br i1 %cmp, label %outer.header, label %for.exit

for.exit:
  ; Use of %iv.outer.next after the loop nest; this is the exit use described
  ; in the comment above the function.
  store i64 %iv.outer.next, i64* @Y
  br label %for.end16

for.end16:
  ret void
}

; Same loop nest as lcssa_01, except that the value used after the nest is
; %iv.inner.end: a phi in the outer latch that merges 0 (inner loop bypassed)
; with %iv.inner.next (inner loop executed).
; REMARK: UnsupportedExitPHI
; REMARK-NEXT: lcssa_02
define void @lcssa_02(){
entry:
  ; Constant comparison (100 > 1) guarding entry into the whole loop nest.
  %cmp21 = icmp sgt i64 100, 1
  br i1 %cmp21, label %outer.ph, label %for.end16

outer.ph:
  ; The same constant comparison, computed once in the outer preheader and
  ; used by outer.header to decide whether the inner loop is entered.
  %cmp218 = icmp sgt i64 100, 1
  br label %outer.header

outer.header:
  ; Outer induction variable, starting at 1.
  %iv.outer = phi i64 [ 1, %outer.ph ], [ %iv.outer.next, %outer.inc ]
  ; If %cmp218 is false, the inner loop is bypassed and control goes straight
  ; to the outer latch.
  br i1 %cmp218, label %for.body3, label %outer.inc

for.body3:
  ; Single-block inner loop: A[iv.inner][iv.outer] += C[iv.inner][iv.outer].
  ; The inner induction variable starts at 1.
  %iv.inner = phi i64 [ %iv.inner.next, %for.body3 ], [ 1, %outer.header ]
  %arrayidx5 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %iv.inner, i64 %iv.outer
  %vA = load i32, i32* %arrayidx5
  %arrayidx9 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @C, i64 0, i64 %iv.inner, i64 %iv.outer
  %vC = load i32, i32* %arrayidx9
  %add = add nsw i32 %vA, %vC
  store i32 %add, i32* %arrayidx5
  %iv.inner.next = add nuw nsw i64 %iv.inner, 1
  ; The inner loop is left once the incremented index reaches 100.
  %exitcond = icmp eq i64 %iv.inner.next, 100
  br i1 %exitcond, label %outer.inc, label %for.body3

outer.inc:
  ; Merges the two ways of reaching the outer latch: 0 when arriving directly
  ; from outer.header, the final inner index when arriving from the inner loop.
  %iv.inner.end = phi i64 [ 0, %outer.header ], [ %iv.inner.next, %for.body3 ]
  %iv.outer.next = add nsw i64 %iv.outer, 1
  %cmp = icmp eq i64 %iv.outer.next, 100
  ; NOTE(review): the back edge is taken when %iv.outer.next == 100 and the
  ; loop is left otherwise, the opposite polarity of the inner latch. Kept as
  ; written, since changing the branch could change what the pass reports.
  br i1 %cmp, label %outer.header, label %for.exit

for.exit:
  ; Use of the outer-latch phi after the loop nest.
  store i64 %iv.inner.end, i64* @Y
  br label %for.end16

for.end16:
  ret void
}


; Neither loop is guarded in this nest, and the value used after the nest is
; the inner induction phi %iv.inner. The check lines below expect the nest to
; be reported as interchanged.
; REMARK: Interchanged
; REMARK-NEXT: lcssa_03
define void @lcssa_03(){
entry:
  br label %outer.header

outer.header:
  ; Outer induction variable, starting at 1. The inner loop is entered
  ; unconditionally.
  %iv.outer = phi i64 [ 1, %entry ], [ %iv.outer.next, %outer.inc ]
  br label %for.body3

for.body3:
  ; Single-block inner loop: A[iv.inner][iv.outer] += C[iv.inner][iv.outer].
  ; The inner induction variable starts at 1.
  %iv.inner = phi i64 [ %iv.inner.next, %for.body3 ], [ 1, %outer.header ]
  %arrayidx5 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %iv.inner, i64 %iv.outer
  %vA = load i32, i32* %arrayidx5
  %arrayidx9 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @C, i64 0, i64 %iv.inner, i64 %iv.outer
  %vC = load i32, i32* %arrayidx9
  %add = add nsw i32 %vA, %vC
  store i32 %add, i32* %arrayidx5
  %iv.inner.next = add nuw nsw i64 %iv.inner, 1
  ; The inner loop is left once the incremented index reaches 100.
  %exitcond = icmp eq i64 %iv.inner.next, 100
  br i1 %exitcond, label %outer.inc, label %for.body3

outer.inc:
  %iv.outer.next = add nsw i64 %iv.outer, 1
  %cmp = icmp eq i64 %iv.outer.next, 100
  ; NOTE(review): the back edge is taken when %iv.outer.next == 100 and the
  ; loop is left otherwise, the opposite polarity of the inner latch. Kept as
  ; written, since changing the branch could change what the pass reports.
  br i1 %cmp, label %outer.header, label %for.exit

for.exit:
  ; Use of the inner induction phi after the loop nest.
  store i64 %iv.inner, i64* @Y
  br label %for.end16

for.end16:
  ret void
}

; FIXME: We currently do not support LCSSA phi nodes involving floating point
; types, as we fail to detect floating point reductions for now.
; REMARK: UnsupportedPHIOuter
; REMARK-NEXT: lcssa_04
define void @lcssa_04(){
entry:
  br label %outer.header

outer.header:
  ; Outer induction variable, starting at 1.
  %iv.outer = phi i64 [ 1, %entry ], [ %iv.outer.next, %outer.inc ]
  ; Floating-point phi in the outer header: 1.0 on entry, 2.0 when arriving
  ; from the outer latch. Its only use in this function is the store in
  ; for.exit.
  %float.outer = phi float [ 1.0, %entry ], [ 2.0, %outer.inc ]
  br label %for.body3

for.body3:
  ; Single-block inner loop: A[iv.inner][iv.outer] += C[iv.inner][iv.outer].
  ; The inner induction variable starts at 1.
  %iv.inner = phi i64 [ %iv.inner.next, %for.body3 ], [ 1, %outer.header ]
  %arrayidx5 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %iv.inner, i64 %iv.outer
  %vA = load i32, i32* %arrayidx5
  %arrayidx9 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @C, i64 0, i64 %iv.inner, i64 %iv.outer
  %vC = load i32, i32* %arrayidx9
  %add = add nsw i32 %vA, %vC
  store i32 %add, i32* %arrayidx5
  %iv.inner.next = add nuw nsw i64 %iv.inner, 1
  ; The inner loop is left once the incremented index reaches 100.
  %exitcond = icmp eq i64 %iv.inner.next, 100
  br i1 %exitcond, label %outer.inc, label %for.body3

outer.inc:
  %iv.outer.next = add nsw i64 %iv.outer, 1
  %cmp = icmp eq i64 %iv.outer.next, 100
  ; NOTE(review): the back edge is taken when %iv.outer.next == 100 and the
  ; loop is left otherwise, the opposite polarity of the inner latch. Kept as
  ; written, since changing the branch could change what the pass reports.
  br i1 %cmp, label %outer.header, label %for.exit

for.exit:
  ; Use of the floating-point outer-header phi after the loop nest.
  store float %float.outer, float* @F
  br label %for.end16

for.end16:
  ret void
}