; Source: llvm-project/polly/test/polybench/linear-algebra/kernels/gesummv/gesummv_without_param.ll
;
; 66 lines
; 3.1 KiB
; LLVM

; The lit command line below runs opt with the -polly-detect pass and -analyze,
; then pipes the printed result into FileCheck. %loadPolly and %defaultOpts are
; lit substitutions defined outside this file (presumably they load the Polly
; plugin and apply the suite's canonicalization passes -- confirm in lit.cfg).
; RUN: opt %loadPolly %defaultOpts -polly-detect -analyze %s | FileCheck %s
; Target description: 64-bit pointers, x86-64 Linux.
target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64"
target triple = "x86_64-unknown-linux-gnu"
; C stdio types; in this file they are referenced only by the @stderr declaration.
%struct._IO_FILE = type { i32, i8*, i8*, i8*, i8*, i8*, i8*, i8*, i8*, i8*, i8*, i8*, %struct._IO_marker*, %struct._IO_FILE*, i32, i32, i64, i16, i8, [1 x i8], i8*, i64, i8*, i8*, i8*, i8*, i64, i32, [20 x i8] }
%struct._IO_marker = type { %struct._IO_marker*, %struct._IO_FILE*, i32 }
; Scalar factors loaded once at the top of @scop_func.
@alpha = common global double 0.000000e+00
@beta = common global double 0.000000e+00
; Input vector x (4000 doubles) and input matrix A (4000 x 4000 doubles).
@x = common global [4000 x double] zeroinitializer, align 32
@A = common global [4000 x [4000 x double]] zeroinitializer, align 32
; Output vector y (4000 doubles), written by @scop_func.
@y = common global [4000 x double] zeroinitializer, align 32
; @stderr and @.str are not referenced by the visible @scop_func; presumably
; they are left over from the benchmark's output-printing code.
@stderr = external global %struct._IO_FILE*
@.str = private constant [8 x i8] c"%0.2lf \00", align 1
; Scratch vector tmp (4000 doubles) and second input matrix B (4000 x 4000 doubles).
@tmp = common global [4000 x double] zeroinitializer, align 32
@B = common global [4000 x [4000 x double]] zeroinitializer, align 32
; @scop_func: doubly nested loop over i, j in [0, 4000) that computes, per row i,
;   tmp[i] = sum_j A[i][j] * x[j]
;   y[i]   = alpha * tmp[i] + beta * (sum_j B[i][j] * x[j])
; Takes no arguments and returns nothing; all inputs and outputs are the module
; globals. Both trip counts are the constant 4000, so the loop bounds involve
; no runtime parameter.
; Note: the basic blocks are not listed in execution order. Control flows
;   bb.nph10.split.us -> bb.nph.us -> bb1.us (inner loop) -> bb3.us
;   -> bb.nph.us (next i) or return.
define void @scop_func() nounwind {
; Entry block: load the loop-invariant scalars alpha (%0) and beta (%1) once.
bb.nph10.split.us:
%0 = load double* @alpha, align 8
%1 = load double* @beta, align 8
br label %bb.nph.us
; Outer-loop latch: runs once per row i after the inner loop has finished.
bb3.us: ; preds = %bb1.us
; Single-entry phis carrying the final inner-loop sums out of bb1.us:
; %.lcssa1 is the B*x sum (%12), %.lcssa is the A*x sum (%9).
%.lcssa1 = phi double [ %12, %bb1.us ]
%.lcssa = phi double [ %9, %bb1.us ]
; tmp[i] = A*x sum (this store carries no explicit alignment).
store double %.lcssa, double* %scevgep17
; y[i] = (A*x sum) * alpha + (B*x sum) * beta
%2 = fmul double %.lcssa, %0
%3 = fmul double %.lcssa1, %1
%4 = fadd double %2, %3
store double %4, double* %scevgep18, align 8
; i + 1; leave the outer loop once it reaches 4000.
%5 = add nsw i64 %storemerge6.us, 1
%exitcond = icmp eq i64 %5, 4000
br i1 %exitcond, label %return, label %bb.nph.us
; Inner loop over j: a single block that is both header and latch.
bb1.us: ; preds = %bb.nph.us, %bb1.us
; Running sums, both starting at 0.0 on entry from bb.nph.us:
; %.tmp3.0.us accumulates B[i][j]*x[j], %.tmp.0.us accumulates A[i][j]*x[j].
%.tmp3.0.us = phi double [ 0.000000e+00, %bb.nph.us ], [ %12, %bb1.us ]
%.tmp.0.us = phi double [ 0.000000e+00, %bb.nph.us ], [ %9, %bb1.us ]
; Inner induction variable j, starting at 0.
%storemerge12.us = phi i64 [ 0, %bb.nph.us ], [ %13, %bb1.us ]
; Addresses of A[i][j], B[i][j] and x[j].
%scevgep13 = getelementptr [4000 x [4000 x double]]* @A, i64 0, i64 %storemerge6.us, i64 %storemerge12.us
%scevgep = getelementptr [4000 x [4000 x double]]* @B, i64 0, i64 %storemerge6.us, i64 %storemerge12.us
%scevgep12 = getelementptr [4000 x double]* @x, i64 0, i64 %storemerge12.us
; A-sum update: %9 = A[i][j] * x[j] + previous A-sum.
%6 = load double* %scevgep13, align 8
%7 = load double* %scevgep12, align 8
%8 = fmul double %6, %7
%9 = fadd double %8, %.tmp.0.us
; B-sum update: %12 = B[i][j] * x[j] + previous B-sum (reuses the loaded x[j]).
%10 = load double* %scevgep, align 8
%11 = fmul double %10, %7
%12 = fadd double %11, %.tmp3.0.us
; j + 1; leave the inner loop once it reaches 4000.
%13 = add nsw i64 %storemerge12.us, 1
%exitcond2 = icmp eq i64 %13, 4000
br i1 %exitcond2, label %bb3.us, label %bb1.us
; Outer-loop header: start of the iteration for row i.
bb.nph.us: ; preds = %bb3.us, %bb.nph10.split.us
; Outer induction variable i, starting at 0.
%storemerge6.us = phi i64 [ 0, %bb.nph10.split.us ], [ %5, %bb3.us ]
; Addresses of y[i] and tmp[i]; also used by the stores in bb3.us.
%scevgep18 = getelementptr [4000 x double]* @y, i64 0, i64 %storemerge6.us
%scevgep17 = getelementptr [4000 x double]* @tmp, i64 0, i64 %storemerge6.us
; Zero tmp[i] and y[i] before running the inner loop.
store double 0.000000e+00, double* %scevgep17, align 8
store double 0.000000e+00, double* %scevgep18, align 8
br label %bb1.us
; Function exit, reached after the last outer iteration.
return: ; preds = %bb3.us
ret void
}
; CHECK: Valid Region for Scop: bb.nph.us => return