; Origin: forked from OSchip/llvm-project.
; RUN: llc -O2 -march=hexagon < %s | FileCheck %s

; Rely on the comments generated by llc. Check that "if.then" was not predicated.
; The directives below match the basic-block names that llc prints as comments
; in its assembly output: between the text for b2 and the text for b5 there
; must be no "if ... memd" (a predicated 64-bit memory access).
; CHECK: b2
; CHECK-NOT: if{{.*}}memd
; CHECK: b5

; Aggregate indexed by @f0. Only fields 12 and 13 (both [24 x i32]) are
; accessed in this file; the remaining fields just fix the layout.
%s.0 = type { [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [3 x i32], [24 x i32], [8 x %s.1], [5 x i32] }
%s.1 = type { i32, i32 }

; Globals used by @f0:
;   @g0 - receives the last %v16 value when the function returns.
;   @g1, @g2 - loaded and ANDed together to seed the inner loop.
;   @g3 - bit 0 selects whether the conditional store block (b3) runs.
@g0 = global i64 0
@g1 = global i32 0
@g2 = global i32 0
@g3 = global i8 0

; Hexagon intrinsics called by @f0. All are declared with attribute group #0.
declare i32 @llvm.hexagon.S2.cl0(i32) #0
declare i32 @llvm.hexagon.S2.setbit.r(i32, i32) #0
declare i64 @llvm.hexagon.M2.vmpy2s.s0(i32, i32) #0
declare i64 @llvm.hexagon.M2.vmac2s.s0(i64, i32, i32) #0
declare i64 @llvm.hexagon.A2.vaddws(i64, i64) #0
declare i64 @llvm.hexagon.A2.vsubws(i64, i64) #0
declare i32 @llvm.hexagon.A4.modwrapu(i32, i32) #0

; f0(%a0, %a1): two-level loop nest used to exercise if-conversion.
;
;   %a0 - outer-loop trip bound: the outer loop exits when the counter %v26
;         equals %a0.
;   %a1 - destination of the conditional 64-bit store in b3.
;
; Block structure:
;   b0       entry
;   b1       outer-loop header (back edge from b5)
;   b2       inner-loop header (back edge from b4)
;   b3       conditionally executed block containing the i64 store; presumably
;            the "if.then" block the file header refers to
;   b4       inner-loop latch
;   b5       outer-loop latch
;   b6       exit
;
; Keep the instruction order, value names, block labels and !prof attachments
; as they are: the test is about the code llc generates for this exact input.
define void @f0(i32 %a0, i64* %a1) #1 {
b0:
  br label %b1

; Outer-loop header. %v0 counts iterations; %v1 is the element index into the
; [10 x %s.0] array, advanced in b5.
b1:                                               ; preds = %b5, %b0
  %v0 = phi i32 [ 0, %b0 ], [ %v26, %b5 ]
  %v1 = phi i32 [ 0, %b0 ], [ %v25, %b5 ]
  %v2 = load i32, i32* @g1, align 4
  ; NOTE(review): @g2 is declared without an explicit alignment, yet this load
  ; claims align 8 - confirm this is intentional before changing it.
  %v3 = load i32, i32* @g2, align 8
  ; Initial value of the inner-loop word %v7.
  %v4 = and i32 %v3, %v2
  br label %b2

; Inner-loop header. %v5 and %v6 are 64-bit accumulators carried around the
; inner loop; %v7 is the loop-carried word, replaced by %v9 on each iteration.
b2:                                               ; preds = %b4, %b1
  %v5 = phi i64 [ %v21, %b4 ], [ 0, %b1 ]
  %v6 = phi i64 [ %v22, %b4 ], [ 0, %b1 ]
  %v7 = phi i32 [ %v9, %b4 ], [ %v4, %b1 ]
  ; %v8 is used both as the second operand of setbit.r and as the element
  ; index into fields 12 and 13 below.
  %v8 = tail call i32 @llvm.hexagon.S2.cl0(i32 %v7)
  %v9 = tail call i32 @llvm.hexagon.S2.setbit.r(i32 %v7, i32 %v8)
  ; Address element %v1 of a [10 x %s.0] array placed at a fixed integer address.
  %v10 = getelementptr [10 x %s.0], [10 x %s.0]* inttoptr (i32 -121502345 to [10 x %s.0]*), i32 0, i32 %v1
  %v11 = getelementptr %s.0, %s.0* %v10, i32 0, i32 12, i32 %v8
  %v12 = load i32, i32* %v11, align 4
  %v13 = tail call i64 @llvm.hexagon.M2.vmpy2s.s0(i32 %v12, i32 %v12)
  %v14 = getelementptr %s.0, %s.0* %v10, i32 0, i32 13, i32 %v8
  %v15 = load i32, i32* %v14, align 4
  %v16 = tail call i64 @llvm.hexagon.M2.vmac2s.s0(i64 %v13, i32 %v15, i32 %v15)
  ; Branch to b3 only when bit 0 of @g3 is clear. !prof !0 gives weight 99 to
  ; the b3 successor and weight 1 to the b4 successor.
  %v17 = load i8, i8* @g3, align 1
  %v18 = and i8 %v17, 1
  %v19 = icmp eq i8 %v18, 0
  br i1 %v19, label %b3, label %b4, !prof !0

; Conditional block: combine %v5 with %v16 and store the 64-bit result
; through %a1. The test expects this store not to be predicated.
b3:                                               ; preds = %b2
  %v20 = tail call i64 @llvm.hexagon.A2.vaddws(i64 %v5, i64 %v16)
  store i64 %v20, i64* %a1, align 8
  br label %b4

; Inner-loop latch: merge the accumulator from both paths, update the second
; accumulator, and leave the inner loop once %v9 becomes zero. !prof !1 gives
; weight 10 to the exit (b5) and weight 90 to the back edge (b2).
b4:                                               ; preds = %b3, %b2
  %v21 = phi i64 [ %v20, %b3 ], [ %v5, %b2 ]
  %v22 = tail call i64 @llvm.hexagon.A2.vsubws(i64 %v6, i64 %v16)
  %v23 = icmp eq i32 %v9, 0
  br i1 %v23, label %b5, label %b2, !prof !1

; Outer-loop latch: compute the next array index from %v1 + 1 and the constant
; 10 via modwrapu, bump the iteration counter, and exit when it equals %a0.
; !prof !1 gives weight 10 to the exit (b6) and weight 90 to the back edge (b1).
b5:                                               ; preds = %b4
  %v24 = add i32 %v1, 1
  %v25 = tail call i32 @llvm.hexagon.A4.modwrapu(i32 %v24, i32 10) #0
  %v26 = add i32 %v0, 1
  %v27 = icmp eq i32 %v26, %a0
  br i1 %v27, label %b6, label %b1, !prof !1

; Exit: publish the last %v16 computed by the inner loop to @g0.
b6:                                               ; preds = %b5
  store i64 %v16, i64* @g0, align 8
  ret void
}

; Attribute groups: #0 is attached to the Hexagon intrinsic declarations (and
; to the modwrapu call site); #1 is attached to @f0.
attributes #0 = { nounwind readnone }
attributes #1 = { nounwind }

; Branch-weight profiles; weights are listed in successor order.
;   !0 - used on the branch into the conditional store block: 99 for the first
;        successor (b3), 1 for the second (b4).
;   !1 - used on both loop-exit branches: 10 for the first successor (the
;        exit), 90 for the second (the back edge).
!0 = !{!"branch_weights", i32 99, i32 1}
!1 = !{!"branch_weights", i32 10, i32 90}