llvm-project/llvm/test/CodeGen/Hexagon/swp-memrefs-epilog1.ll

91 lines
3.3 KiB
LLVM

; RUN: llc -march=hexagon -enable-pipeliner < %s | FileCheck %s
; Test that a store and load, that alias, are not put in the same packet. The
; pipeliner altered the size of the memrefs for these instructions, which
; resulted in no order dependence between the instructions in the DAG. No order
; dependence was added since the size was set to UINT_MAX, but there is a
; computation using the size that overflowed.
; CHECK: endloop0
; CHECK: memh([[REG:r([0-9]+)]]+#0) =
; CHECK: = memh([[REG]]++#2)
; Function Attrs: nounwind
define signext i16 @f0(i16* nocapture readonly %a0, i16* nocapture readonly %a1) local_unnamed_addr #0 {
b0:
%v0 = alloca [40 x i16], align 8
%v1 = bitcast [40 x i16]* %v0 to i8*
call void @llvm.lifetime.start.p0i8(i64 80, i8* nonnull %v1) #2
%v2 = getelementptr inbounds [40 x i16], [40 x i16]* %v0, i32 0, i32 0
br label %b1
b1: ; preds = %b1, %b0
%v3 = phi i16* [ %a1, %b0 ], [ %v24, %b1 ]
%v4 = phi i16* [ %v2, %b0 ], [ %v25, %b1 ]
%v5 = phi i32 [ 0, %b0 ], [ %v14, %b1 ]
%v6 = phi i32 [ 1, %b0 ], [ %v22, %b1 ]
%v7 = phi i32 [ 0, %b0 ], [ %v23, %b1 ]
%v8 = load i16, i16* %v3, align 2
%v9 = sext i16 %v8 to i32
%v10 = tail call i32 @llvm.hexagon.A2.aslh(i32 %v9)
%v11 = tail call i32 @llvm.hexagon.S2.asr.r.r.sat(i32 %v10, i32 1)
%v12 = tail call i32 @llvm.hexagon.A2.asrh(i32 %v11)
%v13 = trunc i32 %v12 to i16
store i16 %v13, i16* %v4, align 2
%v14 = add nuw nsw i32 %v5, 1
%v15 = icmp eq i32 %v14, 40
%v16 = getelementptr inbounds i16, i16* %a0, i32 %v7
%v17 = load i16, i16* %v16, align 2
%v18 = sext i16 %v17 to i32
%v19 = getelementptr inbounds [40 x i16], [40 x i16]* %v0, i32 0, i32 %v7
%v20 = load i16, i16* %v19, align 2
%v21 = sext i16 %v20 to i32
%v22 = tail call i32 @llvm.hexagon.M2.mpy.acc.sat.ll.s1(i32 %v6, i32 %v18, i32 %v21)
%v23 = add nuw nsw i32 %v7, 1
%v24 = getelementptr i16, i16* %v3, i32 1
%v25 = getelementptr i16, i16* %v4, i32 1
br i1 %v15, label %b2, label %b1
b2: ; preds = %b1
%v26 = tail call signext i16 @f1(i32 %v22) #0
%v27 = sext i16 %v26 to i32
%v28 = tail call i32 @llvm.hexagon.S2.asl.r.r.sat(i32 %v22, i32 %v27)
%v29 = tail call i32 @llvm.hexagon.A2.asrh(i32 %v28)
%v30 = shl i32 %v29, 16
%v31 = ashr exact i32 %v30, 16
%v32 = icmp slt i32 %v30, 65536
br label %b3
b3: ; preds = %b2
call void @llvm.lifetime.end.p0i8(i64 80, i8* nonnull %v1) #2
ret i16 0
}
; Function Attrs: argmemonly nounwind
declare void @llvm.lifetime.start.p0i8(i64, i8* nocapture) #1
; Function Attrs: nounwind readnone
declare i32 @llvm.hexagon.S2.asr.r.r.sat(i32, i32) #2
; Function Attrs: nounwind readnone
declare i32 @llvm.hexagon.A2.aslh(i32) #2
; Function Attrs: nounwind readnone
declare i32 @llvm.hexagon.A2.asrh(i32) #2
; Function Attrs: nounwind readnone
declare i32 @llvm.hexagon.M2.mpy.acc.sat.ll.s1(i32, i32, i32) #2
; Function Attrs: nounwind
declare signext i16 @f1(i32) local_unnamed_addr #0
; Function Attrs: nounwind readnone
declare i32 @llvm.hexagon.S2.asl.r.r.sat(i32, i32) #2
; Function Attrs: argmemonly nounwind
declare void @llvm.lifetime.end.p0i8(i64, i8* nocapture) #1
attributes #0 = { nounwind }
attributes #1 = { argmemonly nounwind }
attributes #2 = { nounwind readnone }