forked from OSchip/llvm-project
86 lines
2.8 KiB
LLVM
86 lines
2.8 KiB
LLVM
; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -O3 | FileCheck %s
|
|
|
|
; Function Attrs: uwtable
|
|
; When tail-duplicating during placement, we work backward from blocks with
|
|
; multiple successors. In this case, the block dup1 gets duplicated into dup2
|
|
; and if.then64, and then the block dup2 only gets duplicated into land.lhs.true.
|
|
|
|
; Test function: a loop headed by %for.cond whose body branches on %a1 and %a2
; and funnels through %dup2 and/or %dup1 before looping back or exiting.
;   %a1, %a2 - i1 branch conditions (never modified inside the function)
;   %a4      - i32* stored to with 10 or 12, and loaded from in %dup1
;   %a5      - i32* stored to with 2 in %dup2
;   %a6      - i8*  stored to with 1 in %if.then64
;   %a7      - i32 compared against 1 in %dup1 to pick loop-back vs. exit
; In the expected assembly below these arguments show up as %dil, %sil, %rdx,
; %rcx, %r8 and %r9d respectively.
define void @partial_tail_dup(i1 %a1, i1 %a2, i32* %a4, i32* %a5, i8* %a6, i32 %a7) #0 align 2 !prof !1 {
|
|
; Expected llc output. The store from %dup2 and the compare from %dup1 both
; appear inside %land.lhs.true, and the compare from %dup1 also appears in
; %dup2 and %if.then64; %dup1 has no block of its own in the expected output.
; CHECK-LABEL: partial_tail_dup:
|
|
; CHECK: # %bb.0: # %entry
|
|
; CHECK-NEXT: .p2align 4, 0x90
|
|
; CHECK-NEXT: .LBB0_1: # %for.cond
|
|
; CHECK-NEXT: # =>This Inner Loop Header: Depth=1
|
|
; CHECK-NEXT: testb $1, %dil
|
|
; CHECK-NEXT: je .LBB0_3
|
|
; CHECK-NEXT: # %bb.2: # %land.lhs.true
|
|
; CHECK-NEXT: # in Loop: Header=BB0_1 Depth=1
|
|
; CHECK-NEXT: movl $10, (%rdx)
|
|
; CHECK-NEXT: movl $2, (%rcx)
|
|
; CHECK-NEXT: testl %r9d, %r9d
|
|
; CHECK-NEXT: je .LBB0_1
|
|
; CHECK-NEXT: jmp .LBB0_8
|
|
; CHECK-NEXT: .p2align 4, 0x90
|
|
; CHECK-NEXT: .LBB0_6: # %dup2
|
|
; CHECK-NEXT: # in Loop: Header=BB0_1 Depth=1
|
|
; CHECK-NEXT: movl $2, (%rcx)
|
|
; CHECK-NEXT: testl %r9d, %r9d
|
|
; CHECK-NEXT: je .LBB0_1
|
|
; CHECK-NEXT: jmp .LBB0_8
|
|
; CHECK-NEXT: .p2align 4, 0x90
|
|
; CHECK-NEXT: .LBB0_3: # %if.end56
|
|
; CHECK-NEXT: # in Loop: Header=BB0_1 Depth=1
|
|
; CHECK-NEXT: testb $1, %sil
|
|
; CHECK-NEXT: je .LBB0_5
|
|
; CHECK-NEXT: # %bb.4: # %if.then64
|
|
; CHECK-NEXT: # in Loop: Header=BB0_1 Depth=1
|
|
; CHECK-NEXT: movb $1, (%r8)
|
|
; CHECK-NEXT: testl %r9d, %r9d
|
|
; CHECK-NEXT: je .LBB0_1
|
|
; CHECK-NEXT: jmp .LBB0_8
|
|
; CHECK-NEXT: .LBB0_5: # %if.end70
|
|
; CHECK-NEXT: # in Loop: Header=BB0_1 Depth=1
|
|
; CHECK-NEXT: movl $12, (%rdx)
|
|
; CHECK-NEXT: jne .LBB0_6
|
|
; CHECK-NEXT: .LBB0_8: # %for.end
|
|
; CHECK-NEXT: retq
|
|
; Function entry: unconditionally enters the loop header.
entry:
|
|
br label %for.cond
|
|
|
|
; Loop header: %a1 selects between the two arms of the loop body.
for.cond:
|
|
br i1 %a1, label %land.lhs.true, label %if.end56
|
|
|
|
; %a1 true: store 10 through %a4, then continue to %dup2.
land.lhs.true:
|
|
store i32 10, i32* %a4, align 8
|
|
br label %dup2
|
|
|
|
; %a1 false: branch on %a2. !prof !2 weights the %if.then64 edge 5 and the
; %if.end70 edge 1 (weights are listed in successor order).
if.end56:
|
|
br i1 %a2, label %if.then64, label %if.end70, !prof !2
|
|
|
|
; Store 1 through %a6 and go straight to %dup1, bypassing %dup2.
if.then64:
|
|
store i8 1, i8* %a6, align 1
|
|
br label %dup1
|
|
|
|
; Store 12 through %a4; %a2 then picks %dup2 or leaves the loop via %for.end.
; NOTE(review): the expected output has no flag-setting instruction before the
; jne emitted for this branch; presumably it relies on the flags from the
; testb on %sil in %if.end56 -- confirm when regenerating the expectations.
if.end70:
|
|
store i32 12, i32* %a4, align 8
|
|
br i1 %a2, label %dup2, label %for.end
|
|
|
|
; Reached from %land.lhs.true and %if.end70; its only successor is %dup1.
dup2:
|
|
store i32 2, i32* %a5, align 4
|
|
br label %dup1
|
|
|
|
; Reached from %if.then64 and %dup2. %val is not referenced anywhere else in
; the function. `icmp ult i32 %a7, 1` is true only when %a7 is 0, which matches
; the `testl %r9d, %r9d` / `je .LBB0_1` pairs in the expected output.
; !prof !3 weights the loop-back edge 5 and the exit edge 1.
dup1:
|
|
%val = load i32, i32* %a4, align 8
|
|
%switch = icmp ult i32 %a7, 1
|
|
br i1 %switch, label %for.cond, label %for.end, !prof !3
|
|
|
|
; Loop exit: reached from %if.end70 and %dup1.
for.end:
|
|
ret void
|
|
}
|
|
|
|
; Attribute group #0, referenced by the definition of @partial_tail_dup.
attributes #0 = { uwtable }
|
|
|
|
; !1 is attached to @partial_tail_dup via `!prof !1`: function entry count of 2.
!1 = !{!"function_entry_count", i64 2}
|
|
; !2 is attached to the conditional branch in %if.end56: weight 5 for the
; first successor (%if.then64) and 1 for the second (%if.end70).
!2 = !{!"branch_weights", i32 5, i32 1}
|
|
; !3 is attached to the conditional branch in %dup1: weight 5 for the first
; successor (%for.cond, the loop back-edge) and 1 for the second (%for.end).
!3 = !{!"branch_weights", i32 5, i32 1}
|