forked from OSchip/llvm-project
150 lines
6.6 KiB
YAML
150 lines
6.6 KiB
YAML
# RUN: llc -mtriple=aarch64 -run-pass=machine-outliner -machine-outliner-reruns=1 -verify-machineinstrs %s -o - | FileCheck %s --check-prefix TWO-RUNS
|
|
# RUN: llc -mtriple=aarch64 -run-pass=machine-outliner -machine-outliner-reruns=0 -verify-machineinstrs %s -o - | FileCheck %s --check-prefix ONE-RUN
|
|
# RUN: llc -mtriple=aarch64 -run-pass=machine-outliner -machine-outliner-reruns=3 -verify-machineinstrs %s -o - | FileCheck %s --check-prefix FOUR-RUNS
|
|
|
|
# Example of Repeated Instruction Sequence - Iterative Machine Outlining
|
|
#
|
|
#; define void @"$s12"(...) { define i64 @"$s5" (...) { define void @"$s13"(...) {
|
|
# ... ... ...
|
|
# %8 = load i1, i1* %7 %8 = load i1, i1* %7
|
|
# %9 = load i4, i4* %6 %9 = load i4, i4* %6 %9 = load i4, i4* %6
|
|
# store i4 %9, i4* %5 store i4 %9, i4* %5 store i4 %9, i4* %5
|
|
# ... ... ...
|
|
# } } }
|
|
#
|
|
# After machine outliner (1st time)
|
|
#
|
|
# define void @"$s12"(...) { define i64 @"$s5" (...) { define void @"$s13"(...) {
|
|
# ... ... ...
|
|
# %8 = load i1, i1* %7 %8 = load i1, i1* %7
|
|
# call void @outlined_function_1_1 call void @outlined_function_1_1 call void @outlined_function_1_1
|
|
# ... ... ...
|
|
# } } }
|
|
#
|
|
# After machine outliner (2nd time)
|
|
#
|
|
# define void @"$s12"(...) { define i64 @"$s5" (...) { define void @"$s13"(...) {
|
|
# ... ... ...
|
|
# call void @outlined_function_2_1 call void @outlined_function_1_1 call void @outlined_function_2_1
|
|
# ... ... ...
|
|
# } } }
|
|
#
|
|
# Check whether machine outliner can further find the outlining opportunity after machine
|
|
# outlining has been performed.
|
|
#
|
|
# LLVM IR module backing the MIR functions in this file: @foo and @widget are
# the external callees of the BL instructions, and each @baz.N definition is an
# empty stub (ret void) carrying attribute set #0 (minsize noredzone optsize).
--- |
|
|
declare void @foo() local_unnamed_addr
|
|
|
|
declare void @widget() local_unnamed_addr
|
|
|
|
; Function Attrs: minsize noredzone optsize
|
|
define void @baz.14() #0 {
|
|
ret void
|
|
}
|
|
|
|
; Function Attrs: minsize noredzone optsize
|
|
define void @baz.15() #0 {
|
|
ret void
|
|
}
|
|
|
|
; Function Attrs: minsize noredzone optsize
|
|
define void @baz.16() #0 {
|
|
ret void
|
|
}
|
|
|
|
attributes #0 = { minsize noredzone optsize }
|
|
...
|
|
# baz.14: stores $lr/$x19 to the stack with STPXpre, keeps the incoming $x0 in
# $x19, then calls @foo with $x0 = $x0 + 48, $x1 = $sp, $w2 = 33 and $x3 = $xzr.
# Afterwards it calls @widget with the saved $x0 and reloads $lr/$x19 with
# LDPXpost before returning. The instruction sequence is identical to baz.16;
# baz.15 differs in the ADDXri immediate (16) and in its kill flags.
---
|
|
name: baz.14
|
|
tracksRegLiveness: true
|
|
stack:
|
|
- { id: 0, offset: -8, size: 8 }
|
|
- { id: 1, offset: -16, size: 8 }
|
|
body: |
|
|
bb.0:
|
|
liveins: $x0, $x19, $lr
|
|
|
|
early-clobber $sp = frame-setup STPXpre killed $lr, killed $x19, $sp, -2 :: (store (s64) into %stack.1), (store (s64) into %stack.0)
|
|
frame-setup CFI_INSTRUCTION def_cfa_offset 16
|
|
frame-setup CFI_INSTRUCTION offset $w19, -8
|
|
frame-setup CFI_INSTRUCTION offset $w30, -16
|
|
renamable $x19 = COPY $x0
|
|
renamable $x0 = nuw ADDXri $x0, 48, 0
|
|
$x1 = ADDXri $sp, 0, 0
|
|
dead $w2 = MOVi32imm 33, implicit-def $x2
|
|
$x3 = COPY $xzr
|
|
BL @foo, csr_aarch64_aapcs, implicit-def dead $lr, implicit $sp, implicit $x0, implicit killed $x1, implicit killed $x2, implicit killed $x3, implicit-def $sp
|
|
$x0 = COPY killed renamable $x19
|
|
BL @widget, csr_aarch64_aapcs, implicit-def dead $lr, implicit $sp, implicit $x0, implicit-def $sp
|
|
early-clobber $sp, $lr, $x19 = frame-destroy LDPXpost $sp, 2 :: (load (s64) from %stack.1), (load (s64) from %stack.0)
|
|
RET_ReallyLR
|
|
|
|
...
|
|
# baz.15: same frame setup, @foo/@widget call pair and frame teardown as baz.14
# and baz.16, with two visible differences: the ADDXri computes $x0 + 16 (not
# + 48) from a "killed renamable" $x0, and the BL @foo reads $x1 without a kill
# flag. NOTE(review): presumably these differences keep baz.15 out of the longer
# sequence shared by baz.14 and baz.16 -- confirm against the outliner output.
---
|
|
name: baz.15
|
|
tracksRegLiveness: true
|
|
stack:
|
|
- { id: 0, offset: -8, size: 8 }
|
|
- { id: 1, offset: -16, size: 8 }
|
|
body: |
|
|
bb.0:
|
|
liveins: $x0, $x19, $lr
|
|
|
|
early-clobber $sp = frame-setup STPXpre killed $lr, killed $x19, $sp, -2 :: (store (s64) into %stack.1), (store (s64) into %stack.0)
|
|
frame-setup CFI_INSTRUCTION def_cfa_offset 16
|
|
frame-setup CFI_INSTRUCTION offset $w19, -8
|
|
frame-setup CFI_INSTRUCTION offset $w30, -16
|
|
renamable $x19 = COPY $x0
|
|
renamable $x0 = nuw ADDXri killed renamable $x0, 16, 0
|
|
$x1 = ADDXri $sp, 0, 0
|
|
dead $w2 = MOVi32imm 33, implicit-def $x2
|
|
$x3 = COPY $xzr
|
|
BL @foo, csr_aarch64_aapcs, implicit-def dead $lr, implicit $sp, implicit $x0, implicit $x1, implicit killed $x2, implicit killed $x3, implicit-def $sp
|
|
$x0 = COPY killed renamable $x19
|
|
BL @widget, csr_aarch64_aapcs, implicit-def dead $lr, implicit $sp, implicit $x0, implicit-def $sp
|
|
early-clobber $sp, $lr, $x19 = frame-destroy LDPXpost $sp, 2 :: (load (s64) from %stack.1), (load (s64) from %stack.0)
|
|
RET_ReallyLR
|
|
|
|
...
|
|
# baz.16: instruction-for-instruction copy of baz.14. It stores $lr/$x19 with
# STPXpre, keeps the incoming $x0 in $x19, calls @foo with $x0 = $x0 + 48,
# $x1 = $sp, $w2 = 33 and $x3 = $xzr, then calls @widget with the saved $x0 and
# reloads $lr/$x19 with LDPXpost before returning.
---
|
|
name: baz.16
|
|
tracksRegLiveness: true
|
|
stack:
|
|
- { id: 0, offset: -8, size: 8 }
|
|
- { id: 1, offset: -16, size: 8 }
|
|
body: |
|
|
bb.0:
|
|
liveins: $x0, $x19, $lr
|
|
|
|
early-clobber $sp = frame-setup STPXpre killed $lr, killed $x19, $sp, -2 :: (store (s64) into %stack.1), (store (s64) into %stack.0)
|
|
frame-setup CFI_INSTRUCTION def_cfa_offset 16
|
|
frame-setup CFI_INSTRUCTION offset $w19, -8
|
|
frame-setup CFI_INSTRUCTION offset $w30, -16
|
|
renamable $x19 = COPY $x0
|
|
renamable $x0 = nuw ADDXri $x0, 48, 0
|
|
$x1 = ADDXri $sp, 0, 0
|
|
dead $w2 = MOVi32imm 33, implicit-def $x2
|
|
$x3 = COPY $xzr
|
|
BL @foo, csr_aarch64_aapcs, implicit-def dead $lr, implicit $sp, implicit $x0, implicit killed $x1, implicit killed $x2, implicit killed $x3, implicit-def $sp
|
|
$x0 = COPY killed renamable $x19
|
|
BL @widget, csr_aarch64_aapcs, implicit-def dead $lr, implicit $sp, implicit $x0, implicit-def $sp
|
|
early-clobber $sp, $lr, $x19 = frame-destroy LDPXpost $sp, 2 :: (load (s64) from %stack.1), (load (s64) from %stack.0)
|
|
RET_ReallyLR
|
|
|
|
...
|
|
|
|
# TWO-RUNS: name: OUTLINED_FUNCTION_2_0
|
|
# TWO-RUNS-DAG: bb.0:
|
|
# TWO-RUNS-DAG: renamable $x19 = COPY $x0
|
|
# TWO-RUNS-NEXT: renamable $x0 = nuw ADDXri $x0, 48, 0
|
|
# TWO-RUNS-NEXT: TCRETURNdi @OUTLINED_FUNCTION_0, 0, implicit $sp
|
|
#
|
|
# The machine outliner is expected to stop at the 1st iteration for case ONE-RUN
|
|
# since machine-outliner-reruns is specified as 0.
|
|
# ONE-RUN-NOT: [[OUTLINED:OUTLINED_FUNCTION_2_[0-9]+]]
|
|
#
|
|
# The machine outliner is expected to stop at the 3rd iteration for case FOUR-RUNS
|
|
# since the MIR has no change at the 3rd iteration.
|
|
# FOUR-RUNS-NOT: [[OUTLINED:OUTLINED_FUNCTION_3_[0-9]+]]
|
|
# FOUR-RUNS-NOT: [[OUTLINED:OUTLINED_FUNCTION_4_[0-9]+]]
|