[ARM] Inline callee if its target-features are a subset of the caller
Summary:
Similar to X86, it should be safe to inline callees if their
target-features are a subset of the caller. As some subtarget features
provide different instructions depending on whether they are set or
unset (e.g. ThumbMode and ModeSoftFloat), we use a whitelist of
target-features describing hardware capabilities only.
Reviewers: kristof.beyls, rengolin, t.p.northover, SjoerdMeijer, peter.smith, silviu.baranga, efriedma
Reviewed By: SjoerdMeijer, efriedma
Subscribers: dschuff, efriedma, aemerson, sdardis, javed.absar, arichardson, eraman, llvm-commits
Differential Revision: https://reviews.llvm.org/D34697
llvm-svn: 307889
2017-07-13 16:26:17 +08:00
|
|
|
; RUN: opt < %s -mtriple=arm-unknown-linux-gnu -S -inline | FileCheck %s
|
|
|
|
; RUN: opt < %s -mtriple=arm-unknown-linux-gnu -S -passes='cgscc(inline)' | FileCheck %s
|
|
|
|
; Check that we only inline when we have compatible target attributes.
|
|
|
|
; ARM has implemented a target attribute that will verify that the attribute
|
|
|
|
; sets are compatible.
|
|
|
|
|
|
|
|
define i32 @foo() #0 {
|
|
|
|
entry:
|
|
|
|
%call = call i32 (...) @baz()
|
|
|
|
ret i32 %call
|
|
|
|
; CHECK-LABEL: foo
|
|
|
|
; CHECK: call i32 (...) @baz()
|
|
|
|
}
|
|
|
|
declare i32 @baz(...) #0
|
|
|
|
|
|
|
|
define i32 @bar() #1 {
|
|
|
|
entry:
|
|
|
|
%call = call i32 @foo()
|
|
|
|
ret i32 %call
|
|
|
|
; CHECK-LABEL: bar
|
|
|
|
; CHECK: call i32 (...) @baz()
|
|
|
|
}
|
|
|
|
|
|
|
|
define i32 @qux() #0 {
|
|
|
|
entry:
|
|
|
|
%call = call i32 @bar()
|
|
|
|
ret i32 %call
|
|
|
|
; CHECK-LABEL: qux
|
|
|
|
; CHECK: call i32 @bar()
|
|
|
|
}
|
|
|
|
|
|
|
|
define i32 @thumb_fn() #2 {
|
|
|
|
entry:
|
|
|
|
%call = call i32 @foo()
|
|
|
|
ret i32 %call
|
|
|
|
; CHECK-LABEL: thumb_fn
|
|
|
|
; CHECK: call i32 @foo
|
|
|
|
}
|
|
|
|
|
|
|
|
define i32 @strict_align() #3 {
|
|
|
|
entry:
|
|
|
|
%call = call i32 @foo()
|
|
|
|
ret i32 %call
|
|
|
|
; CHECK-LABEL: strict_align
|
|
|
|
; CHECK: call i32 (...) @baz()
|
|
|
|
}
|
|
|
|
|
|
|
|
define i32 @soft_float_fn() #4 {
|
|
|
|
entry:
|
|
|
|
%call = call i32 @foo()
|
|
|
|
ret i32 %call
|
2017-07-13 16:53:43 +08:00
|
|
|
; CHECK-LABEL: soft_float_fn
|
[ARM] Inline callee if its target-features are a subset of the caller
Summary:
Similar to X86, it should be safe to inline callees if their
target-features are a subset of the caller. As some subtarget features
provide different instructions depending on whether they are set or
unset (e.g. ThumbMode and ModeSoftFloat), we use a whitelist of
target-features describing hardware capabilities only.
Reviewers: kristof.beyls, rengolin, t.p.northover, SjoerdMeijer, peter.smith, silviu.baranga, efriedma
Reviewed By: SjoerdMeijer, efriedma
Subscribers: dschuff, efriedma, aemerson, sdardis, javed.absar, arichardson, eraman, llvm-commits
Differential Revision: https://reviews.llvm.org/D34697
llvm-svn: 307889
2017-07-13 16:26:17 +08:00
|
|
|
; CHECK: call i32 @foo
|
|
|
|
}
|
|
|
|
|
|
|
|
attributes #0 = { "target-cpu"="generic" "target-features"="+dsp,+neon" }
|
|
|
|
attributes #1 = { "target-cpu"="generic" "target-features"="+dsp,+neon,+fp16" }
|
|
|
|
attributes #2 = { "target-cpu"="generic" "target-features"="+dsp,+neon,+fp16,+thumb-mode" }
|
|
|
|
attributes #3 = { "target-cpu"="generic" "target-features"="+dsp,+neon,+strict-align" }
|
|
|
|
attributes #4 = { "target-cpu"="generic" "target-features"="+dsp,+neon,+fp16,+soft-float" }
|