2019-04-17 12:52:47 +08:00
|
|
|
; RUN: opt < %s -deadargelim -S | FileCheck %s
|
|
|
|
|
Reland [X86] Codegen for preallocated
See https://reviews.llvm.org/D74651 for the preallocated IR constructs
and LangRef changes.
In X86TargetLowering::LowerCall(), if a call is preallocated, record
each argument's offset from the stack pointer and the total stack
adjustment. Associate the call Value with an integer index. Store the
info in X86MachineFunctionInfo with the integer index as the key.
This adds two new target independent ISDOpcodes and two new target
dependent Opcodes corresponding to @llvm.call.preallocated.{setup,arg}.
The setup ISelDAG node takes in a chain and outputs a chain and a
SrcValue of the preallocated call Value. It is lowered to a target
dependent node with the SrcValue replaced with the integer index key by
looking in X86MachineFunctionInfo. In
X86TargetLowering::EmitInstrWithCustomInserter() this is lowered to an
%esp adjustment, the exact amount determined by looking in
X86MachineFunctionInfo with the integer index key.
The arg ISelDAG node takes in a chain, a SrcValue of the preallocated
call Value, and the arg index int constant. It produces a chain and the
pointer to the arg. It is lowered to a target dependent node with the
SrcValue replaced with the integer index key by looking in
X86MachineFunctionInfo. In
X86TargetLowering::EmitInstrWithCustomInserter() this is lowered to a
lea of the stack pointer plus an offset determined by looking in
X86MachineFunctionInfo with the integer index key.
Force any function containing a preallocated call to use the frame
pointer.
Does not yet handle a setup without a call, or a conditional call.
Does not yet handle musttail. That requires a LangRef change first.
Tried to look at all references to inalloca and see if they apply to
preallocated. I've made preallocated versions of tests testing inalloca
whenever possible and when they make sense (e.g. not alloca related,
inalloca edge cases).
Aside from the tests added here, I checked that this codegen produces
correct code for something like
```
struct A {
A();
A(A&&);
~A();
};
void bar() {
foo(foo(foo(foo(foo(A(), 4), 5), 6), 7), 8);
}
```
by replacing the inalloca version of the .ll file with the appropriate
preallocated code. Running the executable produces the same results as
using the current inalloca implementation.
Reverted due to unexpectedly passing tests, added REQUIRES: asserts for reland.
Subscribers: hiraditya, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D77689
2020-03-17 03:32:36 +08:00
|
|
|
declare token @llvm.call.preallocated.setup(i32)
|
|
|
|
declare i8* @llvm.call.preallocated.arg(token, i32)
|
|
|
|
|
2019-04-17 12:52:47 +08:00
|
|
|
%Ty = type <{ i32, i32 }>
|
|
|
|
|
|
|
|
; Check if the pass doesn't modify anything that doesn't need changing. We feed
|
|
|
|
; an unused argument to each function to lure it into changing _something_ about
|
|
|
|
; the function and then changing too much.
|
|
|
|
|
|
|
|
; This checks that the return value attributes are not removed
|
2020-10-15 19:04:36 +08:00
|
|
|
; CHECK: define internal zeroext i32 @test1() #1
|
2019-04-17 12:52:47 +08:00
|
|
|
; %DEADARG1 is never used in the body. The function returns the constant 1,
; carries a zeroext return attribute, and is marked nounwind.
define internal zeroext i32 @test1(i32 %DEADARG1) nounwind {
|
2020-10-15 19:04:36 +08:00
|
|
|
;
|
|
|
|
;
|
|
|
|
ret i32 1
|
2019-04-17 12:52:47 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
; This checks that the packed struct return type does not become non-packed
|
|
|
|
; CHECK-LABEL: define internal <{ i32, i32 }> @test2(
|
|
|
|
; %DEADARG1 is never used in the body. The function returns the packed struct
; constant <{ i32 1, i32 2 }>.
define internal <{ i32, i32 }> @test2(i32 %DEADARG1) {
|
2020-10-15 19:04:36 +08:00
|
|
|
;
|
|
|
|
;
|
|
|
|
ret <{ i32, i32 }> <{ i32 1, i32 2 }>
|
2019-04-17 12:52:47 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
; We use this external function to make sure the return values don't become dead
|
|
|
|
declare void @user(i32, <{ i32, i32 }>)
|
|
|
|
|
|
|
|
; Calls @test1 and @test2 with constant arguments and forwards both results to
; the external function @user.
define void @caller() {
|
2020-10-15 19:04:36 +08:00
|
|
|
;
|
|
|
|
;
|
|
|
|
%B = call i32 @test1(i32 1)
|
|
|
|
%C = call <{ i32, i32 }> @test2(i32 2)
|
|
|
|
call void @user(i32 %B, <{ i32, i32 }> %C)
|
|
|
|
ret void
|
2019-04-17 12:52:47 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
; We can't remove 'this' here, as that would put argmem in ecx instead of
|
|
|
|
; memory.
|
2021-03-29 20:42:23 +08:00
|
|
|
; %this is never read in the body. The function loads the i32 pointed to by the
; inalloca argument %argmem and returns it.
define internal x86_thiscallcc i32 @unused_this(i32* %this, i32* inalloca(i32) %argmem) {
|
2020-10-15 19:04:36 +08:00
|
|
|
;
|
|
|
|
;
|
|
|
|
%v = load i32, i32* %argmem
|
|
|
|
ret i32 %v
|
2019-04-17 12:52:47 +08:00
|
|
|
}
|
2021-03-29 20:42:23 +08:00
|
|
|
; CHECK-LABEL: define internal x86_thiscallcc i32 @unused_this(i32* %this, i32* inalloca(i32) %argmem)
|
2019-04-17 12:52:47 +08:00
|
|
|
|
|
|
|
; Stores 42 into an inalloca allocation %m and passes it, together with a plain
; alloca %t as the first argument, to @unused_this. Returns the call's result.
define i32 @caller2() {
|
2020-10-15 19:04:36 +08:00
|
|
|
;
|
|
|
|
;
|
|
|
|
%t = alloca i32
|
|
|
|
%m = alloca inalloca i32
|
|
|
|
store i32 42, i32* %m
|
2021-03-29 20:42:23 +08:00
|
|
|
%v = call x86_thiscallcc i32 @unused_this(i32* %t, i32* inalloca(i32) %m)
|
2020-10-15 19:04:36 +08:00
|
|
|
ret i32 %v
|
2019-04-17 12:52:47 +08:00
|
|
|
}
|
|
|
|
|
Reland [X86] Codegen for preallocated
See https://reviews.llvm.org/D74651 for the preallocated IR constructs
and LangRef changes.
In X86TargetLowering::LowerCall(), if a call is preallocated, record
each argument's offset from the stack pointer and the total stack
adjustment. Associate the call Value with an integer index. Store the
info in X86MachineFunctionInfo with the integer index as the key.
This adds two new target independent ISDOpcodes and two new target
dependent Opcodes corresponding to @llvm.call.preallocated.{setup,arg}.
The setup ISelDAG node takes in a chain and outputs a chain and a
SrcValue of the preallocated call Value. It is lowered to a target
dependent node with the SrcValue replaced with the integer index key by
looking in X86MachineFunctionInfo. In
X86TargetLowering::EmitInstrWithCustomInserter() this is lowered to an
%esp adjustment, the exact amount determined by looking in
X86MachineFunctionInfo with the integer index key.
The arg ISelDAG node takes in a chain, a SrcValue of the preallocated
call Value, and the arg index int constant. It produces a chain and the
pointer to the arg. It is lowered to a target dependent node with the
SrcValue replaced with the integer index key by looking in
X86MachineFunctionInfo. In
X86TargetLowering::EmitInstrWithCustomInserter() this is lowered to a
lea of the stack pointer plus an offset determined by looking in
X86MachineFunctionInfo with the integer index key.
Force any function containing a preallocated call to use the frame
pointer.
Does not yet handle a setup without a call, or a conditional call.
Does not yet handle musttail. That requires a LangRef change first.
Tried to look at all references to inalloca and see if they apply to
preallocated. I've made preallocated versions of tests testing inalloca
whenever possible and when they make sense (e.g. not alloca related,
inalloca edge cases).
Aside from the tests added here, I checked that this codegen produces
correct code for something like
```
struct A {
A();
A(A&&);
~A();
};
void bar() {
foo(foo(foo(foo(foo(A(), 4), 5), 6), 7), 8);
}
```
by replacing the inalloca version of the .ll file with the appropriate
preallocated code. Running the executable produces the same results as
using the current inalloca implementation.
Reverted due to unexpectedly passing tests, added REQUIRES: asserts for reland.
Subscribers: hiraditya, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D77689
2020-03-17 03:32:36 +08:00
|
|
|
; We can't remove 'this' here, as that would put argmem in ecx instead of
|
|
|
|
; memory.
|
|
|
|
define internal x86_thiscallcc i32 @unused_this_preallocated(i32* %this, i32* preallocated(i32) %argmem) {
|
2020-10-15 19:04:36 +08:00
|
|
|
;
|
|
|
|
;
|
|
|
|
%v = load i32, i32* %argmem
|
|
|
|
ret i32 %v
|
Reland [X86] Codegen for preallocated
See https://reviews.llvm.org/D74651 for the preallocated IR constructs
and LangRef changes.
In X86TargetLowering::LowerCall(), if a call is preallocated, record
each argument's offset from the stack pointer and the total stack
adjustment. Associate the call Value with an integer index. Store the
info in X86MachineFunctionInfo with the integer index as the key.
This adds two new target independent ISDOpcodes and two new target
dependent Opcodes corresponding to @llvm.call.preallocated.{setup,arg}.
The setup ISelDAG node takes in a chain and outputs a chain and a
SrcValue of the preallocated call Value. It is lowered to a target
dependent node with the SrcValue replaced with the integer index key by
looking in X86MachineFunctionInfo. In
X86TargetLowering::EmitInstrWithCustomInserter() this is lowered to an
%esp adjustment, the exact amount determined by looking in
X86MachineFunctionInfo with the integer index key.
The arg ISelDAG node takes in a chain, a SrcValue of the preallocated
call Value, and the arg index int constant. It produces a chain and the
pointer to the arg. It is lowered to a target dependent node with the
SrcValue replaced with the integer index key by looking in
X86MachineFunctionInfo. In
X86TargetLowering::EmitInstrWithCustomInserter() this is lowered to a
lea of the stack pointer plus an offset determined by looking in
X86MachineFunctionInfo with the integer index key.
Force any function containing a preallocated call to use the frame
pointer.
Does not yet handle a setup without a call, or a conditional call.
Does not yet handle musttail. That requires a LangRef change first.
Tried to look at all references to inalloca and see if they apply to
preallocated. I've made preallocated versions of tests testing inalloca
whenever possible and when they make sense (e.g. not alloca related,
inalloca edge cases).
Aside from the tests added here, I checked that this codegen produces
correct code for something like
```
struct A {
A();
A(A&&);
~A();
};
void bar() {
foo(foo(foo(foo(foo(A(), 4), 5), 6), 7), 8);
}
```
by replacing the inalloca version of the .ll file with the appropriate
preallocated code. Running the executable produces the same results as
using the current inalloca implementation.
Reverted due to unexpectedly passing tests, added REQUIRES: asserts for reland.
Subscribers: hiraditya, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D77689
2020-03-17 03:32:36 +08:00
|
|
|
}
|
|
|
|
; CHECK-LABEL: define internal x86_thiscallcc i32 @unused_this_preallocated(i32* %this, i32* preallocated(i32) %argmem)
|
|
|
|
|
|
|
|
define i32 @caller3() {
|
2020-10-15 19:04:36 +08:00
|
|
|
;
|
|
|
|
;
|
|
|
|
%t = alloca i32
|
|
|
|
%c = call token @llvm.call.preallocated.setup(i32 1)
|
|
|
|
%M = call i8* @llvm.call.preallocated.arg(token %c, i32 0) preallocated(i32)
|
|
|
|
%m = bitcast i8* %M to i32*
|
|
|
|
store i32 42, i32* %m
|
|
|
|
%v = call x86_thiscallcc i32 @unused_this_preallocated(i32* %t, i32* preallocated(i32) %m) ["preallocated"(token %c)]
|
|
|
|
ret i32 %v
|
Reland [X86] Codegen for preallocated
See https://reviews.llvm.org/D74651 for the preallocated IR constructs
and LangRef changes.
In X86TargetLowering::LowerCall(), if a call is preallocated, record
each argument's offset from the stack pointer and the total stack
adjustment. Associate the call Value with an integer index. Store the
info in X86MachineFunctionInfo with the integer index as the key.
This adds two new target independent ISDOpcodes and two new target
dependent Opcodes corresponding to @llvm.call.preallocated.{setup,arg}.
The setup ISelDAG node takes in a chain and outputs a chain and a
SrcValue of the preallocated call Value. It is lowered to a target
dependent node with the SrcValue replaced with the integer index key by
looking in X86MachineFunctionInfo. In
X86TargetLowering::EmitInstrWithCustomInserter() this is lowered to an
%esp adjustment, the exact amount determined by looking in
X86MachineFunctionInfo with the integer index key.
The arg ISelDAG node takes in a chain, a SrcValue of the preallocated
call Value, and the arg index int constant. It produces a chain and the
pointer to the arg. It is lowered to a target dependent node with the
SrcValue replaced with the integer index key by looking in
X86MachineFunctionInfo. In
X86TargetLowering::EmitInstrWithCustomInserter() this is lowered to a
lea of the stack pointer plus an offset determined by looking in
X86MachineFunctionInfo with the integer index key.
Force any function containing a preallocated call to use the frame
pointer.
Does not yet handle a setup without a call, or a conditional call.
Does not yet handle musttail. That requires a LangRef change first.
Tried to look at all references to inalloca and see if they apply to
preallocated. I've made preallocated versions of tests testing inalloca
whenever possible and when they make sense (e.g. not alloca related,
inalloca edge cases).
Aside from the tests added here, I checked that this codegen produces
correct code for something like
```
struct A {
A();
A(A&&);
~A();
};
void bar() {
foo(foo(foo(foo(foo(A(), 4), 5), 6), 7), 8);
}
```
by replacing the inalloca version of the .ll file with the appropriate
preallocated code. Running the executable produces the same results as
using the current inalloca implementation.
Reverted due to unexpectedly passing tests, added REQUIRES: asserts for reland.
Subscribers: hiraditya, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D77689
2020-03-17 03:32:36 +08:00
|
|
|
}
|
|
|
|
|
2020-10-15 19:04:36 +08:00
|
|
|
; CHECK: attributes #0 = { nofree nosync nounwind willreturn }
|
|
|
|
; CHECK: attributes #1 = { nounwind }
|