forked from OSchip/llvm-project
[AArch64] Treat x18 as callee-saved in functions with windows calling convention on non-windows OSes
Treat it as callee-saved, and always back it up. When windows code calls entry points in unix code, marked with the windows calling convention, that unix code can call other functions that aren't compiled with -ffixed-x18 which may clobber x18 freely. By backing it up and restoring it on return, we preserve the register across the function call, fulfilling this part of the windows calling convention on another OS. This isn't enough for making sure that x18 is preserved when non-windows code does a callback to windows code, but is a clear improvement over the current status quo. Additionally, Wine is nowadays building many modules as PE DLLs, which avoids the callback issue altogether for those DLLs. Differential Revision: https://reviews.llvm.org/D61892
This commit is contained in:
parent
2388a096e7
commit
cf97e0ec42
|
@ -384,6 +384,10 @@ def CSR_AArch64_AAPCS : CalleeSavedRegs<(add X19, X20, X21, X22, X23, X24,
|
|||
D8, D9, D10, D11,
|
||||
D12, D13, D14, D15)>;
|
||||
|
||||
// A variant for treating X18 as callee saved, when interfacing with
|
||||
// code that needs X18 to be preserved.
|
||||
def CSR_AArch64_AAPCS_X18 : CalleeSavedRegs<(add X18, CSR_AArch64_AAPCS)>;
|
||||
|
||||
// Win64 has unwinding codes for an (FP,LR) pair, save_fplr and save_fplr_x.
|
||||
// We put FP before LR, so that frame lowering logic generates (FP,LR) pairs,
|
||||
// and not (LR,FP) pairs.
|
||||
|
|
|
@ -2389,6 +2389,7 @@ void AArch64FrameLowering::determineCalleeSaves(MachineFunction &MF,
|
|||
TargetFrameLowering::determineCalleeSaves(MF, SavedRegs, RS);
|
||||
const AArch64RegisterInfo *RegInfo = static_cast<const AArch64RegisterInfo *>(
|
||||
MF.getSubtarget().getRegisterInfo());
|
||||
const AArch64Subtarget &Subtarget = MF.getSubtarget<AArch64Subtarget>();
|
||||
AArch64FunctionInfo *AFI = MF.getInfo<AArch64FunctionInfo>();
|
||||
unsigned UnspilledCSGPR = AArch64::NoRegister;
|
||||
unsigned UnspilledCSGPRPaired = AArch64::NoRegister;
|
||||
|
@ -2437,6 +2438,16 @@ void AArch64FrameLowering::determineCalleeSaves(MachineFunction &MF,
|
|||
}
|
||||
}
|
||||
|
||||
if (MF.getFunction().getCallingConv() == CallingConv::Win64 &&
|
||||
!Subtarget.isTargetWindows()) {
|
||||
// For Windows calling convention on a non-windows OS, where X18 is treated
|
||||
// as reserved, back up X18 when entering non-windows code (marked with the
|
||||
// Windows calling convention) and restore when returning regardless of
|
||||
// whether the individual function uses it - it might call other functions
|
||||
// that clobber it.
|
||||
SavedRegs.set(AArch64::X18);
|
||||
}
|
||||
|
||||
// Calculates the callee saved stack size.
|
||||
unsigned CSStackSize = 0;
|
||||
unsigned SVECSStackSize = 0;
|
||||
|
|
|
@ -3958,6 +3958,13 @@ bool AArch64TargetLowering::isEligibleForTailCallOptimization(
|
|||
CallingConv::ID CallerCC = CallerF.getCallingConv();
|
||||
bool CCMatch = CallerCC == CalleeCC;
|
||||
|
||||
// When using the Windows calling convention on a non-windows OS, we want
|
||||
// to back up and restore X18 in such functions; we can't do a tail call
|
||||
// from those functions.
|
||||
if (CallerCC == CallingConv::Win64 && !Subtarget->isTargetWindows() &&
|
||||
CalleeCC != CallingConv::Win64)
|
||||
return false;
|
||||
|
||||
// Byval parameters hand the function a pointer directly into the stack area
|
||||
// we want to reuse during a tail call. Working around this *is* possible (see
|
||||
// X86) but less efficient and uglier in LowerCall.
|
||||
|
|
|
@ -71,6 +71,10 @@ AArch64RegisterInfo::getCalleeSavedRegs(const MachineFunction *MF) const {
|
|||
return CSR_AArch64_AAPCS_SwiftError_SaveList;
|
||||
if (MF->getFunction().getCallingConv() == CallingConv::PreserveMost)
|
||||
return CSR_AArch64_RT_MostRegs_SaveList;
|
||||
if (MF->getFunction().getCallingConv() == CallingConv::Win64)
|
||||
// This is for OSes other than Windows; Windows is a separate case further
|
||||
// above.
|
||||
return CSR_AArch64_AAPCS_X18_SaveList;
|
||||
return CSR_AArch64_AAPCS_SaveList;
|
||||
}
|
||||
|
||||
|
|
|
@ -2,16 +2,18 @@
|
|||
|
||||
define win64cc void @pass_va(i32 %count, ...) nounwind {
|
||||
entry:
|
||||
; CHECK: str x30, [sp, #-80]!
|
||||
; CHECK: add x8, sp, #24
|
||||
; CHECK: add x0, sp, #24
|
||||
; CHECK: stp x1, x2, [sp, #24]
|
||||
; CHECK: stp x3, x4, [sp, #40]
|
||||
; CHECK: stp x5, x6, [sp, #56]
|
||||
; CHECK: str x7, [sp, #72]
|
||||
; CHECK: sub sp, sp, #96
|
||||
; CHECK: add x8, sp, #40
|
||||
; CHECK: add x0, sp, #40
|
||||
; CHECK: stp x30, x18, [sp, #16]
|
||||
; CHECK: stp x1, x2, [sp, #40]
|
||||
; CHECK: stp x3, x4, [sp, #56]
|
||||
; CHECK: stp x5, x6, [sp, #72]
|
||||
; CHECK: str x7, [sp, #88]
|
||||
; CHECK: str x8, [sp, #8]
|
||||
; CHECK: bl other_func
|
||||
; CHECK: ldr x30, [sp], #80
|
||||
; CHECK: ldp x30, x18, [sp, #16]
|
||||
; CHECK: add sp, sp, #96
|
||||
; CHECK: ret
|
||||
%ap = alloca i8*, align 8
|
||||
%ap1 = bitcast i8** %ap to i8*
|
||||
|
@ -27,11 +29,11 @@ declare void @llvm.va_start(i8*) nounwind
|
|||
declare void @llvm.va_copy(i8*, i8*) nounwind
|
||||
|
||||
; CHECK-LABEL: f9:
|
||||
; CHECK: sub sp, sp, #16
|
||||
; CHECK: str x18, [sp, #-16]!
|
||||
; CHECK: add x8, sp, #24
|
||||
; CHECK: add x0, sp, #24
|
||||
; CHECK: str x8, [sp, #8]
|
||||
; CHECK: add sp, sp, #16
|
||||
; CHECK: ldr x18, [sp], #16
|
||||
; CHECK: ret
|
||||
define win64cc i8* @f9(i64 %a0, i64 %a1, i64 %a2, i64 %a3, i64 %a4, i64 %a5, i64 %a6, i64 %a7, i64 %a8, ...) nounwind {
|
||||
entry:
|
||||
|
@ -43,11 +45,11 @@ entry:
|
|||
}
|
||||
|
||||
; CHECK-LABEL: f8:
|
||||
; CHECK: sub sp, sp, #16
|
||||
; CHECK: str x18, [sp, #-16]!
|
||||
; CHECK: add x8, sp, #16
|
||||
; CHECK: add x0, sp, #16
|
||||
; CHECK: str x8, [sp, #8]
|
||||
; CHECK: add sp, sp, #16
|
||||
; CHECK: ldr x18, [sp], #16
|
||||
; CHECK: ret
|
||||
define win64cc i8* @f8(i64 %a0, i64 %a1, i64 %a2, i64 %a3, i64 %a4, i64 %a5, i64 %a6, i64 %a7, ...) nounwind {
|
||||
entry:
|
||||
|
@ -59,12 +61,12 @@ entry:
|
|||
}
|
||||
|
||||
; CHECK-LABEL: f7:
|
||||
; CHECK: sub sp, sp, #32
|
||||
; CHECK: str x18, [sp, #-32]!
|
||||
; CHECK: add x8, sp, #24
|
||||
; CHECK: str x7, [sp, #24]
|
||||
; CHECK: add x0, sp, #24
|
||||
; CHECK: str x8, [sp, #8]
|
||||
; CHECK: add sp, sp, #32
|
||||
; CHECK: ldr x18, [sp], #32
|
||||
; CHECK: ret
|
||||
define win64cc i8* @f7(i64 %a0, i64 %a1, i64 %a2, i64 %a3, i64 %a4, i64 %a5, i64 %a6, ...) nounwind {
|
||||
entry:
|
||||
|
|
|
@ -0,0 +1,26 @@
|
|||
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
||||
|
||||
;; Testing that x18 is backed up and restored, and that x29 (if used) still
|
||||
;; points to the x29,x30 pair on the stack.
|
||||
|
||||
; RUN: llc < %s -mtriple=aarch64-linux-gnu --frame-pointer=non-leaf | FileCheck %s
|
||||
; RUN: llc < %s -mtriple=aarch64-linux-gnu --frame-pointer=non-leaf -mattr=+reserve-x18 | FileCheck %s
|
||||
|
||||
declare dso_local void @other()
|
||||
|
||||
define dso_local win64cc void @func() #0 {
|
||||
; CHECK-LABEL: func:
|
||||
; CHECK: // %bb.0: // %entry
|
||||
; CHECK-NEXT: stp x29, x30, [sp, #-32]! // 16-byte Folded Spill
|
||||
; CHECK-NEXT: str x18, [sp, #16] // 8-byte Folded Spill
|
||||
; CHECK-NEXT: mov x29, sp
|
||||
; CHECK-NEXT: bl other
|
||||
; CHECK-NEXT: ldr x18, [sp, #16] // 8-byte Folded Reload
|
||||
; CHECK-NEXT: ldp x29, x30, [sp], #32 // 16-byte Folded Reload
|
||||
; CHECK-NEXT: ret
|
||||
entry:
|
||||
tail call void @other()
|
||||
ret void
|
||||
}
|
||||
|
||||
attributes #0 = { nounwind }
|
Loading…
Reference in New Issue