2013-03-07 17:03:52 +08:00
|
|
|
//===---- AMDCallingConv.td - Calling Conventions for Radeon GPUs ---------===//
|
|
|
|
//
|
2019-01-19 16:50:56 +08:00
|
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
2013-03-07 17:03:52 +08:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
//
|
|
|
|
// This describes the calling conventions for the AMD Radeon GPUs.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
// Inversion of CCIfInReg
|
|
|
|
class CCIfNotInReg<CCAction A> : CCIf<"!ArgFlags.isInReg()", A> {}
|
2017-05-18 05:56:25 +08:00
|
|
|
class CCIfExtend<CCAction A>
|
|
|
|
: CCIf<"ArgFlags.isSExt() || ArgFlags.isZExt()", A>;
|
2013-03-07 17:03:52 +08:00
|
|
|
|
|
|
|
// Calling convention for SI
|
|
|
|
def CC_SI : CallingConv<[
|
|
|
|
|
2018-08-02 03:57:34 +08:00
|
|
|
CCIfInReg<CCIfType<[f32, i32, f16, v2i16, v2f16] , CCAssignToReg<[
|
2013-03-07 17:03:52 +08:00
|
|
|
SGPR0, SGPR1, SGPR2, SGPR3, SGPR4, SGPR5, SGPR6, SGPR7,
|
2013-09-12 10:55:14 +08:00
|
|
|
SGPR8, SGPR9, SGPR10, SGPR11, SGPR12, SGPR13, SGPR14, SGPR15,
|
2016-01-13 19:46:48 +08:00
|
|
|
SGPR16, SGPR17, SGPR18, SGPR19, SGPR20, SGPR21, SGPR22, SGPR23,
|
|
|
|
SGPR24, SGPR25, SGPR26, SGPR27, SGPR28, SGPR29, SGPR30, SGPR31,
|
2019-05-15 22:43:55 +08:00
|
|
|
SGPR32, SGPR33, SGPR34, SGPR35, SGPR36, SGPR37, SGPR38, SGPR39,
|
|
|
|
SGPR40, SGPR41, SGPR42, SGPR43, SGPR44, SGPR45, SGPR46, SGPR47,
|
|
|
|
SGPR48, SGPR49, SGPR50, SGPR51, SGPR52, SGPR53, SGPR54, SGPR55,
|
|
|
|
SGPR56, SGPR57, SGPR58, SGPR59, SGPR60, SGPR61, SGPR62, SGPR63,
|
|
|
|
SGPR64, SGPR65, SGPR66, SGPR67, SGPR68, SGPR69, SGPR70, SGPR71,
|
|
|
|
SGPR72, SGPR73, SGPR74, SGPR75, SGPR76, SGPR77, SGPR78, SGPR79,
|
|
|
|
SGPR80, SGPR81, SGPR82, SGPR83, SGPR84, SGPR85, SGPR86, SGPR87,
|
|
|
|
SGPR88, SGPR89, SGPR90, SGPR91, SGPR92, SGPR93, SGPR94, SGPR95,
|
|
|
|
SGPR96, SGPR97, SGPR98, SGPR99, SGPR100, SGPR101, SGPR102, SGPR103,
|
|
|
|
SGPR104, SGPR105
|
2013-03-07 17:03:52 +08:00
|
|
|
]>>>,
|
|
|
|
|
2016-01-13 19:46:48 +08:00
|
|
|
// 32*4 + 4 is the minimum for a fetch shader consumer with 32 inputs.
|
2018-08-02 03:57:34 +08:00
|
|
|
CCIfNotInReg<CCIfType<[f32, i32, f16, v2i16, v2f16] , CCAssignToReg<[
|
2013-03-07 17:03:52 +08:00
|
|
|
VGPR0, VGPR1, VGPR2, VGPR3, VGPR4, VGPR5, VGPR6, VGPR7,
|
|
|
|
VGPR8, VGPR9, VGPR10, VGPR11, VGPR12, VGPR13, VGPR14, VGPR15,
|
|
|
|
VGPR16, VGPR17, VGPR18, VGPR19, VGPR20, VGPR21, VGPR22, VGPR23,
|
2016-01-13 19:46:48 +08:00
|
|
|
VGPR24, VGPR25, VGPR26, VGPR27, VGPR28, VGPR29, VGPR30, VGPR31,
|
|
|
|
VGPR32, VGPR33, VGPR34, VGPR35, VGPR36, VGPR37, VGPR38, VGPR39,
|
|
|
|
VGPR40, VGPR41, VGPR42, VGPR43, VGPR44, VGPR45, VGPR46, VGPR47,
|
|
|
|
VGPR48, VGPR49, VGPR50, VGPR51, VGPR52, VGPR53, VGPR54, VGPR55,
|
|
|
|
VGPR56, VGPR57, VGPR58, VGPR59, VGPR60, VGPR61, VGPR62, VGPR63,
|
|
|
|
VGPR64, VGPR65, VGPR66, VGPR67, VGPR68, VGPR69, VGPR70, VGPR71,
|
|
|
|
VGPR72, VGPR73, VGPR74, VGPR75, VGPR76, VGPR77, VGPR78, VGPR79,
|
|
|
|
VGPR80, VGPR81, VGPR82, VGPR83, VGPR84, VGPR85, VGPR86, VGPR87,
|
|
|
|
VGPR88, VGPR89, VGPR90, VGPR91, VGPR92, VGPR93, VGPR94, VGPR95,
|
|
|
|
VGPR96, VGPR97, VGPR98, VGPR99, VGPR100, VGPR101, VGPR102, VGPR103,
|
|
|
|
VGPR104, VGPR105, VGPR106, VGPR107, VGPR108, VGPR109, VGPR110, VGPR111,
|
|
|
|
VGPR112, VGPR113, VGPR114, VGPR115, VGPR116, VGPR117, VGPR118, VGPR119,
|
|
|
|
VGPR120, VGPR121, VGPR122, VGPR123, VGPR124, VGPR125, VGPR126, VGPR127,
|
|
|
|
VGPR128, VGPR129, VGPR130, VGPR131, VGPR132, VGPR133, VGPR134, VGPR135
|
2017-04-07 01:37:27 +08:00
|
|
|
]>>>
|
2013-06-04 01:40:11 +08:00
|
|
|
]>;
|
2013-03-07 17:03:52 +08:00
|
|
|
|
2017-05-18 05:56:25 +08:00
|
|
|
def RetCC_SI_Shader : CallingConv<[
|
2016-01-14 01:23:04 +08:00
|
|
|
CCIfType<[i32] , CCAssignToReg<[
|
|
|
|
SGPR0, SGPR1, SGPR2, SGPR3, SGPR4, SGPR5, SGPR6, SGPR7,
|
|
|
|
SGPR8, SGPR9, SGPR10, SGPR11, SGPR12, SGPR13, SGPR14, SGPR15,
|
|
|
|
SGPR16, SGPR17, SGPR18, SGPR19, SGPR20, SGPR21, SGPR22, SGPR23,
|
|
|
|
SGPR24, SGPR25, SGPR26, SGPR27, SGPR28, SGPR29, SGPR30, SGPR31,
|
2019-05-15 22:43:55 +08:00
|
|
|
SGPR32, SGPR33, SGPR34, SGPR35, SGPR36, SGPR37, SGPR38, SGPR39,
|
|
|
|
SGPR40, SGPR41, SGPR42, SGPR43, SGPR44, SGPR45, SGPR46, SGPR47,
|
|
|
|
SGPR48, SGPR49, SGPR50, SGPR51, SGPR52, SGPR53, SGPR54, SGPR55,
|
|
|
|
SGPR56, SGPR57, SGPR58, SGPR59, SGPR60, SGPR61, SGPR62, SGPR63,
|
|
|
|
SGPR64, SGPR65, SGPR66, SGPR67, SGPR68, SGPR69, SGPR70, SGPR71,
|
|
|
|
SGPR72, SGPR73, SGPR74, SGPR75, SGPR76, SGPR77, SGPR78, SGPR79,
|
|
|
|
SGPR80, SGPR81, SGPR82, SGPR83, SGPR84, SGPR85, SGPR86, SGPR87,
|
|
|
|
SGPR88, SGPR89, SGPR90, SGPR91, SGPR92, SGPR93, SGPR94, SGPR95,
|
|
|
|
SGPR96, SGPR97, SGPR98, SGPR99, SGPR100, SGPR101, SGPR102, SGPR103,
|
|
|
|
SGPR104, SGPR105
|
2016-01-14 01:23:04 +08:00
|
|
|
]>>,
|
|
|
|
|
|
|
|
// 32*4 + 4 is the minimum for a fetch shader with 32 outputs.
|
2018-08-02 03:57:34 +08:00
|
|
|
CCIfType<[f32, f16, v2f16] , CCAssignToReg<[
|
2016-01-14 01:23:04 +08:00
|
|
|
VGPR0, VGPR1, VGPR2, VGPR3, VGPR4, VGPR5, VGPR6, VGPR7,
|
|
|
|
VGPR8, VGPR9, VGPR10, VGPR11, VGPR12, VGPR13, VGPR14, VGPR15,
|
|
|
|
VGPR16, VGPR17, VGPR18, VGPR19, VGPR20, VGPR21, VGPR22, VGPR23,
|
|
|
|
VGPR24, VGPR25, VGPR26, VGPR27, VGPR28, VGPR29, VGPR30, VGPR31,
|
|
|
|
VGPR32, VGPR33, VGPR34, VGPR35, VGPR36, VGPR37, VGPR38, VGPR39,
|
|
|
|
VGPR40, VGPR41, VGPR42, VGPR43, VGPR44, VGPR45, VGPR46, VGPR47,
|
|
|
|
VGPR48, VGPR49, VGPR50, VGPR51, VGPR52, VGPR53, VGPR54, VGPR55,
|
|
|
|
VGPR56, VGPR57, VGPR58, VGPR59, VGPR60, VGPR61, VGPR62, VGPR63,
|
|
|
|
VGPR64, VGPR65, VGPR66, VGPR67, VGPR68, VGPR69, VGPR70, VGPR71,
|
|
|
|
VGPR72, VGPR73, VGPR74, VGPR75, VGPR76, VGPR77, VGPR78, VGPR79,
|
|
|
|
VGPR80, VGPR81, VGPR82, VGPR83, VGPR84, VGPR85, VGPR86, VGPR87,
|
|
|
|
VGPR88, VGPR89, VGPR90, VGPR91, VGPR92, VGPR93, VGPR94, VGPR95,
|
|
|
|
VGPR96, VGPR97, VGPR98, VGPR99, VGPR100, VGPR101, VGPR102, VGPR103,
|
|
|
|
VGPR104, VGPR105, VGPR106, VGPR107, VGPR108, VGPR109, VGPR110, VGPR111,
|
|
|
|
VGPR112, VGPR113, VGPR114, VGPR115, VGPR116, VGPR117, VGPR118, VGPR119,
|
|
|
|
VGPR120, VGPR121, VGPR122, VGPR123, VGPR124, VGPR125, VGPR126, VGPR127,
|
|
|
|
VGPR128, VGPR129, VGPR130, VGPR131, VGPR132, VGPR133, VGPR134, VGPR135
|
|
|
|
]>>
|
|
|
|
]>;
|
|
|
|
|
2017-05-18 05:56:25 +08:00
|
|
|
def CSR_AMDGPU_VGPRs_24_255 : CalleeSavedRegs<
|
|
|
|
(sequence "VGPR%u", 24, 255)
|
|
|
|
>;
|
|
|
|
|
|
|
|
def CSR_AMDGPU_VGPRs_32_255 : CalleeSavedRegs<
|
|
|
|
(sequence "VGPR%u", 32, 255)
|
|
|
|
>;
|
|
|
|
|
2019-05-22 07:23:05 +08:00
|
|
|
def CSR_AMDGPU_SGPRs_32_105 : CalleeSavedRegs<
|
|
|
|
(sequence "SGPR%u", 32, 105)
|
2017-05-18 05:56:25 +08:00
|
|
|
>;
|
|
|
|
|
2019-07-04 07:32:29 +08:00
|
|
|
// Just to get the regmask, not for calling convention purposes.
|
|
|
|
def CSR_AMDGPU_AllVGPRs : CalleeSavedRegs<
|
|
|
|
(sequence "VGPR%u", 0, 255)
|
|
|
|
>;
|
|
|
|
|
|
|
|
// Just to get the regmask, not for calling convention purposes.
|
|
|
|
def CSR_AMDGPU_AllAllocatableSRegs : CalleeSavedRegs<
|
|
|
|
(add (sequence "SGPR%u", 0, 105), VCC_LO, VCC_HI)
|
|
|
|
>;
|
|
|
|
|
2017-05-18 05:56:25 +08:00
|
|
|
def CSR_AMDGPU_HighRegs : CalleeSavedRegs<
|
2019-05-22 07:23:05 +08:00
|
|
|
(add CSR_AMDGPU_VGPRs_32_255, CSR_AMDGPU_SGPRs_32_105)
|
2017-05-18 05:56:25 +08:00
|
|
|
>;
|
|
|
|
|
|
|
|
// Calling convention for leaf functions
|
|
|
|
def CC_AMDGPU_Func : CallingConv<[
|
|
|
|
CCIfByVal<CCPassByVal<4, 4>>,
|
|
|
|
CCIfType<[i1], CCPromoteToType<i32>>,
|
|
|
|
CCIfType<[i1, i8, i16], CCIfExtend<CCPromoteToType<i32>>>,
|
|
|
|
CCIfType<[i32, f32, i16, f16, v2i16, v2f16, i1], CCAssignToReg<[
|
|
|
|
VGPR0, VGPR1, VGPR2, VGPR3, VGPR4, VGPR5, VGPR6, VGPR7,
|
|
|
|
VGPR8, VGPR9, VGPR10, VGPR11, VGPR12, VGPR13, VGPR14, VGPR15,
|
|
|
|
VGPR16, VGPR17, VGPR18, VGPR19, VGPR20, VGPR21, VGPR22, VGPR23,
|
|
|
|
VGPR24, VGPR25, VGPR26, VGPR27, VGPR28, VGPR29, VGPR30, VGPR31]>>,
|
|
|
|
CCIfType<[i32, f32, v2i16, v2f16, i16, f16, i1], CCAssignToStack<4, 4>>,
|
|
|
|
CCIfType<[i64, f64, v2i32, v2f32], CCAssignToStack<8, 4>>,
|
2019-03-21 20:01:21 +08:00
|
|
|
CCIfType<[v3i32, v3f32], CCAssignToStack<12, 4>>,
|
2017-05-18 05:56:25 +08:00
|
|
|
CCIfType<[v4i32, v4f32, v2i64, v2f64], CCAssignToStack<16, 4>>,
|
2019-03-22 18:11:21 +08:00
|
|
|
CCIfType<[v5i32, v5f32], CCAssignToStack<20, 4>>,
|
2017-05-18 05:56:25 +08:00
|
|
|
CCIfType<[v8i32, v8f32], CCAssignToStack<32, 4>>,
|
|
|
|
CCIfType<[v16i32, v16f32], CCAssignToStack<64, 4>>
|
|
|
|
]>;
|
|
|
|
|
|
|
|
// Calling convention for leaf functions
|
|
|
|
def RetCC_AMDGPU_Func : CallingConv<[
|
|
|
|
CCIfType<[i1], CCPromoteToType<i32>>,
|
|
|
|
CCIfType<[i1, i16], CCIfExtend<CCPromoteToType<i32>>>,
|
|
|
|
CCIfType<[i32, f32, i16, f16, v2i16, v2f16], CCAssignToReg<[
|
|
|
|
VGPR0, VGPR1, VGPR2, VGPR3, VGPR4, VGPR5, VGPR6, VGPR7,
|
|
|
|
VGPR8, VGPR9, VGPR10, VGPR11, VGPR12, VGPR13, VGPR14, VGPR15,
|
|
|
|
VGPR16, VGPR17, VGPR18, VGPR19, VGPR20, VGPR21, VGPR22, VGPR23,
|
|
|
|
VGPR24, VGPR25, VGPR26, VGPR27, VGPR28, VGPR29, VGPR30, VGPR31]>>,
|
|
|
|
]>;
|
|
|
|
|
2013-03-07 17:03:52 +08:00
|
|
|
def CC_AMDGPU : CallingConv<[
|
2018-07-12 04:59:01 +08:00
|
|
|
CCIf<"static_cast<const GCNSubtarget&>"
|
2014-08-07 02:45:26 +08:00
|
|
|
"(State.getMachineFunction().getSubtarget()).getGeneration() >= "
|
|
|
|
"AMDGPUSubtarget::SOUTHERN_ISLANDS",
|
|
|
|
CCDelegateTo<CC_SI>>,
|
2018-07-12 04:59:01 +08:00
|
|
|
CCIf<"static_cast<const GCNSubtarget&>"
|
2017-08-02 03:54:18 +08:00
|
|
|
"(State.getMachineFunction().getSubtarget()).getGeneration() >= "
|
|
|
|
"AMDGPUSubtarget::SOUTHERN_ISLANDS && State.getCallingConv() == CallingConv::C",
|
AMDGPU: Separate R600 and GCN TableGen files
Summary:
We now have two sets of generated TableGen files, one for R600 and one
for GCN, so each sub-target now has its own tables of instructions,
registers, ISel patterns, etc. This should help reduce compile time
since each sub-target now only has to consider information that
is specific to itself. This will also help prevent the R600
sub-target from slowing down new features for GCN, like disassembler
support, GlobalISel, etc.
Reviewers: arsenm, nhaehnle, jvesely
Reviewed By: arsenm
Subscribers: MatzeB, kzhuravl, wdng, mgorny, yaxunl, dstuttard, tpr, t-tye, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D46365
llvm-svn: 335942
2018-06-29 07:47:12 +08:00
|
|
|
CCDelegateTo<CC_AMDGPU_Func>>
|
2013-03-07 17:03:52 +08:00
|
|
|
]>;
|