2019-06-15 05:33:51 +08:00
|
|
|
//===- P9InstrResources.td - P9 Instruction Resource Defs -*- tablegen -*-==//
|
2016-12-19 21:35:45 +08:00
|
|
|
//
|
2019-01-19 16:50:56 +08:00
|
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
2016-12-19 21:35:45 +08:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
//
|
2019-06-15 01:04:24 +08:00
|
|
|
// This file defines the resources required by P9 instructions. This is part of
|
|
|
|
// the P9 processor model used for instruction scheduling. This file should
|
|
|
|
// contain all the instructions that may be used on Power 9. This is not
|
|
|
|
// just instructions that are new on Power 9 but also instructions that were
|
2018-03-10 05:08:35 +08:00
|
|
|
// available on earlier architectures and are still used in Power 9.
|
2016-12-19 21:35:45 +08:00
|
|
|
//
|
2017-09-23 04:17:25 +08:00
|
|
|
// The makeup of the P9 CPU is modeled as follows:
|
|
|
|
// - Each CPU is made up of two superslices.
|
|
|
|
// - Each superslice is made up of two slices. Therefore, there are 4 slices
|
2019-06-15 01:04:24 +08:00
|
|
|
// for each CPU.
|
2017-09-23 04:17:25 +08:00
|
|
|
// - Up to 6 instructions can be dispatched to each CPU. Three per superslice.
|
|
|
|
// - Each CPU has:
|
|
|
|
// - One CY (Crypto) unit P9_CY_*
|
|
|
|
// - One DFU (Decimal Floating Point and Quad Precision) unit P9_DFU_*
|
|
|
|
// - Two PM (Permute) units. One on each superslice. P9_PM_*
|
|
|
|
// - Two DIV (Fixed Point Divide) units. One on each superslize. P9_DIV_*
|
|
|
|
// - Four ALU (Fixed Point Arithmetic) units. One on each slice. P9_ALU_*
|
|
|
|
// - Four DP (Floating Point) units. One on each slice. P9_DP_*
|
|
|
|
// This also includes fixed point multiply add.
|
|
|
|
// - Four AGEN (Address Generation) units. One for each slice. P9_AGEN_*
|
|
|
|
// - Four Load/Store Queues. P9_LS_*
|
|
|
|
// - Each set of instructions will require a number of these resources.
|
2016-12-19 21:35:45 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// Two cycle ALU vector operation that uses an entire superslice.
|
2018-03-10 05:08:35 +08:00
|
|
|
// Uses both ALU units (the even ALUE and odd ALUO units), two pipelines
|
2019-06-15 01:04:24 +08:00
|
|
|
// (EXECE, EXECO) and 1 dispatch (DISP) to the given superslice.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_ALUE_2C, P9_ALUO_2C, IP_EXECE_1C, IP_EXECO_1C, DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2018-02-24 04:37:10 +08:00
|
|
|
(instregex "VADDU(B|H|W|D)M$"),
|
2018-03-02 00:16:08 +08:00
|
|
|
(instregex "VAND(C)?$"),
|
2018-03-02 22:41:38 +08:00
|
|
|
(instregex "VEXTS(B|H|W)2(D|W)(s)?$"),
|
2018-03-09 00:24:33 +08:00
|
|
|
(instregex "V_SET0(B|H)?$"),
|
2018-03-10 05:08:35 +08:00
|
|
|
(instregex "VS(R|L)(B|H|W|D)$"),
|
|
|
|
(instregex "VSUBU(B|H|W|D)M$"),
|
|
|
|
(instregex "VPOPCNT(B|H)$"),
|
|
|
|
(instregex "VRL(B|H|W|D)$"),
|
|
|
|
(instregex "VSRA(B|H|W|D)$"),
|
|
|
|
(instregex "XV(N)?ABS(D|S)P$"),
|
|
|
|
(instregex "XVCPSGN(D|S)P$"),
|
|
|
|
(instregex "XV(I|X)EXP(D|S)P$"),
|
|
|
|
(instregex "VRL(D|W)(MI|NM)$"),
|
|
|
|
(instregex "VMRG(E|O)W$"),
|
2018-03-09 00:24:33 +08:00
|
|
|
MTVSRDD,
|
2016-12-19 21:35:45 +08:00
|
|
|
VEQV,
|
|
|
|
VNAND,
|
|
|
|
VNEGD,
|
|
|
|
VNEGW,
|
|
|
|
VNOR,
|
|
|
|
VOR,
|
|
|
|
VORC,
|
|
|
|
VSEL,
|
|
|
|
VXOR,
|
|
|
|
XVNEGDP,
|
|
|
|
XVNEGSP,
|
|
|
|
XXLAND,
|
|
|
|
XXLANDC,
|
|
|
|
XXLEQV,
|
2019-08-15 22:32:51 +08:00
|
|
|
XXLEQVOnes,
|
2016-12-19 21:35:45 +08:00
|
|
|
XXLNAND,
|
|
|
|
XXLNOR,
|
|
|
|
XXLOR,
|
|
|
|
XXLORf,
|
|
|
|
XXLORC,
|
|
|
|
XXLXOR,
|
2018-03-09 00:24:33 +08:00
|
|
|
XXLXORdpz,
|
|
|
|
XXLXORspz,
|
|
|
|
XXLXORz,
|
2017-09-23 04:17:25 +08:00
|
|
|
XXSEL,
|
2016-12-19 21:35:45 +08:00
|
|
|
XSABSQP,
|
|
|
|
XSCPSGNQP,
|
|
|
|
XSIEXPQP,
|
|
|
|
XSNABSQP,
|
|
|
|
XSNEGQP,
|
2017-09-23 04:17:25 +08:00
|
|
|
XSXEXPQP
|
|
|
|
)>;
|
|
|
|
|
|
|
|
// Restricted Dispatch ALU operation for 3 cycles. The operation runs on a
|
2019-06-15 01:04:24 +08:00
|
|
|
// single slice. However, since it is Restricted, it requires all 3 dispatches
|
2018-03-10 05:08:35 +08:00
|
|
|
// (DISP) for that superslice.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_ALU_3C, IP_EXEC_1C, DISP_3SLOTS_1C],
|
2017-09-23 04:17:25 +08:00
|
|
|
(instrs
|
2018-03-09 00:24:33 +08:00
|
|
|
(instregex "TABORT(D|W)C(I)?$"),
|
|
|
|
(instregex "MTFSB(0|1)$"),
|
|
|
|
(instregex "MFFSC(D)?RN(I)?$"),
|
2018-02-24 04:37:10 +08:00
|
|
|
(instregex "CMPRB(8)?$"),
|
|
|
|
(instregex "TD(I)?$"),
|
2018-03-10 05:08:35 +08:00
|
|
|
(instregex "TW(I)?$"),
|
|
|
|
(instregex "FCMPU(S|D)$"),
|
|
|
|
(instregex "XSTSTDC(S|D)P$"),
|
|
|
|
FTDIV,
|
|
|
|
FTSQRT,
|
|
|
|
CMPEQB
|
2017-09-23 04:17:25 +08:00
|
|
|
)>;
|
|
|
|
|
|
|
|
// Standard Dispatch ALU operation for 3 cycles. Only one slice used.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_ALU_3C, IP_EXEC_1C, DISP_1C],
|
2017-09-23 04:17:25 +08:00
|
|
|
(instrs
|
2018-02-24 04:37:10 +08:00
|
|
|
(instregex "XSMAX(C|J)?DP$"),
|
|
|
|
(instregex "XSMIN(C|J)?DP$"),
|
|
|
|
(instregex "XSCMP(EQ|EXP|GE|GT|O|U)DP$"),
|
2020-01-07 03:05:12 +08:00
|
|
|
(instregex "CNT(L|T)Z(D|W)(8)?(_rec)?$"),
|
2018-03-10 05:08:35 +08:00
|
|
|
(instregex "POPCNT(D|W)$"),
|
|
|
|
(instregex "CMPB(8)?$"),
|
[PowerPC] Exploit power9 new instruction setb
Check the expected pattens feeding to SELECT_CC like:
(select_cc lhs, rhs, 1, (sext (setcc [lr]hs, [lr]hs, cc2)), cc1)
(select_cc lhs, rhs, -1, (zext (setcc [lr]hs, [lr]hs, cc2)), cc1)
(select_cc lhs, rhs, 0, (select_cc [lr]hs, [lr]hs, 1, -1, cc2), seteq)
(select_cc lhs, rhs, 0, (select_cc [lr]hs, [lr]hs, -1, 1, cc2), seteq)
Further transform the sequence to comparison + setb if hits.
Differential Revision: https://reviews.llvm.org/D53275
llvm-svn: 349445
2018-12-18 15:53:26 +08:00
|
|
|
(instregex "SETB(8)?$"),
|
2017-09-23 04:17:25 +08:00
|
|
|
XSTDIVDP,
|
|
|
|
XSTSQRTDP,
|
|
|
|
XSXSIGDP,
|
2018-02-24 04:37:10 +08:00
|
|
|
XSCVSPDPN,
|
2018-03-10 05:08:35 +08:00
|
|
|
BPERMD
|
2017-09-23 04:17:25 +08:00
|
|
|
)>;
|
|
|
|
|
|
|
|
// Standard Dispatch ALU operation for 2 cycles. Only one slice used.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_ALU_2C, IP_EXEC_1C, DISP_1C],
|
2017-09-23 04:17:25 +08:00
|
|
|
(instrs
|
2018-02-24 04:37:10 +08:00
|
|
|
(instregex "S(L|R)D$"),
|
|
|
|
(instregex "SRAD(I)?$"),
|
2019-07-09 10:55:08 +08:00
|
|
|
(instregex "EXTSWSLI_32_64$"),
|
2018-03-09 00:24:33 +08:00
|
|
|
(instregex "MFV(S)?RD$"),
|
[PowerPC] Support extended mnemonics mffprwz etc.
Summary:
Reported in https://github.com/opencv/opencv/issues/15413.
We have serveral extended mnemonics for Move To/From Vector-Scalar Register Instructions
eg: mffprd,mtfprd etc.
We only support one of them, this patch add the others.
Reviewers: nemanjai, steven.zhang, hfinkel, #powerpc
Reviewed By: hfinkel
Subscribers: wuzish, qcolombet, hiraditya, kbarton, MaskRay, shchenz, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D66963
llvm-svn: 370411
2019-08-30 05:53:59 +08:00
|
|
|
(instregex "MTV(S)?RD$"),
|
|
|
|
(instregex "MTV(S)?RW(A|Z)$"),
|
2018-02-24 04:37:10 +08:00
|
|
|
(instregex "CMP(WI|LWI|W|LW)(8)?$"),
|
2018-03-05 22:34:59 +08:00
|
|
|
(instregex "CMP(L)?D(I)?$"),
|
2019-11-09 06:14:28 +08:00
|
|
|
(instregex "SUBF(I)?C(8)?(O)?$"),
|
2020-01-07 03:05:12 +08:00
|
|
|
(instregex "ANDI(S)?(8)?(_rec)?$"),
|
2019-11-09 06:14:28 +08:00
|
|
|
(instregex "ADDC(8)?(O)?$"),
|
2020-01-07 03:05:12 +08:00
|
|
|
(instregex "ADDIC(8)?(_rec)?$"),
|
|
|
|
(instregex "ADD(8|4)(O)?(_rec)?$"),
|
|
|
|
(instregex "ADD(E|ME|ZE)(8)?(O)?(_rec)?$"),
|
|
|
|
(instregex "SUBF(E|ME|ZE)?(8)?(O)?(_rec)?$"),
|
|
|
|
(instregex "NEG(8)?(O)?(_rec)?$"),
|
2018-02-24 04:37:10 +08:00
|
|
|
(instregex "POPCNTB$"),
|
|
|
|
(instregex "ADD(I|IS)?(8)?$"),
|
|
|
|
(instregex "LI(S)?(8)?$"),
|
2020-01-07 03:05:12 +08:00
|
|
|
(instregex "(X)?OR(I|IS)?(8)?(_rec)?$"),
|
|
|
|
(instregex "NAND(8)?(_rec)?$"),
|
|
|
|
(instregex "AND(C)?(8)?(_rec)?$"),
|
|
|
|
(instregex "NOR(8)?(_rec)?$"),
|
|
|
|
(instregex "OR(C)?(8)?(_rec)?$"),
|
|
|
|
(instregex "EQV(8)?(_rec)?$"),
|
|
|
|
(instregex "EXTS(B|H|W)(8)?(_32)?(_64)?(_rec)?$"),
|
2018-02-24 04:37:10 +08:00
|
|
|
(instregex "ADD(4|8)(TLS)?(_)?$"),
|
2019-11-09 06:14:28 +08:00
|
|
|
(instregex "NEG(8)?(O)?$"),
|
2019-07-23 03:55:33 +08:00
|
|
|
(instregex "ADDI(S)?toc(HA|L)(8)?$"),
|
2018-03-28 01:51:53 +08:00
|
|
|
COPY,
|
2018-03-10 05:08:35 +08:00
|
|
|
MCRF,
|
|
|
|
MCRXRX,
|
|
|
|
XSNABSDP,
|
|
|
|
XSXEXPDP,
|
|
|
|
XSABSDP,
|
|
|
|
XSNEGDP,
|
|
|
|
XSCPSGNDP,
|
|
|
|
MFVSRWZ,
|
[PowerPC] Support extended mnemonics mffprwz etc.
Summary:
Reported in https://github.com/opencv/opencv/issues/15413.
We have serveral extended mnemonics for Move To/From Vector-Scalar Register Instructions
eg: mffprd,mtfprd etc.
We only support one of them, this patch add the others.
Reviewers: nemanjai, steven.zhang, hfinkel, #powerpc
Reviewed By: hfinkel
Subscribers: wuzish, qcolombet, hiraditya, kbarton, MaskRay, shchenz, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D66963
llvm-svn: 370411
2019-08-30 05:53:59 +08:00
|
|
|
MFVRWZ,
|
2019-07-09 10:55:08 +08:00
|
|
|
EXTSWSLI,
|
2018-03-10 05:08:35 +08:00
|
|
|
SRADI_32,
|
|
|
|
RLDIC,
|
|
|
|
RFEBB,
|
|
|
|
LA,
|
|
|
|
TBEGIN,
|
|
|
|
TRECHKPT,
|
|
|
|
NOP,
|
|
|
|
WAIT
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// Restricted Dispatch ALU operation for 2 cycles. The operation runs on a
|
2019-06-15 01:04:24 +08:00
|
|
|
// single slice. However, since it is Restricted, it requires all 3 dispatches
|
|
|
|
// (DISP) for that superslice.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_ALU_2C, IP_EXEC_1C, DISP_3SLOTS_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2018-03-10 05:08:35 +08:00
|
|
|
(instregex "RLDC(L|R)$"),
|
2018-02-24 04:37:10 +08:00
|
|
|
(instregex "RLWIMI(8)?$"),
|
2018-03-10 05:08:35 +08:00
|
|
|
(instregex "RLDIC(L|R)(_32)?(_64)?$"),
|
|
|
|
(instregex "M(F|T)OCRF(8)?$"),
|
2018-03-05 22:34:59 +08:00
|
|
|
(instregex "CR(6)?(UN)?SET$"),
|
|
|
|
(instregex "CR(N)?(OR|AND)(C)?$"),
|
2018-02-24 04:37:10 +08:00
|
|
|
(instregex "S(L|R)W(8)?$"),
|
|
|
|
(instregex "RLW(INM|NM)(8)?$"),
|
|
|
|
(instregex "F(N)?ABS(D|S)$"),
|
|
|
|
(instregex "FNEG(D|S)$"),
|
|
|
|
(instregex "FCPSGN(D|S)$"),
|
|
|
|
(instregex "SRAW(I)?$"),
|
2018-03-10 05:08:35 +08:00
|
|
|
(instregex "ISEL(8)?$"),
|
|
|
|
RLDIMI,
|
|
|
|
XSIEXPDP,
|
|
|
|
FMR,
|
|
|
|
CREQV,
|
|
|
|
CRXOR,
|
|
|
|
TRECLAIM,
|
|
|
|
TSR,
|
|
|
|
TABORT
|
2017-09-23 04:17:25 +08:00
|
|
|
)>;
|
2016-12-19 21:35:45 +08:00
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// Three cycle ALU vector operation that uses an entire superslice.
|
2018-03-10 05:08:35 +08:00
|
|
|
// Uses both ALU units (the even ALUE and odd ALUO units), two pipelines
|
2019-06-15 01:04:24 +08:00
|
|
|
// (EXECE, EXECO) and 1 dispatch (DISP) to the given superslice.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_ALUE_3C, P9_ALUO_3C, IP_EXECE_1C, IP_EXECO_1C, DISP_1C],
|
2017-09-23 04:17:25 +08:00
|
|
|
(instrs
|
2018-03-09 00:24:33 +08:00
|
|
|
(instregex "M(T|F)VSCR$"),
|
2018-03-02 00:16:08 +08:00
|
|
|
(instregex "VCMPNEZ(B|H|W)$"),
|
2018-03-10 05:08:35 +08:00
|
|
|
(instregex "VCMPEQU(B|H|W|D)$"),
|
|
|
|
(instregex "VCMPNE(B|H|W)$"),
|
|
|
|
(instregex "VABSDU(B|H|W)$"),
|
|
|
|
(instregex "VADDU(B|H|W)S$"),
|
|
|
|
(instregex "VAVG(S|U)(B|H|W)$"),
|
2020-01-07 03:05:12 +08:00
|
|
|
(instregex "VCMP(EQ|GE|GT)FP(_rec)?$"),
|
|
|
|
(instregex "VCMPBFP(_rec)?$"),
|
2018-03-10 05:08:35 +08:00
|
|
|
(instregex "VC(L|T)Z(B|H|W|D)$"),
|
|
|
|
(instregex "VADDS(B|H|W)S$"),
|
|
|
|
(instregex "V(MIN|MAX)FP$"),
|
|
|
|
(instregex "V(MIN|MAX)(S|U)(B|H|W|D)$"),
|
2017-09-23 04:17:25 +08:00
|
|
|
VBPERMD,
|
2018-03-02 00:16:08 +08:00
|
|
|
VADDCUW,
|
2017-09-23 04:17:25 +08:00
|
|
|
VPOPCNTW,
|
2016-12-19 21:35:45 +08:00
|
|
|
VPOPCNTD,
|
|
|
|
VPRTYBD,
|
|
|
|
VPRTYBW,
|
|
|
|
VSHASIGMAD,
|
|
|
|
VSHASIGMAW,
|
|
|
|
VSUBSBS,
|
|
|
|
VSUBSHS,
|
|
|
|
VSUBSWS,
|
|
|
|
VSUBUBS,
|
|
|
|
VSUBUHS,
|
|
|
|
VSUBUWS,
|
2017-09-23 04:17:25 +08:00
|
|
|
VSUBCUW,
|
|
|
|
VCMPGTSB,
|
2020-01-07 03:05:12 +08:00
|
|
|
VCMPGTSB_rec,
|
2017-09-23 04:17:25 +08:00
|
|
|
VCMPGTSD,
|
2020-01-07 03:05:12 +08:00
|
|
|
VCMPGTSD_rec,
|
2017-09-23 04:17:25 +08:00
|
|
|
VCMPGTSH,
|
2020-01-07 03:05:12 +08:00
|
|
|
VCMPGTSH_rec,
|
2017-09-23 04:17:25 +08:00
|
|
|
VCMPGTSW,
|
2020-01-07 03:05:12 +08:00
|
|
|
VCMPGTSW_rec,
|
2017-09-23 04:17:25 +08:00
|
|
|
VCMPGTUB,
|
2020-01-07 03:05:12 +08:00
|
|
|
VCMPGTUB_rec,
|
2017-09-23 04:17:25 +08:00
|
|
|
VCMPGTUD,
|
2020-01-07 03:05:12 +08:00
|
|
|
VCMPGTUD_rec,
|
2017-09-23 04:17:25 +08:00
|
|
|
VCMPGTUH,
|
2020-01-07 03:05:12 +08:00
|
|
|
VCMPGTUH_rec,
|
2017-09-23 04:17:25 +08:00
|
|
|
VCMPGTUW,
|
2020-01-07 03:05:12 +08:00
|
|
|
VCMPGTUW_rec,
|
|
|
|
VCMPNEB_rec,
|
|
|
|
VCMPNEH_rec,
|
|
|
|
VCMPNEW_rec,
|
|
|
|
VCMPNEZB_rec,
|
|
|
|
VCMPNEZH_rec,
|
|
|
|
VCMPNEZW_rec,
|
|
|
|
VCMPEQUB_rec,
|
|
|
|
VCMPEQUD_rec,
|
|
|
|
VCMPEQUH_rec,
|
|
|
|
VCMPEQUW_rec,
|
2016-12-19 21:35:45 +08:00
|
|
|
XVCMPEQDP,
|
2020-01-07 03:05:12 +08:00
|
|
|
XVCMPEQDP_rec,
|
2016-12-19 21:35:45 +08:00
|
|
|
XVCMPEQSP,
|
2020-01-07 03:05:12 +08:00
|
|
|
XVCMPEQSP_rec,
|
2016-12-19 21:35:45 +08:00
|
|
|
XVCMPGEDP,
|
2020-01-07 03:05:12 +08:00
|
|
|
XVCMPGEDP_rec,
|
2016-12-19 21:35:45 +08:00
|
|
|
XVCMPGESP,
|
2020-01-07 03:05:12 +08:00
|
|
|
XVCMPGESP_rec,
|
2016-12-19 21:35:45 +08:00
|
|
|
XVCMPGTDP,
|
2020-01-07 03:05:12 +08:00
|
|
|
XVCMPGTDP_rec,
|
2016-12-19 21:35:45 +08:00
|
|
|
XVCMPGTSP,
|
2020-01-07 03:05:12 +08:00
|
|
|
XVCMPGTSP_rec,
|
2016-12-19 21:35:45 +08:00
|
|
|
XVMAXDP,
|
|
|
|
XVMAXSP,
|
|
|
|
XVMINDP,
|
|
|
|
XVMINSP,
|
|
|
|
XVTDIVDP,
|
|
|
|
XVTDIVSP,
|
|
|
|
XVTSQRTDP,
|
|
|
|
XVTSQRTSP,
|
|
|
|
XVTSTDCDP,
|
|
|
|
XVTSTDCSP,
|
|
|
|
XVXSIGDP,
|
|
|
|
XVXSIGSP
|
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// 7 cycle DP vector operation that uses an entire superslice.
|
2019-06-15 01:04:24 +08:00
|
|
|
// Uses both DP units (the even DPE and odd DPO units), two pipelines (EXECE,
|
|
|
|
// EXECO) and all three dispatches (DISP) to the given superslice.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DPE_7C, P9_DPO_7C, IP_EXECE_1C, IP_EXECO_1C, DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
|
|
|
VADDFP,
|
|
|
|
VCTSXS,
|
|
|
|
VCTSXS_0,
|
|
|
|
VCTUXS,
|
|
|
|
VCTUXS_0,
|
|
|
|
VEXPTEFP,
|
|
|
|
VLOGEFP,
|
|
|
|
VMADDFP,
|
|
|
|
VMHADDSHS,
|
|
|
|
VNMSUBFP,
|
|
|
|
VREFP,
|
|
|
|
VRFIM,
|
|
|
|
VRFIN,
|
|
|
|
VRFIP,
|
|
|
|
VRFIZ,
|
|
|
|
VRSQRTEFP,
|
|
|
|
VSUBFP,
|
|
|
|
XVADDDP,
|
|
|
|
XVADDSP,
|
|
|
|
XVCVDPSP,
|
|
|
|
XVCVDPSXDS,
|
|
|
|
XVCVDPSXWS,
|
|
|
|
XVCVDPUXDS,
|
|
|
|
XVCVDPUXWS,
|
|
|
|
XVCVHPSP,
|
|
|
|
XVCVSPDP,
|
|
|
|
XVCVSPHP,
|
|
|
|
XVCVSPSXDS,
|
|
|
|
XVCVSPSXWS,
|
|
|
|
XVCVSPUXDS,
|
|
|
|
XVCVSPUXWS,
|
|
|
|
XVCVSXDDP,
|
|
|
|
XVCVSXDSP,
|
|
|
|
XVCVSXWDP,
|
|
|
|
XVCVSXWSP,
|
|
|
|
XVCVUXDDP,
|
|
|
|
XVCVUXDSP,
|
|
|
|
XVCVUXWDP,
|
|
|
|
XVCVUXWSP,
|
|
|
|
XVMADDADP,
|
|
|
|
XVMADDASP,
|
|
|
|
XVMADDMDP,
|
|
|
|
XVMADDMSP,
|
|
|
|
XVMSUBADP,
|
|
|
|
XVMSUBASP,
|
|
|
|
XVMSUBMDP,
|
|
|
|
XVMSUBMSP,
|
|
|
|
XVMULDP,
|
|
|
|
XVMULSP,
|
|
|
|
XVNMADDADP,
|
|
|
|
XVNMADDASP,
|
|
|
|
XVNMADDMDP,
|
|
|
|
XVNMADDMSP,
|
|
|
|
XVNMSUBADP,
|
|
|
|
XVNMSUBASP,
|
|
|
|
XVNMSUBMDP,
|
|
|
|
XVNMSUBMSP,
|
|
|
|
XVRDPI,
|
|
|
|
XVRDPIC,
|
|
|
|
XVRDPIM,
|
|
|
|
XVRDPIP,
|
|
|
|
XVRDPIZ,
|
|
|
|
XVREDP,
|
|
|
|
XVRESP,
|
|
|
|
XVRSPI,
|
|
|
|
XVRSPIC,
|
|
|
|
XVRSPIM,
|
|
|
|
XVRSPIP,
|
|
|
|
XVRSPIZ,
|
|
|
|
XVRSQRTEDP,
|
|
|
|
XVRSQRTESP,
|
|
|
|
XVSUBDP,
|
|
|
|
XVSUBSP,
|
|
|
|
VCFSX,
|
|
|
|
VCFSX_0,
|
|
|
|
VCFUX,
|
|
|
|
VCFUX_0,
|
|
|
|
VMHRADDSHS,
|
|
|
|
VMLADDUHM,
|
|
|
|
VMSUMMBM,
|
|
|
|
VMSUMSHM,
|
|
|
|
VMSUMSHS,
|
|
|
|
VMSUMUBM,
|
|
|
|
VMSUMUHM,
|
|
|
|
VMSUMUHS,
|
|
|
|
VMULESB,
|
|
|
|
VMULESH,
|
|
|
|
VMULESW,
|
|
|
|
VMULEUB,
|
|
|
|
VMULEUH,
|
|
|
|
VMULEUW,
|
|
|
|
VMULOSB,
|
|
|
|
VMULOSH,
|
|
|
|
VMULOSW,
|
|
|
|
VMULOUB,
|
|
|
|
VMULOUH,
|
|
|
|
VMULOUW,
|
|
|
|
VMULUWM,
|
|
|
|
VSUM2SWS,
|
|
|
|
VSUM4SBS,
|
|
|
|
VSUM4SHS,
|
|
|
|
VSUM4UBS,
|
|
|
|
VSUMSWS
|
|
|
|
)>;
|
|
|
|
|
2018-03-09 00:24:33 +08:00
|
|
|
// 5 cycle Restricted DP operation. One DP unit, one EXEC pipeline and all three
|
2019-06-15 01:04:24 +08:00
|
|
|
// dispatch units for the superslice.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DP_5C, IP_EXEC_1C, DISP_3SLOTS_1C],
|
2018-03-09 00:24:33 +08:00
|
|
|
(instrs
|
2019-02-20 10:30:06 +08:00
|
|
|
(instregex "MADD(HD|HDU|LD|LD8)$"),
|
2019-11-09 06:14:28 +08:00
|
|
|
(instregex "MUL(HD|HW|LD|LI|LI8|LW)(U)?(O)?$")
|
2018-03-09 00:24:33 +08:00
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// 7 cycle Restricted DP operation. One DP unit, one EXEC pipeline and all three
|
2019-06-15 01:04:24 +08:00
|
|
|
// dispatch units for the superslice.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DP_7C, IP_EXEC_1C, DISP_3SLOTS_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2017-09-23 04:17:25 +08:00
|
|
|
FRSP,
|
2018-03-05 22:34:59 +08:00
|
|
|
(instregex "FRI(N|P|Z|M)(D|S)$"),
|
|
|
|
(instregex "FRE(S)?$"),
|
|
|
|
(instregex "FADD(S)?$"),
|
|
|
|
(instregex "FMSUB(S)?$"),
|
|
|
|
(instregex "FMADD(S)?$"),
|
2018-03-10 05:08:35 +08:00
|
|
|
(instregex "FSUB(S)?$"),
|
|
|
|
(instregex "FCFID(U)?(S)?$"),
|
|
|
|
(instregex "FCTID(U)?(Z)?$"),
|
|
|
|
(instregex "FCTIW(U)?(Z)?$"),
|
|
|
|
(instregex "FRSQRTE(S)?$"),
|
2017-09-23 04:17:25 +08:00
|
|
|
FNMADDS,
|
|
|
|
FNMADD,
|
|
|
|
FNMSUBS,
|
|
|
|
FNMSUB,
|
|
|
|
FSELD,
|
|
|
|
FSELS,
|
|
|
|
FMULS,
|
|
|
|
FMUL,
|
2016-12-19 21:35:45 +08:00
|
|
|
XSMADDADP,
|
|
|
|
XSMADDASP,
|
|
|
|
XSMADDMDP,
|
|
|
|
XSMADDMSP,
|
|
|
|
XSMSUBADP,
|
|
|
|
XSMSUBASP,
|
|
|
|
XSMSUBMDP,
|
|
|
|
XSMSUBMSP,
|
|
|
|
XSMULDP,
|
|
|
|
XSMULSP,
|
|
|
|
XSNMADDADP,
|
|
|
|
XSNMADDASP,
|
|
|
|
XSNMADDMDP,
|
|
|
|
XSNMADDMSP,
|
|
|
|
XSNMSUBADP,
|
|
|
|
XSNMSUBASP,
|
|
|
|
XSNMSUBMDP,
|
|
|
|
XSNMSUBMSP
|
|
|
|
)>;
|
|
|
|
|
2018-03-02 00:16:08 +08:00
|
|
|
// 7 cycle Restricted DP operation and one 3 cycle ALU operation.
|
2019-06-15 01:04:24 +08:00
|
|
|
// These operations can be done in parallel. The DP is restricted so we need a
|
|
|
|
// full 4 dispatches.
|
2018-03-05 22:34:59 +08:00
|
|
|
def : InstRW<[P9_DP_7C, P9_ALU_3C, IP_EXEC_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_3SLOTS_1C, DISP_1C],
|
2018-03-05 22:34:59 +08:00
|
|
|
(instrs
|
2020-01-07 03:05:12 +08:00
|
|
|
(instregex "FSEL(D|S)_rec$")
|
2018-03-05 22:34:59 +08:00
|
|
|
)>;
|
|
|
|
|
2018-03-09 00:24:33 +08:00
|
|
|
// 5 Cycle Restricted DP operation and one 2 cycle ALU operation.
|
|
|
|
def : InstRW<[P9_DPOpAndALUOp_7C, IP_EXEC_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_3SLOTS_1C, DISP_1C],
|
2018-03-09 00:24:33 +08:00
|
|
|
(instrs
|
2020-01-07 03:05:12 +08:00
|
|
|
(instregex "MUL(H|L)(D|W)(U)?(O)?_rec$")
|
2018-03-09 00:24:33 +08:00
|
|
|
)>;
|
|
|
|
|
2018-03-05 22:34:59 +08:00
|
|
|
// 7 cycle Restricted DP operation and one 3 cycle ALU operation.
|
2019-06-15 01:04:24 +08:00
|
|
|
// These operations must be done sequentially.The DP is restricted so we need a
|
|
|
|
// full 4 dispatches.
|
2018-03-02 00:16:08 +08:00
|
|
|
def : InstRW<[P9_DPOpAndALU2Op_10C, IP_EXEC_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_3SLOTS_1C, DISP_1C],
|
2017-10-10 21:45:35 +08:00
|
|
|
(instrs
|
2020-01-07 03:05:12 +08:00
|
|
|
(instregex "FRI(N|P|Z|M)(D|S)_rec$"),
|
|
|
|
(instregex "FRE(S)?_rec$"),
|
|
|
|
(instregex "FADD(S)?_rec$"),
|
|
|
|
(instregex "FSUB(S)?_rec$"),
|
|
|
|
(instregex "F(N)?MSUB(S)?_rec$"),
|
|
|
|
(instregex "F(N)?MADD(S)?_rec$"),
|
|
|
|
(instregex "FCFID(U)?(S)?_rec$"),
|
|
|
|
(instregex "FCTID(U)?(Z)?_rec$"),
|
|
|
|
(instregex "FCTIW(U)?(Z)?_rec$"),
|
|
|
|
(instregex "FMUL(S)?_rec$"),
|
|
|
|
(instregex "FRSQRTE(S)?_rec$"),
|
|
|
|
FRSP_rec
|
2017-10-10 21:45:35 +08:00
|
|
|
)>;
|
|
|
|
|
2019-06-04 23:22:23 +08:00
|
|
|
// 7 cycle DP operation. One DP unit, one EXEC pipeline and 1 dispatch units.
|
|
|
|
def : InstRW<[P9_DP_7C, IP_EXEC_1C, DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
|
|
|
XSADDDP,
|
|
|
|
XSADDSP,
|
|
|
|
XSCVDPHP,
|
|
|
|
XSCVDPSP,
|
|
|
|
XSCVDPSXDS,
|
2017-09-23 04:17:25 +08:00
|
|
|
XSCVDPSXDSs,
|
2016-12-19 21:35:45 +08:00
|
|
|
XSCVDPSXWS,
|
|
|
|
XSCVDPUXDS,
|
2017-09-23 04:17:25 +08:00
|
|
|
XSCVDPUXDSs,
|
2016-12-19 21:35:45 +08:00
|
|
|
XSCVDPUXWS,
|
2018-03-09 00:24:33 +08:00
|
|
|
XSCVDPSXWSs,
|
|
|
|
XSCVDPUXWSs,
|
2016-12-19 21:35:45 +08:00
|
|
|
XSCVHPDP,
|
|
|
|
XSCVSPDP,
|
|
|
|
XSCVSXDDP,
|
|
|
|
XSCVSXDSP,
|
|
|
|
XSCVUXDDP,
|
|
|
|
XSCVUXDSP,
|
|
|
|
XSRDPI,
|
|
|
|
XSRDPIC,
|
|
|
|
XSRDPIM,
|
|
|
|
XSRDPIP,
|
|
|
|
XSRDPIZ,
|
|
|
|
XSREDP,
|
|
|
|
XSRESP,
|
|
|
|
XSRSQRTEDP,
|
|
|
|
XSRSQRTESP,
|
|
|
|
XSSUBDP,
|
|
|
|
XSSUBSP,
|
2018-07-05 05:59:16 +08:00
|
|
|
XSCVDPSPN,
|
|
|
|
XSRSP
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// Three Cycle PM operation. Only one PM unit per superslice so we use the whole
|
2019-06-15 01:04:24 +08:00
|
|
|
// superslice. That includes both exec pipelines (EXECO, EXECE) and one
|
|
|
|
// dispatch.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_PM_3C, IP_EXECO_1C, IP_EXECE_1C, DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2018-03-09 00:24:33 +08:00
|
|
|
(instregex "LVS(L|R)$"),
|
|
|
|
(instregex "VSPLTIS(W|H|B)$"),
|
|
|
|
(instregex "VSPLT(W|H|B)(s)?$"),
|
|
|
|
(instregex "V_SETALLONES(B|H)?$"),
|
|
|
|
(instregex "VEXTRACTU(B|H|W)$"),
|
2018-03-10 05:08:35 +08:00
|
|
|
(instregex "VINSERT(B|H|W|D)$"),
|
2018-03-09 00:24:33 +08:00
|
|
|
MFVSRLD,
|
|
|
|
MTVSRWS,
|
2016-12-19 21:35:45 +08:00
|
|
|
VBPERMQ,
|
|
|
|
VCLZLSBB,
|
|
|
|
VCTZLSBB,
|
|
|
|
VEXTRACTD,
|
|
|
|
VEXTUBLX,
|
|
|
|
VEXTUBRX,
|
|
|
|
VEXTUHLX,
|
|
|
|
VEXTUHRX,
|
|
|
|
VEXTUWLX,
|
|
|
|
VEXTUWRX,
|
|
|
|
VGBBD,
|
|
|
|
VMRGHB,
|
|
|
|
VMRGHH,
|
|
|
|
VMRGHW,
|
|
|
|
VMRGLB,
|
|
|
|
VMRGLH,
|
|
|
|
VMRGLW,
|
|
|
|
VPERM,
|
|
|
|
VPERMR,
|
|
|
|
VPERMXOR,
|
|
|
|
VPKPX,
|
|
|
|
VPKSDSS,
|
|
|
|
VPKSDUS,
|
|
|
|
VPKSHSS,
|
|
|
|
VPKSHUS,
|
|
|
|
VPKSWSS,
|
|
|
|
VPKSWUS,
|
|
|
|
VPKUDUM,
|
|
|
|
VPKUDUS,
|
|
|
|
VPKUHUM,
|
|
|
|
VPKUHUS,
|
|
|
|
VPKUWUM,
|
|
|
|
VPKUWUS,
|
|
|
|
VPRTYBQ,
|
|
|
|
VSL,
|
|
|
|
VSLDOI,
|
|
|
|
VSLO,
|
|
|
|
VSLV,
|
|
|
|
VSR,
|
|
|
|
VSRO,
|
|
|
|
VSRV,
|
|
|
|
VUPKHPX,
|
|
|
|
VUPKHSB,
|
|
|
|
VUPKHSH,
|
|
|
|
VUPKHSW,
|
|
|
|
VUPKLPX,
|
|
|
|
VUPKLSB,
|
|
|
|
VUPKLSH,
|
|
|
|
VUPKLSW,
|
|
|
|
XXBRD,
|
|
|
|
XXBRH,
|
|
|
|
XXBRQ,
|
|
|
|
XXBRW,
|
|
|
|
XXEXTRACTUW,
|
|
|
|
XXINSERTW,
|
|
|
|
XXMRGHW,
|
|
|
|
XXMRGLW,
|
|
|
|
XXPERM,
|
|
|
|
XXPERMR,
|
|
|
|
XXSLDWI,
|
2018-08-08 23:20:43 +08:00
|
|
|
XXSLDWIs,
|
2016-12-19 21:35:45 +08:00
|
|
|
XXSPLTIB,
|
|
|
|
XXSPLTW,
|
2017-09-23 04:17:25 +08:00
|
|
|
XXSPLTWs,
|
|
|
|
XXPERMDI,
|
|
|
|
XXPERMDIs,
|
2016-12-19 21:35:45 +08:00
|
|
|
VADDCUQ,
|
|
|
|
VADDECUQ,
|
|
|
|
VADDEUQM,
|
|
|
|
VADDUQM,
|
|
|
|
VMUL10CUQ,
|
|
|
|
VMUL10ECUQ,
|
|
|
|
VMUL10EUQ,
|
|
|
|
VMUL10UQ,
|
|
|
|
VSUBCUQ,
|
|
|
|
VSUBECUQ,
|
|
|
|
VSUBEUQM,
|
|
|
|
VSUBUQM,
|
|
|
|
XSCMPEXPQP,
|
|
|
|
XSCMPOQP,
|
|
|
|
XSCMPUQP,
|
|
|
|
XSTSTDCQP,
|
2018-03-02 00:16:08 +08:00
|
|
|
XSXSIGQP,
|
2020-01-07 03:05:12 +08:00
|
|
|
BCDCFN_rec,
|
|
|
|
BCDCFZ_rec,
|
|
|
|
BCDCPSGN_rec,
|
|
|
|
BCDCTN_rec,
|
|
|
|
BCDCTZ_rec,
|
|
|
|
BCDSETSGN_rec,
|
|
|
|
BCDS_rec,
|
|
|
|
BCDTRUNC_rec,
|
|
|
|
BCDUS_rec,
|
|
|
|
BCDUTRUNC_rec
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// 12 Cycle DFU operation. Only one DFU unit per CPU so we use a whole
|
2019-06-15 01:04:24 +08:00
|
|
|
// superslice. That includes both exec pipelines (EXECO, EXECE) and one
|
|
|
|
// dispatch.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DFU_12C, IP_EXECE_1C, IP_EXECO_1C, DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2020-01-07 03:05:12 +08:00
|
|
|
BCDSR_rec,
|
2016-12-19 21:35:45 +08:00
|
|
|
XSADDQP,
|
|
|
|
XSADDQPO,
|
|
|
|
XSCVDPQP,
|
|
|
|
XSCVQPDP,
|
|
|
|
XSCVQPDPO,
|
|
|
|
XSCVQPSDZ,
|
|
|
|
XSCVQPSWZ,
|
|
|
|
XSCVQPUDZ,
|
|
|
|
XSCVQPUWZ,
|
|
|
|
XSCVSDQP,
|
|
|
|
XSCVUDQP,
|
|
|
|
XSRQPI,
|
2018-03-09 00:24:33 +08:00
|
|
|
XSRQPIX,
|
2016-12-19 21:35:45 +08:00
|
|
|
XSRQPXP,
|
|
|
|
XSSUBQP,
|
|
|
|
XSSUBQPO
|
|
|
|
)>;
|
|
|
|
|
2018-03-02 00:16:08 +08:00
|
|
|
// 23 Cycle DFU operation. Only one DFU unit per CPU so we use a whole
|
2019-06-15 01:04:24 +08:00
|
|
|
// superslice. That includes both exec pipelines (EXECO, EXECE) and one
|
|
|
|
// dispatch.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DFU_23C, IP_EXECE_1C, IP_EXECO_1C, DISP_1C],
|
2018-03-02 00:16:08 +08:00
|
|
|
(instrs
|
2020-01-07 03:05:12 +08:00
|
|
|
BCDCTSQ_rec
|
2018-03-02 00:16:08 +08:00
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// 24 Cycle DFU operation. Only one DFU unit per CPU so we use a whole
|
2019-06-15 01:04:24 +08:00
|
|
|
// superslice. That includes both exec pipelines (EXECO, EXECE) and one
|
|
|
|
// dispatch.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DFU_24C, IP_EXECE_1C, IP_EXECO_1C, DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
|
|
|
XSMADDQP,
|
|
|
|
XSMADDQPO,
|
|
|
|
XSMSUBQP,
|
|
|
|
XSMSUBQPO,
|
|
|
|
XSMULQP,
|
|
|
|
XSMULQPO,
|
|
|
|
XSNMADDQP,
|
|
|
|
XSNMADDQPO,
|
|
|
|
XSNMSUBQP,
|
|
|
|
XSNMSUBQPO
|
|
|
|
)>;
|
|
|
|
|
2018-03-02 00:16:08 +08:00
|
|
|
// 37 Cycle DFU operation. Only one DFU unit per CPU so we use a whole
|
2019-06-15 01:04:24 +08:00
|
|
|
// superslice. That includes both exec pipelines (EXECO, EXECE) and one
|
|
|
|
// dispatch.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DFU_37C, IP_EXECE_1C, IP_EXECO_1C, DISP_1C],
|
2018-03-02 00:16:08 +08:00
|
|
|
(instrs
|
2020-01-07 03:05:12 +08:00
|
|
|
BCDCFSQ_rec
|
2018-03-02 00:16:08 +08:00
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// 58 Cycle DFU operation. Only one DFU unit per CPU so we use a whole
|
2019-06-15 01:04:24 +08:00
|
|
|
// superslice. That includes both exec pipelines (EXECO, EXECE) and one
|
|
|
|
// dispatch.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DFU_58C, IP_EXECE_1C, IP_EXECO_1C, DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
|
|
|
XSDIVQP,
|
|
|
|
XSDIVQPO
|
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// 76 Cycle DFU operation. Only one DFU unit per CPU so we use a whole
|
2019-06-15 01:04:24 +08:00
|
|
|
// superslice. That includes both exec pipelines (EXECO, EXECE) and all three
|
|
|
|
// dispatches.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DFU_76C, IP_EXECE_1C, IP_EXECO_1C, DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
|
|
|
XSSQRTQP,
|
|
|
|
XSSQRTQPO
|
|
|
|
)>;
|
|
|
|
|
2018-03-10 05:08:35 +08:00
|
|
|
// 6 Cycle Load uses a single slice.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_LS_6C, IP_AGEN_1C, DISP_1C],
|
2018-03-09 00:24:33 +08:00
|
|
|
(instrs
|
|
|
|
(instregex "LXVL(L)?")
|
|
|
|
)>;
|
|
|
|
|
2018-03-10 05:08:35 +08:00
|
|
|
// 5 Cycle Load uses a single slice.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_LS_5C, IP_AGEN_1C, DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2018-03-09 00:24:33 +08:00
|
|
|
(instregex "LVE(B|H|W)X$"),
|
|
|
|
(instregex "LVX(L)?"),
|
|
|
|
(instregex "LXSI(B|H)ZX$"),
|
2016-12-19 21:35:45 +08:00
|
|
|
LXSDX,
|
2018-03-09 00:24:33 +08:00
|
|
|
LXVB16X,
|
2016-12-19 21:35:45 +08:00
|
|
|
LXVD2X,
|
2018-03-02 00:16:08 +08:00
|
|
|
LXVWSX,
|
2016-12-19 21:35:45 +08:00
|
|
|
LXSIWZX,
|
|
|
|
LXV,
|
2017-09-23 04:17:25 +08:00
|
|
|
LXVX,
|
|
|
|
LXSD,
|
2017-11-20 22:38:30 +08:00
|
|
|
DFLOADf64,
|
2018-02-24 04:37:10 +08:00
|
|
|
XFLOADf64,
|
|
|
|
LIWZX
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2018-03-10 05:08:35 +08:00
|
|
|
// 4 Cycle Load uses a single slice.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_LS_4C, IP_AGEN_1C, DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2018-03-05 22:34:59 +08:00
|
|
|
(instregex "DCB(F|T|ST)(EP)?$"),
|
|
|
|
(instregex "DCBZ(L)?(EP)?$"),
|
|
|
|
(instregex "DCBTST(EP)?$"),
|
|
|
|
(instregex "CP_COPY(8)?$"),
|
|
|
|
(instregex "CP_PASTE(8)?$"),
|
|
|
|
(instregex "ICBI(EP)?$"),
|
|
|
|
(instregex "ICBT(LS)?$"),
|
|
|
|
(instregex "LBARX(L)?$"),
|
2018-05-28 23:27:58 +08:00
|
|
|
(instregex "LBZ(CIX|8|X|X8|XTLS|XTLS_32)?(_)?$"),
|
|
|
|
(instregex "LD(ARX|ARXL|BRX|CIX|X|XTLS)?(_)?$"),
|
2018-03-09 00:24:33 +08:00
|
|
|
(instregex "LH(A|B)RX(L)?(8)?$"),
|
2018-05-28 23:27:58 +08:00
|
|
|
(instregex "LHZ(8|CIX|X|X8|XTLS|XTLS_32)?(_)?$"),
|
2018-03-09 00:24:33 +08:00
|
|
|
(instregex "LWARX(L)?$"),
|
|
|
|
(instregex "LWBRX(8)?$"),
|
2018-05-28 23:27:58 +08:00
|
|
|
(instregex "LWZ(8|CIX|X|X8|XTLS|XTLS_32)?(_)?$"),
|
2018-03-10 05:08:35 +08:00
|
|
|
CP_ABORT,
|
|
|
|
DARN,
|
|
|
|
EnforceIEIO,
|
|
|
|
ISYNC,
|
|
|
|
MSGSYNC,
|
|
|
|
TLBSYNC,
|
|
|
|
SYNC,
|
2018-03-09 00:24:33 +08:00
|
|
|
LMW,
|
|
|
|
LSWI
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// 4 Cycle Restricted load uses a single slice but the dispatch for the whole
|
2019-06-15 01:04:24 +08:00
|
|
|
// superslice.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_LS_4C, IP_AGEN_1C, DISP_3SLOTS_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2017-09-23 04:17:25 +08:00
|
|
|
LFIWZX,
|
|
|
|
LFDX,
|
|
|
|
LFD
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2018-03-10 05:08:35 +08:00
|
|
|
// Cracked Load Instructions.
|
|
|
|
// Load instructions that can be done in parallel.
|
2018-03-09 00:24:33 +08:00
|
|
|
def : InstRW<[P9_LS_4C, P9_LS_4C, IP_AGEN_1C, IP_AGEN_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_PAIR_1C],
|
2018-03-09 00:24:33 +08:00
|
|
|
(instrs
|
|
|
|
SLBIA,
|
|
|
|
SLBIE,
|
|
|
|
SLBMFEE,
|
|
|
|
SLBMFEV,
|
|
|
|
SLBMTE,
|
|
|
|
TLBIEL
|
|
|
|
)>;
|
|
|
|
|
2018-03-10 05:08:35 +08:00
|
|
|
// Cracked Load Instruction.
|
2018-03-09 00:24:33 +08:00
|
|
|
// Requires Load and ALU pieces totaling 6 cycles. The Load and ALU
|
|
|
|
// operations can be run in parallel.
|
|
|
|
def : InstRW<[P9_LS_4C, P9_ALU_2C, IP_EXEC_1C, IP_AGEN_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_PAIR_1C, DISP_PAIR_1C],
|
|
|
|
(instrs
|
|
|
|
(instregex "L(W|H)ZU(X)?(8)?$")
|
|
|
|
)>;
|
|
|
|
|
|
|
|
// Cracked TEND Instruction.
|
|
|
|
// Requires Load and ALU pieces totaling 6 cycles. The Load and ALU
|
|
|
|
// operations can be run in parallel.
|
|
|
|
def : InstRW<[P9_LS_4C, P9_ALU_2C, IP_EXEC_1C, IP_AGEN_1C,
|
|
|
|
DISP_1C, DISP_1C],
|
2018-03-09 00:24:33 +08:00
|
|
|
(instrs
|
|
|
|
TEND
|
|
|
|
)>;
|
|
|
|
|
2019-06-04 23:22:23 +08:00
|
|
|
|
2018-03-10 05:08:35 +08:00
|
|
|
// Cracked Store Instruction
|
|
|
|
// Consecutive Store and ALU instructions. The store is restricted and requires
|
|
|
|
// three dispatches.
|
2018-03-09 00:24:33 +08:00
|
|
|
def : InstRW<[P9_StoreAndALUOp_3C, IP_EXEC_1C, IP_EXEC_1C, IP_AGEN_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_3SLOTS_1C, DISP_1C],
|
2018-03-09 00:24:33 +08:00
|
|
|
(instrs
|
|
|
|
(instregex "ST(B|H|W|D)CX$")
|
|
|
|
)>;
|
|
|
|
|
2018-03-10 05:08:35 +08:00
|
|
|
// Cracked Load Instruction.
|
|
|
|
// Two consecutive load operations for a total of 8 cycles.
|
|
|
|
def : InstRW<[P9_LoadAndLoadOp_8C, IP_AGEN_1C, IP_AGEN_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_1C, DISP_1C],
|
2018-03-10 05:08:35 +08:00
|
|
|
(instrs
|
|
|
|
LDMX
|
|
|
|
)>;
|
|
|
|
|
2018-03-05 22:34:59 +08:00
|
|
|
// Cracked Load instruction.
|
|
|
|
// Requires consecutive Load and ALU pieces totaling 6 cycles. The Load and ALU
|
2019-06-15 01:04:24 +08:00
|
|
|
// operations cannot be done at the same time and so their latencies are added.
|
2018-03-05 22:34:59 +08:00
|
|
|
def : InstRW<[P9_LoadAndALUOp_6C, IP_EXEC_1C, IP_AGEN_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_1C, DISP_1C],
|
2018-03-05 22:34:59 +08:00
|
|
|
(instrs
|
2018-03-09 00:24:33 +08:00
|
|
|
(instregex "LHA(X)?(8)?$"),
|
2020-01-07 03:05:12 +08:00
|
|
|
(instregex "CP_PASTE(8)?_rec$"),
|
2018-03-09 00:24:33 +08:00
|
|
|
(instregex "LWA(X)?(_32)?$"),
|
|
|
|
TCHECK
|
2018-03-05 22:34:59 +08:00
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// Cracked Restricted Load instruction.
|
|
|
|
// Requires consecutive Load and ALU pieces totaling 6 cycles. The Load and ALU
|
2019-06-15 01:04:24 +08:00
|
|
|
// operations cannot be done at the same time and so their latencies are added.
|
2017-09-23 04:17:25 +08:00
|
|
|
// Full 6 dispatches are required as this is both cracked and restricted.
|
|
|
|
def : InstRW<[P9_LoadAndALUOp_6C, IP_EXEC_1C, IP_AGEN_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_3SLOTS_1C, DISP_3SLOTS_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2018-03-02 00:16:08 +08:00
|
|
|
LFIWAX
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// Cracked Load instruction.
|
|
|
|
// Requires consecutive Load and ALU pieces totaling 7 cycles. The Load and ALU
|
2019-06-15 01:04:24 +08:00
|
|
|
// operations cannot be done at the same time and so their latencies are added.
|
2017-09-23 04:17:25 +08:00
|
|
|
// Full 4 dispatches are required as this is a cracked instruction.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_LoadAndALUOp_7C, IP_AGEN_1C, IP_EXEC_1C, DISP_1C, DISP_1C],
|
2017-09-23 04:17:25 +08:00
|
|
|
(instrs
|
|
|
|
LXSIWAX,
|
2018-03-02 00:16:08 +08:00
|
|
|
LIWAX
|
|
|
|
)>;
|
|
|
|
|
|
|
|
// Cracked Load instruction.
|
|
|
|
// Requires consecutive Load (4 cycles) and ALU (3 cycles) pieces totaling 7
|
|
|
|
// cycles. The Load and ALU operations cannot be done at the same time and so
|
|
|
|
// their latencies are added.
|
|
|
|
// Full 6 dispatches are required as this is a restricted instruction.
|
|
|
|
def : InstRW<[P9_LoadAndALU2Op_7C, IP_AGEN_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_3SLOTS_1C, DISP_3SLOTS_1C],
|
2018-03-02 00:16:08 +08:00
|
|
|
(instrs
|
|
|
|
LFSX,
|
|
|
|
LFS
|
|
|
|
)>;
|
|
|
|
|
|
|
|
// Cracked Load instruction.
|
|
|
|
// Requires consecutive Load and ALU pieces totaling 8 cycles. The Load and ALU
|
2019-06-15 01:04:24 +08:00
|
|
|
// operations cannot be done at the same time and so their latencies are added.
|
2018-03-02 00:16:08 +08:00
|
|
|
// Full 4 dispatches are required as this is a cracked instruction.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_LoadAndALU2Op_8C, IP_AGEN_1C, IP_EXEC_1C, DISP_1C, DISP_1C],
|
2018-03-02 00:16:08 +08:00
|
|
|
(instrs
|
2017-09-23 04:17:25 +08:00
|
|
|
LXSSP,
|
2018-03-02 00:16:08 +08:00
|
|
|
LXSSPX,
|
2017-11-20 22:38:30 +08:00
|
|
|
XFLOADf32,
|
2018-03-02 00:16:08 +08:00
|
|
|
DFLOADf32
|
2017-09-23 04:17:25 +08:00
|
|
|
)>;
|
|
|
|
|
2018-03-09 00:24:33 +08:00
|
|
|
// Cracked 3-Way Load Instruction
|
|
|
|
// Load with two ALU operations that depend on each other
|
|
|
|
def : InstRW<[P9_LoadAndALUOp_6C, P9_ALU_2C, IP_AGEN_1C, IP_EXEC_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_PAIR_1C, DISP_PAIR_1C, DISP_1C],
|
2018-03-09 00:24:33 +08:00
|
|
|
(instrs
|
|
|
|
(instregex "LHAU(X)?(8)?$"),
|
|
|
|
LWAUX
|
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// Cracked Load that requires the PM resource.
|
|
|
|
// Since the Load and the PM cannot be done at the same time the latencies are
|
2019-06-15 01:04:24 +08:00
|
|
|
// added. Requires 8 cycles. Since the PM requires the full superslice we need
|
|
|
|
// both EXECE, EXECO pipelines as well as 1 dispatch for the PM. The Load
|
|
|
|
// requires the remaining 1 dispatch.
|
2017-09-23 04:17:25 +08:00
|
|
|
def : InstRW<[P9_LoadAndPMOp_8C, IP_AGEN_1C, IP_EXECE_1C, IP_EXECO_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_1C, DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2018-03-09 00:24:33 +08:00
|
|
|
LXVH8X,
|
2016-12-19 21:35:45 +08:00
|
|
|
LXVDSX,
|
|
|
|
LXVW4X
|
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// Single slice Restricted store operation. The restricted operation requires
|
2019-06-15 01:04:24 +08:00
|
|
|
// all three dispatches for the superslice.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_LS_1C, IP_EXEC_1C, IP_AGEN_1C, DISP_3SLOTS_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2018-02-24 04:37:10 +08:00
|
|
|
(instregex "STF(S|D|IWX|SX|DX)$"),
|
2018-03-09 00:24:33 +08:00
|
|
|
(instregex "STXS(D|DX|SPX|IWX|IBX|IHX|SP)(v)?$"),
|
|
|
|
(instregex "STW(8)?$"),
|
2018-03-10 05:08:35 +08:00
|
|
|
(instregex "(D|X)FSTORE(f32|f64)$"),
|
|
|
|
(instregex "ST(W|H|D)BRX$"),
|
|
|
|
(instregex "ST(B|H|D)(8)?$"),
|
2018-05-28 23:27:58 +08:00
|
|
|
(instregex "ST(B|W|H|D)(CI)?X(TLS|TLS_32)?(8)?(_)?$"),
|
2018-03-09 00:24:33 +08:00
|
|
|
STIWX,
|
|
|
|
SLBIEG,
|
|
|
|
STMW,
|
|
|
|
STSWI,
|
2018-03-10 05:08:35 +08:00
|
|
|
TLBIE
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2018-03-10 05:08:35 +08:00
|
|
|
// Vector Store Instruction
|
2019-06-15 01:04:24 +08:00
|
|
|
// Requires the whole superslice and therefore requires one dispatch
|
2018-03-10 05:08:35 +08:00
|
|
|
// as well as both the Even and Odd exec pipelines.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_LS_1C, IP_EXECE_1C, IP_EXECO_1C, IP_AGEN_1C, DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2018-03-09 00:24:33 +08:00
|
|
|
(instregex "STVE(B|H|W)X$"),
|
|
|
|
(instregex "STVX(L)?$"),
|
|
|
|
(instregex "STXV(B16X|H8X|W4X|D2X|L|LL|X)?$")
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2018-03-09 00:24:33 +08:00
|
|
|
// 5 Cycle DIV operation. Only one DIV unit per superslice so we use the whole
|
2019-06-04 23:22:23 +08:00
|
|
|
// superslice. That includes both exec pipelines (EXECO, EXECE) and two
|
2018-03-09 00:24:33 +08:00
|
|
|
// dispatches.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DIV_5C, IP_EXECE_1C, IP_EXECO_1C, DISP_EVEN_1C],
|
2018-02-24 04:37:10 +08:00
|
|
|
(instrs
|
2018-03-09 00:24:33 +08:00
|
|
|
(instregex "MTCTR(8)?(loop)?$"),
|
|
|
|
(instregex "MTLR(8)?$")
|
2018-02-24 04:37:10 +08:00
|
|
|
)>;
|
|
|
|
|
|
|
|
// 12 Cycle DIV operation. Only one DIV unit per superslice so we use the whole
|
2019-06-04 23:22:23 +08:00
|
|
|
// superslice. That includes both exec pipelines (EXECO, EXECE) and two
|
2018-02-24 04:37:10 +08:00
|
|
|
// dispatches.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DIV_12C, IP_EXECE_1C, IP_EXECO_1C, DISP_EVEN_1C],
|
2018-02-24 04:37:10 +08:00
|
|
|
(instrs
|
2018-03-02 00:16:08 +08:00
|
|
|
(instregex "M(T|F)VRSAVE(v)?$"),
|
2018-03-09 00:24:33 +08:00
|
|
|
(instregex "M(T|F)PMR$"),
|
|
|
|
(instregex "M(T|F)TB(8)?$"),
|
2018-03-02 00:16:08 +08:00
|
|
|
(instregex "MF(SPR|CTR|LR)(8)?$"),
|
2018-03-09 00:24:33 +08:00
|
|
|
(instregex "M(T|F)MSR(D)?$"),
|
|
|
|
(instregex "MTSPR(8)?$")
|
2018-02-24 04:37:10 +08:00
|
|
|
)>;
|
2016-12-19 21:35:45 +08:00
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// 16 Cycle DIV operation. Only one DIV unit per superslice so we use the whole
|
2019-06-15 01:04:24 +08:00
|
|
|
// superslice. That includes both exec pipelines (EXECO, EXECE) and two
|
|
|
|
// dispatches.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DIV_16C_8, IP_EXECO_1C, IP_EXECE_1C, DISP_EVEN_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
|
|
|
DIVW,
|
2019-11-09 06:14:28 +08:00
|
|
|
DIVWO,
|
2017-09-23 04:17:25 +08:00
|
|
|
DIVWU,
|
2019-11-09 06:14:28 +08:00
|
|
|
DIVWUO,
|
2017-09-23 04:17:25 +08:00
|
|
|
MODSW
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// 24 Cycle DIV operation. Only one DIV unit per superslice so we use the whole
|
2019-06-15 01:04:24 +08:00
|
|
|
// superslice. That includes both exec pipelines (EXECO, EXECE) and two
|
|
|
|
// dispatches.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DIV_24C_8, IP_EXECO_1C, IP_EXECE_1C, DISP_EVEN_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
|
|
|
DIVWE,
|
2019-11-09 06:14:28 +08:00
|
|
|
DIVWEO,
|
2016-12-19 21:35:45 +08:00
|
|
|
DIVD,
|
2019-11-09 06:14:28 +08:00
|
|
|
DIVDO,
|
2016-12-19 21:35:45 +08:00
|
|
|
DIVWEU,
|
2019-11-09 06:14:28 +08:00
|
|
|
DIVWEUO,
|
2017-09-23 04:17:25 +08:00
|
|
|
DIVDU,
|
2019-11-09 06:14:28 +08:00
|
|
|
DIVDUO,
|
2017-09-23 04:17:25 +08:00
|
|
|
MODSD,
|
|
|
|
MODUD,
|
|
|
|
MODUW
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// 40 Cycle DIV operation. Only one DIV unit per superslice so we use the whole
|
2019-06-15 01:04:24 +08:00
|
|
|
// superslice. That includes both exec pipelines (EXECO, EXECE) and all three
|
|
|
|
// dispatches.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DIV_40C_8, IP_EXECO_1C, IP_EXECE_1C, DISP_EVEN_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
|
|
|
DIVDE,
|
2019-11-09 06:14:28 +08:00
|
|
|
DIVDEO,
|
|
|
|
DIVDEU,
|
|
|
|
DIVDEUO
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2018-03-05 22:34:59 +08:00
|
|
|
// Cracked DIV and ALU operation. Requires one full slice for the ALU operation
|
2019-06-15 01:04:24 +08:00
|
|
|
// and one full superslice for the DIV operation since there is only one DIV per
|
|
|
|
// superslice. Latency of DIV plus ALU is 26.
|
2018-03-05 22:34:59 +08:00
|
|
|
def : InstRW<[P9_IntDivAndALUOp_18C_8, IP_EXECE_1C, IP_EXECO_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_EVEN_1C, DISP_1C],
|
2018-03-05 22:34:59 +08:00
|
|
|
(instrs
|
2020-01-07 03:05:12 +08:00
|
|
|
(instregex "DIVW(U)?(O)?_rec$")
|
2018-03-05 22:34:59 +08:00
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// Cracked DIV and ALU operation. Requires one full slice for the ALU operation
|
2019-06-15 01:04:24 +08:00
|
|
|
// and one full superslice for the DIV operation since there is only one DIV per
|
|
|
|
// superslice. Latency of DIV plus ALU is 26.
|
2017-09-23 04:17:25 +08:00
|
|
|
def : InstRW<[P9_IntDivAndALUOp_26C_8, IP_EXECE_1C, IP_EXECO_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_EVEN_1C, DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2020-01-07 03:05:12 +08:00
|
|
|
DIVD_rec,
|
|
|
|
DIVDO_rec,
|
|
|
|
DIVDU_rec,
|
|
|
|
DIVDUO_rec,
|
|
|
|
DIVWE_rec,
|
|
|
|
DIVWEO_rec,
|
|
|
|
DIVWEU_rec,
|
|
|
|
DIVWEUO_rec
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// Cracked DIV and ALU operation. Requires one full slice for the ALU operation
|
2019-06-15 01:04:24 +08:00
|
|
|
// and one full superslice for the DIV operation since there is only one DIV per
|
|
|
|
// superslice. Latency of DIV plus ALU is 42.
|
2017-09-23 04:17:25 +08:00
|
|
|
def : InstRW<[P9_IntDivAndALUOp_42C_8, IP_EXECE_1C, IP_EXECO_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_EVEN_1C, DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2020-01-07 03:05:12 +08:00
|
|
|
DIVDE_rec,
|
|
|
|
DIVDEO_rec,
|
|
|
|
DIVDEU_rec,
|
|
|
|
DIVDEUO_rec
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
|
|
|
// CR access instructions in _BrMCR, IIC_BrMCRX.
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// Cracked, restricted, ALU operations.
|
|
|
|
// Here the two ALU ops can actually be done in parallel and therefore the
|
2019-06-15 01:04:24 +08:00
|
|
|
// latencies are not added together. Otherwise this is like having two
|
|
|
|
// instructions running together on two pipelines and 6 dispatches. ALU ops are
|
|
|
|
// 2 cycles each.
|
2016-12-19 21:35:45 +08:00
|
|
|
def : InstRW<[P9_ALU_2C, P9_ALU_2C, IP_EXEC_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_3SLOTS_1C, DISP_3SLOTS_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
|
|
|
MTCRF,
|
|
|
|
MTCRF8
|
|
|
|
)>;
|
|
|
|
|
2018-03-02 00:16:08 +08:00
|
|
|
// Cracked ALU operations.
|
|
|
|
// Here the two ALU ops can actually be done in parallel and therefore the
|
2019-06-15 01:04:24 +08:00
|
|
|
// latencies are not added together. Otherwise this is like having two
|
|
|
|
// instructions running together on two pipelines and 2 dispatches. ALU ops are
|
|
|
|
// 2 cycles each.
|
2018-03-02 00:16:08 +08:00
|
|
|
def : InstRW<[P9_ALU_2C, P9_ALU_2C, IP_EXEC_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_1C, DISP_1C],
|
2018-03-02 00:16:08 +08:00
|
|
|
(instrs
|
2020-01-07 03:05:12 +08:00
|
|
|
(instregex "ADDC(8)?(O)?_rec$"),
|
|
|
|
(instregex "SUBFC(8)?(O)?_rec$")
|
2018-03-02 00:16:08 +08:00
|
|
|
)>;
|
|
|
|
|
2018-03-05 22:34:59 +08:00
|
|
|
// Cracked ALU operations.
|
|
|
|
// Two ALU ops can be done in parallel.
|
|
|
|
// One is three cycle ALU the ohter is a two cycle ALU.
|
|
|
|
// One of the ALU ops is restricted the other is not so we have a total of
|
|
|
|
// 5 dispatches.
|
|
|
|
def : InstRW<[P9_ALU_2C, P9_ALU_3C, IP_EXEC_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_3SLOTS_1C, DISP_1C],
|
2018-03-05 22:34:59 +08:00
|
|
|
(instrs
|
2020-01-07 03:05:12 +08:00
|
|
|
(instregex "F(N)?ABS(D|S)_rec$"),
|
|
|
|
(instregex "FCPSGN(D|S)_rec$"),
|
|
|
|
(instregex "FNEG(D|S)_rec$"),
|
|
|
|
FMR_rec
|
2018-03-05 22:34:59 +08:00
|
|
|
)>;
|
|
|
|
|
|
|
|
// Cracked ALU operations.
|
2017-09-23 04:17:25 +08:00
|
|
|
// Here the two ALU ops can actually be done in parallel and therefore the
|
2019-06-15 01:04:24 +08:00
|
|
|
// latencies are not added together. Otherwise this is like having two
|
|
|
|
// instructions running together on two pipelines and 2 dispatches.
|
2017-09-23 04:17:25 +08:00
|
|
|
// ALU ops are 3 cycles each.
|
|
|
|
def : InstRW<[P9_ALU_3C, P9_ALU_3C, IP_EXEC_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_1C, DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
|
|
|
MCRFS
|
|
|
|
)>;
|
|
|
|
|
2018-03-09 00:24:33 +08:00
|
|
|
// Cracked Restricted ALU operations.
|
|
|
|
// Here the two ALU ops can actually be done in parallel and therefore the
|
2019-06-15 01:04:24 +08:00
|
|
|
// latencies are not added together. Otherwise this is like having two
|
|
|
|
// instructions running together on two pipelines and 6 dispatches.
|
2018-03-09 00:24:33 +08:00
|
|
|
// ALU ops are 3 cycles each.
|
|
|
|
def : InstRW<[P9_ALU_3C, P9_ALU_3C, IP_EXEC_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_3SLOTS_1C, DISP_3SLOTS_1C],
|
2018-03-09 00:24:33 +08:00
|
|
|
(instrs
|
2020-01-07 03:05:12 +08:00
|
|
|
(instregex "MTFSF(b|_rec)?$"),
|
|
|
|
(instregex "MTFSFI(_rec)?$")
|
2018-03-09 00:24:33 +08:00
|
|
|
)>;
|
|
|
|
|
2018-03-02 22:41:38 +08:00
|
|
|
// Cracked instruction made of two ALU ops.
|
|
|
|
// The two ops cannot be done in parallel.
|
2018-03-09 00:24:33 +08:00
|
|
|
// One of the ALU ops is restricted and takes 3 dispatches.
|
2018-02-24 04:37:10 +08:00
|
|
|
def : InstRW<[P9_ALUOpAndALUOp_4C, IP_EXEC_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_3SLOTS_1C, DISP_1C],
|
2018-02-24 04:37:10 +08:00
|
|
|
(instrs
|
2020-01-07 03:05:12 +08:00
|
|
|
(instregex "RLD(I)?C(R|L)_rec$"),
|
|
|
|
(instregex "RLW(IMI|INM|NM)(8)?_rec$"),
|
|
|
|
(instregex "SLW(8)?_rec$"),
|
|
|
|
(instregex "SRAW(I)?_rec$"),
|
|
|
|
(instregex "SRW(8)?_rec$"),
|
|
|
|
RLDICL_32_rec,
|
|
|
|
RLDIMI_rec
|
2018-03-09 00:24:33 +08:00
|
|
|
)>;
|
|
|
|
|
|
|
|
// Cracked instruction made of two ALU ops.
|
|
|
|
// The two ops cannot be done in parallel.
|
|
|
|
// Both of the ALU ops are restricted and take 3 dispatches.
|
|
|
|
def : InstRW<[P9_ALU2OpAndALU2Op_6C, IP_EXEC_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_3SLOTS_1C, DISP_3SLOTS_1C],
|
2018-03-09 00:24:33 +08:00
|
|
|
(instrs
|
2020-01-07 03:05:12 +08:00
|
|
|
(instregex "MFFS(L|CE|_rec)?$")
|
2018-03-09 00:24:33 +08:00
|
|
|
)>;
|
|
|
|
|
2018-03-10 05:08:35 +08:00
|
|
|
// Cracked ALU instruction composed of three consecutive 2 cycle loads for a
|
|
|
|
// total of 6 cycles. All of the ALU operations are also restricted so each
|
|
|
|
// takes 3 dispatches for a total of 9.
|
2018-03-09 00:24:33 +08:00
|
|
|
def : InstRW<[P9_ALUOpAndALUOpAndALUOp_6C, IP_EXEC_1C, IP_EXEC_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_3SLOTS_1C, DISP_3SLOTS_1C, DISP_3SLOTS_1C],
|
2018-03-09 00:24:33 +08:00
|
|
|
(instrs
|
|
|
|
(instregex "MFCR(8)?$")
|
2018-02-24 04:37:10 +08:00
|
|
|
)>;
|
|
|
|
|
2018-03-02 22:41:38 +08:00
|
|
|
// Cracked instruction made of two ALU ops.
|
|
|
|
// The two ops cannot be done in parallel.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_ALUOpAndALUOp_4C, IP_EXEC_1C, IP_EXEC_1C, DISP_1C, DISP_1C],
|
2018-03-02 22:41:38 +08:00
|
|
|
(instrs
|
2020-01-07 03:05:12 +08:00
|
|
|
(instregex "EXTSWSLI_32_64_rec$"),
|
|
|
|
(instregex "SRAD(I)?_rec$"),
|
|
|
|
EXTSWSLI_rec,
|
|
|
|
SLD_rec,
|
|
|
|
SRD_rec,
|
|
|
|
RLDIC_rec
|
2018-03-02 22:41:38 +08:00
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// 33 Cycle DP Instruction Restricted. Takes one slice and 3 dispatches.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DP_33C_8, IP_EXEC_1C, DISP_3SLOTS_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2017-09-23 04:17:25 +08:00
|
|
|
FDIV
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2018-03-05 22:34:59 +08:00
|
|
|
// 33 Cycle DP Instruction Restricted and Cracked with 3 Cycle ALU.
|
2018-03-02 00:16:08 +08:00
|
|
|
def : InstRW<[P9_DPOpAndALU2Op_36C_8, IP_EXEC_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_3SLOTS_1C, DISP_1C],
|
2017-10-10 21:45:35 +08:00
|
|
|
(instrs
|
2020-01-07 03:05:12 +08:00
|
|
|
FDIV_rec
|
2017-10-10 21:45:35 +08:00
|
|
|
)>;
|
|
|
|
|
2018-03-09 00:24:33 +08:00
|
|
|
// 36 Cycle DP Instruction.
|
2018-03-10 05:08:35 +08:00
|
|
|
// Instruction can be done on a single slice.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DP_36C_10, IP_EXEC_1C, DISP_1C],
|
2018-03-09 00:24:33 +08:00
|
|
|
(instrs
|
|
|
|
XSSQRTDP
|
|
|
|
)>;
|
|
|
|
|
2018-03-05 22:34:59 +08:00
|
|
|
// 36 Cycle DP Instruction Restricted. Takes one slice and 3 dispatches.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DP_36C_10, IP_EXEC_1C, DISP_3SLOTS_1C],
|
2018-03-05 22:34:59 +08:00
|
|
|
(instrs
|
|
|
|
FSQRT
|
|
|
|
)>;
|
|
|
|
|
2018-03-09 00:24:33 +08:00
|
|
|
// 36 Cycle DP Vector Instruction.
|
|
|
|
def : InstRW<[P9_DPE_36C_10, P9_DPO_36C_10, IP_EXECE_1C, IP_EXECO_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_1C],
|
2018-03-09 00:24:33 +08:00
|
|
|
(instrs
|
|
|
|
XVSQRTDP
|
|
|
|
)>;
|
|
|
|
|
|
|
|
// 27 Cycle DP Vector Instruction.
|
|
|
|
def : InstRW<[P9_DPE_27C_10, P9_DPO_27C_10, IP_EXECE_1C, IP_EXECO_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_1C],
|
2018-03-09 00:24:33 +08:00
|
|
|
(instrs
|
|
|
|
XVSQRTSP
|
|
|
|
)>;
|
|
|
|
|
2018-03-05 22:34:59 +08:00
|
|
|
// 36 Cycle DP Instruction Restricted and Cracked with 3 Cycle ALU.
|
|
|
|
def : InstRW<[P9_DPOpAndALU2Op_39C_10, IP_EXEC_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_3SLOTS_1C, DISP_1C],
|
2018-03-05 22:34:59 +08:00
|
|
|
(instrs
|
2020-01-07 03:05:12 +08:00
|
|
|
FSQRT_rec
|
2018-03-05 22:34:59 +08:00
|
|
|
)>;
|
|
|
|
|
2018-03-09 00:24:33 +08:00
|
|
|
// 26 Cycle DP Instruction.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DP_26C_5, IP_EXEC_1C, DISP_1C],
|
2018-03-09 00:24:33 +08:00
|
|
|
(instrs
|
|
|
|
XSSQRTSP
|
|
|
|
)>;
|
|
|
|
|
2018-03-05 22:34:59 +08:00
|
|
|
// 26 Cycle DP Instruction Restricted. Takes one slice and 3 dispatches.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DP_26C_5, IP_EXEC_1C, DISP_3SLOTS_1C],
|
2018-03-05 22:34:59 +08:00
|
|
|
(instrs
|
|
|
|
FSQRTS
|
|
|
|
)>;
|
|
|
|
|
|
|
|
// 26 Cycle DP Instruction Restricted and Cracked with 3 Cycle ALU.
|
|
|
|
def : InstRW<[P9_DPOpAndALU2Op_29C_5, IP_EXEC_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_3SLOTS_1C, DISP_1C],
|
2018-03-05 22:34:59 +08:00
|
|
|
(instrs
|
2020-01-07 03:05:12 +08:00
|
|
|
FSQRTS_rec
|
2018-03-05 22:34:59 +08:00
|
|
|
)>;
|
|
|
|
|
2019-06-15 01:04:24 +08:00
|
|
|
// 33 Cycle DP Instruction. Takes one slice and 1 dispatch.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DP_33C_8, IP_EXEC_1C, DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2017-09-23 04:17:25 +08:00
|
|
|
XSDIVDP
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// 22 Cycle DP Instruction Restricted. Takes one slice and 3 dispatches.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DP_22C_5, IP_EXEC_1C, DISP_3SLOTS_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2017-09-23 04:17:25 +08:00
|
|
|
FDIVS
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2017-10-10 21:45:35 +08:00
|
|
|
// 22 Cycle DP Instruction Restricted and Cracked with 2 Cycle ALU.
|
2018-03-02 00:16:08 +08:00
|
|
|
def : InstRW<[P9_DPOpAndALU2Op_25C_5, IP_EXEC_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_3SLOTS_1C, DISP_1C],
|
2017-10-10 21:45:35 +08:00
|
|
|
(instrs
|
2020-01-07 03:05:12 +08:00
|
|
|
FDIVS_rec
|
2017-10-10 21:45:35 +08:00
|
|
|
)>;
|
|
|
|
|
2019-06-15 01:04:24 +08:00
|
|
|
// 22 Cycle DP Instruction. Takes one slice and 1 dispatch.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_DP_22C_5, IP_EXEC_1C, DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2017-09-23 04:17:25 +08:00
|
|
|
XSDIVSP
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// 24 Cycle DP Vector Instruction. Takes one full superslice.
|
2019-06-04 23:22:23 +08:00
|
|
|
// Includes both EXECE, EXECO pipelines and 1 dispatch for the given
|
2019-06-15 01:04:24 +08:00
|
|
|
// superslice.
|
2017-09-23 04:17:25 +08:00
|
|
|
def : InstRW<[P9_DPE_24C_8, P9_DPO_24C_8, IP_EXECE_1C, IP_EXECO_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2017-09-23 04:17:25 +08:00
|
|
|
XVDIVSP
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// 33 Cycle DP Vector Instruction. Takes one full superslice.
|
2019-06-04 23:22:23 +08:00
|
|
|
// Includes both EXECE, EXECO pipelines and 1 dispatch for the given
|
2019-06-15 01:04:24 +08:00
|
|
|
// superslice.
|
2017-09-23 04:17:25 +08:00
|
|
|
def : InstRW<[P9_DPE_33C_8, P9_DPO_33C_8, IP_EXECE_1C, IP_EXECO_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2017-09-23 04:17:25 +08:00
|
|
|
XVDIVDP
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// Instruction cracked into three pieces. One Load and two ALU operations.
|
|
|
|
// The Load and one of the ALU ops cannot be run at the same time and so the
|
2019-06-15 01:04:24 +08:00
|
|
|
// latencies are added together for 6 cycles. The remainaing ALU is 2 cycles.
|
2017-09-23 04:17:25 +08:00
|
|
|
// Both the load and the ALU that depends on it are restricted and so they take
|
2019-06-15 01:04:24 +08:00
|
|
|
// a total of 7 dispatches. The final 2 dispatches come from the second ALU op.
|
2017-09-23 04:17:25 +08:00
|
|
|
// The two EXEC pipelines are for the 2 ALUs while the AGEN is for the load.
|
2018-03-02 00:16:08 +08:00
|
|
|
def : InstRW<[P9_LoadAndALU2Op_7C, P9_ALU_2C,
|
2016-12-19 21:35:45 +08:00
|
|
|
IP_AGEN_1C, IP_EXEC_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_3SLOTS_1C, DISP_3SLOTS_1C, DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2018-02-24 04:37:10 +08:00
|
|
|
(instregex "LF(SU|SUX)$")
|
|
|
|
)>;
|
|
|
|
|
|
|
|
// Cracked instruction made up of a Store and an ALU. The ALU does not depend on
|
|
|
|
// the store and so it can be run at the same time as the store. The store is
|
|
|
|
// also restricted.
|
|
|
|
def : InstRW<[P9_LS_1C, P9_ALU_2C, IP_AGEN_1C, IP_EXEC_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_3SLOTS_1C, DISP_1C],
|
2018-02-24 04:37:10 +08:00
|
|
|
(instrs
|
2018-03-09 00:24:33 +08:00
|
|
|
(instregex "STF(S|D)U(X)?$"),
|
|
|
|
(instregex "ST(B|H|W|D)U(X)?(8)?$")
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2018-03-05 22:34:59 +08:00
|
|
|
// Cracked instruction made up of a Load and an ALU. The ALU does not depend on
|
|
|
|
// the load and so it can be run at the same time as the load.
|
|
|
|
def : InstRW<[P9_LS_4C, P9_ALU_2C, IP_AGEN_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_PAIR_1C, DISP_PAIR_1C],
|
2018-03-05 22:34:59 +08:00
|
|
|
(instrs
|
|
|
|
(instregex "LBZU(X)?(8)?$"),
|
|
|
|
(instregex "LDU(X)?$")
|
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// Cracked instruction made up of a Load and an ALU. The ALU does not depend on
|
2019-06-15 01:04:24 +08:00
|
|
|
// the load and so it can be run at the same time as the load. The load is also
|
|
|
|
// restricted. 3 dispatches are from the restricted load while the other two
|
|
|
|
// are from the ALU. The AGEN pipeline is from the load and the EXEC pipeline
|
|
|
|
// is required for the ALU.
|
2017-09-23 04:17:25 +08:00
|
|
|
def : InstRW<[P9_LS_4C, P9_ALU_2C, IP_AGEN_1C, IP_EXEC_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
DISP_3SLOTS_1C, DISP_1C],
|
2016-12-19 21:35:45 +08:00
|
|
|
(instrs
|
2018-02-24 04:37:10 +08:00
|
|
|
(instregex "LF(DU|DUX)$")
|
2016-12-19 21:35:45 +08:00
|
|
|
)>;
|
|
|
|
|
2017-09-23 04:17:25 +08:00
|
|
|
// Crypto Instructions
|
|
|
|
|
|
|
|
// 6 Cycle CY operation. Only one CY unit per CPU so we use a whole
|
2019-06-15 01:04:24 +08:00
|
|
|
// superslice. That includes both exec pipelines (EXECO, EXECE) and one
|
|
|
|
// dispatch.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_CY_6C, IP_EXECO_1C, IP_EXECE_1C, DISP_1C],
|
2017-09-23 04:17:25 +08:00
|
|
|
(instrs
|
2018-03-02 00:16:08 +08:00
|
|
|
(instregex "VPMSUM(B|H|W|D)$"),
|
|
|
|
(instregex "V(N)?CIPHER(LAST)?$"),
|
|
|
|
VSBOX
|
|
|
|
)>;
|
|
|
|
|
|
|
|
// Branch Instructions
|
|
|
|
|
|
|
|
// Two Cycle Branch
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_BR_2C, DISP_BR_1C],
|
2018-03-02 00:16:08 +08:00
|
|
|
(instrs
|
|
|
|
(instregex "BCCCTR(L)?(8)?$"),
|
|
|
|
(instregex "BCCL(A|R|RL)?$"),
|
|
|
|
(instregex "BCCTR(L)?(8)?(n)?$"),
|
|
|
|
(instregex "BD(N)?Z(8|A|Am|Ap|m|p)?$"),
|
|
|
|
(instregex "BD(N)?ZL(A|Am|Ap|R|R8|RL|RLm|RLp|Rm|Rp|m|p)?$"),
|
2019-05-25 04:54:35 +08:00
|
|
|
(instregex "BL(_TLS|_NOP)?$"),
|
2018-03-02 00:16:08 +08:00
|
|
|
(instregex "BL8(_TLS|_NOP|_NOP_TLS|_TLS_)?$"),
|
|
|
|
(instregex "BLA(8|8_NOP)?$"),
|
|
|
|
(instregex "BLR(8|L)?$"),
|
|
|
|
(instregex "TAILB(A)?(8)?$"),
|
|
|
|
(instregex "TAILBCTR(8)?$"),
|
|
|
|
(instregex "gBC(A|Aat|CTR|CTRL|L|LA|LAat|LR|LRL|Lat|at)?$"),
|
|
|
|
(instregex "BCLR(L)?(n)?$"),
|
|
|
|
(instregex "BCTR(L)?(8)?$"),
|
|
|
|
B,
|
|
|
|
BA,
|
|
|
|
BC,
|
|
|
|
BCC,
|
|
|
|
BCCA,
|
|
|
|
BCL,
|
|
|
|
BCLalways,
|
|
|
|
BCLn,
|
|
|
|
BCTRL8_LDinto_toc,
|
[PowerPC] Add Support for indirect calls on AIX.
Extends the desciptor-based indirect call support for 32-bit codegen,
and enables indirect calls for AIX.
In-depth Description:
In a function descriptor based ABI, a function pointer points at a
descriptor structure as opposed to the function's entry point. The
descriptor takes the form of 3 pointers: 1 for the function's entry
point, 1 for the TOC anchor of the module containing the function
definition, and 1 for the environment pointer:
struct FunctionDescriptor {
void *EntryPoint;
void *TOCAnchor;
void *EnvironmentPointer;
};
An indirect call has several steps of loading the the information from
the descriptor into the proper registers for setting up the call. Namely
it has to:
1) Save the caller's TOC pointer into the TOC save slot in the linkage
area, and then load the callee's TOC pointer into the TOC register
(GPR 2 on AIX).
2) Load the function descriptor's entry point into the count register.
3) Load the environment pointer into the environment pointer register
(GPR 11 on AIX).
4) Perform the call by branching on count register.
5) Restore the caller's TOC pointer after returning from the indirect call.
A couple important caveats to the above:
- There is no way to directly load a value from memory into the count register.
Instead we populate the count register by loading the entry point address into
a gpr and then moving the gpr to the count register.
- The TOC restore has to come immediately after the branch on count register
instruction (i.e., the 1st instruction executed after we return from the
call). This is an implementation limitation. We could, in theory, schedule
the restore elsewhere as long as no uses of the TOC pointer fall in between
the call and the restore; however, to keep it simple, we insert a pseudo
instruction that represents both the indirect branch instruction and the
load instruction that restores the caller's TOC from the linkage area. As
they flow through the compiler as a single pseudo instruction, nothing can be
inserted between them and the caller's TOC is then valid at any use.
Differtential Revision: https://reviews.llvm.org/D70724
2019-12-14 03:34:11 +08:00
|
|
|
BCTRL_LWZinto_toc,
|
2018-03-02 00:16:08 +08:00
|
|
|
BCn,
|
|
|
|
CTRL_DEP
|
|
|
|
)>;
|
|
|
|
|
|
|
|
// Five Cycle Branch with a 2 Cycle ALU Op
|
|
|
|
// Operations must be done consecutively and not in parallel.
|
2019-06-04 23:22:23 +08:00
|
|
|
def : InstRW<[P9_BROpAndALUOp_7C, IP_EXEC_1C, DISP_BR_1C, DISP_1C],
|
2018-03-02 00:16:08 +08:00
|
|
|
(instrs
|
|
|
|
ADDPCIS
|
2017-09-23 04:17:25 +08:00
|
|
|
)>;
|
2018-02-24 04:37:10 +08:00
|
|
|
|
2018-03-10 05:08:35 +08:00
|
|
|
// Special Extracted Instructions For Atomics
|
2018-03-05 22:34:59 +08:00
|
|
|
|
|
|
|
// Atomic Load
|
|
|
|
def : InstRW<[P9_LS_1C, P9_LS_1C, P9_LS_4C, P9_LS_4C, P9_LS_4C,
|
|
|
|
IP_EXEC_1C, IP_EXEC_1C, IP_AGEN_1C, IP_AGEN_1C, IP_AGEN_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
IP_AGEN_1C, IP_AGEN_1C, DISP_1C, DISP_3SLOTS_1C,
|
|
|
|
DISP_3SLOTS_1C, DISP_1C, DISP_1C, DISP_1C],
|
2018-03-05 22:34:59 +08:00
|
|
|
(instrs
|
2018-03-09 00:24:33 +08:00
|
|
|
(instregex "L(D|W)AT$")
|
|
|
|
)>;
|
|
|
|
|
|
|
|
// Atomic Store
|
|
|
|
def : InstRW<[P9_LS_1C, P9_LS_4C, P9_LS_4C, IP_EXEC_1C, IP_AGEN_1C, IP_AGEN_1C,
|
2019-06-04 23:22:23 +08:00
|
|
|
IP_AGEN_1C, DISP_1C, DISP_3SLOTS_1C, DISP_1C],
|
2018-03-09 00:24:33 +08:00
|
|
|
(instrs
|
|
|
|
(instregex "ST(D|W)AT$")
|
2018-03-05 22:34:59 +08:00
|
|
|
)>;
|
|
|
|
|
2018-03-02 22:41:38 +08:00
|
|
|
// Signal Processing Engine (SPE) Instructions
|
|
|
|
// These instructions are not supported on Power 9
|
|
|
|
def : InstRW<[],
|
|
|
|
(instrs
|
|
|
|
BRINC,
|
|
|
|
EVABS,
|
|
|
|
EVEQV,
|
|
|
|
EVMRA,
|
|
|
|
EVNAND,
|
|
|
|
EVNEG,
|
|
|
|
(instregex "EVADD(I)?W$"),
|
|
|
|
(instregex "EVADD(SM|SS|UM|US)IAAW$"),
|
|
|
|
(instregex "EVAND(C)?$"),
|
|
|
|
(instregex "EVCMP(EQ|GTS|GTU|LTS|LTU)$"),
|
|
|
|
(instregex "EVCNTL(S|Z)W$"),
|
|
|
|
(instregex "EVDIVW(S|U)$"),
|
|
|
|
(instregex "EVEXTS(B|H)$"),
|
|
|
|
(instregex "EVLD(H|W|D)(X)?$"),
|
|
|
|
(instregex "EVLHH(E|OS|OU)SPLAT(X)?$"),
|
|
|
|
(instregex "EVLWHE(X)?$"),
|
|
|
|
(instregex "EVLWHO(S|U)(X)?$"),
|
|
|
|
(instregex "EVLW(H|W)SPLAT(X)?$"),
|
|
|
|
(instregex "EVMERGE(HI|LO|HILO|LOHI)$"),
|
|
|
|
(instregex "EVMHEG(S|U)M(F|I)A(A|N)$"),
|
|
|
|
(instregex "EVMHES(M|S)(F|I)(A|AA|AAW|ANW)?$"),
|
|
|
|
(instregex "EVMHEU(M|S)I(A|AA|AAW|ANW)?$"),
|
|
|
|
(instregex "EVMHOG(U|S)M(F|I)A(A|N)$"),
|
|
|
|
(instregex "EVMHOS(M|S)(F|I)(A|AA|AAW|ANW)?$"),
|
|
|
|
(instregex "EVMHOU(M|S)I(A|AA|ANW|AAW)?$"),
|
|
|
|
(instregex "EVMWHS(M|S)(F|FA|I|IA)$"),
|
|
|
|
(instregex "EVMWHUMI(A)?$"),
|
|
|
|
(instregex "EVMWLS(M|S)IA(A|N)W$"),
|
|
|
|
(instregex "EVMWLU(M|S)I(A|AA|AAW|ANW)?$"),
|
|
|
|
(instregex "EVMWSM(F|I)(A|AA|AN)?$"),
|
|
|
|
(instregex "EVMWSSF(A|AA|AN)?$"),
|
|
|
|
(instregex "EVMWUMI(A|AA|AN)?$"),
|
|
|
|
(instregex "EV(N|X)?OR(C)?$"),
|
|
|
|
(instregex "EVR(LW|LWI|NDW)$"),
|
|
|
|
(instregex "EVSLW(I)?$"),
|
|
|
|
(instregex "EVSPLAT(F)?I$"),
|
|
|
|
(instregex "EVSRW(I)?(S|U)$"),
|
|
|
|
(instregex "EVST(DD|DH|DW|WHE|WHO|WWE|WWO)(X)?$"),
|
|
|
|
(instregex "EVSUBF(S|U)(M|S)IAAW$"),
|
|
|
|
(instregex "EVSUB(I)?FW$")
|
|
|
|
)> { let Unsupported = 1; }
|
2018-03-02 00:16:08 +08:00
|
|
|
|
2018-03-02 22:41:38 +08:00
|
|
|
// General Instructions without scheduling support.
|
2018-02-24 04:37:10 +08:00
|
|
|
def : InstRW<[],
|
|
|
|
(instrs
|
2018-03-02 00:16:08 +08:00
|
|
|
(instregex "(H)?RFI(D)?$"),
|
2018-03-05 22:34:59 +08:00
|
|
|
(instregex "DSS(ALL)?$"),
|
|
|
|
(instregex "DST(ST)?(T)?(64)?$"),
|
|
|
|
(instregex "ICBL(C|Q)$"),
|
2018-03-09 00:24:33 +08:00
|
|
|
(instregex "L(W|H|B)EPX$"),
|
|
|
|
(instregex "ST(W|H|B)EPX$"),
|
|
|
|
(instregex "(L|ST)FDEPX$"),
|
|
|
|
(instregex "M(T|F)SR(IN)?$"),
|
|
|
|
(instregex "M(T|F)DCR$"),
|
|
|
|
(instregex "NOP_GT_PWR(6|7)$"),
|
|
|
|
(instregex "TLB(IA|IVAX|SX|SX2|SX2D|LD|LI|RE|RE2|WE|WE2)$"),
|
|
|
|
(instregex "WRTEE(I)?$"),
|
2018-03-02 00:16:08 +08:00
|
|
|
ATTN,
|
|
|
|
CLRBHRB,
|
|
|
|
MFBHRBE,
|
2018-03-09 00:24:33 +08:00
|
|
|
MBAR,
|
|
|
|
MSYNC,
|
|
|
|
SLBSYNC,
|
2020-01-07 03:05:12 +08:00
|
|
|
SLBFEE_rec,
|
2018-03-02 00:16:08 +08:00
|
|
|
NAP,
|
2018-03-09 00:24:33 +08:00
|
|
|
STOP,
|
|
|
|
TRAP,
|
2018-03-02 00:16:08 +08:00
|
|
|
RFCI,
|
|
|
|
RFDI,
|
|
|
|
RFMCI,
|
|
|
|
SC,
|
2018-03-05 22:34:59 +08:00
|
|
|
DCBA,
|
|
|
|
DCBI,
|
|
|
|
DCCCI,
|
2018-03-09 00:24:33 +08:00
|
|
|
ICCCI
|
2018-02-24 04:37:10 +08:00
|
|
|
)> { let Unsupported = 1; }
|