2012-02-28 15:46:26 +08:00
|
|
|
//===-- MipsISelLowering.cpp - Mips DAG Lowering Implementation -----------===//
|
2007-06-06 15:42:06 +08:00
|
|
|
//
|
|
|
|
// The LLVM Compiler Infrastructure
|
|
|
|
//
|
2007-12-30 04:36:04 +08:00
|
|
|
// This file is distributed under the University of Illinois Open Source
|
|
|
|
// License. See LICENSE.TXT for details.
|
2007-06-06 15:42:06 +08:00
|
|
|
//
|
2011-04-16 05:51:11 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
2007-06-06 15:42:06 +08:00
|
|
|
//
|
|
|
|
// This file defines the interfaces that Mips uses to lower LLVM code into a
|
|
|
|
// selection DAG.
|
|
|
|
//
|
2011-04-16 05:51:11 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
2007-06-06 15:42:06 +08:00
|
|
|
#include "MipsISelLowering.h"
|
2012-12-04 00:50:05 +08:00
|
|
|
#include "InstPrinter/MipsInstPrinter.h"
|
|
|
|
#include "MCTargetDesc/MipsBaseInfo.h"
|
2014-11-07 22:24:31 +08:00
|
|
|
#include "MipsCCState.h"
|
2007-08-28 13:08:16 +08:00
|
|
|
#include "MipsMachineFunction.h"
|
2012-12-04 00:50:05 +08:00
|
|
|
#include "MipsSubtarget.h"
|
2007-06-06 15:42:06 +08:00
|
|
|
#include "MipsTargetMachine.h"
|
2009-08-13 14:28:06 +08:00
|
|
|
#include "MipsTargetObjectFile.h"
|
2012-10-20 05:47:33 +08:00
|
|
|
#include "llvm/ADT/Statistic.h"
|
2013-11-12 20:56:01 +08:00
|
|
|
#include "llvm/ADT/StringSwitch.h"
|
2007-06-06 15:42:06 +08:00
|
|
|
#include "llvm/CodeGen/CallingConvLower.h"
|
|
|
|
#include "llvm/CodeGen/MachineFrameInfo.h"
|
|
|
|
#include "llvm/CodeGen/MachineFunction.h"
|
|
|
|
#include "llvm/CodeGen/MachineInstrBuilder.h"
|
2014-09-03 06:28:02 +08:00
|
|
|
#include "llvm/CodeGen/MachineJumpTableInfo.h"
|
2007-12-31 12:13:23 +08:00
|
|
|
#include "llvm/CodeGen/MachineRegisterInfo.h"
|
2015-07-30 20:39:33 +08:00
|
|
|
#include "llvm/CodeGen/FunctionLoweringInfo.h"
|
2007-06-06 15:42:06 +08:00
|
|
|
#include "llvm/CodeGen/SelectionDAGISel.h"
|
|
|
|
#include "llvm/CodeGen/ValueTypes.h"
|
2013-01-02 19:36:10 +08:00
|
|
|
#include "llvm/IR/CallingConv.h"
|
|
|
|
#include "llvm/IR/DerivedTypes.h"
|
|
|
|
#include "llvm/IR/GlobalVariable.h"
|
2012-10-20 05:47:33 +08:00
|
|
|
#include "llvm/Support/CommandLine.h"
|
2007-06-06 15:42:06 +08:00
|
|
|
#include "llvm/Support/Debug.h"
|
2009-07-12 04:10:48 +08:00
|
|
|
#include "llvm/Support/ErrorHandling.h"
|
2012-04-21 23:31:45 +08:00
|
|
|
#include "llvm/Support/raw_ostream.h"
|
2013-08-14 08:21:25 +08:00
|
|
|
#include <cctype>
|
2012-04-21 23:31:45 +08:00
|
|
|
|
2007-06-06 15:42:06 +08:00
|
|
|
using namespace llvm;
|
|
|
|
|
2014-04-22 10:41:26 +08:00
|
|
|
#define DEBUG_TYPE "mips-lower"
|
|
|
|
|
2012-10-20 05:47:33 +08:00
|
|
|
STATISTIC(NumTailCalls, "Number of tail calls");
|
|
|
|
|
2012-11-22 04:21:11 +08:00
|
|
|
// Hidden boolean option "-mxgot", off unless given on the command line. Its
// help text describes it as enabling a GOT larger than 64k.
static cl::opt<bool> LargeGOT("mxgot", cl::Hidden, cl::init(false),
                              cl::desc("MIPS: Enable GOT larger than 64k."));
|
|
|
|
|
2013-05-21 02:07:43 +08:00
|
|
|
// Hidden boolean option "-mno-check-zero-division", off unless given on the
// command line. Per its help text, setting it suppresses the trap on integer
// division by zero.
static cl::opt<bool>
    NoZeroDivCheck("mno-check-zero-division", cl::Hidden, cl::init(false),
                   cl::desc("MIPS: Don't trap on integer division by zero."));
|
|
|
|
|
2014-04-04 13:16:06 +08:00
|
|
|
// The eight 64-bit double-precision registers D12_64 .. D19_64, listed in
// ascending order.
// NOTE(review): presumably the FP argument registers for the 64-bit calling
// conventions -- the users of this table are outside this excerpt; confirm.
static const MCPhysReg Mips64DPRegs[8] = {
    Mips::D12_64,
    Mips::D13_64,
    Mips::D14_64,
    Mips::D15_64,
    Mips::D16_64,
    Mips::D17_64,
    Mips::D18_64,
    Mips::D19_64,
};
|
|
|
|
|
2012-02-28 15:46:26 +08:00
|
|
|
// If I is a shifted mask, set the size (Size) and the first bit of the
|
2011-08-19 04:07:42 +08:00
|
|
|
// mask (Pos), and return true.
|
2012-02-28 15:46:26 +08:00
|
|
|
// For example, if I is 0x003ff800, (Pos, Size) = (11, 11).
|
2013-03-12 08:16:36 +08:00
|
|
|
static bool isShiftedMask(uint64_t I, uint64_t &Pos, uint64_t &Size) {
|
2011-12-06 05:26:34 +08:00
|
|
|
if (!isShiftedMask_64(I))
|
2013-10-08 03:33:02 +08:00
|
|
|
return false;
|
2011-08-17 10:05:42 +08:00
|
|
|
|
2015-02-12 23:35:40 +08:00
|
|
|
Size = countPopulation(I);
|
2013-05-25 06:23:49 +08:00
|
|
|
Pos = countTrailingZeros(I);
|
2011-08-19 04:07:42 +08:00
|
|
|
return true;
|
2011-08-17 10:05:42 +08:00
|
|
|
}
|
|
|
|
|
2013-03-13 08:54:29 +08:00
|
|
|
// Returns a register node of type Ty that refers to the global base register
// recorded in the current function's MipsFunctionInfo.
SDValue MipsTargetLowering::getGlobalReg(SelectionDAG &DAG, EVT Ty) const {
  auto *MipsFI = DAG.getMachineFunction().getInfo<MipsFunctionInfo>();
  const auto GlobalBaseReg = MipsFI->getGlobalBaseReg();
  return DAG.getRegister(GlobalBaseReg, Ty);
}
|
|
|
|
|
2013-09-28 03:51:35 +08:00
|
|
|
// Builds the target global-address node for N: same global, type Ty, a zero
// offset, and the target flag Flag. The debug location is taken from N.
SDValue MipsTargetLowering::getTargetNode(GlobalAddressSDNode *N, EVT Ty,
                                          SelectionDAG &DAG,
                                          unsigned Flag) const {
  const auto *Global = N->getGlobal();
  SDLoc DL(N);
  return DAG.getTargetGlobalAddress(Global, DL, Ty, /*offset=*/0, Flag);
}
|
2013-09-25 08:30:25 +08:00
|
|
|
|
2013-09-28 03:51:35 +08:00
|
|
|
// Builds the target external-symbol node for N: same symbol name, type Ty,
// and the target flag Flag.
SDValue MipsTargetLowering::getTargetNode(ExternalSymbolSDNode *N, EVT Ty,
                                          SelectionDAG &DAG,
                                          unsigned Flag) const {
  const char *SymbolName = N->getSymbol();
  return DAG.getTargetExternalSymbol(SymbolName, Ty, Flag);
}
|
|
|
|
|
2013-09-28 03:51:35 +08:00
|
|
|
// Builds the target block-address node for N: same block address, type Ty,
// a zero offset, and the target flag Flag.
SDValue MipsTargetLowering::getTargetNode(BlockAddressSDNode *N, EVT Ty,
                                          SelectionDAG &DAG,
                                          unsigned Flag) const {
  const auto *BlockAddr = N->getBlockAddress();
  return DAG.getTargetBlockAddress(BlockAddr, Ty, /*Offset=*/0, Flag);
}
|
|
|
|
|
2013-09-28 03:51:35 +08:00
|
|
|
// Builds the target jump-table node for N: same jump-table index, type Ty,
// and the target flag Flag.
SDValue MipsTargetLowering::getTargetNode(JumpTableSDNode *N, EVT Ty,
                                          SelectionDAG &DAG,
                                          unsigned Flag) const {
  const auto JumpTableIndex = N->getIndex();
  return DAG.getTargetJumpTable(JumpTableIndex, Ty, Flag);
}
|
|
|
|
|
2013-09-28 03:51:35 +08:00
|
|
|
// Builds the target constant-pool node for N, carrying over its constant
// value, alignment and offset, with type Ty and the target flag Flag.
SDValue MipsTargetLowering::getTargetNode(ConstantPoolSDNode *N, EVT Ty,
                                          SelectionDAG &DAG,
                                          unsigned Flag) const {
  const auto *PoolValue = N->getConstVal();
  const auto PoolAlignment = N->getAlignment();
  const auto PoolOffset = N->getOffset();
  return DAG.getTargetConstantPool(PoolValue, Ty, PoolAlignment, PoolOffset,
                                   Flag);
}
|
|
|
|
|
2009-07-28 11:13:23 +08:00
|
|
|
const char *MipsTargetLowering::getTargetNodeName(unsigned Opcode) const {
|
2015-05-08 05:33:59 +08:00
|
|
|
switch ((MipsISD::NodeType)Opcode) {
|
|
|
|
case MipsISD::FIRST_NUMBER: break;
|
2011-05-24 05:13:59 +08:00
|
|
|
case MipsISD::JmpLink: return "MipsISD::JmpLink";
|
2012-10-20 04:59:39 +08:00
|
|
|
case MipsISD::TailCall: return "MipsISD::TailCall";
|
2017-01-27 19:36:52 +08:00
|
|
|
case MipsISD::Highest: return "MipsISD::Highest";
|
|
|
|
case MipsISD::Higher: return "MipsISD::Higher";
|
2011-05-24 05:13:59 +08:00
|
|
|
case MipsISD::Hi: return "MipsISD::Hi";
|
|
|
|
case MipsISD::Lo: return "MipsISD::Lo";
|
2017-01-27 19:36:52 +08:00
|
|
|
case MipsISD::GotHi: return "MipsISD::GotHi";
|
2011-05-24 05:13:59 +08:00
|
|
|
case MipsISD::GPRel: return "MipsISD::GPRel";
|
2011-05-31 10:53:58 +08:00
|
|
|
case MipsISD::ThreadPointer: return "MipsISD::ThreadPointer";
|
2011-05-24 05:13:59 +08:00
|
|
|
case MipsISD::Ret: return "MipsISD::Ret";
|
2015-10-26 20:38:43 +08:00
|
|
|
case MipsISD::ERet: return "MipsISD::ERet";
|
2013-01-30 08:26:49 +08:00
|
|
|
case MipsISD::EH_RETURN: return "MipsISD::EH_RETURN";
|
2011-05-24 05:13:59 +08:00
|
|
|
case MipsISD::FPBrcond: return "MipsISD::FPBrcond";
|
|
|
|
case MipsISD::FPCmp: return "MipsISD::FPCmp";
|
|
|
|
case MipsISD::CMovFP_T: return "MipsISD::CMovFP_T";
|
|
|
|
case MipsISD::CMovFP_F: return "MipsISD::CMovFP_F";
|
2013-05-17 05:17:15 +08:00
|
|
|
case MipsISD::TruncIntFP: return "MipsISD::TruncIntFP";
|
2013-10-15 09:12:50 +08:00
|
|
|
case MipsISD::MFHI: return "MipsISD::MFHI";
|
|
|
|
case MipsISD::MFLO: return "MipsISD::MFLO";
|
|
|
|
case MipsISD::MTLOHI: return "MipsISD::MTLOHI";
|
2013-03-30 09:14:04 +08:00
|
|
|
case MipsISD::Mult: return "MipsISD::Mult";
|
|
|
|
case MipsISD::Multu: return "MipsISD::Multu";
|
2011-05-24 05:13:59 +08:00
|
|
|
case MipsISD::MAdd: return "MipsISD::MAdd";
|
|
|
|
case MipsISD::MAddu: return "MipsISD::MAddu";
|
|
|
|
case MipsISD::MSub: return "MipsISD::MSub";
|
|
|
|
case MipsISD::MSubu: return "MipsISD::MSubu";
|
|
|
|
case MipsISD::DivRem: return "MipsISD::DivRem";
|
|
|
|
case MipsISD::DivRemU: return "MipsISD::DivRemU";
|
2013-03-30 09:14:04 +08:00
|
|
|
case MipsISD::DivRem16: return "MipsISD::DivRem16";
|
|
|
|
case MipsISD::DivRemU16: return "MipsISD::DivRemU16";
|
2011-05-24 05:13:59 +08:00
|
|
|
case MipsISD::BuildPairF64: return "MipsISD::BuildPairF64";
|
|
|
|
case MipsISD::ExtractElementF64: return "MipsISD::ExtractElementF64";
|
2011-12-13 06:38:19 +08:00
|
|
|
case MipsISD::Wrapper: return "MipsISD::Wrapper";
|
2015-05-08 05:33:59 +08:00
|
|
|
case MipsISD::DynAlloc: return "MipsISD::DynAlloc";
|
2011-07-20 07:30:50 +08:00
|
|
|
case MipsISD::Sync: return "MipsISD::Sync";
|
2011-08-17 10:05:42 +08:00
|
|
|
case MipsISD::Ext: return "MipsISD::Ext";
|
|
|
|
case MipsISD::Ins: return "MipsISD::Ins";
|
[Mips] Add support to match more patterns for DEXT and CINS
This patch adds support for recognizing more patterns to match to DEXT and
CINS instructions.
It finds cases where multiple instructions could be replaced with a single
DEXT or CINS instruction.
For example, for the following:
define i64 @dext_and32(i64 zeroext %a) {
entry:
%and = and i64 %a, 4294967295
ret i64 %and
}
instead of generating:
0000000000000088 <dext_and32>:
88: 64010001 daddiu at,zero,1
8c: 0001083c dsll32 at,at,0x0
90: 6421ffff daddiu at,at,-1
94: 03e00008 jr ra
98: 00811024 and v0,a0,at
9c: 00000000 nop
the following gets generated:
0000000000000068 <dext_and32>:
68: 03e00008 jr ra
6c: 7c82f803 dext v0,a0,0x0,0x20
Cases that are covered:
DEXT:
1. and $src, mask where mask > 0xffff
2. zext $src zero extend from i32 to i64
CINS:
1. and (shl $src, pos), mask
2. shl (and $src, mask), pos
3. zext (shl $src, pos) zero extend from i32 to i64
Patch by Violeta Vukobrat.
Differential Revision: https://reviews.llvm.org/D30464
llvm-svn: 297832
2017-03-15 21:10:08 +08:00
|
|
|
case MipsISD::CIns: return "MipsISD::CIns";
|
2012-06-02 08:03:12 +08:00
|
|
|
case MipsISD::LWL: return "MipsISD::LWL";
|
|
|
|
case MipsISD::LWR: return "MipsISD::LWR";
|
|
|
|
case MipsISD::SWL: return "MipsISD::SWL";
|
|
|
|
case MipsISD::SWR: return "MipsISD::SWR";
|
|
|
|
case MipsISD::LDL: return "MipsISD::LDL";
|
|
|
|
case MipsISD::LDR: return "MipsISD::LDR";
|
|
|
|
case MipsISD::SDL: return "MipsISD::SDL";
|
|
|
|
case MipsISD::SDR: return "MipsISD::SDR";
|
2012-09-22 07:52:47 +08:00
|
|
|
case MipsISD::EXTP: return "MipsISD::EXTP";
|
|
|
|
case MipsISD::EXTPDP: return "MipsISD::EXTPDP";
|
|
|
|
case MipsISD::EXTR_S_H: return "MipsISD::EXTR_S_H";
|
|
|
|
case MipsISD::EXTR_W: return "MipsISD::EXTR_W";
|
|
|
|
case MipsISD::EXTR_R_W: return "MipsISD::EXTR_R_W";
|
|
|
|
case MipsISD::EXTR_RS_W: return "MipsISD::EXTR_RS_W";
|
|
|
|
case MipsISD::SHILO: return "MipsISD::SHILO";
|
|
|
|
case MipsISD::MTHLIP: return "MipsISD::MTHLIP";
|
2015-05-08 05:33:59 +08:00
|
|
|
case MipsISD::MULSAQ_S_W_PH: return "MipsISD::MULSAQ_S_W_PH";
|
|
|
|
case MipsISD::MAQ_S_W_PHL: return "MipsISD::MAQ_S_W_PHL";
|
|
|
|
case MipsISD::MAQ_S_W_PHR: return "MipsISD::MAQ_S_W_PHR";
|
|
|
|
case MipsISD::MAQ_SA_W_PHL: return "MipsISD::MAQ_SA_W_PHL";
|
|
|
|
case MipsISD::MAQ_SA_W_PHR: return "MipsISD::MAQ_SA_W_PHR";
|
|
|
|
case MipsISD::DPAU_H_QBL: return "MipsISD::DPAU_H_QBL";
|
|
|
|
case MipsISD::DPAU_H_QBR: return "MipsISD::DPAU_H_QBR";
|
|
|
|
case MipsISD::DPSU_H_QBL: return "MipsISD::DPSU_H_QBL";
|
|
|
|
case MipsISD::DPSU_H_QBR: return "MipsISD::DPSU_H_QBR";
|
|
|
|
case MipsISD::DPAQ_S_W_PH: return "MipsISD::DPAQ_S_W_PH";
|
|
|
|
case MipsISD::DPSQ_S_W_PH: return "MipsISD::DPSQ_S_W_PH";
|
|
|
|
case MipsISD::DPAQ_SA_L_W: return "MipsISD::DPAQ_SA_L_W";
|
|
|
|
case MipsISD::DPSQ_SA_L_W: return "MipsISD::DPSQ_SA_L_W";
|
|
|
|
case MipsISD::DPA_W_PH: return "MipsISD::DPA_W_PH";
|
|
|
|
case MipsISD::DPS_W_PH: return "MipsISD::DPS_W_PH";
|
|
|
|
case MipsISD::DPAQX_S_W_PH: return "MipsISD::DPAQX_S_W_PH";
|
|
|
|
case MipsISD::DPAQX_SA_W_PH: return "MipsISD::DPAQX_SA_W_PH";
|
|
|
|
case MipsISD::DPAX_W_PH: return "MipsISD::DPAX_W_PH";
|
|
|
|
case MipsISD::DPSX_W_PH: return "MipsISD::DPSX_W_PH";
|
|
|
|
case MipsISD::DPSQX_S_W_PH: return "MipsISD::DPSQX_S_W_PH";
|
|
|
|
case MipsISD::DPSQX_SA_W_PH: return "MipsISD::DPSQX_SA_W_PH";
|
|
|
|
case MipsISD::MULSA_W_PH: return "MipsISD::MULSA_W_PH";
|
2012-09-22 07:52:47 +08:00
|
|
|
case MipsISD::MULT: return "MipsISD::MULT";
|
|
|
|
case MipsISD::MULTU: return "MipsISD::MULTU";
|
2013-03-04 09:06:54 +08:00
|
|
|
case MipsISD::MADD_DSP: return "MipsISD::MADD_DSP";
|
2012-09-22 07:52:47 +08:00
|
|
|
case MipsISD::MADDU_DSP: return "MipsISD::MADDU_DSP";
|
|
|
|
case MipsISD::MSUB_DSP: return "MipsISD::MSUB_DSP";
|
|
|
|
case MipsISD::MSUBU_DSP: return "MipsISD::MSUBU_DSP";
|
2013-04-20 07:21:32 +08:00
|
|
|
case MipsISD::SHLL_DSP: return "MipsISD::SHLL_DSP";
|
|
|
|
case MipsISD::SHRA_DSP: return "MipsISD::SHRA_DSP";
|
|
|
|
case MipsISD::SHRL_DSP: return "MipsISD::SHRL_DSP";
|
2013-05-01 06:37:26 +08:00
|
|
|
case MipsISD::SETCC_DSP: return "MipsISD::SETCC_DSP";
|
|
|
|
case MipsISD::SELECT_CC_DSP: return "MipsISD::SELECT_CC_DSP";
|
2013-08-28 20:14:50 +08:00
|
|
|
case MipsISD::VALL_ZERO: return "MipsISD::VALL_ZERO";
|
|
|
|
case MipsISD::VANY_ZERO: return "MipsISD::VANY_ZERO";
|
|
|
|
case MipsISD::VALL_NONZERO: return "MipsISD::VALL_NONZERO";
|
|
|
|
case MipsISD::VANY_NONZERO: return "MipsISD::VANY_NONZERO";
|
2013-09-24 18:46:19 +08:00
|
|
|
case MipsISD::VCEQ: return "MipsISD::VCEQ";
|
|
|
|
case MipsISD::VCLE_S: return "MipsISD::VCLE_S";
|
|
|
|
case MipsISD::VCLE_U: return "MipsISD::VCLE_U";
|
|
|
|
case MipsISD::VCLT_S: return "MipsISD::VCLT_S";
|
|
|
|
case MipsISD::VCLT_U: return "MipsISD::VCLT_U";
|
2013-09-24 20:18:31 +08:00
|
|
|
case MipsISD::VSMAX: return "MipsISD::VSMAX";
|
|
|
|
case MipsISD::VSMIN: return "MipsISD::VSMIN";
|
|
|
|
case MipsISD::VUMAX: return "MipsISD::VUMAX";
|
|
|
|
case MipsISD::VUMIN: return "MipsISD::VUMIN";
|
2013-09-23 22:03:12 +08:00
|
|
|
case MipsISD::VEXTRACT_SEXT_ELT: return "MipsISD::VEXTRACT_SEXT_ELT";
|
|
|
|
case MipsISD::VEXTRACT_ZEXT_ELT: return "MipsISD::VEXTRACT_ZEXT_ELT";
|
2013-09-23 21:22:24 +08:00
|
|
|
case MipsISD::VNOR: return "MipsISD::VNOR";
|
2013-09-24 22:02:15 +08:00
|
|
|
case MipsISD::VSHF: return "MipsISD::VSHF";
|
2013-09-24 22:20:00 +08:00
|
|
|
case MipsISD::SHF: return "MipsISD::SHF";
|
2013-09-24 22:36:12 +08:00
|
|
|
case MipsISD::ILVEV: return "MipsISD::ILVEV";
|
|
|
|
case MipsISD::ILVOD: return "MipsISD::ILVOD";
|
|
|
|
case MipsISD::ILVL: return "MipsISD::ILVL";
|
|
|
|
case MipsISD::ILVR: return "MipsISD::ILVR";
|
2013-09-24 22:53:25 +08:00
|
|
|
case MipsISD::PCKEV: return "MipsISD::PCKEV";
|
|
|
|
case MipsISD::PCKOD: return "MipsISD::PCKOD";
|
[mips] Rewrite MipsAsmParser and MipsOperand.
Summary:
Highlights:
- Registers are resolved much later (by the render method).
Prior to that point, GPR32's/GPR64's are GPR's regardless of register
size. Similarly FGR32's/FGR64's/AFGR64's are FGR's regardless of register
size or FR mode. Numeric registers can be anything.
- All registers are parsed the same way everywhere (even when handling
symbol aliasing)
- One consequence is that all registers can be specified numerically
almost anywhere (e.g. $fccX, $wX). The exception is symbol aliasing
but that can be easily resolved.
- Removes the need for the hasConsumedDollar hack
- Parenthesis and Bracket suffixes are handled generically
- Micromips instructions are parsed directly instead of going through the
standard encodings first.
- rdhwr accepts all 32 registers, and the following instructions that previously
xfailed now work:
ddiv, ddivu, div, divu, cvt.l.[ds], se[bh], wsbh, floor.w.[ds], c.ngl.d,
c.sf.s, dsbh, dshd, madd.s, msub.s, nmadd.s, nmsub.s, swxc1
- Diagnostics involving registers point at the correct character (the $)
- There's only one kind of immediate in MipsOperand. LSA immediates are handled
by the predicate and renderer.
Lowlights:
- Hardcoded '$zero' in the div patterns is handled with a hack.
MipsOperand::isReg() will return true for a k_RegisterIndex token
with Index == 0 and getReg() will return ZERO for this case. Note that it
doesn't return ZERO_64 on isGP64() targets.
- I haven't cleaned up all of the now-unused functions.
Some more of the generic parser could be removed too (integers and relocs
for example).
- insve.df needed a custom decoder to handle the implicit fourth operand that
was needed to make it parse correctly. The difficulty was that the matcher
expected a Token<'0'> but gets an Imm<0>. Adding an implicit zero solved this.
Reviewers: matheusalmeida, vmedic
Reviewed By: matheusalmeida
Differential Revision: http://llvm-reviews.chandlerc.com/D3222
llvm-svn: 205292
2014-04-01 18:35:28 +08:00
|
|
|
case MipsISD::INSVE: return "MipsISD::INSVE";
|
2007-06-06 15:42:06 +08:00
|
|
|
}
|
2015-05-08 05:33:59 +08:00
|
|
|
return nullptr;
|
2007-06-06 15:42:06 +08:00
|
|
|
}
|
|
|
|
|
2014-09-20 07:30:42 +08:00
|
|
|
MipsTargetLowering::MipsTargetLowering(const MipsTargetMachine &TM,
|
2014-07-19 07:25:04 +08:00
|
|
|
const MipsSubtarget &STI)
|
2015-01-30 07:27:36 +08:00
|
|
|
: TargetLowering(TM), Subtarget(STI), ABI(TM.getABI()) {
|
2007-06-06 15:42:06 +08:00
|
|
|
// Mips does not have i1 type, so use i32 for
|
2010-11-23 11:31:01 +08:00
|
|
|
// setcc operations results (slt, sgt, ...).
|
2008-11-23 23:47:28 +08:00
|
|
|
setBooleanContents(ZeroOrOneBooleanContent);
|
2013-05-01 06:37:26 +08:00
|
|
|
setBooleanVectorContents(ZeroOrNegativeOneBooleanContent);
|
2014-07-10 18:18:12 +08:00
|
|
|
// The cmp.cond.fmt instruction in MIPS32r6/MIPS64r6 uses 0 and -1 like MSA
|
|
|
|
// does. Integer booleans still use 0 and 1.
|
2014-07-19 06:55:25 +08:00
|
|
|
if (Subtarget.hasMips32r6())
|
2014-07-10 18:18:12 +08:00
|
|
|
setBooleanContents(ZeroOrOneBooleanContent,
|
|
|
|
ZeroOrNegativeOneBooleanContent);
|
2007-06-06 15:42:06 +08:00
|
|
|
|
2010-11-23 11:31:01 +08:00
|
|
|
// Load extended operations for i1 types must be promoted
|
[SelectionDAG] Allow targets to specify legality of extloads' result
type (in addition to the memory type).
The *LoadExt* legalization handling used to only have one type, the
memory type. This forced users to assume that as long as the extload
for the memory type was declared legal, and the result type was legal,
the whole extload was legal.
However, this isn't always the case. For instance, on X86, with AVX,
this is legal:
v4i32 load, zext from v4i8
but this isn't:
v4i64 load, zext from v4i8
Whereas v4i64 is (arguably) legal, even without AVX2.
Note that the same thing was done a while ago for truncstores (r46140),
but I assume no one needed it yet for extloads, so here we go.
Calls to getLoadExtAction were changed to add the value type, found
manually in the surrounding code.
Calls to setLoadExtAction were mechanically changed, by wrapping the
call in a loop, to match previous behavior. The loop iterates over
the MVT subrange corresponding to the memory type (FP vectors, etc...).
I also pulled neighboring setTruncStoreActions into some of the loops;
those shouldn't make a difference, as the additional types are illegal.
(e.g., i128->i1 truncstores on PPC.)
No functional change intended.
Differential Revision: http://reviews.llvm.org/D6532
llvm-svn: 225421
2015-01-08 08:51:32 +08:00
|
|
|
for (MVT VT : MVT::integer_valuetypes()) {
|
|
|
|
setLoadExtAction(ISD::EXTLOAD, VT, MVT::i1, Promote);
|
|
|
|
setLoadExtAction(ISD::ZEXTLOAD, VT, MVT::i1, Promote);
|
|
|
|
setLoadExtAction(ISD::SEXTLOAD, VT, MVT::i1, Promote);
|
|
|
|
}
|
2007-06-06 15:42:06 +08:00
|
|
|
|
2015-04-21 04:15:36 +08:00
|
|
|
// MIPS doesn't have extending float->double load/store. Set LoadExtAction
|
|
|
|
// for f32, f16
|
|
|
|
for (MVT VT : MVT::fp_valuetypes()) {
|
[SelectionDAG] Allow targets to specify legality of extloads' result
type (in addition to the memory type).
The *LoadExt* legalization handling used to only have one type, the
memory type. This forced users to assume that as long as the extload
for the memory type was declared legal, and the result type was legal,
the whole extload was legal.
However, this isn't always the case. For instance, on X86, with AVX,
this is legal:
v4i32 load, zext from v4i8
but this isn't:
v4i64 load, zext from v4i8
Whereas v4i64 is (arguably) legal, even without AVX2.
Note that the same thing was done a while ago for truncstores (r46140),
but I assume no one needed it yet for extloads, so here we go.
Calls to getLoadExtAction were changed to add the value type, found
manually in the surrounding code.
Calls to setLoadExtAction were mechanically changed, by wrapping the
call in a loop, to match previous behavior. The loop iterates over
the MVT subrange corresponding to the memory type (FP vectors, etc...).
I also pulled neighboring setTruncStoreActions into some of the loops;
those shouldn't make a difference, as the additional types are illegal.
(e.g., i128->i1 truncstores on PPC.)
No functional change intended.
Differential Revision: http://reviews.llvm.org/D6532
llvm-svn: 225421
2015-01-08 08:51:32 +08:00
|
|
|
setLoadExtAction(ISD::EXTLOAD, VT, MVT::f32, Expand);
|
2015-04-21 04:15:36 +08:00
|
|
|
setLoadExtAction(ISD::EXTLOAD, VT, MVT::f16, Expand);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Set LoadExtAction for f16 vectors to Expand
|
|
|
|
for (MVT VT : MVT::fp_vector_valuetypes()) {
|
|
|
|
MVT F16VT = MVT::getVectorVT(MVT::f16, VT.getVectorNumElements());
|
|
|
|
if (F16VT.isValid())
|
|
|
|
setLoadExtAction(ISD::EXTLOAD, VT, F16VT, Expand);
|
|
|
|
}
|
|
|
|
|
|
|
|
setTruncStoreAction(MVT::f32, MVT::f16, Expand);
|
|
|
|
setTruncStoreAction(MVT::f64, MVT::f16, Expand);
|
|
|
|
|
2009-08-12 04:47:22 +08:00
|
|
|
setTruncStoreAction(MVT::f64, MVT::f32, Expand);
|
2009-07-17 10:28:12 +08:00
|
|
|
|
2010-11-23 11:31:01 +08:00
|
|
|
// Used by legalize types to correctly generate the setcc result.
|
|
|
|
// Without this, every float setcc comes with an AND/OR with the result,
|
|
|
|
// we don't want this, since the fpcmp result goes to a flag register,
|
2008-08-01 02:31:28 +08:00
|
|
|
// which is used implicitly by brcond and select operations.
|
2016-03-02 04:25:43 +08:00
|
|
|
AddPromotedToType(ISD::SETCC, MVT::i1, MVT::i32);
|
2008-08-01 02:31:28 +08:00
|
|
|
|
2008-07-09 12:15:08 +08:00
|
|
|
// Mips Custom Operations
|
2016-11-15 20:39:46 +08:00
|
|
|
setOperationAction(ISD::BR_JT, MVT::Other, Expand);
|
2009-08-12 04:47:22 +08:00
|
|
|
setOperationAction(ISD::GlobalAddress, MVT::i32, Custom);
|
2011-03-05 04:01:52 +08:00
|
|
|
setOperationAction(ISD::BlockAddress, MVT::i32, Custom);
|
2009-08-12 04:47:22 +08:00
|
|
|
setOperationAction(ISD::GlobalTLSAddress, MVT::i32, Custom);
|
|
|
|
setOperationAction(ISD::JumpTable, MVT::i32, Custom);
|
|
|
|
setOperationAction(ISD::ConstantPool, MVT::i32, Custom);
|
2016-09-09 19:06:01 +08:00
|
|
|
setOperationAction(ISD::SELECT, MVT::f32, Custom);
|
|
|
|
setOperationAction(ISD::SELECT, MVT::f64, Custom);
|
|
|
|
setOperationAction(ISD::SELECT, MVT::i32, Custom);
|
|
|
|
setOperationAction(ISD::SETCC, MVT::f32, Custom);
|
|
|
|
setOperationAction(ISD::SETCC, MVT::f64, Custom);
|
|
|
|
setOperationAction(ISD::BRCOND, MVT::Other, Custom);
|
2012-03-10 08:03:50 +08:00
|
|
|
setOperationAction(ISD::FCOPYSIGN, MVT::f32, Custom);
|
|
|
|
setOperationAction(ISD::FCOPYSIGN, MVT::f64, Custom);
|
2013-05-17 05:17:15 +08:00
|
|
|
setOperationAction(ISD::FP_TO_SINT, MVT::i32, Custom);
|
2012-03-10 08:03:50 +08:00
|
|
|
|
2014-07-19 06:55:25 +08:00
|
|
|
if (Subtarget.isGP64bit()) {
|
2012-03-10 08:03:50 +08:00
|
|
|
setOperationAction(ISD::GlobalAddress, MVT::i64, Custom);
|
|
|
|
setOperationAction(ISD::BlockAddress, MVT::i64, Custom);
|
|
|
|
setOperationAction(ISD::GlobalTLSAddress, MVT::i64, Custom);
|
|
|
|
setOperationAction(ISD::JumpTable, MVT::i64, Custom);
|
|
|
|
setOperationAction(ISD::ConstantPool, MVT::i64, Custom);
|
2016-09-09 19:06:01 +08:00
|
|
|
setOperationAction(ISD::SELECT, MVT::i64, Custom);
|
2012-06-02 08:04:42 +08:00
|
|
|
setOperationAction(ISD::LOAD, MVT::i64, Custom);
|
|
|
|
setOperationAction(ISD::STORE, MVT::i64, Custom);
|
2013-05-17 05:17:15 +08:00
|
|
|
setOperationAction(ISD::FP_TO_SINT, MVT::i64, Custom);
|
2015-01-26 20:33:22 +08:00
|
|
|
setOperationAction(ISD::SHL_PARTS, MVT::i64, Custom);
|
|
|
|
setOperationAction(ISD::SRA_PARTS, MVT::i64, Custom);
|
|
|
|
setOperationAction(ISD::SRL_PARTS, MVT::i64, Custom);
|
2012-03-10 08:03:50 +08:00
|
|
|
}
|
2010-02-07 05:00:02 +08:00
|
|
|
|
2014-07-19 06:55:25 +08:00
|
|
|
if (!Subtarget.isGP64bit()) {
|
2012-05-09 08:55:21 +08:00
|
|
|
setOperationAction(ISD::SHL_PARTS, MVT::i32, Custom);
|
|
|
|
setOperationAction(ISD::SRA_PARTS, MVT::i32, Custom);
|
|
|
|
setOperationAction(ISD::SRL_PARTS, MVT::i32, Custom);
|
|
|
|
}
|
|
|
|
|
Add ISD::EH_DWARF_CFA, simplify @llvm.eh.dwarf.cfa on Mips, fix on PowerPC
LLVM has an @llvm.eh.dwarf.cfa intrinsic, used to lower the GCC-compatible
__builtin_dwarf_cfa() builtin. As pointed out in PR26761, this is currently
broken on PowerPC (and likely on ARM as well). Currently, @llvm.eh.dwarf.cfa is
lowered using:
ADD(FRAMEADDR, FRAME_TO_ARGS_OFFSET)
where FRAME_TO_ARGS_OFFSET defaults to the constant zero. On x86,
FRAME_TO_ARGS_OFFSET is lowered to 2*SlotSize. This setup, however, does not
work for PowerPC. Because of the way that the stack layout works, the canonical
frame address is not exactly (FRAMEADDR + FRAME_TO_ARGS_OFFSET) on PowerPC
(there is a lower save-area offset as well), so it is not just a matter of
implementing FRAME_TO_ARGS_OFFSET for PowerPC (unless we redefine its
semantics -- We can do that, since it is currently used only for
@llvm.eh.dwarf.cfa lowering, but the better to directly lower the CFA construct
itself (since it can be easily represented as a fixed-offset FrameIndex)). Mips
currently does this, but by using a custom lowering for ADD that specifically
recognizes the (FRAMEADDR, FRAME_TO_ARGS_OFFSET) pattern.
This change introduces a ISD::EH_DWARF_CFA node, which by default expands using
the existing logic, but can be directly lowered by the target. Mips is updated
to use this method (which simplifies its implementation, and I suspect makes it
more robust), and updates PowerPC to do the same.
Fixes PR26761.
Differential Revision: https://reviews.llvm.org/D24038
llvm-svn: 280350
2016-09-01 18:28:47 +08:00
|
|
|
setOperationAction(ISD::EH_DWARF_CFA, MVT::i32, Custom);
|
2014-07-19 06:55:25 +08:00
|
|
|
if (Subtarget.isGP64bit())
|
Add ISD::EH_DWARF_CFA, simplify @llvm.eh.dwarf.cfa on Mips, fix on PowerPC
LLVM has an @llvm.eh.dwarf.cfa intrinsic, used to lower the GCC-compatible
__builtin_dwarf_cfa() builtin. As pointed out in PR26761, this is currently
broken on PowerPC (and likely on ARM as well). Currently, @llvm.eh.dwarf.cfa is
lowered using:
ADD(FRAMEADDR, FRAME_TO_ARGS_OFFSET)
where FRAME_TO_ARGS_OFFSET defaults to the constant zero. On x86,
FRAME_TO_ARGS_OFFSET is lowered to 2*SlotSize. This setup, however, does not
work for PowerPC. Because of the way that the stack layout works, the canonical
frame address is not exactly (FRAMEADDR + FRAME_TO_ARGS_OFFSET) on PowerPC
(there is a lower save-area offset as well), so it is not just a matter of
implementing FRAME_TO_ARGS_OFFSET for PowerPC (unless we redefine its
semantics -- We can do that, since it is currently used only for
@llvm.eh.dwarf.cfa lowering, but the better to directly lower the CFA construct
itself (since it can be easily represented as a fixed-offset FrameIndex)). Mips
currently does this, but by using a custom lowering for ADD that specifically
recognizes the (FRAMEADDR, FRAME_TO_ARGS_OFFSET) pattern.
This change introduces a ISD::EH_DWARF_CFA node, which by default expands using
the existing logic, but can be directly lowered by the target. Mips is updated
to use this method (which simplifies its implementation, and I suspect makes it
more robust), and updates PowerPC to do the same.
Fixes PR26761.
Differential Revision: https://reviews.llvm.org/D24038
llvm-svn: 280350
2016-09-01 18:28:47 +08:00
|
|
|
setOperationAction(ISD::EH_DWARF_CFA, MVT::i64, Custom);
|
2012-11-08 03:10:58 +08:00
|
|
|
|
2011-03-05 05:03:24 +08:00
|
|
|
setOperationAction(ISD::SDIV, MVT::i32, Expand);
|
|
|
|
setOperationAction(ISD::SREM, MVT::i32, Expand);
|
|
|
|
setOperationAction(ISD::UDIV, MVT::i32, Expand);
|
|
|
|
setOperationAction(ISD::UREM, MVT::i32, Expand);
|
2011-10-04 05:06:13 +08:00
|
|
|
setOperationAction(ISD::SDIV, MVT::i64, Expand);
|
|
|
|
setOperationAction(ISD::SREM, MVT::i64, Expand);
|
|
|
|
setOperationAction(ISD::UDIV, MVT::i64, Expand);
|
|
|
|
setOperationAction(ISD::UREM, MVT::i64, Expand);
|
2011-03-05 05:03:24 +08:00
|
|
|
|
2008-07-09 12:15:08 +08:00
|
|
|
// Operations not directly supported by Mips.
|
2013-03-08 23:36:57 +08:00
|
|
|
setOperationAction(ISD::BR_CC, MVT::f32, Expand);
|
|
|
|
setOperationAction(ISD::BR_CC, MVT::f64, Expand);
|
|
|
|
setOperationAction(ISD::BR_CC, MVT::i32, Expand);
|
|
|
|
setOperationAction(ISD::BR_CC, MVT::i64, Expand);
|
2014-06-11 00:01:29 +08:00
|
|
|
setOperationAction(ISD::SELECT_CC, MVT::i32, Expand);
|
|
|
|
setOperationAction(ISD::SELECT_CC, MVT::i64, Expand);
|
2016-01-12 00:44:48 +08:00
|
|
|
setOperationAction(ISD::SELECT_CC, MVT::f32, Expand);
|
|
|
|
setOperationAction(ISD::SELECT_CC, MVT::f64, Expand);
|
2009-08-12 04:47:22 +08:00
|
|
|
setOperationAction(ISD::UINT_TO_FP, MVT::i32, Expand);
|
2011-12-21 07:40:56 +08:00
|
|
|
setOperationAction(ISD::UINT_TO_FP, MVT::i64, Expand);
|
2009-08-12 04:47:22 +08:00
|
|
|
setOperationAction(ISD::FP_TO_UINT, MVT::i32, Expand);
|
2011-12-21 07:40:56 +08:00
|
|
|
setOperationAction(ISD::FP_TO_UINT, MVT::i64, Expand);
|
2009-08-12 04:47:22 +08:00
|
|
|
setOperationAction(ISD::SIGN_EXTEND_INREG, MVT::i1, Expand);
|
2014-07-19 06:55:25 +08:00
|
|
|
if (Subtarget.hasCnMips()) {
|
2014-03-20 19:51:58 +08:00
|
|
|
setOperationAction(ISD::CTPOP, MVT::i32, Legal);
|
|
|
|
setOperationAction(ISD::CTPOP, MVT::i64, Legal);
|
|
|
|
} else {
|
|
|
|
setOperationAction(ISD::CTPOP, MVT::i32, Expand);
|
|
|
|
setOperationAction(ISD::CTPOP, MVT::i64, Expand);
|
|
|
|
}
|
2009-08-12 04:47:22 +08:00
|
|
|
setOperationAction(ISD::CTTZ, MVT::i32, Expand);
|
2011-12-21 08:14:05 +08:00
|
|
|
setOperationAction(ISD::CTTZ, MVT::i64, Expand);
|
2009-08-12 04:47:22 +08:00
|
|
|
setOperationAction(ISD::ROTL, MVT::i32, Expand);
|
2011-10-01 02:51:46 +08:00
|
|
|
setOperationAction(ISD::ROTL, MVT::i64, Expand);
|
2012-08-01 04:54:48 +08:00
|
|
|
setOperationAction(ISD::DYNAMIC_STACKALLOC, MVT::i32, Expand);
|
|
|
|
setOperationAction(ISD::DYNAMIC_STACKALLOC, MVT::i64, Expand);
|
2010-12-10 01:32:30 +08:00
|
|
|
|
2014-07-19 06:55:25 +08:00
|
|
|
if (!Subtarget.hasMips32r2())
|
2010-12-10 01:32:30 +08:00
|
|
|
setOperationAction(ISD::ROTR, MVT::i32, Expand);
|
|
|
|
|
2014-07-19 06:55:25 +08:00
|
|
|
if (!Subtarget.hasMips64r2())
|
2011-10-01 02:51:46 +08:00
|
|
|
setOperationAction(ISD::ROTR, MVT::i64, Expand);
|
|
|
|
|
2009-08-12 04:47:22 +08:00
|
|
|
setOperationAction(ISD::FSIN, MVT::f32, Expand);
|
2011-03-05 02:54:14 +08:00
|
|
|
setOperationAction(ISD::FSIN, MVT::f64, Expand);
|
2009-08-12 04:47:22 +08:00
|
|
|
setOperationAction(ISD::FCOS, MVT::f32, Expand);
|
2011-03-05 02:54:14 +08:00
|
|
|
setOperationAction(ISD::FCOS, MVT::f64, Expand);
|
2013-01-29 10:32:37 +08:00
|
|
|
setOperationAction(ISD::FSINCOS, MVT::f32, Expand);
|
|
|
|
setOperationAction(ISD::FSINCOS, MVT::f64, Expand);
|
2009-08-12 04:47:22 +08:00
|
|
|
setOperationAction(ISD::FPOWI, MVT::f32, Expand);
|
|
|
|
setOperationAction(ISD::FPOW, MVT::f32, Expand);
|
2011-05-24 06:23:58 +08:00
|
|
|
setOperationAction(ISD::FPOW, MVT::f64, Expand);
|
2009-08-12 04:47:22 +08:00
|
|
|
setOperationAction(ISD::FLOG, MVT::f32, Expand);
|
|
|
|
setOperationAction(ISD::FLOG2, MVT::f32, Expand);
|
|
|
|
setOperationAction(ISD::FLOG10, MVT::f32, Expand);
|
|
|
|
setOperationAction(ISD::FEXP, MVT::f32, Expand);
|
2011-07-09 05:39:21 +08:00
|
|
|
setOperationAction(ISD::FMA, MVT::f32, Expand);
|
|
|
|
setOperationAction(ISD::FMA, MVT::f64, Expand);
|
2012-03-30 02:43:11 +08:00
|
|
|
setOperationAction(ISD::FREM, MVT::f32, Expand);
|
|
|
|
setOperationAction(ISD::FREM, MVT::f64, Expand);
|
2015-04-21 04:15:36 +08:00
|
|
|
|
|
|
|
// Lower f16 conversion operations into library calls
|
|
|
|
setOperationAction(ISD::FP16_TO_FP, MVT::f32, Expand);
|
|
|
|
setOperationAction(ISD::FP_TO_FP16, MVT::f32, Expand);
|
|
|
|
setOperationAction(ISD::FP16_TO_FP, MVT::f64, Expand);
|
|
|
|
setOperationAction(ISD::FP_TO_FP16, MVT::f64, Expand);
|
2008-07-09 12:15:08 +08:00
|
|
|
|
2013-01-30 08:26:49 +08:00
|
|
|
setOperationAction(ISD::EH_RETURN, MVT::Other, Custom);
|
|
|
|
|
2014-08-01 17:17:39 +08:00
|
|
|
setOperationAction(ISD::VASTART, MVT::Other, Custom);
|
|
|
|
setOperationAction(ISD::VAARG, MVT::Other, Custom);
|
2011-03-10 03:22:22 +08:00
|
|
|
setOperationAction(ISD::VACOPY, MVT::Other, Expand);
|
|
|
|
setOperationAction(ISD::VAEND, MVT::Other, Expand);
|
|
|
|
|
2008-07-09 12:15:08 +08:00
|
|
|
// Use the default for now
|
2009-08-12 04:47:22 +08:00
|
|
|
setOperationAction(ISD::STACKSAVE, MVT::Other, Expand);
|
|
|
|
setOperationAction(ISD::STACKRESTORE, MVT::Other, Expand);
|
2011-07-28 06:21:52 +08:00
|
|
|
|
2015-11-06 20:07:20 +08:00
|
|
|
if (!Subtarget.isGP64bit()) {
|
|
|
|
setOperationAction(ISD::ATOMIC_LOAD, MVT::i64, Expand);
|
|
|
|
setOperationAction(ISD::ATOMIC_STORE, MVT::i64, Expand);
|
|
|
|
}
|
2011-08-30 02:23:02 +08:00
|
|
|
|
2011-08-04 05:06:02 +08:00
|
|
|
|
2014-07-19 06:55:25 +08:00
|
|
|
if (!Subtarget.hasMips32r2()) {
|
2009-08-12 04:47:22 +08:00
|
|
|
setOperationAction(ISD::SIGN_EXTEND_INREG, MVT::i8, Expand);
|
|
|
|
setOperationAction(ISD::SIGN_EXTEND_INREG, MVT::i16, Expand);
|
Several changes to Mips backend, experimental fp support being the most
important.
- Cleanup in the Subtarget info with addition of new features, not all support
yet, but they allow the future inclusion of features easier. Among new features,
we have : Arch family info (mips1, mips2, ...), ABI info (o32, eabi), 64-bit
integer
and float registers, allegrex vector FPU (VFPU), single float only support.
- TargetMachine now detects allegrex core.
- Added allegrex (Mips32r2) sext_inreg instructions.
- *Added Float Point Instructions*, handling single float only, and
aliased accesses for 32-bit FPUs.
- Some cleanup in FP instruction formats and FP register classes.
- Calling conventions improved to support mips 32-bit EABI.
- Added Asm Printer support for fp cond codes.
- Added support for sret copy to a return register.
- EABI support added into LowerCALL and FORMAL_ARGS.
- MipsFunctionInfo now keeps a virtual register per function to track the
sret on function entry until function ret.
- MipsInstrInfo FP support into methods (isMoveInstr, isLoadFromStackSlot, ...),
FP cond codes mapping and initial FP Branch Analysis.
- Two new Mips SDNode to handle fp branch and compare instructions : FPBrcond,
FPCmp
- MipsTargetLowering : handling different FP classes, Allegrex support, sret
return copy, no homing location within EABI, non 32-bit stack objects
arguments, and asm constraint for float.
llvm-svn: 53146
2008-07-06 03:05:21 +08:00
|
|
|
}
|
|
|
|
|
2014-05-12 20:41:59 +08:00
|
|
|
// MIPS16 lacks MIPS32's clz and clo instructions.
|
2014-07-19 06:55:25 +08:00
|
|
|
if (!Subtarget.hasMips32() || Subtarget.inMips16Mode())
|
2009-08-12 04:47:22 +08:00
|
|
|
setOperationAction(ISD::CTLZ, MVT::i32, Expand);
|
2014-07-19 06:55:25 +08:00
|
|
|
if (!Subtarget.hasMips64())
|
2011-12-21 08:20:27 +08:00
|
|
|
setOperationAction(ISD::CTLZ, MVT::i64, Expand);
|
2008-08-08 14:16:31 +08:00
|
|
|
|
2014-07-19 06:55:25 +08:00
|
|
|
if (!Subtarget.hasMips32r2())
|
2009-08-12 04:47:22 +08:00
|
|
|
setOperationAction(ISD::BSWAP, MVT::i32, Expand);
|
2014-07-19 06:55:25 +08:00
|
|
|
if (!Subtarget.hasMips64r2())
|
2011-12-21 07:56:43 +08:00
|
|
|
setOperationAction(ISD::BSWAP, MVT::i64, Expand);
|
2008-08-13 15:13:40 +08:00
|
|
|
|
2014-07-19 06:55:25 +08:00
|
|
|
if (Subtarget.isGP64bit()) {
|
[SelectionDAG] Allow targets to specify legality of extloads' result
type (in addition to the memory type).
The *LoadExt* legalization handling used to only have one type, the
memory type. This forced users to assume that as long as the extload
for the memory type was declared legal, and the result type was legal,
the whole extload was legal.
However, this isn't always the case. For instance, on X86, with AVX,
this is legal:
v4i32 load, zext from v4i8
but this isn't:
v4i64 load, zext from v4i8
Whereas v4i64 is (arguably) legal, even without AVX2.
Note that the same thing was done a while ago for truncstores (r46140),
but I assume no one needed it yet for extloads, so here we go.
Calls to getLoadExtAction were changed to add the value type, found
manually in the surrounding code.
Calls to setLoadExtAction were mechanically changed, by wrapping the
call in a loop, to match previous behavior. The loop iterates over
the MVT subrange corresponding to the memory type (FP vectors, etc...).
I also pulled neighboring setTruncStoreActions into some of the loops;
those shouldn't make a difference, as the additional types are illegal.
(e.g., i128->i1 truncstores on PPC.)
No functional change intended.
Differential Revision: http://reviews.llvm.org/D6532
llvm-svn: 225421
2015-01-08 08:51:32 +08:00
|
|
|
setLoadExtAction(ISD::SEXTLOAD, MVT::i64, MVT::i32, Custom);
|
|
|
|
setLoadExtAction(ISD::ZEXTLOAD, MVT::i64, MVT::i32, Custom);
|
|
|
|
setLoadExtAction(ISD::EXTLOAD, MVT::i64, MVT::i32, Custom);
|
2012-06-02 08:04:42 +08:00
|
|
|
setTruncStoreAction(MVT::i64, MVT::i32, Custom);
|
|
|
|
}
|
|
|
|
|
2013-07-27 04:58:55 +08:00
|
|
|
setOperationAction(ISD::TRAP, MVT::Other, Legal);
|
|
|
|
|
2011-03-05 05:03:24 +08:00
|
|
|
setTargetDAGCombine(ISD::SDIVREM);
|
|
|
|
setTargetDAGCombine(ISD::UDIVREM);
|
2012-03-08 11:26:37 +08:00
|
|
|
setTargetDAGCombine(ISD::SELECT);
|
2011-08-18 01:45:08 +08:00
|
|
|
setTargetDAGCombine(ISD::AND);
|
|
|
|
setTargetDAGCombine(ISD::OR);
|
2012-06-14 04:33:18 +08:00
|
|
|
setTargetDAGCombine(ISD::ADD);
|
2016-04-13 23:07:45 +08:00
|
|
|
setTargetDAGCombine(ISD::AssertZext);
|
[Mips] Add support to match more patterns for DEXT and CINS
This patch adds support for recognizing more patterns to match to DEXT and
CINS instructions.
It finds cases where multiple instructions could be replaced with a single
DEXT or CINS instruction.
For example, for the following:
define i64 @dext_and32(i64 zeroext %a) {
entry:
%and = and i64 %a, 4294967295
ret i64 %and
}
instead of generating:
0000000000000088 <dext_and32>:
88: 64010001 daddiu at,zero,1
8c: 0001083c dsll32 at,at,0x0
90: 6421ffff daddiu at,at,-1
94: 03e00008 jr ra
98: 00811024 and v0,a0,at
9c: 00000000 nop
the following gets generated:
0000000000000068 <dext_and32>:
68: 03e00008 jr ra
6c: 7c82f803 dext v0,a0,0x0,0x20
Cases that are covered:
DEXT:
1. and $src, mask where mask > 0xffff
2. zext $src zero extend from i32 to i64
CINS:
1. and (shl $src, pos), mask
2. shl (and $src, mask), pos
3. zext (shl $src, pos) zero extend from i32 to i64
Patch by Violeta Vukobrat.
Differential Revision: https://reviews.llvm.org/D30464
llvm-svn: 297832
2017-03-15 21:10:08 +08:00
|
|
|
setTargetDAGCombine(ISD::SHL);
|
2011-01-19 03:29:17 +08:00
|
|
|
|
2016-09-07 18:01:18 +08:00
|
|
|
if (ABI.IsO32()) {
|
|
|
|
// These libcalls are not available in 32-bit.
|
|
|
|
setLibcallName(RTLIB::SHL_I128, nullptr);
|
|
|
|
setLibcallName(RTLIB::SRL_I128, nullptr);
|
|
|
|
setLibcallName(RTLIB::SRA_I128, nullptr);
|
|
|
|
}
|
|
|
|
|
2014-07-19 06:55:25 +08:00
|
|
|
setMinFunctionAlignment(Subtarget.isGP64bit() ? 3 : 2);
|
2011-05-07 04:34:06 +08:00
|
|
|
|
2014-08-01 17:17:39 +08:00
|
|
|
// The arguments on the stack are defined in terms of 4-byte slots on O32
|
|
|
|
// and 8-byte slots on N32/N64.
|
2015-01-30 07:27:36 +08:00
|
|
|
setMinStackArgumentAlignment((ABI.IsN32() || ABI.IsN64()) ? 8 : 4);
|
2014-08-01 17:17:39 +08:00
|
|
|
|
2015-01-30 07:27:36 +08:00
|
|
|
setStackPointerRegisterToSaveRestore(ABI.IsN64() ? Mips::SP_64 : Mips::SP);
|
2011-05-27 02:59:03 +08:00
|
|
|
|
2013-02-21 05:13:59 +08:00
|
|
|
MaxStoresPerMemcpy = 16;
|
2013-12-20 00:12:56 +08:00
|
|
|
|
2014-07-19 06:55:25 +08:00
|
|
|
isMicroMips = Subtarget.inMicroMipsMode();
|
2007-06-06 15:42:06 +08:00
|
|
|
}
|
|
|
|
|
2014-09-20 07:30:42 +08:00
|
|
|
/// Factory for the lowering object that matches the subtarget's mode:
/// the Mips16 lowering when \p STI is in MIPS16 mode, the MipsSE lowering
/// in every other case.
const MipsTargetLowering *
MipsTargetLowering::create(const MipsTargetMachine &TM,
                           const MipsSubtarget &STI) {
  if (!STI.inMips16Mode())
    return llvm::createMipsSETargetLowering(TM, STI);

  return llvm::createMips16TargetLowering(TM, STI);
}
|
|
|
|
|
2014-04-18 06:15:34 +08:00
|
|
|
// Create a fast isel object.
|
|
|
|
FastISel *
|
|
|
|
MipsTargetLowering::createFastISel(FunctionLoweringInfo &funcInfo,
|
|
|
|
const TargetLibraryInfo *libInfo) const {
|
2016-10-18 21:05:42 +08:00
|
|
|
const MipsTargetMachine &TM =
|
|
|
|
static_cast<const MipsTargetMachine &>(funcInfo.MF->getTarget());
|
|
|
|
|
|
|
|
// We support only the standard encoding [MIPS32,MIPS32R5] ISAs.
|
|
|
|
bool UseFastISel = TM.Options.EnableFastISel && Subtarget.hasMips32() &&
|
|
|
|
!Subtarget.hasMips32r6() && !Subtarget.inMips16Mode() &&
|
|
|
|
!Subtarget.inMicroMipsMode();
|
|
|
|
|
|
|
|
// Disable if we don't generate PIC or the ABI isn't O32.
|
|
|
|
if (!TM.isPositionIndependent() || !TM.getABI().IsO32())
|
|
|
|
UseFastISel = false;
|
|
|
|
|
|
|
|
return UseFastISel ? Mips::createFastISel(funcInfo, libInfo) : nullptr;
|
2014-04-18 06:15:34 +08:00
|
|
|
}
|
|
|
|
|
2015-07-09 10:09:04 +08:00
|
|
|
/// Result type of a SETCC on operands of type \p VT: vectors yield the same
/// vector shape with integer elements, everything else yields i32.
EVT MipsTargetLowering::getSetCCResultType(const DataLayout &, LLVMContext &,
                                           EVT VT) const {
  if (VT.isVector())
    return VT.changeVectorElementTypeToInteger();

  return MVT::i32;
}
|
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
/// Combine for ISD::SDIVREM / ISD::UDIVREM, applied only once operations have
/// been legalized. The node is replaced by a glue-producing DivRem16 /
/// DivRemU16 node followed by copies out of LO (result 0) and HI (result 1),
/// one copy per result that actually has users. Users are rewired directly,
/// so the function always returns an empty SDValue.
static SDValue performDivRemCombine(SDNode *N, SelectionDAG &DAG,
                                    TargetLowering::DAGCombinerInfo &DCI,
                                    const MipsSubtarget &Subtarget) {
  if (DCI.isBeforeLegalizeOps())
    return SDValue();

  EVT Ty = N->getValueType(0);
  const bool Is32Bit = (Ty == MVT::i32);
  unsigned LoReg = Is32Bit ? Mips::LO0 : Mips::LO0_64;
  unsigned HiReg = Is32Bit ? Mips::HI0 : Mips::HI0_64;

  unsigned DivOpc;
  if (N->getOpcode() == ISD::SDIVREM)
    DivOpc = MipsISD::DivRem16;
  else
    DivOpc = MipsISD::DivRemU16;

  SDLoc DL(N);

  // The divide itself only produces glue; the results are read from LO/HI.
  SDValue Glue = DAG.getNode(DivOpc, DL, MVT::Glue, N->getOperand(0),
                             N->getOperand(1));
  SDValue Chain = DAG.getEntryNode();

  // insert MFLO
  if (N->hasAnyUseOfValue(0)) {
    SDValue FromLo = DAG.getCopyFromReg(Chain, DL, LoReg, Ty, Glue);
    DAG.ReplaceAllUsesOfValueWith(SDValue(N, 0), FromLo);
    // Thread chain and glue through so a following HI copy is ordered after
    // this one.
    Chain = FromLo.getValue(1);
    Glue = FromLo.getValue(2);
  }

  // insert MFHI
  if (N->hasAnyUseOfValue(1)) {
    SDValue FromHi = DAG.getCopyFromReg(Chain, DL, HiReg, Ty, Glue);
    DAG.ReplaceAllUsesOfValueWith(SDValue(N, 1), FromHi);
  }

  return SDValue();
}
|
|
|
|
|
2016-09-09 19:06:01 +08:00
|
|
|
/// Translate an ISD condition code into the Mips floating point condition
/// code. The SETxx codes without an ordered/unordered prefix map to the same
/// value as their SETOxx counterpart. Any code not listed is unreachable.
static Mips::CondCode condCodeToFCC(ISD::CondCode CC) {
  switch (CC) {
  // Ordered comparisons (and their prefix-less aliases).
  case ISD::SETEQ:
  case ISD::SETOEQ:
    return Mips::FCOND_OEQ;
  case ISD::SETNE:
  case ISD::SETONE:
    return Mips::FCOND_ONE;
  case ISD::SETLT:
  case ISD::SETOLT:
    return Mips::FCOND_OLT;
  case ISD::SETLE:
  case ISD::SETOLE:
    return Mips::FCOND_OLE;
  case ISD::SETGT:
  case ISD::SETOGT:
    return Mips::FCOND_OGT;
  case ISD::SETGE:
  case ISD::SETOGE:
    return Mips::FCOND_OGE;

  // Unordered comparisons.
  case ISD::SETUEQ:
    return Mips::FCOND_UEQ;
  case ISD::SETUNE:
    return Mips::FCOND_UNE;
  case ISD::SETULT:
    return Mips::FCOND_ULT;
  case ISD::SETULE:
    return Mips::FCOND_ULE;
  case ISD::SETUGT:
    return Mips::FCOND_UGT;
  case ISD::SETUGE:
    return Mips::FCOND_UGE;

  // Pure ordered / unordered tests.
  case ISD::SETO:
    return Mips::FCOND_OR;
  case ISD::SETUO:
    return Mips::FCOND_UN;

  default:
    llvm_unreachable("Unknown fp condition code!");
  }
}
|
|
|
|
|
|
|
|
|
|
|
|
/// This function returns true if the floating point conditional branches and
|
|
|
|
/// conditional moves which use condition code CC should be inverted.
|
|
|
|
static bool invertFPCondCodeUser(Mips::CondCode CC) {
|
|
|
|
if (CC >= Mips::FCOND_F && CC <= Mips::FCOND_NGT)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
assert((CC >= Mips::FCOND_T && CC <= Mips::FCOND_GT) &&
|
|
|
|
"Illegal Condition Code");
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Creates and returns an FPCmp node from a setcc node.
|
|
|
|
// Returns Op if setcc is not a floating point comparison.
|
|
|
|
static SDValue createFPCmp(SelectionDAG &DAG, const SDValue &Op) {
|
|
|
|
// must be a SETCC node
|
|
|
|
if (Op.getOpcode() != ISD::SETCC)
|
|
|
|
return Op;
|
|
|
|
|
|
|
|
SDValue LHS = Op.getOperand(0);
|
|
|
|
|
|
|
|
if (!LHS.getValueType().isFloatingPoint())
|
|
|
|
return Op;
|
|
|
|
|
|
|
|
SDValue RHS = Op.getOperand(1);
|
|
|
|
SDLoc DL(Op);
|
|
|
|
|
|
|
|
// Assume the 3rd operand is a CondCodeSDNode. Add code to check the type of
|
|
|
|
// node if necessary.
|
|
|
|
ISD::CondCode CC = cast<CondCodeSDNode>(Op.getOperand(2))->get();
|
|
|
|
|
|
|
|
return DAG.getNode(MipsISD::FPCmp, DL, MVT::Glue, LHS, RHS,
|
|
|
|
DAG.getConstant(condCodeToFCC(CC), DL, MVT::i32));
|
|
|
|
}
|
|
|
|
|
|
|
|
// Creates and returns a CMovFPT/F node.
|
|
|
|
static SDValue createCMovFP(SelectionDAG &DAG, SDValue Cond, SDValue True,
|
|
|
|
SDValue False, const SDLoc &DL) {
|
|
|
|
ConstantSDNode *CC = cast<ConstantSDNode>(Cond.getOperand(2));
|
|
|
|
bool invert = invertFPCondCodeUser((Mips::CondCode)CC->getSExtValue());
|
|
|
|
SDValue FCC0 = DAG.getRegister(Mips::FCC0, MVT::i32);
|
|
|
|
|
|
|
|
return DAG.getNode((invert ? MipsISD::CMovFP_F : MipsISD::CMovFP_T), DL,
|
|
|
|
True.getValueType(), True, FCC0, False, Cond);
|
|
|
|
}
|
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
/// Combine for ISD::SELECT whose condition is an integer SETCC and whose
/// false operand is an integer constant. Runs only after operation
/// legalization. Three rewrites are attempted:
///   * false == 0: swap the select operands and invert the condition;
///   * true - false ==  1: select becomes (add setcc, false);
///   * true - false == -1: select becomes (add inverted-setcc, true).
/// Returns an empty SDValue when none of them applies.
static SDValue performSELECTCombine(SDNode *N, SelectionDAG &DAG,
                                    TargetLowering::DAGCombinerInfo &DCI,
                                    const MipsSubtarget &Subtarget) {
  if (DCI.isBeforeLegalizeOps())
    return SDValue();

  SDValue Cond = N->getOperand(0);
  const bool IsIntSetCC = Cond.getOpcode() == ISD::SETCC &&
                          Cond.getOperand(0).getValueType().isInteger();
  if (!IsIntSetCC)
    return SDValue();

  SDValue FalseVal = N->getOperand(2);
  EVT FalseTy = FalseVal.getValueType();
  if (!FalseTy.isInteger())
    return SDValue();

  // Every rewrite below needs the false operand to be a constant.
  ConstantSDNode *FalseC = dyn_cast<ConstantSDNode>(FalseVal);
  if (!FalseC)
    return SDValue();

  const SDLoc DL(N);
  SDValue TrueVal = N->getOperand(1);

  // Builds the inverse of the controlling integer setcc.
  auto BuildInvertedSetCC = [&]() -> SDValue {
    ISD::CondCode CC = cast<CondCodeSDNode>(Cond.getOperand(2))->get();
    return DAG.getSetCC(DL, Cond.getValueType(), Cond.getOperand(0),
                        Cond.getOperand(1), ISD::getSetCCInverse(CC, true));
  };

  // If the RHS (False) is 0, swap the operands of the select (inverting the
  // condition as well) so that conditional moves can use the $0 register.
  // Example:
  //   return (a != 0) ? x : 0;
  //     load $reg, x
  //     movz $reg, $0, a
  if (FalseC->getZExtValue() == 0) {
    SDValue Inverted = BuildInvertedSetCC();
    return DAG.getNode(ISD::SELECT, DL, FalseTy, Inverted, FalseVal, TrueVal);
  }

  // With two integer constants the select may reduce to setcc arithmetic.
  ConstantSDNode *TrueC = dyn_cast<ConstantSDNode>(TrueVal);
  if (!TrueC || !TrueVal.getValueType().isInteger())
    return SDValue();

  // MVT::i64 operands are left alone: the result of a non-vector SETCC is
  // always MVT::i32, and the sign extensions that would be required make the
  // transformation ineffective.
  if (TrueVal.getValueType() == MVT::i64)
    return SDValue();

  const int64_t Diff = TrueC->getSExtValue() - FalseC->getSExtValue();

  // 1) (a < x) ? y : y-1
  //  slti $reg1, a, x
  //  addiu $reg2, $reg1, y-1
  if (Diff == 1)
    return DAG.getNode(ISD::ADD, DL, Cond.getValueType(), Cond, FalseVal);

  // 2) (a < x) ? y-1 : y
  //  slti $reg1, a, x
  //  xor $reg1, $reg1, 1
  //  addiu $reg2, $reg1, y-1
  if (Diff == -1) {
    SDValue Inverted = BuildInvertedSetCC();
    return DAG.getNode(ISD::ADD, DL, Inverted.getValueType(), Inverted,
                       TrueVal);
  }

  // Couldn't optimize.
  return SDValue();
}
|
|
|
|
|
2015-03-02 20:47:32 +08:00
|
|
|
/// Combine for MipsISD::CMovFP_T / CMovFP_F, applied after operation
/// legalization. When operand 2 (the value-if-false) is the constant 0, the
/// node is rebuilt with the opposite opcode and with operands 0 and 2
/// exchanged. Returns an empty SDValue otherwise.
static SDValue performCMovFPCombine(SDNode *N, SelectionDAG &DAG,
                                    TargetLowering::DAGCombinerInfo &DCI,
                                    const MipsSubtarget &Subtarget) {
  if (DCI.isBeforeLegalizeOps())
    return SDValue();

  SDValue TrueVal = N->getOperand(0);
  SDValue FalseVal = N->getOperand(2);

  ConstantSDNode *FalseC = dyn_cast<ConstantSDNode>(FalseVal);
  const bool FalseIsZero = FalseC && FalseC->getZExtValue() == 0;
  if (!FalseIsZero)
    return SDValue();

  // Since RHS (False) is 0, swap the True/False operands (inverting the
  // condition by flipping the opcode) so that conditional moves can use the
  // $0 register.
  // Example:
  //   return (a != 0) ? x : 0;
  //     load $reg, x
  //     movz $reg, $0, a
  unsigned FlippedOpc = MipsISD::CMovFP_T;
  if (N->getOpcode() == MipsISD::CMovFP_T)
    FlippedOpc = MipsISD::CMovFP_F;

  SDValue FCC = N->getOperand(1);
  SDValue Glue = N->getOperand(3);
  return DAG.getNode(FlippedOpc, SDLoc(N), FalseVal.getValueType(), FalseVal,
                     FCC, TrueVal, Glue);
}
|
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
/// Combine for ISD::AND with a constant shifted-mask right operand. Runs only
/// after operation legalization and only when the subtarget reports
/// extract/insert support. Three shapes are recognised:
///   * and ((sra|srl) $src, pos), (2**size - 1)  => Ext  $src, pos, size
///   * and (shl $src, pos), mask   (cnMIPS only) => CIns $src, pos, size-1
///   * and $src, (2**size - 1) with mask > 0xffff => Ext $src, 0, size
/// Returns an empty SDValue when the node matches none of them.
static SDValue performANDCombine(SDNode *N, SelectionDAG &DAG,
                                 TargetLowering::DAGCombinerInfo &DCI,
                                 const MipsSubtarget &Subtarget) {
  if (DCI.isBeforeLegalizeOps() || !Subtarget.hasExtractInsert())
    return SDValue();

  SDValue LHS = N->getOperand(0);
  const unsigned LHSOpc = LHS.getOpcode();
  EVT ValTy = N->getValueType(0);
  SDLoc DL(N);

  // Op's second operand must be a shifted mask.
  uint64_t SMPos, SMSize;
  ConstantSDNode *MaskC = dyn_cast<ConstantSDNode>(N->getOperand(1));
  if (!MaskC || !isShiftedMask(MaskC->getZExtValue(), SMPos, SMSize))
    return SDValue();

  uint64_t Pos = 0;
  SDValue Src;
  unsigned NewOpc;

  if (LHSOpc == ISD::SRA || LHSOpc == ISD::SRL) {
    // Pattern match EXT.
    //  $dst = and ((sra or srl) $src , pos), (2**size - 1)
    //  => ext $dst, $src, pos, size

    // The second operand of the shift must be an immediate.
    ConstantSDNode *ShiftC = dyn_cast<ConstantSDNode>(LHS.getOperand(1));
    if (!ShiftC)
      return SDValue();

    Pos = ShiftC->getZExtValue();

    // Bail out if the mask does not start at bit 0 or if pos + size runs
    // past the width of the value.
    if (SMPos != 0 || Pos + SMSize > ValTy.getSizeInBits())
      return SDValue();

    NewOpc = MipsISD::Ext;
    Src = LHS.getOperand(0);
  } else if (LHSOpc == ISD::SHL && Subtarget.hasCnMips()) {
    // Pattern match CINS.
    //  $dst = and (shl $src , pos), mask
    //  => cins $dst, $src, pos, size
    // mask is a shifted mask with consecutive 1's, pos = shift amount,
    // size = population count.

    // The second operand of the shift must be an immediate.
    ConstantSDNode *ShiftC = dyn_cast<ConstantSDNode>(LHS.getOperand(1));
    if (!ShiftC)
      return SDValue();

    Pos = ShiftC->getZExtValue();

    const bool Encodable = SMPos == Pos && Pos < ValTy.getSizeInBits() &&
                           SMSize < 32 &&
                           Pos + SMSize <= ValTy.getSizeInBits();
    if (!Encodable)
      return SDValue();

    Src = LHS.getOperand(0);
    // SMSize is 'location' (position) in this case, not size.
    SMSize--;
    NewOpc = MipsISD::CIns;
  } else {
    // Pattern match EXT.
    //  $dst = and $src, (2**size - 1) , if size > 16
    //  => ext $dst, $src, pos, size , pos = 0

    // If the mask is <= 0xffff, andi can be used instead.
    if (MaskC->getZExtValue() <= 0xffff)
      return SDValue();

    // Return if the mask doesn't start at position 0.
    if (SMPos != 0)
      return SDValue();

    NewOpc = MipsISD::Ext;
    Src = LHS;
  }

  return DAG.getNode(NewOpc, DL, ValTy, Src,
                     DAG.getConstant(Pos, DL, MVT::i32),
                     DAG.getConstant(SMSize, DL, MVT::i32));
}
|
2012-02-28 15:46:26 +08:00
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
/// Combine for ISD::OR that recognises a bit-field insert. Runs only after
/// operation legalization and only when the subtarget reports extract/insert
/// support.
///
/// Pattern match INS.
///  $dst = or (and $src1 , mask0), (and (shl $src, pos), mask1),
///  where mask1 = (2**size - 1) << pos, mask0 = ~mask1
///  => MipsISD::Ins node with operands ($src, pos, size, $src1)
///
/// Returns an empty SDValue when the pattern does not match.
static SDValue performORCombine(SDNode *N, SelectionDAG &DAG,
                                TargetLowering::DAGCombinerInfo &DCI,
                                const MipsSubtarget &Subtarget) {
  if (DCI.isBeforeLegalizeOps() || !Subtarget.hasExtractInsert())
    return SDValue();

  SDValue KeepAnd = N->getOperand(0);
  SDValue InsertAnd = N->getOperand(1);

  // See if Op's first operand matches (and $src1 , mask0).
  if (KeepAnd.getOpcode() != ISD::AND)
    return SDValue();

  uint64_t SMPos0, SMSize0;
  ConstantSDNode *Mask0C = dyn_cast<ConstantSDNode>(KeepAnd.getOperand(1));
  if (!Mask0C || !isShiftedMask(~Mask0C->getSExtValue(), SMPos0, SMSize0))
    return SDValue();

  // See if Op's second operand matches (and (shl $src, pos), mask1).
  if (InsertAnd.getOpcode() != ISD::AND)
    return SDValue();

  uint64_t SMPos1, SMSize1;
  ConstantSDNode *Mask1C = dyn_cast<ConstantSDNode>(InsertAnd.getOperand(1));
  if (!Mask1C || !isShiftedMask(Mask1C->getZExtValue(), SMPos1, SMSize1))
    return SDValue();

  // The shift masks must have the same position and size.
  const bool SameField = SMPos0 == SMPos1 && SMSize0 == SMSize1;
  if (!SameField)
    return SDValue();

  SDValue Shl = InsertAnd.getOperand(0);
  if (Shl.getOpcode() != ISD::SHL)
    return SDValue();

  ConstantSDNode *ShamtC = dyn_cast<ConstantSDNode>(Shl.getOperand(1));
  if (!ShamtC)
    return SDValue();

  unsigned Shamt = ShamtC->getZExtValue();

  // Give up unless the shift amount equals the first bit position of the
  // mask and the field fits inside the value.
  EVT ValTy = N->getValueType(0);
  if (Shamt != SMPos0)
    return SDValue();
  if (SMPos0 + SMSize0 > ValTy.getSizeInBits())
    return SDValue();

  SDLoc DL(N);
  return DAG.getNode(MipsISD::Ins, DL, ValTy, Shl.getOperand(0),
                     DAG.getConstant(SMPos0, DL, MVT::i32),
                     DAG.getConstant(SMSize0, DL, MVT::i32),
                     KeepAnd.getOperand(0));
}
|
2012-02-28 15:46:26 +08:00
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
/// Combine for ISD::ADD, applied after operation legalization. Reassociates
///   (add v0, (add v1, abs_lo(tjt))) => (add (add v0, v1), abs_lo(tjt))
/// where abs_lo(tjt) is a MipsISD::Lo node wrapping a TargetJumpTable.
/// Returns an empty SDValue when the node does not have that shape.
static SDValue performADDCombine(SDNode *N, SelectionDAG &DAG,
                                 TargetLowering::DAGCombinerInfo &DCI,
                                 const MipsSubtarget &Subtarget) {
  if (DCI.isBeforeLegalizeOps())
    return SDValue();

  SDValue InnerAdd = N->getOperand(1);
  if (InnerAdd.getOpcode() != ISD::ADD)
    return SDValue();

  SDValue JTLo = InnerAdd.getOperand(1);
  const bool IsJumpTableLo =
      JTLo.getOpcode() == MipsISD::Lo &&
      JTLo.getOperand(0).getOpcode() == ISD::TargetJumpTable;
  if (!IsJumpTableLo)
    return SDValue();

  EVT ValTy = N->getValueType(0);
  SDLoc DL(N);

  // Add the two non-jump-table values first, then add the Lo part on top.
  SDValue Sum = DAG.getNode(ISD::ADD, DL, ValTy, N->getOperand(0),
                            InnerAdd.getOperand(0));
  return DAG.getNode(ISD::ADD, DL, ValTy, Sum, JTLo);
}
|
|
|
|
|
2016-04-13 23:07:45 +08:00
|
|
|
/// Combine for ISD::AssertZext.
///
/// fold (AssertZext (trunc (AssertZext x))) -> (trunc (AssertZext x))
/// when the type asserted by the outer node is narrower than the type
/// asserted by the inner node, eg:
///     (AssertZext:i32 (trunc:i32 (AssertZext:i64 X, i32)), i8)
///  -> (trunc:i32 (AssertZext X, i8))
///
/// Returns an empty SDValue when the node does not have that shape or the
/// outer asserted type is not narrower.
static SDValue performAssertZextCombine(SDNode *N, SelectionDAG &DAG,
                                        TargetLowering::DAGCombinerInfo &DCI,
                                        const MipsSubtarget &Subtarget) {
  SDValue Trunc = N->getOperand(0);
  EVT OuterVT = cast<VTSDNode>(N->getOperand(1))->getVT();

  const bool IsTruncOfAssertZext =
      Trunc.getOpcode() == ISD::TRUNCATE &&
      Trunc.getOperand(0).getOpcode() == ISD::AssertZext;
  if (!IsTruncOfAssertZext)
    return SDValue();

  SDValue InnerAssert = Trunc.getOperand(0);
  EVT InnerVT = cast<VTSDNode>(InnerAssert->getOperand(1))->getVT();

  if (!OuterVT.bitsLT(InnerVT))
    return SDValue();

  // Re-assert the narrower type on the untruncated value, then truncate.
  SDValue NarrowAssert = DAG.getNode(
      ISD::AssertZext, SDLoc(N), InnerAssert.getValueType(),
      InnerAssert.getOperand(0), DAG.getValueType(OuterVT));
  return DAG.getNode(ISD::TRUNCATE, SDLoc(N), N->getValueType(0),
                     NarrowAssert);
}
|
|
|
|
|
[Mips] Add support to match more patterns for DEXT and CINS
This patch adds support for recognizing more patterns to match to DEXT and
CINS instructions.
It finds cases where multiple instructions could be replaced with a single
DEXT or CINS instruction.
For example, for the following:
define i64 @dext_and32(i64 zeroext %a) {
entry:
%and = and i64 %a, 4294967295
ret i64 %and
}
instead of generating:
0000000000000088 <dext_and32>:
88: 64010001 daddiu at,zero,1
8c: 0001083c dsll32 at,at,0x0
90: 6421ffff daddiu at,at,-1
94: 03e00008 jr ra
98: 00811024 and v0,a0,at
9c: 00000000 nop
the following gets generated:
0000000000000068 <dext_and32>:
68: 03e00008 jr ra
6c: 7c82f803 dext v0,a0,0x0,0x20
Cases that are covered:
DEXT:
1. and $src, mask where mask > 0xffff
2. zext $src zero extend from i32 to i64
CINS:
1. and (shl $src, pos), mask
2. shl (and $src, mask), pos
3. zext (shl $src, pos) zero extend from i32 to i64
Patch by Violeta Vukobrat.
Differential Revision: https://reviews.llvm.org/D30464
llvm-svn: 297832
2017-03-15 21:10:08 +08:00
|
|
|
|
|
|
|
// Pattern match CINS:
//
//   $dst = shl (and $src, imm), pos
//     => cins $dst, $src, pos, size
//
// The combine only runs after operation legalization and only when the
// subtarget reports hasCnMips(). Returns an empty SDValue otherwise, or when
// the operands do not have the required shape.
static SDValue performSHLCombine(SDNode *N, SelectionDAG &DAG,
                                 TargetLowering::DAGCombinerInfo &DCI,
                                 const MipsSubtarget &Subtarget) {
  if (DCI.isBeforeLegalizeOps() || !Subtarget.hasCnMips())
    return SDValue();

  EVT VT = N->getValueType(0);
  SDValue Masked = N->getOperand(0);

  // The shift amount must be an immediate that is smaller than the type width.
  ConstantSDNode *ShAmtC = dyn_cast<ConstantSDNode>(N->getOperand(1));
  if (!ShAmtC)
    return SDValue();

  uint64_t ShAmt = ShAmtC->getZExtValue();
  if (ShAmt >= VT.getSizeInBits())
    return SDValue();

  // The shifted value must be an AND with a constant shifted mask.
  if (Masked.getOpcode() != ISD::AND)
    return SDValue();

  ConstantSDNode *MaskC = dyn_cast<ConstantSDNode>(Masked.getOperand(1));
  if (!MaskC)
    return SDValue();

  uint64_t MaskPos, MaskLen;
  if (!isShiftedMask(MaskC->getZExtValue(), MaskPos, MaskLen))
    return SDValue();

  // Give up if the mask does not start at bit 0, is wider than 32 bits, or if
  // the shifted field would not fit in the value type.
  if (MaskPos != 0 || MaskLen > 32 || ShAmt + MaskLen > VT.getSizeInBits())
    return SDValue();

  SDLoc Loc(N);
  SDValue PosOp = DAG.getConstant(ShAmt, Loc, MVT::i32);
  // The last CIns operand is the mask length minus one (the position of the
  // mask's top bit), not the length itself.
  SDValue LenMinusOneOp = DAG.getConstant(MaskLen - 1, Loc, MVT::i32);

  return DAG.getNode(MipsISD::CIns, Loc, VT, Masked.getOperand(0), PosOp,
                     LenMinusOneOp);
}
|
|
|
|
|
2011-02-11 02:05:10 +08:00
|
|
|
// Target DAG-combine entry point: forwards N to the file-local combine routine
// registered for its opcode. Opcodes without a Mips-specific combine yield an
// empty SDValue.
SDValue MipsTargetLowering::PerformDAGCombine(SDNode *N,
                                              DAGCombinerInfo &DCI) const {
  SelectionDAG &DAG = DCI.DAG;

  switch (N->getOpcode()) {
  case ISD::SDIVREM:
  case ISD::UDIVREM:
    return performDivRemCombine(N, DAG, DCI, Subtarget);

  case ISD::SELECT:
    return performSELECTCombine(N, DAG, DCI, Subtarget);

  case MipsISD::CMovFP_F:
  case MipsISD::CMovFP_T:
    return performCMovFPCombine(N, DAG, DCI, Subtarget);

  case ISD::AND:
    return performANDCombine(N, DAG, DCI, Subtarget);

  case ISD::OR:
    return performORCombine(N, DAG, DCI, Subtarget);

  case ISD::ADD:
    return performADDCombine(N, DAG, DCI, Subtarget);

  case ISD::AssertZext:
    return performAssertZextCombine(N, DAG, DCI, Subtarget);

  case ISD::SHL:
    return performSHLCombine(N, DAG, DCI, Subtarget);

  default:
    // No target-specific combine for this opcode.
    return SDValue();
  }
}
|
|
|
|
|
[MIPS] add overrides for isCheapToSpeculateCttz() and isCheapToSpeculateCtlz()
MIPS32 has instructions for efficient count-leading/trailing-zeros, so this should be
considered a cheap operation (and therefore fair game for speculation) for any MIPS32
implementation.
The net result of allowing this speculation for the regression tests in this patch is
that we get this code:
ctlz:
jr $ra
clz $2, $4
cttz:
addiu $1, $4, -1
not $2, $4
and $1, $2, $1
clz $1, $1
addiu $2, $zero, 32
jr $ra
subu $2, $2, $1
Instead of:
ctlz:
beqz $4, $BB0_2
addiu $2, $zero, 32
clz $2, $4
$BB0_2:
jr $ra
nop
cttz:
beqz $4, $BB1_2
addiu $2, $zero, 32
addiu $1, $4, -1
not $2, $4
and $1, $2, $1
clz $1, $1
addiu $2, $zero, 32
subu $2, $2, $1
$BB1_2:
jr $ra
nop
See D14469 for the larger motivation.
Differential Revision: http://reviews.llvm.org/D14500
llvm-svn: 252755
2015-11-12 01:24:56 +08:00
|
|
|
bool MipsTargetLowering::isCheapToSpeculateCttz() const {
|
|
|
|
return Subtarget.hasMips32();
|
|
|
|
}
|
|
|
|
|
|
|
|
bool MipsTargetLowering::isCheapToSpeculateCtlz() const {
|
|
|
|
return Subtarget.hasMips32();
|
|
|
|
}
|
|
|
|
|
2012-09-22 07:58:31 +08:00
|
|
|
void
|
|
|
|
MipsTargetLowering::LowerOperationWrapper(SDNode *N,
|
|
|
|
SmallVectorImpl<SDValue> &Results,
|
|
|
|
SelectionDAG &DAG) const {
|
|
|
|
SDValue Res = LowerOperation(SDValue(N, 0), DAG);
|
|
|
|
|
|
|
|
for (unsigned I = 0, E = Res->getNumValues(); I != E; ++I)
|
|
|
|
Results.push_back(Res.getValue(I));
|
|
|
|
}
|
|
|
|
|
|
|
|
void
|
|
|
|
MipsTargetLowering::ReplaceNodeResults(SDNode *N,
|
|
|
|
SmallVectorImpl<SDValue> &Results,
|
|
|
|
SelectionDAG &DAG) const {
|
2013-05-01 05:17:07 +08:00
|
|
|
return LowerOperationWrapper(N, Results, DAG);
|
2012-09-22 07:58:31 +08:00
|
|
|
}
|
|
|
|
|
2008-07-28 05:46:04 +08:00
|
|
|
// Custom-lowering dispatcher: routes Op to the lower* member that handles its
// opcode. Opcodes that are not listed here produce an empty SDValue.
SDValue MipsTargetLowering::LowerOperation(SDValue Op,
                                           SelectionDAG &DAG) const {
  switch (Op.getOpcode()) {
  case ISD::BRCOND:
    return lowerBRCOND(Op, DAG);
  case ISD::ConstantPool:
    return lowerConstantPool(Op, DAG);
  case ISD::GlobalAddress:
    return lowerGlobalAddress(Op, DAG);
  case ISD::BlockAddress:
    return lowerBlockAddress(Op, DAG);
  case ISD::GlobalTLSAddress:
    return lowerGlobalTLSAddress(Op, DAG);
  case ISD::JumpTable:
    return lowerJumpTable(Op, DAG);
  case ISD::SELECT:
    return lowerSELECT(Op, DAG);
  case ISD::SETCC:
    return lowerSETCC(Op, DAG);
  case ISD::VASTART:
    return lowerVASTART(Op, DAG);
  case ISD::VAARG:
    return lowerVAARG(Op, DAG);
  case ISD::FCOPYSIGN:
    return lowerFCOPYSIGN(Op, DAG);
  case ISD::FRAMEADDR:
    return lowerFRAMEADDR(Op, DAG);
  case ISD::RETURNADDR:
    return lowerRETURNADDR(Op, DAG);
  case ISD::EH_RETURN:
    return lowerEH_RETURN(Op, DAG);
  case ISD::ATOMIC_FENCE:
    return lowerATOMIC_FENCE(Op, DAG);
  case ISD::SHL_PARTS:
    return lowerShiftLeftParts(Op, DAG);
  case ISD::SRA_PARTS:
    // Arithmetic right shift.
    return lowerShiftRightParts(Op, DAG, true);
  case ISD::SRL_PARTS:
    // Logical right shift.
    return lowerShiftRightParts(Op, DAG, false);
  case ISD::LOAD:
    return lowerLOAD(Op, DAG);
  case ISD::STORE:
    return lowerSTORE(Op, DAG);
  case ISD::EH_DWARF_CFA:
    return lowerEH_DWARF_CFA(Op, DAG);
  case ISD::FP_TO_SINT:
    return lowerFP_TO_SINT(Op, DAG);
  default:
    // Not an opcode with a Mips custom lowering.
    return SDValue();
  }
}
|
|
|
|
|
2011-04-16 05:51:11 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
2007-06-06 15:42:06 +08:00
|
|
|
// Lower helper functions
|
2011-04-16 05:51:11 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
2007-06-06 15:42:06 +08:00
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
// addLiveIn - This helper function adds the specified physical register to the
|
2007-06-06 15:42:06 +08:00
|
|
|
// MachineFunction as a live in value. It also creates a corresponding
|
|
|
|
// virtual register for it.
|
|
|
|
static unsigned
|
2013-03-12 08:16:36 +08:00
|
|
|
addLiveIn(MachineFunction &MF, unsigned PReg, const TargetRegisterClass *RC)
|
2007-06-06 15:42:06 +08:00
|
|
|
{
|
2007-12-31 12:13:23 +08:00
|
|
|
unsigned VReg = MF.getRegInfo().createVirtualRegister(RC);
|
|
|
|
MF.getRegInfo().addLiveIn(PReg, VReg);
|
2007-06-06 15:42:06 +08:00
|
|
|
return VReg;
|
|
|
|
}
|
|
|
|
|
2016-07-01 06:52:52 +08:00
|
|
|
// Insert "teq $divisor_reg, $zero, 7" immediately after the divide MI so that
// a zero divisor traps. The divisor is taken from operand 2 of MI.
//
// Nothing is inserted when NoZeroDivCheck is set. MI itself is kept: only an
// additional instruction is injected. MBB is returned in every case.
static MachineBasicBlock *insertDivByZeroTrap(MachineInstr &MI,
                                              MachineBasicBlock &MBB,
                                              const TargetInstrInfo &TII,
                                              bool Is64Bit, bool IsMicroMips) {
  if (NoZeroDivCheck)
    return &MBB;

  MachineOperand &DivisorOp = MI.getOperand(2);
  const unsigned TrapOpc = IsMicroMips ? Mips::TEQ_MM : Mips::TEQ;
  MachineBasicBlock::iterator AfterDiv = std::next(MachineBasicBlock::iterator(MI));

  // The trap inherits the divisor's kill state; the flag on the divide is
  // cleared further down.
  MachineInstrBuilder Trap =
      BuildMI(MBB, AfterDiv, MI.getDebugLoc(), TII.get(TrapOpc))
          .addReg(DivisorOp.getReg(), getKillRegState(DivisorOp.isKill()))
          .addReg(Mips::ZERO)
          .addImm(7);

  // For a 64-bit division, compare only the 32-bit sub-register.
  if (Is64Bit)
    Trap->getOperand(0).setSubReg(Mips::sub_32);

  // The divisor is now read again by the trap that follows MI, so MI must not
  // claim to kill it.
  DivisorOp.setIsKill(false);

  return &MBB;
}
|
|
|
|
|
2011-06-08 03:28:39 +08:00
|
|
|
MachineBasicBlock *
|
2016-07-01 06:52:52 +08:00
|
|
|
MipsTargetLowering::EmitInstrWithCustomInserter(MachineInstr &MI,
|
2011-06-08 03:28:39 +08:00
|
|
|
MachineBasicBlock *BB) const {
|
2016-07-01 06:52:52 +08:00
|
|
|
switch (MI.getOpcode()) {
|
2013-02-21 12:22:38 +08:00
|
|
|
default:
|
|
|
|
llvm_unreachable("Unexpected instr type to insert");
|
2011-06-08 03:28:39 +08:00
|
|
|
case Mips::ATOMIC_LOAD_ADD_I8:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinaryPartword(MI, BB, 1, Mips::ADDu);
|
2011-06-08 03:28:39 +08:00
|
|
|
case Mips::ATOMIC_LOAD_ADD_I16:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinaryPartword(MI, BB, 2, Mips::ADDu);
|
2011-06-08 03:28:39 +08:00
|
|
|
case Mips::ATOMIC_LOAD_ADD_I32:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinary(MI, BB, 4, Mips::ADDu);
|
2011-11-11 12:14:30 +08:00
|
|
|
case Mips::ATOMIC_LOAD_ADD_I64:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinary(MI, BB, 8, Mips::DADDu);
|
2011-06-08 03:28:39 +08:00
|
|
|
|
|
|
|
case Mips::ATOMIC_LOAD_AND_I8:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinaryPartword(MI, BB, 1, Mips::AND);
|
2011-06-08 03:28:39 +08:00
|
|
|
case Mips::ATOMIC_LOAD_AND_I16:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinaryPartword(MI, BB, 2, Mips::AND);
|
2011-06-08 03:28:39 +08:00
|
|
|
case Mips::ATOMIC_LOAD_AND_I32:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinary(MI, BB, 4, Mips::AND);
|
2011-11-11 12:14:30 +08:00
|
|
|
case Mips::ATOMIC_LOAD_AND_I64:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinary(MI, BB, 8, Mips::AND64);
|
2011-06-08 03:28:39 +08:00
|
|
|
|
|
|
|
case Mips::ATOMIC_LOAD_OR_I8:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinaryPartword(MI, BB, 1, Mips::OR);
|
2011-06-08 03:28:39 +08:00
|
|
|
case Mips::ATOMIC_LOAD_OR_I16:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinaryPartword(MI, BB, 2, Mips::OR);
|
2011-06-08 03:28:39 +08:00
|
|
|
case Mips::ATOMIC_LOAD_OR_I32:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinary(MI, BB, 4, Mips::OR);
|
2011-11-11 12:14:30 +08:00
|
|
|
case Mips::ATOMIC_LOAD_OR_I64:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinary(MI, BB, 8, Mips::OR64);
|
2011-06-08 03:28:39 +08:00
|
|
|
|
|
|
|
case Mips::ATOMIC_LOAD_XOR_I8:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinaryPartword(MI, BB, 1, Mips::XOR);
|
2011-06-08 03:28:39 +08:00
|
|
|
case Mips::ATOMIC_LOAD_XOR_I16:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinaryPartword(MI, BB, 2, Mips::XOR);
|
2011-06-08 03:28:39 +08:00
|
|
|
case Mips::ATOMIC_LOAD_XOR_I32:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinary(MI, BB, 4, Mips::XOR);
|
2011-11-11 12:14:30 +08:00
|
|
|
case Mips::ATOMIC_LOAD_XOR_I64:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinary(MI, BB, 8, Mips::XOR64);
|
2011-06-08 03:28:39 +08:00
|
|
|
|
|
|
|
case Mips::ATOMIC_LOAD_NAND_I8:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinaryPartword(MI, BB, 1, 0, true);
|
2011-06-08 03:28:39 +08:00
|
|
|
case Mips::ATOMIC_LOAD_NAND_I16:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinaryPartword(MI, BB, 2, 0, true);
|
2011-06-08 03:28:39 +08:00
|
|
|
case Mips::ATOMIC_LOAD_NAND_I32:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinary(MI, BB, 4, 0, true);
|
2011-11-11 12:14:30 +08:00
|
|
|
case Mips::ATOMIC_LOAD_NAND_I64:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinary(MI, BB, 8, 0, true);
|
2011-06-08 03:28:39 +08:00
|
|
|
|
|
|
|
case Mips::ATOMIC_LOAD_SUB_I8:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinaryPartword(MI, BB, 1, Mips::SUBu);
|
2011-06-08 03:28:39 +08:00
|
|
|
case Mips::ATOMIC_LOAD_SUB_I16:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinaryPartword(MI, BB, 2, Mips::SUBu);
|
2011-06-08 03:28:39 +08:00
|
|
|
case Mips::ATOMIC_LOAD_SUB_I32:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinary(MI, BB, 4, Mips::SUBu);
|
2011-11-11 12:14:30 +08:00
|
|
|
case Mips::ATOMIC_LOAD_SUB_I64:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinary(MI, BB, 8, Mips::DSUBu);
|
2011-06-08 03:28:39 +08:00
|
|
|
|
|
|
|
case Mips::ATOMIC_SWAP_I8:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinaryPartword(MI, BB, 1, 0);
|
2011-06-08 03:28:39 +08:00
|
|
|
case Mips::ATOMIC_SWAP_I16:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinaryPartword(MI, BB, 2, 0);
|
2011-06-08 03:28:39 +08:00
|
|
|
case Mips::ATOMIC_SWAP_I32:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinary(MI, BB, 4, 0);
|
2011-11-11 12:14:30 +08:00
|
|
|
case Mips::ATOMIC_SWAP_I64:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicBinary(MI, BB, 8, 0);
|
2011-06-08 03:28:39 +08:00
|
|
|
|
2017-03-09 22:03:26 +08:00
|
|
|
case Mips::ATOMIC_CMP_SWAP_I8:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicCmpSwapPartword(MI, BB, 1);
|
2017-03-09 22:03:26 +08:00
|
|
|
case Mips::ATOMIC_CMP_SWAP_I16:
|
2013-03-12 08:16:36 +08:00
|
|
|
return emitAtomicCmpSwapPartword(MI, BB, 2);
|
2017-03-09 22:03:26 +08:00
|
|
|
case Mips::ATOMIC_CMP_SWAP_I32:
|
|
|
|
return emitAtomicCmpSwap(MI, BB, 4);
|
|
|
|
case Mips::ATOMIC_CMP_SWAP_I64:
|
|
|
|
return emitAtomicCmpSwap(MI, BB, 8);
|
2013-05-21 02:07:43 +08:00
|
|
|
case Mips::PseudoSDIV:
|
|
|
|
case Mips::PseudoUDIV:
|
[mips][mips64r6] Replace m[tf]hi, m[tf]lo, mult, multu, dmult, dmultu, div, ddiv, divu, ddivu for MIPS32r6/MIPS64.
Summary:
The accumulator-based (HI/LO) multiplies and divides from earlier ISA's have
been removed and replaced with GPR-based equivalents. For example:
div $1, $2
mflo $3
is now:
div $3, $1, $2
This patch disables the accumulator-based multiplies and divides for
MIPS32r6/MIPS64r6 and uses the GPR-based equivalents instead.
Renamed expandPseudoDiv to insertDivByZeroTrap to better describe the
behaviour of the function.
MipsDelaySlotFiller now invalidates the liveness information when moving
instructions to the delay slot. Without this, divrem.ll will abort since
%GP ends up used before it is defined.
Reviewers: vmedic, zoran.jovanovic, jkolek
Reviewed By: jkolek
Differential Revision: http://reviews.llvm.org/D3896
llvm-svn: 210760
2014-06-12 18:44:10 +08:00
|
|
|
case Mips::DIV:
|
|
|
|
case Mips::DIVU:
|
|
|
|
case Mips::MOD:
|
|
|
|
case Mips::MODU:
|
2016-04-13 16:02:26 +08:00
|
|
|
return insertDivByZeroTrap(MI, *BB, *Subtarget.getInstrInfo(), false,
|
|
|
|
false);
|
|
|
|
case Mips::SDIV_MM_Pseudo:
|
|
|
|
case Mips::UDIV_MM_Pseudo:
|
|
|
|
case Mips::SDIV_MM:
|
|
|
|
case Mips::UDIV_MM:
|
|
|
|
case Mips::DIV_MMR6:
|
|
|
|
case Mips::DIVU_MMR6:
|
|
|
|
case Mips::MOD_MMR6:
|
|
|
|
case Mips::MODU_MMR6:
|
|
|
|
return insertDivByZeroTrap(MI, *BB, *Subtarget.getInstrInfo(), false, true);
|
2013-05-21 02:07:43 +08:00
|
|
|
case Mips::PseudoDSDIV:
|
|
|
|
case Mips::PseudoDUDIV:
|
[mips][mips64r6] Replace m[tf]hi, m[tf]lo, mult, multu, dmult, dmultu, div, ddiv, divu, ddivu for MIPS32r6/MIPS64.
Summary:
The accumulator-based (HI/LO) multiplies and divides from earlier ISA's have
been removed and replaced with GPR-based equivalents. For example:
div $1, $2
mflo $3
is now:
div $3, $1, $2
This patch disables the accumulator-based multiplies and divides for
MIPS32r6/MIPS64r6 and uses the GPR-based equivalents instead.
Renamed expandPseudoDiv to insertDivByZeroTrap to better describe the
behaviour of the function.
MipsDelaySlotFiller now invalidates the liveness information when moving
instructions to the delay slot. Without this, divrem.ll will abort since
%GP ends up used before it is defined.
Reviewers: vmedic, zoran.jovanovic, jkolek
Reviewed By: jkolek
Differential Revision: http://reviews.llvm.org/D3896
llvm-svn: 210760
2014-06-12 18:44:10 +08:00
|
|
|
case Mips::DDIV:
|
|
|
|
case Mips::DDIVU:
|
|
|
|
case Mips::DMOD:
|
|
|
|
case Mips::DMODU:
|
2016-04-13 16:02:26 +08:00
|
|
|
return insertDivByZeroTrap(MI, *BB, *Subtarget.getInstrInfo(), true, false);
|
|
|
|
case Mips::DDIV_MM64R6:
|
|
|
|
case Mips::DDIVU_MM64R6:
|
|
|
|
case Mips::DMOD_MM64R6:
|
|
|
|
case Mips::DMODU_MM64R6:
|
|
|
|
return insertDivByZeroTrap(MI, *BB, *Subtarget.getInstrInfo(), true, true);
|
2014-06-12 21:39:06 +08:00
|
|
|
case Mips::SEL_D:
|
2016-06-09 19:15:53 +08:00
|
|
|
case Mips::SEL_D_MMR6:
|
2014-06-12 21:39:06 +08:00
|
|
|
return emitSEL_D(MI, BB);
|
2014-12-12 22:41:37 +08:00
|
|
|
|
|
|
|
case Mips::PseudoSELECT_I:
|
2014-12-12 23:16:46 +08:00
|
|
|
case Mips::PseudoSELECT_I64:
|
2014-12-12 22:41:37 +08:00
|
|
|
case Mips::PseudoSELECT_S:
|
|
|
|
case Mips::PseudoSELECT_D32:
|
2014-12-12 23:16:46 +08:00
|
|
|
case Mips::PseudoSELECT_D64:
|
2016-03-02 04:25:43 +08:00
|
|
|
return emitPseudoSELECT(MI, BB, false, Mips::BNE);
|
2014-12-12 22:41:37 +08:00
|
|
|
case Mips::PseudoSELECTFP_F_I:
|
2014-12-12 23:16:46 +08:00
|
|
|
case Mips::PseudoSELECTFP_F_I64:
|
2014-12-12 22:41:37 +08:00
|
|
|
case Mips::PseudoSELECTFP_F_S:
|
|
|
|
case Mips::PseudoSELECTFP_F_D32:
|
2014-12-12 23:16:46 +08:00
|
|
|
case Mips::PseudoSELECTFP_F_D64:
|
2014-12-12 22:41:37 +08:00
|
|
|
return emitPseudoSELECT(MI, BB, true, Mips::BC1F);
|
|
|
|
case Mips::PseudoSELECTFP_T_I:
|
2014-12-12 23:16:46 +08:00
|
|
|
case Mips::PseudoSELECTFP_T_I64:
|
2014-12-12 22:41:37 +08:00
|
|
|
case Mips::PseudoSELECTFP_T_S:
|
|
|
|
case Mips::PseudoSELECTFP_T_D32:
|
2014-12-12 23:16:46 +08:00
|
|
|
case Mips::PseudoSELECTFP_T_D64:
|
2014-12-12 22:41:37 +08:00
|
|
|
return emitPseudoSELECT(MI, BB, true, Mips::BC1T);
|
2011-06-08 03:28:39 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2011-05-31 10:54:07 +08:00
|
|
|
// This function also handles Mips::ATOMIC_SWAP_I32 (when BinOpcode == 0), and
|
|
|
|
// Mips::ATOMIC_LOAD_NAND_I32 (when Nand == true)
|
2016-07-01 06:52:52 +08:00
|
|
|
MachineBasicBlock *MipsTargetLowering::emitAtomicBinary(MachineInstr &MI,
|
|
|
|
MachineBasicBlock *BB,
|
|
|
|
unsigned Size,
|
|
|
|
unsigned BinOpcode,
|
|
|
|
bool Nand) const {
|
2011-11-11 12:14:30 +08:00
|
|
|
assert((Size == 4 || Size == 8) && "Unsupported size for EmitAtomicBinary.");
|
2011-05-31 10:54:07 +08:00
|
|
|
|
|
|
|
MachineFunction *MF = BB->getParent();
|
|
|
|
MachineRegisterInfo &RegInfo = MF->getRegInfo();
|
2011-11-11 12:14:30 +08:00
|
|
|
const TargetRegisterClass *RC = getRegClassFor(MVT::getIntegerVT(Size * 8));
|
2015-01-30 07:27:36 +08:00
|
|
|
const TargetInstrInfo *TII = Subtarget.getInstrInfo();
|
2016-06-14 19:29:28 +08:00
|
|
|
const bool ArePtrs64bit = ABI.ArePtrs64bit();
|
2016-07-01 06:52:52 +08:00
|
|
|
DebugLoc DL = MI.getDebugLoc();
|
2011-11-11 12:14:30 +08:00
|
|
|
unsigned LL, SC, AND, NOR, ZERO, BEQ;
|
|
|
|
|
|
|
|
if (Size == 4) {
|
2014-06-16 21:13:03 +08:00
|
|
|
if (isMicroMips) {
|
|
|
|
LL = Mips::LL_MM;
|
|
|
|
SC = Mips::SC_MM;
|
|
|
|
} else {
|
2016-06-14 19:29:28 +08:00
|
|
|
LL = Subtarget.hasMips32r6()
|
|
|
|
? (ArePtrs64bit ? Mips::LL64_R6 : Mips::LL_R6)
|
|
|
|
: (ArePtrs64bit ? Mips::LL64 : Mips::LL);
|
|
|
|
SC = Subtarget.hasMips32r6()
|
|
|
|
? (ArePtrs64bit ? Mips::SC64_R6 : Mips::SC_R6)
|
|
|
|
: (ArePtrs64bit ? Mips::SC64 : Mips::SC);
|
2014-06-16 21:13:03 +08:00
|
|
|
}
|
2016-06-14 19:29:28 +08:00
|
|
|
|
2011-11-11 12:14:30 +08:00
|
|
|
AND = Mips::AND;
|
|
|
|
NOR = Mips::NOR;
|
|
|
|
ZERO = Mips::ZERO;
|
|
|
|
BEQ = Mips::BEQ;
|
2014-06-16 21:13:03 +08:00
|
|
|
} else {
|
2014-07-24 17:47:14 +08:00
|
|
|
LL = Subtarget.hasMips64r6() ? Mips::LLD_R6 : Mips::LLD;
|
|
|
|
SC = Subtarget.hasMips64r6() ? Mips::SCD_R6 : Mips::SCD;
|
2011-11-11 12:14:30 +08:00
|
|
|
AND = Mips::AND64;
|
|
|
|
NOR = Mips::NOR64;
|
|
|
|
ZERO = Mips::ZERO_64;
|
|
|
|
BEQ = Mips::BEQ64;
|
|
|
|
}
|
2011-05-31 10:54:07 +08:00
|
|
|
|
2016-07-01 06:52:52 +08:00
|
|
|
unsigned OldVal = MI.getOperand(0).getReg();
|
|
|
|
unsigned Ptr = MI.getOperand(1).getReg();
|
|
|
|
unsigned Incr = MI.getOperand(2).getReg();
|
2011-05-31 10:54:07 +08:00
|
|
|
|
2011-07-20 04:11:17 +08:00
|
|
|
unsigned StoreVal = RegInfo.createVirtualRegister(RC);
|
|
|
|
unsigned AndRes = RegInfo.createVirtualRegister(RC);
|
|
|
|
unsigned Success = RegInfo.createVirtualRegister(RC);
|
2011-05-31 10:54:07 +08:00
|
|
|
|
|
|
|
// insert new blocks after the current block
|
|
|
|
const BasicBlock *LLVM_BB = BB->getBasicBlock();
|
|
|
|
MachineBasicBlock *loopMBB = MF->CreateMachineBasicBlock(LLVM_BB);
|
|
|
|
MachineBasicBlock *exitMBB = MF->CreateMachineBasicBlock(LLVM_BB);
|
2015-10-20 08:15:20 +08:00
|
|
|
MachineFunction::iterator It = ++BB->getIterator();
|
2011-05-31 10:54:07 +08:00
|
|
|
MF->insert(It, loopMBB);
|
|
|
|
MF->insert(It, exitMBB);
|
|
|
|
|
|
|
|
// Transfer the remainder of BB and its successor edges to exitMBB.
|
|
|
|
exitMBB->splice(exitMBB->begin(), BB,
|
2014-03-02 20:27:27 +08:00
|
|
|
std::next(MachineBasicBlock::iterator(MI)), BB->end());
|
2011-05-31 10:54:07 +08:00
|
|
|
exitMBB->transferSuccessorsAndUpdatePHIs(BB);
|
|
|
|
|
|
|
|
// thisMBB:
|
|
|
|
// ...
|
|
|
|
// fallthrough --> loopMBB
|
|
|
|
BB->addSuccessor(loopMBB);
|
2011-07-20 01:09:53 +08:00
|
|
|
loopMBB->addSuccessor(loopMBB);
|
|
|
|
loopMBB->addSuccessor(exitMBB);
|
2011-05-31 10:54:07 +08:00
|
|
|
|
|
|
|
// loopMBB:
|
|
|
|
// ll oldval, 0(ptr)
|
2011-07-20 04:11:17 +08:00
|
|
|
// <binop> storeval, oldval, incr
|
|
|
|
// sc success, storeval, 0(ptr)
|
|
|
|
// beq success, $0, loopMBB
|
2011-05-31 10:54:07 +08:00
|
|
|
BB = loopMBB;
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(LL), OldVal).addReg(Ptr).addImm(0);
|
2011-05-31 10:54:07 +08:00
|
|
|
if (Nand) {
|
2011-07-20 04:11:17 +08:00
|
|
|
// and andres, oldval, incr
|
|
|
|
// nor storeval, $0, andres
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(AND), AndRes).addReg(OldVal).addReg(Incr);
|
|
|
|
BuildMI(BB, DL, TII->get(NOR), StoreVal).addReg(ZERO).addReg(AndRes);
|
2011-05-31 10:54:07 +08:00
|
|
|
} else if (BinOpcode) {
|
2011-07-20 04:11:17 +08:00
|
|
|
// <binop> storeval, oldval, incr
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(BinOpcode), StoreVal).addReg(OldVal).addReg(Incr);
|
2011-05-31 10:54:07 +08:00
|
|
|
} else {
|
2011-07-20 04:11:17 +08:00
|
|
|
StoreVal = Incr;
|
2011-05-31 10:54:07 +08:00
|
|
|
}
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(SC), Success).addReg(StoreVal).addReg(Ptr).addImm(0);
|
|
|
|
BuildMI(BB, DL, TII->get(BEQ)).addReg(Success).addReg(ZERO).addMBB(loopMBB);
|
2011-05-31 10:54:07 +08:00
|
|
|
|
2016-07-01 06:52:52 +08:00
|
|
|
MI.eraseFromParent(); // The instruction is gone now.
|
2011-05-31 10:54:07 +08:00
|
|
|
|
2011-07-19 11:42:13 +08:00
|
|
|
return exitMBB;
|
2011-05-31 10:54:07 +08:00
|
|
|
}
|
|
|
|
|
2014-06-16 21:13:03 +08:00
|
|
|
// Append to BB the instructions that sign-extend the low Size *bytes* of
// SrcReg to 32 bits, leaving the result in DstReg. Returns BB.
//
// When the subtarget reports hasMips32r2(), a single SEB (Size == 1) or SEH
// (Size == 2) is used. Otherwise the value is shifted left and then
// arithmetically shifted right by 32 - Size * 8 bits through a scratch
// register.
MachineBasicBlock *MipsTargetLowering::emitSignExtendToI32InReg(
    MachineInstr &MI, MachineBasicBlock *BB, unsigned Size, unsigned DstReg,
    unsigned SrcReg) const {
  const TargetInstrInfo *TII = Subtarget.getInstrInfo();
  const DebugLoc &DL = MI.getDebugLoc();

  if (Subtarget.hasMips32r2() && Size == 1) {
    BuildMI(BB, DL, TII->get(Mips::SEB), DstReg).addReg(SrcReg);
    return BB;
  }

  if (Subtarget.hasMips32r2() && Size == 2) {
    BuildMI(BB, DL, TII->get(Mips::SEH), DstReg).addReg(SrcReg);
    return BB;
  }

  MachineFunction *MF = BB->getParent();
  MachineRegisterInfo &RegInfo = MF->getRegInfo();
  const TargetRegisterClass *RC = getRegClassFor(MVT::i32);
  unsigned ScrReg = RegInfo.createVirtualRegister(RC);

  // Size counts bytes, not bits. Only 1..4 bytes yield a shift amount in the
  // range 0..24; zero bytes would ask for a shift of 32 and anything above
  // four bytes would make the subtraction below go out of range.
  assert(Size >= 1 && Size <= 4 &&
         "Size is in bytes and must fit in a 32-bit register");
  // Computed in signed arithmetic so an out-of-range Size cannot wrap around
  // to a large positive immediate in builds without assertions.
  const int64_t ShiftImm = 32 - static_cast<int64_t>(Size) * 8;

  BuildMI(BB, DL, TII->get(Mips::SLL), ScrReg).addReg(SrcReg).addImm(ShiftImm);
  BuildMI(BB, DL, TII->get(Mips::SRA), DstReg).addReg(ScrReg).addImm(ShiftImm);

  return BB;
}
|
|
|
|
|
|
|
|
MachineBasicBlock *MipsTargetLowering::emitAtomicBinaryPartword(
|
2016-07-01 06:52:52 +08:00
|
|
|
MachineInstr &MI, MachineBasicBlock *BB, unsigned Size, unsigned BinOpcode,
|
2014-06-16 21:13:03 +08:00
|
|
|
bool Nand) const {
|
2011-05-31 10:54:07 +08:00
|
|
|
assert((Size == 1 || Size == 2) &&
|
2013-10-08 03:33:02 +08:00
|
|
|
"Unsupported size for EmitAtomicBinaryPartial.");
|
2011-05-31 10:54:07 +08:00
|
|
|
|
|
|
|
MachineFunction *MF = BB->getParent();
|
|
|
|
MachineRegisterInfo &RegInfo = MF->getRegInfo();
|
|
|
|
const TargetRegisterClass *RC = getRegClassFor(MVT::i32);
|
2016-06-14 19:29:28 +08:00
|
|
|
const bool ArePtrs64bit = ABI.ArePtrs64bit();
|
2016-04-29 00:26:43 +08:00
|
|
|
const TargetRegisterClass *RCp =
|
|
|
|
getRegClassFor(ArePtrs64bit ? MVT::i64 : MVT::i32);
|
2015-01-30 07:27:36 +08:00
|
|
|
const TargetInstrInfo *TII = Subtarget.getInstrInfo();
|
2016-07-01 06:52:52 +08:00
|
|
|
DebugLoc DL = MI.getDebugLoc();
|
2011-05-31 10:54:07 +08:00
|
|
|
|
2016-07-01 06:52:52 +08:00
|
|
|
unsigned Dest = MI.getOperand(0).getReg();
|
|
|
|
unsigned Ptr = MI.getOperand(1).getReg();
|
|
|
|
unsigned Incr = MI.getOperand(2).getReg();
|
2011-05-31 10:54:07 +08:00
|
|
|
|
2016-04-29 00:26:43 +08:00
|
|
|
unsigned AlignedAddr = RegInfo.createVirtualRegister(RCp);
|
2011-07-20 04:11:17 +08:00
|
|
|
unsigned ShiftAmt = RegInfo.createVirtualRegister(RC);
|
2011-05-31 10:54:07 +08:00
|
|
|
unsigned Mask = RegInfo.createVirtualRegister(RC);
|
|
|
|
unsigned Mask2 = RegInfo.createVirtualRegister(RC);
|
2011-07-20 04:11:17 +08:00
|
|
|
unsigned NewVal = RegInfo.createVirtualRegister(RC);
|
|
|
|
unsigned OldVal = RegInfo.createVirtualRegister(RC);
|
2011-05-31 10:54:07 +08:00
|
|
|
unsigned Incr2 = RegInfo.createVirtualRegister(RC);
|
2016-04-29 00:26:43 +08:00
|
|
|
unsigned MaskLSB2 = RegInfo.createVirtualRegister(RCp);
|
2011-07-20 04:11:17 +08:00
|
|
|
unsigned PtrLSB2 = RegInfo.createVirtualRegister(RC);
|
|
|
|
unsigned MaskUpper = RegInfo.createVirtualRegister(RC);
|
|
|
|
unsigned AndRes = RegInfo.createVirtualRegister(RC);
|
|
|
|
unsigned BinOpRes = RegInfo.createVirtualRegister(RC);
|
2011-07-20 04:56:53 +08:00
|
|
|
unsigned MaskedOldVal0 = RegInfo.createVirtualRegister(RC);
|
2011-07-20 04:11:17 +08:00
|
|
|
unsigned StoreVal = RegInfo.createVirtualRegister(RC);
|
|
|
|
unsigned MaskedOldVal1 = RegInfo.createVirtualRegister(RC);
|
|
|
|
unsigned SrlRes = RegInfo.createVirtualRegister(RC);
|
|
|
|
unsigned Success = RegInfo.createVirtualRegister(RC);
|
2011-05-31 10:54:07 +08:00
|
|
|
|
2016-06-14 19:29:28 +08:00
|
|
|
unsigned LL, SC;
|
|
|
|
if (isMicroMips) {
|
|
|
|
LL = Mips::LL_MM;
|
|
|
|
SC = Mips::SC_MM;
|
|
|
|
} else {
|
|
|
|
LL = Subtarget.hasMips32r6() ? (ArePtrs64bit ? Mips::LL64_R6 : Mips::LL_R6)
|
|
|
|
: (ArePtrs64bit ? Mips::LL64 : Mips::LL);
|
|
|
|
SC = Subtarget.hasMips32r6() ? (ArePtrs64bit ? Mips::SC64_R6 : Mips::SC_R6)
|
|
|
|
: (ArePtrs64bit ? Mips::SC64 : Mips::SC);
|
|
|
|
}
|
|
|
|
|
2011-05-31 10:54:07 +08:00
|
|
|
// insert new blocks after the current block
|
|
|
|
const BasicBlock *LLVM_BB = BB->getBasicBlock();
|
|
|
|
MachineBasicBlock *loopMBB = MF->CreateMachineBasicBlock(LLVM_BB);
|
2011-07-19 11:42:13 +08:00
|
|
|
MachineBasicBlock *sinkMBB = MF->CreateMachineBasicBlock(LLVM_BB);
|
2011-05-31 10:54:07 +08:00
|
|
|
MachineBasicBlock *exitMBB = MF->CreateMachineBasicBlock(LLVM_BB);
|
2015-10-20 08:15:20 +08:00
|
|
|
MachineFunction::iterator It = ++BB->getIterator();
|
2011-05-31 10:54:07 +08:00
|
|
|
MF->insert(It, loopMBB);
|
2011-07-19 11:42:13 +08:00
|
|
|
MF->insert(It, sinkMBB);
|
2011-05-31 10:54:07 +08:00
|
|
|
MF->insert(It, exitMBB);
|
|
|
|
|
|
|
|
// Transfer the remainder of BB and its successor edges to exitMBB.
|
|
|
|
exitMBB->splice(exitMBB->begin(), BB,
|
2014-03-02 20:27:27 +08:00
|
|
|
std::next(MachineBasicBlock::iterator(MI)), BB->end());
|
2011-05-31 10:54:07 +08:00
|
|
|
exitMBB->transferSuccessorsAndUpdatePHIs(BB);
|
|
|
|
|
2011-07-20 01:09:53 +08:00
|
|
|
BB->addSuccessor(loopMBB);
|
|
|
|
loopMBB->addSuccessor(loopMBB);
|
|
|
|
loopMBB->addSuccessor(sinkMBB);
|
|
|
|
sinkMBB->addSuccessor(exitMBB);
|
|
|
|
|
2011-05-31 10:54:07 +08:00
|
|
|
// thisMBB:
|
2011-07-20 04:11:17 +08:00
|
|
|
// addiu masklsb2,$0,-4 # 0xfffffffc
|
|
|
|
// and alignedaddr,ptr,masklsb2
|
|
|
|
// andi ptrlsb2,ptr,3
|
|
|
|
// sll shiftamt,ptrlsb2,3
|
|
|
|
// ori maskupper,$0,255 # 0xff
|
|
|
|
// sll mask,maskupper,shiftamt
|
2011-05-31 10:54:07 +08:00
|
|
|
// nor mask2,$0,mask
|
2011-07-20 04:11:17 +08:00
|
|
|
// sll incr2,incr,shiftamt
|
2011-05-31 10:54:07 +08:00
|
|
|
|
|
|
|
int64_t MaskImm = (Size == 1) ? 255 : 65535;
|
2016-04-29 00:26:43 +08:00
|
|
|
BuildMI(BB, DL, TII->get(ABI.GetPtrAddiuOp()), MaskLSB2)
|
|
|
|
.addReg(ABI.GetNullPtr()).addImm(-4);
|
|
|
|
BuildMI(BB, DL, TII->get(ABI.GetPtrAndOp()), AlignedAddr)
|
2011-07-20 04:11:17 +08:00
|
|
|
.addReg(Ptr).addReg(MaskLSB2);
|
2016-04-29 00:26:43 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::ANDi), PtrLSB2)
|
|
|
|
.addReg(Ptr, 0, ArePtrs64bit ? Mips::sub_32 : 0).addImm(3);
|
2014-07-19 06:55:25 +08:00
|
|
|
if (Subtarget.isLittle()) {
|
2013-05-31 11:25:44 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::SLL), ShiftAmt).addReg(PtrLSB2).addImm(3);
|
|
|
|
} else {
|
|
|
|
unsigned Off = RegInfo.createVirtualRegister(RC);
|
|
|
|
BuildMI(BB, DL, TII->get(Mips::XORi), Off)
|
|
|
|
.addReg(PtrLSB2).addImm((Size == 1) ? 3 : 2);
|
|
|
|
BuildMI(BB, DL, TII->get(Mips::SLL), ShiftAmt).addReg(Off).addImm(3);
|
|
|
|
}
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::ORi), MaskUpper)
|
2011-07-20 04:11:17 +08:00
|
|
|
.addReg(Mips::ZERO).addImm(MaskImm);
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::SLLV), Mask)
|
2013-07-02 04:39:53 +08:00
|
|
|
.addReg(MaskUpper).addReg(ShiftAmt);
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::NOR), Mask2).addReg(Mips::ZERO).addReg(Mask);
|
2013-07-02 04:39:53 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::SLLV), Incr2).addReg(Incr).addReg(ShiftAmt);
|
2011-06-01 04:25:26 +08:00
|
|
|
|
2011-07-19 02:52:12 +08:00
|
|
|
// atomic.load.binop
|
2011-05-31 10:54:07 +08:00
|
|
|
// loopMBB:
|
2011-07-20 04:11:17 +08:00
|
|
|
// ll oldval,0(alignedaddr)
|
|
|
|
// binop binopres,oldval,incr2
|
|
|
|
// and newval,binopres,mask
|
|
|
|
// and maskedoldval0,oldval,mask2
|
|
|
|
// or storeval,maskedoldval0,newval
|
|
|
|
// sc success,storeval,0(alignedaddr)
|
|
|
|
// beq success,$0,loopMBB
|
|
|
|
|
2011-07-19 02:52:12 +08:00
|
|
|
// atomic.swap
|
|
|
|
// loopMBB:
|
2011-07-20 04:11:17 +08:00
|
|
|
// ll oldval,0(alignedaddr)
|
2011-07-20 02:14:26 +08:00
|
|
|
// and newval,incr2,mask
|
2011-07-20 04:11:17 +08:00
|
|
|
// and maskedoldval0,oldval,mask2
|
|
|
|
// or storeval,maskedoldval0,newval
|
|
|
|
// sc success,storeval,0(alignedaddr)
|
|
|
|
// beq success,$0,loopMBB
|
2011-07-19 02:52:12 +08:00
|
|
|
|
2011-05-31 10:54:07 +08:00
|
|
|
BB = loopMBB;
|
2014-12-19 00:39:29 +08:00
|
|
|
BuildMI(BB, DL, TII->get(LL), OldVal).addReg(AlignedAddr).addImm(0);
|
2011-05-31 10:54:07 +08:00
|
|
|
if (Nand) {
|
2011-07-20 04:11:17 +08:00
|
|
|
// and andres, oldval, incr2
|
|
|
|
// nor binopres, $0, andres
|
|
|
|
// and newval, binopres, mask
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::AND), AndRes).addReg(OldVal).addReg(Incr2);
|
|
|
|
BuildMI(BB, DL, TII->get(Mips::NOR), BinOpRes)
|
2011-07-20 04:11:17 +08:00
|
|
|
.addReg(Mips::ZERO).addReg(AndRes);
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::AND), NewVal).addReg(BinOpRes).addReg(Mask);
|
2011-05-31 10:54:07 +08:00
|
|
|
} else if (BinOpcode) {
|
2011-07-20 04:11:17 +08:00
|
|
|
// <binop> binopres, oldval, incr2
|
|
|
|
// and newval, binopres, mask
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(BinOpcode), BinOpRes).addReg(OldVal).addReg(Incr2);
|
|
|
|
BuildMI(BB, DL, TII->get(Mips::AND), NewVal).addReg(BinOpRes).addReg(Mask);
|
2013-10-08 03:33:02 +08:00
|
|
|
} else { // atomic.swap
|
2011-07-20 04:11:17 +08:00
|
|
|
// and newval, incr2, mask
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::AND), NewVal).addReg(Incr2).addReg(Mask);
|
2011-07-20 02:14:26 +08:00
|
|
|
}
|
2012-02-28 15:46:26 +08:00
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::AND), MaskedOldVal0)
|
2011-07-20 04:11:17 +08:00
|
|
|
.addReg(OldVal).addReg(Mask2);
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::OR), StoreVal)
|
2011-07-20 04:56:53 +08:00
|
|
|
.addReg(MaskedOldVal0).addReg(NewVal);
|
2014-12-19 00:39:29 +08:00
|
|
|
BuildMI(BB, DL, TII->get(SC), Success)
|
2011-07-20 04:11:17 +08:00
|
|
|
.addReg(StoreVal).addReg(AlignedAddr).addImm(0);
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::BEQ))
|
2011-07-20 04:11:17 +08:00
|
|
|
.addReg(Success).addReg(Mips::ZERO).addMBB(loopMBB);
|
2011-05-31 10:54:07 +08:00
|
|
|
|
2011-07-19 11:42:13 +08:00
|
|
|
// sinkMBB:
|
2011-07-20 04:11:17 +08:00
|
|
|
// and maskedoldval1,oldval,mask
|
|
|
|
// srl srlres,maskedoldval1,shiftamt
|
2014-06-16 21:13:03 +08:00
|
|
|
// sign_extend dest,srlres
|
2011-07-19 11:42:13 +08:00
|
|
|
BB = sinkMBB;
|
2011-07-19 11:14:58 +08:00
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::AND), MaskedOldVal1)
|
2011-07-20 04:11:17 +08:00
|
|
|
.addReg(OldVal).addReg(Mask);
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::SRLV), SrlRes)
|
2013-07-02 04:39:53 +08:00
|
|
|
.addReg(MaskedOldVal1).addReg(ShiftAmt);
|
2014-06-16 21:13:03 +08:00
|
|
|
BB = emitSignExtendToI32InReg(MI, BB, Size, Dest, SrlRes);
|
2011-05-31 10:54:07 +08:00
|
|
|
|
2016-07-01 06:52:52 +08:00
|
|
|
MI.eraseFromParent(); // The instruction is gone now.
|
2011-05-31 10:54:07 +08:00
|
|
|
|
2011-07-19 11:42:13 +08:00
|
|
|
return exitMBB;
|
2011-05-31 10:54:07 +08:00
|
|
|
}
|
|
|
|
|
2017-03-09 22:03:26 +08:00
|
|
|
// Expand a 4- or 8-byte atomic compare-and-swap pseudo into an LL/SC loop.
//
// Operand 0 of MI is the destination register, operand 1 the pointer,
// operand 2 the value to compare against and operand 3 the value to store.
// MI is erased; the returned block is the one that received every instruction
// that used to follow MI.
MachineBasicBlock *MipsTargetLowering::emitAtomicCmpSwap(MachineInstr &MI,
                                                         MachineBasicBlock *BB,
                                                         unsigned Size) const {
  assert((Size == 4 || Size == 8) && "Unsupported size for EmitAtomicCmpSwap.");

  MachineFunction *MF = BB->getParent();
  MachineRegisterInfo &RegInfo = MF->getRegInfo();
  const TargetRegisterClass *RC = getRegClassFor(MVT::getIntegerVT(Size * 8));
  const TargetInstrInfo *TII = Subtarget.getInstrInfo();
  const bool ArePtrs64bit = ABI.ArePtrs64bit();
  DebugLoc DL = MI.getDebugLoc();

  // Word-sized operations use the 32-bit opcodes and $zero; everything else
  // takes the 64-bit variants.
  const bool IsWord = (Size == 4);

  unsigned LL, SC;
  if (!IsWord) {
    LL = Subtarget.hasMips64r6() ? Mips::LLD_R6 : Mips::LLD;
    SC = Subtarget.hasMips64r6() ? Mips::SCD_R6 : Mips::SCD;
  } else if (isMicroMips) {
    LL = Mips::LL_MM;
    SC = Mips::SC_MM;
  } else if (Subtarget.hasMips32r6()) {
    LL = ArePtrs64bit ? Mips::LL64_R6 : Mips::LL_R6;
    SC = ArePtrs64bit ? Mips::SC64_R6 : Mips::SC_R6;
  } else {
    LL = ArePtrs64bit ? Mips::LL64 : Mips::LL;
    SC = ArePtrs64bit ? Mips::SC64 : Mips::SC;
  }
  const unsigned ZERO = IsWord ? Mips::ZERO : Mips::ZERO_64;
  const unsigned BNE = IsWord ? Mips::BNE : Mips::BNE64;
  const unsigned BEQ = IsWord ? Mips::BEQ : Mips::BEQ64;

  const unsigned Dest = MI.getOperand(0).getReg();
  const unsigned Ptr = MI.getOperand(1).getReg();
  const unsigned OldVal = MI.getOperand(2).getReg();
  const unsigned NewVal = MI.getOperand(3).getReg();

  const unsigned Success = RegInfo.createVirtualRegister(RC);

  // Create the two loop blocks and the exit block right after BB.
  const BasicBlock *LLVM_BB = BB->getBasicBlock();
  MachineBasicBlock *Loop1MBB = MF->CreateMachineBasicBlock(LLVM_BB);
  MachineBasicBlock *Loop2MBB = MF->CreateMachineBasicBlock(LLVM_BB);
  MachineBasicBlock *ExitMBB = MF->CreateMachineBasicBlock(LLVM_BB);
  MachineFunction::iterator InsertPt = ++BB->getIterator();
  MF->insert(InsertPt, Loop1MBB);
  MF->insert(InsertPt, Loop2MBB);
  MF->insert(InsertPt, ExitMBB);

  // Everything after MI, together with BB's successor edges, moves to the
  // exit block.
  ExitMBB->splice(ExitMBB->begin(), BB,
                  std::next(MachineBasicBlock::iterator(MI)), BB->end());
  ExitMBB->transferSuccessorsAndUpdatePHIs(BB);

  // The entry block falls through into loop1MBB.
  BB->addSuccessor(Loop1MBB);
  Loop1MBB->addSuccessor(ExitMBB);
  Loop1MBB->addSuccessor(Loop2MBB);
  Loop2MBB->addSuccessor(Loop1MBB);
  Loop2MBB->addSuccessor(ExitMBB);

  // loop1MBB:
  //   ll  dest,0(ptr)
  //   bne dest,oldval,exitMBB
  BuildMI(Loop1MBB, DL, TII->get(LL), Dest).addReg(Ptr).addImm(0);
  BuildMI(Loop1MBB, DL, TII->get(BNE))
      .addReg(Dest)
      .addReg(OldVal)
      .addMBB(ExitMBB);

  // loop2MBB:
  //   sc  success,newval,0(ptr)
  //   beq success,$0,loop1MBB
  BuildMI(Loop2MBB, DL, TII->get(SC), Success)
      .addReg(NewVal)
      .addReg(Ptr)
      .addImm(0);
  BuildMI(Loop2MBB, DL, TII->get(BEQ))
      .addReg(Success)
      .addReg(ZERO)
      .addMBB(Loop1MBB);

  MI.eraseFromParent(); // The pseudo has been fully expanded.

  return ExitMBB;
}
|
|
|
|
|
2016-07-01 06:52:52 +08:00
|
|
|
MachineBasicBlock *MipsTargetLowering::emitAtomicCmpSwapPartword(
|
|
|
|
MachineInstr &MI, MachineBasicBlock *BB, unsigned Size) const {
|
2011-05-31 10:54:07 +08:00
|
|
|
assert((Size == 1 || Size == 2) &&
|
|
|
|
"Unsupported size for EmitAtomicCmpSwapPartial.");
|
|
|
|
|
|
|
|
MachineFunction *MF = BB->getParent();
|
|
|
|
MachineRegisterInfo &RegInfo = MF->getRegInfo();
|
|
|
|
const TargetRegisterClass *RC = getRegClassFor(MVT::i32);
|
2016-06-14 19:29:28 +08:00
|
|
|
const bool ArePtrs64bit = ABI.ArePtrs64bit();
|
2016-04-14 00:02:25 +08:00
|
|
|
const TargetRegisterClass *RCp =
|
|
|
|
getRegClassFor(ArePtrs64bit ? MVT::i64 : MVT::i32);
|
2015-01-30 07:27:36 +08:00
|
|
|
const TargetInstrInfo *TII = Subtarget.getInstrInfo();
|
2016-07-01 06:52:52 +08:00
|
|
|
DebugLoc DL = MI.getDebugLoc();
|
2011-05-31 10:54:07 +08:00
|
|
|
|
2016-07-01 06:52:52 +08:00
|
|
|
unsigned Dest = MI.getOperand(0).getReg();
|
|
|
|
unsigned Ptr = MI.getOperand(1).getReg();
|
|
|
|
unsigned CmpVal = MI.getOperand(2).getReg();
|
|
|
|
unsigned NewVal = MI.getOperand(3).getReg();
|
2011-05-31 10:54:07 +08:00
|
|
|
|
2016-04-14 00:02:25 +08:00
|
|
|
unsigned AlignedAddr = RegInfo.createVirtualRegister(RCp);
|
2011-07-20 04:11:17 +08:00
|
|
|
unsigned ShiftAmt = RegInfo.createVirtualRegister(RC);
|
2011-05-31 10:54:07 +08:00
|
|
|
unsigned Mask = RegInfo.createVirtualRegister(RC);
|
|
|
|
unsigned Mask2 = RegInfo.createVirtualRegister(RC);
|
2011-07-20 04:11:17 +08:00
|
|
|
unsigned ShiftedCmpVal = RegInfo.createVirtualRegister(RC);
|
2017-03-09 22:03:26 +08:00
|
|
|
unsigned OldVal = RegInfo.createVirtualRegister(RC);
|
|
|
|
unsigned MaskedOldVal0 = RegInfo.createVirtualRegister(RC);
|
2011-07-20 04:11:17 +08:00
|
|
|
unsigned ShiftedNewVal = RegInfo.createVirtualRegister(RC);
|
2016-04-14 00:02:25 +08:00
|
|
|
unsigned MaskLSB2 = RegInfo.createVirtualRegister(RCp);
|
2011-07-20 04:11:17 +08:00
|
|
|
unsigned PtrLSB2 = RegInfo.createVirtualRegister(RC);
|
|
|
|
unsigned MaskUpper = RegInfo.createVirtualRegister(RC);
|
|
|
|
unsigned MaskedCmpVal = RegInfo.createVirtualRegister(RC);
|
|
|
|
unsigned MaskedNewVal = RegInfo.createVirtualRegister(RC);
|
2017-03-09 22:03:26 +08:00
|
|
|
unsigned MaskedOldVal1 = RegInfo.createVirtualRegister(RC);
|
|
|
|
unsigned StoreVal = RegInfo.createVirtualRegister(RC);
|
|
|
|
unsigned SrlRes = RegInfo.createVirtualRegister(RC);
|
|
|
|
unsigned Success = RegInfo.createVirtualRegister(RC);
|
|
|
|
unsigned LL, SC;
|
|
|
|
|
|
|
|
if (isMicroMips) {
|
|
|
|
LL = Mips::LL_MM;
|
|
|
|
SC = Mips::SC_MM;
|
|
|
|
} else {
|
|
|
|
LL = Subtarget.hasMips32r6() ? (ArePtrs64bit ? Mips::LL64_R6 : Mips::LL_R6)
|
|
|
|
: (ArePtrs64bit ? Mips::LL64 : Mips::LL);
|
|
|
|
SC = Subtarget.hasMips32r6() ? (ArePtrs64bit ? Mips::SC64_R6 : Mips::SC_R6)
|
|
|
|
: (ArePtrs64bit ? Mips::SC64 : Mips::SC);
|
|
|
|
}
|
2011-05-31 10:54:07 +08:00
|
|
|
|
|
|
|
// insert new blocks after the current block
|
|
|
|
const BasicBlock *LLVM_BB = BB->getBasicBlock();
|
2017-03-09 22:03:26 +08:00
|
|
|
MachineBasicBlock *loop1MBB = MF->CreateMachineBasicBlock(LLVM_BB);
|
|
|
|
MachineBasicBlock *loop2MBB = MF->CreateMachineBasicBlock(LLVM_BB);
|
|
|
|
MachineBasicBlock *sinkMBB = MF->CreateMachineBasicBlock(LLVM_BB);
|
2011-05-31 10:54:07 +08:00
|
|
|
MachineBasicBlock *exitMBB = MF->CreateMachineBasicBlock(LLVM_BB);
|
2015-10-20 08:15:20 +08:00
|
|
|
MachineFunction::iterator It = ++BB->getIterator();
|
2017-03-09 22:03:26 +08:00
|
|
|
MF->insert(It, loop1MBB);
|
|
|
|
MF->insert(It, loop2MBB);
|
|
|
|
MF->insert(It, sinkMBB);
|
2011-05-31 10:54:07 +08:00
|
|
|
MF->insert(It, exitMBB);
|
|
|
|
|
|
|
|
// Transfer the remainder of BB and its successor edges to exitMBB.
|
|
|
|
exitMBB->splice(exitMBB->begin(), BB,
|
2014-03-02 20:27:27 +08:00
|
|
|
std::next(MachineBasicBlock::iterator(MI)), BB->end());
|
2011-05-31 10:54:07 +08:00
|
|
|
exitMBB->transferSuccessorsAndUpdatePHIs(BB);
|
|
|
|
|
2017-03-09 22:03:26 +08:00
|
|
|
BB->addSuccessor(loop1MBB);
|
|
|
|
loop1MBB->addSuccessor(sinkMBB);
|
|
|
|
loop1MBB->addSuccessor(loop2MBB);
|
|
|
|
loop2MBB->addSuccessor(loop1MBB);
|
|
|
|
loop2MBB->addSuccessor(sinkMBB);
|
|
|
|
sinkMBB->addSuccessor(exitMBB);
|
2011-07-20 01:09:53 +08:00
|
|
|
|
2011-07-20 02:14:26 +08:00
|
|
|
// FIXME: computation of newval2 can be moved to loop2MBB.
|
2011-05-31 10:54:07 +08:00
|
|
|
// thisMBB:
|
2011-07-20 04:11:17 +08:00
|
|
|
// addiu masklsb2,$0,-4 # 0xfffffffc
|
|
|
|
// and alignedaddr,ptr,masklsb2
|
|
|
|
// andi ptrlsb2,ptr,3
|
2016-04-14 00:02:25 +08:00
|
|
|
// xori ptrlsb2,ptrlsb2,3 # Only for BE
|
2011-07-20 04:11:17 +08:00
|
|
|
// sll shiftamt,ptrlsb2,3
|
|
|
|
// ori maskupper,$0,255 # 0xff
|
|
|
|
// sll mask,maskupper,shiftamt
|
2011-05-31 10:54:07 +08:00
|
|
|
// nor mask2,$0,mask
|
2011-07-20 04:11:17 +08:00
|
|
|
// andi maskedcmpval,cmpval,255
|
|
|
|
// sll shiftedcmpval,maskedcmpval,shiftamt
|
|
|
|
// andi maskednewval,newval,255
|
|
|
|
// sll shiftednewval,maskednewval,shiftamt
|
2011-05-31 10:54:07 +08:00
|
|
|
int64_t MaskImm = (Size == 1) ? 255 : 65535;
|
2016-04-14 00:02:25 +08:00
|
|
|
BuildMI(BB, DL, TII->get(ArePtrs64bit ? Mips::DADDiu : Mips::ADDiu), MaskLSB2)
|
|
|
|
.addReg(ABI.GetNullPtr()).addImm(-4);
|
|
|
|
BuildMI(BB, DL, TII->get(ArePtrs64bit ? Mips::AND64 : Mips::AND), AlignedAddr)
|
2011-07-20 04:11:17 +08:00
|
|
|
.addReg(Ptr).addReg(MaskLSB2);
|
2016-04-14 00:02:25 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::ANDi), PtrLSB2)
|
|
|
|
.addReg(Ptr, 0, ArePtrs64bit ? Mips::sub_32 : 0).addImm(3);
|
2014-07-19 06:55:25 +08:00
|
|
|
if (Subtarget.isLittle()) {
|
2013-05-31 11:25:44 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::SLL), ShiftAmt).addReg(PtrLSB2).addImm(3);
|
|
|
|
} else {
|
|
|
|
unsigned Off = RegInfo.createVirtualRegister(RC);
|
|
|
|
BuildMI(BB, DL, TII->get(Mips::XORi), Off)
|
|
|
|
.addReg(PtrLSB2).addImm((Size == 1) ? 3 : 2);
|
|
|
|
BuildMI(BB, DL, TII->get(Mips::SLL), ShiftAmt).addReg(Off).addImm(3);
|
|
|
|
}
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::ORi), MaskUpper)
|
2011-07-20 04:11:17 +08:00
|
|
|
.addReg(Mips::ZERO).addImm(MaskImm);
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::SLLV), Mask)
|
2013-07-02 04:39:53 +08:00
|
|
|
.addReg(MaskUpper).addReg(ShiftAmt);
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::NOR), Mask2).addReg(Mips::ZERO).addReg(Mask);
|
|
|
|
BuildMI(BB, DL, TII->get(Mips::ANDi), MaskedCmpVal)
|
2011-07-20 04:11:17 +08:00
|
|
|
.addReg(CmpVal).addImm(MaskImm);
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::SLLV), ShiftedCmpVal)
|
2013-07-02 04:39:53 +08:00
|
|
|
.addReg(MaskedCmpVal).addReg(ShiftAmt);
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::ANDi), MaskedNewVal)
|
2011-07-20 04:11:17 +08:00
|
|
|
.addReg(NewVal).addImm(MaskImm);
|
2013-03-12 08:16:36 +08:00
|
|
|
BuildMI(BB, DL, TII->get(Mips::SLLV), ShiftedNewVal)
|
2013-07-02 04:39:53 +08:00
|
|
|
.addReg(MaskedNewVal).addReg(ShiftAmt);
|
2011-05-31 10:54:07 +08:00
|
|
|
|
2017-03-09 22:03:26 +08:00
|
|
|
// loop1MBB:
|
|
|
|
// ll oldval,0(alginedaddr)
|
|
|
|
// and maskedoldval0,oldval,mask
|
|
|
|
// bne maskedoldval0,shiftedcmpval,sinkMBB
|
|
|
|
BB = loop1MBB;
|
|
|
|
BuildMI(BB, DL, TII->get(LL), OldVal).addReg(AlignedAddr).addImm(0);
|
|
|
|
BuildMI(BB, DL, TII->get(Mips::AND), MaskedOldVal0)
|
|
|
|
.addReg(OldVal).addReg(Mask);
|
|
|
|
BuildMI(BB, DL, TII->get(Mips::BNE))
|
|
|
|
.addReg(MaskedOldVal0).addReg(ShiftedCmpVal).addMBB(sinkMBB);
|
|
|
|
|
|
|
|
// loop2MBB:
|
|
|
|
// and maskedoldval1,oldval,mask2
|
|
|
|
// or storeval,maskedoldval1,shiftednewval
|
|
|
|
// sc success,storeval,0(alignedaddr)
|
|
|
|
// beq success,$0,loop1MBB
|
|
|
|
BB = loop2MBB;
|
|
|
|
BuildMI(BB, DL, TII->get(Mips::AND), MaskedOldVal1)
|
|
|
|
.addReg(OldVal).addReg(Mask2);
|
|
|
|
BuildMI(BB, DL, TII->get(Mips::OR), StoreVal)
|
|
|
|
.addReg(MaskedOldVal1).addReg(ShiftedNewVal);
|
|
|
|
BuildMI(BB, DL, TII->get(SC), Success)
|
|
|
|
.addReg(StoreVal).addReg(AlignedAddr).addImm(0);
|
|
|
|
BuildMI(BB, DL, TII->get(Mips::BEQ))
|
|
|
|
.addReg(Success).addReg(Mips::ZERO).addMBB(loop1MBB);
|
|
|
|
|
|
|
|
// sinkMBB:
|
|
|
|
// srl srlres,maskedoldval0,shiftamt
|
|
|
|
// sign_extend dest,srlres
|
|
|
|
BB = sinkMBB;
|
|
|
|
|
|
|
|
BuildMI(BB, DL, TII->get(Mips::SRLV), SrlRes)
|
|
|
|
.addReg(MaskedOldVal0).addReg(ShiftAmt);
|
|
|
|
BB = emitSignExtendToI32InReg(MI, BB, Size, Dest, SrlRes);
|
2011-05-31 10:54:07 +08:00
|
|
|
|
2016-07-01 06:52:52 +08:00
|
|
|
MI.eraseFromParent(); // The instruction is gone now.
|
2011-05-31 10:54:07 +08:00
|
|
|
|
2011-07-19 11:42:13 +08:00
|
|
|
return exitMBB;
|
2011-05-31 10:54:07 +08:00
|
|
|
}
|
|
|
|
|
2016-07-01 06:52:52 +08:00
|
|
|
// Rewrite the condition operand (operand 1) of MI so that it refers to a
// 64-bit FGR64 register. A SUBREG_TO_REG placing the original condition
// register in the sub_lo sub-register is inserted in front of MI. MI itself
// is kept; only its operand is redirected. Returns BB.
MachineBasicBlock *MipsTargetLowering::emitSEL_D(MachineInstr &MI,
                                                 MachineBasicBlock *BB) const {
  const TargetRegisterInfo *TRI = Subtarget.getRegisterInfo();
  const TargetInstrInfo *TII = Subtarget.getInstrInfo();
  MachineRegisterInfo &RegInfo = BB->getParent()->getRegInfo();
  DebugLoc DL = MI.getDebugLoc();
  MachineBasicBlock::iterator InsertPos(MI);

  const unsigned CondReg = MI.getOperand(1).getReg();

  const TargetRegisterClass *FGR64RC = TRI->getRegClass(Mips::FGR64RegClassID);
  const unsigned CondReg64 = RegInfo.createVirtualRegister(FGR64RC);

  BuildMI(*BB, InsertPos, DL, TII->get(Mips::SUBREG_TO_REG), CondReg64)
      .addImm(0)
      .addReg(CondReg)
      .addImm(Mips::sub_lo);

  // The original instruction stays in place; it now reads the condition from
  // the 64-bit super-register.
  MI.getOperand(1).setReg(CondReg64);

  return BB;
}
|
|
|
|
|
2016-09-09 19:06:01 +08:00
|
|
|
// Lower a conditional branch whose condition comes from a floating point
// comparison into a MipsISD::FPBrcond node. Op's operands are the chain (0),
// the condition (1) and the destination block (2). When the condition is not
// a floating point comparison, Op is returned unchanged.
SDValue MipsTargetLowering::lowerBRCOND(SDValue Op, SelectionDAG &DAG) const {
  SDValue Chain = Op.getOperand(0);
  SDValue Target = Op.getOperand(2);
  SDLoc DL(Op);

  assert(!Subtarget.hasMips32r6() && !Subtarget.hasMips64r6());
  SDValue FPCond = createFPCmp(DAG, Op.getOperand(1));

  // Nothing to do unless the flag is produced by a floating point compare.
  if (FPCond.getOpcode() != MipsISD::FPCmp)
    return Op;

  // Operand 2 of the compare carries the condition code as a constant.
  ConstantSDNode *CCConst = cast<ConstantSDNode>(FPCond.getOperand(2));
  const Mips::CondCode CC =
      static_cast<Mips::CondCode>(CCConst->getZExtValue());

  unsigned BranchOpc = Mips::BRANCH_T;
  if (invertFPCondCodeUser(CC))
    BranchOpc = Mips::BRANCH_F;

  SDValue BrCode = DAG.getConstant(BranchOpc, DL, MVT::i32);
  SDValue FCC0 = DAG.getRegister(Mips::FCC0, MVT::i32);
  return DAG.getNode(MipsISD::FPBrcond, DL, Op.getValueType(), Chain, BrCode,
                     FCC0, Target, FPCond);
}
|
|
|
|
|
|
|
|
// Lower a select whose condition (operand 0) comes from a floating point
// comparison into a conditional move built by createCMovFP. Operands 1 and 2
// are the values selected between. When the condition is not a floating point
// comparison, Op is returned unchanged.
SDValue MipsTargetLowering::lowerSELECT(SDValue Op, SelectionDAG &DAG) const {
  assert(!Subtarget.hasMips32r6() && !Subtarget.hasMips64r6());
  SDValue FPCond = createFPCmp(DAG, Op.getOperand(0));

  // Nothing to do unless the flag is produced by a floating point compare.
  const bool IsFPCompare = FPCond.getOpcode() == MipsISD::FPCmp;
  if (!IsFPCompare)
    return Op;

  SDValue TrueVal = Op.getOperand(1);
  SDValue FalseVal = Op.getOperand(2);
  return createCMovFP(DAG, FPCond, TrueVal, FalseVal, SDLoc(Op));
}
|
|
|
|
|
|
|
|
// Lower a floating point setcc: build the FP comparison for Op and select
// between the i32 constants 1 and 0 with createCMovFP.
SDValue MipsTargetLowering::lowerSETCC(SDValue Op, SelectionDAG &DAG) const {
  assert(!Subtarget.hasMips32r6() && !Subtarget.hasMips64r6());
  SDValue FPCond = createFPCmp(DAG, Op);

  assert(FPCond.getOpcode() == MipsISD::FPCmp &&
         "Floating point operand expected.");

  SDLoc DL(Op);
  SDValue One = DAG.getConstant(1, DL, MVT::i32);
  SDValue Zero = DAG.getConstant(0, DL, MVT::i32);

  return createCMovFP(DAG, FPCond, One, Zero, DL);
}
|
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
// Lower a global address node, choosing the addressing sequence from the
// relocation model, the section the global lives in, its linkage and the GOT
// configuration.
SDValue MipsTargetLowering::lowerGlobalAddress(SDValue Op,
                                               SelectionDAG &DAG) const {
  EVT Ty = Op.getValueType();
  GlobalAddressSDNode *N = cast<GlobalAddressSDNode>(Op);
  const GlobalValue *GV = N->getGlobal();
  SDLoc DL(N);

  if (!isPositionIndependent()) {
    const MipsTargetObjectFile *TLOF =
        static_cast<const MipsTargetObjectFile *>(
            getTargetMachine().getObjFileLowering());
    const GlobalObject *GO = GV->getBaseObject();

    // Globals placed in the small data section: %gp_rel relocation.
    if (GO && TLOF->IsGlobalInSmallSection(GO, getTargetMachine()))
      return getAddrGPRel(N, DL, Ty, DAG);

    // 32-bit symbols: %hi/%lo relocation.
    if (Subtarget.hasSym32())
      return getAddrNonPIC(N, DL, Ty, DAG);

    // 64-bit symbols: %highest/%higher/%hi/%lo relocation.
    return getAddrNonPICSym64(N, DL, Ty, DAG);
  }

  // Other architectures would consult shouldAssumeDSOLocal at this point, but
  // that does not work for mips:
  // * PIC code on mips needs got loads even for local statics.
  // * To economise on got entries, the entry for a local static holds only
  //   the page; a separate add instruction supplies the low bits.
  // * A hidden symbol may legally be accessed through a non hidden undefined
  //   reference, so not every access to a hidden symbol can be assumed to
  //   know that the symbol is hidden.
  // * Mips linkers cannot create both a page entry and a full got entry for
  //   one and the same symbol.
  // * Consequently hidden symbols have to use a full got entry, and only
  //   symbols with local linkage take the page-based path below.
  const bool IsN32OrN64 = ABI.IsN32() || ABI.IsN64();
  if (GV->hasLocalLinkage())
    return getAddrLocal(N, DL, Ty, DAG, IsN32OrN64);

  if (LargeGOT)
    return getAddrGlobalLargeGOT(
        N, DL, Ty, DAG, MipsII::MO_GOT_HI16, MipsII::MO_GOT_LO16,
        DAG.getEntryNode(),
        MachinePointerInfo::getGOT(DAG.getMachineFunction()));

  const auto GOTFlag = IsN32OrN64 ? MipsII::MO_GOT_DISP : MipsII::MO_GOT;
  return getAddrGlobal(N, DL, Ty, DAG, GOTFlag, DAG.getEntryNode(),
                       MachinePointerInfo::getGOT(DAG.getMachineFunction()));
}
|
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
// Lower a block address node. Position independent code goes through
// getAddrLocal; otherwise the non-PIC sequence matching the symbol width
// (32-bit or 64-bit symbols) is used.
SDValue MipsTargetLowering::lowerBlockAddress(SDValue Op,
                                              SelectionDAG &DAG) const {
  BlockAddressSDNode *N = cast<BlockAddressSDNode>(Op);
  EVT Ty = Op.getValueType();
  SDLoc DL(N);

  if (isPositionIndependent())
    return getAddrLocal(N, DL, Ty, DAG, ABI.IsN32() || ABI.IsN64());

  if (Subtarget.hasSym32())
    return getAddrNonPIC(N, DL, Ty, DAG);

  return getAddrNonPICSym64(N, DL, Ty, DAG);
}
|
|
|
|
|
2008-07-30 03:29:50 +08:00
|
|
|
SDValue MipsTargetLowering::
|
2013-03-12 08:16:36 +08:00
|
|
|
lowerGlobalTLSAddress(SDValue Op, SelectionDAG &DAG) const
|
2008-07-30 03:29:50 +08:00
|
|
|
{
|
2011-12-15 02:26:41 +08:00
|
|
|
// If the relocation model is PIC, use the General Dynamic TLS Model or
|
|
|
|
// Local Dynamic TLS model, otherwise use the Initial Exec or
|
|
|
|
// Local Exec TLS Model.
|
2011-05-31 10:53:58 +08:00
|
|
|
|
|
|
|
GlobalAddressSDNode *GA = cast<GlobalAddressSDNode>(Op);
|
2015-07-29 00:24:05 +08:00
|
|
|
if (DAG.getTarget().Options.EmulatedTLS)
|
|
|
|
return LowerToTLSEmulatedModel(GA, DAG);
|
|
|
|
|
2013-05-25 10:42:55 +08:00
|
|
|
SDLoc DL(GA);
|
2011-05-31 10:53:58 +08:00
|
|
|
const GlobalValue *GV = GA->getGlobal();
|
2015-07-09 10:09:04 +08:00
|
|
|
EVT PtrVT = getPointerTy(DAG.getDataLayout());
|
2011-05-31 10:53:58 +08:00
|
|
|
|
2012-05-04 17:40:39 +08:00
|
|
|
TLSModel::Model model = getTargetMachine().getTLSModel(GV);
|
|
|
|
|
|
|
|
if (model == TLSModel::GeneralDynamic || model == TLSModel::LocalDynamic) {
|
2012-06-04 22:02:08 +08:00
|
|
|
// General Dynamic and Local Dynamic TLS Model.
|
|
|
|
unsigned Flag = (model == TLSModel::LocalDynamic) ? MipsII::MO_TLSLDM
|
|
|
|
: MipsII::MO_TLSGD;
|
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
SDValue TGA = DAG.getTargetGlobalAddress(GV, DL, PtrVT, 0, Flag);
|
|
|
|
SDValue Argument = DAG.getNode(MipsISD::Wrapper, DL, PtrVT,
|
|
|
|
getGlobalReg(DAG, PtrVT), TGA);
|
2011-12-09 05:05:38 +08:00
|
|
|
unsigned PtrSize = PtrVT.getSizeInBits();
|
|
|
|
IntegerType *PtrTy = Type::getIntNTy(*DAG.getContext(), PtrSize);
|
|
|
|
|
2011-12-11 20:21:34 +08:00
|
|
|
SDValue TlsGetAddr = DAG.getExternalSymbol("__tls_get_addr", PtrVT);
|
2011-05-31 10:53:58 +08:00
|
|
|
|
|
|
|
ArgListTy Args;
|
|
|
|
ArgListEntry Entry;
|
|
|
|
Entry.Node = Argument;
|
2011-12-09 04:34:32 +08:00
|
|
|
Entry.Ty = PtrTy;
|
2011-05-31 10:53:58 +08:00
|
|
|
Args.push_back(Entry);
|
2012-02-28 15:46:26 +08:00
|
|
|
|
2014-05-18 05:50:17 +08:00
|
|
|
TargetLowering::CallLoweringInfo CLI(DAG);
|
2017-03-18 08:44:07 +08:00
|
|
|
CLI.setDebugLoc(DL)
|
|
|
|
.setChain(DAG.getEntryNode())
|
|
|
|
.setLibCallee(CallingConv::C, PtrTy, TlsGetAddr, std::move(Args));
|
2012-05-26 00:35:28 +08:00
|
|
|
std::pair<SDValue, SDValue> CallResult = LowerCallTo(CLI);
|
2011-05-31 10:53:58 +08:00
|
|
|
|
2011-12-15 02:26:41 +08:00
|
|
|
SDValue Ret = CallResult.first;
|
|
|
|
|
2012-05-04 17:40:39 +08:00
|
|
|
if (model != TLSModel::LocalDynamic)
|
2011-12-15 02:26:41 +08:00
|
|
|
return Ret;
|
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
SDValue TGAHi = DAG.getTargetGlobalAddress(GV, DL, PtrVT, 0,
|
2011-12-15 02:26:41 +08:00
|
|
|
MipsII::MO_DTPREL_HI);
|
2013-03-12 08:16:36 +08:00
|
|
|
SDValue Hi = DAG.getNode(MipsISD::Hi, DL, PtrVT, TGAHi);
|
|
|
|
SDValue TGALo = DAG.getTargetGlobalAddress(GV, DL, PtrVT, 0,
|
2011-12-15 02:26:41 +08:00
|
|
|
MipsII::MO_DTPREL_LO);
|
2013-03-12 08:16:36 +08:00
|
|
|
SDValue Lo = DAG.getNode(MipsISD::Lo, DL, PtrVT, TGALo);
|
|
|
|
SDValue Add = DAG.getNode(ISD::ADD, DL, PtrVT, Hi, Ret);
|
|
|
|
return DAG.getNode(ISD::ADD, DL, PtrVT, Add, Lo);
|
2011-06-21 09:02:03 +08:00
|
|
|
}
|
2011-05-31 10:53:58 +08:00
|
|
|
|
2011-06-21 09:02:03 +08:00
|
|
|
SDValue Offset;
|
2012-05-04 17:40:39 +08:00
|
|
|
if (model == TLSModel::InitialExec) {
|
2011-06-21 09:02:03 +08:00
|
|
|
// Initial Exec TLS Model
|
2013-03-12 08:16:36 +08:00
|
|
|
SDValue TGA = DAG.getTargetGlobalAddress(GV, DL, PtrVT, 0,
|
2011-06-21 09:02:03 +08:00
|
|
|
MipsII::MO_GOTTPREL);
|
2013-03-12 08:16:36 +08:00
|
|
|
TGA = DAG.getNode(MipsISD::Wrapper, DL, PtrVT, getGlobalReg(DAG, PtrVT),
|
2012-02-25 06:34:47 +08:00
|
|
|
TGA);
|
[SelectionDAG] Get rid of bool parameters in SelectionDAG::getLoad, getStore, and friends.
Summary:
Instead, we take a single flags arg (a bitset).
Also add a default 0 alignment, and change the order of arguments so the
alignment comes before the flags.
This greatly simplifies many callsites, and fixes a bug in
AMDGPUISelLowering, wherein the order of the args to getLoad was
inverted. It also greatly simplifies the process of adding another flag
to getLoad.
Reviewers: chandlerc, tstellarAMD
Subscribers: jholewinski, arsenm, jyknight, dsanders, nemanjai, llvm-commits
Differential Revision: http://reviews.llvm.org/D22249
llvm-svn: 275592
2016-07-16 02:27:10 +08:00
|
|
|
Offset =
|
|
|
|
DAG.getLoad(PtrVT, DL, DAG.getEntryNode(), TGA, MachinePointerInfo());
|
2011-06-21 09:02:03 +08:00
|
|
|
} else {
|
|
|
|
// Local Exec TLS Model
|
2012-05-04 17:40:39 +08:00
|
|
|
assert(model == TLSModel::LocalExec);
|
2013-03-12 08:16:36 +08:00
|
|
|
SDValue TGAHi = DAG.getTargetGlobalAddress(GV, DL, PtrVT, 0,
|
2011-06-21 09:02:03 +08:00
|
|
|
MipsII::MO_TPREL_HI);
|
2013-03-12 08:16:36 +08:00
|
|
|
SDValue TGALo = DAG.getTargetGlobalAddress(GV, DL, PtrVT, 0,
|
2011-06-21 09:02:03 +08:00
|
|
|
MipsII::MO_TPREL_LO);
|
2013-03-12 08:16:36 +08:00
|
|
|
SDValue Hi = DAG.getNode(MipsISD::Hi, DL, PtrVT, TGAHi);
|
|
|
|
SDValue Lo = DAG.getNode(MipsISD::Lo, DL, PtrVT, TGALo);
|
|
|
|
Offset = DAG.getNode(ISD::ADD, DL, PtrVT, Hi, Lo);
|
2011-05-31 10:53:58 +08:00
|
|
|
}
|
2011-06-21 09:02:03 +08:00
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
SDValue ThreadPointer = DAG.getNode(MipsISD::ThreadPointer, DL, PtrVT);
|
|
|
|
return DAG.getNode(ISD::ADD, DL, PtrVT, ThreadPointer, Offset);
|
2008-07-30 03:29:50 +08:00
|
|
|
}
|
|
|
|
|
2008-07-28 05:46:04 +08:00
|
|
|
// Lower a JumpTable node to an address computation.
//
// Position-independent code goes through getAddrLocal (its last argument is
// true for the N32 and N64 ABIs). Otherwise the non-PIC helper is chosen by
// whether the subtarget reports hasSym32().
SDValue MipsTargetLowering::
lowerJumpTable(SDValue Op, SelectionDAG &DAG) const
{
  JumpTableSDNode *JT = cast<JumpTableSDNode>(Op);
  EVT PtrTy = Op.getValueType();

  if (isPositionIndependent())
    return getAddrLocal(JT, SDLoc(JT), PtrTy, DAG,
                        ABI.IsN32() || ABI.IsN64());

  if (Subtarget.hasSym32())
    return getAddrNonPIC(JT, SDLoc(JT), PtrTy, DAG);

  return getAddrNonPICSym64(JT, SDLoc(JT), PtrTy, DAG);
}
|
|
|
|
|
2008-07-28 05:46:04 +08:00
|
|
|
// Lower a ConstantPool node to an address computation.
//
// Position-independent code goes through getAddrLocal (its last argument is
// true for the N32 and N64 ABIs). For non-PIC code, a constant that the
// target object file places in the small section is addressed with
// getAddrGPRel; anything else uses the non-PIC helper selected by hasSym32().
SDValue MipsTargetLowering::
lowerConstantPool(SDValue Op, SelectionDAG &DAG) const
{
  ConstantPoolSDNode *CP = cast<ConstantPoolSDNode>(Op);
  EVT PtrTy = Op.getValueType();

  if (isPositionIndependent())
    return getAddrLocal(CP, SDLoc(CP), PtrTy, DAG,
                        ABI.IsN32() || ABI.IsN64());

  const MipsTargetObjectFile *ObjFile =
      static_cast<const MipsTargetObjectFile *>(
          getTargetMachine().getObjFileLowering());

  const bool InSmallSection = ObjFile->IsConstantInSmallSection(
      DAG.getDataLayout(), CP->getConstVal(), getTargetMachine());

  // %gp_rel relocation
  if (InSmallSection)
    return getAddrGPRel(CP, SDLoc(CP), PtrTy, DAG);

  if (Subtarget.hasSym32())
    return getAddrNonPIC(CP, SDLoc(CP), PtrTy, DAG);

  return getAddrNonPICSym64(CP, SDLoc(CP), PtrTy, DAG);
}
|
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
// Lower VASTART: store the address of the function's VarArgsFrameIndex slot
// into the memory location given by operand 1, chained on operand 0.
// Operand 2 carries the source Value used for the store's pointer info.
SDValue MipsTargetLowering::lowerVASTART(SDValue Op, SelectionDAG &DAG) const {
  MachineFunction &MF = DAG.getMachineFunction();
  MipsFunctionInfo *MipsFI = MF.getInfo<MipsFunctionInfo>();
  SDLoc DL(Op);

  // Frame-index node for the first variadic argument slot, typed as a pointer.
  SDValue VarArgsAddr = DAG.getFrameIndex(MipsFI->getVarArgsFrameIndex(),
                                          getPointerTy(MF.getDataLayout()));

  SDValue Chain = Op.getOperand(0);
  SDValue VAListPtr = Op.getOperand(1);
  const Value *SrcVal = cast<SrcValueSDNode>(Op.getOperand(2))->getValue();

  return DAG.getStore(Chain, DL, VarArgsAddr, VAListPtr,
                      MachinePointerInfo(SrcVal));
}
|
2012-02-28 15:46:26 +08:00
|
|
|
|
2014-08-01 17:17:39 +08:00
|
|
|
// Lower VAARG: load the current va_list pointer, optionally re-align it,
// store back the pointer advanced past this argument, and load the argument.
//
// Operands read from the node: 0 = chain, 1 = pointer to the va_list,
// 2 = source Value for pointer info, 3 = requested alignment (constant).
SDValue MipsTargetLowering::lowerVAARG(SDValue Op, SelectionDAG &DAG) const {
  SDNode *Node = Op.getNode();
  EVT VT = Node->getValueType(0);
  SDValue InChain = Node->getOperand(0);
  SDValue VAListPtr = Node->getOperand(1);
  unsigned Align = Node->getConstantOperandVal(3);
  const Value *SrcVal = cast<SrcValueSDNode>(Node->getOperand(2))->getValue();
  SDLoc DL(Node);

  // Argument slots are 8 bytes for N32/N64 and 4 bytes otherwise.
  const bool IsN32OrN64 = ABI.IsN32() || ABI.IsN64();
  unsigned SlotBytes = IsN32OrN64 ? 8 : 4;

  SDValue VAListLoad = DAG.getLoad(getPointerTy(DAG.getDataLayout()), DL,
                                   InChain, VAListPtr,
                                   MachinePointerInfo(SrcVal));
  SDValue Cursor = VAListLoad;

  // Re-align the pointer if necessary.
  // It should only ever be necessary for 64-bit types on O32 since the minimum
  // argument alignment is the same as the maximum type alignment for N32/N64.
  //
  // FIXME: We currently align too often. The code generator doesn't notice
  //        when the pointer is still aligned from the last va_arg (or pair of
  //        va_args for the i64 on O32 case).
  if (Align > getMinStackArgumentAlignment()) {
    assert(((Align & (Align-1)) == 0) && "Expected Align to be a power of 2");

    // Cursor = (Cursor + Align - 1) & -Align
    SDValue RoundUp = DAG.getConstant(Align - 1, DL, Cursor.getValueType());
    Cursor = DAG.getNode(ISD::ADD, DL, Cursor.getValueType(), Cursor, RoundUp);

    SDValue AlignMask = DAG.getConstant(-static_cast<int64_t>(Align), DL,
                                        Cursor.getValueType());
    Cursor =
        DAG.getNode(ISD::AND, DL, Cursor.getValueType(), Cursor, AlignMask);
  }

  // Increment the pointer to the next vaarg: the argument's alloc size
  // rounded up to a whole number of slots.
  auto &Layout = DAG.getDataLayout();
  unsigned ArgBytes =
      Layout.getTypeAllocSize(VT.getTypeForEVT(*DAG.getContext()));
  SDValue Stride = DAG.getConstant(alignTo(ArgBytes, SlotBytes), DL,
                                   Cursor.getValueType());
  SDValue NextCursor =
      DAG.getNode(ISD::ADD, DL, Cursor.getValueType(), Cursor, Stride);

  // Store the incremented pointer back through the legalized va_list pointer,
  // chained after the load of the old value.
  SDValue OutChain = DAG.getStore(VAListLoad.getValue(1), DL, NextCursor,
                                  VAListPtr, MachinePointerInfo(SrcVal));

  // In big-endian mode we must adjust the pointer when the load size is smaller
  // than the argument slot size. For example in the N64 ABI, we must add 4
  // bytes to the offset to get the correct half of the slot.
  const bool IsBigEndian = !Subtarget.isLittle();
  if (IsBigEndian && ArgBytes < SlotBytes) {
    unsigned Adjustment = SlotBytes - ArgBytes;
    SDValue AdjustBy = DAG.getIntPtrConstant(Adjustment, DL);
    Cursor =
        DAG.getNode(ISD::ADD, DL, VAListPtr.getValueType(), Cursor, AdjustBy);
  }

  // Load the actual argument out of the (possibly adjusted) pointer.
  return DAG.getLoad(VT, DL, OutChain, Cursor, MachinePointerInfo());
}
|
|
|
|
|
2013-10-10 07:36:17 +08:00
|
|
|
// Lower FCOPYSIGN using 32-bit integer operations.
//
// Operand 0 supplies the magnitude, operand 1 the sign. Each operand is
// reduced to an i32 word (a bitcast for f32, element 1 of the f64 otherwise),
// bit 31 of the sign word replaces bit 31 of the magnitude word, and the
// result is converted back to the type of operand 0.
static SDValue lowerFCOPYSIGN32(SDValue Op, SelectionDAG &DAG,
                                bool HasExtractInsert) {
  SDValue Mag = Op.getOperand(0);
  SDValue Sgn = Op.getOperand(1);
  SDLoc DL(Op);
  SDValue Const1 = DAG.getConstant(1, DL, MVT::i32);
  SDValue Const31 = DAG.getConstant(31, DL, MVT::i32);

  // If operand is of type f64, extract the upper 32-bit. Otherwise, bitcast it
  // to i32.
  auto getSignWord = [&](SDValue V) -> SDValue {
    if (V.getValueType() == MVT::f32)
      return DAG.getNode(ISD::BITCAST, DL, MVT::i32, V);
    return DAG.getNode(MipsISD::ExtractElementF64, DL, MVT::i32, V, Const1);
  };

  SDValue X = getSignWord(Mag);
  SDValue Y = getSignWord(Sgn);

  SDValue Merged;
  if (HasExtractInsert) {
    // ext  E, Y, 31, 1  ; extract bit31 of Y
    // ins  X, E, 31, 1  ; insert extracted bit at bit31 of X
    SDValue SignBit =
        DAG.getNode(MipsISD::Ext, DL, MVT::i32, Y, Const31, Const1);
    Merged =
        DAG.getNode(MipsISD::Ins, DL, MVT::i32, SignBit, Const31, Const1, X);
  } else {
    // sll SllX, X, 1
    // srl SrlX, SllX, 1
    // srl SrlY, Y, 31
    // sll SllY, SrlY, 31
    // or  Or, SrlX, SllY
    SDValue SllX = DAG.getNode(ISD::SHL, DL, MVT::i32, X, Const1);
    SDValue SrlX = DAG.getNode(ISD::SRL, DL, MVT::i32, SllX, Const1);
    SDValue SrlY = DAG.getNode(ISD::SRL, DL, MVT::i32, Y, Const31);
    SDValue SllY = DAG.getNode(ISD::SHL, DL, MVT::i32, SrlY, Const31);
    Merged = DAG.getNode(ISD::OR, DL, MVT::i32, SrlX, SllY);
  }

  // f32 result: the merged word is the whole value.
  if (Mag.getValueType() == MVT::f32)
    return DAG.getNode(ISD::BITCAST, DL, Mag.getValueType(), Merged);

  // f64 result: pair element 0 of the original magnitude with the merged word.
  SDValue Const0 = DAG.getConstant(0, DL, MVT::i32);
  SDValue LowX =
      DAG.getNode(MipsISD::ExtractElementF64, DL, MVT::i32, Mag, Const0);
  return DAG.getNode(MipsISD::BuildPairF64, DL, MVT::f64, LowX, Merged);
}
|
2011-05-26 03:32:07 +08:00
|
|
|
|
2013-10-10 07:36:17 +08:00
|
|
|
// Lower FCOPYSIGN by bitcasting each operand to an integer of its own width.
//
// Operand 0 supplies the magnitude, operand 1 the sign. The top bit of the
// sign operand is isolated, resized to the magnitude's width if the two
// widths differ, and placed in the top bit of the magnitude. The result is
// bitcast back to the type of operand 0.
static SDValue lowerFCOPYSIGN64(SDValue Op, SelectionDAG &DAG,
                                bool HasExtractInsert) {
  unsigned WidthX = Op.getOperand(0).getValueSizeInBits();
  unsigned WidthY = Op.getOperand(1).getValueSizeInBits();
  EVT TyX = MVT::getIntegerVT(WidthX);
  EVT TyY = MVT::getIntegerVT(WidthY);
  SDLoc DL(Op);
  SDValue Const1 = DAG.getConstant(1, DL, MVT::i32);

  // Bitcast to integer nodes.
  SDValue X = DAG.getNode(ISD::BITCAST, DL, TyX, Op.getOperand(0));
  SDValue Y = DAG.getNode(ISD::BITCAST, DL, TyY, Op.getOperand(1));

  // Resize a TyY value to TyX; returns the value unchanged for equal widths.
  auto resizeToX = [&](SDValue V) -> SDValue {
    if (WidthX > WidthY)
      return DAG.getNode(ISD::ZERO_EXTEND, DL, TyX, V);
    if (WidthY > WidthX)
      return DAG.getNode(ISD::TRUNCATE, DL, TyX, V);
    return V;
  };

  SDValue Merged;
  if (HasExtractInsert) {
    // ext  E, Y, width(Y) - 1, 1  ; extract bit width(Y)-1 of Y
    // ins  X, E, width(X) - 1, 1  ; insert extracted bit at bit width(X)-1 of X
    SDValue SignPosY = DAG.getConstant(WidthY - 1, DL, MVT::i32);
    SDValue SignBit = DAG.getNode(MipsISD::Ext, DL, TyY, Y, SignPosY, Const1);

    SignBit = resizeToX(SignBit);

    SDValue SignPosX = DAG.getConstant(WidthX - 1, DL, MVT::i32);
    Merged =
        DAG.getNode(MipsISD::Ins, DL, TyX, SignBit, SignPosX, Const1, X);
  } else {
    // (d)sll SllX, X, 1
    // (d)srl SrlX, SllX, 1
    // (d)srl SrlY, Y, width(Y)-1
    // (d)sll SllY, SrlY, width(X)-1
    // or     Or, SrlX, SllY
    SDValue SllX = DAG.getNode(ISD::SHL, DL, TyX, X, Const1);
    SDValue SrlX = DAG.getNode(ISD::SRL, DL, TyX, SllX, Const1);

    SDValue SignPosY = DAG.getConstant(WidthY - 1, DL, MVT::i32);
    SDValue SrlY = DAG.getNode(ISD::SRL, DL, TyY, Y, SignPosY);

    SrlY = resizeToX(SrlY);

    SDValue SignPosX = DAG.getConstant(WidthX - 1, DL, MVT::i32);
    SDValue SllY = DAG.getNode(ISD::SHL, DL, TyX, SrlY, SignPosX);
    Merged = DAG.getNode(ISD::OR, DL, TyX, SrlX, SllY);
  }

  return DAG.getNode(ISD::BITCAST, DL, Op.getOperand(0).getValueType(),
                     Merged);
}
|
|
|
|
|
2011-12-20 03:52:25 +08:00
|
|
|
// Lower FCOPYSIGN, dispatching on whether the subtarget has 64-bit general
// purpose registers. Both helpers are told whether ext/ins are available.
SDValue
MipsTargetLowering::lowerFCOPYSIGN(SDValue Op, SelectionDAG &DAG) const {
  const bool UseGP64 = Subtarget.isGP64bit();
  const bool HasExtIns = Subtarget.hasExtractInsert();

  return UseGP64 ? lowerFCOPYSIGN64(Op, DAG, HasExtIns)
                 : lowerFCOPYSIGN32(Op, DAG, HasExtIns);
}
|
|
|
|
|
2011-06-02 08:24:44 +08:00
|
|
|
// Lower FRAMEADDR for the current frame (depth 0 only, checked by assert):
// mark the frame address as taken and return a copy of the frame pointer
// register (FP_64 under the N64 ABI, FP otherwise).
SDValue MipsTargetLowering::
lowerFRAMEADDR(SDValue Op, SelectionDAG &DAG) const {
  // check the depth
  assert((cast<ConstantSDNode>(Op.getOperand(0))->getZExtValue() == 0) &&
         "Frame address can only be determined for current frame.");

  DAG.getMachineFunction().getFrameInfo().setFrameAddressIsTaken(true);

  const unsigned FrameReg = ABI.IsN64() ? Mips::FP_64 : Mips::FP;
  return DAG.getCopyFromReg(DAG.getEntryNode(), SDLoc(Op), FrameReg,
                            Op.getValueType());
}
|
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
// Lower RETURNADDR for the current frame (depth 0 only, checked by assert).
// Returns an empty SDValue when verifyReturnAddressArgumentIsConstant()
// reports a problem with the argument.
SDValue MipsTargetLowering::lowerRETURNADDR(SDValue Op,
                                            SelectionDAG &DAG) const {
  if (verifyReturnAddressArgumentIsConstant(Op, DAG))
    return SDValue();

  // check the depth
  assert((cast<ConstantSDNode>(Op.getOperand(0))->getZExtValue() == 0) &&
         "Return address can be determined only for current frame.");

  MachineFunction &MF = DAG.getMachineFunction();
  MVT ResultTy = Op.getSimpleValueType();
  const unsigned RetAddrReg = ABI.IsN64() ? Mips::RA_64 : Mips::RA;

  MF.getFrameInfo().setReturnAddressIsTaken(true);

  // Return RA, which contains the return address. Mark it an implicit live-in.
  unsigned LiveInReg = MF.addLiveIn(RetAddrReg, getRegClassFor(ResultTy));
  return DAG.getCopyFromReg(DAG.getEntryNode(), SDLoc(Op), LiveInReg,
                            ResultTy);
}
|
|
|
|
|
2013-01-30 08:26:49 +08:00
|
|
|
// An EH_RETURN is the result of lowering llvm.eh.return which in turn is
|
|
|
|
// generated from __builtin_eh_return (offset, handler)
|
|
|
|
// The effect of this is to adjust the stack pointer by "offset"
|
|
|
|
// and then branch to "handler".
|
2013-03-12 08:16:36 +08:00
|
|
|
SDValue MipsTargetLowering::lowerEH_RETURN(SDValue Op, SelectionDAG &DAG)
|
2013-01-30 08:26:49 +08:00
|
|
|
const {
|
|
|
|
MachineFunction &MF = DAG.getMachineFunction();
|
|
|
|
MipsFunctionInfo *MipsFI = MF.getInfo<MipsFunctionInfo>();
|
|
|
|
|
|
|
|
MipsFI->setCallsEhReturn();
|
|
|
|
SDValue Chain = Op.getOperand(0);
|
|
|
|
SDValue Offset = Op.getOperand(1);
|
|
|
|
SDValue Handler = Op.getOperand(2);
|
2013-05-25 10:42:55 +08:00
|
|
|
SDLoc DL(Op);
|
2015-01-30 07:27:36 +08:00
|
|
|
EVT Ty = ABI.IsN64() ? MVT::i64 : MVT::i32;
|
2013-01-30 08:26:49 +08:00
|
|
|
|
|
|
|
// Store stack offset in V1, store jump target in V0. Glue CopyToReg and
|
|
|
|
// EH_RETURN nodes, so that instructions are emitted back-to-back.
|
2015-01-30 07:27:36 +08:00
|
|
|
unsigned OffsetReg = ABI.IsN64() ? Mips::V1_64 : Mips::V1;
|
|
|
|
unsigned AddrReg = ABI.IsN64() ? Mips::V0_64 : Mips::V0;
|
2013-01-30 08:26:49 +08:00
|
|
|
Chain = DAG.getCopyToReg(Chain, DL, OffsetReg, Offset, SDValue());
|
|
|
|
Chain = DAG.getCopyToReg(Chain, DL, AddrReg, Handler, Chain.getValue(1));
|
|
|
|
return DAG.getNode(MipsISD::EH_RETURN, DL, MVT::Other, Chain,
|
|
|
|
DAG.getRegister(OffsetReg, Ty),
|
2015-07-09 10:09:04 +08:00
|
|
|
DAG.getRegister(AddrReg, getPointerTy(MF.getDataLayout())),
|
2013-01-30 08:26:49 +08:00
|
|
|
Chain.getValue(1));
|
|
|
|
}
|
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
// Lower ATOMIC_FENCE to a MipsISD::Sync node on the incoming chain, always
// with an stype operand of 0.
SDValue MipsTargetLowering::lowerATOMIC_FENCE(SDValue Op,
                                              SelectionDAG &DAG) const {
  // FIXME: Need pseudo-fence for 'singlethread' fences
  // FIXME: Set SType for weaker fences where supported/appropriate.
  const unsigned SyncType = 0;
  SDLoc DL(Op);

  SDValue SyncTypeOp = DAG.getConstant(SyncType, DL, MVT::i32);
  return DAG.getNode(MipsISD::Sync, DL, MVT::Other, Op.getOperand(0),
                     SyncTypeOp);
}
|
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
// Lower a two-part left shift. Operands: 0 = low part, 1 = high part,
// 2 = shift amount. Each part is i64 on GP64 subtargets and i32 otherwise.
// Returns the merged pair {lo, hi}.
SDValue MipsTargetLowering::lowerShiftLeftParts(SDValue Op,
                                                SelectionDAG &DAG) const {
  SDLoc DL(Op);
  MVT PartVT = Subtarget.isGP64bit() ? MVT::i64 : MVT::i32;

  SDValue LoIn = Op.getOperand(0);
  SDValue HiIn = Op.getOperand(1);
  SDValue Shamt = Op.getOperand(2);

  // if shamt < (VT.bits):
  //  lo = (shl lo, shamt)
  //  hi = (or (shl hi, shamt) (srl (srl lo, 1), ~shamt))
  // else:
  //  lo = 0
  //  hi = (shl lo, shamt[4:0])
  SDValue AllOnes = DAG.getConstant(-1, DL, MVT::i32);
  SDValue NotShamt = DAG.getNode(ISD::XOR, DL, MVT::i32, Shamt, AllOnes);

  // Bits of lo that cross into hi: (lo >> 1) >> ~shamt.
  SDValue One = DAG.getConstant(1, DL, PartVT);
  SDValue LoSrl1 = DAG.getNode(ISD::SRL, DL, PartVT, LoIn, One);
  SDValue LoCarry = DAG.getNode(ISD::SRL, DL, PartVT, LoSrl1, NotShamt);

  SDValue HiShl = DAG.getNode(ISD::SHL, DL, PartVT, HiIn, Shamt);
  SDValue HiInRange = DAG.getNode(ISD::OR, DL, PartVT, HiShl, LoCarry);
  SDValue LoShl = DAG.getNode(ISD::SHL, DL, PartVT, LoIn, Shamt);

  // Non-zero exactly when the bit of shamt equal to the part width is set.
  SDValue WidthBit = DAG.getConstant(PartVT.getSizeInBits(), DL, MVT::i32);
  SDValue IsWide = DAG.getNode(ISD::AND, DL, MVT::i32, Shamt, WidthBit);

  SDValue Zero = DAG.getConstant(0, DL, PartVT);
  SDValue LoOut = DAG.getNode(ISD::SELECT, DL, PartVT, IsWide, Zero, LoShl);
  SDValue HiOut =
      DAG.getNode(ISD::SELECT, DL, PartVT, IsWide, LoShl, HiInRange);

  SDValue Parts[2] = {LoOut, HiOut};
  return DAG.getMergeValues(Parts, DL);
}
|
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
// Lower a two-part right shift. Operands: 0 = low part, 1 = high part,
// 2 = shift amount. IsSRA selects an arithmetic shift, otherwise logical.
// Each part is i64 on GP64 subtargets and i32 otherwise.
// Returns the merged pair {lo, hi}.
SDValue MipsTargetLowering::lowerShiftRightParts(SDValue Op, SelectionDAG &DAG,
                                                 bool IsSRA) const {
  SDLoc DL(Op);
  SDValue LoIn = Op.getOperand(0);
  SDValue HiIn = Op.getOperand(1);
  SDValue Shamt = Op.getOperand(2);
  MVT PartVT = Subtarget.isGP64bit() ? MVT::i64 : MVT::i32;

  // if shamt < (VT.bits):
  //  lo = (or (shl (shl hi, 1), ~shamt) (srl lo, shamt))
  //  if isSRA:
  //    hi = (sra hi, shamt)
  //  else:
  //    hi = (srl hi, shamt)
  // else:
  //  if isSRA:
  //   lo = (sra hi, shamt[4:0])
  //   hi = (sra hi, VT.bits - 1)
  //  else:
  //   lo = (srl hi, shamt[4:0])
  //   hi = 0
  SDValue AllOnes = DAG.getConstant(-1, DL, MVT::i32);
  SDValue NotShamt = DAG.getNode(ISD::XOR, DL, MVT::i32, Shamt, AllOnes);

  // Bits of hi that cross into lo: (hi << 1) << ~shamt.
  SDValue One = DAG.getConstant(1, DL, PartVT);
  SDValue HiShl1 = DAG.getNode(ISD::SHL, DL, PartVT, HiIn, One);
  SDValue HiCarry = DAG.getNode(ISD::SHL, DL, PartVT, HiShl1, NotShamt);

  SDValue LoSrl = DAG.getNode(ISD::SRL, DL, PartVT, LoIn, Shamt);
  SDValue LoInRange = DAG.getNode(ISD::OR, DL, PartVT, HiCarry, LoSrl);

  const unsigned HiShiftOpc = IsSRA ? ISD::SRA : ISD::SRL;
  SDValue HiShifted = DAG.getNode(HiShiftOpc, DL, PartVT, HiIn, Shamt);

  // Non-zero exactly when the bit of shamt equal to the part width is set.
  SDValue WidthBit = DAG.getConstant(PartVT.getSizeInBits(), DL, MVT::i32);
  SDValue IsWide = DAG.getNode(ISD::AND, DL, MVT::i32, Shamt, WidthBit);

  // Sign fill of hi; built unconditionally, only selected when IsSRA.
  SDValue TopBitPos = DAG.getConstant(PartVT.getSizeInBits() - 1, DL, PartVT);
  SDValue SignFill = DAG.getNode(ISD::SRA, DL, PartVT, HiIn, TopBitPos);

  SDValue LoOut =
      DAG.getNode(ISD::SELECT, DL, PartVT, IsWide, HiShifted, LoInRange);

  SDValue HiWhenWide = SignFill;
  if (!IsSRA)
    HiWhenWide = DAG.getConstant(0, DL, PartVT);
  SDValue HiOut =
      DAG.getNode(ISD::SELECT, DL, PartVT, IsWide, HiWhenWide, HiShifted);

  SDValue Parts[2] = {LoOut, HiOut};
  return DAG.getMergeValues(Parts, DL);
}
|
|
|
|
|
2013-04-12 03:07:14 +08:00
|
|
|
// Build a memory-intrinsic node with opcode Opc for one half of an unaligned
// load of LD. The node's operands are {Chain, address, Src}, where the address
// is LD's base pointer plus Offset (no ADD is emitted when Offset is 0). The
// node produces LD's value type plus a chain and reuses LD's memory VT and
// memory operand.
static SDValue createLoadLR(unsigned Opc, SelectionDAG &DAG, LoadSDNode *LD,
                            SDValue Chain, SDValue Src, unsigned Offset) {
  SDLoc DL(LD);
  SDValue Addr = LD->getBasePtr();
  EVT AddrVT = Addr.getValueType();
  SDVTList ResultTys = DAG.getVTList(LD->getValueType(0), MVT::Other);

  if (Offset != 0) {
    SDValue Disp = DAG.getConstant(Offset, DL, AddrVT);
    Addr = DAG.getNode(ISD::ADD, DL, AddrVT, Addr, Disp);
  }

  SDValue Ops[] = { Chain, Addr, Src };
  return DAG.getMemIntrinsicNode(Opc, DL, ResultTys, Ops, LD->getMemoryVT(),
                                 LD->getMemOperand());
}
|
|
|
|
|
|
|
|
// Expand an unaligned 32 or 64-bit integer load node.
|
2013-03-12 08:16:36 +08:00
|
|
|
SDValue MipsTargetLowering::lowerLOAD(SDValue Op, SelectionDAG &DAG) const {
|
2012-06-02 08:03:49 +08:00
|
|
|
LoadSDNode *LD = cast<LoadSDNode>(Op);
|
|
|
|
EVT MemVT = LD->getMemoryVT();
|
|
|
|
|
2014-07-19 06:55:25 +08:00
|
|
|
if (Subtarget.systemSupportsUnalignedAccess())
|
2014-05-23 21:18:02 +08:00
|
|
|
return Op;
|
|
|
|
|
2012-06-02 08:03:49 +08:00
|
|
|
// Return if load is aligned or if MemVT is neither i32 nor i64.
|
|
|
|
if ((LD->getAlignment() >= MemVT.getSizeInBits() / 8) ||
|
|
|
|
((MemVT != MVT::i32) && (MemVT != MVT::i64)))
|
|
|
|
return SDValue();
|
|
|
|
|
2014-07-19 06:55:25 +08:00
|
|
|
bool IsLittle = Subtarget.isLittle();
|
2012-06-02 08:03:49 +08:00
|
|
|
EVT VT = Op.getValueType();
|
|
|
|
ISD::LoadExtType ExtType = LD->getExtensionType();
|
|
|
|
SDValue Chain = LD->getChain(), Undef = DAG.getUNDEF(VT);
|
|
|
|
|
|
|
|
assert((VT == MVT::i32) || (VT == MVT::i64));
|
|
|
|
|
|
|
|
// Expand
|
|
|
|
// (set dst, (i64 (load baseptr)))
|
|
|
|
// to
|
|
|
|
// (set tmp, (ldl (add baseptr, 7), undef))
|
|
|
|
// (set dst, (ldr baseptr, tmp))
|
|
|
|
if ((VT == MVT::i64) && (ExtType == ISD::NON_EXTLOAD)) {
|
2013-04-12 03:07:14 +08:00
|
|
|
SDValue LDL = createLoadLR(MipsISD::LDL, DAG, LD, Chain, Undef,
|
2012-06-02 08:03:49 +08:00
|
|
|
IsLittle ? 7 : 0);
|
2013-04-12 03:07:14 +08:00
|
|
|
return createLoadLR(MipsISD::LDR, DAG, LD, LDL.getValue(1), LDL,
|
2012-06-02 08:03:49 +08:00
|
|
|
IsLittle ? 0 : 7);
|
|
|
|
}
|
|
|
|
|
2013-04-12 03:07:14 +08:00
|
|
|
SDValue LWL = createLoadLR(MipsISD::LWL, DAG, LD, Chain, Undef,
|
2012-06-02 08:03:49 +08:00
|
|
|
IsLittle ? 3 : 0);
|
2013-04-12 03:07:14 +08:00
|
|
|
SDValue LWR = createLoadLR(MipsISD::LWR, DAG, LD, LWL.getValue(1), LWL,
|
2012-06-02 08:03:49 +08:00
|
|
|
IsLittle ? 0 : 3);
|
|
|
|
|
|
|
|
// Expand
|
|
|
|
// (set dst, (i32 (load baseptr))) or
|
|
|
|
// (set dst, (i64 (sextload baseptr))) or
|
|
|
|
// (set dst, (i64 (extload baseptr)))
|
|
|
|
// to
|
|
|
|
// (set tmp, (lwl (add baseptr, 3), undef))
|
|
|
|
// (set dst, (lwr baseptr, tmp))
|
|
|
|
if ((VT == MVT::i32) || (ExtType == ISD::SEXTLOAD) ||
|
|
|
|
(ExtType == ISD::EXTLOAD))
|
|
|
|
return LWR;
|
|
|
|
|
|
|
|
assert((VT == MVT::i64) && (ExtType == ISD::ZEXTLOAD));
|
|
|
|
|
|
|
|
// Expand
|
|
|
|
// (set dst, (i64 (zextload baseptr)))
|
|
|
|
// to
|
|
|
|
// (set tmp0, (lwl (add baseptr, 3), undef))
|
|
|
|
// (set tmp1, (lwr baseptr, tmp0))
|
|
|
|
// (set tmp2, (shl tmp1, 32))
|
|
|
|
// (set dst, (srl tmp2, 32))
|
2013-05-25 10:42:55 +08:00
|
|
|
SDLoc DL(LD);
|
2015-04-28 22:05:47 +08:00
|
|
|
SDValue Const32 = DAG.getConstant(32, DL, MVT::i32);
|
2012-06-02 08:03:49 +08:00
|
|
|
SDValue SLL = DAG.getNode(ISD::SHL, DL, MVT::i64, LWR, Const32);
|
2012-06-05 01:46:29 +08:00
|
|
|
SDValue SRL = DAG.getNode(ISD::SRL, DL, MVT::i64, SLL, Const32);
|
|
|
|
SDValue Ops[] = { SRL, LWR.getValue(1) };
|
2014-04-28 03:20:57 +08:00
|
|
|
return DAG.getMergeValues(Ops, DL);
|
2012-06-02 08:03:49 +08:00
|
|
|
}
|
|
|
|
|
2013-04-12 03:07:14 +08:00
|
|
|
// Build a memory-intrinsic node with opcode Opc for one half of an unaligned
// store of SD. The node's operands are {Chain, stored value, address}, where
// the address is SD's base pointer plus Offset (no ADD is emitted when Offset
// is 0). The node produces only a chain and reuses SD's memory VT and memory
// operand.
static SDValue createStoreLR(unsigned Opc, SelectionDAG &DAG, StoreSDNode *SD,
                             SDValue Chain, unsigned Offset) {
  SDLoc DL(SD);
  SDValue Addr = SD->getBasePtr();
  SDValue StoredVal = SD->getValue();
  EVT AddrVT = Addr.getValueType();
  SDVTList ResultTys = DAG.getVTList(MVT::Other);

  if (Offset != 0) {
    SDValue Disp = DAG.getConstant(Offset, DL, AddrVT);
    Addr = DAG.getNode(ISD::ADD, DL, AddrVT, Addr, Disp);
  }

  SDValue Ops[] = { Chain, StoredVal, Addr };
  return DAG.getMemIntrinsicNode(Opc, DL, ResultTys, Ops, SD->getMemoryVT(),
                                 SD->getMemOperand());
}
|
|
|
|
|
|
|
|
// Expand an unaligned 32 or 64-bit integer store node.
|
2013-05-17 04:45:17 +08:00
|
|
|
static SDValue lowerUnalignedIntStore(StoreSDNode *SD, SelectionDAG &DAG,
|
|
|
|
bool IsLittle) {
|
2012-06-02 08:03:49 +08:00
|
|
|
SDValue Value = SD->getValue(), Chain = SD->getChain();
|
|
|
|
EVT VT = Value.getValueType();
|
|
|
|
|
|
|
|
// Expand
|
|
|
|
// (store val, baseptr) or
|
|
|
|
// (truncstore val, baseptr)
|
|
|
|
// to
|
|
|
|
// (swl val, (add baseptr, 3))
|
|
|
|
// (swr val, baseptr)
|
|
|
|
if ((VT == MVT::i32) || SD->isTruncatingStore()) {
|
2013-04-12 03:07:14 +08:00
|
|
|
SDValue SWL = createStoreLR(MipsISD::SWL, DAG, SD, Chain,
|
2012-06-02 08:03:49 +08:00
|
|
|
IsLittle ? 3 : 0);
|
2013-04-12 03:07:14 +08:00
|
|
|
return createStoreLR(MipsISD::SWR, DAG, SD, SWL, IsLittle ? 0 : 3);
|
2012-06-02 08:03:49 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
assert(VT == MVT::i64);
|
|
|
|
|
|
|
|
// Expand
|
|
|
|
// (store val, baseptr)
|
|
|
|
// to
|
|
|
|
// (sdl val, (add baseptr, 7))
|
|
|
|
// (sdr val, baseptr)
|
2013-04-12 03:07:14 +08:00
|
|
|
SDValue SDL = createStoreLR(MipsISD::SDL, DAG, SD, Chain, IsLittle ? 7 : 0);
|
|
|
|
return createStoreLR(MipsISD::SDR, DAG, SD, SDL, IsLittle ? 0 : 7);
|
2012-06-02 08:03:49 +08:00
|
|
|
}
|
|
|
|
|
2013-05-17 05:17:15 +08:00
|
|
|
// Lower (store (fp_to_sint $fp) $ptr) to (store (TruncIntFP $fp), $ptr).
|
|
|
|
static SDValue lowerFP_TO_SINT_STORE(StoreSDNode *SD, SelectionDAG &DAG) {
|
|
|
|
SDValue Val = SD->getValue();
|
|
|
|
|
|
|
|
if (Val.getOpcode() != ISD::FP_TO_SINT)
|
|
|
|
return SDValue();
|
|
|
|
|
|
|
|
EVT FPTy = EVT::getFloatingPointVT(Val.getValueSizeInBits());
|
2013-05-25 10:42:55 +08:00
|
|
|
SDValue Tr = DAG.getNode(MipsISD::TruncIntFP, SDLoc(Val), FPTy,
|
2013-05-17 05:17:15 +08:00
|
|
|
Val.getOperand(0));
|
2013-05-25 10:42:55 +08:00
|
|
|
return DAG.getStore(SD->getChain(), SDLoc(SD), Tr, SD->getBasePtr(),
|
[SelectionDAG] Get rid of bool parameters in SelectionDAG::getLoad, getStore, and friends.
Summary:
Instead, we take a single flags arg (a bitset).
Also add a default 0 alignment, and change the order of arguments so the
alignment comes before the flags.
This greatly simplifies many callsites, and fixes a bug in
AMDGPUISelLowering, wherein the order of the args to getLoad was
inverted. It also greatly simplifies the process of adding another flag
to getLoad.
Reviewers: chandlerc, tstellarAMD
Subscribers: jholewinski, arsenm, jyknight, dsanders, nemanjai, llvm-commits
Differential Revision: http://reviews.llvm.org/D22249
llvm-svn: 275592
2016-07-16 02:27:10 +08:00
|
|
|
SD->getPointerInfo(), SD->getAlignment(),
|
|
|
|
SD->getMemOperand()->getFlags());
|
2013-05-17 05:17:15 +08:00
|
|
|
}
|
|
|
|
|
2013-05-17 04:45:17 +08:00
|
|
|
// Custom lowering for store nodes.
//
// On subtargets without unaligned access support, an i32 or i64 memory store
// whose alignment is smaller than its size is expanded by
// lowerUnalignedIntStore. Every other store is handed to
// lowerFP_TO_SINT_STORE.
SDValue MipsTargetLowering::lowerSTORE(SDValue Op, SelectionDAG &DAG) const {
  StoreSDNode *Store = cast<StoreSDNode>(Op);

  if (Subtarget.systemSupportsUnalignedAccess())
    return lowerFP_TO_SINT_STORE(Store, DAG);

  // Lower unaligned integer stores.
  const EVT MemVT = Store->getMemoryVT();
  const unsigned MemBytes = MemVT.getSizeInBits() / 8;
  const bool IsUnderAligned = Store->getAlignment() < MemBytes;
  const bool IsWordOrDoubleWord = (MemVT == MVT::i32) || (MemVT == MVT::i64);
  if (IsUnderAligned && IsWordOrDoubleWord)
    return lowerUnalignedIntStore(Store, DAG, Subtarget.isLittle());

  return lowerFP_TO_SINT_STORE(Store, DAG);
}
|
|
|
|
|
Add ISD::EH_DWARF_CFA, simplify @llvm.eh.dwarf.cfa on Mips, fix on PowerPC
LLVM has an @llvm.eh.dwarf.cfa intrinsic, used to lower the GCC-compatible
__builtin_dwarf_cfa() builtin. As pointed out in PR26761, this is currently
broken on PowerPC (and likely on ARM as well). Currently, @llvm.eh.dwarf.cfa is
lowered using:
ADD(FRAMEADDR, FRAME_TO_ARGS_OFFSET)
where FRAME_TO_ARGS_OFFSET defaults to the constant zero. On x86,
FRAME_TO_ARGS_OFFSET is lowered to 2*SlotSize. This setup, however, does not
work for PowerPC. Because of the way that the stack layout works, the canonical
frame address is not exactly (FRAMEADDR + FRAME_TO_ARGS_OFFSET) on PowerPC
(there is a lower save-area offset as well), so it is not just a matter of
implementing FRAME_TO_ARGS_OFFSET for PowerPC (unless we redefine its
semantics -- We can do that, since it is currently used only for
@llvm.eh.dwarf.cfa lowering, but the better to directly lower the CFA construct
itself (since it can be easily represented as a fixed-offset FrameIndex)). Mips
currently does this, but by using a custom lowering for ADD that specifically
recognizes the (FRAMEADDR, FRAME_TO_ARGS_OFFSET) pattern.
This change introduces a ISD::EH_DWARF_CFA node, which by default expands using
the existing logic, but can be directly lowered by the target. Mips is updated
to use this method (which simplifies its implementation, and I suspect makes it
more robust), and updates PowerPC to do the same.
Fixes PR26761.
Differential Revision: https://reviews.llvm.org/D24038
llvm-svn: 280350
2016-09-01 18:28:47 +08:00
|
|
|
// Lower an EH_DWARF_CFA node to a frame index.
//
// A fixed stack object is created at offset 0, sized to the node's result,
// and its frame index is returned with the node's value type. That object
// points to the old stack pointer.
SDValue MipsTargetLowering::lowerEH_DWARF_CFA(SDValue Op,
                                              SelectionDAG &DAG) const {
  const auto SizeInBytes = Op.getValueSizeInBits() / 8;

  MachineFrameInfo &FrameInfo = DAG.getMachineFunction().getFrameInfo();
  const int FrameIdx = FrameInfo.CreateFixedObject(SizeInBytes, 0, false);

  return DAG.getFrameIndex(FrameIdx, Op->getValueType(0));
}
|
|
|
|
|
2013-05-17 05:17:15 +08:00
|
|
|
// Lower FP_TO_SINT to a TruncIntFP node followed by a bitcast.
//
// The TruncIntFP result is typed as the floating point type with the same bit
// width as the requested integer result; the bitcast then converts it to the
// integer type of Op.
SDValue MipsTargetLowering::lowerFP_TO_SINT(SDValue Op,
                                            SelectionDAG &DAG) const {
  SDLoc DL(Op);
  SDValue FPSrc = Op.getOperand(0);
  EVT TruncVT = EVT::getFloatingPointVT(Op.getValueSizeInBits());

  SDValue Truncated = DAG.getNode(MipsISD::TruncIntFP, DL, TruncVT, FPSrc);
  return DAG.getNode(ISD::BITCAST, DL, Op.getValueType(), Truncated);
}
|
|
|
|
|
2011-04-16 05:51:11 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
2007-06-06 15:42:06 +08:00
|
|
|
// Calling Convention Implementation
|
2011-04-16 05:51:11 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
2007-06-06 15:42:06 +08:00
|
|
|
|
2011-04-16 05:51:11 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
2010-11-23 11:31:01 +08:00
|
|
|
// TODO: Implement a generic logic using tblgen that can support this.
|
2009-03-19 10:12:28 +08:00
|
|
|
// Mips O32 ABI rules:
|
|
|
|
// ---
|
|
|
|
// i32 - Passed in A0, A1, A2, A3 and stack
|
2010-11-23 11:31:01 +08:00
|
|
|
// f32 - Only passed in f32 registers if no int reg has been used yet to hold
|
2009-03-19 10:12:28 +08:00
|
|
|
// an argument. Otherwise, passed in A1, A2, A3 and stack.
|
2010-11-23 11:31:01 +08:00
|
|
|
// f64 - Only passed in two aliased f32 registers if no int reg has been used
|
|
|
|
// yet to hold an argument. Otherwise, use A2, A3 and stack. If A1 is
|
2014-08-12 02:04:46 +08:00
|
|
|
// not used, it must be shadowed. If only A3 is available, shadow it and
|
2009-03-19 10:12:28 +08:00
|
|
|
// go to stack.
|
2011-05-20 02:06:05 +08:00
|
|
|
//
|
|
|
|
// For vararg functions, all arguments are passed in A0, A1, A2, A3 and stack.
|
2011-04-16 05:51:11 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
2009-03-19 10:12:28 +08:00
|
|
|
|
2013-10-08 03:33:02 +08:00
|
|
|
static bool CC_MipsO32(unsigned ValNo, MVT ValVT, MVT LocVT,
|
|
|
|
CCValAssign::LocInfo LocInfo, ISD::ArgFlagsTy ArgFlags,
|
2015-02-21 10:11:17 +08:00
|
|
|
CCState &State, ArrayRef<MCPhysReg> F64Regs) {
|
2015-01-30 07:27:36 +08:00
|
|
|
const MipsSubtarget &Subtarget = static_cast<const MipsSubtarget &>(
|
|
|
|
State.getMachineFunction().getSubtarget());
|
2009-03-19 10:12:28 +08:00
|
|
|
|
2014-04-04 13:16:06 +08:00
|
|
|
static const MCPhysReg IntRegs[] = { Mips::A0, Mips::A1, Mips::A2, Mips::A3 };
|
|
|
|
static const MCPhysReg F32Regs[] = { Mips::F12, Mips::F14 };
|
2009-03-19 10:12:28 +08:00
|
|
|
|
2012-10-27 08:29:43 +08:00
|
|
|
// Do not process byval args here.
|
|
|
|
if (ArgFlags.isByVal())
|
|
|
|
return true;
|
2011-05-25 03:18:33 +08:00
|
|
|
|
2014-12-03 04:40:27 +08:00
|
|
|
// Promote i8 and i16
|
|
|
|
if (ArgFlags.isInReg() && !Subtarget.isLittle()) {
|
|
|
|
if (LocVT == MVT::i8 || LocVT == MVT::i16 || LocVT == MVT::i32) {
|
|
|
|
LocVT = MVT::i32;
|
|
|
|
if (ArgFlags.isSExt())
|
|
|
|
LocInfo = CCValAssign::SExtUpper;
|
|
|
|
else if (ArgFlags.isZExt())
|
|
|
|
LocInfo = CCValAssign::ZExtUpper;
|
|
|
|
else
|
|
|
|
LocInfo = CCValAssign::AExtUpper;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2010-02-07 03:20:49 +08:00
|
|
|
// Promote i8 and i16
|
|
|
|
if (LocVT == MVT::i8 || LocVT == MVT::i16) {
|
|
|
|
LocVT = MVT::i32;
|
|
|
|
if (ArgFlags.isSExt())
|
|
|
|
LocInfo = CCValAssign::SExt;
|
|
|
|
else if (ArgFlags.isZExt())
|
|
|
|
LocInfo = CCValAssign::ZExt;
|
|
|
|
else
|
|
|
|
LocInfo = CCValAssign::AExt;
|
|
|
|
}
|
|
|
|
|
2011-03-05 04:27:44 +08:00
|
|
|
unsigned Reg;
|
2010-02-07 03:20:49 +08:00
|
|
|
|
2011-05-20 02:06:05 +08:00
|
|
|
// f32 and f64 are allocated in A0, A1, A2, A3 when either of the following
|
|
|
|
// is true: function is vararg, argument is 3rd or higher, there is previous
|
|
|
|
// argument which is not f32 or f64.
|
2015-02-21 10:11:17 +08:00
|
|
|
bool AllocateFloatsInIntReg = State.isVarArg() || ValNo > 1 ||
|
|
|
|
State.getFirstUnallocated(F32Regs) != ValNo;
|
2011-05-20 04:29:48 +08:00
|
|
|
unsigned OrigAlign = ArgFlags.getOrigAlign();
|
|
|
|
bool isI64 = (ValVT == MVT::i32 && OrigAlign == 8);
|
2017-04-08 01:25:05 +08:00
|
|
|
|
|
|
|
if (ValVT == MVT::i32 || (ValVT == MVT::f32 && AllocateFloatsInIntReg)) {
|
2015-02-21 10:11:17 +08:00
|
|
|
Reg = State.AllocateReg(IntRegs);
|
2011-05-20 04:29:48 +08:00
|
|
|
// If this is the first part of an i64 arg,
|
|
|
|
// the allocated register must be either A0 or A2.
|
|
|
|
if (isI64 && (Reg == Mips::A1 || Reg == Mips::A3))
|
2015-02-21 10:11:17 +08:00
|
|
|
Reg = State.AllocateReg(IntRegs);
|
2011-03-05 04:27:44 +08:00
|
|
|
LocVT = MVT::i32;
|
2011-05-20 02:06:05 +08:00
|
|
|
} else if (ValVT == MVT::f64 && AllocateFloatsInIntReg) {
|
|
|
|
// Allocate int register and shadow next int register. If first
|
|
|
|
// available register is Mips::A1 or Mips::A3, shadow it too.
|
2015-02-21 10:11:17 +08:00
|
|
|
Reg = State.AllocateReg(IntRegs);
|
2011-03-05 04:27:44 +08:00
|
|
|
if (Reg == Mips::A1 || Reg == Mips::A3)
|
2015-02-21 10:11:17 +08:00
|
|
|
Reg = State.AllocateReg(IntRegs);
|
|
|
|
State.AllocateReg(IntRegs);
|
2011-03-05 04:27:44 +08:00
|
|
|
LocVT = MVT::i32;
|
2011-05-20 02:06:05 +08:00
|
|
|
} else if (ValVT.isFloatingPoint() && !AllocateFloatsInIntReg) {
|
|
|
|
// we are guaranteed to find an available float register
|
|
|
|
if (ValVT == MVT::f32) {
|
2015-02-21 10:11:17 +08:00
|
|
|
Reg = State.AllocateReg(F32Regs);
|
2011-05-20 02:06:05 +08:00
|
|
|
// Shadow int register
|
2015-02-21 10:11:17 +08:00
|
|
|
State.AllocateReg(IntRegs);
|
2011-05-20 02:06:05 +08:00
|
|
|
} else {
|
2015-02-21 10:11:17 +08:00
|
|
|
Reg = State.AllocateReg(F64Regs);
|
2011-05-20 02:06:05 +08:00
|
|
|
// Shadow int registers
|
2015-02-21 10:11:17 +08:00
|
|
|
unsigned Reg2 = State.AllocateReg(IntRegs);
|
2011-05-20 02:06:05 +08:00
|
|
|
if (Reg2 == Mips::A1 || Reg2 == Mips::A3)
|
2015-02-21 10:11:17 +08:00
|
|
|
State.AllocateReg(IntRegs);
|
|
|
|
State.AllocateReg(IntRegs);
|
2011-05-20 02:06:05 +08:00
|
|
|
}
|
2011-03-05 04:27:44 +08:00
|
|
|
} else
|
|
|
|
llvm_unreachable("Cannot handle this ValVT.");
|
2010-02-07 03:20:49 +08:00
|
|
|
|
2012-10-27 08:29:43 +08:00
|
|
|
if (!Reg) {
|
|
|
|
unsigned Offset = State.AllocateStack(ValVT.getSizeInBits() >> 3,
|
|
|
|
OrigAlign);
|
2011-03-05 04:27:44 +08:00
|
|
|
State.addLoc(CCValAssign::getMem(ValNo, ValVT, Offset, LocVT, LocInfo));
|
2012-10-27 08:29:43 +08:00
|
|
|
} else
|
2011-03-05 04:27:44 +08:00
|
|
|
State.addLoc(CCValAssign::getReg(ValNo, ValVT, Reg, LocVT, LocInfo));
|
2010-02-07 03:20:49 +08:00
|
|
|
|
2012-10-27 08:29:43 +08:00
|
|
|
return false;
|
2011-11-12 10:20:46 +08:00
|
|
|
}
|
|
|
|
|
2013-08-21 07:38:40 +08:00
|
|
|
static bool CC_MipsO32_FP32(unsigned ValNo, MVT ValVT,
|
|
|
|
MVT LocVT, CCValAssign::LocInfo LocInfo,
|
|
|
|
ISD::ArgFlagsTy ArgFlags, CCState &State) {
|
2014-04-04 13:16:06 +08:00
|
|
|
static const MCPhysReg F64Regs[] = { Mips::D6, Mips::D7 };
|
2013-08-21 07:38:40 +08:00
|
|
|
|
|
|
|
return CC_MipsO32(ValNo, ValVT, LocVT, LocInfo, ArgFlags, State, F64Regs);
|
|
|
|
}
|
|
|
|
|
|
|
|
static bool CC_MipsO32_FP64(unsigned ValNo, MVT ValVT,
|
|
|
|
MVT LocVT, CCValAssign::LocInfo LocInfo,
|
|
|
|
ISD::ArgFlagsTy ArgFlags, CCState &State) {
|
2014-04-04 13:16:06 +08:00
|
|
|
static const MCPhysReg F64Regs[] = { Mips::D12_64, Mips::D14_64 };
|
2013-08-21 07:38:40 +08:00
|
|
|
|
|
|
|
return CC_MipsO32(ValNo, ValVT, LocVT, LocInfo, ArgFlags, State, F64Regs);
|
|
|
|
}
|
|
|
|
|
2014-11-14 08:39:33 +08:00
|
|
|
// Forward declaration of the CC_MipsO32 overload that takes no explicit f64
// register list. It is marked LLVM_ATTRIBUTE_UNUSED so that leaving it
// unreferenced is not diagnosed.
// NOTE(review): presumably this overload is defined by, or referenced from,
// the generated MipsGenCallingConv.inc included below -- confirm.
static bool CC_MipsO32(unsigned ValNo, MVT ValVT, MVT LocVT,
|
|
|
|
CCValAssign::LocInfo LocInfo, ISD::ArgFlagsTy ArgFlags,
|
|
|
|
CCState &State) LLVM_ATTRIBUTE_UNUSED;
|
2014-11-14 07:37:45 +08:00
|
|
|
|
2011-11-12 10:20:46 +08:00
|
|
|
#include "MipsGenCallingConv.inc"
|
|
|
|
|
2011-04-16 05:51:11 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
Major calling convention code refactoring.
Instead of awkwardly encoding calling-convention information with ISD::CALL,
ISD::FORMAL_ARGUMENTS, ISD::RET, and ISD::ARG_FLAGS nodes, TargetLowering
provides three virtual functions for targets to override:
LowerFormalArguments, LowerCall, and LowerRet, which replace the custom
lowering done on the special nodes. They provide the same information, but
in a more immediately usable format.
This also reworks much of the target-independent tail call logic. The
decision of whether or not to perform a tail call is now cleanly split
between target-independent portions, and the target dependent portion
in IsEligibleForTailCallOptimization.
This also synchronizes all in-tree targets, to help enable future
refactoring and feature work.
llvm-svn: 78142
2009-08-05 09:29:28 +08:00
|
|
|
// Call Calling Convention Implementation
|
2011-04-16 05:51:11 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
2007-06-06 15:42:06 +08:00
|
|
|
|
2011-09-23 08:58:33 +08:00
|
|
|
// Return next O32 integer argument register.
|
|
|
|
static unsigned getNextIntArgReg(unsigned Reg) {
|
|
|
|
assert((Reg == Mips::A0) || (Reg == Mips::A2));
|
|
|
|
return (Reg == Mips::A0) ? Mips::A1 : Mips::A3;
|
|
|
|
}
|
|
|
|
|
2016-06-12 23:39:02 +08:00
|
|
|
// Emit the store that passes Arg on the stack at the given Offset.
//
// For a tail call, a fixed frame object sized to Arg is created at Offset and
// Arg is stored to it with the MOVolatile flag set. Otherwise Arg is stored to
// the address StackPtr + Offset. The resulting store node is returned.
SDValue MipsTargetLowering::passArgOnStack(SDValue StackPtr, unsigned Offset,
                                           SDValue Chain, SDValue Arg,
                                           const SDLoc &DL, bool IsTailCall,
                                           SelectionDAG &DAG) const {
  const auto PtrVT = getPointerTy(DAG.getDataLayout());

  if (IsTailCall) {
    MachineFrameInfo &FrameInfo = DAG.getMachineFunction().getFrameInfo();
    const int FrameIdx =
        FrameInfo.CreateFixedObject(Arg.getValueSizeInBits() / 8, Offset, false);
    SDValue Slot = DAG.getFrameIndex(FrameIdx, PtrVT);
    return DAG.getStore(Chain, DL, Arg, Slot, MachinePointerInfo(),
                        /* Alignment = */ 0, MachineMemOperand::MOVolatile);
  }

  // Regular call: address the outgoing argument relative to the stack pointer.
  SDValue OffsetVal = DAG.getIntPtrConstant(Offset, DL);
  SDValue Addr = DAG.getNode(ISD::ADD, DL, PtrVT, StackPtr, OffsetVal);
  return DAG.getStore(Chain, DL, Arg, Addr, MachinePointerInfo());
}
|
|
|
|
|
2013-03-13 08:54:29 +08:00
|
|
|
void MipsTargetLowering::
|
|
|
|
getOpndList(SmallVectorImpl<SDValue> &Ops,
|
|
|
|
std::deque< std::pair<unsigned, SDValue> > &RegsToPass,
|
|
|
|
bool IsPICCall, bool GlobalOrExternal, bool InternalLinkage,
|
2014-10-01 16:22:21 +08:00
|
|
|
bool IsCallReloc, CallLoweringInfo &CLI, SDValue Callee,
|
|
|
|
SDValue Chain) const {
|
2013-03-13 08:54:29 +08:00
|
|
|
// Insert node "GP copy globalreg" before call to function.
|
|
|
|
//
|
|
|
|
// R_MIPS_CALL* operators (emitted when non-internal functions are called
|
|
|
|
// in PIC mode) allow symbols to be resolved via lazy binding.
|
|
|
|
// The lazy binding stub requires GP to point to the GOT.
|
2014-10-01 16:22:21 +08:00
|
|
|
// Note that we don't need GP to point to the GOT for indirect calls
|
|
|
|
// (when R_MIPS_CALL* is not used for the call) because Mips linker generates
|
|
|
|
// lazy binding stub for a function only when R_MIPS_CALL* are the only relocs
|
|
|
|
// used for the function (that is, Mips linker doesn't generate lazy binding
|
|
|
|
// stub for a function whose address is taken in the program).
|
|
|
|
if (IsPICCall && !InternalLinkage && IsCallReloc) {
|
2015-01-30 07:27:36 +08:00
|
|
|
unsigned GPReg = ABI.IsN64() ? Mips::GP_64 : Mips::GP;
|
|
|
|
EVT Ty = ABI.IsN64() ? MVT::i64 : MVT::i32;
|
2013-03-13 08:54:29 +08:00
|
|
|
RegsToPass.push_back(std::make_pair(GPReg, getGlobalReg(CLI.DAG, Ty)));
|
2013-01-24 12:24:02 +08:00
|
|
|
}
|
|
|
|
|
2013-03-13 08:54:29 +08:00
|
|
|
// Build a sequence of copy-to-reg nodes chained together with token
|
|
|
|
// chain and flag operands which copy the outgoing args into registers.
|
|
|
|
// The InFlag in necessary since all emitted instructions must be
|
|
|
|
// stuck together.
|
|
|
|
SDValue InFlag;
|
|
|
|
|
|
|
|
for (unsigned i = 0, e = RegsToPass.size(); i != e; ++i) {
|
|
|
|
Chain = CLI.DAG.getCopyToReg(Chain, CLI.DL, RegsToPass[i].first,
|
|
|
|
RegsToPass[i].second, InFlag);
|
|
|
|
InFlag = Chain.getValue(1);
|
2013-01-24 12:24:02 +08:00
|
|
|
}
|
2013-03-13 08:54:29 +08:00
|
|
|
|
|
|
|
// Add argument registers to the end of the list so that they are
|
|
|
|
// known live into the call.
|
|
|
|
for (unsigned i = 0, e = RegsToPass.size(); i != e; ++i)
|
|
|
|
Ops.push_back(CLI.DAG.getRegister(RegsToPass[i].first,
|
|
|
|
RegsToPass[i].second.getValueType()));
|
|
|
|
|
|
|
|
// Add a register mask operand representing the call-preserved registers.
|
2015-01-30 07:27:36 +08:00
|
|
|
const TargetRegisterInfo *TRI = Subtarget.getRegisterInfo();
|
2015-03-12 06:42:13 +08:00
|
|
|
const uint32_t *Mask =
|
|
|
|
TRI->getCallPreservedMask(CLI.DAG.getMachineFunction(), CLI.CallConv);
|
2013-03-13 08:54:29 +08:00
|
|
|
assert(Mask && "Missing call preserved mask for calling convention");
|
2014-07-19 06:55:25 +08:00
|
|
|
if (Subtarget.inMips16HardFloat()) {
|
Checkin in of first of several patches to finish implementation of
mips16/mips32 floating point interoperability.
This patch fixes returns from mips16 functions so that if the function
was in fact called by a mips32 hard float routine, then values
that would have been returned in floating point registers are so returned.
Mips16 mode has no floating point instructions so there is no way to
load values into floating point registers.
This is needed when returning float, double, single complex, double complex
in the Mips ABI.
Helper functions in libc for mips16 are available to do this.
For efficiency purposes, these helper functions have a different calling
convention from normal Mips calls.
Registers v0,v1,a0,a1 are used to pass parameters instead of
a0,a1,a2,a3.
This is because v0,v1,a0,a1 are the natural registers used to return
floating point values in soft float. These values can then be moved
to the appropriate floating point registers with no extra cost.
The only register that is modified is ra in this call.
The helper functions make sure that the return values are in the floating
point registers that they would be in if soft float was not in effect
(which it is for mips16, though the soft float is implemented using a mips32
library that uses hard float).
llvm-svn: 181641
2013-05-11 06:25:39 +08:00
|
|
|
if (GlobalAddressSDNode *G = dyn_cast<GlobalAddressSDNode>(CLI.Callee)) {
|
|
|
|
llvm::StringRef Sym = G->getGlobal()->getName();
|
|
|
|
Function *F = G->getGlobal()->getParent()->getFunction(Sym);
|
2013-12-12 10:41:11 +08:00
|
|
|
if (F && F->hasFnAttribute("__Mips16RetHelper")) {
|
Checkin in of first of several patches to finish implementation of
mips16/mips32 floating point interoperability.
This patch fixes returns from mips16 functions so that if the function
was in fact called by a mips32 hard float routine, then values
that would have been returned in floating point registers are so returned.
Mips16 mode has no floating point instructions so there is no way to
load values into floating point registers.
This is needed when returning float, double, single complex, double complex
in the Mips ABI.
Helper functions in libc for mips16 are available to do this.
For efficiency purposes, these helper functions have a different calling
convention from normal Mips calls.
Registers v0,v1,a0,a1 are used to pass parameters instead of
a0,a1,a2,a3.
This is because v0,v1,a0,a1 are the natural registers used to return
floating point values in soft float. These values can then be moved
to the appropriate floating point registers with no extra cost.
The only register that is modified is ra in this call.
The helper functions make sure that the return values are in the floating
point registers that they would be in if soft float was not in effect
(which it is for mips16, though the soft float is implemented using a mips32
library that uses hard float).
llvm-svn: 181641
2013-05-11 06:25:39 +08:00
|
|
|
Mask = MipsRegisterInfo::getMips16RetHelperMask();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2013-03-13 08:54:29 +08:00
|
|
|
Ops.push_back(CLI.DAG.getRegisterMask(Mask));
|
|
|
|
|
|
|
|
if (InFlag.getNode())
|
|
|
|
Ops.push_back(InFlag);
|
2013-01-24 12:24:02 +08:00
|
|
|
}
|
|
|
|
|
Major calling convention code refactoring.
Instead of awkwardly encoding calling-convention information with ISD::CALL,
ISD::FORMAL_ARGUMENTS, ISD::RET, and ISD::ARG_FLAGS nodes, TargetLowering
provides three virtual functions for targets to override:
LowerFormalArguments, LowerCall, and LowerRet, which replace the custom
lowering done on the special nodes. They provide the same information, but
in a more immediately usable format.
This also reworks much of the target-independent tail call logic. The
decision of whether or not to perform a tail call is now cleanly split
between target-independent portions, and the target dependent portion
in IsEligibleForTailCallOptimization.
This also synchronizes all in-tree targets, to help enable future
refactoring and feature work.
llvm-svn: 78142
2009-08-05 09:29:28 +08:00
|
|
|
/// LowerCall - functions arguments are copied from virtual regs to
|
2009-01-26 11:15:54 +08:00
|
|
|
/// (physical regs)/(stack frame), CALLSEQ_START and CALLSEQ_END are emitted.
|
Major calling convention code refactoring.
Instead of awkwardly encoding calling-convention information with ISD::CALL,
ISD::FORMAL_ARGUMENTS, ISD::RET, and ISD::ARG_FLAGS nodes, TargetLowering
provides three virtual functions for targets to override:
LowerFormalArguments, LowerCall, and LowerRet, which replace the custom
lowering done on the special nodes. They provide the same information, but
in a more immediately usable format.
This also reworks much of the target-independent tail call logic. The
decision of whether or not to perform a tail call is now cleanly split
between target-independent portions, and the target dependent portion
in IsEligibleForTailCallOptimization.
This also synchronizes all in-tree targets, to help enable future
refactoring and feature work.
llvm-svn: 78142
2009-08-05 09:29:28 +08:00
|
|
|
SDValue
|
2012-05-26 00:35:28 +08:00
|
|
|
MipsTargetLowering::LowerCall(TargetLowering::CallLoweringInfo &CLI,
|
2010-04-17 23:26:15 +08:00
|
|
|
SmallVectorImpl<SDValue> &InVals) const {
|
2012-05-26 00:35:28 +08:00
|
|
|
SelectionDAG &DAG = CLI.DAG;
|
2013-05-25 10:42:55 +08:00
|
|
|
SDLoc DL = CLI.DL;
|
2013-07-14 12:42:23 +08:00
|
|
|
SmallVectorImpl<ISD::OutputArg> &Outs = CLI.Outs;
|
|
|
|
SmallVectorImpl<SDValue> &OutVals = CLI.OutVals;
|
|
|
|
SmallVectorImpl<ISD::InputArg> &Ins = CLI.Ins;
|
2012-08-01 02:46:41 +08:00
|
|
|
SDValue Chain = CLI.Chain;
|
2012-05-26 00:35:28 +08:00
|
|
|
SDValue Callee = CLI.Callee;
|
2013-03-12 08:16:36 +08:00
|
|
|
bool &IsTailCall = CLI.IsTailCall;
|
2012-05-26 00:35:28 +08:00
|
|
|
CallingConv::ID CallConv = CLI.CallConv;
|
2013-03-12 08:16:36 +08:00
|
|
|
bool IsVarArg = CLI.IsVarArg;
|
2012-05-26 00:35:28 +08:00
|
|
|
|
Major calling convention code refactoring.
Instead of awkwardly encoding calling-convention information with ISD::CALL,
ISD::FORMAL_ARGUMENTS, ISD::RET, and ISD::ARG_FLAGS nodes, TargetLowering
provides three virtual functions for targets to override:
LowerFormalArguments, LowerCall, and LowerRet, which replace the custom
lowering done on the special nodes. They provide the same information, but
in a more immediately usable format.
This also reworks much of the target-independent tail call logic. The
decision of whether or not to perform a tail call is now cleanly split
between target-independent portions, and the target dependent portion
in IsEligibleForTailCallOptimization.
This also synchronizes all in-tree targets, to help enable future
refactoring and feature work.
llvm-svn: 78142
2009-08-05 09:29:28 +08:00
|
|
|
MachineFunction &MF = DAG.getMachineFunction();
|
2016-07-29 02:40:00 +08:00
|
|
|
MachineFrameInfo &MFI = MF.getFrameInfo();
|
2015-01-30 07:27:36 +08:00
|
|
|
const TargetFrameLowering *TFL = Subtarget.getFrameLowering();
|
2013-09-28 08:12:32 +08:00
|
|
|
MipsFunctionInfo *FuncInfo = MF.getInfo<MipsFunctionInfo>();
|
2016-06-27 20:48:21 +08:00
|
|
|
bool IsPIC = isPositionIndependent();
|
2007-06-06 15:42:06 +08:00
|
|
|
|
|
|
|
// Analyze operands of the call, assigning locations to each operand.
|
|
|
|
SmallVector<CCValAssign, 16> ArgLocs;
|
2014-11-07 19:10:48 +08:00
|
|
|
MipsCCState CCInfo(
|
|
|
|
CallConv, IsVarArg, DAG.getMachineFunction(), ArgLocs, *DAG.getContext(),
|
|
|
|
MipsCCState::getSpecialCallingConvForCallee(Callee.getNode(), Subtarget));
|
2014-11-07 23:33:08 +08:00
|
|
|
|
|
|
|
// Allocate the reserved argument area. It seems strange to do this from the
|
|
|
|
// caller side but removing it breaks the frame size calculation.
|
|
|
|
CCInfo.AllocateStack(ABI.GetCalleeAllocdArgSizeInBytes(CallConv), 1);
|
2007-07-12 07:16:16 +08:00
|
|
|
|
2017-04-26 19:10:38 +08:00
|
|
|
const ExternalSymbolSDNode *ES =
|
|
|
|
dyn_cast_or_null<const ExternalSymbolSDNode>(Callee.getNode());
|
|
|
|
CCInfo.AnalyzeCallOperands(Outs, CC_Mips, CLI.getArgs(),
|
|
|
|
ES ? ES->getSymbol() : nullptr);
|
2010-11-23 11:31:01 +08:00
|
|
|
|
2007-06-06 15:42:06 +08:00
|
|
|
// Get a count of how many bytes are to be pushed on the stack.
|
2011-06-09 01:39:33 +08:00
|
|
|
unsigned NextStackOffset = CCInfo.getNextStackOffset();
|
2012-07-27 07:27:01 +08:00
|
|
|
|
2016-11-21 05:23:08 +08:00
|
|
|
// Check if it's really possible to do a tail call. Restrict it to functions
|
|
|
|
// that are part of this compilation unit.
|
|
|
|
bool InternalLinkage = false;
|
|
|
|
if (IsTailCall) {
|
2014-11-03 00:09:29 +08:00
|
|
|
IsTailCall = isEligibleForTailCallOptimization(
|
|
|
|
CCInfo, NextStackOffset, *MF.getInfo<MipsFunctionInfo>());
|
2016-11-21 05:23:08 +08:00
|
|
|
if (GlobalAddressSDNode *G = dyn_cast<GlobalAddressSDNode>(Callee)) {
|
|
|
|
InternalLinkage = G->getGlobal()->hasInternalLinkage();
|
|
|
|
IsTailCall &= (InternalLinkage || G->getGlobal()->hasLocalLinkage() ||
|
|
|
|
G->getGlobal()->hasPrivateLinkage() ||
|
|
|
|
G->getGlobal()->hasHiddenVisibility() ||
|
|
|
|
G->getGlobal()->hasProtectedVisibility());
|
|
|
|
}
|
|
|
|
}
|
2014-04-25 04:14:34 +08:00
|
|
|
if (!IsTailCall && CLI.CS && CLI.CS->isMustTailCall())
|
|
|
|
report_fatal_error("failed to perform tail call elimination on a call "
|
|
|
|
"site marked musttail");
|
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
if (IsTailCall)
|
2012-10-20 05:47:33 +08:00
|
|
|
++NumTailCalls;
|
|
|
|
|
2011-09-20 04:26:02 +08:00
|
|
|
// Chain is the output chain of the last Load/Store or CopyToReg node.
|
|
|
|
// ByValChain is the output chain of the last Memcpy node created for copying
|
|
|
|
// byval arguments to the stack.
|
2012-10-31 04:16:31 +08:00
|
|
|
unsigned StackAlignment = TFL->getStackAlignment();
|
2016-01-15 05:06:47 +08:00
|
|
|
NextStackOffset = alignTo(NextStackOffset, StackAlignment);
|
2015-04-28 22:05:47 +08:00
|
|
|
SDValue NextStackOffsetVal = DAG.getIntPtrConstant(NextStackOffset, DL, true);
|
2012-10-20 05:47:33 +08:00
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
if (!IsTailCall)
|
2017-05-09 21:35:13 +08:00
|
|
|
Chain = DAG.getCALLSEQ_START(Chain, NextStackOffset, 0, DL);
|
2012-08-01 02:46:41 +08:00
|
|
|
|
2015-07-09 10:09:04 +08:00
|
|
|
SDValue StackPtr =
|
|
|
|
DAG.getCopyFromReg(Chain, DL, ABI.IsN64() ? Mips::SP_64 : Mips::SP,
|
|
|
|
getPointerTy(DAG.getDataLayout()));
|
2007-06-06 15:42:06 +08:00
|
|
|
|
2013-01-23 04:05:56 +08:00
|
|
|
std::deque< std::pair<unsigned, SDValue> > RegsToPass;
|
2011-06-09 01:39:33 +08:00
|
|
|
SmallVector<SDValue, 8> MemOpChains;
|
2014-11-03 00:09:29 +08:00
|
|
|
|
|
|
|
CCInfo.rewindByValRegsInfo();
|
2011-06-09 01:39:33 +08:00
|
|
|
|
2007-06-06 15:42:06 +08:00
|
|
|
// Walk the register/memloc assignments, inserting copies/loads.
|
|
|
|
for (unsigned i = 0, e = ArgLocs.size(); i != e; ++i) {
|
2010-07-07 23:54:55 +08:00
|
|
|
SDValue Arg = OutVals[i];
|
2007-06-06 15:42:06 +08:00
|
|
|
CCValAssign &VA = ArgLocs[i];
|
2011-10-29 03:49:00 +08:00
|
|
|
MVT ValVT = VA.getValVT(), LocVT = VA.getLocVT();
|
2011-11-12 10:34:50 +08:00
|
|
|
ISD::ArgFlagsTy Flags = Outs[i].Flags;
|
2014-11-08 00:54:21 +08:00
|
|
|
bool UseUpperBits = false;
|
2011-11-12 10:34:50 +08:00
|
|
|
|
|
|
|
// ByVal Arg.
|
|
|
|
if (Flags.isByVal()) {
|
2014-11-03 00:09:29 +08:00
|
|
|
unsigned FirstByValReg, LastByValReg;
|
|
|
|
unsigned ByValIdx = CCInfo.getInRegsParamsProcessed();
|
|
|
|
CCInfo.getInRegsParamInfo(ByValIdx, FirstByValReg, LastByValReg);
|
|
|
|
|
2011-11-12 10:34:50 +08:00
|
|
|
assert(Flags.getByValSize() &&
|
|
|
|
"ByVal args of size 0 should have been ignored by front-end.");
|
2014-11-03 00:09:29 +08:00
|
|
|
assert(ByValIdx < CCInfo.getInRegsParamsCount());
|
2013-03-12 08:16:36 +08:00
|
|
|
assert(!IsTailCall &&
|
2012-10-31 04:16:31 +08:00
|
|
|
"Do not tail-call optimize if there is a byval argument.");
|
2013-03-12 08:16:36 +08:00
|
|
|
passByValArg(Chain, DL, RegsToPass, MemOpChains, StackPtr, MFI, DAG, Arg,
|
2014-11-07 23:33:08 +08:00
|
|
|
FirstByValReg, LastByValReg, Flags, Subtarget.isLittle(),
|
|
|
|
VA);
|
2014-11-03 00:09:29 +08:00
|
|
|
CCInfo.nextInRegsParam();
|
2011-11-12 10:34:50 +08:00
|
|
|
continue;
|
|
|
|
}
|
2012-02-28 15:46:26 +08:00
|
|
|
|
2007-06-06 15:42:06 +08:00
|
|
|
// Promote the value if needed.
|
|
|
|
switch (VA.getLocInfo()) {
|
2014-11-08 00:54:21 +08:00
|
|
|
default:
|
|
|
|
llvm_unreachable("Unknown loc info!");
|
2010-11-23 11:31:01 +08:00
|
|
|
case CCValAssign::Full:
|
2011-10-29 03:49:00 +08:00
|
|
|
if (VA.isRegLoc()) {
|
|
|
|
if ((ValVT == MVT::f32 && LocVT == MVT::i32) ||
|
2013-03-06 06:20:28 +08:00
|
|
|
(ValVT == MVT::f64 && LocVT == MVT::i64) ||
|
|
|
|
(ValVT == MVT::i64 && LocVT == MVT::f64))
|
2013-03-12 08:16:36 +08:00
|
|
|
Arg = DAG.getNode(ISD::BITCAST, DL, LocVT, Arg);
|
2011-10-29 03:49:00 +08:00
|
|
|
else if (ValVT == MVT::f64 && LocVT == MVT::i32) {
|
2013-03-12 08:16:36 +08:00
|
|
|
SDValue Lo = DAG.getNode(MipsISD::ExtractElementF64, DL, MVT::i32,
|
2015-04-28 22:05:47 +08:00
|
|
|
Arg, DAG.getConstant(0, DL, MVT::i32));
|
2013-03-12 08:16:36 +08:00
|
|
|
SDValue Hi = DAG.getNode(MipsISD::ExtractElementF64, DL, MVT::i32,
|
2015-04-28 22:05:47 +08:00
|
|
|
Arg, DAG.getConstant(1, DL, MVT::i32));
|
2014-07-19 06:55:25 +08:00
|
|
|
if (!Subtarget.isLittle())
|
2011-04-16 03:52:08 +08:00
|
|
|
std::swap(Lo, Hi);
|
2012-02-28 15:46:26 +08:00
|
|
|
unsigned LocRegLo = VA.getLocReg();
|
2011-09-23 08:58:33 +08:00
|
|
|
unsigned LocRegHigh = getNextIntArgReg(LocRegLo);
|
|
|
|
RegsToPass.push_back(std::make_pair(LocRegLo, Lo));
|
|
|
|
RegsToPass.push_back(std::make_pair(LocRegHigh, Hi));
|
2009-03-19 10:12:28 +08:00
|
|
|
continue;
|
2010-11-23 11:31:01 +08:00
|
|
|
}
|
2009-03-19 10:12:28 +08:00
|
|
|
}
|
|
|
|
break;
|
2014-11-03 00:09:29 +08:00
|
|
|
case CCValAssign::BCvt:
|
|
|
|
Arg = DAG.getNode(ISD::BITCAST, DL, LocVT, Arg);
|
|
|
|
break;
|
2014-11-08 00:54:21 +08:00
|
|
|
case CCValAssign::SExtUpper:
|
|
|
|
UseUpperBits = true;
|
2016-08-17 13:10:15 +08:00
|
|
|
LLVM_FALLTHROUGH;
|
2008-03-17 14:57:02 +08:00
|
|
|
case CCValAssign::SExt:
|
2013-03-12 08:16:36 +08:00
|
|
|
Arg = DAG.getNode(ISD::SIGN_EXTEND, DL, LocVT, Arg);
|
2008-03-17 14:57:02 +08:00
|
|
|
break;
|
2014-11-08 00:54:21 +08:00
|
|
|
case CCValAssign::ZExtUpper:
|
|
|
|
UseUpperBits = true;
|
2016-08-17 13:10:15 +08:00
|
|
|
LLVM_FALLTHROUGH;
|
2008-03-17 14:57:02 +08:00
|
|
|
case CCValAssign::ZExt:
|
2013-03-12 08:16:36 +08:00
|
|
|
Arg = DAG.getNode(ISD::ZERO_EXTEND, DL, LocVT, Arg);
|
2008-03-17 14:57:02 +08:00
|
|
|
break;
|
2014-11-08 00:54:21 +08:00
|
|
|
case CCValAssign::AExtUpper:
|
|
|
|
UseUpperBits = true;
|
2016-08-17 13:10:15 +08:00
|
|
|
LLVM_FALLTHROUGH;
|
2008-03-17 14:57:02 +08:00
|
|
|
case CCValAssign::AExt:
|
2013-03-12 08:16:36 +08:00
|
|
|
Arg = DAG.getNode(ISD::ANY_EXTEND, DL, LocVT, Arg);
|
2008-03-17 14:57:02 +08:00
|
|
|
break;
|
2007-06-06 15:42:06 +08:00
|
|
|
}
|
2010-11-23 11:31:01 +08:00
|
|
|
|
2014-11-08 00:54:21 +08:00
|
|
|
if (UseUpperBits) {
|
|
|
|
unsigned ValSizeInBits = Outs[i].ArgVT.getSizeInBits();
|
|
|
|
unsigned LocSizeInBits = VA.getLocVT().getSizeInBits();
|
|
|
|
Arg = DAG.getNode(
|
|
|
|
ISD::SHL, DL, VA.getLocVT(), Arg,
|
2015-04-28 22:05:47 +08:00
|
|
|
DAG.getConstant(LocSizeInBits - ValSizeInBits, DL, VA.getLocVT()));
|
2014-11-08 00:54:21 +08:00
|
|
|
}
|
|
|
|
|
2010-11-23 11:31:01 +08:00
|
|
|
// Arguments that can be passed on register must be kept at
|
2007-11-05 11:02:32 +08:00
|
|
|
// RegsToPass vector
|
2007-06-06 15:42:06 +08:00
|
|
|
if (VA.isRegLoc()) {
|
|
|
|
RegsToPass.push_back(std::make_pair(VA.getLocReg(), Arg));
|
2008-03-17 14:57:02 +08:00
|
|
|
continue;
|
2007-06-06 15:42:06 +08:00
|
|
|
}
|
2010-11-23 11:31:01 +08:00
|
|
|
|
2009-03-19 10:12:28 +08:00
|
|
|
// Register can't get to this point...
|
2008-03-17 14:57:02 +08:00
|
|
|
assert(VA.isMemLoc());
|
2010-11-23 11:31:01 +08:00
|
|
|
|
|
|
|
// emit ISD::STORE which stores the
|
2008-03-17 14:57:02 +08:00
|
|
|
// parameter value to a stack Location
|
2012-10-31 04:16:31 +08:00
|
|
|
MemOpChains.push_back(passArgOnStack(StackPtr, VA.getLocMemOffset(),
|
2013-03-12 08:16:36 +08:00
|
|
|
Chain, Arg, DL, IsTailCall, DAG));
|
2007-06-06 15:42:06 +08:00
|
|
|
}
|
|
|
|
|
Several changes to Mips backend, experimental fp support being the most
important.
- Cleanup in the Subtarget info with addition of new features, not all support
yet, but they allow the future inclusion of features easier. Among new features,
we have : Arch family info (mips1, mips2, ...), ABI info (o32, eabi), 64-bit
integer
and float registers, allegrex vector FPU (VFPU), single float only support.
- TargetMachine now detects allegrex core.
- Added allegrex (Mips32r2) sext_inreg instructions.
- *Added Float Point Instructions*, handling single float only, and
aliased accesses for 32-bit FPUs.
- Some cleanup in FP instruction formats and FP register classes.
- Calling conventions improved to support mips 32-bit EABI.
- Added Asm Printer support for fp cond codes.
- Added support for sret copy to a return register.
- EABI support added into LowerCALL and FORMAL_ARGS.
- MipsFunctionInfo now keeps a virtual register per function to track the
sret on function entry until function ret.
- MipsInstrInfo FP support into methods (isMoveInstr, isLoadFromStackSlot, ...),
FP cond codes mapping and initial FP Branch Analysis.
- Two new Mips SDNode to handle fp branch and compare instructions : FPBrcond,
FPCmp
- MipsTargetLowering : handling different FP classes, Allegrex support, sret
return copy, no homing location within EABI, non 32-bit stack objects
arguments, and asm constraint for float.
llvm-svn: 53146
2008-07-06 03:05:21 +08:00
|
|
|
// Transform all store nodes into one single node because all store
|
|
|
|
// nodes are independent of each other.
|
2010-11-23 11:31:01 +08:00
|
|
|
if (!MemOpChains.empty())
|
2014-04-27 02:35:24 +08:00
|
|
|
Chain = DAG.getNode(ISD::TokenFactor, DL, MVT::Other, MemOpChains);
|
2007-06-06 15:42:06 +08:00
|
|
|
|
2008-09-17 05:48:12 +08:00
|
|
|
// If the callee is a GlobalAddress/ExternalSymbol node (quite common, every
|
2010-11-23 11:31:01 +08:00
|
|
|
// direct call is) turn it into a TargetGlobalAddress/TargetExternalSymbol
|
|
|
|
// node so that legalize doesn't hack it.
|
2017-01-27 19:36:52 +08:00
|
|
|
|
2011-04-08 03:51:44 +08:00
|
|
|
SDValue CalleeLo;
|
2013-09-28 03:51:35 +08:00
|
|
|
EVT Ty = Callee.getValueType();
|
2016-11-21 05:23:08 +08:00
|
|
|
bool GlobalOrExternal = false, IsCallReloc = false;
|
2011-04-05 01:11:07 +08:00
|
|
|
|
|
|
|
if (GlobalAddressSDNode *G = dyn_cast<GlobalAddressSDNode>(Callee)) {
|
2017-01-27 19:36:52 +08:00
|
|
|
if (IsPIC) {
|
2013-09-28 08:12:32 +08:00
|
|
|
const GlobalValue *Val = G->getGlobal();
|
|
|
|
InternalLinkage = Val->hasInternalLinkage();
|
2012-12-13 11:17:29 +08:00
|
|
|
|
|
|
|
if (InternalLinkage)
|
2015-01-30 07:27:36 +08:00
|
|
|
Callee = getAddrLocal(G, DL, Ty, DAG, ABI.IsN32() || ABI.IsN64());
|
2014-10-01 16:22:21 +08:00
|
|
|
else if (LargeGOT) {
|
2015-01-24 22:35:11 +08:00
|
|
|
Callee = getAddrGlobalLargeGOT(G, DL, Ty, DAG, MipsII::MO_CALL_HI16,
|
2013-09-28 08:12:32 +08:00
|
|
|
MipsII::MO_CALL_LO16, Chain,
|
|
|
|
FuncInfo->callPtrInfo(Val));
|
2014-10-01 16:22:21 +08:00
|
|
|
IsCallReloc = true;
|
|
|
|
} else {
|
2015-01-24 22:35:11 +08:00
|
|
|
Callee = getAddrGlobal(G, DL, Ty, DAG, MipsII::MO_GOT_CALL, Chain,
|
2013-09-28 08:12:32 +08:00
|
|
|
FuncInfo->callPtrInfo(Val));
|
2014-10-01 16:22:21 +08:00
|
|
|
IsCallReloc = true;
|
|
|
|
}
|
2012-11-22 04:30:40 +08:00
|
|
|
} else
|
2015-07-09 10:09:04 +08:00
|
|
|
Callee = DAG.getTargetGlobalAddress(G->getGlobal(), DL,
|
|
|
|
getPointerTy(DAG.getDataLayout()), 0,
|
2012-11-22 04:30:40 +08:00
|
|
|
MipsII::MO_NO_FLAG);
|
2011-12-09 09:45:12 +08:00
|
|
|
GlobalOrExternal = true;
|
2011-04-05 01:11:07 +08:00
|
|
|
}
|
|
|
|
else if (ExternalSymbolSDNode *S = dyn_cast<ExternalSymbolSDNode>(Callee)) {
|
2013-09-28 08:12:32 +08:00
|
|
|
const char *Sym = S->getSymbol();
|
|
|
|
|
2017-01-27 19:36:52 +08:00
|
|
|
if (!IsPIC) // static
|
2015-07-09 10:09:04 +08:00
|
|
|
Callee = DAG.getTargetExternalSymbol(
|
|
|
|
Sym, getPointerTy(DAG.getDataLayout()), MipsII::MO_NO_FLAG);
|
2014-10-01 16:22:21 +08:00
|
|
|
else if (LargeGOT) {
|
2015-01-24 22:35:11 +08:00
|
|
|
Callee = getAddrGlobalLargeGOT(S, DL, Ty, DAG, MipsII::MO_CALL_HI16,
|
2013-09-28 08:12:32 +08:00
|
|
|
MipsII::MO_CALL_LO16, Chain,
|
|
|
|
FuncInfo->callPtrInfo(Sym));
|
2014-10-01 16:22:21 +08:00
|
|
|
IsCallReloc = true;
|
2017-01-27 19:36:52 +08:00
|
|
|
} else { // PIC
|
2015-01-24 22:35:11 +08:00
|
|
|
Callee = getAddrGlobal(S, DL, Ty, DAG, MipsII::MO_GOT_CALL, Chain,
|
2013-09-28 08:12:32 +08:00
|
|
|
FuncInfo->callPtrInfo(Sym));
|
2014-10-01 16:22:21 +08:00
|
|
|
IsCallReloc = true;
|
|
|
|
}
|
2012-11-22 04:30:40 +08:00
|
|
|
|
2011-12-09 09:45:12 +08:00
|
|
|
GlobalOrExternal = true;
|
2011-04-05 01:11:07 +08:00
|
|
|
}
|
|
|
|
|
2013-01-23 04:05:56 +08:00
|
|
|
SmallVector<SDValue, 8> Ops(1, Chain);
|
2013-03-13 08:54:29 +08:00
|
|
|
SDVTList NodeTys = DAG.getVTList(MVT::Other, MVT::Glue);
|
2013-01-23 04:05:56 +08:00
|
|
|
|
2017-01-27 19:36:52 +08:00
|
|
|
getOpndList(Ops, RegsToPass, IsPIC, GlobalOrExternal, InternalLinkage,
|
2014-10-01 16:22:21 +08:00
|
|
|
IsCallReloc, CLI, Callee, Chain);
|
2007-06-06 15:42:06 +08:00
|
|
|
|
2016-09-21 17:43:40 +08:00
|
|
|
if (IsTailCall) {
|
|
|
|
MF.getFrameInfo().setHasTailCall();
|
2014-04-27 02:35:24 +08:00
|
|
|
return DAG.getNode(MipsISD::TailCall, DL, MVT::Other, Ops);
|
2016-09-21 17:43:40 +08:00
|
|
|
}
|
2012-10-20 05:47:33 +08:00
|
|
|
|
2014-04-27 02:35:24 +08:00
|
|
|
Chain = DAG.getNode(MipsISD::JmpLink, DL, NodeTys, Ops);
|
2013-03-13 08:54:29 +08:00
|
|
|
SDValue InFlag = Chain.getValue(1);
|
2007-06-06 15:42:06 +08:00
|
|
|
|
2010-01-31 02:32:07 +08:00
|
|
|
// Create the CALLSEQ_END node.
|
2012-07-27 07:27:01 +08:00
|
|
|
Chain = DAG.getCALLSEQ_END(Chain, NextStackOffsetVal,
|
2015-04-28 22:05:47 +08:00
|
|
|
DAG.getIntPtrConstant(0, DL, true), InFlag, DL);
|
2010-01-31 02:32:07 +08:00
|
|
|
InFlag = Chain.getValue(1);
|
|
|
|
|
2007-06-06 15:42:06 +08:00
|
|
|
// Handle result values, copying them out of physregs into vregs that we
|
|
|
|
// return.
|
2014-09-26 18:06:12 +08:00
|
|
|
return LowerCallResult(Chain, InFlag, CallConv, IsVarArg, Ins, DL, DAG,
|
|
|
|
InVals, CLI);
|
2007-06-06 15:42:06 +08:00
|
|
|
}
|
|
|
|
|
Major calling convention code refactoring.
Instead of awkwardly encoding calling-convention information with ISD::CALL,
ISD::FORMAL_ARGUMENTS, ISD::RET, and ISD::ARG_FLAGS nodes, TargetLowering
provides three virtual functions for targets to override:
LowerFormalArguments, LowerCall, and LowerRet, which replace the custom
lowering done on the special nodes. They provide the same information, but
in a more immediately usable format.
This also reworks much of the target-independent tail call logic. The
decision of whether or not to perform a tail call is now cleanly split
between target-independent portions, and the target dependent portion
in IsEligibleForTailCallOptimization.
This also synchronizes all in-tree targets, to help enable future
refactoring and feature work.
llvm-svn: 78142
2009-08-05 09:29:28 +08:00
|
|
|
/// LowerCallResult - Lower the result values of a call into the
|
|
|
|
/// appropriate copies out of appropriate physical registers.
|
2014-09-26 18:06:12 +08:00
|
|
|
SDValue MipsTargetLowering::LowerCallResult(
|
|
|
|
SDValue Chain, SDValue InFlag, CallingConv::ID CallConv, bool IsVarArg,
|
2016-06-12 23:39:02 +08:00
|
|
|
const SmallVectorImpl<ISD::InputArg> &Ins, const SDLoc &DL,
|
|
|
|
SelectionDAG &DAG, SmallVectorImpl<SDValue> &InVals,
|
2014-09-26 18:06:12 +08:00
|
|
|
TargetLowering::CallLoweringInfo &CLI) const {
|
2007-06-06 15:42:06 +08:00
|
|
|
// Assign locations to each value returned by this call.
|
|
|
|
SmallVector<CCValAssign, 16> RVLocs;
|
2014-09-26 18:06:12 +08:00
|
|
|
MipsCCState CCInfo(CallConv, IsVarArg, DAG.getMachineFunction(), RVLocs,
|
|
|
|
*DAG.getContext());
|
2017-04-26 19:10:38 +08:00
|
|
|
|
|
|
|
const ExternalSymbolSDNode *ES =
|
|
|
|
dyn_cast_or_null<const ExternalSymbolSDNode>(CLI.Callee.getNode());
|
|
|
|
CCInfo.AnalyzeCallResult(Ins, RetCC_Mips, CLI.RetTy,
|
|
|
|
ES ? ES->getSymbol() : nullptr);
|
2007-06-06 15:42:06 +08:00
|
|
|
|
|
|
|
// Copy all of the result registers out of their specified physreg.
|
|
|
|
for (unsigned i = 0; i != RVLocs.size(); ++i) {
|
2014-09-25 20:15:05 +08:00
|
|
|
CCValAssign &VA = RVLocs[i];
|
|
|
|
assert(VA.isRegLoc() && "Can only return in registers!");
|
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
SDValue Val = DAG.getCopyFromReg(Chain, DL, RVLocs[i].getLocReg(),
|
2013-03-06 06:41:55 +08:00
|
|
|
RVLocs[i].getLocVT(), InFlag);
|
|
|
|
Chain = Val.getValue(1);
|
|
|
|
InFlag = Val.getValue(2);
|
|
|
|
|
2014-09-25 20:15:05 +08:00
|
|
|
if (VA.isUpperBitsInLoc()) {
|
|
|
|
unsigned ValSizeInBits = Ins[i].ArgVT.getSizeInBits();
|
|
|
|
unsigned LocSizeInBits = VA.getLocVT().getSizeInBits();
|
|
|
|
unsigned Shift =
|
|
|
|
VA.getLocInfo() == CCValAssign::ZExtUpper ? ISD::SRL : ISD::SRA;
|
|
|
|
Val = DAG.getNode(
|
|
|
|
Shift, DL, VA.getLocVT(), Val,
|
2015-04-28 22:05:47 +08:00
|
|
|
DAG.getConstant(LocSizeInBits - ValSizeInBits, DL, VA.getLocVT()));
|
2014-09-25 20:15:05 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
switch (VA.getLocInfo()) {
|
|
|
|
default:
|
|
|
|
llvm_unreachable("Unknown loc info!");
|
|
|
|
case CCValAssign::Full:
|
|
|
|
break;
|
|
|
|
case CCValAssign::BCvt:
|
|
|
|
Val = DAG.getNode(ISD::BITCAST, DL, VA.getValVT(), Val);
|
|
|
|
break;
|
|
|
|
case CCValAssign::AExt:
|
|
|
|
case CCValAssign::AExtUpper:
|
|
|
|
Val = DAG.getNode(ISD::TRUNCATE, DL, VA.getValVT(), Val);
|
|
|
|
break;
|
|
|
|
case CCValAssign::ZExt:
|
|
|
|
case CCValAssign::ZExtUpper:
|
|
|
|
Val = DAG.getNode(ISD::AssertZext, DL, VA.getLocVT(), Val,
|
|
|
|
DAG.getValueType(VA.getValVT()));
|
|
|
|
Val = DAG.getNode(ISD::TRUNCATE, DL, VA.getValVT(), Val);
|
|
|
|
break;
|
|
|
|
case CCValAssign::SExt:
|
|
|
|
case CCValAssign::SExtUpper:
|
|
|
|
Val = DAG.getNode(ISD::AssertSext, DL, VA.getLocVT(), Val,
|
|
|
|
DAG.getValueType(VA.getValVT()));
|
|
|
|
Val = DAG.getNode(ISD::TRUNCATE, DL, VA.getValVT(), Val);
|
|
|
|
break;
|
|
|
|
}
|
2013-03-06 06:41:55 +08:00
|
|
|
|
|
|
|
InVals.push_back(Val);
|
2007-06-06 15:42:06 +08:00
|
|
|
}
|
2007-11-05 11:02:32 +08:00
|
|
|
|
Major calling convention code refactoring.
Instead of awkwardly encoding calling-convention information with ISD::CALL,
ISD::FORMAL_ARGUMENTS, ISD::RET, and ISD::ARG_FLAGS nodes, TargetLowering
provides three virtual functions for targets to override:
LowerFormalArguments, LowerCall, and LowerRet, which replace the custom
lowering done on the special nodes. They provide the same information, but
in a more immediately usable format.
This also reworks much of the target-independent tail call logic. The
decision of whether or not to perform a tail call is now cleanly split
between target-independent portions, and the target dependent portion
in IsEligibleForTailCallOptimization.
This also synchronizes all in-tree targets, to help enable future
refactoring and feature work.
llvm-svn: 78142
2009-08-05 09:29:28 +08:00
|
|
|
return Chain;
|
2007-06-06 15:42:06 +08:00
|
|
|
}
|
|
|
|
|
2014-11-08 00:54:21 +08:00
|
|
|
/// Recover an argument of value type VA.getValVT() from Val, which holds the
/// contents of the argument's location (type VA.getLocVT()). ArgVT supplies
/// the bit width used to compute the shift when the value sits in the upper
/// bits of its location. Returns the unpacked value.
static SDValue UnpackFromArgumentSlot(SDValue Val, const CCValAssign &VA,
                                      EVT ArgVT, const SDLoc &DL,
                                      SelectionDAG &DAG) {
  const MVT SlotVT = VA.getLocVT();
  const EVT ResultVT = VA.getValVT();
  const CCValAssign::LocInfo Info = VA.getLocInfo();

  // Values stored in the upper bits of the slot are shifted down first:
  // logically for ZExtUpper, arithmetically for AExtUpper and SExtUpper.
  const bool InUpperBits = Info == CCValAssign::AExtUpper ||
                           Info == CCValAssign::SExtUpper ||
                           Info == CCValAssign::ZExtUpper;
  if (InUpperBits) {
    const unsigned ValueBits = ArgVT.getSizeInBits();
    const unsigned SlotBits = SlotVT.getSizeInBits();
    const unsigned ShiftOpc =
        Info == CCValAssign::ZExtUpper ? ISD::SRL : ISD::SRA;
    Val = DAG.getNode(ShiftOpc, DL, SlotVT, Val,
                      DAG.getConstant(SlotBits - ValueBits, DL, SlotVT));
  }

  // If this is a value smaller than the argument slot size (32-bit for O32,
  // 64-bit for N32/N64), it has been promoted in some way to the argument
  // slot size. Extract the value and attach the matching sign/zero extension
  // assertion where one applies.
  switch (Info) {
  case CCValAssign::Full:
    return Val;
  case CCValAssign::BCvt:
    return DAG.getNode(ISD::BITCAST, DL, ResultVT, Val);
  case CCValAssign::AExt:
  case CCValAssign::AExtUpper:
    return DAG.getNode(ISD::TRUNCATE, DL, ResultVT, Val);
  case CCValAssign::SExt:
  case CCValAssign::SExtUpper:
    Val = DAG.getNode(ISD::AssertSext, DL, SlotVT, Val,
                      DAG.getValueType(ResultVT));
    return DAG.getNode(ISD::TRUNCATE, DL, ResultVT, Val);
  case CCValAssign::ZExt:
  case CCValAssign::ZExtUpper:
    Val = DAG.getNode(ISD::AssertZext, DL, SlotVT, Val,
                      DAG.getValueType(ResultVT));
    return DAG.getNode(ISD::TRUNCATE, DL, ResultVT, Val);
  default:
    llvm_unreachable("Unknown loc info!");
  }
}
|
|
|
|
|
2011-04-16 05:51:11 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
Major calling convention code refactoring.
Instead of awkwardly encoding calling-convention information with ISD::CALL,
ISD::FORMAL_ARGUMENTS, ISD::RET, and ISD::ARG_FLAGS nodes, TargetLowering
provides three virtual functions for targets to override:
LowerFormalArguments, LowerCall, and LowerRet, which replace the custom
lowering done on the special nodes. They provide the same information, but
in a more immediately usable format.
This also reworks much of the target-independent tail call logic. The
decision of whether or not to perform a tail call is now cleanly split
between target-independent portions, and the target dependent portion
in IsEligibleForTailCallOptimization.
This also synchronizes all in-tree targets, to help enable future
refactoring and feature work.
llvm-svn: 78142
2009-08-05 09:29:28 +08:00
|
|
|
// Formal Arguments Calling Convention Implementation
|
2011-04-16 05:51:11 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
2010-11-23 11:31:01 +08:00
|
|
|
/// LowerFormalArguments - transform physical registers into virtual registers
|
2010-02-07 03:20:49 +08:00
|
|
|
/// and generate load operations for arguments placed on the stack.
|
2016-06-12 23:39:02 +08:00
|
|
|
SDValue MipsTargetLowering::LowerFormalArguments(
|
|
|
|
SDValue Chain, CallingConv::ID CallConv, bool IsVarArg,
|
|
|
|
const SmallVectorImpl<ISD::InputArg> &Ins, const SDLoc &DL,
|
|
|
|
SelectionDAG &DAG, SmallVectorImpl<SDValue> &InVals) const {
|
2008-08-04 15:12:52 +08:00
|
|
|
MachineFunction &MF = DAG.getMachineFunction();
|
2016-07-29 02:40:00 +08:00
|
|
|
MachineFrameInfo &MFI = MF.getFrameInfo();
|
2007-08-28 13:08:16 +08:00
|
|
|
MipsFunctionInfo *MipsFI = MF.getInfo<MipsFunctionInfo>();
|
2007-07-12 07:16:16 +08:00
|
|
|
|
2010-04-17 22:41:14 +08:00
|
|
|
MipsFI->setVarArgsFrameIndex(0);
|
2007-06-06 15:42:06 +08:00
|
|
|
|
2010-02-07 03:20:49 +08:00
|
|
|
// Used with vargs to accumulate store chains.
|
|
|
|
std::vector<SDValue> OutChains;
|
|
|
|
|
2007-06-06 15:42:06 +08:00
|
|
|
// Assign locations to all of the incoming arguments.
|
|
|
|
SmallVector<CCValAssign, 16> ArgLocs;
|
2014-11-03 00:09:29 +08:00
|
|
|
MipsCCState CCInfo(CallConv, IsVarArg, DAG.getMachineFunction(), ArgLocs,
|
|
|
|
*DAG.getContext());
|
2014-11-07 23:33:08 +08:00
|
|
|
CCInfo.AllocateStack(ABI.GetCalleeAllocdArgSizeInBytes(CallConv), 1);
|
2015-10-26 20:38:43 +08:00
|
|
|
const Function *Func = DAG.getMachineFunction().getFunction();
|
|
|
|
Function::const_arg_iterator FuncArg = Func->arg_begin();
|
|
|
|
|
2015-10-26 22:24:30 +08:00
|
|
|
if (Func->hasFnAttribute("interrupt") && !Func->arg_empty())
|
|
|
|
report_fatal_error(
|
|
|
|
"Functions with the interrupt attribute cannot have arguments!");
|
2007-07-12 07:16:16 +08:00
|
|
|
|
2014-11-07 00:36:30 +08:00
|
|
|
CCInfo.AnalyzeFormalArguments(Ins, CC_Mips_FixedArg);
|
2012-10-31 03:37:25 +08:00
|
|
|
MipsFI->setFormalArgInfo(CCInfo.getNextStackOffset(),
|
2014-11-03 00:09:29 +08:00
|
|
|
CCInfo.getInRegsParamsCount() > 0);
|
2009-03-19 10:12:28 +08:00
|
|
|
|
2012-10-27 08:44:39 +08:00
|
|
|
unsigned CurArgIdx = 0;
|
2014-11-03 00:09:29 +08:00
|
|
|
CCInfo.rewindByValRegsInfo();
|
Several changes to Mips backend, experimental fp support being the most
important.
- Cleanup in the Subtarget info with addition of new features, not all support
yet, but they allow the future inclusion of features easier. Among new features,
we have : Arch family info (mips1, mips2, ...), ABI info (o32, eabi), 64-bit
integer
and float registers, allegrex vector FPU (VFPU), single float only support.
- TargetMachine now detects allegrex core.
- Added allegrex (Mips32r2) sext_inreg instructions.
- *Added Float Point Instructions*, handling single float only, and
aliased accesses for 32-bit FPUs.
- Some cleanup in FP instruction formats and FP register classes.
- Calling conventions improved to support mips 32-bit EABI.
- Added Asm Printer support for fp cond codes.
- Added support for sret copy to a return register.
- EABI support added into LowerCALL and FORMAL_ARGS.
- MipsFunctionInfo now keeps a virtual register per function to track the
sret on function entry until function ret.
- MipsInstrInfo FP support into methods (isMoveInstr, isLoadFromStackSlot, ...),
FP cond codes mapping and initial FP Branch Analysis.
- Two new Mips SDNode to handle fp branch and compare instructions : FPBrcond,
FPCmp
- MipsTargetLowering : handling different FP classes, Allegrex support, sret
return copy, no homing location within EABI, non 32-bit stack objects
arguments, and asm constraint for float.
llvm-svn: 53146
2008-07-06 03:05:21 +08:00
|
|
|
|
2012-10-27 08:44:39 +08:00
|
|
|
for (unsigned i = 0, e = ArgLocs.size(); i != e; ++i) {
|
2007-06-06 15:42:06 +08:00
|
|
|
CCValAssign &VA = ArgLocs[i];
|
2015-02-17 02:10:47 +08:00
|
|
|
if (Ins[i].isOrigArg()) {
|
|
|
|
std::advance(FuncArg, Ins[i].getOrigArgIndex() - CurArgIdx);
|
|
|
|
CurArgIdx = Ins[i].getOrigArgIndex();
|
|
|
|
}
|
2011-10-29 03:55:48 +08:00
|
|
|
EVT ValVT = VA.getValVT();
|
2011-11-12 10:29:58 +08:00
|
|
|
ISD::ArgFlagsTy Flags = Ins[i].Flags;
|
|
|
|
bool IsRegLoc = VA.isRegLoc();
|
|
|
|
|
|
|
|
if (Flags.isByVal()) {
|
2015-02-17 02:10:47 +08:00
|
|
|
assert(Ins[i].isOrigArg() && "Byval arguments cannot be implicit");
|
2014-11-03 00:09:29 +08:00
|
|
|
unsigned FirstByValReg, LastByValReg;
|
|
|
|
unsigned ByValIdx = CCInfo.getInRegsParamsProcessed();
|
|
|
|
CCInfo.getInRegsParamInfo(ByValIdx, FirstByValReg, LastByValReg);
|
|
|
|
|
2011-11-12 10:29:58 +08:00
|
|
|
assert(Flags.getByValSize() &&
|
|
|
|
"ByVal args of size 0 should have been ignored by front-end.");
|
2014-11-03 00:09:29 +08:00
|
|
|
assert(ByValIdx < CCInfo.getInRegsParamsCount());
|
2013-03-12 08:16:36 +08:00
|
|
|
copyByValRegs(Chain, DL, OutChains, DAG, Flags, InVals, &*FuncArg,
|
2014-11-07 23:33:08 +08:00
|
|
|
FirstByValReg, LastByValReg, VA, CCInfo);
|
2014-11-03 00:09:29 +08:00
|
|
|
CCInfo.nextInRegsParam();
|
2011-11-12 10:29:58 +08:00
|
|
|
continue;
|
|
|
|
}
|
2007-06-06 15:42:06 +08:00
|
|
|
|
|
|
|
// Arguments stored on registers
|
2011-11-12 10:29:58 +08:00
|
|
|
if (IsRegLoc) {
|
2013-10-29 05:21:36 +08:00
|
|
|
MVT RegVT = VA.getLocVT();
|
2011-05-24 08:23:52 +08:00
|
|
|
unsigned ArgReg = VA.getLocReg();
|
2013-10-29 05:21:36 +08:00
|
|
|
const TargetRegisterClass *RC = getRegClassFor(RegVT);
|
2007-06-06 15:42:06 +08:00
|
|
|
|
2010-11-23 11:31:01 +08:00
|
|
|
// Transform the arguments stored on
|
2007-06-06 15:42:06 +08:00
|
|
|
// physical registers into virtual ones
|
2013-03-12 08:16:36 +08:00
|
|
|
unsigned Reg = addLiveIn(DAG.getMachineFunction(), ArgReg, RC);
|
|
|
|
SDValue ArgValue = DAG.getCopyFromReg(Chain, DL, Reg, RegVT);
|
2010-11-23 11:31:01 +08:00
|
|
|
|
2014-11-08 00:54:21 +08:00
|
|
|
ArgValue = UnpackFromArgumentSlot(ArgValue, VA, Ins[i].ArgVT, DL, DAG);
|
2009-03-19 10:12:28 +08:00
|
|
|
|
2013-03-06 06:13:04 +08:00
|
|
|
// Handle floating point arguments passed in integer registers and
|
|
|
|
// long double arguments passed in floating point registers.
|
2011-10-29 03:55:48 +08:00
|
|
|
if ((RegVT == MVT::i32 && ValVT == MVT::f32) ||
|
2013-03-06 06:13:04 +08:00
|
|
|
(RegVT == MVT::i64 && ValVT == MVT::f64) ||
|
|
|
|
(RegVT == MVT::f64 && ValVT == MVT::i64))
|
2013-03-12 08:16:36 +08:00
|
|
|
ArgValue = DAG.getNode(ISD::BITCAST, DL, ValVT, ArgValue);
|
2015-01-30 07:27:36 +08:00
|
|
|
else if (ABI.IsO32() && RegVT == MVT::i32 &&
|
2014-07-03 07:18:40 +08:00
|
|
|
ValVT == MVT::f64) {
|
2013-03-12 08:16:36 +08:00
|
|
|
unsigned Reg2 = addLiveIn(DAG.getMachineFunction(),
|
2011-10-29 03:55:48 +08:00
|
|
|
getNextIntArgReg(ArgReg), RC);
|
2013-03-12 08:16:36 +08:00
|
|
|
SDValue ArgValue2 = DAG.getCopyFromReg(Chain, DL, Reg2, RegVT);
|
2014-07-19 06:55:25 +08:00
|
|
|
if (!Subtarget.isLittle())
|
2011-10-29 03:55:48 +08:00
|
|
|
std::swap(ArgValue, ArgValue2);
|
2013-03-12 08:16:36 +08:00
|
|
|
ArgValue = DAG.getNode(MipsISD::BuildPairF64, DL, MVT::f64,
|
2011-10-29 03:55:48 +08:00
|
|
|
ArgValue, ArgValue2);
|
2009-03-19 10:12:28 +08:00
|
|
|
}
|
2007-06-06 15:42:06 +08:00
|
|
|
|
Major calling convention code refactoring.
Instead of awkwardly encoding calling-convention information with ISD::CALL,
ISD::FORMAL_ARGUMENTS, ISD::RET, and ISD::ARG_FLAGS nodes, TargetLowering
provides three virtual functions for targets to override:
LowerFormalArguments, LowerCall, and LowerRet, which replace the custom
lowering done on the special nodes. They provide the same information, but
in a more immediately usable format.
This also reworks much of the target-independent tail call logic. The
decision of whether or not to perform a tail call is now cleanly split
between target-independent portions, and the target dependent portion
in IsEligibleForTailCallOptimization.
This also synchronizes all in-tree targets, to help enable future
refactoring and feature work.
llvm-svn: 78142
2009-08-05 09:29:28 +08:00
|
|
|
InVals.push_back(ArgValue);
|
Several changes to Mips backend, experimental fp support being the most
important.
- Cleanup in the Subtarget info with addition of new features, not all support
yet, but they allow the future inclusion of features easier. Among new features,
we have : Arch family info (mips1, mips2, ...), ABI info (o32, eabi), 64-bit
integer
and float registers, allegrex vector FPU (VFPU), single float only support.
- TargetMachine now detects allegrex core.
- Added allegrex (Mips32r2) sext_inreg instructions.
- *Added Float Point Instructions*, handling single float only, and
aliased accesses for 32-bit FPUs.
- Some cleanup in FP instruction formats and FP register classes.
- Calling conventions improved to support mips 32-bit EABI.
- Added Asm Printer support for fp cond codes.
- Added support for sret copy to a return register.
- EABI support added into LowerCALL and FORMAL_ARGS.
- MipsFunctionInfo now keeps a virtual register per function to track the
sret on function entry until function ret.
- MipsInstrInfo FP support into methods (isMoveInstr, isLoadFromStackSlot, ...),
FP cond codes mapping and initial FP Branch Analysis.
- Two new Mips SDNode to handle fp branch and compare instructions : FPBrcond,
FPCmp
- MipsTargetLowering : handling different FP classes, Allegrex support, sret
return copy, no homing location within EABI, non 32-bit stack objects
arguments, and asm constraint for float.
llvm-svn: 53146
2008-07-06 03:05:21 +08:00
|
|
|
} else { // VA.isRegLoc()
|
2014-11-08 00:54:21 +08:00
|
|
|
MVT LocVT = VA.getLocVT();
|
|
|
|
|
2015-01-30 07:27:36 +08:00
|
|
|
if (ABI.IsO32()) {
|
2014-11-08 00:54:21 +08:00
|
|
|
// We ought to be able to use LocVT directly but O32 sets it to i32
|
|
|
|
// when allocating floating point values to integer registers.
|
|
|
|
// This shouldn't influence how we load the value into registers unless
|
2015-08-09 02:27:36 +08:00
|
|
|
// we are targeting softfloat.
|
2015-05-08 07:10:21 +08:00
|
|
|
if (VA.getValVT().isFloatingPoint() && !Subtarget.useSoftFloat())
|
2014-11-08 00:54:21 +08:00
|
|
|
LocVT = VA.getValVT();
|
|
|
|
}
|
Several changes to Mips backend, experimental fp support being the most
important.
- Cleanup in the Subtarget info with addition of new features, not all support
yet, but they allow the future inclusion of features easier. Among new features,
we have : Arch family info (mips1, mips2, ...), ABI info (o32, eabi), 64-bit
integer
and float registers, allegrex vector FPU (VFPU), single float only support.
- TargetMachine now detects allegrex core.
- Added allegrex (Mips32r2) sext_inreg instructions.
- *Added Float Point Instructions*, handling single float only, and
aliased accesses for 32-bit FPUs.
- Some cleanup in FP instruction formats and FP register classes.
- Calling conventions improved to support mips 32-bit EABI.
- Added Asm Printer support for fp cond codes.
- Added support for sret copy to a return register.
- EABI support added into LowerCALL and FORMAL_ARGS.
- MipsFunctionInfo now keeps a virtual register per function to track the
sret on function entry until function ret.
- MipsInstrInfo FP support into methods (isMoveInstr, isLoadFromStackSlot, ...),
FP cond codes mapping and initial FP Branch Analysis.
- Two new Mips SDNode to handle fp branch and compare instructions : FPBrcond,
FPCmp
- MipsTargetLowering : handling different FP classes, Allegrex support, sret
return copy, no homing location within EABI, non 32-bit stack objects
arguments, and asm constraint for float.
llvm-svn: 53146
2008-07-06 03:05:21 +08:00
|
|
|
|
2007-06-06 15:42:06 +08:00
|
|
|
// sanity check
|
|
|
|
assert(VA.isMemLoc());
|
2010-02-07 03:20:49 +08:00
|
|
|
|
2010-11-23 11:31:01 +08:00
|
|
|
// The stack pointer offset is relative to the caller stack frame.
|
2016-07-29 02:40:00 +08:00
|
|
|
int FI = MFI.CreateFixedObject(LocVT.getSizeInBits() / 8,
|
|
|
|
VA.getLocMemOffset(), true);
|
2007-06-06 15:42:06 +08:00
|
|
|
|
|
|
|
// Create load nodes to retrieve arguments from the stack
|
2015-07-09 10:09:04 +08:00
|
|
|
SDValue FIN = DAG.getFrameIndex(FI, getPointerTy(DAG.getDataLayout()));
|
2015-08-12 07:09:45 +08:00
|
|
|
SDValue ArgValue = DAG.getLoad(
|
|
|
|
LocVT, DL, Chain, FIN,
|
[SelectionDAG] Get rid of bool parameters in SelectionDAG::getLoad, getStore, and friends.
Summary:
Instead, we take a single flags arg (a bitset).
Also add a default 0 alignment, and change the order of arguments so the
alignment comes before the flags.
This greatly simplifies many callsites, and fixes a bug in
AMDGPUISelLowering, wherein the order of the args to getLoad was
inverted. It also greatly simplifies the process of adding another flag
to getLoad.
Reviewers: chandlerc, tstellarAMD
Subscribers: jholewinski, arsenm, jyknight, dsanders, nemanjai, llvm-commits
Differential Revision: http://reviews.llvm.org/D22249
llvm-svn: 275592
2016-07-16 02:27:10 +08:00
|
|
|
MachinePointerInfo::getFixedStack(DAG.getMachineFunction(), FI));
|
2014-11-08 00:54:21 +08:00
|
|
|
OutChains.push_back(ArgValue.getValue(1));
|
|
|
|
|
|
|
|
ArgValue = UnpackFromArgumentSlot(ArgValue, VA, Ins[i].ArgVT, DL, DAG);
|
|
|
|
|
|
|
|
InVals.push_back(ArgValue);
|
2007-06-06 15:42:06 +08:00
|
|
|
}
|
2014-05-13 06:01:27 +08:00
|
|
|
}
|
Several changes to Mips backend, experimental fp support being the most
important.
- Cleanup in the Subtarget info with addition of new features, not all support
yet, but they allow the future inclusion of features easier. Among new features,
we have : Arch family info (mips1, mips2, ...), ABI info (o32, eabi), 64-bit
integer
and float registers, allegrex vector FPU (VFPU), single float only support.
- TargetMachine now detects allegrex core.
- Added allegrex (Mips32r2) sext_inreg instructions.
- *Added Float Point Instructions*, handling single float only, and
aliased accesses for 32-bit FPUs.
- Some cleanup in FP instruction formats and FP register classes.
- Calling conventions improved to support mips 32-bit EABI.
- Added Asm Printer support for fp cond codes.
- Added support for sret copy to a return register.
- EABI support added into LowerCALL and FORMAL_ARGS.
- MipsFunctionInfo now keeps a virtual register per function to track the
sret on function entry until function ret.
- MipsInstrInfo FP support into methods (isMoveInstr, isLoadFromStackSlot, ...),
FP cond codes mapping and initial FP Branch Analysis.
- Two new Mips SDNode to handle fp branch and compare instructions : FPBrcond,
FPCmp
- MipsTargetLowering : handling different FP classes, Allegrex support, sret
return copy, no homing location within EABI, non 32-bit stack objects
arguments, and asm constraint for float.
llvm-svn: 53146
2008-07-06 03:05:21 +08:00
|
|
|
|
2014-05-13 06:01:27 +08:00
|
|
|
for (unsigned i = 0, e = ArgLocs.size(); i != e; ++i) {
|
2014-05-10 06:32:13 +08:00
|
|
|
// The mips ABIs for returning structs by value requires that we copy
|
|
|
|
// the sret argument into $v0 for the return. Save the argument into
|
|
|
|
// a virtual register so that we can access it from the return points.
|
2014-05-13 06:01:27 +08:00
|
|
|
if (Ins[i].Flags.isSRet()) {
|
2014-05-10 06:32:13 +08:00
|
|
|
unsigned Reg = MipsFI->getSRetReturnReg();
|
|
|
|
if (!Reg) {
|
|
|
|
Reg = MF.getRegInfo().createVirtualRegister(
|
2015-01-30 07:27:36 +08:00
|
|
|
getRegClassFor(ABI.IsN64() ? MVT::i64 : MVT::i32));
|
2014-05-10 06:32:13 +08:00
|
|
|
MipsFI->setSRetReturnReg(Reg);
|
|
|
|
}
|
2014-05-13 06:01:27 +08:00
|
|
|
SDValue Copy = DAG.getCopyToReg(DAG.getEntryNode(), DL, Reg, InVals[i]);
|
2014-05-10 06:32:13 +08:00
|
|
|
Chain = DAG.getNode(ISD::TokenFactor, DL, MVT::Other, Copy, Chain);
|
2014-05-13 06:01:27 +08:00
|
|
|
break;
|
Several changes to Mips backend, experimental fp support being the most
important.
- Cleanup in the Subtarget info with addition of new features, not all support
yet, but they allow the future inclusion of features easier. Among new features,
we have : Arch family info (mips1, mips2, ...), ABI info (o32, eabi), 64-bit
integer
and float registers, allegrex vector FPU (VFPU), single float only support.
- TargetMachine now detects allegrex core.
- Added allegrex (Mips32r2) sext_inreg instructions.
- *Added Float Point Instructions*, handling single float only, and
aliased accesses for 32-bit FPUs.
- Some cleanup in FP instruction formats and FP register classes.
- Calling conventions improved to support mips 32-bit EABI.
- Added Asm Printer support for fp cond codes.
- Added support for sret copy to a return register.
- EABI support added into LowerCALL and FORMAL_ARGS.
- MipsFunctionInfo now keeps a virtual register per function to track the
sret on function entry until function ret.
- MipsInstrInfo FP support into methods (isMoveInstr, isLoadFromStackSlot, ...),
FP cond codes mapping and initial FP Branch Analysis.
- Two new Mips SDNode to handle fp branch and compare instructions : FPBrcond,
FPCmp
- MipsTargetLowering : handling different FP classes, Allegrex support, sret
return copy, no homing location within EABI, non 32-bit stack objects
arguments, and asm constraint for float.
llvm-svn: 53146
2008-07-06 03:05:21 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
if (IsVarArg)
|
2014-11-07 23:33:08 +08:00
|
|
|
writeVarArgRegs(OutChains, Chain, DL, DAG, CCInfo);
|
2010-02-07 03:20:49 +08:00
|
|
|
|
2010-11-23 11:31:01 +08:00
|
|
|
// All stores are grouped in one node to allow the matching between
|
2010-02-07 03:20:49 +08:00
|
|
|
// the size of Ins and InVals. This only happens in vararg functions.
|
|
|
|
if (!OutChains.empty()) {
|
|
|
|
OutChains.push_back(Chain);
|
2014-04-27 02:35:24 +08:00
|
|
|
Chain = DAG.getNode(ISD::TokenFactor, DL, MVT::Other, OutChains);
|
2010-02-07 03:20:49 +08:00
|
|
|
}
|
|
|
|
|
Major calling convention code refactoring.
Instead of awkwardly encoding calling-convention information with ISD::CALL,
ISD::FORMAL_ARGUMENTS, ISD::RET, and ISD::ARG_FLAGS nodes, TargetLowering
provides three virtual functions for targets to override:
LowerFormalArguments, LowerCall, and LowerRet, which replace the custom
lowering done on the special nodes. They provide the same information, but
in a more immediately usable format.
This also reworks much of the target-independent tail call logic. The
decision of whether or not to perform a tail call is now cleanly split
between target-independent portions, and the target dependent portion
in IsEligibleForTailCallOptimization.
This also synchronizes all in-tree targets, to help enable future
refactoring and feature work.
llvm-svn: 78142
2009-08-05 09:29:28 +08:00
|
|
|
return Chain;
|
2007-06-06 15:42:06 +08:00
|
|
|
}
|
|
|
|
|
2011-04-16 05:51:11 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
2007-06-06 15:42:06 +08:00
|
|
|
// Return Value Calling Convention Implementation
|
2011-04-16 05:51:11 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
2007-06-06 15:42:06 +08:00
|
|
|
|
2012-10-10 09:27:09 +08:00
|
|
|
bool
|
|
|
|
MipsTargetLowering::CanLowerReturn(CallingConv::ID CallConv,
|
2013-03-12 08:16:36 +08:00
|
|
|
MachineFunction &MF, bool IsVarArg,
|
2012-10-10 09:27:09 +08:00
|
|
|
const SmallVectorImpl<ISD::OutputArg> &Outs,
|
|
|
|
LLVMContext &Context) const {
|
|
|
|
SmallVector<CCValAssign, 16> RVLocs;
|
2014-09-26 18:06:12 +08:00
|
|
|
MipsCCState CCInfo(CallConv, IsVarArg, MF, RVLocs, Context);
|
2012-10-10 09:27:09 +08:00
|
|
|
return CCInfo.CheckReturn(Outs, RetCC_Mips);
|
|
|
|
}
|
|
|
|
|
2015-03-23 20:28:13 +08:00
|
|
|
bool
|
|
|
|
MipsTargetLowering::shouldSignExtendTypeInLibCall(EVT Type, bool IsSigned) const {
|
2015-05-08 07:10:21 +08:00
|
|
|
if (Subtarget.hasMips3() && Subtarget.useSoftFloat()) {
|
2015-03-23 20:28:13 +08:00
|
|
|
if (Type == MVT::i32)
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
return IsSigned;
|
|
|
|
}
|
|
|
|
|
Major calling convention code refactoring.
Instead of awkwardly encoding calling-convention information with ISD::CALL,
ISD::FORMAL_ARGUMENTS, ISD::RET, and ISD::ARG_FLAGS nodes, TargetLowering
provides three virtual functions for targets to override:
LowerFormalArguments, LowerCall, and LowerRet, which replace the custom
lowering done on the special nodes. They provide the same information, but
in a more immediately usable format.
This also reworks much of the target-independent tail call logic. The
decision of whether or not to perform a tail call is now cleanly split
between target-independent portions, and the target dependent portion
in IsEligibleForTailCallOptimization.
This also synchronizes all in-tree targets, to help enable future
refactoring and feature work.
llvm-svn: 78142
2009-08-05 09:29:28 +08:00
|
|
|
/// Build the return node for an interrupt handler.
///
/// Marks the current function as an ISR in its MipsFunctionInfo and then
/// emits a MipsISD::ERet node carrying the already-assembled \p RetOps.
SDValue
MipsTargetLowering::LowerInterruptReturn(SmallVectorImpl<SDValue> &RetOps,
                                         const SDLoc &DL,
                                         SelectionDAG &DAG) const {
  // Record on the per-function info that this function is an ISR.
  MipsFunctionInfo *FuncInfo =
      DAG.getMachineFunction().getInfo<MipsFunctionInfo>();
  FuncInfo->setISR();

  return DAG.getNode(MipsISD::ERet, DL, MVT::Other, RetOps);
}
|
|
|
|
|
|
|
|
SDValue
|
|
|
|
MipsTargetLowering::LowerReturn(SDValue Chain, CallingConv::ID CallConv,
|
|
|
|
bool IsVarArg,
|
Major calling convention code refactoring.
Instead of awkwardly encoding calling-convention information with ISD::CALL,
ISD::FORMAL_ARGUMENTS, ISD::RET, and ISD::ARG_FLAGS nodes, TargetLowering
provides three virtual functions for targets to override:
LowerFormalArguments, LowerCall, and LowerRet, which replace the custom
lowering done on the special nodes. They provide the same information, but
in a more immediately usable format.
This also reworks much of the target-independent tail call logic. The
decision of whether or not to perform a tail call is now cleanly split
between target-independent portions, and the target dependent portion
in IsEligibleForTailCallOptimization.
This also synchronizes all in-tree targets, to help enable future
refactoring and feature work.
llvm-svn: 78142
2009-08-05 09:29:28 +08:00
|
|
|
const SmallVectorImpl<ISD::OutputArg> &Outs,
|
2010-07-07 23:54:55 +08:00
|
|
|
const SmallVectorImpl<SDValue> &OutVals,
|
2016-06-12 23:39:02 +08:00
|
|
|
const SDLoc &DL, SelectionDAG &DAG) const {
|
2007-06-06 15:42:06 +08:00
|
|
|
// CCValAssign - represent the assignment of
|
|
|
|
// the return value to a location
|
|
|
|
SmallVector<CCValAssign, 16> RVLocs;
|
2013-03-06 06:41:55 +08:00
|
|
|
MachineFunction &MF = DAG.getMachineFunction();
|
2007-06-06 15:42:06 +08:00
|
|
|
|
|
|
|
// CCState - Info about the registers and stack slot.
|
2014-09-26 18:06:12 +08:00
|
|
|
MipsCCState CCInfo(CallConv, IsVarArg, MF, RVLocs, *DAG.getContext());
|
2007-06-06 15:42:06 +08:00
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
// Analyze return values.
|
2014-09-26 18:06:12 +08:00
|
|
|
CCInfo.AnalyzeReturn(Outs, RetCC_Mips);
|
2007-06-06 15:42:06 +08:00
|
|
|
|
2008-07-28 05:46:04 +08:00
|
|
|
SDValue Flag;
|
2013-02-06 02:12:03 +08:00
|
|
|
SmallVector<SDValue, 4> RetOps(1, Chain);
|
2007-06-06 15:42:06 +08:00
|
|
|
|
|
|
|
// Copy the result values into the output registers.
|
|
|
|
for (unsigned i = 0; i != RVLocs.size(); ++i) {
|
2013-03-06 06:41:55 +08:00
|
|
|
SDValue Val = OutVals[i];
|
2007-06-06 15:42:06 +08:00
|
|
|
CCValAssign &VA = RVLocs[i];
|
|
|
|
assert(VA.isRegLoc() && "Can only return in registers!");
|
2014-09-25 20:15:05 +08:00
|
|
|
bool UseUpperBits = false;
|
|
|
|
|
|
|
|
switch (VA.getLocInfo()) {
|
|
|
|
default:
|
|
|
|
llvm_unreachable("Unknown loc info!");
|
|
|
|
case CCValAssign::Full:
|
|
|
|
break;
|
|
|
|
case CCValAssign::BCvt:
|
|
|
|
Val = DAG.getNode(ISD::BITCAST, DL, VA.getLocVT(), Val);
|
|
|
|
break;
|
|
|
|
case CCValAssign::AExtUpper:
|
|
|
|
UseUpperBits = true;
|
2016-08-17 13:10:15 +08:00
|
|
|
LLVM_FALLTHROUGH;
|
2014-09-25 20:15:05 +08:00
|
|
|
case CCValAssign::AExt:
|
|
|
|
Val = DAG.getNode(ISD::ANY_EXTEND, DL, VA.getLocVT(), Val);
|
|
|
|
break;
|
|
|
|
case CCValAssign::ZExtUpper:
|
|
|
|
UseUpperBits = true;
|
2016-08-17 13:10:15 +08:00
|
|
|
LLVM_FALLTHROUGH;
|
2014-09-25 20:15:05 +08:00
|
|
|
case CCValAssign::ZExt:
|
|
|
|
Val = DAG.getNode(ISD::ZERO_EXTEND, DL, VA.getLocVT(), Val);
|
|
|
|
break;
|
|
|
|
case CCValAssign::SExtUpper:
|
|
|
|
UseUpperBits = true;
|
2016-08-17 13:10:15 +08:00
|
|
|
LLVM_FALLTHROUGH;
|
2014-09-25 20:15:05 +08:00
|
|
|
case CCValAssign::SExt:
|
|
|
|
Val = DAG.getNode(ISD::SIGN_EXTEND, DL, VA.getLocVT(), Val);
|
|
|
|
break;
|
|
|
|
}
|
2007-06-06 15:42:06 +08:00
|
|
|
|
2014-09-25 20:15:05 +08:00
|
|
|
if (UseUpperBits) {
|
|
|
|
unsigned ValSizeInBits = Outs[i].ArgVT.getSizeInBits();
|
|
|
|
unsigned LocSizeInBits = VA.getLocVT().getSizeInBits();
|
|
|
|
Val = DAG.getNode(
|
|
|
|
ISD::SHL, DL, VA.getLocVT(), Val,
|
2015-04-28 22:05:47 +08:00
|
|
|
DAG.getConstant(LocSizeInBits - ValSizeInBits, DL, VA.getLocVT()));
|
2014-09-25 20:15:05 +08:00
|
|
|
}
|
2013-03-06 06:41:55 +08:00
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
Chain = DAG.getCopyToReg(Chain, DL, VA.getLocReg(), Val, Flag);
|
2007-06-06 15:42:06 +08:00
|
|
|
|
2013-02-06 02:12:03 +08:00
|
|
|
// Guarantee that all emitted copies are stuck together with flags.
|
2007-06-06 15:42:06 +08:00
|
|
|
Flag = Chain.getValue(1);
|
2013-02-06 02:12:03 +08:00
|
|
|
RetOps.push_back(DAG.getRegister(VA.getLocReg(), VA.getLocVT()));
|
2007-06-06 15:42:06 +08:00
|
|
|
}
|
|
|
|
|
Several changes to Mips backend, experimental fp support being the most
important.
- Cleanup in the Subtarget info with addition of new features, not all support
yet, but they allow the future inclusion of features easier. Among new features,
we have : Arch family info (mips1, mips2, ...), ABI info (o32, eabi), 64-bit
integer
and float registers, allegrex vector FPU (VFPU), single float only support.
- TargetMachine now detects allegrex core.
- Added allegrex (Mips32r2) sext_inreg instructions.
- *Added Float Point Instructions*, handling single float only, and
aliased accesses for 32-bit FPUs.
- Some cleanup in FP instruction formats and FP register classes.
- Calling conventions improved to support mips 32-bit EABI.
- Added Asm Printer support for fp cond codes.
- Added support for sret copy to a return register.
- EABI support added into LowerCALL and FORMAL_ARGS.
- MipsFunctionInfo now keeps a virtual register per function to track the
sret on function entry until function ret.
- MipsInstrInfo FP support into methods (isMoveInstr, isLoadFromStackSlot, ...),
FP cond codes mapping and initial FP Branch Analysis.
- Two new Mips SDNode to handle fp branch and compare instructions : FPBrcond,
FPCmp
- MipsTargetLowering : handling different FP classes, Allegrex support, sret
return copy, no homing location within EABI, non 32-bit stack objects
arguments, and asm constraint for float.
llvm-svn: 53146
2008-07-06 03:05:21 +08:00
|
|
|
// The mips ABIs for returning structs by value requires that we copy
|
|
|
|
// the sret argument into $v0 for the return. We saved the argument into
|
|
|
|
// a virtual register in the entry block, so now we copy the value out
|
|
|
|
// and into $v0.
|
2013-03-06 06:41:55 +08:00
|
|
|
if (MF.getFunction()->hasStructRetAttr()) {
|
Several changes to Mips backend, experimental fp support being the most
important.
- Cleanup in the Subtarget info with addition of new features, not all support
yet, but they allow the future inclusion of features easier. Among new features,
we have : Arch family info (mips1, mips2, ...), ABI info (o32, eabi), 64-bit
integer
and float registers, allegrex vector FPU (VFPU), single float only support.
- TargetMachine now detects allegrex core.
- Added allegrex (Mips32r2) sext_inreg instructions.
- *Added Float Point Instructions*, handling single float only, and
aliased accesses for 32-bit FPUs.
- Some cleanup in FP instruction formats and FP register classes.
- Calling conventions improved to support mips 32-bit EABI.
- Added Asm Printer support for fp cond codes.
- Added support for sret copy to a return register.
- EABI support added into LowerCALL and FORMAL_ARGS.
- MipsFunctionInfo now keeps a virtual register per function to track the
sret on function entry until function ret.
- MipsInstrInfo FP support into methods (isMoveInstr, isLoadFromStackSlot, ...),
FP cond codes mapping and initial FP Branch Analysis.
- Two new Mips SDNode to handle fp branch and compare instructions : FPBrcond,
FPCmp
- MipsTargetLowering : handling different FP classes, Allegrex support, sret
return copy, no homing location within EABI, non 32-bit stack objects
arguments, and asm constraint for float.
llvm-svn: 53146
2008-07-06 03:05:21 +08:00
|
|
|
MipsFunctionInfo *MipsFI = MF.getInfo<MipsFunctionInfo>();
|
|
|
|
unsigned Reg = MipsFI->getSRetReturnReg();
|
|
|
|
|
2010-11-23 11:31:01 +08:00
|
|
|
if (!Reg)
|
2009-07-15 00:55:14 +08:00
|
|
|
llvm_unreachable("sret virtual register not created in the entry block");
|
2015-07-09 10:09:04 +08:00
|
|
|
SDValue Val =
|
|
|
|
DAG.getCopyFromReg(Chain, DL, Reg, getPointerTy(DAG.getDataLayout()));
|
2015-01-30 07:27:36 +08:00
|
|
|
unsigned V0 = ABI.IsN64() ? Mips::V0_64 : Mips::V0;
|
Several changes to Mips backend, experimental fp support being the most
important.
- Cleanup in the Subtarget info with addition of new features, not all support
yet, but they allow the future inclusion of features easier. Among new features,
we have : Arch family info (mips1, mips2, ...), ABI info (o32, eabi), 64-bit
integer
and float registers, allegrex vector FPU (VFPU), single float only support.
- TargetMachine now detects allegrex core.
- Added allegrex (Mips32r2) sext_inreg instructions.
- *Added Float Point Instructions*, handling single float only, and
aliased accesses for 32-bit FPUs.
- Some cleanup in FP instruction formats and FP register classes.
- Calling conventions improved to support mips 32-bit EABI.
- Added Asm Printer support for fp cond codes.
- Added support for sret copy to a return register.
- EABI support added into LowerCALL and FORMAL_ARGS.
- MipsFunctionInfo now keeps a virtual register per function to track the
sret on function entry until function ret.
- MipsInstrInfo FP support into methods (isMoveInstr, isLoadFromStackSlot, ...),
FP cond codes mapping and initial FP Branch Analysis.
- Two new Mips SDNode to handle fp branch and compare instructions : FPBrcond,
FPCmp
- MipsTargetLowering : handling different FP classes, Allegrex support, sret
return copy, no homing location within EABI, non 32-bit stack objects
arguments, and asm constraint for float.
llvm-svn: 53146
2008-07-06 03:05:21 +08:00
|
|
|
|
2013-03-12 08:16:36 +08:00
|
|
|
Chain = DAG.getCopyToReg(Chain, DL, V0, Val, Flag);
|
Several changes to Mips backend, experimental fp support being the most
important.
- Cleanup in the Subtarget info with addition of new features, not all support
yet, but they allow the future inclusion of features easier. Among new features,
we have : Arch family info (mips1, mips2, ...), ABI info (o32, eabi), 64-bit
integer
and float registers, allegrex vector FPU (VFPU), single float only support.
- TargetMachine now detects allegrex core.
- Added allegrex (Mips32r2) sext_inreg instructions.
- *Added Float Point Instructions*, handling single float only, and
aliased accesses for 32-bit FPUs.
- Some cleanup in FP instruction formats and FP register classes.
- Calling conventions improved to support mips 32-bit EABI.
- Added Asm Printer support for fp cond codes.
- Added support for sret copy to a return register.
- EABI support added into LowerCALL and FORMAL_ARGS.
- MipsFunctionInfo now keeps a virtual register per function to track the
sret on function entry until function ret.
- MipsInstrInfo FP support into methods (isMoveInstr, isLoadFromStackSlot, ...),
FP cond codes mapping and initial FP Branch Analysis.
- Two new Mips SDNode to handle fp branch and compare instructions : FPBrcond,
FPCmp
- MipsTargetLowering : handling different FP classes, Allegrex support, sret
return copy, no homing location within EABI, non 32-bit stack objects
arguments, and asm constraint for float.
llvm-svn: 53146
2008-07-06 03:05:21 +08:00
|
|
|
Flag = Chain.getValue(1);
|
2015-07-09 10:09:04 +08:00
|
|
|
RetOps.push_back(DAG.getRegister(V0, getPointerTy(DAG.getDataLayout())));
|
Several changes to Mips backend, experimental fp support being the most
important.
- Cleanup in the Subtarget info with addition of new features, not all support
yet, but they allow the future inclusion of features easier. Among new features,
we have : Arch family info (mips1, mips2, ...), ABI info (o32, eabi), 64-bit
integer
and float registers, allegrex vector FPU (VFPU), single float only support.
- TargetMachine now detects allegrex core.
- Added allegrex (Mips32r2) sext_inreg instructions.
- *Added Float Point Instructions*, handling single float only, and
aliased accesses for 32-bit FPUs.
- Some cleanup in FP instruction formats and FP register classes.
- Calling conventions improved to support mips 32-bit EABI.
- Added Asm Printer support for fp cond codes.
- Added support for sret copy to a return register.
- EABI support added into LowerCALL and FORMAL_ARGS.
- MipsFunctionInfo now keeps a virtual register per function to track the
sret on function entry until function ret.
- MipsInstrInfo FP support into methods (isMoveInstr, isLoadFromStackSlot, ...),
FP cond codes mapping and initial FP Branch Analysis.
- Two new Mips SDNode to handle fp branch and compare instructions : FPBrcond,
FPCmp
- MipsTargetLowering : handling different FP classes, Allegrex support, sret
return copy, no homing location within EABI, non 32-bit stack objects
arguments, and asm constraint for float.
llvm-svn: 53146
2008-07-06 03:05:21 +08:00
|
|
|
}
|
|
|
|
|
2013-02-06 02:12:03 +08:00
|
|
|
RetOps[0] = Chain; // Update chain.
|
|
|
|
|
|
|
|
// Add the flag if we have it.
|
2008-08-29 05:40:38 +08:00
|
|
|
if (Flag.getNode())
|
2013-02-06 02:12:03 +08:00
|
|
|
RetOps.push_back(Flag);
|
2012-07-10 08:19:06 +08:00
|
|
|
|
2015-10-26 20:38:43 +08:00
|
|
|
// ISRs must use "eret".
|
|
|
|
if (DAG.getMachineFunction().getFunction()->hasFnAttribute("interrupt"))
|
|
|
|
return LowerInterruptReturn(RetOps, DL, DAG);
|
|
|
|
|
|
|
|
// Standard return on Mips is a "jr $ra"
|
2014-04-27 02:35:24 +08:00
|
|
|
return DAG.getNode(MipsISD::Ret, DL, MVT::Other, RetOps);
|
2007-06-06 15:42:06 +08:00
|
|
|
}
|
2007-08-22 00:09:25 +08:00
|
|
|
|
2011-04-16 05:51:11 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
2007-08-22 00:09:25 +08:00
|
|
|
// Mips Inline Assembly Support
|
2011-04-16 05:51:11 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
2007-08-22 00:09:25 +08:00
|
|
|
|
|
|
|
/// getConstraintType - Given a constraint letter, return the type of
|
|
|
|
/// constraint it is for this target.
|
2015-07-06 03:29:18 +08:00
|
|
|
MipsTargetLowering::ConstraintType
|
|
|
|
MipsTargetLowering::getConstraintType(StringRef Constraint) const {
|
2013-11-12 20:56:01 +08:00
|
|
|
// Mips specific constraints
|
Several changes to Mips backend, experimental fp support being the most
important.
- Cleanup in the Subtarget info with addition of new features, not all support
yet, but they allow the future inclusion of features easier. Among new features,
we have : Arch family info (mips1, mips2, ...), ABI info (o32, eabi), 64-bit
integer
and float registers, allegrex vector FPU (VFPU), single float only support.
- TargetMachine now detects allegrex core.
- Added allegrex (Mips32r2) sext_inreg instructions.
- *Added Float Point Instructions*, handling single float only, and
aliased accesses for 32-bit FPUs.
- Some cleanup in FP instruction formats and FP register classes.
- Calling conventions improved to support mips 32-bit EABI.
- Added Asm Printer support for fp cond codes.
- Added support for sret copy to a return register.
- EABI support added into LowerCALL and FORMAL_ARGS.
- MipsFunctionInfo now keeps a virtual register per function to track the
sret on function entry until function ret.
- MipsInstrInfo FP support into methods (isMoveInstr, isLoadFromStackSlot, ...),
FP cond codes mapping and initial FP Branch Analysis.
- Two new Mips SDNode to handle fp branch and compare instructions : FPBrcond,
FPCmp
- MipsTargetLowering : handling different FP classes, Allegrex support, sret
return copy, no homing location within EABI, non 32-bit stack objects
arguments, and asm constraint for float.
llvm-svn: 53146
2008-07-06 03:05:21 +08:00
|
|
|
// GCC config/mips/constraints.md
|
|
|
|
//
|
2010-11-23 11:31:01 +08:00
|
|
|
// 'd' : An address register. Equivalent to r
|
|
|
|
// unless generating MIPS16 code.
|
|
|
|
// 'y' : Equivalent to r; retained for
|
|
|
|
// backwards compatibility.
|
2012-05-07 14:25:10 +08:00
|
|
|
// 'c' : A register suitable for use in an indirect
|
|
|
|
// jump. This will always be $25 for -mabicalls.
|
2012-05-07 14:25:19 +08:00
|
|
|
// 'l' : The lo register. 1 word storage.
|
|
|
|
// 'x' : The hilo register pair. Double word storage.
|
2007-08-22 00:09:25 +08:00
|
|
|
if (Constraint.size() == 1) {
|
|
|
|
switch (Constraint[0]) {
|
|
|
|
default : break;
|
2010-11-23 11:31:01 +08:00
|
|
|
case 'd':
|
|
|
|
case 'y':
|
Several changes to Mips backend, experimental fp support being the most
important.
- Cleanup in the Subtarget info with addition of new features, not all support
yet, but they allow the future inclusion of features easier. Among new features,
we have : Arch family info (mips1, mips2, ...), ABI info (o32, eabi), 64-bit
integer
and float registers, allegrex vector FPU (VFPU), single float only support.
- TargetMachine now detects allegrex core.
- Added allegrex (Mips32r2) sext_inreg instructions.
- *Added Float Point Instructions*, handling single float only, and
aliased accesses for 32-bit FPUs.
- Some cleanup in FP instruction formats and FP register classes.
- Calling conventions improved to support mips 32-bit EABI.
- Added Asm Printer support for fp cond codes.
- Added support for sret copy to a return register.
- EABI support added into LowerCALL and FORMAL_ARGS.
- MipsFunctionInfo now keeps a virtual register per function to track the
sret on function entry until function ret.
- MipsInstrInfo FP support into methods (isMoveInstr, isLoadFromStackSlot, ...),
FP cond codes mapping and initial FP Branch Analysis.
- Two new Mips SDNode to handle fp branch and compare instructions : FPBrcond,
FPCmp
- MipsTargetLowering : handling different FP classes, Allegrex support, sret
return copy, no homing location within EABI, non 32-bit stack objects
arguments, and asm constraint for float.
llvm-svn: 53146
2008-07-06 03:05:21 +08:00
|
|
|
case 'f':
|
2012-05-07 14:25:10 +08:00
|
|
|
case 'c':
|
2012-05-07 14:25:15 +08:00
|
|
|
case 'l':
|
2012-05-07 14:25:19 +08:00
|
|
|
case 'x':
|
2007-08-22 00:09:25 +08:00
|
|
|
return C_RegisterClass;
|
2013-03-05 05:33:15 +08:00
|
|
|
case 'R':
|
|
|
|
return C_Memory;
|
2007-08-22 00:09:25 +08:00
|
|
|
}
|
|
|
|
}
|
2015-03-24 19:26:34 +08:00
|
|
|
|
|
|
|
if (Constraint == "ZC")
|
|
|
|
return C_Memory;
|
|
|
|
|
2007-08-22 00:09:25 +08:00
|
|
|
return TargetLowering::getConstraintType(Constraint);
|
|
|
|
}
|
|
|
|
|
2010-10-30 01:29:13 +08:00
|
|
|
/// Examine constraint type and operand type and determine a weight value.
|
|
|
|
/// This object must already have been set up with the operand type
|
|
|
|
/// and the current alternative constraint selected.
|
|
|
|
TargetLowering::ConstraintWeight
|
|
|
|
MipsTargetLowering::getSingleConstraintMatchWeight(
|
|
|
|
AsmOperandInfo &info, const char *constraint) const {
|
|
|
|
ConstraintWeight weight = CW_Invalid;
|
|
|
|
Value *CallOperandVal = info.CallOperandVal;
|
|
|
|
// If we don't have a value, we can't do a match,
|
|
|
|
// but allow it at the lowest weight.
|
2014-04-25 13:30:21 +08:00
|
|
|
if (!CallOperandVal)
|
2010-10-30 01:29:13 +08:00
|
|
|
return CW_Default;
|
2011-07-18 12:54:35 +08:00
|
|
|
Type *type = CallOperandVal->getType();
|
2010-10-30 01:29:13 +08:00
|
|
|
// Look at the constraint type.
|
|
|
|
switch (*constraint) {
|
|
|
|
default:
|
|
|
|
weight = TargetLowering::getSingleConstraintMatchWeight(info, constraint);
|
|
|
|
break;
|
2010-11-23 11:31:01 +08:00
|
|
|
case 'd':
|
|
|
|
case 'y':
|
2010-10-30 01:29:13 +08:00
|
|
|
if (type->isIntegerTy())
|
|
|
|
weight = CW_Register;
|
|
|
|
break;
|
2013-11-12 20:56:01 +08:00
|
|
|
case 'f': // FPU or MSA register
|
2014-07-19 06:55:25 +08:00
|
|
|
if (Subtarget.hasMSA() && type->isVectorTy() &&
|
2013-11-12 20:56:01 +08:00
|
|
|
cast<VectorType>(type)->getBitWidth() == 128)
|
|
|
|
weight = CW_Register;
|
|
|
|
else if (type->isFloatTy())
|
2010-10-30 01:29:13 +08:00
|
|
|
weight = CW_Register;
|
|
|
|
break;
|
2012-05-07 14:25:10 +08:00
|
|
|
case 'c': // $25 for indirect jumps
|
2012-05-07 14:25:15 +08:00
|
|
|
case 'l': // lo register
|
2012-05-07 14:25:19 +08:00
|
|
|
case 'x': // hilo register pair
|
2013-11-12 20:56:01 +08:00
|
|
|
if (type->isIntegerTy())
|
2012-05-07 14:25:10 +08:00
|
|
|
weight = CW_SpecificReg;
|
2013-11-12 20:56:01 +08:00
|
|
|
break;
|
2012-05-07 11:13:32 +08:00
|
|
|
case 'I': // signed 16 bit immediate
|
2012-05-07 11:13:42 +08:00
|
|
|
case 'J': // integer zero
|
2012-05-07 13:46:29 +08:00
|
|
|
case 'K': // unsigned 16 bit immediate
|
2012-05-07 13:46:37 +08:00
|
|
|
case 'L': // signed 32 bit immediate where lower 16 bits are 0
|
2012-05-07 13:46:43 +08:00
|
|
|
case 'N': // immediate in the range of -65535 to -1 (inclusive)
|
2012-05-07 13:46:48 +08:00
|
|
|
case 'O': // signed 15 bit immediate (+- 16383)
|
2012-05-07 14:25:02 +08:00
|
|
|
case 'P': // immediate in the range of 65535 to 1 (inclusive)
|
2012-05-07 11:13:32 +08:00
|
|
|
if (isa<ConstantInt>(CallOperandVal))
|
|
|
|
weight = CW_Constant;
|
|
|
|
break;
|
2013-03-05 05:33:15 +08:00
|
|
|
case 'R':
|
|
|
|
weight = CW_Memory;
|
|
|
|
break;
|
2010-10-30 01:29:13 +08:00
|
|
|
}
|
|
|
|
return weight;
|
|
|
|
}
|
|
|
|
|
2013-08-14 08:21:25 +08:00
|
|
|
/// This is a helper function to parse a physical register string and split it
|
|
|
|
/// into non-numeric and numeric parts (Prefix and Reg). The first boolean flag
|
|
|
|
/// that is returned indicates whether parsing was successful. The second flag
|
|
|
|
/// is true if the numeric part exists.
|
2015-07-06 03:29:18 +08:00
|
|
|
static std::pair<bool, bool> parsePhysicalReg(StringRef C, StringRef &Prefix,
|
|
|
|
unsigned long long &Reg) {
|
2013-08-14 08:21:25 +08:00
|
|
|
if (C.front() != '{' || C.back() != '}')
|
|
|
|
return std::make_pair(false, false);
|
|
|
|
|
|
|
|
// Search for the first numeric character.
|
|
|
|
StringRef::const_iterator I, B = C.begin() + 1, E = C.end() - 1;
|
2015-11-23 15:19:06 +08:00
|
|
|
I = std::find_if(B, E, isdigit);
|
2013-08-14 08:21:25 +08:00
|
|
|
|
2015-07-06 03:29:18 +08:00
|
|
|
Prefix = StringRef(B, I - B);
|
2013-08-14 08:21:25 +08:00
|
|
|
|
|
|
|
// The second flag is set to false if no numeric characters were found.
|
|
|
|
if (I == E)
|
|
|
|
return std::make_pair(true, false);
|
|
|
|
|
|
|
|
// Parse the numeric characters.
|
|
|
|
return std::make_pair(!getAsUnsignedInteger(StringRef(I, E - I), 10, Reg),
|
|
|
|
true);
|
|
|
|
}
|
|
|
|
|
|
|
|
std::pair<unsigned, const TargetRegisterClass *> MipsTargetLowering::
|
2014-08-31 00:48:02 +08:00
|
|
|
parseRegForInlineAsmConstraint(StringRef C, MVT VT) const {
|
2014-08-05 05:25:23 +08:00
|
|
|
const TargetRegisterInfo *TRI =
|
2015-01-30 07:27:36 +08:00
|
|
|
Subtarget.getRegisterInfo();
|
2013-08-14 08:21:25 +08:00
|
|
|
const TargetRegisterClass *RC;
|
2015-07-06 03:29:18 +08:00
|
|
|
StringRef Prefix;
|
2013-08-14 08:21:25 +08:00
|
|
|
unsigned long long Reg;
|
|
|
|
|
|
|
|
std::pair<bool, bool> R = parsePhysicalReg(C, Prefix, Reg);
|
|
|
|
|
|
|
|
if (!R.first)
|
2014-04-25 13:30:21 +08:00
|
|
|
return std::make_pair(0U, nullptr);
|
2013-08-14 08:21:25 +08:00
|
|
|
|
|
|
|
if ((Prefix == "hi" || Prefix == "lo")) { // Parse hi/lo.
|
|
|
|
// No numeric characters follow "hi" or "lo".
|
|
|
|
if (R.second)
|
2014-04-25 13:30:21 +08:00
|
|
|
return std::make_pair(0U, nullptr);
|
2013-08-14 08:21:25 +08:00
|
|
|
|
|
|
|
RC = TRI->getRegClass(Prefix == "hi" ?
|
2013-08-14 08:47:08 +08:00
|
|
|
Mips::HI32RegClassID : Mips::LO32RegClassID);
|
2013-08-14 08:21:25 +08:00
|
|
|
return std::make_pair(*(RC->begin()), RC);
|
2015-07-06 03:29:18 +08:00
|
|
|
} else if (Prefix.startswith("$msa")) {
|
2013-11-12 20:56:01 +08:00
|
|
|
// Parse $msa(ir|csr|access|save|modify|request|map|unmap)
|
|
|
|
|
|
|
|
// No numeric characters follow the name.
|
|
|
|
if (R.second)
|
2014-04-25 13:30:21 +08:00
|
|
|
return std::make_pair(0U, nullptr);
|
2013-11-12 20:56:01 +08:00
|
|
|
|
|
|
|
Reg = StringSwitch<unsigned long long>(Prefix)
|
|
|
|
.Case("$msair", Mips::MSAIR)
|
|
|
|
.Case("$msacsr", Mips::MSACSR)
|
|
|
|
.Case("$msaaccess", Mips::MSAAccess)
|
|
|
|
.Case("$msasave", Mips::MSASave)
|
|
|
|
.Case("$msamodify", Mips::MSAModify)
|
|
|
|
.Case("$msarequest", Mips::MSARequest)
|
|
|
|
.Case("$msamap", Mips::MSAMap)
|
|
|
|
.Case("$msaunmap", Mips::MSAUnmap)
|
|
|
|
.Default(0);
|
|
|
|
|
|
|
|
if (!Reg)
|
2014-04-25 13:30:21 +08:00
|
|
|
return std::make_pair(0U, nullptr);
|
2013-11-12 20:56:01 +08:00
|
|
|
|
|
|
|
RC = TRI->getRegClass(Mips::MSACtrlRegClassID);
|
|
|
|
return std::make_pair(Reg, RC);
|
2013-08-14 08:21:25 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
if (!R.second)
|
2014-04-25 13:30:21 +08:00
|
|
|
return std::make_pair(0U, nullptr);
|
2013-08-14 08:21:25 +08:00
|
|
|
|
|
|
|
if (Prefix == "$f") { // Parse $f0-$f31.
|
|
|
|
// If the size of FP registers is 64-bit or Reg is an even number, select
|
|
|
|
// the 64-bit register class. Otherwise, select the 32-bit register class.
|
|
|
|
if (VT == MVT::Other)
|
2014-07-19 06:55:25 +08:00
|
|
|
VT = (Subtarget.isFP64bit() || !(Reg % 2)) ? MVT::f64 : MVT::f32;
|
2013-08-14 08:21:25 +08:00
|
|
|
|
2013-10-08 03:33:02 +08:00
|
|
|
RC = getRegClassFor(VT);
|
2013-08-14 08:21:25 +08:00
|
|
|
|
|
|
|
if (RC == &Mips::AFGR64RegClass) {
|
|
|
|
assert(Reg % 2 == 0);
|
|
|
|
Reg >>= 1;
|
|
|
|
}
|
2013-11-12 20:56:01 +08:00
|
|
|
} else if (Prefix == "$fcc") // Parse $fcc0-$fcc7.
|
2013-08-14 08:21:25 +08:00
|
|
|
RC = TRI->getRegClass(Mips::FCCRegClassID);
|
2013-11-12 20:56:01 +08:00
|
|
|
else if (Prefix == "$w") { // Parse $w0-$w31.
|
|
|
|
RC = getRegClassFor((VT == MVT::Other) ? MVT::v16i8 : VT);
|
2013-08-14 08:21:25 +08:00
|
|
|
} else { // Parse $0-$31.
|
|
|
|
assert(Prefix == "$");
|
|
|
|
RC = getRegClassFor((VT == MVT::Other) ? MVT::i32 : VT);
|
|
|
|
}
|
|
|
|
|
|
|
|
assert(Reg < RC->getNumRegs());
|
|
|
|
return std::make_pair(*(RC->begin() + Reg), RC);
|
|
|
|
}
|
|
|
|
|
2011-06-30 03:33:04 +08:00
|
|
|
/// Given a register class constraint, like 'r', if this corresponds directly
|
|
|
|
/// to an LLVM register class, return a register of 0 and the register class
|
|
|
|
/// pointer.
|
2015-02-27 06:38:43 +08:00
|
|
|
std::pair<unsigned, const TargetRegisterClass *>
|
|
|
|
MipsTargetLowering::getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI,
|
2015-07-06 03:29:18 +08:00
|
|
|
StringRef Constraint,
|
2015-02-27 06:38:43 +08:00
|
|
|
MVT VT) const {
|
2007-08-22 00:09:25 +08:00
|
|
|
if (Constraint.size() == 1) {
|
|
|
|
switch (Constraint[0]) {
|
2011-06-30 03:04:31 +08:00
|
|
|
case 'd': // Address register. Same as 'r' unless generating MIPS16 code.
|
|
|
|
case 'y': // Same as 'r'. Exists for compatibility.
|
2007-08-22 00:09:25 +08:00
|
|
|
case 'r':
|
2012-09-13 07:27:55 +08:00
|
|
|
if (VT == MVT::i32 || VT == MVT::i16 || VT == MVT::i8) {
|
2014-07-19 06:55:25 +08:00
|
|
|
if (Subtarget.inMips16Mode())
|
2012-09-13 07:27:55 +08:00
|
|
|
return std::make_pair(0U, &Mips::CPU16RegsRegClass);
|
2013-08-07 07:08:38 +08:00
|
|
|
return std::make_pair(0U, &Mips::GPR32RegClass);
|
2012-09-13 07:27:55 +08:00
|
|
|
}
|
2014-07-19 06:55:25 +08:00
|
|
|
if (VT == MVT::i64 && !Subtarget.isGP64bit())
|
2013-08-07 07:08:38 +08:00
|
|
|
return std::make_pair(0U, &Mips::GPR32RegClass);
|
2014-07-19 06:55:25 +08:00
|
|
|
if (VT == MVT::i64 && Subtarget.isGP64bit())
|
2013-08-07 07:08:38 +08:00
|
|
|
return std::make_pair(0U, &Mips::GPR64RegClass);
|
2012-05-07 11:13:22 +08:00
|
|
|
// This will generate an error message
|
2014-04-25 13:30:21 +08:00
|
|
|
return std::make_pair(0U, nullptr);
|
2013-11-12 20:56:01 +08:00
|
|
|
case 'f': // FPU or MSA register
|
|
|
|
if (VT == MVT::v16i8)
|
|
|
|
return std::make_pair(0U, &Mips::MSA128BRegClass);
|
|
|
|
else if (VT == MVT::v8i16 || VT == MVT::v8f16)
|
|
|
|
return std::make_pair(0U, &Mips::MSA128HRegClass);
|
|
|
|
else if (VT == MVT::v4i32 || VT == MVT::v4f32)
|
|
|
|
return std::make_pair(0U, &Mips::MSA128WRegClass);
|
|
|
|
else if (VT == MVT::v2i64 || VT == MVT::v2f64)
|
|
|
|
return std::make_pair(0U, &Mips::MSA128DRegClass);
|
|
|
|
else if (VT == MVT::f32)
|
2012-04-20 15:30:17 +08:00
|
|
|
return std::make_pair(0U, &Mips::FGR32RegClass);
|
2014-07-19 06:55:25 +08:00
|
|
|
else if ((VT == MVT::f64) && (!Subtarget.isSingleFloat())) {
|
|
|
|
if (Subtarget.isFP64bit())
|
2012-04-20 15:30:17 +08:00
|
|
|
return std::make_pair(0U, &Mips::FGR64RegClass);
|
|
|
|
return std::make_pair(0U, &Mips::AFGR64RegClass);
|
2012-01-04 10:45:01 +08:00
|
|
|
}
|
2012-05-07 14:25:10 +08:00
|
|
|
break;
|
|
|
|
case 'c': // register suitable for indirect jump
|
|
|
|
if (VT == MVT::i32)
|
2013-08-07 07:08:38 +08:00
|
|
|
return std::make_pair((unsigned)Mips::T9, &Mips::GPR32RegClass);
|
2012-05-07 14:25:10 +08:00
|
|
|
assert(VT == MVT::i64 && "Unexpected type.");
|
2013-08-07 07:08:38 +08:00
|
|
|
return std::make_pair((unsigned)Mips::T9_64, &Mips::GPR64RegClass);
|
2012-05-07 14:25:15 +08:00
|
|
|
case 'l': // register suitable for indirect jump
|
|
|
|
if (VT == MVT::i32)
|
2013-08-14 08:47:08 +08:00
|
|
|
return std::make_pair((unsigned)Mips::LO0, &Mips::LO32RegClass);
|
|
|
|
return std::make_pair((unsigned)Mips::LO0_64, &Mips::LO64RegClass);
|
2012-05-07 14:25:19 +08:00
|
|
|
case 'x': // register suitable for indirect jump
|
|
|
|
// Fixme: Not triggering the use of both hi and low
|
|
|
|
// This will generate an error message
|
2014-04-25 13:30:21 +08:00
|
|
|
return std::make_pair(0U, nullptr);
|
2007-08-22 00:09:25 +08:00
|
|
|
}
|
|
|
|
}
|
2013-08-14 08:21:25 +08:00
|
|
|
|
|
|
|
std::pair<unsigned, const TargetRegisterClass *> R;
|
|
|
|
R = parseRegForInlineAsmConstraint(Constraint, VT);
|
|
|
|
|
|
|
|
if (R.second)
|
|
|
|
return R;
|
|
|
|
|
2015-02-27 06:38:43 +08:00
|
|
|
return TargetLowering::getRegForInlineAsmConstraint(TRI, Constraint, VT);
|
2007-08-22 00:09:25 +08:00
|
|
|
}
|
|
|
|
|
2012-05-07 11:13:32 +08:00
|
|
|
/// LowerAsmOperandForConstraint - Lower the specified operand into the Ops
|
|
|
|
/// vector. If it is invalid, don't add anything to Ops.
|
|
|
|
void MipsTargetLowering::LowerAsmOperandForConstraint(SDValue Op,
|
|
|
|
std::string &Constraint,
|
|
|
|
std::vector<SDValue>&Ops,
|
|
|
|
SelectionDAG &DAG) const {
|
2015-04-28 22:05:47 +08:00
|
|
|
SDLoc DL(Op);
|
2014-04-25 13:30:21 +08:00
|
|
|
SDValue Result;
|
2012-05-07 11:13:32 +08:00
|
|
|
|
|
|
|
// Only support length 1 constraints for now.
|
|
|
|
if (Constraint.length() > 1) return;
|
|
|
|
|
|
|
|
char ConstraintLetter = Constraint[0];
|
|
|
|
switch (ConstraintLetter) {
|
|
|
|
default: break; // This will fall through to the generic implementation
|
|
|
|
case 'I': // Signed 16 bit constant
|
|
|
|
// If this fails, the parent routine will give an error
|
|
|
|
if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op)) {
|
|
|
|
EVT Type = Op.getValueType();
|
|
|
|
int64_t Val = C->getSExtValue();
|
|
|
|
if (isInt<16>(Val)) {
|
2015-04-28 22:05:47 +08:00
|
|
|
Result = DAG.getTargetConstant(Val, DL, Type);
|
2012-05-07 11:13:32 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return;
|
2012-05-07 11:13:42 +08:00
|
|
|
case 'J': // integer zero
|
|
|
|
if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op)) {
|
|
|
|
EVT Type = Op.getValueType();
|
|
|
|
int64_t Val = C->getZExtValue();
|
|
|
|
if (Val == 0) {
|
2015-04-28 22:05:47 +08:00
|
|
|
Result = DAG.getTargetConstant(0, DL, Type);
|
2012-05-07 11:13:42 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return;
|
2012-05-07 13:46:29 +08:00
|
|
|
case 'K': // unsigned 16 bit immediate
|
|
|
|
if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op)) {
|
|
|
|
EVT Type = Op.getValueType();
|
|
|
|
uint64_t Val = (uint64_t)C->getZExtValue();
|
|
|
|
if (isUInt<16>(Val)) {
|
2015-04-28 22:05:47 +08:00
|
|
|
Result = DAG.getTargetConstant(Val, DL, Type);
|
2012-05-07 13:46:29 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return;
|
2012-05-07 13:46:37 +08:00
|
|
|
case 'L': // signed 32 bit immediate where lower 16 bits are 0
|
|
|
|
if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op)) {
|
|
|
|
EVT Type = Op.getValueType();
|
|
|
|
int64_t Val = C->getSExtValue();
|
|
|
|
if ((isInt<32>(Val)) && ((Val & 0xffff) == 0)){
|
2015-04-28 22:05:47 +08:00
|
|
|
Result = DAG.getTargetConstant(Val, DL, Type);
|
2012-05-07 13:46:37 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return;
|
2012-05-07 13:46:43 +08:00
|
|
|
case 'N': // immediate in the range of -65535 to -1 (inclusive)
|
|
|
|
if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op)) {
|
|
|
|
EVT Type = Op.getValueType();
|
|
|
|
int64_t Val = C->getSExtValue();
|
|
|
|
if ((Val >= -65535) && (Val <= -1)) {
|
2015-04-28 22:05:47 +08:00
|
|
|
Result = DAG.getTargetConstant(Val, DL, Type);
|
2012-05-07 13:46:43 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return;
|
2012-05-07 13:46:48 +08:00
|
|
|
case 'O': // signed 15 bit immediate
|
|
|
|
if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op)) {
|
|
|
|
EVT Type = Op.getValueType();
|
|
|
|
int64_t Val = C->getSExtValue();
|
|
|
|
if ((isInt<15>(Val))) {
|
2015-04-28 22:05:47 +08:00
|
|
|
Result = DAG.getTargetConstant(Val, DL, Type);
|
2012-05-07 13:46:48 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return;
|
2012-05-07 14:25:02 +08:00
|
|
|
case 'P': // immediate in the range of 1 to 65535 (inclusive)
|
|
|
|
if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op)) {
|
|
|
|
EVT Type = Op.getValueType();
|
|
|
|
int64_t Val = C->getSExtValue();
|
|
|
|
if ((Val <= 65535) && (Val >= 1)) {
|
2015-04-28 22:05:47 +08:00
|
|
|
Result = DAG.getTargetConstant(Val, DL, Type);
|
2012-05-07 14:25:02 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return;
|
2012-05-07 11:13:32 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
if (Result.getNode()) {
|
|
|
|
Ops.push_back(Result);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
TargetLowering::LowerAsmOperandForConstraint(Op, Constraint, Ops, DAG);
|
|
|
|
}
|
|
|
|
|
2015-07-09 10:09:40 +08:00
|
|
|
bool MipsTargetLowering::isLegalAddressingMode(const DataLayout &DL,
|
|
|
|
const AddrMode &AM, Type *Ty,
|
2015-06-01 13:31:59 +08:00
|
|
|
unsigned AS) const {
|
2012-11-17 08:25:41 +08:00
|
|
|
// No global is ever allowed as a base.
|
|
|
|
if (AM.BaseGV)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
switch (AM.Scale) {
|
|
|
|
case 0: // "r+i" or just "i", depending on HasBaseReg.
|
|
|
|
break;
|
|
|
|
case 1:
|
|
|
|
if (!AM.HasBaseReg) // allow "r+i".
|
|
|
|
break;
|
|
|
|
return false; // disallow "r+r" or "r+r+i".
|
|
|
|
default:
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
Teach DAGCombine to fold constant offsets into GlobalAddress nodes,
and add a TargetLowering hook for it to use to determine when this
is legal (i.e. not in PIC mode, etc.)
This allows instruction selection to emit folded constant offsets
in more cases, such as the included testcase, eliminating the need
for explicit arithmetic instructions.
This eliminates the need for the C++ code in X86ISelDAGToDAG.cpp
that attempted to achieve the same effect, but wasn't as effective.
Also, fix handling of offsets in GlobalAddressSDNodes in several
places, including changing GlobalAddressSDNode's offset from
int to int64_t.
The Mips, Alpha, Sparc, and CellSPU targets appear to be
unaware of GlobalAddress offsets currently, so set the hook to
false on those targets.
llvm-svn: 57748
2008-10-18 10:06:02 +08:00
|
|
|
bool
|
|
|
|
MipsTargetLowering::isOffsetFoldingLegal(const GlobalAddressSDNode *GA) const {
|
|
|
|
// The Mips target isn't yet aware of offsets.
|
|
|
|
return false;
|
|
|
|
}
|
2009-10-28 03:56:55 +08:00
|
|
|
|
2012-06-14 03:33:32 +08:00
|
|
|
/// Pick the value type used when expanding memory operations: i64 when the
/// subtarget reports Mips64 support, i32 otherwise. None of the size,
/// alignment or memset/memcpy parameters influence the choice.
EVT MipsTargetLowering::getOptimalMemOpType(uint64_t Size, unsigned DstAlign,
                                            unsigned SrcAlign,
                                            bool IsMemset, bool ZeroMemset,
                                            bool MemcpyStrSrc,
                                            MachineFunction &MF) const {
  return Subtarget.hasMips64() ? MVT::i64 : MVT::i32;
}
|
|
|
|
|
2009-10-28 09:43:28 +08:00
|
|
|
bool MipsTargetLowering::isFPImmLegal(const APFloat &Imm, EVT VT) const {
|
|
|
|
if (VT != MVT::f32 && VT != MVT::f64)
|
|
|
|
return false;
|
2011-01-19 03:41:41 +08:00
|
|
|
if (Imm.isNegZero())
|
|
|
|
return false;
|
2009-10-28 03:56:55 +08:00
|
|
|
return Imm.isZero();
|
|
|
|
}
|
2012-02-03 12:33:00 +08:00
|
|
|
|
|
|
|
unsigned MipsTargetLowering::getJumpTableEncoding() const {
|
2017-01-27 19:36:52 +08:00
|
|
|
|
|
|
|
// FIXME: For space reasons this should be: EK_GPRel32BlockAddress.
|
|
|
|
if (ABI.IsN64() && isPositionIndependent())
|
2012-02-03 12:33:00 +08:00
|
|
|
return MachineJumpTableInfo::EK_GPRel64BlockAddress;
|
2012-02-28 15:46:26 +08:00
|
|
|
|
2012-02-03 12:33:00 +08:00
|
|
|
return TargetLowering::getJumpTableEncoding();
|
|
|
|
}
|
2012-10-27 07:56:38 +08:00
|
|
|
|
2015-05-12 09:26:05 +08:00
|
|
|
bool MipsTargetLowering::useSoftFloat() const {
|
|
|
|
return Subtarget.useSoftFloat();
|
|
|
|
}
|
|
|
|
|
2014-11-02 02:44:56 +08:00
|
|
|
void MipsTargetLowering::copyByValRegs(
|
2016-06-12 23:39:02 +08:00
|
|
|
SDValue Chain, const SDLoc &DL, std::vector<SDValue> &OutChains,
|
|
|
|
SelectionDAG &DAG, const ISD::ArgFlagsTy &Flags,
|
|
|
|
SmallVectorImpl<SDValue> &InVals, const Argument *FuncArg,
|
|
|
|
unsigned FirstReg, unsigned LastReg, const CCValAssign &VA,
|
|
|
|
MipsCCState &State) const {
|
2012-10-27 08:10:18 +08:00
|
|
|
MachineFunction &MF = DAG.getMachineFunction();
|
2016-07-29 02:40:00 +08:00
|
|
|
MachineFrameInfo &MFI = MF.getFrameInfo();
|
2014-09-09 20:11:16 +08:00
|
|
|
unsigned GPRSizeInBytes = Subtarget.getGPRSizeInBytes();
|
2014-11-03 00:09:29 +08:00
|
|
|
unsigned NumRegs = LastReg - FirstReg;
|
|
|
|
unsigned RegAreaSize = NumRegs * GPRSizeInBytes;
|
2012-10-27 08:10:18 +08:00
|
|
|
unsigned FrameObjSize = std::max(Flags.getByValSize(), RegAreaSize);
|
|
|
|
int FrameObjOffset;
|
2014-11-07 23:03:53 +08:00
|
|
|
ArrayRef<MCPhysReg> ByValArgRegs = ABI.GetByValArgRegs();
|
2012-10-27 08:10:18 +08:00
|
|
|
|
|
|
|
if (RegAreaSize)
|
2014-11-07 23:03:53 +08:00
|
|
|
FrameObjOffset =
|
|
|
|
(int)ABI.GetCalleeAllocdArgSizeInBytes(State.getCallingConv()) -
|
|
|
|
(int)((ByValArgRegs.size() - FirstReg) * GPRSizeInBytes);
|
2012-10-27 08:10:18 +08:00
|
|
|
else
|
2014-11-02 02:44:56 +08:00
|
|
|
FrameObjOffset = VA.getLocMemOffset();
|
2012-10-27 08:10:18 +08:00
|
|
|
|
|
|
|
// Create frame object.
|
2015-07-09 10:09:04 +08:00
|
|
|
EVT PtrTy = getPointerTy(DAG.getDataLayout());
|
2016-07-29 02:40:00 +08:00
|
|
|
int FI = MFI.CreateFixedObject(FrameObjSize, FrameObjOffset, true);
|
2012-10-27 08:10:18 +08:00
|
|
|
SDValue FIN = DAG.getFrameIndex(FI, PtrTy);
|
|
|
|
InVals.push_back(FIN);
|
|
|
|
|
2014-11-03 00:09:29 +08:00
|
|
|
if (!NumRegs)
|
2012-10-27 08:10:18 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
// Copy arg registers.
|
2014-09-09 20:11:16 +08:00
|
|
|
MVT RegTy = MVT::getIntegerVT(GPRSizeInBytes * 8);
|
2012-10-27 08:10:18 +08:00
|
|
|
const TargetRegisterClass *RC = getRegClassFor(RegTy);
|
|
|
|
|
2014-11-03 00:09:29 +08:00
|
|
|
for (unsigned I = 0; I < NumRegs; ++I) {
|
2014-11-07 20:21:37 +08:00
|
|
|
unsigned ArgReg = ByValArgRegs[FirstReg + I];
|
2013-03-12 08:16:36 +08:00
|
|
|
unsigned VReg = addLiveIn(MF, ArgReg, RC);
|
2014-09-09 20:11:16 +08:00
|
|
|
unsigned Offset = I * GPRSizeInBytes;
|
2012-10-27 08:10:18 +08:00
|
|
|
SDValue StorePtr = DAG.getNode(ISD::ADD, DL, PtrTy, FIN,
|
2015-04-28 22:05:47 +08:00
|
|
|
DAG.getConstant(Offset, DL, PtrTy));
|
2012-10-27 08:10:18 +08:00
|
|
|
SDValue Store = DAG.getStore(Chain, DL, DAG.getRegister(VReg, RegTy),
|
[SelectionDAG] Get rid of bool parameters in SelectionDAG::getLoad, getStore, and friends.
Summary:
Instead, we take a single flags arg (a bitset).
Also add a default 0 alignment, and change the order of arguments so the
alignment comes before the flags.
This greatly simplifies many callsites, and fixes a bug in
AMDGPUISelLowering, wherein the order of the args to getLoad was
inverted. It also greatly simplifies the process of adding another flag
to getLoad.
Reviewers: chandlerc, tstellarAMD
Subscribers: jholewinski, arsenm, jyknight, dsanders, nemanjai, llvm-commits
Differential Revision: http://reviews.llvm.org/D22249
llvm-svn: 275592
2016-07-16 02:27:10 +08:00
|
|
|
StorePtr, MachinePointerInfo(FuncArg, Offset));
|
2012-10-27 08:10:18 +08:00
|
|
|
OutChains.push_back(Store);
|
|
|
|
}
|
|
|
|
}
|
2012-10-27 08:16:36 +08:00
|
|
|
|
|
|
|
// Copy byVal arg to registers and stack.
|
2014-11-02 02:44:56 +08:00
|
|
|
void MipsTargetLowering::passByValArg(
|
2016-06-12 23:39:02 +08:00
|
|
|
SDValue Chain, const SDLoc &DL,
|
2014-11-02 02:44:56 +08:00
|
|
|
std::deque<std::pair<unsigned, SDValue>> &RegsToPass,
|
|
|
|
SmallVectorImpl<SDValue> &MemOpChains, SDValue StackPtr,
|
2016-07-29 02:40:00 +08:00
|
|
|
MachineFrameInfo &MFI, SelectionDAG &DAG, SDValue Arg, unsigned FirstReg,
|
2014-11-07 23:33:08 +08:00
|
|
|
unsigned LastReg, const ISD::ArgFlagsTy &Flags, bool isLittle,
|
|
|
|
const CCValAssign &VA) const {
|
2014-05-23 21:18:02 +08:00
|
|
|
unsigned ByValSizeInBytes = Flags.getByValSize();
|
|
|
|
unsigned OffsetInBytes = 0; // From beginning of struct
|
2014-09-09 20:11:16 +08:00
|
|
|
unsigned RegSizeInBytes = Subtarget.getGPRSizeInBytes();
|
2014-05-23 21:18:02 +08:00
|
|
|
unsigned Alignment = std::min(Flags.getByValAlign(), RegSizeInBytes);
|
2015-07-09 10:09:04 +08:00
|
|
|
EVT PtrTy = getPointerTy(DAG.getDataLayout()),
|
|
|
|
RegTy = MVT::getIntegerVT(RegSizeInBytes * 8);
|
2014-11-03 00:09:29 +08:00
|
|
|
unsigned NumRegs = LastReg - FirstReg;
|
2012-10-27 08:16:36 +08:00
|
|
|
|
2014-11-03 00:09:29 +08:00
|
|
|
if (NumRegs) {
|
2015-09-28 08:15:34 +08:00
|
|
|
ArrayRef<MCPhysReg> ArgRegs = ABI.GetByValArgRegs();
|
2014-11-03 00:09:29 +08:00
|
|
|
bool LeftoverBytes = (NumRegs * RegSizeInBytes > ByValSizeInBytes);
|
2012-10-27 08:16:36 +08:00
|
|
|
unsigned I = 0;
|
|
|
|
|
|
|
|
// Copy words to registers.
|
2014-11-03 00:09:29 +08:00
|
|
|
for (; I < NumRegs - LeftoverBytes; ++I, OffsetInBytes += RegSizeInBytes) {
|
2012-10-27 08:16:36 +08:00
|
|
|
SDValue LoadPtr = DAG.getNode(ISD::ADD, DL, PtrTy, Arg,
|
2015-04-28 22:05:47 +08:00
|
|
|
DAG.getConstant(OffsetInBytes, DL, PtrTy));
|
2012-10-27 08:16:36 +08:00
|
|
|
SDValue LoadVal = DAG.getLoad(RegTy, DL, Chain, LoadPtr,
|
[SelectionDAG] Get rid of bool parameters in SelectionDAG::getLoad, getStore, and friends.
Summary:
Instead, we take a single flags arg (a bitset).
Also add a default 0 alignment, and change the order of arguments so the
alignment comes before the flags.
This greatly simplifies many callsites, and fixes a bug in
AMDGPUISelLowering, wherein the order of the args to getLoad was
inverted. It also greatly simplifies the process of adding another flag
to getLoad.
Reviewers: chandlerc, tstellarAMD
Subscribers: jholewinski, arsenm, jyknight, dsanders, nemanjai, llvm-commits
Differential Revision: http://reviews.llvm.org/D22249
llvm-svn: 275592
2016-07-16 02:27:10 +08:00
|
|
|
MachinePointerInfo(), Alignment);
|
2012-10-27 08:16:36 +08:00
|
|
|
MemOpChains.push_back(LoadVal.getValue(1));
|
2014-11-03 00:09:29 +08:00
|
|
|
unsigned ArgReg = ArgRegs[FirstReg + I];
|
2012-10-27 08:16:36 +08:00
|
|
|
RegsToPass.push_back(std::make_pair(ArgReg, LoadVal));
|
|
|
|
}
|
|
|
|
|
|
|
|
// Return if the struct has been fully copied.
|
2014-05-23 21:18:02 +08:00
|
|
|
if (ByValSizeInBytes == OffsetInBytes)
|
2012-10-27 08:16:36 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
// Copy the remainder of the byval argument with sub-word loads and shifts.
|
|
|
|
if (LeftoverBytes) {
|
|
|
|
SDValue Val;
|
|
|
|
|
2014-05-23 21:18:02 +08:00
|
|
|
for (unsigned LoadSizeInBytes = RegSizeInBytes / 2, TotalBytesLoaded = 0;
|
|
|
|
OffsetInBytes < ByValSizeInBytes; LoadSizeInBytes /= 2) {
|
|
|
|
unsigned RemainingSizeInBytes = ByValSizeInBytes - OffsetInBytes;
|
2012-10-27 08:16:36 +08:00
|
|
|
|
2014-05-23 21:18:02 +08:00
|
|
|
if (RemainingSizeInBytes < LoadSizeInBytes)
|
2012-10-27 08:16:36 +08:00
|
|
|
continue;
|
|
|
|
|
|
|
|
// Load subword.
|
|
|
|
SDValue LoadPtr = DAG.getNode(ISD::ADD, DL, PtrTy, Arg,
|
2015-04-28 22:05:47 +08:00
|
|
|
DAG.getConstant(OffsetInBytes, DL,
|
|
|
|
PtrTy));
|
2014-05-23 21:18:02 +08:00
|
|
|
SDValue LoadVal = DAG.getExtLoad(
|
|
|
|
ISD::ZEXTLOAD, DL, RegTy, Chain, LoadPtr, MachinePointerInfo(),
|
[SelectionDAG] Get rid of bool parameters in SelectionDAG::getLoad, getStore, and friends.
Summary:
Instead, we take a single flags arg (a bitset).
Also add a default 0 alignment, and change the order of arguments so the
alignment comes before the flags.
This greatly simplifies many callsites, and fixes a bug in
AMDGPUISelLowering, wherein the order of the args to getLoad was
inverted. It also greatly simplifies the process of adding another flag
to getLoad.
Reviewers: chandlerc, tstellarAMD
Subscribers: jholewinski, arsenm, jyknight, dsanders, nemanjai, llvm-commits
Differential Revision: http://reviews.llvm.org/D22249
llvm-svn: 275592
2016-07-16 02:27:10 +08:00
|
|
|
MVT::getIntegerVT(LoadSizeInBytes * 8), Alignment);
|
2012-10-27 08:16:36 +08:00
|
|
|
MemOpChains.push_back(LoadVal.getValue(1));
|
|
|
|
|
|
|
|
// Shift the loaded value.
|
|
|
|
unsigned Shamt;
|
|
|
|
|
|
|
|
if (isLittle)
|
2014-05-23 21:18:02 +08:00
|
|
|
Shamt = TotalBytesLoaded * 8;
|
2012-10-27 08:16:36 +08:00
|
|
|
else
|
2014-05-23 21:18:02 +08:00
|
|
|
Shamt = (RegSizeInBytes - (TotalBytesLoaded + LoadSizeInBytes)) * 8;
|
2012-10-27 08:16:36 +08:00
|
|
|
|
|
|
|
SDValue Shift = DAG.getNode(ISD::SHL, DL, RegTy, LoadVal,
|
2015-04-28 22:05:47 +08:00
|
|
|
DAG.getConstant(Shamt, DL, MVT::i32));
|
2012-10-27 08:16:36 +08:00
|
|
|
|
|
|
|
if (Val.getNode())
|
|
|
|
Val = DAG.getNode(ISD::OR, DL, RegTy, Val, Shift);
|
|
|
|
else
|
|
|
|
Val = Shift;
|
|
|
|
|
2014-05-23 21:18:02 +08:00
|
|
|
OffsetInBytes += LoadSizeInBytes;
|
|
|
|
TotalBytesLoaded += LoadSizeInBytes;
|
|
|
|
Alignment = std::min(Alignment, LoadSizeInBytes);
|
2012-10-27 08:16:36 +08:00
|
|
|
}
|
|
|
|
|
2014-11-03 00:09:29 +08:00
|
|
|
unsigned ArgReg = ArgRegs[FirstReg + I];
|
2012-10-27 08:16:36 +08:00
|
|
|
RegsToPass.push_back(std::make_pair(ArgReg, Val));
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Copy remainder of byval arg to it with memcpy.
|
2014-05-23 21:18:02 +08:00
|
|
|
unsigned MemCpySize = ByValSizeInBytes - OffsetInBytes;
|
2012-10-27 08:16:36 +08:00
|
|
|
SDValue Src = DAG.getNode(ISD::ADD, DL, PtrTy, Arg,
|
2015-04-28 22:05:47 +08:00
|
|
|
DAG.getConstant(OffsetInBytes, DL, PtrTy));
|
2012-10-27 08:16:36 +08:00
|
|
|
SDValue Dst = DAG.getNode(ISD::ADD, DL, PtrTy, StackPtr,
|
2015-04-28 22:05:47 +08:00
|
|
|
DAG.getIntPtrConstant(VA.getLocMemOffset(), DL));
|
|
|
|
Chain = DAG.getMemcpy(Chain, DL, Dst, Src,
|
|
|
|
DAG.getConstant(MemCpySize, DL, PtrTy),
|
2013-10-08 03:33:02 +08:00
|
|
|
Alignment, /*isVolatile=*/false, /*AlwaysInline=*/false,
|
2015-04-14 01:16:45 +08:00
|
|
|
/*isTailCall=*/false,
|
2014-04-15 15:22:52 +08:00
|
|
|
MachinePointerInfo(), MachinePointerInfo());
|
2012-10-27 08:16:36 +08:00
|
|
|
MemOpChains.push_back(Chain);
|
|
|
|
}
|
2012-10-27 08:21:13 +08:00
|
|
|
|
2013-10-08 03:33:02 +08:00
|
|
|
void MipsTargetLowering::writeVarArgRegs(std::vector<SDValue> &OutChains,
|
2016-06-12 23:39:02 +08:00
|
|
|
SDValue Chain, const SDLoc &DL,
|
2014-11-07 23:33:08 +08:00
|
|
|
SelectionDAG &DAG,
|
2014-11-02 02:13:52 +08:00
|
|
|
CCState &State) const {
|
2015-09-28 08:15:34 +08:00
|
|
|
ArrayRef<MCPhysReg> ArgRegs = ABI.GetVarArgRegs();
|
2015-02-21 10:11:17 +08:00
|
|
|
unsigned Idx = State.getFirstUnallocated(ArgRegs);
|
2014-09-09 20:11:16 +08:00
|
|
|
unsigned RegSizeInBytes = Subtarget.getGPRSizeInBytes();
|
|
|
|
MVT RegTy = MVT::getIntegerVT(RegSizeInBytes * 8);
|
2012-10-27 08:21:13 +08:00
|
|
|
const TargetRegisterClass *RC = getRegClassFor(RegTy);
|
|
|
|
MachineFunction &MF = DAG.getMachineFunction();
|
2016-07-29 02:40:00 +08:00
|
|
|
MachineFrameInfo &MFI = MF.getFrameInfo();
|
2012-10-27 08:21:13 +08:00
|
|
|
MipsFunctionInfo *MipsFI = MF.getInfo<MipsFunctionInfo>();
|
|
|
|
|
|
|
|
// Offset of the first variable argument from stack pointer.
|
|
|
|
int VaArgOffset;
|
|
|
|
|
2014-09-10 18:37:03 +08:00
|
|
|
if (ArgRegs.size() == Idx)
|
2016-01-15 05:06:47 +08:00
|
|
|
VaArgOffset = alignTo(State.getNextStackOffset(), RegSizeInBytes);
|
2014-11-07 23:03:53 +08:00
|
|
|
else {
|
|
|
|
VaArgOffset =
|
|
|
|
(int)ABI.GetCalleeAllocdArgSizeInBytes(State.getCallingConv()) -
|
|
|
|
(int)(RegSizeInBytes * (ArgRegs.size() - Idx));
|
|
|
|
}
|
2012-10-27 08:21:13 +08:00
|
|
|
|
|
|
|
// Record the frame index of the first variable argument
|
|
|
|
// which is a value necessary to VASTART.
|
2016-07-29 02:40:00 +08:00
|
|
|
int FI = MFI.CreateFixedObject(RegSizeInBytes, VaArgOffset, true);
|
2012-10-27 08:21:13 +08:00
|
|
|
MipsFI->setVarArgsFrameIndex(FI);
|
|
|
|
|
|
|
|
// Copy the integer registers that have not been used for argument passing
|
|
|
|
// to the argument register save area. For O32, the save area is allocated
|
|
|
|
// in the caller's stack frame, while for N32/64, it is allocated in the
|
|
|
|
// callee's stack frame.
|
2014-09-10 18:37:03 +08:00
|
|
|
for (unsigned I = Idx; I < ArgRegs.size();
|
|
|
|
++I, VaArgOffset += RegSizeInBytes) {
|
2013-03-12 08:16:36 +08:00
|
|
|
unsigned Reg = addLiveIn(MF, ArgRegs[I], RC);
|
2012-10-27 08:21:13 +08:00
|
|
|
SDValue ArgValue = DAG.getCopyFromReg(Chain, DL, Reg, RegTy);
|
2016-07-29 02:40:00 +08:00
|
|
|
FI = MFI.CreateFixedObject(RegSizeInBytes, VaArgOffset, true);
|
2015-07-09 10:09:04 +08:00
|
|
|
SDValue PtrOff = DAG.getFrameIndex(FI, getPointerTy(DAG.getDataLayout()));
|
[SelectionDAG] Get rid of bool parameters in SelectionDAG::getLoad, getStore, and friends.
Summary:
Instead, we take a single flags arg (a bitset).
Also add a default 0 alignment, and change the order of arguments so the
alignment comes before the flags.
This greatly simplifies many callsites, and fixes a bug in
AMDGPUISelLowering, wherein the order of the args to getLoad was
inverted. It also greatly simplifies the process of adding another flag
to getLoad.
Reviewers: chandlerc, tstellarAMD
Subscribers: jholewinski, arsenm, jyknight, dsanders, nemanjai, llvm-commits
Differential Revision: http://reviews.llvm.org/D22249
llvm-svn: 275592
2016-07-16 02:27:10 +08:00
|
|
|
SDValue Store =
|
|
|
|
DAG.getStore(Chain, DL, ArgValue, PtrOff, MachinePointerInfo());
|
2014-07-19 06:55:25 +08:00
|
|
|
cast<StoreSDNode>(Store.getNode())->getMemOperand()->setValue(
|
|
|
|
(Value *)nullptr);
|
2012-10-27 08:21:13 +08:00
|
|
|
OutChains.push_back(Store);
|
|
|
|
}
|
|
|
|
}
|
2014-11-03 00:09:29 +08:00
|
|
|
|
|
|
|
/// Assign argument registers to a byval argument.
///
/// For every calling convention except Fast, registers are taken from the
/// ABI's byval argument register list, starting at the first unallocated one,
/// until either the (rounded-up) argument is covered or the list is
/// exhausted. The half-open register range is then recorded in \p State via
/// addInRegsParamInfo().
///
/// \param State Calling convention state to update.
/// \param Size  In: size of the byval argument, must be non-zero. Out (non
///              Fast conventions): the size rounded up to a multiple of the
///              GPR size, minus one GPR size for every register allocated.
/// \param Align Requested alignment; clamped to the stack alignment.
void MipsTargetLowering::HandleByVal(CCState *State, unsigned &Size,
                                     unsigned Align) const {
  const TargetFrameLowering *TFL = Subtarget.getFrameLowering();

  assert(Size && "Byval argument's size shouldn't be 0.");

  Align = std::min(Align, TFL->getStackAlignment());

  unsigned FirstReg = 0;
  unsigned NumRegs = 0;

  if (State->getCallingConv() != CallingConv::Fast) {
    unsigned RegSizeInBytes = Subtarget.getGPRSizeInBytes();
    ArrayRef<MCPhysReg> IntArgRegs = ABI.GetByValArgRegs();
    // FIXME: The O32 case actually describes no shadow registers.
    const MCPhysReg *ShadowRegs =
        ABI.IsO32() ? IntArgRegs.data() : Mips64DPRegs;

    // We used to check the size as well but we can't do that anymore since
    // CCState::HandleByVal() rounds up the size after calling this function.
    assert(!(Align % RegSizeInBytes) &&
           "Byval argument's alignment should be a multiple of "
           "RegSizeInBytes.");

    FirstReg = State->getFirstUnallocated(IntArgRegs);

    // If Align > RegSizeInBytes, the first arg register must be even.
    // FIXME: This condition happens to do the right thing but it's not the
    //        right way to test it. We want to check that the stack frame offset
    //        of the register is aligned.
    if ((Align > RegSizeInBytes) && (FirstReg % 2)) {
      // Burn the odd register so that the argument starts on an even one.
      State->AllocateReg(IntArgRegs[FirstReg], ShadowRegs[FirstReg]);
      ++FirstReg;
    }

    // Mark the registers allocated.
    Size = alignTo(Size, RegSizeInBytes);
    for (unsigned I = FirstReg; Size > 0 && (I < IntArgRegs.size());
         Size -= RegSizeInBytes, ++I, ++NumRegs)
      State->AllocateReg(IntArgRegs[I], ShadowRegs[I]);
  }

  State->addInRegsParamInfo(FirstReg, FirstReg + NumRegs);
}
|
2014-12-12 22:41:37 +08:00
|
|
|
|
2016-07-01 06:52:52 +08:00
|
|
|
/// Expand a SELECT pseudo instruction into explicit control flow for
/// subtargets that lack conditional moves.
///
/// The block containing \p MI is split after \p MI. A conditional branch
/// built from \p Opc jumps from the original block to the new tail block
/// (sinkMBB); the fall-through path goes through an empty block (copy0MBB).
/// A PHI at the top of sinkMBB selects operand 2 of \p MI when arriving from
/// the original block and operand 3 when arriving from copy0MBB.
///
/// \param MI      The pseudo instruction; it is erased.
/// \param BB      The block that contains \p MI.
/// \param isFPCmp When true the branch takes only the condition register
///                (operand 1); otherwise it also compares against $zero.
/// \param Opc     Opcode of the branch instruction to emit.
/// \returns the tail block (sinkMBB).
MachineBasicBlock *MipsTargetLowering::emitPseudoSELECT(MachineInstr &MI,
                                                        MachineBasicBlock *BB,
                                                        bool isFPCmp,
                                                        unsigned Opc) const {
  assert(!(Subtarget.hasMips4() || Subtarget.hasMips32()) &&
         "Subtarget already supports SELECT nodes with the use of "
         "conditional-move instructions.");

  const TargetInstrInfo *TII = Subtarget.getInstrInfo();
  DebugLoc DL = MI.getDebugLoc();

  // To "insert" a SELECT instruction, we actually have to insert the
  // diamond control-flow pattern.  The incoming instruction knows the
  // destination vreg to set, the condition code register to branch on, the
  // true/false values to select between, and a branch opcode to use.
  const BasicBlock *LLVM_BB = BB->getBasicBlock();
  MachineFunction::iterator It = ++BB->getIterator();

  //  thisMBB:
  //  ...
  //   TrueVal = ...
  //   setcc r1, r2, r3
  //   bNE   r1, r0, sinkMBB
  //   fallthrough --> copy0MBB
  MachineBasicBlock *thisMBB = BB;
  MachineFunction *F = BB->getParent();
  MachineBasicBlock *copy0MBB = F->CreateMachineBasicBlock(LLVM_BB);
  MachineBasicBlock *sinkMBB = F->CreateMachineBasicBlock(LLVM_BB);
  F->insert(It, copy0MBB);
  F->insert(It, sinkMBB);

  // Transfer the remainder of BB and its successor edges to sinkMBB.
  sinkMBB->splice(sinkMBB->begin(), BB,
                  std::next(MachineBasicBlock::iterator(MI)), BB->end());
  sinkMBB->transferSuccessorsAndUpdatePHIs(BB);

  // Next, add the true and fallthrough blocks as its successors.
  BB->addSuccessor(copy0MBB);
  BB->addSuccessor(sinkMBB);

  // Emit the conditional branch at the end of thisMBB:
  //   FP compare:      bc1[tf] cc, sinkMBB
  //   integer compare: bne rs, $0, sinkMBB
  MachineInstrBuilder Branch =
      BuildMI(BB, DL, TII->get(Opc)).addReg(MI.getOperand(1).getReg());
  if (!isFPCmp)
    Branch.addReg(Mips::ZERO);
  Branch.addMBB(sinkMBB);

  //  copy0MBB:
  //   %FalseValue = ...
  //   # fallthrough to sinkMBB
  BB = copy0MBB;

  // Update machine-CFG edges
  BB->addSuccessor(sinkMBB);

  //  sinkMBB:
  //   %Result = phi [ %TrueValue, thisMBB ], [ %FalseValue, copy0MBB ]
  //  ...
  BB = sinkMBB;

  BuildMI(*BB, BB->begin(), DL, TII->get(Mips::PHI), MI.getOperand(0).getReg())
      .addReg(MI.getOperand(2).getReg())
      .addMBB(thisMBB)
      .addReg(MI.getOperand(3).getReg())
      .addMBB(copy0MBB);

  MI.eraseFromParent(); // The pseudo instruction is gone now.

  return BB;
}
|
2015-01-10 01:21:30 +08:00
|
|
|
|
|
|
|
// FIXME? Maybe this could be a TableGen attribute on some registers and
|
|
|
|
// this table could be generated automatically from RegInfo.
|
2015-07-10 01:40:29 +08:00
|
|
|
unsigned MipsTargetLowering::getRegisterByName(const char* RegName, EVT VT,
|
|
|
|
SelectionDAG &DAG) const {
|
2015-01-10 01:21:30 +08:00
|
|
|
// Named registers is expected to be fairly rare. For now, just support $28
|
|
|
|
// since the linux kernel uses it.
|
|
|
|
if (Subtarget.isGP64bit()) {
|
|
|
|
unsigned Reg = StringSwitch<unsigned>(RegName)
|
|
|
|
.Case("$28", Mips::GP_64)
|
|
|
|
.Default(0);
|
|
|
|
if (Reg)
|
|
|
|
return Reg;
|
|
|
|
} else {
|
|
|
|
unsigned Reg = StringSwitch<unsigned>(RegName)
|
|
|
|
.Case("$28", Mips::GP)
|
|
|
|
.Default(0);
|
|
|
|
if (Reg)
|
|
|
|
return Reg;
|
|
|
|
}
|
|
|
|
report_fatal_error("Invalid register name global variable");
|
|
|
|
}
|