forked from OSchip/llvm-project
[X86][ARM][TargetLowering] Add SrcVT to isExtractSubvectorCheap
Summary: Without the SrcVT its hard to know what is really being asked for. For example if your target has 128, 256, and 512 bit vectors. Maybe extracting 128 from 256 is cheap, but maybe extracting 128 from 512 is not. For x86 we do support extracting a quarter of a 512-bit register. But for i1 vectors we don't have isel patterns for extracting arbitrary pieces. So we need this to have a correct implementation of isExtractSubvectorCheap for mask vectors. Reviewers: RKSimon, zvi, efriedma Reviewed By: RKSimon Subscribers: aemerson, javed.absar, kristof.beyls, llvm-commits Differential Revision: https://reviews.llvm.org/D36649 llvm-svn: 310793
This commit is contained in:
parent
bed2c50607
commit
2251ef95a3
|
@ -2172,11 +2172,12 @@ public:
|
|||
return false;
|
||||
}
|
||||
|
||||
/// Return true if EXTRACT_SUBVECTOR is cheap for this result type
|
||||
/// with this index. This is needed because EXTRACT_SUBVECTOR usually
|
||||
/// has custom lowering that depends on the index of the first element,
|
||||
/// and only the target knows which lowering is cheap.
|
||||
virtual bool isExtractSubvectorCheap(EVT ResVT, unsigned Index) const {
|
||||
/// Return true if EXTRACT_SUBVECTOR is cheap for extracting this result type
|
||||
/// from this source type with this index. This is needed because
|
||||
/// EXTRACT_SUBVECTOR usually has custom lowering that depends on the index of
|
||||
/// the first element, and only the target knows which lowering is cheap.
|
||||
virtual bool isExtractSubvectorCheap(EVT ResVT, EVT SrcVT,
|
||||
unsigned Index) const {
|
||||
return false;
|
||||
}
|
||||
|
||||
|
|
|
@ -14212,7 +14212,7 @@ SDValue DAGCombiner::createBuildVecShuffle(const SDLoc &DL, SDNode *N,
|
|||
VecIn1 = DAG.getNode(ISD::CONCAT_VECTORS, DL, VT, ConcatOps);
|
||||
VecIn2 = SDValue();
|
||||
} else if (InVT1.getSizeInBits() == VT.getSizeInBits() * 2) {
|
||||
if (!TLI.isExtractSubvectorCheap(VT, NumElems))
|
||||
if (!TLI.isExtractSubvectorCheap(VT, InVT1, NumElems))
|
||||
return SDValue();
|
||||
|
||||
if (!VecIn2.getNode()) {
|
||||
|
|
|
@ -13402,7 +13402,7 @@ bool ARMTargetLowering::shouldConvertConstantLoadToIntImm(const APInt &Imm,
|
|||
return true;
|
||||
}
|
||||
|
||||
bool ARMTargetLowering::isExtractSubvectorCheap(EVT ResVT,
|
||||
bool ARMTargetLowering::isExtractSubvectorCheap(EVT ResVT, EVT SrcVT,
|
||||
unsigned Index) const {
|
||||
if (!isOperationLegalOrCustom(ISD::EXTRACT_SUBVECTOR, ResVT))
|
||||
return false;
|
||||
|
|
|
@ -459,7 +459,8 @@ class InstrItineraryData;
|
|||
|
||||
/// Return true if EXTRACT_SUBVECTOR is cheap for this result type
|
||||
/// with this index.
|
||||
bool isExtractSubvectorCheap(EVT ResVT, unsigned Index) const override;
|
||||
bool isExtractSubvectorCheap(EVT ResVT, EVT SrcVT,
|
||||
unsigned Index) const override;
|
||||
|
||||
/// \brief Returns true if an argument of type Ty needs to be passed in a
|
||||
/// contiguous block of registers in calling convention CallConv.
|
||||
|
|
|
@ -4574,7 +4574,7 @@ bool X86TargetLowering::shouldConvertConstantLoadToIntImm(const APInt &Imm,
|
|||
return true;
|
||||
}
|
||||
|
||||
bool X86TargetLowering::isExtractSubvectorCheap(EVT ResVT,
|
||||
bool X86TargetLowering::isExtractSubvectorCheap(EVT ResVT, EVT SrcVT,
|
||||
unsigned Index) const {
|
||||
if (!isOperationLegalOrCustom(ISD::EXTRACT_SUBVECTOR, ResVT))
|
||||
return false;
|
||||
|
|
|
@ -1036,7 +1036,8 @@ namespace llvm {
|
|||
|
||||
/// Return true if EXTRACT_SUBVECTOR is cheap for this result type
|
||||
/// with this index.
|
||||
bool isExtractSubvectorCheap(EVT ResVT, unsigned Index) const override;
|
||||
bool isExtractSubvectorCheap(EVT ResVT, EVT SrcVT,
|
||||
unsigned Index) const override;
|
||||
|
||||
/// Intel processors have a unified instruction and data cache
|
||||
const char * getClearCacheBuiltinName() const override {
|
||||
|
|
Loading…
Reference in New Issue