forked from OSchip/llvm-project
[X86][AVX] lowerV2X128Shuffle - use getBROADCAST_LOAD helper. NFCI.
This commit is contained in:
parent
7999355106
commit
8ca666a280
|
@@ -16432,21 +16432,12 @@ static SDValue lowerV2X128Shuffle(const SDLoc &DL, MVT VT, SDValue V1,
|
|||
bool SplatHi = isShuffleEquivalent(Mask, {2, 3, 2, 3}, V1);
|
||||
if ((SplatLo || SplatHi) && !Subtarget.hasAVX512() && V1.hasOneUse() &&
|
||||
X86::mayFoldLoad(peekThroughOneUseBitcasts(V1), Subtarget)) {
|
||||
auto *Ld = cast<LoadSDNode>(peekThroughOneUseBitcasts(V1));
|
||||
if (!Ld->isNonTemporal()) {
|
||||
MVT MemVT = VT.getHalfNumVectorElementsVT();
|
||||
unsigned Ofs = SplatLo ? 0 : MemVT.getStoreSize();
|
||||
SDVTList Tys = DAG.getVTList(VT, MVT::Other);
|
||||
SDValue Ptr = DAG.getMemBasePlusOffset(Ld->getBasePtr(),
|
||||
TypeSize::Fixed(Ofs), DL);
|
||||
SDValue Ops[] = {Ld->getChain(), Ptr};
|
||||
SDValue BcastLd = DAG.getMemIntrinsicNode(
|
||||
X86ISD::SUBV_BROADCAST_LOAD, DL, Tys, Ops, MemVT,
|
||||
DAG.getMachineFunction().getMachineMemOperand(
|
||||
Ld->getMemOperand(), Ofs, MemVT.getStoreSize()));
|
||||
DAG.ReplaceAllUsesOfValueWith(SDValue(Ld, 1), BcastLd.getValue(1));
|
||||
return BcastLd;
|
||||
}
|
||||
auto *Ld = cast<LoadSDNode>(peekThroughOneUseBitcasts(V1));
|
||||
if (SDValue BcstLd = getBROADCAST_LOAD(X86ISD::SUBV_BROADCAST_LOAD, DL,
|
||||
VT, MemVT, Ld, Ofs, DAG))
|
||||
return BcstLd;
|
||||
}
|
||||
|
||||
// With AVX2, use VPERMQ/VPERMPD for unary shuffles to allow memory folding.
|
||||
|
|
Loading…
Reference in New Issue