[SVE][CodeGen] Fix TypeSize/ElementCount related warnings in sve-split-store.ll

I have fixed up a number of warnings resulting from TypeSize -> uint64_t
casts and calling getVectorNumElements() on scalable vector types. I
think most of the changes are fairly trivial except for those in
DAGTypeLegalizer::SplitVecRes_MSTORE I've tried to ensure we create
the MachineMemoryOperands in a sensible way for scalable vectors.

I have added a CHECK line to the following test:

 CodeGen/AArch64/sve-split-store.ll

that ensures no new warnings are added.

Differential Revision: https://reviews.llvm.org/D86928
This commit is contained in:
David Sherwood 2020-08-26 10:51:56 +01:00
parent 6e25586990
commit fa0293081d
4 changed files with 37 additions and 17 deletions

View File

@ -542,28 +542,29 @@ void SelectionDAGLegalize::LegalizeStoreOps(SDNode *Node) {
LLVM_DEBUG(dbgs() << "Legalizing truncating store operations\n"); LLVM_DEBUG(dbgs() << "Legalizing truncating store operations\n");
SDValue Value = ST->getValue(); SDValue Value = ST->getValue();
EVT StVT = ST->getMemoryVT(); EVT StVT = ST->getMemoryVT();
unsigned StWidth = StVT.getSizeInBits(); TypeSize StWidth = StVT.getSizeInBits();
TypeSize StSize = StVT.getStoreSizeInBits();
auto &DL = DAG.getDataLayout(); auto &DL = DAG.getDataLayout();
if (StWidth != StVT.getStoreSizeInBits()) { if (StWidth != StSize) {
// Promote to a byte-sized store with upper bits zero if not // Promote to a byte-sized store with upper bits zero if not
// storing an integral number of bytes. For example, promote // storing an integral number of bytes. For example, promote
// TRUNCSTORE:i1 X -> TRUNCSTORE:i8 (and X, 1) // TRUNCSTORE:i1 X -> TRUNCSTORE:i8 (and X, 1)
EVT NVT = EVT::getIntegerVT(*DAG.getContext(), EVT NVT = EVT::getIntegerVT(*DAG.getContext(), StSize.getFixedSize());
StVT.getStoreSizeInBits());
Value = DAG.getZeroExtendInReg(Value, dl, StVT); Value = DAG.getZeroExtendInReg(Value, dl, StVT);
SDValue Result = SDValue Result =
DAG.getTruncStore(Chain, dl, Value, Ptr, ST->getPointerInfo(), NVT, DAG.getTruncStore(Chain, dl, Value, Ptr, ST->getPointerInfo(), NVT,
ST->getOriginalAlign(), MMOFlags, AAInfo); ST->getOriginalAlign(), MMOFlags, AAInfo);
ReplaceNode(SDValue(Node, 0), Result); ReplaceNode(SDValue(Node, 0), Result);
} else if (StWidth & (StWidth - 1)) { } else if (!StVT.isVector() && !isPowerOf2_64(StWidth.getFixedSize())) {
// If not storing a power-of-2 number of bits, expand as two stores. // If not storing a power-of-2 number of bits, expand as two stores.
assert(!StVT.isVector() && "Unsupported truncstore!"); assert(!StVT.isVector() && "Unsupported truncstore!");
unsigned LogStWidth = Log2_32(StWidth); unsigned StWidthBits = StWidth.getFixedSize();
unsigned LogStWidth = Log2_32(StWidthBits);
assert(LogStWidth < 32); assert(LogStWidth < 32);
unsigned RoundWidth = 1 << LogStWidth; unsigned RoundWidth = 1 << LogStWidth;
assert(RoundWidth < StWidth); assert(RoundWidth < StWidthBits);
unsigned ExtraWidth = StWidth - RoundWidth; unsigned ExtraWidth = StWidthBits - RoundWidth;
assert(ExtraWidth < RoundWidth); assert(ExtraWidth < RoundWidth);
assert(!(RoundWidth % 8) && !(ExtraWidth % 8) && assert(!(RoundWidth % 8) && !(ExtraWidth % 8) &&
"Store size not an integral number of bytes!"); "Store size not an integral number of bytes!");

View File

@ -2425,9 +2425,10 @@ SDValue DAGTypeLegalizer::SplitVecOp_MSTORE(MaskedStoreSDNode *N,
DAG.GetDependentSplitDestVTs(MemoryVT, DataLo.getValueType(), &HiIsEmpty); DAG.GetDependentSplitDestVTs(MemoryVT, DataLo.getValueType(), &HiIsEmpty);
SDValue Lo, Hi, Res; SDValue Lo, Hi, Res;
unsigned LoSize = MemoryLocation::getSizeOrUnknown(LoMemVT.getStoreSize());
MachineMemOperand *MMO = DAG.getMachineFunction().getMachineMemOperand( MachineMemOperand *MMO = DAG.getMachineFunction().getMachineMemOperand(
N->getPointerInfo(), MachineMemOperand::MOStore, LoMemVT.getStoreSize(), N->getPointerInfo(), MachineMemOperand::MOStore, LoSize, Alignment,
Alignment, N->getAAInfo(), N->getRanges()); N->getAAInfo(), N->getRanges());
Lo = DAG.getMaskedStore(Ch, DL, DataLo, Ptr, Offset, MaskLo, LoMemVT, MMO, Lo = DAG.getMaskedStore(Ch, DL, DataLo, Ptr, Offset, MaskLo, LoMemVT, MMO,
N->getAddressingMode(), N->isTruncatingStore(), N->getAddressingMode(), N->isTruncatingStore(),
@ -2441,11 +2442,20 @@ SDValue DAGTypeLegalizer::SplitVecOp_MSTORE(MaskedStoreSDNode *N,
Ptr = TLI.IncrementMemoryAddress(Ptr, MaskLo, DL, LoMemVT, DAG, Ptr = TLI.IncrementMemoryAddress(Ptr, MaskLo, DL, LoMemVT, DAG,
N->isCompressingStore()); N->isCompressingStore());
unsigned HiOffset = LoMemVT.getStoreSize();
MachinePointerInfo MPI;
if (LoMemVT.isScalableVector()) {
Alignment = commonAlignment(
Alignment, LoMemVT.getSizeInBits().getKnownMinSize() / 8);
MPI = MachinePointerInfo(N->getPointerInfo().getAddrSpace());
} else
MPI = N->getPointerInfo().getWithOffset(
LoMemVT.getStoreSize().getFixedSize());
unsigned HiSize = MemoryLocation::getSizeOrUnknown(HiMemVT.getStoreSize());
MMO = DAG.getMachineFunction().getMachineMemOperand( MMO = DAG.getMachineFunction().getMachineMemOperand(
N->getPointerInfo().getWithOffset(HiOffset), MachineMemOperand::MOStore, MPI, MachineMemOperand::MOStore, HiSize, Alignment, N->getAAInfo(),
HiMemVT.getStoreSize(), Alignment, N->getAAInfo(), N->getRanges()); N->getRanges());
Hi = DAG.getMaskedStore(Ch, DL, DataHi, Ptr, Offset, MaskHi, HiMemVT, MMO, Hi = DAG.getMaskedStore(Ch, DL, DataHi, Ptr, Offset, MaskHi, HiMemVT, MMO,
N->getAddressingMode(), N->isTruncatingStore(), N->getAddressingMode(), N->isTruncatingStore(),

View File

@ -2214,6 +2214,10 @@ SDValue SelectionDAG::FoldSetCC(EVT VT, SDValue N1, SDValue N2,
/// SimplifyMultipleUseDemandedBits and not generate any new nodes. /// SimplifyMultipleUseDemandedBits and not generate any new nodes.
SDValue SelectionDAG::GetDemandedBits(SDValue V, const APInt &DemandedBits) { SDValue SelectionDAG::GetDemandedBits(SDValue V, const APInt &DemandedBits) {
EVT VT = V.getValueType(); EVT VT = V.getValueType();
if (VT.isScalableVector())
return SDValue();
APInt DemandedElts = VT.isVector() APInt DemandedElts = VT.isVector()
? APInt::getAllOnesValue(VT.getVectorNumElements()) ? APInt::getAllOnesValue(VT.getVectorNumElements())
: APInt(1, 1); : APInt(1, 1);
@ -7135,7 +7139,8 @@ SDValue SelectionDAG::getTruncStore(SDValue Chain, const SDLoc &dl, SDValue Val,
MachineFunction &MF = getMachineFunction(); MachineFunction &MF = getMachineFunction();
MachineMemOperand *MMO = MF.getMachineMemOperand( MachineMemOperand *MMO = MF.getMachineMemOperand(
PtrInfo, MMOFlags, SVT.getStoreSize(), Alignment, AAInfo); PtrInfo, MMOFlags, MemoryLocation::getSizeOrUnknown(SVT.getStoreSize()),
Alignment, AAInfo);
return getTruncStore(Chain, dl, Val, Ptr, SVT, MMO); return getTruncStore(Chain, dl, Val, Ptr, SVT, MMO);
} }
@ -7156,7 +7161,7 @@ SDValue SelectionDAG::getTruncStore(SDValue Chain, const SDLoc &dl, SDValue Val,
assert(VT.isVector() == SVT.isVector() && assert(VT.isVector() == SVT.isVector() &&
"Cannot use trunc store to convert to or from a vector!"); "Cannot use trunc store to convert to or from a vector!");
assert((!VT.isVector() || assert((!VT.isVector() ||
VT.getVectorNumElements() == SVT.getVectorNumElements()) && VT.getVectorElementCount() == SVT.getVectorElementCount()) &&
"Cannot use trunc store to change the number of vector elements!"); "Cannot use trunc store to change the number of vector elements!");
SDVTList VTs = getVTList(MVT::Other); SDVTList VTs = getVTList(MVT::Other);

View File

@ -1,5 +1,9 @@
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -mtriple=aarch64-linux-gnu -mattr=+sve < %s | FileCheck %s ; RUN: llc -mtriple=aarch64-linux-gnu -mattr=+sve < %s 2>%t | FileCheck %s
; RUN: FileCheck --check-prefix=WARN --allow-empty %s <%t
; If this check fails please read test/CodeGen/AArch64/README for instructions on how to resolve it.
; WARN-NOT: warning
; UNPREDICATED ; UNPREDICATED
@ -113,10 +117,10 @@ define void @masked_store_split_8i64(<vscale x 8 x i64> %data, <vscale x 8 x i64
; CHECK-NEXT: zip1 p0.h, p0.h, p1.h ; CHECK-NEXT: zip1 p0.h, p0.h, p1.h
; CHECK-NEXT: zip2 p3.s, p2.s, p1.s ; CHECK-NEXT: zip2 p3.s, p2.s, p1.s
; CHECK-NEXT: zip1 p2.s, p2.s, p1.s ; CHECK-NEXT: zip1 p2.s, p2.s, p1.s
; CHECK-NEXT: st1d { z3.d }, p3, [x0, #3, mul vl]
; CHECK-NEXT: st1d { z2.d }, p2, [x0, #2, mul vl] ; CHECK-NEXT: st1d { z2.d }, p2, [x0, #2, mul vl]
; CHECK-NEXT: zip2 p2.s, p0.s, p1.s ; CHECK-NEXT: zip2 p2.s, p0.s, p1.s
; CHECK-NEXT: zip1 p0.s, p0.s, p1.s ; CHECK-NEXT: zip1 p0.s, p0.s, p1.s
; CHECK-NEXT: st1d { z3.d }, p3, [x0, #3, mul vl]
; CHECK-NEXT: st1d { z1.d }, p2, [x0, #1, mul vl] ; CHECK-NEXT: st1d { z1.d }, p2, [x0, #1, mul vl]
; CHECK-NEXT: st1d { z0.d }, p0, [x0] ; CHECK-NEXT: st1d { z0.d }, p0, [x0]
; CHECK-NEXT: ret ; CHECK-NEXT: ret