[Hexagon] Avoid widening vectors with non-HVX element types

This commit is contained in:
Krzysztof Parzyszek 2020-09-12 16:32:24 -05:00
parent 70daa353e2
commit 9d300bc8d2
3 changed files with 61 additions and 14 deletions

View File

@ -1925,6 +1925,17 @@ HexagonTargetLowering::WidenHvxTruncate(SDValue Op, SelectionDAG &DAG) const {
const SDLoc &dl(Op); const SDLoc &dl(Op);
unsigned HwWidth = 8*Subtarget.getVectorLength(); unsigned HwWidth = 8*Subtarget.getVectorLength();
SDValue Op0 = Op.getOperand(0);
MVT ResTy = ty(Op);
MVT OpTy = ty(Op0);
if (!Subtarget.isHVXElementType(OpTy) || !Subtarget.isHVXElementType(ResTy))
return SDValue();
// .-res, op-> Scalar Illegal HVX
// Scalar ok extract(widen) -
// Illegal - widen widen
// HVX - - ok
auto getFactor = [HwWidth](MVT Ty) { auto getFactor = [HwWidth](MVT Ty) {
unsigned Width = Ty.getSizeInBits(); unsigned Width = Ty.getSizeInBits();
assert(HwWidth % Width == 0); assert(HwWidth % Width == 0);
@ -1936,15 +1947,6 @@ HexagonTargetLowering::WidenHvxTruncate(SDValue Op, SelectionDAG &DAG) const {
return MVT::getVectorVT(Ty.getVectorElementType(), WideLen); return MVT::getVectorVT(Ty.getVectorElementType(), WideLen);
}; };
SDValue Op0 = Op.getOperand(0);
MVT ResTy = ty(Op);
MVT OpTy = ty(Op0);
// .-res, op-> Scalar Illegal HVX
// Scalar ok extract(widen) -
// Illegal - widen widen
// HVX - - ok
if (Subtarget.isHVXVectorType(OpTy)) if (Subtarget.isHVXVectorType(OpTy))
return DAG.getNode(HexagonISD::VPACKL, dl, getWideTy(ResTy), Op0); return DAG.getNode(HexagonISD::VPACKL, dl, getWideTy(ResTy), Op0);
@ -2053,7 +2055,7 @@ HexagonTargetLowering::LowerHvxOperationWrapper(SDNode *N,
switch (Opc) { switch (Opc) {
case ISD::TRUNCATE: { case ISD::TRUNCATE: {
assert(shouldWidenToHvx(ty(Op.getOperand(0)), DAG) && "Not widening?"); assert(shouldWidenToHvx(ty(Op.getOperand(0)), DAG) && "Not widening?");
SDValue T = WidenHvxTruncate(Op, DAG); if (SDValue T = WidenHvxTruncate(Op, DAG))
Results.push_back(T); Results.push_back(T);
break; break;
} }
@ -2089,7 +2091,7 @@ HexagonTargetLowering::ReplaceHvxNodeResults(SDNode *N,
switch (Opc) { switch (Opc) {
case ISD::TRUNCATE: { case ISD::TRUNCATE: {
assert(shouldWidenToHvx(ty(Op), DAG) && "Not widening?"); assert(shouldWidenToHvx(ty(Op), DAG) && "Not widening?");
SDValue T = WidenHvxTruncate(Op, DAG); if (SDValue T = WidenHvxTruncate(Op, DAG))
Results.push_back(T); Results.push_back(T);
break; break;
} }

View File

@ -275,6 +275,17 @@ public:
return makeArrayRef(Types); return makeArrayRef(Types);
} }
/// Tell whether \p Ty is built from an element type listed by
/// getHVXElementTypes().
///
/// For a vector type the check is applied to its element type; any other
/// type is checked as-is. Always returns false when useHVXOps() is false.
///
/// \param Ty           Type to examine (vector or non-vector).
/// \param IncludeBool  When true, MVT::i1 is accepted as well.
/// \returns true if the (element) type is accepted, false otherwise.
bool isHVXElementType(MVT Ty, bool IncludeBool = false) const {
  if (!useHVXOps())
    return false;

  // Reduce a vector type to the type of a single element.
  const MVT ElemTy = Ty.isVector() ? Ty.getVectorElementType() : Ty;

  // Booleans are only accepted on explicit request.
  if (ElemTy == MVT::i1 && IncludeBool)
    return true;

  ArrayRef<MVT> Supported = getHVXElementTypes();
  return llvm::find(Supported, ElemTy) != Supported.end();
}
bool isHVXVectorType(MVT VecTy, bool IncludeBool = false) const { bool isHVXVectorType(MVT VecTy, bool IncludeBool = false) const {
if (!VecTy.isVector() || !useHVXOps() || VecTy.isScalableVector()) if (!VecTy.isVector() || !useHVXOps() || VecTy.isScalableVector())
return false; return false;
@ -298,7 +309,7 @@ public:
unsigned VecWidth = VecTy.getSizeInBits(); unsigned VecWidth = VecTy.getSizeInBits();
if (VecWidth != 8*HwLen && VecWidth != 16*HwLen) if (VecWidth != 8*HwLen && VecWidth != 16*HwLen)
return false; return false;
return llvm::any_of(ElemTypes, [ElemTy] (MVT T) { return ElemTy == T; }); return llvm::find(ElemTypes, ElemTy) != ElemTypes.end();
} }
unsigned getTypeAlignment(MVT Ty) const { unsigned getTypeAlignment(MVT Ty) const {

View File

@ -0,0 +1,34 @@
; RUN: llc -march=hexagon < %s | FileCheck %s
; Check that this does not crash.
; CHECK: vmem
target datalayout = "e-m:e-p:32:32:32-a:0-n16:32-i64:64:64-i32:32:32-i16:16:16-i1:8:8-f32:32:32-f64:64:64-v32:32:32-v64:64:64-v512:512:512-v1024:1024:1024-v2048:2048:2048"
target triple = "hexagon"
; Reproducer body: a scalar value is splatted into a <32 x i64> vector,
; multiplied with a sign-extended <32 x i32> load, shifted right by 32 and
; truncated back to <32 x i32> before being stored.
define dso_local void @f0() local_unnamed_addr #0 {
b0:
; Scalar computation producing the i64 value %v8 that gets splatted below.
%v0 = load i32, i32* undef, align 4
%v1 = select i1 undef, i32 0, i32 1073741823
%v2 = shl i32 %v1, 0
%v3 = sext i32 %v0 to i64
%v4 = sext i32 %v2 to i64
%v5 = mul nsw i64 %v4, %v3
%v6 = lshr i64 %v5, 32
%v7 = trunc i64 %v6 to i32
%v8 = sext i32 %v7 to i64
; Splat %v8 across all 32 lanes: insert into lane 0, then shuffle with an
; all-zero mask.
%v9 = insertelement <32 x i64> undef, i64 %v8, i32 0
%v10 = shufflevector <32 x i64> %v9, <32 x i64> undef, <32 x i32> zeroinitializer
; Load a <32 x i32> vector from the address 32 i32 elements past null.
%v11 = getelementptr i32, i32* null, i32 32
%v12 = bitcast i32* %v11 to <32 x i32>*
%v13 = load <32 x i32>, <32 x i32>* %v12, align 4
%v14 = shl <32 x i32> %v13, zeroinitializer
; Widen to i64 lanes, multiply by the splat and shift each lane right by 32.
%v15 = sext <32 x i32> %v14 to <32 x i64>
%v16 = mul nsw <32 x i64> %v10, %v15
%v17 = lshr <32 x i64> %v16, <i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32, i64 32>
; Vector truncate from i64 lanes to i32 lanes.
; NOTE(review): presumably this is the operation that used to crash during
; lowering - confirm against the commit description.
%v18 = trunc <32 x i64> %v17 to <32 x i32>
; Store the result back to the address the vector was loaded from.
store <32 x i32> %v18, <32 x i32>* %v12, align 4
ret void
}
attributes #0 = { "target-features"="+hvx-length128b,+hvxv67,+v67,-long-calls" }