[Hexagon] Handle BUILD_VECTOR from undef values in buildHvxVectorReg

llvm-svn: 323889
This commit is contained in:
Krzysztof Parzyszek 2018-01-31 16:52:15 +00:00
parent f89f188ddb
commit 82a83391d3
2 changed files with 43 additions and 1 deletions

View File

@ -168,16 +168,19 @@ HexagonTargetLowering::buildHvxVectorReg(ArrayRef<SDValue> Values,
}
unsigned NumWords = Words.size();
bool IsSplat = true;
bool IsSplat = true, IsUndef = true;
SDValue SplatV;
for (unsigned i = 0; i != NumWords && IsSplat; ++i) {
if (isUndef(Words[i]))
continue;
IsUndef = false;
if (!SplatV.getNode())
SplatV = Words[i];
else if (SplatV != Words[i])
IsSplat = false;
}
if (IsUndef)
return DAG.getUNDEF(VecTy);
if (IsSplat) {
assert(SplatV.getNode());
auto *IdxN = dyn_cast<ConstantSDNode>(SplatV.getNode());

View File

@ -0,0 +1,39 @@
; RUN: llc -march=hexagon < %s | FileCheck %s
; During lowering, a BUILD_VECTOR of undef values was created. This was
; not properly handled by buildHvxVectorReg, which tried to generate a
; splat, but had no source value.
;
; Check that this compiles successfully.
; CHECK: vxor
target datalayout = "e-m:e-p:32:32:32-a:0-n16:32-i64:64:64-i32:32:32-i16:16:16-i1:8:8-f32:32:32-f64:64:64-v32:32:32-v64:64:64-v512:512:512-v1024:1024:1024-v2048:2048:2048"
target triple = "hexagon"
define void @fred() #0 {
b0:
%v1 = load i8, i8* undef, align 1
%v2 = insertelement <32 x i8> undef, i8 %v1, i32 31
%v3 = zext <32 x i8> %v2 to <32 x i16>
%v4 = add nuw nsw <32 x i16> %v3, zeroinitializer
%v5 = add nuw nsw <32 x i16> %v4, zeroinitializer
%v6 = add nuw nsw <32 x i16> %v5, zeroinitializer
%v7 = add nuw nsw <32 x i16> %v6, zeroinitializer
%v8 = add nuw nsw <32 x i16> %v7, zeroinitializer
%v9 = add nuw nsw <32 x i16> %v8, zeroinitializer
%v10 = add <32 x i16> %v9, zeroinitializer
%v11 = add <32 x i16> %v10, zeroinitializer
%v12 = add <32 x i16> %v11, zeroinitializer
%v13 = add <32 x i16> %v12, zeroinitializer
%v14 = add <32 x i16> %v13, zeroinitializer
%v15 = add <32 x i16> %v14, zeroinitializer
%v16 = add <32 x i16> %v15, zeroinitializer
%v17 = add <32 x i16> %v16, zeroinitializer
%v18 = add <32 x i16> %v17, zeroinitializer
%v19 = lshr <32 x i16> %v18, <i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4, i16 4>
%v20 = trunc <32 x i16> %v19 to <32 x i8>
store <32 x i8> %v20, <32 x i8>* undef, align 1
unreachable
}
attributes #0 = { norecurse nounwind "target-cpu"="hexagonv60" "target-features"="+hvx-length64b,+hvxv60" }