forked from OSchip/llvm-project
Revert r199628: "[AArch64 NEON] Fix a bug caused by undef lane when generating VEXT."
The reverted change fails the newly added regression tests. llvm-svn: 199631
This commit is contained in:
parent
b587ab679f
commit
f835fc6f4f
|
@ -4654,28 +4654,22 @@ AArch64TargetLowering::LowerVECTOR_SHUFFLE(SDValue Op,
|
|||
// it into NEON_VEXTRACT.
|
||||
if (V1EltNum == Length) {
|
||||
// Check if the shuffle mask is sequential.
|
||||
int SkipUndef = 0;
|
||||
while (ShuffleMask[SkipUndef] == -1) {
|
||||
SkipUndef++;
|
||||
bool IsSequential = true;
|
||||
int CurMask = ShuffleMask[0];
|
||||
for (int I = 0; I < Length; ++I) {
|
||||
if (ShuffleMask[I] != CurMask) {
|
||||
IsSequential = false;
|
||||
break;
|
||||
}
|
||||
CurMask++;
|
||||
}
|
||||
int CurMask = ShuffleMask[SkipUndef];
|
||||
if (CurMask >= SkipUndef) {
|
||||
bool IsSequential = true;
|
||||
for (int I = SkipUndef; I < Length; ++I) {
|
||||
if (ShuffleMask[I] != -1 && ShuffleMask[I] != CurMask) {
|
||||
IsSequential = false;
|
||||
break;
|
||||
}
|
||||
CurMask++;
|
||||
}
|
||||
if (IsSequential) {
|
||||
assert((EltSize % 8 == 0) && "Bitsize of vector element is incorrect");
|
||||
unsigned VecSize = EltSize * V1EltNum;
|
||||
unsigned Index = (EltSize / 8) * (ShuffleMask[SkipUndef] - SkipUndef);
|
||||
if (VecSize == 64 || VecSize == 128)
|
||||
return DAG.getNode(AArch64ISD::NEON_VEXTRACT, dl, VT, V1, V2,
|
||||
DAG.getConstant(Index, MVT::i64));
|
||||
}
|
||||
if (IsSequential) {
|
||||
assert((EltSize % 8 == 0) && "Bitsize of vector element is incorrect");
|
||||
unsigned VecSize = EltSize * V1EltNum;
|
||||
unsigned Index = (EltSize/8) * ShuffleMask[0];
|
||||
if (VecSize == 64 || VecSize == 128)
|
||||
return DAG.getNode(AArch64ISD::NEON_VEXTRACT, dl, VT, V1, V2,
|
||||
DAG.getConstant(Index, MVT::i64));
|
||||
}
|
||||
}
|
||||
|
||||
|
|
|
@ -188,35 +188,3 @@ entry:
|
|||
%vext = shufflevector <8 x i16> %a, <8 x i16> %b, <8 x i32> <i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10>
|
||||
ret <8 x i16> %vext
|
||||
}
|
||||
|
||||
; Regression test: <8 x i8> shuffle whose leading mask lanes are undef.
; Mask indices >= 8 select from the undef second operand, so lanes 0-1
; (index 10) are don't-care. The remaining indices 4..9 are consecutive and
; begin at lane 2, i.e. the extract window starts at element 4 - 2 = 2, which
; with 1-byte elements matches the expected `ext` immediate of #0x2.
define <8 x i8> @test_undef_vext_s8(<8 x i8> %a) {
|
||||
; CHECK: test_undef_vext_s8:
|
||||
; CHECK: ext {{v[0-9]+}}.8b, {{v[0-9]+}}.8b, {{v[0-9]+}}.8b, #0x2
|
||||
entry:
|
||||
%vext = shufflevector <8 x i8> %a, <8 x i8> undef, <8 x i32> <i32 10, i32 10, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9>
|
||||
ret <8 x i8> %vext
|
||||
}
|
||||
|
||||
; Regression test: <16 x i8> shuffle with undef lanes at both ends of the mask.
; Mask indices >= 16 select from the undef second operand, so the lanes holding
; index 20 (lanes 0-3 and 11-15) are don't-care. The indices 10..16 in lanes
; 4-10 are consecutive, i.e. the extract window starts at element 10 - 4 = 6,
; which with 1-byte elements matches the expected `ext` immediate of #0x6.
define <16 x i8> @test_undef_vextq_s8(<16 x i8> %a) {
|
||||
; CHECK: test_undef_vextq_s8:
|
||||
; CHECK: ext {{v[0-9]+}}.16b, {{v[0-9]+}}.16b, {{v[0-9]+}}.16b, #0x6
|
||||
entry:
|
||||
%vext = shufflevector <16 x i8> %a, <16 x i8> undef, <16 x i32> <i32 20, i32 20, i32 20, i32 20, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15, i32 16, i32 20, i32 20, i32 20, i32 20, i32 20>
|
||||
ret <16 x i8> %vext
|
||||
}
|
||||
|
||||
; Regression test: <4 x i16> shuffle whose first mask lane is undef.
; Mask indices >= 4 select from the undef second operand, so lane 0 (index 4)
; is don't-care. Lanes 1-3 hold the consecutive indices 2, 3, 4, i.e. the
; extract window starts at element 2 - 1 = 1; with 2-byte elements that is
; byte offset 2, matching the expected `ext` immediate of #0x2.
define <4 x i16> @test_undef_vext_s16(<4 x i16> %a) {
|
||||
; CHECK: test_undef_vext_s16:
|
||||
; CHECK: ext {{v[0-9]+}}.8b, {{v[0-9]+}}.8b, {{v[0-9]+}}.8b, #0x2
|
||||
entry:
|
||||
%vext = shufflevector <4 x i16> %a, <4 x i16> undef, <4 x i32> <i32 4, i32 2, i32 3, i32 4>
|
||||
ret <4 x i16> %vext
|
||||
}
|
||||
|
||||
; Regression test: <8 x i16> shuffle whose first mask lane is undef.
; Mask indices >= 8 select from the undef second operand, so lane 0 (index 10)
; is don't-care. Lanes 1-7 hold the consecutive indices 4..10, i.e. the
; extract window starts at element 4 - 1 = 3; with 2-byte elements that is
; byte offset 6, matching the expected `ext` immediate of #0x6.
define <8 x i16> @test_undef_vextq_s16(<8 x i16> %a) {
|
||||
; CHECK: test_undef_vextq_s16:
|
||||
; CHECK: ext {{v[0-9]+}}.16b, {{v[0-9]+}}.16b, {{v[0-9]+}}.16b, #0x6
|
||||
entry:
|
||||
%vext = shufflevector <8 x i16> %a, <8 x i16> undef, <8 x i32> <i32 10, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10>
|
||||
ret <8 x i16> %vext
|
||||
}
|
||||
|
|
Loading…
Reference in New Issue