forked from OSchip/llvm-project
Simplified TRUNCATE operation that comes after SETCC. It is possible since SETCC result is 0 or -1.
Added a test. llvm-svn: 171467
This commit is contained in:
parent
820aac1c78
commit
5f2f06d2d9
|
@ -14661,12 +14661,29 @@ static SDValue PerformShuffleCombine(SDNode *N, SelectionDAG &DAG,
|
||||||
return EltsFromConsecutiveLoads(VT, Elts, dl, DAG);
|
return EltsFromConsecutiveLoads(VT, Elts, dl, DAG);
|
||||||
}
|
}
|
||||||
|
|
||||||
/// PerformTruncateCombine - Converts truncate operation to
|
/// PerformTruncateCombine - In some cases a sequence with "truncate"
|
||||||
/// a sequence of vector shuffle operations.
|
/// operation may be simplified.
|
||||||
/// It is possible when we truncate 256-bit vector to 128-bit vector
|
|
||||||
static SDValue PerformTruncateCombine(SDNode *N, SelectionDAG &DAG,
|
static SDValue PerformTruncateCombine(SDNode *N, SelectionDAG &DAG,
|
||||||
TargetLowering::DAGCombinerInfo &DCI,
|
TargetLowering::DAGCombinerInfo &DCI,
|
||||||
const X86Subtarget *Subtarget) {
|
const X86Subtarget *Subtarget) {
|
||||||
|
EVT VT = N->getValueType(0);
|
||||||
|
if (DCI.isBeforeLegalize() || !VT.isVector())
|
||||||
|
return SDValue();
|
||||||
|
|
||||||
|
SDValue In = N->getOperand(0);
|
||||||
|
// Optimize the sequence setcc -> truncate
|
||||||
|
if (In.getOpcode() == ISD::SETCC) {
|
||||||
|
DebugLoc DL = N->getDebugLoc();
|
||||||
|
EVT InVT = In.getValueType();
|
||||||
|
|
||||||
|
// The vector element is all ones or all zero. Just take a half of it.
|
||||||
|
EVT HalfVT = EVT::getVectorVT(*DAG.getContext(), InVT.getScalarType(),
|
||||||
|
InVT.getVectorNumElements()/2);
|
||||||
|
SDValue HalfVec = DAG.getNode(ISD::EXTRACT_SUBVECTOR, DL, HalfVT, In,
|
||||||
|
DAG.getIntPtrConstant(0));
|
||||||
|
assert(HalfVT.getSizeInBits() == VT.getSizeInBits());
|
||||||
|
return DAG.getNode(ISD::BITCAST, DL, VT, HalfVec);
|
||||||
|
}
|
||||||
return SDValue();
|
return SDValue();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -13,3 +13,18 @@ define <8 x i16> @trunc_32_16(<8 x i32> %A) nounwind uwtable readnone ssp{
|
||||||
ret <8 x i16>%B
|
ret <8 x i16>%B
|
||||||
}
|
}
|
||||||
|
|
||||||
|
define <8 x i16> @trunc_after_setcc(<8 x float> %a, <8 x float> %b, <8 x float> %c, <8 x float> %d) {
|
||||||
|
; CHECK: trunc_after_setcc
|
||||||
|
; CHECK: vcmpltps
|
||||||
|
; CHECK-NOT: vextract
|
||||||
|
; CHECK: vcmpltps
|
||||||
|
; CHECK-NEXT: vandps
|
||||||
|
; CHECK-NEXT: vandps
|
||||||
|
; CHECK: ret
|
||||||
|
%res1 = fcmp olt <8 x float> %a, %b
|
||||||
|
%res2 = fcmp olt <8 x float> %c, %d
|
||||||
|
%andr = and <8 x i1>%res1, %res2
|
||||||
|
%ex = zext <8 x i1> %andr to <8 x i16>
|
||||||
|
ret <8 x i16>%ex
|
||||||
|
}
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue