forked from OSchip/llvm-project
[X86] Remove isel checks for immediate size on floating point compare and xop compare instructions. NFCI
If these checks fail we end up not selecting an instruction at all. So we are already relying on the immediate being checked upstream of isel. So doing the check in isel is just bloat to the isel table. Interestingly, we didn't check on the AVX512 version of the instructions anyway. llvm-svn: 313724
This commit is contained in:
parent
2e3bf37ec4
commit
5c7cd25f82
|
@ -590,19 +590,11 @@ def SSECC : Operand<i8> {
|
|||
let OperandType = "OPERAND_IMMEDIATE";
|
||||
}
|
||||
|
||||
def i8immZExt3 : ImmLeaf<i8, [{
|
||||
return Imm >= 0 && Imm < 8;
|
||||
}]>;
|
||||
|
||||
def AVXCC : Operand<i8> {
|
||||
let PrintMethod = "printSSEAVXCC";
|
||||
let OperandType = "OPERAND_IMMEDIATE";
|
||||
}
|
||||
|
||||
def i8immZExt5 : ImmLeaf<i8, [{
|
||||
return Imm >= 0 && Imm < 32;
|
||||
}]>;
|
||||
|
||||
def AVX512ICC : Operand<i8> {
|
||||
let PrintMethod = "printSSEAVXCC";
|
||||
let OperandType = "OPERAND_IMMEDIATE";
|
||||
|
|
|
@ -2071,16 +2071,16 @@ let Predicates = [UseSSE2] in {
|
|||
multiclass sse12_cmp_scalar<RegisterClass RC, X86MemOperand x86memop,
|
||||
Operand CC, SDNode OpNode, ValueType VT,
|
||||
PatFrag ld_frag, string asm, string asm_alt,
|
||||
OpndItins itins, ImmLeaf immLeaf> {
|
||||
OpndItins itins> {
|
||||
let isCommutable = 1 in
|
||||
def rr : SIi8<0xC2, MRMSrcReg,
|
||||
(outs RC:$dst), (ins RC:$src1, RC:$src2, CC:$cc), asm,
|
||||
[(set RC:$dst, (OpNode (VT RC:$src1), RC:$src2, immLeaf:$cc))],
|
||||
[(set RC:$dst, (OpNode (VT RC:$src1), RC:$src2, imm:$cc))],
|
||||
itins.rr>, Sched<[itins.Sched]>;
|
||||
def rm : SIi8<0xC2, MRMSrcMem,
|
||||
(outs RC:$dst), (ins RC:$src1, x86memop:$src2, CC:$cc), asm,
|
||||
[(set RC:$dst, (OpNode (VT RC:$src1),
|
||||
(ld_frag addr:$src2), immLeaf:$cc))],
|
||||
(ld_frag addr:$src2), imm:$cc))],
|
||||
itins.rm>,
|
||||
Sched<[itins.Sched.Folded, ReadAfterLd]>;
|
||||
|
||||
|
@ -2101,41 +2101,41 @@ let ExeDomain = SSEPackedSingle in
|
|||
defm VCMPSS : sse12_cmp_scalar<FR32, f32mem, AVXCC, X86cmps, f32, loadf32,
|
||||
"cmp${cc}ss\t{$src2, $src1, $dst|$dst, $src1, $src2}",
|
||||
"cmpss\t{$cc, $src2, $src1, $dst|$dst, $src1, $src2, $cc}",
|
||||
SSE_ALU_F32S, i8immZExt5>, XS, VEX_4V, VEX_LIG, VEX_WIG;
|
||||
SSE_ALU_F32S>, XS, VEX_4V, VEX_LIG, VEX_WIG;
|
||||
let ExeDomain = SSEPackedDouble in
|
||||
defm VCMPSD : sse12_cmp_scalar<FR64, f64mem, AVXCC, X86cmps, f64, loadf64,
|
||||
"cmp${cc}sd\t{$src2, $src1, $dst|$dst, $src1, $src2}",
|
||||
"cmpsd\t{$cc, $src2, $src1, $dst|$dst, $src1, $src2, $cc}",
|
||||
SSE_ALU_F32S, i8immZExt5>, // same latency as 32 bit compare
|
||||
SSE_ALU_F32S>, // same latency as 32 bit compare
|
||||
XD, VEX_4V, VEX_LIG, VEX_WIG;
|
||||
|
||||
let Constraints = "$src1 = $dst" in {
|
||||
let ExeDomain = SSEPackedSingle in
|
||||
defm CMPSS : sse12_cmp_scalar<FR32, f32mem, SSECC, X86cmps, f32, loadf32,
|
||||
"cmp${cc}ss\t{$src2, $dst|$dst, $src2}",
|
||||
"cmpss\t{$cc, $src2, $dst|$dst, $src2, $cc}", SSE_ALU_F32S,
|
||||
i8immZExt3>, XS;
|
||||
"cmpss\t{$cc, $src2, $dst|$dst, $src2, $cc}", SSE_ALU_F32S>,
|
||||
XS;
|
||||
let ExeDomain = SSEPackedDouble in
|
||||
defm CMPSD : sse12_cmp_scalar<FR64, f64mem, SSECC, X86cmps, f64, loadf64,
|
||||
"cmp${cc}sd\t{$src2, $dst|$dst, $src2}",
|
||||
"cmpsd\t{$cc, $src2, $dst|$dst, $src2, $cc}",
|
||||
SSE_ALU_F64S, i8immZExt3>, XD;
|
||||
SSE_ALU_F64S>, XD;
|
||||
}
|
||||
|
||||
multiclass sse12_cmp_scalar_int<Operand memop, Operand CC,
|
||||
Intrinsic Int, string asm, OpndItins itins,
|
||||
ImmLeaf immLeaf, ComplexPattern mem_cpat> {
|
||||
ComplexPattern mem_cpat> {
|
||||
def rr : SIi8<0xC2, MRMSrcReg, (outs VR128:$dst),
|
||||
(ins VR128:$src1, VR128:$src, CC:$cc), asm,
|
||||
[(set VR128:$dst, (Int VR128:$src1,
|
||||
VR128:$src, immLeaf:$cc))],
|
||||
VR128:$src, imm:$cc))],
|
||||
itins.rr>,
|
||||
Sched<[itins.Sched]>;
|
||||
let mayLoad = 1 in
|
||||
def rm : SIi8<0xC2, MRMSrcMem, (outs VR128:$dst),
|
||||
(ins VR128:$src1, memop:$src, CC:$cc), asm,
|
||||
[(set VR128:$dst, (Int VR128:$src1,
|
||||
mem_cpat:$src, immLeaf:$cc))],
|
||||
mem_cpat:$src, imm:$cc))],
|
||||
itins.rm>,
|
||||
Sched<[itins.Sched.Folded, ReadAfterLd]>;
|
||||
}
|
||||
|
@ -2145,23 +2145,21 @@ let isCodeGenOnly = 1 in {
|
|||
let ExeDomain = SSEPackedSingle in
|
||||
defm Int_VCMPSS : sse12_cmp_scalar_int<ssmem, AVXCC, int_x86_sse_cmp_ss,
|
||||
"cmp${cc}ss\t{$src, $src1, $dst|$dst, $src1, $src}",
|
||||
SSE_ALU_F32S, i8immZExt5, sse_load_f32>,
|
||||
XS, VEX_4V;
|
||||
SSE_ALU_F32S, sse_load_f32>, XS, VEX_4V;
|
||||
let ExeDomain = SSEPackedDouble in
|
||||
defm Int_VCMPSD : sse12_cmp_scalar_int<sdmem, AVXCC, int_x86_sse2_cmp_sd,
|
||||
"cmp${cc}sd\t{$src, $src1, $dst|$dst, $src1, $src}",
|
||||
SSE_ALU_F32S, i8immZExt5, sse_load_f64>, // same latency as f32
|
||||
SSE_ALU_F32S, sse_load_f64>, // same latency as f32
|
||||
XD, VEX_4V;
|
||||
let Constraints = "$src1 = $dst" in {
|
||||
let ExeDomain = SSEPackedSingle in
|
||||
defm Int_CMPSS : sse12_cmp_scalar_int<ssmem, SSECC, int_x86_sse_cmp_ss,
|
||||
"cmp${cc}ss\t{$src, $dst|$dst, $src}",
|
||||
SSE_ALU_F32S, i8immZExt3, sse_load_f32>, XS;
|
||||
SSE_ALU_F32S, sse_load_f32>, XS;
|
||||
let ExeDomain = SSEPackedDouble in
|
||||
defm Int_CMPSD : sse12_cmp_scalar_int<sdmem, SSECC, int_x86_sse2_cmp_sd,
|
||||
"cmp${cc}sd\t{$src, $dst|$dst, $src}",
|
||||
SSE_ALU_F64S, i8immZExt3, sse_load_f64>,
|
||||
XD;
|
||||
SSE_ALU_F64S, sse_load_f64>, XD;
|
||||
}
|
||||
}
|
||||
|
||||
|
@ -2255,18 +2253,18 @@ let Defs = [EFLAGS] in {
|
|||
// sse12_cmp_packed - sse 1 & 2 compare packed instructions
|
||||
multiclass sse12_cmp_packed<RegisterClass RC, X86MemOperand x86memop,
|
||||
Operand CC, ValueType VT, string asm,
|
||||
string asm_alt, Domain d, ImmLeaf immLeaf,
|
||||
string asm_alt, Domain d,
|
||||
PatFrag ld_frag, OpndItins itins = SSE_ALU_F32P> {
|
||||
let isCommutable = 1 in
|
||||
def rri : PIi8<0xC2, MRMSrcReg,
|
||||
(outs RC:$dst), (ins RC:$src1, RC:$src2, CC:$cc), asm,
|
||||
[(set RC:$dst, (VT (X86cmpp RC:$src1, RC:$src2, immLeaf:$cc)))],
|
||||
[(set RC:$dst, (VT (X86cmpp RC:$src1, RC:$src2, imm:$cc)))],
|
||||
itins.rr, d>,
|
||||
Sched<[WriteFAdd]>;
|
||||
def rmi : PIi8<0xC2, MRMSrcMem,
|
||||
(outs RC:$dst), (ins RC:$src1, x86memop:$src2, CC:$cc), asm,
|
||||
[(set RC:$dst,
|
||||
(VT (X86cmpp RC:$src1, (ld_frag addr:$src2), immLeaf:$cc)))],
|
||||
(VT (X86cmpp RC:$src1, (ld_frag addr:$src2), imm:$cc)))],
|
||||
itins.rm, d>,
|
||||
Sched<[WriteFAddLd, ReadAfterLd]>;
|
||||
|
||||
|
@ -2286,28 +2284,28 @@ multiclass sse12_cmp_packed<RegisterClass RC, X86MemOperand x86memop,
|
|||
defm VCMPPS : sse12_cmp_packed<VR128, f128mem, AVXCC, v4f32,
|
||||
"cmp${cc}ps\t{$src2, $src1, $dst|$dst, $src1, $src2}",
|
||||
"cmpps\t{$cc, $src2, $src1, $dst|$dst, $src1, $src2, $cc}",
|
||||
SSEPackedSingle, i8immZExt5, loadv4f32>, PS, VEX_4V, VEX_WIG;
|
||||
SSEPackedSingle, loadv4f32>, PS, VEX_4V, VEX_WIG;
|
||||
defm VCMPPD : sse12_cmp_packed<VR128, f128mem, AVXCC, v2f64,
|
||||
"cmp${cc}pd\t{$src2, $src1, $dst|$dst, $src1, $src2}",
|
||||
"cmppd\t{$cc, $src2, $src1, $dst|$dst, $src1, $src2, $cc}",
|
||||
SSEPackedDouble, i8immZExt5, loadv2f64>, PD, VEX_4V, VEX_WIG;
|
||||
SSEPackedDouble, loadv2f64>, PD, VEX_4V, VEX_WIG;
|
||||
defm VCMPPSY : sse12_cmp_packed<VR256, f256mem, AVXCC, v8f32,
|
||||
"cmp${cc}ps\t{$src2, $src1, $dst|$dst, $src1, $src2}",
|
||||
"cmpps\t{$cc, $src2, $src1, $dst|$dst, $src1, $src2, $cc}",
|
||||
SSEPackedSingle, i8immZExt5, loadv8f32>, PS, VEX_4V, VEX_L;
|
||||
SSEPackedSingle, loadv8f32>, PS, VEX_4V, VEX_L;
|
||||
defm VCMPPDY : sse12_cmp_packed<VR256, f256mem, AVXCC, v4f64,
|
||||
"cmp${cc}pd\t{$src2, $src1, $dst|$dst, $src1, $src2}",
|
||||
"cmppd\t{$cc, $src2, $src1, $dst|$dst, $src1, $src2, $cc}",
|
||||
SSEPackedDouble, i8immZExt5, loadv4f64>, PD, VEX_4V, VEX_L;
|
||||
SSEPackedDouble, loadv4f64>, PD, VEX_4V, VEX_L;
|
||||
let Constraints = "$src1 = $dst" in {
|
||||
defm CMPPS : sse12_cmp_packed<VR128, f128mem, SSECC, v4f32,
|
||||
"cmp${cc}ps\t{$src2, $dst|$dst, $src2}",
|
||||
"cmpps\t{$cc, $src2, $dst|$dst, $src2, $cc}",
|
||||
SSEPackedSingle, i8immZExt5, memopv4f32, SSE_ALU_F32P>, PS;
|
||||
SSEPackedSingle, memopv4f32, SSE_ALU_F32P>, PS;
|
||||
defm CMPPD : sse12_cmp_packed<VR128, f128mem, SSECC, v2f64,
|
||||
"cmp${cc}pd\t{$src2, $dst|$dst, $src2}",
|
||||
"cmppd\t{$cc, $src2, $dst|$dst, $src2, $cc}",
|
||||
SSEPackedDouble, i8immZExt5, memopv2f64, SSE_ALU_F64P>, PD;
|
||||
SSEPackedDouble, memopv2f64, SSE_ALU_F64P>, PD;
|
||||
}
|
||||
|
||||
//===----------------------------------------------------------------------===//
|
||||
|
|
|
@ -213,7 +213,7 @@ multiclass xopvpcom<bits<8> opc, string Suffix, SDNode OpNode, ValueType vt128>
|
|||
"\t{$src2, $src1, $dst|$dst, $src1, $src2}"),
|
||||
[(set VR128:$dst,
|
||||
(vt128 (OpNode (vt128 VR128:$src1), (vt128 VR128:$src2),
|
||||
i8immZExt3:$cc)))]>,
|
||||
imm:$cc)))]>,
|
||||
XOP_4V;
|
||||
def mi : IXOPi8<opc, MRMSrcMem, (outs VR128:$dst),
|
||||
(ins VR128:$src1, i128mem:$src2, XOPCC:$cc),
|
||||
|
@ -222,7 +222,7 @@ multiclass xopvpcom<bits<8> opc, string Suffix, SDNode OpNode, ValueType vt128>
|
|||
[(set VR128:$dst,
|
||||
(vt128 (OpNode (vt128 VR128:$src1),
|
||||
(vt128 (bitconvert (loadv2i64 addr:$src2))),
|
||||
i8immZExt3:$cc)))]>,
|
||||
imm:$cc)))]>,
|
||||
XOP_4V;
|
||||
let isAsmParserOnly = 1, hasSideEffects = 0 in {
|
||||
def ri_alt : IXOPi8<opc, MRMSrcReg, (outs VR128:$dst),
|
||||
|
|
Loading…
Reference in New Issue