[X86][Btver2] Modelled float bitwise instructions as being performed on the float cluster (FPA/FPM) not the integer.

llvm-svn: 327793
This commit is contained in:
Simon Pilgrim 2018-03-18 12:37:35 +00:00
parent 163326d10c
commit e16790b133
4 changed files with 65 additions and 51 deletions

View File

@ -468,25 +468,39 @@ def : InstRW<[JWriteCVTPH2PSYLd], (instrs VCVTPH2PSYrm)>;
// AVX instructions.
////////////////////////////////////////////////////////////////////////////////
def JWriteLogicY: SchedWriteRes<[JFPU01]> {
let Latency = 1;
def JWriteFLogic: SchedWriteRes<[JFPU01, JFPX]> {
}
def : InstRW<[JWriteFLogic], (instrs ORPDrr, ORPSrr, VORPDrr, VORPSrr,
XORPDrr, XORPSrr, VXORPDrr, VXORPSrr,
ANDPDrr, ANDPSrr, VANDPDrr, VANDPSrr,
ANDNPDrr, ANDNPSrr, VANDNPDrr, VANDNPSrr)>;
def JWriteFLogicLd: SchedWriteRes<[JLAGU, JFPU01, JFPX]> {
let Latency = 6;
}
def : InstRW<[JWriteFLogicLd], (instrs ORPDrm, ORPSrm, VORPDrm, VORPSrm,
XORPDrm, XORPSrm, VXORPDrm, VXORPSrm,
ANDPDrm, ANDPSrm, VANDPDrm, VANDPSrm,
ANDNPDrm, ANDNPSrm, VANDNPDrm, VANDNPSrm)>;
def JWriteFLogicY: SchedWriteRes<[JFPU01]> {
let ResourceCycles = [2];
let NumMicroOps = 2;
}
def : InstRW<[JWriteLogicY], (instrs VORPDYrr, VORPSYrr,
VXORPDYrr, VXORPSYrr,
VANDPDYrr, VANDPSYrr,
VANDNPDYrr, VANDNPSYrr)>;
def : InstRW<[JWriteFLogicY], (instrs VORPDYrr, VORPSYrr,
VXORPDYrr, VXORPSYrr,
VANDPDYrr, VANDPSYrr,
VANDNPDYrr, VANDNPSYrr)>;
def JWriteLogicYLd: SchedWriteRes<[JLAGU, JFPU01]> {
def JWriteFLogicYLd: SchedWriteRes<[JLAGU, JFPU01]> {
let Latency = 6;
let ResourceCycles = [1, 2];
let NumMicroOps = 3;
}
def : InstRW<[JWriteLogicYLd], (instrs VORPDYrm, VORPSYrm,
VXORPDYrm, VXORPSYrm,
VANDPDYrm, VANDPSYrm,
VANDNPDYrm, VANDNPSYrm)>;
def : InstRW<[JWriteFLogicYLd], (instrs VORPDYrm, VORPSYrm,
VXORPDYrm, VXORPSYrm,
VANDPDYrm, VANDPSYrm,
VANDNPDYrm, VANDNPSYrm)>;
def JWriteVDPPSY: SchedWriteRes<[JFPU1, JFPU0]> {
let Latency = 12;

View File

@ -1053,25 +1053,25 @@ vzeroupper
# CHECK-NEXT: - - - - - 1.00 - 1.00 - - - - - 1.00 vaesimc (%rax), %xmm2
# CHECK-NEXT: - - - - - 1.00 - - - - - - - 1.00 vaeskeygenassist $22, %xmm0, %xmm2
# CHECK-NEXT: - - - - - 1.00 - 1.00 - - - - - 1.00 vaeskeygenassist $22, (%rax), %xmm2
# CHECK-NEXT: - - - - - - 1.00 - - - - - 1.00 - vandnpd %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - - - 1.00 1.00 - - - 1.00 - - vandnpd (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 - - - - - - - vandnpd %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 1.00 - - - - - - vandnpd (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - - - 2.00 - - - - - - - vandnpd %ymm0, %ymm1, %ymm2
# CHECK-NEXT: - - - - - - 2.00 1.00 - - - - - - vandnpd (%rax), %ymm1, %ymm2
# CHECK-NEXT: - - - - - - 1.00 - - - - - 1.00 - vandnps %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - - - 1.00 1.00 - - - 1.00 - - vandnps (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 - - - - - - - vandnps %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 1.00 - - - - - - vandnps (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - - - 2.00 - - - - - - - vandnps %ymm0, %ymm1, %ymm2
# CHECK-NEXT: - - - - - - 2.00 1.00 - - - - - - vandnps (%rax), %ymm1, %ymm2
# CHECK-NEXT: - - - - - - 1.00 - - - - - 1.00 - vandpd %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - - - 1.00 1.00 - - - - 1.00 - vandpd (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - 1.00 - - 1.00 - - - - - - - vandpd %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - 1.00 - - 1.00 1.00 - - - - - - vandpd (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - - - 2.00 - - - - - - - vandpd %ymm0, %ymm1, %ymm2
# CHECK-NEXT: - - - - - - 2.00 1.00 - - - - - - vandpd (%rax), %ymm1, %ymm2
# CHECK-NEXT: - - - - - - 1.00 - - - - 1.00 - - vandps %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - - 1.00 - 1.00 - - - 1.00 - - vandps (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 - - - - - - - vandps %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - 1.00 1.00 - 1.00 - - - - - - vandps (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - - - 2.00 - - - - - - - vandps %ymm0, %ymm1, %ymm2
# CHECK-NEXT: - - - - - - 2.00 1.00 - - - - - - vandps (%rax), %ymm1, %ymm2
# CHECK-NEXT: - - - - 1.00 - 1.00 - - - - - - - vblendpd $11, %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - 1.00 1.00 - 1.00 - - - - - - vblendpd $11, (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - 1.00 1.00 - - - - - - - - vblendpd $11, %ymm0, %ymm1, %ymm2
# CHECK-NEXT: - - - 1.00 - 1.00 - - - - - - - - vblendpd $11, %ymm0, %ymm1, %ymm2
# CHECK-NEXT: - - - 1.00 - - 1.00 1.00 - - - - - - vblendpd $11, (%rax), %ymm1, %ymm2
# CHECK-NEXT: - - - 1.00 - 1.00 - - - - - - - - vblendps $11, %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - 1.00 - - 1.00 1.00 - - - - - - vblendps $11, (%rax), %xmm1, %xmm2
@ -1338,12 +1338,12 @@ vzeroupper
# CHECK-NEXT: - - - - - - 2.00 1.00 - - - - - - vmulsd (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 - - - - - - - vmulss %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 1.00 - - - - - - vmulss (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - - 1.00 - - - - - 1.00 - - vorpd %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - - 1.00 - 1.00 - - - - 1.00 - vorpd (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - 1.00 1.00 - - - - - - - - vorpd %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - 1.00 - 1.00 - 1.00 - - - - - - vorpd (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - - 2.00 - - - - - - - - vorpd %ymm0, %ymm1, %ymm2
# CHECK-NEXT: - - - - - 2.00 - 1.00 - - - - - - vorpd (%rax), %ymm1, %ymm2
# CHECK-NEXT: - - - - - 1.00 - - - - - 1.00 - - vorps %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - - 1.00 - 1.00 - - - - 1.00 - vorps (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - 1.00 - 1.00 - - - - - - - - vorps %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - 1.00 - 1.00 - 1.00 - - - - - - vorps (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - - 2.00 - - - - - - - - vorps %ymm0, %ymm1, %ymm2
# CHECK-NEXT: - - - - - 2.00 - 1.00 - - - - - - vorps (%rax), %ymm1, %ymm2
# CHECK-NEXT: - - - - - 1.00 - - - - - 1.00 - - vpabsb %xmm0, %xmm2
@ -1681,7 +1681,7 @@ vzeroupper
# CHECK-NEXT: - - - - 1.00 - 1.00 - - - - - - - vunpckhps %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - 1.00 1.00 - 1.00 - - - - - - vunpckhps (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - 1.00 - - 1.00 - - - - - - - vunpckhps %ymm0, %ymm1, %ymm2
# CHECK-NEXT: - - - - 1.00 - 1.00 1.00 - - - - - - vunpckhps (%rax), %ymm1, %ymm2
# CHECK-NEXT: - - - 1.00 - - 1.00 1.00 - - - - - - vunpckhps (%rax), %ymm1, %ymm2
# CHECK-NEXT: - - - - 1.00 - 1.00 - - - - - - - vunpcklpd %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - 1.00 - - 1.00 1.00 - - - - - - vunpcklpd (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 - - - - - - - vunpcklpd %ymm0, %ymm1, %ymm2
@ -1690,12 +1690,12 @@ vzeroupper
# CHECK-NEXT: - - - 1.00 - 1.00 - 1.00 - - - - - - vunpcklps (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 - - - - - - - vunpcklps %ymm0, %ymm1, %ymm2
# CHECK-NEXT: - - - - 1.00 - 1.00 1.00 - - - - - - vunpcklps (%rax), %ymm1, %ymm2
# CHECK-NEXT: - - - - - - 1.00 - - - - - 1.00 - vxorpd %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - - 1.00 - 1.00 - - - - 1.00 - vxorpd (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 - - - - - - - vxorpd %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - 1.00 - 1.00 - 1.00 - - - - - - vxorpd (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - - - 2.00 - - - - - - - vxorpd %ymm0, %ymm1, %ymm2
# CHECK-NEXT: - - - - - - 2.00 1.00 - - - - - - vxorpd (%rax), %ymm1, %ymm2
# CHECK-NEXT: - - - - - 1.00 - - - - - 1.00 - - vxorps %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - - 1.00 - 1.00 - - - 1.00 - - vxorps (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - 1.00 1.00 - - - - - - - - vxorps %xmm0, %xmm1, %xmm2
# CHECK-NEXT: - - - - 1.00 1.00 - 1.00 - - - - - - vxorps (%rax), %xmm1, %xmm2
# CHECK-NEXT: - - - - - 2.00 - - - - - - - - vxorps %ymm0, %ymm1, %ymm2
# CHECK-NEXT: - - - - - - 2.00 1.00 - - - - - - vxorps (%rax), %ymm1, %ymm2
# CHECK-NEXT: - - - - - - - - - - - - - - vzeroall

View File

@ -156,10 +156,10 @@ xorps (%rax), %xmm2
# CHECK-NEXT: - - - 1.00 - 1.00 - 1.00 - - - - - - addps (%rax), %xmm2
# CHECK-NEXT: - - - 1.00 - 1.00 - - - - - - - - addss %xmm0, %xmm2
# CHECK-NEXT: - - - 1.00 - 1.00 - 1.00 - - - - - - addss (%rax), %xmm2
# CHECK-NEXT: - - - - - 0.01 0.99 - - - - 0.50 0.50 - andnps %xmm0, %xmm2
# CHECK-NEXT: - - - - - 0.01 0.99 1.00 - - - 0.50 0.50 - andnps (%rax), %xmm2
# CHECK-NEXT: - - - - - 0.01 0.99 - - - - 0.50 0.50 - andps %xmm0, %xmm2
# CHECK-NEXT: - - - - - 0.99 0.01 1.00 - - - 0.50 0.50 - andps (%rax), %xmm2
# CHECK-NEXT: - - - 1.00 - 0.01 0.99 - - - - - - - andnps %xmm0, %xmm2
# CHECK-NEXT: - - - 1.00 - 0.01 0.99 1.00 - - - - - - andnps (%rax), %xmm2
# CHECK-NEXT: - - - 1.00 - 0.01 0.99 - - - - - - - andps %xmm0, %xmm2
# CHECK-NEXT: - - - 1.00 - 0.99 0.01 1.00 - - - - - - andps (%rax), %xmm2
# CHECK-NEXT: - - - - - 1.00 - - - - - - - - cmpps $0, %xmm0, %xmm2
# CHECK-NEXT: - - - - - 1.00 - 1.00 - - - - - - cmpps $0, (%rax), %xmm2
# CHECK-NEXT: - - - - - 1.00 - - - - - - - - cmpss $0, %xmm0, %xmm2
@ -195,9 +195,9 @@ xorps (%rax), %xmm2
# CHECK-NEXT: - - - - - - - - - 1.00 - - - - movaps %xmm0, (%rax)
# CHECK-NEXT: - - - - - - - 1.00 - - - - - - movaps (%rax), %xmm2
# CHECK-NEXT: - - - 1.00 - 0.01 0.99 - - - - - - - movhlps %xmm0, %xmm2
# CHECK-NEXT: - - - 0.01 0.99 - 1.00 - - - - - - - movlhps %xmm0, %xmm2
# CHECK-NEXT: - - - 1.00 - - 1.00 - - - - - - - movlhps %xmm0, %xmm2
# CHECK-NEXT: - - - - - - - - - 1.00 - - - - movhps %xmm0, (%rax)
# CHECK-NEXT: - - - 0.99 0.01 0.99 0.01 1.00 - - - - - - movhps (%rax), %xmm2
# CHECK-NEXT: - - - - 1.00 0.99 0.01 1.00 - - - - - - movhps (%rax), %xmm2
# CHECK-NEXT: - - - - - - - - - 1.00 - - - - movlps %xmm0, (%rax)
# CHECK-NEXT: - - - 1.00 - 1.00 - 1.00 - - - - - - movlps (%rax), %xmm2
# CHECK-NEXT: - - - - - - 1.00 - - - - 0.50 0.50 - movmskps %xmm0, %ecx
@ -212,10 +212,10 @@ xorps (%rax), %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 1.00 - - - - - - mulps (%rax), %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 - - - - - - - mulss %xmm0, %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 1.00 - - - - - - mulss (%rax), %xmm2
# CHECK-NEXT: - - - - - 0.99 0.01 - - - - 0.50 0.50 - orps %xmm0, %xmm2
# CHECK-NEXT: - - - - - 0.01 0.99 1.00 - - - 0.50 0.50 - orps (%rax), %xmm2
# CHECK-NEXT: - - - - - 1.00 - - - - - 0.50 0.50 - pinsrw $1, %eax, %xmm1
# CHECK-NEXT: - - - - - 0.01 0.99 1.00 - - - 0.50 0.50 - pinsrw $1, (%rax), %xmm1
# CHECK-NEXT: - - - 1.00 - - 1.00 - - - - - - - orps %xmm0, %xmm2
# CHECK-NEXT: - - - 1.00 - 1.00 - 1.00 - - - - - - orps (%rax), %xmm2
# CHECK-NEXT: - - - - - 0.01 0.99 - - - - 0.50 0.50 - pinsrw $1, %eax, %xmm1
# CHECK-NEXT: - - - - - 1.00 - 1.00 - - - 0.50 0.50 - pinsrw $1, (%rax), %xmm1
# CHECK-NEXT: - - - - 1.00 - 1.00 - - - - - - - rcpps %xmm0, %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 1.00 - - - - - - rcpps (%rax), %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 - - - - - - - rcpss %xmm0, %xmm2
@ -224,8 +224,8 @@ xorps (%rax), %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 1.00 - - - - - - rsqrtps (%rax), %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 - - - - - - - rsqrtss %xmm0, %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 1.00 - - - - - - rsqrtss (%rax), %xmm2
# CHECK-NEXT: - - - 1.00 - 0.99 0.01 - - - - - - - shufps $1, %xmm0, %xmm2
# CHECK-NEXT: - - - 1.00 - 0.01 0.99 1.00 - - - - - - shufps $1, (%rax), %xmm2
# CHECK-NEXT: - - - 1.00 - - 1.00 - - - - - - - shufps $1, %xmm0, %xmm2
# CHECK-NEXT: - - - 1.00 - 1.00 - 1.00 - - - - - - shufps $1, (%rax), %xmm2
# CHECK-NEXT: - - - - 21.00 - 1.00 - - - - - - - sqrtps %xmm0, %xmm2
# CHECK-NEXT: - - - - 21.00 - 1.00 1.00 - - - - - - sqrtps (%rax), %xmm2
# CHECK-NEXT: - - - - 21.00 - 1.00 - - - - - - - sqrtss %xmm0, %xmm2
@ -241,5 +241,5 @@ xorps (%rax), %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 1.00 - - - - - - unpckhps (%rax), %xmm2
# CHECK-NEXT: - - - 0.01 0.99 1.00 - - - - - - - - unpcklps %xmm0, %xmm2
# CHECK-NEXT: - - - - 1.00 0.99 0.01 1.00 - - - - - - unpcklps (%rax), %xmm2
# CHECK-NEXT: - - - - - 1.00 - - - - - 0.50 0.50 - xorps %xmm0, %xmm2
# CHECK-NEXT: - - - - - 0.99 0.01 1.00 - - - 0.50 0.50 - xorps (%rax), %xmm2
# CHECK-NEXT: - - - 1.00 - 1.00 - - - - - - - - xorps %xmm0, %xmm2
# CHECK-NEXT: - - - 0.99 0.01 0.99 0.01 1.00 - - - - - - xorps (%rax), %xmm2

View File

@ -399,10 +399,10 @@ xorpd (%rax), %xmm2
# CHECK-NEXT: - - - 1.00 - 1.00 - 1.00 - - - - - - addsd (%rax), %xmm2
# CHECK-NEXT: - - - 1.00 - 1.00 - - - - - - - - addsubpd %xmm0, %xmm2
# CHECK-NEXT: - - - 1.00 - 1.00 - 1.00 - - - - - - addsubpd (%rax), %xmm2
# CHECK-NEXT: - - - - - 1.00 - - - - - - 1.00 - andnpd %xmm0, %xmm2
# CHECK-NEXT: - - - - - 0.01 0.99 1.00 - - - 1.00 - - andnpd (%rax), %xmm2
# CHECK-NEXT: - - - - - 0.01 0.99 - - - - - 1.00 - andpd %xmm0, %xmm2
# CHECK-NEXT: - - - - - 1.00 - 1.00 - - - 1.00 - - andpd (%rax), %xmm2
# CHECK-NEXT: - - - 0.99 0.01 1.00 - - - - - - - - andnpd %xmm0, %xmm2
# CHECK-NEXT: - - - 0.99 0.01 0.01 0.99 1.00 - - - - - - andnpd (%rax), %xmm2
# CHECK-NEXT: - - - 1.00 - 0.01 0.99 - - - - - - - andpd %xmm0, %xmm2
# CHECK-NEXT: - - - 0.99 0.01 1.00 - 1.00 - - - - - - andpd (%rax), %xmm2
# CHECK-NEXT: - - - - - 1.00 - - - - - - - - cmppd $0, %xmm0, %xmm2
# CHECK-NEXT: - - - - - 1.00 - 1.00 - - - - - - cmppd $0, (%rax), %xmm2
# CHECK-NEXT: - - - - - 1.00 - - - - - - - - cmpsd $0, %xmm0, %xmm2
@ -489,8 +489,8 @@ xorpd (%rax), %xmm2
# CHECK-NEXT: - - - - - - 2.00 1.00 - - - - - - mulpd (%rax), %xmm2
# CHECK-NEXT: - - - - - - 2.00 - - - - - - - mulsd %xmm0, %xmm2
# CHECK-NEXT: - - - - - - 2.00 1.00 - - - - - - mulsd (%rax), %xmm2
# CHECK-NEXT: - - - - - 1.00 - - - - - - 1.00 - orpd %xmm0, %xmm2
# CHECK-NEXT: - - - - - - 1.00 1.00 - - - 1.00 - - orpd (%rax), %xmm2
# CHECK-NEXT: - - - 1.00 - 1.00 - - - - - - - - orpd %xmm0, %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 1.00 - - - - - - orpd (%rax), %xmm2
# CHECK-NEXT: - - - - - - 1.00 - - - - - 1.00 - pabsb %xmm0, %xmm2
# CHECK-NEXT: - - - - - 1.00 - 1.00 - - - - 1.00 - pabsb (%rax), %xmm2
# CHECK-NEXT: - - - - - 1.00 - - - - - 1.00 - - pabsd %xmm0, %xmm2
@ -645,5 +645,5 @@ xorpd (%rax), %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 1.00 - - - - - - unpckhpd (%rax), %xmm2
# CHECK-NEXT: - - - 1.00 - 1.00 - - - - - - - - unpcklpd %xmm0, %xmm2
# CHECK-NEXT: - - - - 1.00 - 1.00 1.00 - - - - - - unpcklpd (%rax), %xmm2
# CHECK-NEXT: - - - - - 1.00 - - - - - - 1.00 - xorpd %xmm0, %xmm2
# CHECK-NEXT: - - - - - 0.99 0.01 1.00 - - - 1.00 - - xorpd (%rax), %xmm2
# CHECK-NEXT: - - - 0.01 0.99 1.00 - - - - - - - - xorpd %xmm0, %xmm2
# CHECK-NEXT: - - - - 1.00 0.99 0.01 1.00 - - - - - - xorpd (%rax), %xmm2