forked from OSchip/llvm-project
[X86] AMD Zen 3 Scheduler Model
Introduce a basic scheduling model for AMD Zen 3 CPUs, a.k.a. `znver3`. This is fully built from scratch, from llvm-mca measurements and documented reference materials. Nothing was copied from `znver2`/`znver1`. I believe this is in a reasonable state of completion for inclusion, probably better than D52779 `bdver2` was :) Namely: * uops are pretty spot-on (at least what llvm-mca can measure) {F16422596} * latency is also pretty spot-on (at least what llvm-mca can measure) {F16422601} * throughput is within reason {F16422607} I haven't run many benchmarks with this; however, RawSpeed benchmarks say this is beneficial: {F16603978} {F16604029} I'll call out the obvious problems there: * I didn't really bother with X87 instructions * I didn't really bother with obviously-microcoded/system instructions * There is a large discrepancy in throughput for `mr` and `rm` instructions. I'm not really sure if it's a modelling defect that needs to be fixed, or a defect of the measurements. * Pipe distributions are probably bad :) I can't do much here until AMD allows that to be fixed by documenting the appropriate counters and updating libpfm. That being said, as @RKSimon notes: >>! In D94395#2647381, @RKSimon wrote: > I'll mention again that all the znver* models appear to be very inaccurate wrt SIMD/FPU instructions <...> so how much worse could this possibly be?! Things that aren't there: * Various tunings: zero idioms, etc. Those are follow-ups. Differential Revision: https://reviews.llvm.org/D94395
This commit is contained in:
parent
8518742104
commit
2b93c9c16c
|
@ -555,6 +555,7 @@ include "X86SchedBroadwell.td"
|
|||
include "X86ScheduleSLM.td"
|
||||
include "X86ScheduleZnver1.td"
|
||||
include "X86ScheduleZnver2.td"
|
||||
include "X86ScheduleZnver3.td"
|
||||
include "X86ScheduleBdVer2.td"
|
||||
include "X86ScheduleBtVer2.td"
|
||||
include "X86SchedSkylakeClient.td"
|
||||
|
@ -1382,7 +1383,7 @@ def : ProcModel<"znver1", Znver1Model, ProcessorFeatures.ZNFeatures,
|
|||
ProcessorFeatures.ZNTuning>;
|
||||
def : ProcModel<"znver2", Znver2Model, ProcessorFeatures.ZN2Features,
|
||||
ProcessorFeatures.ZN2Tuning>;
|
||||
def : ProcModel<"znver3", Znver2Model, ProcessorFeatures.ZN3Features,
|
||||
def : ProcModel<"znver3", Znver3Model, ProcessorFeatures.ZN3Features,
|
||||
ProcessorFeatures.ZN3Tuning>;
|
||||
|
||||
def : Proc<"geode", [FeatureX87, FeatureCMPXCHG8B, Feature3DNowA],
|
||||
|
|
|
@ -233,3 +233,16 @@ def ZnVer2PfmCounters : ProcPfmCounters {
|
|||
];
|
||||
}
|
||||
def : PfmCountersBinding<"znver2", ZnVer2PfmCounters>;
|
||||
|
||||
def ZnVer3PfmCounters : ProcPfmCounters {
|
||||
let CycleCounter = PfmCounter<"cycles_not_in_halt">;
|
||||
let UopsCounter = PfmCounter<"retired_ops">;
|
||||
let IssueCounters = [
|
||||
PfmIssueCounter<"Zn3Int", "ops_type_dispatched_from_decoder:int_disp_retire_mode">,
|
||||
PfmIssueCounter<"Zn3FPU", "ops_type_dispatched_from_decoder:fp_disp_retire_mode">,
|
||||
PfmIssueCounter<"Zn3Load", "ls_dispatch:ld_dispatch">,
|
||||
PfmIssueCounter<"Zn3Store", "ls_dispatch:store_dispatch">,
|
||||
PfmIssueCounter<"Zn3Divider", "div_op_count">
|
||||
];
|
||||
}
|
||||
def : PfmCountersBinding<"znver3", ZnVer3PfmCounters>;
|
||||
|
|
File diff suppressed because it is too large
Load Diff
|
@ -48,6 +48,7 @@
|
|||
; RUN: llc < %s -mtriple=i386-unknown-unknown -mcpu=bdver4 2>&1 | FileCheck %s --check-prefix=FAST
|
||||
; RUN: llc < %s -mtriple=i386-unknown-unknown -mcpu=znver1 2>&1 | FileCheck %s --check-prefix=FAST
|
||||
; RUN: llc < %s -mtriple=i386-unknown-unknown -mcpu=znver2 2>&1 | FileCheck %s --check-prefix=FAST
|
||||
; RUN: llc < %s -mtriple=i386-unknown-unknown -mcpu=znver3 2>&1 | FileCheck %s --check-prefix=FAST
|
||||
|
||||
; Other chips with slow unaligned memory accesses
|
||||
|
||||
|
|
|
@ -14,6 +14,7 @@
|
|||
; RUN: llc < %s -mtriple=x86_64-- -mcpu=bdver4 | FileCheck %s
|
||||
; RUN: llc < %s -mtriple=x86_64-- -mcpu=znver1 | FileCheck %s
|
||||
; RUN: llc < %s -mtriple=x86_64-- -mcpu=znver2 | FileCheck %s
|
||||
; RUN: llc < %s -mtriple=x86_64-- -mcpu=znver3 | FileCheck %s
|
||||
|
||||
; Verify that for the X86_64 processors that are known to have poor latency
|
||||
; double precision shift instructions we do not generate 'shld' or 'shrd'
|
||||
|
|
|
@ -0,0 +1,48 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -iterations=1 -resource-pressure=false -timeline < %s | FileCheck %s
|
||||
|
||||
imul %rax, %rbx
|
||||
lzcnt %ax, %bx
|
||||
add %ecx, %ebx
|
||||
|
||||
# CHECK: Iterations: 1
|
||||
# CHECK-NEXT: Instructions: 3
|
||||
# CHECK-NEXT: Total Cycles: 8
|
||||
# CHECK-NEXT: Total uOps: 3
|
||||
|
||||
# CHECK: Dispatch Width: 6
|
||||
# CHECK-NEXT: uOps Per Cycle: 0.38
|
||||
# CHECK-NEXT: IPC: 0.38
|
||||
# CHECK-NEXT: Block RThroughput: 1.3
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 3 1.00 imulq %rax, %rbx
|
||||
# CHECK-NEXT: 1 1 1.00 lzcntw %ax, %bx
|
||||
# CHECK-NEXT: 1 1 0.25 addl %ecx, %ebx
|
||||
|
||||
# CHECK: Timeline view:
|
||||
# CHECK-NEXT: Index 01234567
|
||||
|
||||
# CHECK: [0,0] DeeeER . imulq %rax, %rbx
|
||||
# CHECK-NEXT: [0,1] D===eER. lzcntw %ax, %bx
|
||||
# CHECK-NEXT: [0,2] D====eER addl %ecx, %ebx
|
||||
|
||||
# CHECK: Average Wait times (based on the timeline view):
|
||||
# CHECK-NEXT: [0]: Executions
|
||||
# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
|
||||
# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
|
||||
# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
|
||||
|
||||
# CHECK: [0] [1] [2] [3]
|
||||
# CHECK-NEXT: 0. 1 1.0 1.0 0.0 imulq %rax, %rbx
|
||||
# CHECK-NEXT: 1. 1 4.0 0.0 0.0 lzcntw %ax, %bx
|
||||
# CHECK-NEXT: 2. 1 5.0 0.0 0.0 addl %ecx, %ebx
|
||||
# CHECK-NEXT: 1 3.3 0.3 0.0 <total>
|
|
@ -0,0 +1,102 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -iterations=1500 -timeline -timeline-max-iterations=6 < %s | FileCheck %s
|
||||
|
||||
# The ILP is limited by the false dependency on %dx. So, the mov cannot execute
|
||||
# in parallel with the add.
|
||||
|
||||
add %cx, %dx
|
||||
mov %ax, %dx
|
||||
xor %bx, %dx
|
||||
|
||||
# CHECK: Iterations: 1500
|
||||
# CHECK-NEXT: Instructions: 4500
|
||||
# CHECK-NEXT: Total Cycles: 4503
|
||||
# CHECK-NEXT: Total uOps: 4500
|
||||
|
||||
# CHECK: Dispatch Width: 6
|
||||
# CHECK-NEXT: uOps Per Cycle: 1.00
|
||||
# CHECK-NEXT: IPC: 1.00
|
||||
# CHECK-NEXT: Block RThroughput: 1.5
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 1 0.25 addw %cx, %dx
|
||||
# CHECK-NEXT: 1 1 1.00 movw %ax, %dx
|
||||
# CHECK-NEXT: 1 1 0.25 xorw %bx, %dx
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: - - - 1.50 1.50 1.50 1.50 - - - - - - - - - - - - - - - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - addw %cx, %dx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - movw %ax, %dx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - xorw %bx, %dx
|
||||
|
||||
# CHECK: Timeline view:
|
||||
# CHECK-NEXT: 0123456789
|
||||
# CHECK-NEXT: Index 0123456789 0
|
||||
|
||||
# CHECK: [0,0] DeER . . . . addw %cx, %dx
|
||||
# CHECK-NEXT: [0,1] D=eER. . . . movw %ax, %dx
|
||||
# CHECK-NEXT: [0,2] D==eER . . . xorw %bx, %dx
|
||||
# CHECK-NEXT: [1,0] D===eER . . . addw %cx, %dx
|
||||
# CHECK-NEXT: [1,1] D====eER . . . movw %ax, %dx
|
||||
# CHECK-NEXT: [1,2] D=====eER . . . xorw %bx, %dx
|
||||
# CHECK-NEXT: [2,0] .D=====eER. . . addw %cx, %dx
|
||||
# CHECK-NEXT: [2,1] .D======eER . . movw %ax, %dx
|
||||
# CHECK-NEXT: [2,2] .D=======eER . . xorw %bx, %dx
|
||||
# CHECK-NEXT: [3,0] .D========eER . . addw %cx, %dx
|
||||
# CHECK-NEXT: [3,1] .D=========eER . . movw %ax, %dx
|
||||
# CHECK-NEXT: [3,2] .D==========eER. . xorw %bx, %dx
|
||||
# CHECK-NEXT: [4,0] . D==========eER . addw %cx, %dx
|
||||
# CHECK-NEXT: [4,1] . D===========eER . movw %ax, %dx
|
||||
# CHECK-NEXT: [4,2] . D============eER . xorw %bx, %dx
|
||||
# CHECK-NEXT: [5,0] . D=============eER . addw %cx, %dx
|
||||
# CHECK-NEXT: [5,1] . D==============eER. movw %ax, %dx
|
||||
# CHECK-NEXT: [5,2] . D===============eER xorw %bx, %dx
|
||||
|
||||
# CHECK: Average Wait times (based on the timeline view):
|
||||
# CHECK-NEXT: [0]: Executions
|
||||
# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
|
||||
# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
|
||||
# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
|
||||
|
||||
# CHECK: [0] [1] [2] [3]
|
||||
# CHECK-NEXT: 0. 6 7.5 0.2 0.0 addw %cx, %dx
|
||||
# CHECK-NEXT: 1. 6 8.5 0.0 0.0 movw %ax, %dx
|
||||
# CHECK-NEXT: 2. 6 9.5 0.0 0.0 xorw %bx, %dx
|
||||
# CHECK-NEXT: 6 8.5 0.1 0.0 <total>
|
|
@ -0,0 +1,105 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -iterations=1500 -timeline -timeline-max-iterations=7 < %s | FileCheck %s
|
||||
|
||||
# The lzcnt cannot execute in parallel with the imul because there is a false
|
||||
# dependency on %bx.
|
||||
|
||||
imul %ax, %bx
|
||||
lzcnt %ax, %bx
|
||||
add %cx, %bx
|
||||
|
||||
# CHECK: Iterations: 1500
|
||||
# CHECK-NEXT: Instructions: 4500
|
||||
# CHECK-NEXT: Total Cycles: 7503
|
||||
# CHECK-NEXT: Total uOps: 4500
|
||||
|
||||
# CHECK: Dispatch Width: 6
|
||||
# CHECK-NEXT: uOps Per Cycle: 0.60
|
||||
# CHECK-NEXT: IPC: 0.60
|
||||
# CHECK-NEXT: Block RThroughput: 1.3
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 3 1.00 imulw %ax, %bx
|
||||
# CHECK-NEXT: 1 1 1.00 lzcntw %ax, %bx
|
||||
# CHECK-NEXT: 1 1 0.25 addw %cx, %bx
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: - - - 1.67 1.00 1.67 1.67 - - - - - - - - - - - - - - - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - imulw %ax, %bx
|
||||
# CHECK-NEXT: - - - 1.33 - 1.33 1.33 - - - - - - - - - - - - - - - - lzcntw %ax, %bx
|
||||
# CHECK-NEXT: - - - 0.33 - 0.33 0.33 - - - - - - - - - - - - - - - - addw %cx, %bx
|
||||
|
||||
# CHECK: Timeline view:
|
||||
# CHECK-NEXT: 0123456789 01234567
|
||||
# CHECK-NEXT: Index 0123456789 0123456789
|
||||
|
||||
# CHECK: [0,0] DeeeER . . . . . . . imulw %ax, %bx
|
||||
# CHECK-NEXT: [0,1] D===eER . . . . . . . lzcntw %ax, %bx
|
||||
# CHECK-NEXT: [0,2] D====eER . . . . . . . addw %cx, %bx
|
||||
# CHECK-NEXT: [1,0] D=====eeeER . . . . . . imulw %ax, %bx
|
||||
# CHECK-NEXT: [1,1] D========eER . . . . . . lzcntw %ax, %bx
|
||||
# CHECK-NEXT: [1,2] D=========eER . . . . . . addw %cx, %bx
|
||||
# CHECK-NEXT: [2,0] .D=========eeeER . . . . . imulw %ax, %bx
|
||||
# CHECK-NEXT: [2,1] .D============eER . . . . . lzcntw %ax, %bx
|
||||
# CHECK-NEXT: [2,2] .D=============eER . . . . . addw %cx, %bx
|
||||
# CHECK-NEXT: [3,0] .D==============eeeER . . . . imulw %ax, %bx
|
||||
# CHECK-NEXT: [3,1] .D=================eER . . . . lzcntw %ax, %bx
|
||||
# CHECK-NEXT: [3,2] .D==================eER . . . . addw %cx, %bx
|
||||
# CHECK-NEXT: [4,0] . D==================eeeER . . . imulw %ax, %bx
|
||||
# CHECK-NEXT: [4,1] . D=====================eER . . . lzcntw %ax, %bx
|
||||
# CHECK-NEXT: [4,2] . D======================eER . . . addw %cx, %bx
|
||||
# CHECK-NEXT: [5,0] . D=======================eeeER . . imulw %ax, %bx
|
||||
# CHECK-NEXT: [5,1] . D==========================eER . . lzcntw %ax, %bx
|
||||
# CHECK-NEXT: [5,2] . D===========================eER . . addw %cx, %bx
|
||||
# CHECK-NEXT: [6,0] . D===========================eeeER . imulw %ax, %bx
|
||||
# CHECK-NEXT: [6,1] . D==============================eER. lzcntw %ax, %bx
|
||||
# CHECK-NEXT: [6,2] . D===============================eER addw %cx, %bx
|
||||
|
||||
# CHECK: Average Wait times (based on the timeline view):
|
||||
# CHECK-NEXT: [0]: Executions
|
||||
# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
|
||||
# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
|
||||
# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
|
||||
|
||||
# CHECK: [0] [1] [2] [3]
|
||||
# CHECK-NEXT: 0. 7 14.7 0.1 0.0 imulw %ax, %bx
|
||||
# CHECK-NEXT: 1. 7 17.7 0.0 0.0 lzcntw %ax, %bx
|
||||
# CHECK-NEXT: 2. 7 18.7 0.0 0.0 addw %cx, %bx
|
||||
# CHECK-NEXT: 7 17.0 0.0 0.0 <total>
|
|
@ -0,0 +1,80 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -iterations=1500 -timeline -timeline-max-iterations=8 < %s | FileCheck %s
|
||||
|
||||
lzcnt %ax, %bx ## partial register stall.
|
||||
|
||||
# CHECK: Iterations: 1500
|
||||
# CHECK-NEXT: Instructions: 1500
|
||||
# CHECK-NEXT: Total Cycles: 1503
|
||||
# CHECK-NEXT: Total uOps: 1500
|
||||
|
||||
# CHECK: Dispatch Width: 6
|
||||
# CHECK-NEXT: uOps Per Cycle: 1.00
|
||||
# CHECK-NEXT: IPC: 1.00
|
||||
# CHECK-NEXT: Block RThroughput: 1.0
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 1 1.00 lzcntw %ax, %bx
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - lzcntw %ax, %bx
|
||||
|
||||
# CHECK: Timeline view:
|
||||
# CHECK-NEXT: 0
|
||||
# CHECK-NEXT: Index 0123456789
|
||||
|
||||
# CHECK: [0,0] DeER . . lzcntw %ax, %bx
|
||||
# CHECK-NEXT: [1,0] D=eER. . lzcntw %ax, %bx
|
||||
# CHECK-NEXT: [2,0] D==eER . lzcntw %ax, %bx
|
||||
# CHECK-NEXT: [3,0] D===eER . lzcntw %ax, %bx
|
||||
# CHECK-NEXT: [4,0] D====eER . lzcntw %ax, %bx
|
||||
# CHECK-NEXT: [5,0] D=====eER . lzcntw %ax, %bx
|
||||
# CHECK-NEXT: [6,0] .D=====eER. lzcntw %ax, %bx
|
||||
# CHECK-NEXT: [7,0] .D======eER lzcntw %ax, %bx
|
||||
|
||||
# CHECK: Average Wait times (based on the timeline view):
|
||||
# CHECK-NEXT: [0]: Executions
|
||||
# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
|
||||
# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
|
||||
# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
|
||||
|
||||
# CHECK: [0] [1] [2] [3]
|
||||
# CHECK-NEXT: 0. 8 4.3 0.1 0.0 lzcntw %ax, %bx
|
|
@ -0,0 +1,98 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -iterations=1500 -timeline -timeline-max-iterations=4 < %s | FileCheck %s
|
||||
|
||||
# Each lzcnt has a false dependency on %ecx; the first lzcnt has to wait on the
|
||||
# imul. However, the folded load can start immediately.
|
||||
# The last lzcnt has a false dependency on %cx. However, even in this case, the
|
||||
# folded load can start immediately.
|
||||
|
||||
imul %edx, %ecx
|
||||
lzcnt (%rsp), %cx
|
||||
lzcnt 2(%rsp), %cx
|
||||
|
||||
# CHECK: Iterations: 1500
|
||||
# CHECK-NEXT: Instructions: 4500
|
||||
# CHECK-NEXT: Total Cycles: 9003
|
||||
# CHECK-NEXT: Total uOps: 4500
|
||||
|
||||
# CHECK: Dispatch Width: 6
|
||||
# CHECK-NEXT: uOps Per Cycle: 0.50
|
||||
# CHECK-NEXT: IPC: 0.50
|
||||
# CHECK-NEXT: Block RThroughput: 1.0
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 3 1.00 imull %edx, %ecx
|
||||
# CHECK-NEXT: 1 5 0.33 * lzcntw (%rsp), %cx
|
||||
# CHECK-NEXT: 1 5 0.33 * lzcntw 2(%rsp), %cx
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: 0.67 0.67 0.67 0.67 1.00 0.67 0.67 - - - - - - - - 0.67 0.67 0.67 0.67 0.67 0.67 - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - imull %edx, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.33 - 0.33 0.33 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - lzcntw (%rsp), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.33 - 0.33 0.33 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - lzcntw 2(%rsp), %cx
|
||||
|
||||
# CHECK: Timeline view:
|
||||
# CHECK-NEXT: 0123456789
|
||||
# CHECK-NEXT: Index 0123456789 0123456
|
||||
|
||||
# CHECK: [0,0] DeeeER . . . .. imull %edx, %ecx
|
||||
# CHECK-NEXT: [0,1] DeeeeeER . . . .. lzcntw (%rsp), %cx
|
||||
# CHECK-NEXT: [0,2] D=eeeeeER . . . .. lzcntw 2(%rsp), %cx
|
||||
# CHECK-NEXT: [1,0] D======eeeER . . .. imull %edx, %ecx
|
||||
# CHECK-NEXT: [1,1] D======eeeeeER . . .. lzcntw (%rsp), %cx
|
||||
# CHECK-NEXT: [1,2] D=======eeeeeER. . .. lzcntw 2(%rsp), %cx
|
||||
# CHECK-NEXT: [2,0] .D===========eeeER . .. imull %edx, %ecx
|
||||
# CHECK-NEXT: [2,1] .D===========eeeeeER. .. lzcntw (%rsp), %cx
|
||||
# CHECK-NEXT: [2,2] .D============eeeeeER .. lzcntw 2(%rsp), %cx
|
||||
# CHECK-NEXT: [3,0] .D=================eeeER .. imull %edx, %ecx
|
||||
# CHECK-NEXT: [3,1] .D=================eeeeeER. lzcntw (%rsp), %cx
|
||||
# CHECK-NEXT: [3,2] .D==================eeeeeER lzcntw 2(%rsp), %cx
|
||||
|
||||
# CHECK: Average Wait times (based on the timeline view):
|
||||
# CHECK-NEXT: [0]: Executions
|
||||
# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
|
||||
# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
|
||||
# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
|
||||
|
||||
# CHECK: [0] [1] [2] [3]
|
||||
# CHECK-NEXT: 0. 4 9.5 0.3 0.0 imull %edx, %ecx
|
||||
# CHECK-NEXT: 1. 4 9.5 0.0 0.0 lzcntw (%rsp), %cx
|
||||
# CHECK-NEXT: 2. 4 10.5 0.0 0.0 lzcntw 2(%rsp), %cx
|
||||
# CHECK-NEXT: 4 9.8 0.1 0.0 <total>
|
|
@ -0,0 +1,52 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -iterations=1 -resource-pressure=false -timeline < %s | FileCheck %s
|
||||
|
||||
# An instruction that writes to a 32-bit register will not have any false
|
||||
# dependence on the corresponding 64-bit register because the upper part of
|
||||
# the 64-bit register is set to zero.
|
||||
|
||||
imulq %rax, %rcx
|
||||
addl %edx, %ecx
|
||||
addq %rcx, %rdx
|
||||
|
||||
# CHECK: Iterations: 1
|
||||
# CHECK-NEXT: Instructions: 3
|
||||
# CHECK-NEXT: Total Cycles: 8
|
||||
# CHECK-NEXT: Total uOps: 3
|
||||
|
||||
# CHECK: Dispatch Width: 6
|
||||
# CHECK-NEXT: uOps Per Cycle: 0.38
|
||||
# CHECK-NEXT: IPC: 0.38
|
||||
# CHECK-NEXT: Block RThroughput: 1.0
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 3 1.00 imulq %rax, %rcx
|
||||
# CHECK-NEXT: 1 1 0.25 addl %edx, %ecx
|
||||
# CHECK-NEXT: 1 1 0.25 addq %rcx, %rdx
|
||||
|
||||
# CHECK: Timeline view:
|
||||
# CHECK-NEXT: Index 01234567
|
||||
|
||||
# CHECK: [0,0] DeeeER . imulq %rax, %rcx
|
||||
# CHECK-NEXT: [0,1] D===eER. addl %edx, %ecx
|
||||
# CHECK-NEXT: [0,2] D====eER addq %rcx, %rdx
|
||||
|
||||
# CHECK: Average Wait times (based on the timeline view):
|
||||
# CHECK-NEXT: [0]: Executions
|
||||
# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
|
||||
# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
|
||||
# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
|
||||
|
||||
# CHECK: [0] [1] [2] [3]
|
||||
# CHECK-NEXT: 0. 1 1.0 1.0 0.0 imulq %rax, %rcx
|
||||
# CHECK-NEXT: 1. 1 4.0 0.0 0.0 addl %edx, %ecx
|
||||
# CHECK-NEXT: 2. 1 5.0 0.0 0.0 addq %rcx, %rdx
|
||||
# CHECK-NEXT: 1 3.3 0.3 0.0 <total>
|
|
@ -0,0 +1,48 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -iterations=1 -resource-pressure=false -timeline < %s | FileCheck %s
|
||||
|
||||
imul %ax, %cx
|
||||
add %al, %cl
|
||||
add %ecx, %ebx
|
||||
|
||||
# CHECK: Iterations: 1
|
||||
# CHECK-NEXT: Instructions: 3
|
||||
# CHECK-NEXT: Total Cycles: 8
|
||||
# CHECK-NEXT: Total uOps: 3
|
||||
|
||||
# CHECK: Dispatch Width: 6
|
||||
# CHECK-NEXT: uOps Per Cycle: 0.38
|
||||
# CHECK-NEXT: IPC: 0.38
|
||||
# CHECK-NEXT: Block RThroughput: 1.0
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 3 1.00 imulw %ax, %cx
|
||||
# CHECK-NEXT: 1 1 0.25 addb %al, %cl
|
||||
# CHECK-NEXT: 1 1 0.25 addl %ecx, %ebx
|
||||
|
||||
# CHECK: Timeline view:
|
||||
# CHECK-NEXT: Index 01234567
|
||||
|
||||
# CHECK: [0,0] DeeeER . imulw %ax, %cx
|
||||
# CHECK-NEXT: [0,1] D===eER. addb %al, %cl
|
||||
# CHECK-NEXT: [0,2] D====eER addl %ecx, %ebx
|
||||
|
||||
# CHECK: Average Wait times (based on the timeline view):
|
||||
# CHECK-NEXT: [0]: Executions
|
||||
# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
|
||||
# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
|
||||
# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
|
||||
|
||||
# CHECK: [0] [1] [2] [3]
|
||||
# CHECK-NEXT: 0. 1 1.0 1.0 0.0 imulw %ax, %cx
|
||||
# CHECK-NEXT: 1. 1 4.0 0.0 0.0 addb %al, %cl
|
||||
# CHECK-NEXT: 2. 1 5.0 0.0 0.0 addl %ecx, %ebx
|
||||
# CHECK-NEXT: 1 3.3 0.3 0.0 <total>
|
|
@ -0,0 +1,70 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
adcx %ebx, %ecx
|
||||
adcx (%rbx), %ecx
|
||||
adcx %rbx, %rcx
|
||||
adcx (%rbx), %rcx
|
||||
|
||||
adox %ebx, %ecx
|
||||
adox (%rbx), %ecx
|
||||
adox %rbx, %rcx
|
||||
adox (%rbx), %rcx
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 1 1.00 adcxl %ebx, %ecx
|
||||
# CHECK-NEXT: 1 5 1.00 * adcxl (%rbx), %ecx
|
||||
# CHECK-NEXT: 1 1 1.00 adcxq %rbx, %rcx
|
||||
# CHECK-NEXT: 1 5 1.00 * adcxq (%rbx), %rcx
|
||||
# CHECK-NEXT: 1 1 1.00 adoxl %ebx, %ecx
|
||||
# CHECK-NEXT: 1 5 1.00 * adoxl (%rbx), %ecx
|
||||
# CHECK-NEXT: 1 1 1.00 adoxq %rbx, %rcx
|
||||
# CHECK-NEXT: 1 5 1.00 * adoxq (%rbx), %rcx
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: 1.33 1.33 1.33 8.00 8.00 8.00 8.00 - - - - - - - - 1.33 1.33 1.33 1.33 1.33 1.33 - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - adcxl %ebx, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 1.00 1.00 1.00 1.00 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - adcxl (%rbx), %ecx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - adcxq %rbx, %rcx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 1.00 1.00 1.00 1.00 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - adcxq (%rbx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - adoxl %ebx, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 1.00 1.00 1.00 1.00 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - adoxl (%rbx), %ecx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - adoxq %rbx, %rcx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 1.00 1.00 1.00 1.00 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - adoxq (%rbx), %rcx
|
|
@ -0,0 +1,86 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
aesdec %xmm0, %xmm2
|
||||
aesdec (%rax), %xmm2
|
||||
|
||||
aesdeclast %xmm0, %xmm2
|
||||
aesdeclast (%rax), %xmm2
|
||||
|
||||
aesenc %xmm0, %xmm2
|
||||
aesenc (%rax), %xmm2
|
||||
|
||||
aesenclast %xmm0, %xmm2
|
||||
aesenclast (%rax), %xmm2
|
||||
|
||||
aesimc %xmm0, %xmm2
|
||||
aesimc (%rax), %xmm2
|
||||
|
||||
aeskeygenassist $22, %xmm0, %xmm2
|
||||
aeskeygenassist $22, (%rax), %xmm2
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 4 0.50 aesdec %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 11 0.50 * aesdec (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 4 0.50 aesdeclast %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 11 0.50 * aesdeclast (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 4 0.50 aesenc %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 11 0.50 * aesenc (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 4 0.50 aesenclast %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 11 0.50 * aesenclast (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 4 0.50 aesimc %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 11 0.50 * aesimc (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 4 0.50 aeskeygenassist $22, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 11 0.50 * aeskeygenassist $22, (%rax), %xmm2
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: - - - - - - - - 6.00 6.00 - - 3.00 3.00 - 2.00 2.00 2.00 2.00 2.00 2.00 - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - aesdec %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - aesdec (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - aesdeclast %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - aesdeclast (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - aesenc %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - aesenc (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - aesenclast %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - aesenclast (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - aesimc %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - aesimc (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - aeskeygenassist $22, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - aeskeygenassist $22, (%rax), %xmm2
|
File diff suppressed because it is too large
Load Diff
File diff suppressed because it is too large
Load Diff
|
@ -0,0 +1,135 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
andn %eax, %ebx, %ecx
|
||||
andn (%rax), %ebx, %ecx
|
||||
|
||||
andn %rax, %rbx, %rcx
|
||||
andn (%rax), %rbx, %rcx
|
||||
|
||||
bextr %eax, %ebx, %ecx
|
||||
bextr %eax, (%rbx), %ecx
|
||||
|
||||
bextr %rax, %rbx, %rcx
|
||||
bextr %rax, (%rbx), %rcx
|
||||
|
||||
blsi %eax, %ecx
|
||||
blsi (%rax), %ecx
|
||||
|
||||
blsi %rax, %rcx
|
||||
blsi (%rax), %rcx
|
||||
|
||||
blsmsk %eax, %ecx
|
||||
blsmsk (%rax), %ecx
|
||||
|
||||
blsmsk %rax, %rcx
|
||||
blsmsk (%rax), %rcx
|
||||
|
||||
blsr %eax, %ecx
|
||||
blsr (%rax), %ecx
|
||||
|
||||
blsr %rax, %rcx
|
||||
blsr (%rax), %rcx
|
||||
|
||||
tzcnt %ax, %cx
|
||||
tzcnt (%rax), %cx
|
||||
|
||||
tzcnt %eax, %ecx
|
||||
tzcnt (%rax), %ecx
|
||||
|
||||
tzcnt %rax, %rcx
|
||||
tzcnt (%rax), %rcx
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 1 0.25 andnl %eax, %ebx, %ecx
|
||||
# CHECK-NEXT: 1 5 0.33 * andnl (%rax), %ebx, %ecx
|
||||
# CHECK-NEXT: 1 1 0.25 andnq %rax, %rbx, %rcx
|
||||
# CHECK-NEXT: 1 5 0.33 * andnq (%rax), %rbx, %rcx
|
||||
# CHECK-NEXT: 1 1 0.50 bextrl %eax, %ebx, %ecx
|
||||
# CHECK-NEXT: 2 5 0.50 * bextrl %eax, (%rbx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.50 bextrq %rax, %rbx, %rcx
|
||||
# CHECK-NEXT: 2 5 0.50 * bextrq %rax, (%rbx), %rcx
|
||||
# CHECK-NEXT: 2 2 0.50 blsil %eax, %ecx
|
||||
# CHECK-NEXT: 3 6 0.50 * blsil (%rax), %ecx
|
||||
# CHECK-NEXT: 2 2 0.50 blsiq %rax, %rcx
|
||||
# CHECK-NEXT: 3 6 0.50 * blsiq (%rax), %rcx
|
||||
# CHECK-NEXT: 2 2 0.50 blsmskl %eax, %ecx
|
||||
# CHECK-NEXT: 3 6 0.50 * blsmskl (%rax), %ecx
|
||||
# CHECK-NEXT: 2 2 0.50 blsmskq %rax, %rcx
|
||||
# CHECK-NEXT: 3 6 0.50 * blsmskq (%rax), %rcx
|
||||
# CHECK-NEXT: 2 2 0.50 blsrl %eax, %ecx
|
||||
# CHECK-NEXT: 3 6 0.50 * blsrl (%rax), %ecx
|
||||
# CHECK-NEXT: 2 2 0.50 blsrq %rax, %rcx
|
||||
# CHECK-NEXT: 3 6 0.50 * blsrq (%rax), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 tzcntw %ax, %cx
|
||||
# CHECK-NEXT: 2 6 0.50 * tzcntw (%rax), %cx
|
||||
# CHECK-NEXT: 2 2 0.50 tzcntl %eax, %ecx
|
||||
# CHECK-NEXT: 2 6 0.50 * tzcntl (%rax), %ecx
|
||||
# CHECK-NEXT: 2 2 0.50 tzcntq %rax, %rcx
|
||||
# CHECK-NEXT: 2 6 0.50 * tzcntq (%rax), %rcx
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: 4.33 4.33 4.33 8.00 12.50 12.50 8.00 - - - - - - - - 4.33 4.33 4.33 4.33 4.33 4.33 - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - andnl %eax, %ebx, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - andnl (%rax), %ebx, %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - andnq %rax, %rbx, %rcx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - andnq (%rax), %rbx, %rcx
|
||||
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - bextrl %eax, %ebx, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - bextrl %eax, (%rbx), %ecx
|
||||
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - bextrq %rax, %rbx, %rcx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - bextrq %rax, (%rbx), %rcx
|
||||
# CHECK-NEXT: - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - - - - - - blsil %eax, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 0.50 0.50 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - blsil (%rax), %ecx
|
||||
# CHECK-NEXT: - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - - - - - - blsiq %rax, %rcx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 0.50 0.50 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - blsiq (%rax), %rcx
|
||||
# CHECK-NEXT: - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - - - - - - blsmskl %eax, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 0.50 0.50 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - blsmskl (%rax), %ecx
|
||||
# CHECK-NEXT: - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - - - - - - blsmskq %rax, %rcx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 0.50 0.50 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - blsmskq (%rax), %rcx
|
||||
# CHECK-NEXT: - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - - - - - - blsrl %eax, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 0.50 0.50 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - blsrl (%rax), %ecx
|
||||
# CHECK-NEXT: - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - - - - - - blsrq %rax, %rcx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 0.50 0.50 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - blsrq (%rax), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - tzcntw %ax, %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - tzcntw (%rax), %cx
|
||||
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - tzcntl %eax, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - tzcntl (%rax), %ecx
|
||||
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - tzcntq %rax, %rcx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - tzcntq (%rax), %rcx
|
|
@ -0,0 +1,156 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
bzhi %eax, %ebx, %ecx
|
||||
bzhi %eax, (%rbx), %ecx
|
||||
|
||||
bzhi %rax, %rbx, %rcx
|
||||
bzhi %rax, (%rbx), %rcx
|
||||
|
||||
mulx %eax, %ebx, %ecx
|
||||
mulx (%rax), %ebx, %ecx
|
||||
|
||||
mulx %rax, %rbx, %rcx
|
||||
mulx (%rax), %rbx, %rcx
|
||||
|
||||
pdep %eax, %ebx, %ecx
|
||||
pdep (%rax), %ebx, %ecx
|
||||
|
||||
pdep %rax, %rbx, %rcx
|
||||
pdep (%rax), %rbx, %rcx
|
||||
|
||||
pext %eax, %ebx, %ecx
|
||||
pext (%rax), %ebx, %ecx
|
||||
|
||||
pext %rax, %rbx, %rcx
|
||||
pext (%rax), %rbx, %rcx
|
||||
|
||||
rorx $1, %eax, %ecx
|
||||
rorx $1, (%rax), %ecx
|
||||
|
||||
rorx $1, %rax, %rcx
|
||||
rorx $1, (%rax), %rcx
|
||||
|
||||
sarx %eax, %ebx, %ecx
|
||||
sarx %eax, (%rbx), %ecx
|
||||
|
||||
sarx %rax, %rbx, %rcx
|
||||
sarx %rax, (%rbx), %rcx
|
||||
|
||||
shlx %eax, %ebx, %ecx
|
||||
shlx %eax, (%rbx), %ecx
|
||||
|
||||
shlx %rax, %rbx, %rcx
|
||||
shlx %rax, (%rbx), %rcx
|
||||
|
||||
shrx %eax, %ebx, %ecx
|
||||
shrx %eax, (%rbx), %ecx
|
||||
|
||||
shrx %rax, %rbx, %rcx
|
||||
shrx %rax, (%rbx), %rcx
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 1 0.50 bzhil %eax, %ebx, %ecx
|
||||
# CHECK-NEXT: 2 5 0.50 * bzhil %eax, (%rbx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.50 bzhiq %rax, %rbx, %rcx
|
||||
# CHECK-NEXT: 2 5 0.50 * bzhiq %rax, (%rbx), %rcx
|
||||
# CHECK-NEXT: 2 3 1.00 mulxl %eax, %ebx, %ecx
|
||||
# CHECK-NEXT: 2 7 2.00 * mulxl (%rax), %ebx, %ecx
|
||||
# CHECK-NEXT: 2 4 1.00 mulxq %rax, %rbx, %rcx
|
||||
# CHECK-NEXT: 2 8 2.00 * mulxq (%rax), %rbx, %rcx
|
||||
# CHECK-NEXT: 1 3 1.00 pdepl %eax, %ebx, %ecx
|
||||
# CHECK-NEXT: 1 5 0.33 * pdepl (%rax), %ebx, %ecx
|
||||
# CHECK-NEXT: 1 3 1.00 pdepq %rax, %rbx, %rcx
|
||||
# CHECK-NEXT: 1 5 0.33 * pdepq (%rax), %rbx, %rcx
|
||||
# CHECK-NEXT: 1 3 1.00 pextl %eax, %ebx, %ecx
|
||||
# CHECK-NEXT: 1 5 0.33 * pextl (%rax), %ebx, %ecx
|
||||
# CHECK-NEXT: 1 3 1.00 pextq %rax, %rbx, %rcx
|
||||
# CHECK-NEXT: 1 5 0.33 * pextq (%rax), %rbx, %rcx
|
||||
# CHECK-NEXT: 1 1 0.50 rorxl $1, %eax, %ecx
|
||||
# CHECK-NEXT: 2 5 0.50 * rorxl $1, (%rax), %ecx
|
||||
# CHECK-NEXT: 1 1 0.50 rorxq $1, %rax, %rcx
|
||||
# CHECK-NEXT: 2 5 0.50 * rorxq $1, (%rax), %rcx
|
||||
# CHECK-NEXT: 1 1 0.50 sarxl %eax, %ebx, %ecx
|
||||
# CHECK-NEXT: 2 5 0.50 * sarxl %eax, (%rbx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.50 sarxq %rax, %rbx, %rcx
|
||||
# CHECK-NEXT: 2 5 0.50 * sarxq %rax, (%rbx), %rcx
|
||||
# CHECK-NEXT: 1 1 0.50 shlxl %eax, %ebx, %ecx
|
||||
# CHECK-NEXT: 2 5 0.50 * shlxl %eax, (%rbx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.50 shlxq %rax, %rbx, %rcx
|
||||
# CHECK-NEXT: 2 5 0.50 * shlxq %rax, (%rbx), %rcx
|
||||
# CHECK-NEXT: 1 1 0.50 shrxl %eax, %ebx, %ecx
|
||||
# CHECK-NEXT: 2 5 0.50 * shrxl %eax, (%rbx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.50 shrxq %rax, %rbx, %rcx
|
||||
# CHECK-NEXT: 2 5 0.50 * shrxq %rax, (%rbx), %rcx
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: 5.33 5.33 5.33 1.00 21.00 11.00 1.00 - - - - - - - - 5.33 5.33 5.33 5.33 5.33 5.33 - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - bzhil %eax, %ebx, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - bzhil %eax, (%rbx), %ecx
|
||||
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - bzhiq %rax, %rbx, %rcx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - bzhiq %rax, (%rbx), %rcx
|
||||
# CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - mulxl %eax, %ebx, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 2.00 - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - mulxl (%rax), %ebx, %ecx
|
||||
# CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - mulxq %rax, %rbx, %rcx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 2.00 - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - mulxq (%rax), %rbx, %rcx
|
||||
# CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - pdepl %eax, %ebx, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - pdepl (%rax), %ebx, %ecx
|
||||
# CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - pdepq %rax, %rbx, %rcx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - pdepq (%rax), %rbx, %rcx
|
||||
# CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - pextl %eax, %ebx, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - pextl (%rax), %ebx, %ecx
|
||||
# CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - pextq %rax, %rbx, %rcx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - pextq (%rax), %rbx, %rcx
|
||||
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - rorxl $1, %eax, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - rorxl $1, (%rax), %ecx
|
||||
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - rorxq $1, %rax, %rcx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - rorxq $1, (%rax), %rcx
|
||||
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - sarxl %eax, %ebx, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - sarxl %eax, (%rbx), %ecx
|
||||
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - sarxq %rax, %rbx, %rcx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - sarxq %rax, (%rbx), %rcx
|
||||
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - shlxl %eax, %ebx, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - shlxl %eax, (%rbx), %ecx
|
||||
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - shlxq %rax, %rbx, %rcx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - shlxq %rax, (%rbx), %rcx
|
||||
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - shrxl %eax, %ebx, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - shrxl %eax, (%rbx), %ecx
|
||||
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - - - - - - - - - - - - shrxq %rax, %rbx, %rcx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 0.50 0.50 - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - shrxq %rax, (%rbx), %rcx
|
|
@ -0,0 +1,48 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
clflushopt (%rax)
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 5 0.33 * * U clflushopt (%rax)
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - clflushopt (%rax)
|
|
@ -0,0 +1,48 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
clzero
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 5 0.33 U clzero
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - clzero
|
|
@ -0,0 +1,338 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
cmovow %si, %di
|
||||
cmovnow %si, %di
|
||||
cmovbw %si, %di
|
||||
cmovaew %si, %di
|
||||
cmovew %si, %di
|
||||
cmovnew %si, %di
|
||||
cmovbew %si, %di
|
||||
cmovaw %si, %di
|
||||
cmovsw %si, %di
|
||||
cmovnsw %si, %di
|
||||
cmovpw %si, %di
|
||||
cmovnpw %si, %di
|
||||
cmovlw %si, %di
|
||||
cmovgew %si, %di
|
||||
cmovlew %si, %di
|
||||
cmovgw %si, %di
|
||||
|
||||
cmovow (%rax), %di
|
||||
cmovnow (%rax), %di
|
||||
cmovbw (%rax), %di
|
||||
cmovaew (%rax), %di
|
||||
cmovew (%rax), %di
|
||||
cmovnew (%rax), %di
|
||||
cmovbew (%rax), %di
|
||||
cmovaw (%rax), %di
|
||||
cmovsw (%rax), %di
|
||||
cmovnsw (%rax), %di
|
||||
cmovpw (%rax), %di
|
||||
cmovnpw (%rax), %di
|
||||
cmovlw (%rax), %di
|
||||
cmovgew (%rax), %di
|
||||
cmovlew (%rax), %di
|
||||
cmovgw (%rax), %di
|
||||
|
||||
cmovol %esi, %edi
|
||||
cmovnol %esi, %edi
|
||||
cmovbl %esi, %edi
|
||||
cmovael %esi, %edi
|
||||
cmovel %esi, %edi
|
||||
cmovnel %esi, %edi
|
||||
cmovbel %esi, %edi
|
||||
cmoval %esi, %edi
|
||||
cmovsl %esi, %edi
|
||||
cmovnsl %esi, %edi
|
||||
cmovpl %esi, %edi
|
||||
cmovnpl %esi, %edi
|
||||
cmovll %esi, %edi
|
||||
cmovgel %esi, %edi
|
||||
cmovlel %esi, %edi
|
||||
cmovgl %esi, %edi
|
||||
|
||||
cmovol (%rax), %edi
|
||||
cmovnol (%rax), %edi
|
||||
cmovbl (%rax), %edi
|
||||
cmovael (%rax), %edi
|
||||
cmovel (%rax), %edi
|
||||
cmovnel (%rax), %edi
|
||||
cmovbel (%rax), %edi
|
||||
cmoval (%rax), %edi
|
||||
cmovsl (%rax), %edi
|
||||
cmovnsl (%rax), %edi
|
||||
cmovpl (%rax), %edi
|
||||
cmovnpl (%rax), %edi
|
||||
cmovll (%rax), %edi
|
||||
cmovgel (%rax), %edi
|
||||
cmovlel (%rax), %edi
|
||||
cmovgl (%rax), %edi
|
||||
|
||||
cmovoq %rsi, %rdi
|
||||
cmovnoq %rsi, %rdi
|
||||
cmovbq %rsi, %rdi
|
||||
cmovaeq %rsi, %rdi
|
||||
cmoveq %rsi, %rdi
|
||||
cmovneq %rsi, %rdi
|
||||
cmovbeq %rsi, %rdi
|
||||
cmovaq %rsi, %rdi
|
||||
cmovsq %rsi, %rdi
|
||||
cmovnsq %rsi, %rdi
|
||||
cmovpq %rsi, %rdi
|
||||
cmovnpq %rsi, %rdi
|
||||
cmovlq %rsi, %rdi
|
||||
cmovgeq %rsi, %rdi
|
||||
cmovleq %rsi, %rdi
|
||||
cmovgq %rsi, %rdi
|
||||
|
||||
cmovoq (%rax), %rdi
|
||||
cmovnoq (%rax), %rdi
|
||||
cmovbq (%rax), %rdi
|
||||
cmovaeq (%rax), %rdi
|
||||
cmoveq (%rax), %rdi
|
||||
cmovneq (%rax), %rdi
|
||||
cmovbeq (%rax), %rdi
|
||||
cmovaq (%rax), %rdi
|
||||
cmovsq (%rax), %rdi
|
||||
cmovnsq (%rax), %rdi
|
||||
cmovpq (%rax), %rdi
|
||||
cmovnpq (%rax), %rdi
|
||||
cmovlq (%rax), %rdi
|
||||
cmovgeq (%rax), %rdi
|
||||
cmovleq (%rax), %rdi
|
||||
cmovgq (%rax), %rdi
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 1 0.50 cmovow %si, %di
|
||||
# CHECK-NEXT: 1 1 0.50 cmovnow %si, %di
|
||||
# CHECK-NEXT: 1 1 0.50 cmovbw %si, %di
|
||||
# CHECK-NEXT: 1 1 0.50 cmovaew %si, %di
|
||||
# CHECK-NEXT: 1 1 0.50 cmovew %si, %di
|
||||
# CHECK-NEXT: 1 1 0.50 cmovnew %si, %di
|
||||
# CHECK-NEXT: 1 1 0.50 cmovbew %si, %di
|
||||
# CHECK-NEXT: 1 1 0.50 cmovaw %si, %di
|
||||
# CHECK-NEXT: 1 1 0.50 cmovsw %si, %di
|
||||
# CHECK-NEXT: 1 1 0.50 cmovnsw %si, %di
|
||||
# CHECK-NEXT: 1 1 0.50 cmovpw %si, %di
|
||||
# CHECK-NEXT: 1 1 0.50 cmovnpw %si, %di
|
||||
# CHECK-NEXT: 1 1 0.50 cmovlw %si, %di
|
||||
# CHECK-NEXT: 1 1 0.50 cmovgew %si, %di
|
||||
# CHECK-NEXT: 1 1 0.50 cmovlew %si, %di
|
||||
# CHECK-NEXT: 1 1 0.50 cmovgw %si, %di
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovow (%rax), %di
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovnow (%rax), %di
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovbw (%rax), %di
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovaew (%rax), %di
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovew (%rax), %di
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovnew (%rax), %di
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovbew (%rax), %di
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovaw (%rax), %di
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovsw (%rax), %di
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovnsw (%rax), %di
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovpw (%rax), %di
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovnpw (%rax), %di
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovlw (%rax), %di
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovgew (%rax), %di
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovlew (%rax), %di
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovgw (%rax), %di
|
||||
# CHECK-NEXT: 1 1 0.50 cmovol %esi, %edi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovnol %esi, %edi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovbl %esi, %edi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovael %esi, %edi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovel %esi, %edi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovnel %esi, %edi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovbel %esi, %edi
|
||||
# CHECK-NEXT: 1 1 0.50 cmoval %esi, %edi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovsl %esi, %edi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovnsl %esi, %edi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovpl %esi, %edi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovnpl %esi, %edi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovll %esi, %edi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovgel %esi, %edi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovlel %esi, %edi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovgl %esi, %edi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovol (%rax), %edi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovnol (%rax), %edi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovbl (%rax), %edi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovael (%rax), %edi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovel (%rax), %edi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovnel (%rax), %edi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovbel (%rax), %edi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmoval (%rax), %edi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovsl (%rax), %edi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovnsl (%rax), %edi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovpl (%rax), %edi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovnpl (%rax), %edi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovll (%rax), %edi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovgel (%rax), %edi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovlel (%rax), %edi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovgl (%rax), %edi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovoq %rsi, %rdi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovnoq %rsi, %rdi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovbq %rsi, %rdi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovaeq %rsi, %rdi
|
||||
# CHECK-NEXT: 1 1 0.50 cmoveq %rsi, %rdi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovneq %rsi, %rdi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovbeq %rsi, %rdi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovaq %rsi, %rdi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovsq %rsi, %rdi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovnsq %rsi, %rdi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovpq %rsi, %rdi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovnpq %rsi, %rdi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovlq %rsi, %rdi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovgeq %rsi, %rdi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovleq %rsi, %rdi
|
||||
# CHECK-NEXT: 1 1 0.50 cmovgq %rsi, %rdi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovoq (%rax), %rdi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovnoq (%rax), %rdi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovbq (%rax), %rdi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovaeq (%rax), %rdi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmoveq (%rax), %rdi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovneq (%rax), %rdi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovbeq (%rax), %rdi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovaq (%rax), %rdi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovsq (%rax), %rdi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovnsq (%rax), %rdi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovpq (%rax), %rdi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovnpq (%rax), %rdi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovlq (%rax), %rdi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovgeq (%rax), %rdi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovleq (%rax), %rdi
|
||||
# CHECK-NEXT: 1 5 0.50 * cmovgq (%rax), %rdi
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: 16.00 16.00 16.00 48.00 - - 48.00 - - - - - - - - 16.00 16.00 16.00 16.00 16.00 16.00 - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovow %si, %di
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovnow %si, %di
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovbw %si, %di
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovaew %si, %di
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovew %si, %di
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovnew %si, %di
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovbew %si, %di
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovaw %si, %di
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovsw %si, %di
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovnsw %si, %di
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovpw %si, %di
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovnpw %si, %di
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovlw %si, %di
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovgew %si, %di
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovlew %si, %di
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovgw %si, %di
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovow (%rax), %di
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovnow (%rax), %di
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovbw (%rax), %di
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovaew (%rax), %di
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovew (%rax), %di
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovnew (%rax), %di
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovbew (%rax), %di
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovaw (%rax), %di
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovsw (%rax), %di
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovnsw (%rax), %di
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovpw (%rax), %di
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovnpw (%rax), %di
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovlw (%rax), %di
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovgew (%rax), %di
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovlew (%rax), %di
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovgw (%rax), %di
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovol %esi, %edi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovnol %esi, %edi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovbl %esi, %edi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovael %esi, %edi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovel %esi, %edi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovnel %esi, %edi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovbel %esi, %edi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmoval %esi, %edi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovsl %esi, %edi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovnsl %esi, %edi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovpl %esi, %edi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovnpl %esi, %edi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovll %esi, %edi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovgel %esi, %edi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovlel %esi, %edi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovgl %esi, %edi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovol (%rax), %edi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovnol (%rax), %edi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovbl (%rax), %edi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovael (%rax), %edi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovel (%rax), %edi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovnel (%rax), %edi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovbel (%rax), %edi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmoval (%rax), %edi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovsl (%rax), %edi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovnsl (%rax), %edi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovpl (%rax), %edi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovnpl (%rax), %edi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovll (%rax), %edi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovgel (%rax), %edi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovlel (%rax), %edi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovgl (%rax), %edi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovoq %rsi, %rdi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovnoq %rsi, %rdi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovbq %rsi, %rdi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovaeq %rsi, %rdi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmoveq %rsi, %rdi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovneq %rsi, %rdi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovbeq %rsi, %rdi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovaq %rsi, %rdi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovsq %rsi, %rdi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovnsq %rsi, %rdi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovpq %rsi, %rdi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovnpq %rsi, %rdi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovlq %rsi, %rdi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovgeq %rsi, %rdi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovleq %rsi, %rdi
|
||||
# CHECK-NEXT: - - - 0.50 - - 0.50 - - - - - - - - - - - - - - - - cmovgq %rsi, %rdi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovoq (%rax), %rdi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovnoq (%rax), %rdi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovbq (%rax), %rdi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovaeq (%rax), %rdi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmoveq (%rax), %rdi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovneq (%rax), %rdi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovbeq (%rax), %rdi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovaq (%rax), %rdi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovsq (%rax), %rdi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovnsq (%rax), %rdi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovpq (%rax), %rdi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovnpq (%rax), %rdi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovlq (%rax), %rdi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovgeq (%rax), %rdi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovleq (%rax), %rdi
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.50 - - 0.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmovgq (%rax), %rdi
|
|
@ -0,0 +1,51 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
cmpxchg8b (%rax)
|
||||
cmpxchg16b (%rax)
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 19 3 6.00 * * cmpxchg8b (%rax)
|
||||
# CHECK-NEXT: 28 4 14.75 * * cmpxchg16b (%rax)
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: - - - 20.75 20.75 20.75 20.75 - - - - - - - - - - - - - - - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - 6.00 6.00 6.00 6.00 - - - - - - - - - - - - - - - - cmpxchg8b (%rax)
|
||||
# CHECK-NEXT: - - - 14.75 14.75 14.75 14.75 - - - - - - - - - - - - - - - - cmpxchg16b (%rax)
|
|
@ -0,0 +1,72 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
vcvtph2ps %xmm0, %xmm2
|
||||
vcvtph2ps (%rax), %xmm2
|
||||
|
||||
vcvtph2ps %xmm0, %ymm2
|
||||
vcvtph2ps (%rax), %ymm2
|
||||
|
||||
vcvtps2ph $0, %xmm0, %xmm2
|
||||
vcvtps2ph $0, %xmm0, (%rax)
|
||||
|
||||
vcvtps2ph $0, %ymm0, %xmm2
|
||||
vcvtps2ph $0, %ymm0, (%rax)
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 3 0.50 vcvtph2ps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * vcvtph2ps (%rax), %xmm2
|
||||
# CHECK-NEXT: 2 4 1.00 vcvtph2ps %xmm0, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vcvtph2ps (%rax), %ymm2
|
||||
# CHECK-NEXT: 1 3 1.00 vcvtps2ph $0, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 2 4 1.00 * vcvtps2ph $0, %xmm0, (%rax)
|
||||
# CHECK-NEXT: 2 6 1.00 vcvtps2ph $0, %ymm0, %xmm2
|
||||
# CHECK-NEXT: 3 7 1.00 * vcvtps2ph $0, %ymm0, (%rax)
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: - - - - - - - - - - 6.50 6.50 2.00 2.00 2.00 1.33 1.33 1.33 0.67 0.67 0.67 1.00 1.00
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - vcvtph2ps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vcvtph2ps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 - - - - - - - - - - - vcvtph2ps %xmm0, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vcvtph2ps (%rax), %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 - - - - - - - - - - - vcvtps2ph $0, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 vcvtps2ph $0, %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 - - - - - - - - - - - vcvtps2ph $0, %ymm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 vcvtps2ph $0, %ymm0, (%rax)
|
|
@ -0,0 +1,716 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
vfmadd132pd %xmm0, %xmm1, %xmm2
|
||||
vfmadd132pd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmadd132pd %ymm0, %ymm1, %ymm2
|
||||
vfmadd132pd (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmadd213pd %xmm0, %xmm1, %xmm2
|
||||
vfmadd213pd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmadd213pd %ymm0, %ymm1, %ymm2
|
||||
vfmadd213pd (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmadd231pd %xmm0, %xmm1, %xmm2
|
||||
vfmadd231pd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmadd231pd %ymm0, %ymm1, %ymm2
|
||||
vfmadd231pd (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmadd132ps %xmm0, %xmm1, %xmm2
|
||||
vfmadd132ps (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmadd132ps %ymm0, %ymm1, %ymm2
|
||||
vfmadd132ps (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmadd213ps %xmm0, %xmm1, %xmm2
|
||||
vfmadd213ps (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmadd213ps %ymm0, %ymm1, %ymm2
|
||||
vfmadd213ps (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmadd231ps %xmm0, %xmm1, %xmm2
|
||||
vfmadd231ps (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmadd231ps %ymm0, %ymm1, %ymm2
|
||||
vfmadd231ps (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmadd132sd %xmm0, %xmm1, %xmm2
|
||||
vfmadd132sd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmadd213sd %xmm0, %xmm1, %xmm2
|
||||
vfmadd213sd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmadd231sd %xmm0, %xmm1, %xmm2
|
||||
vfmadd231sd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmadd132ss %xmm0, %xmm1, %xmm2
|
||||
vfmadd132ss (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmadd213ss %xmm0, %xmm1, %xmm2
|
||||
vfmadd213ss (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmadd231ss %xmm0, %xmm1, %xmm2
|
||||
vfmadd231ss (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmaddsub132pd %xmm0, %xmm1, %xmm2
|
||||
vfmaddsub132pd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmaddsub132pd %ymm0, %ymm1, %ymm2
|
||||
vfmaddsub132pd (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmaddsub213pd %xmm0, %xmm1, %xmm2
|
||||
vfmaddsub213pd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmaddsub213pd %ymm0, %ymm1, %ymm2
|
||||
vfmaddsub213pd (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmaddsub231pd %xmm0, %xmm1, %xmm2
|
||||
vfmaddsub231pd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmaddsub231pd %ymm0, %ymm1, %ymm2
|
||||
vfmaddsub231pd (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmaddsub132ps %xmm0, %xmm1, %xmm2
|
||||
vfmaddsub132ps (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmaddsub132ps %ymm0, %ymm1, %ymm2
|
||||
vfmaddsub132ps (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmaddsub213ps %xmm0, %xmm1, %xmm2
|
||||
vfmaddsub213ps (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmaddsub213ps %ymm0, %ymm1, %ymm2
|
||||
vfmaddsub213ps (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmaddsub231ps %xmm0, %xmm1, %xmm2
|
||||
vfmaddsub231ps (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmaddsub231ps %ymm0, %ymm1, %ymm2
|
||||
vfmaddsub231ps (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmsub132pd %xmm0, %xmm1, %xmm2
|
||||
vfmsub132pd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmsub132pd %ymm0, %ymm1, %ymm2
|
||||
vfmsub132pd (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmsub213pd %xmm0, %xmm1, %xmm2
|
||||
vfmsub213pd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmsub213pd %ymm0, %ymm1, %ymm2
|
||||
vfmsub213pd (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmsub231pd %xmm0, %xmm1, %xmm2
|
||||
vfmsub231pd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmsub231pd %ymm0, %ymm1, %ymm2
|
||||
vfmsub231pd (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmsub132ps %xmm0, %xmm1, %xmm2
|
||||
vfmsub132ps (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmsub132ps %ymm0, %ymm1, %ymm2
|
||||
vfmsub132ps (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmsub213ps %xmm0, %xmm1, %xmm2
|
||||
vfmsub213ps (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmsub213ps %ymm0, %ymm1, %ymm2
|
||||
vfmsub213ps (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmsub231ps %xmm0, %xmm1, %xmm2
|
||||
vfmsub231ps (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmsub231ps %ymm0, %ymm1, %ymm2
|
||||
vfmsub231ps (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmsub132sd %xmm0, %xmm1, %xmm2
|
||||
vfmsub132sd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmsub213sd %xmm0, %xmm1, %xmm2
|
||||
vfmsub213sd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmsub231sd %xmm0, %xmm1, %xmm2
|
||||
vfmsub231sd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmsub132ss %xmm0, %xmm1, %xmm2
|
||||
vfmsub132ss (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmsub213ss %xmm0, %xmm1, %xmm2
|
||||
vfmsub213ss (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmsub231ss %xmm0, %xmm1, %xmm2
|
||||
vfmsub231ss (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmsubadd132pd %xmm0, %xmm1, %xmm2
|
||||
vfmsubadd132pd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmsubadd132pd %ymm0, %ymm1, %ymm2
|
||||
vfmsubadd132pd (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmsubadd213pd %xmm0, %xmm1, %xmm2
|
||||
vfmsubadd213pd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmsubadd213pd %ymm0, %ymm1, %ymm2
|
||||
vfmsubadd213pd (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmsubadd231pd %xmm0, %xmm1, %xmm2
|
||||
vfmsubadd231pd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmsubadd231pd %ymm0, %ymm1, %ymm2
|
||||
vfmsubadd231pd (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmsubadd132ps %xmm0, %xmm1, %xmm2
|
||||
vfmsubadd132ps (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmsubadd132ps %ymm0, %ymm1, %ymm2
|
||||
vfmsubadd132ps (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmsubadd213ps %xmm0, %xmm1, %xmm2
|
||||
vfmsubadd213ps (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmsubadd213ps %ymm0, %ymm1, %ymm2
|
||||
vfmsubadd213ps (%rax), %ymm1, %ymm2
|
||||
|
||||
vfmsubadd231ps %xmm0, %xmm1, %xmm2
|
||||
vfmsubadd231ps (%rax), %xmm1, %xmm2
|
||||
|
||||
vfmsubadd231ps %ymm0, %ymm1, %ymm2
|
||||
vfmsubadd231ps (%rax), %ymm1, %ymm2
|
||||
|
||||
vfnmadd132pd %xmm0, %xmm1, %xmm2
|
||||
vfnmadd132pd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmadd132pd %ymm0, %ymm1, %ymm2
|
||||
vfnmadd132pd (%rax), %ymm1, %ymm2
|
||||
|
||||
vfnmadd213pd %xmm0, %xmm1, %xmm2
|
||||
vfnmadd213pd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmadd213pd %ymm0, %ymm1, %ymm2
|
||||
vfnmadd213pd (%rax), %ymm1, %ymm2
|
||||
|
||||
vfnmadd231pd %xmm0, %xmm1, %xmm2
|
||||
vfnmadd231pd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmadd231pd %ymm0, %ymm1, %ymm2
|
||||
vfnmadd231pd (%rax), %ymm1, %ymm2
|
||||
|
||||
vfnmadd132ps %xmm0, %xmm1, %xmm2
|
||||
vfnmadd132ps (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmadd132ps %ymm0, %ymm1, %ymm2
|
||||
vfnmadd132ps (%rax), %ymm1, %ymm2
|
||||
|
||||
vfnmadd213ps %xmm0, %xmm1, %xmm2
|
||||
vfnmadd213ps (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmadd213ps %ymm0, %ymm1, %ymm2
|
||||
vfnmadd213ps (%rax), %ymm1, %ymm2
|
||||
|
||||
vfnmadd231ps %xmm0, %xmm1, %xmm2
|
||||
vfnmadd231ps (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmadd231ps %ymm0, %ymm1, %ymm2
|
||||
vfnmadd231ps (%rax), %ymm1, %ymm2
|
||||
|
||||
vfnmadd132sd %xmm0, %xmm1, %xmm2
|
||||
vfnmadd132sd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmadd213sd %xmm0, %xmm1, %xmm2
|
||||
vfnmadd213sd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmadd231sd %xmm0, %xmm1, %xmm2
|
||||
vfnmadd231sd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmadd132ss %xmm0, %xmm1, %xmm2
|
||||
vfnmadd132ss (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmadd213ss %xmm0, %xmm1, %xmm2
|
||||
vfnmadd213ss (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmadd231ss %xmm0, %xmm1, %xmm2
|
||||
vfnmadd231ss (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmsub132pd %xmm0, %xmm1, %xmm2
|
||||
vfnmsub132pd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmsub132pd %ymm0, %ymm1, %ymm2
|
||||
vfnmsub132pd (%rax), %ymm1, %ymm2
|
||||
|
||||
vfnmsub213pd %xmm0, %xmm1, %xmm2
|
||||
vfnmsub213pd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmsub213pd %ymm0, %ymm1, %ymm2
|
||||
vfnmsub213pd (%rax), %ymm1, %ymm2
|
||||
|
||||
vfnmsub231pd %xmm0, %xmm1, %xmm2
|
||||
vfnmsub231pd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmsub231pd %ymm0, %ymm1, %ymm2
|
||||
vfnmsub231pd (%rax), %ymm1, %ymm2
|
||||
|
||||
vfnmsub132ps %xmm0, %xmm1, %xmm2
|
||||
vfnmsub132ps (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmsub132ps %ymm0, %ymm1, %ymm2
|
||||
vfnmsub132ps (%rax), %ymm1, %ymm2
|
||||
|
||||
vfnmsub213ps %xmm0, %xmm1, %xmm2
|
||||
vfnmsub213ps (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmsub213ps %ymm0, %ymm1, %ymm2
|
||||
vfnmsub213ps (%rax), %ymm1, %ymm2
|
||||
|
||||
vfnmsub231ps %xmm0, %xmm1, %xmm2
|
||||
vfnmsub231ps (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmsub231ps %ymm0, %ymm1, %ymm2
|
||||
vfnmsub231ps (%rax), %ymm1, %ymm2
|
||||
|
||||
vfnmsub132sd %xmm0, %xmm1, %xmm2
|
||||
vfnmsub132sd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmsub213sd %xmm0, %xmm1, %xmm2
|
||||
vfnmsub213sd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmsub231sd %xmm0, %xmm1, %xmm2
|
||||
vfnmsub231sd (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmsub132ss %xmm0, %xmm1, %xmm2
|
||||
vfnmsub132ss (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmsub213ss %xmm0, %xmm1, %xmm2
|
||||
vfnmsub213ss (%rax), %xmm1, %xmm2
|
||||
|
||||
vfnmsub231ss %xmm0, %xmm1, %xmm2
|
||||
vfnmsub231ss (%rax), %xmm1, %xmm2
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 4 1.00 vfmadd132pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmadd132pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmadd132pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmadd132pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmadd213pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmadd213pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmadd213pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmadd213pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmadd231pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmadd231pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmadd231pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmadd231pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmadd132ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmadd132ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmadd132ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmadd132ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmadd213ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmadd213ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmadd213ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmadd213ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmadd231ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmadd231ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmadd231ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmadd231ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmadd132sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmadd132sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmadd213sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmadd213sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmadd231sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmadd231sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmadd132ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmadd132ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmadd213ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmadd213ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmadd231ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmadd231ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmaddsub132pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmaddsub132pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmaddsub132pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmaddsub132pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmaddsub213pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmaddsub213pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmaddsub213pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmaddsub213pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmaddsub231pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmaddsub231pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmaddsub231pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmaddsub231pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmaddsub132ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmaddsub132ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmaddsub132ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmaddsub132ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmaddsub213ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmaddsub213ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmaddsub213ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmaddsub213ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmaddsub231ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmaddsub231ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmaddsub231ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmaddsub231ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsub132pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsub132pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsub132pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsub132pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsub213pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsub213pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsub213pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsub213pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsub231pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsub231pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsub231pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsub231pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsub132ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsub132ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsub132ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsub132ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsub213ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsub213ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsub213ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsub213ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsub231ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsub231ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsub231ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsub231ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsub132sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsub132sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsub213sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsub213sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsub231sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsub231sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsub132ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsub132ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsub213ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsub213ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsub231ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsub231ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsubadd132pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsubadd132pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsubadd132pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsubadd132pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsubadd213pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsubadd213pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsubadd213pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsubadd213pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsubadd231pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsubadd231pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsubadd231pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsubadd231pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsubadd132ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsubadd132ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsubadd132ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsubadd132ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsubadd213ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsubadd213ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsubadd213ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsubadd213ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsubadd231ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsubadd231ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfmsubadd231ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfmsubadd231ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmadd132pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmadd132pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmadd132pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmadd132pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmadd213pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmadd213pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmadd213pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmadd213pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmadd231pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmadd231pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmadd231pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmadd231pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmadd132ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmadd132ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmadd132ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmadd132ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmadd213ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmadd213ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmadd213ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmadd213ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmadd231ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmadd231ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmadd231ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmadd231ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmadd132sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmadd132sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmadd213sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmadd213sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmadd231sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmadd231sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmadd132ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmadd132ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmadd213ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmadd213ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmadd231ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmadd231ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmsub132pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmsub132pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmsub132pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmsub132pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmsub213pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmsub213pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmsub213pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmsub213pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmsub231pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmsub231pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmsub231pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmsub231pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmsub132ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmsub132ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmsub132ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmsub132ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmsub213ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmsub213ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmsub213ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmsub213ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmsub231ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmsub231ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmsub231ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmsub231ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmsub132sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmsub132sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmsub213sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmsub213sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmsub231sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmsub231sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmsub132ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmsub132ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmsub213ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmsub213ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 4 1.00 vfnmsub231ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: 1 11 1.00 * vfnmsub231ss (%rax), %xmm1, %xmm2
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: - - - - - - - - 192.00 192.00 - - 48.00 48.00 - 32.00 32.00 32.00 32.00 32.00 32.00 - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmadd132pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmadd132pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmadd132pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmadd132pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmadd213pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmadd213pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmadd213pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmadd213pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmadd231pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmadd231pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmadd231pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmadd231pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmadd132ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmadd132ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmadd132ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmadd132ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmadd213ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmadd213ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmadd213ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmadd213ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmadd231ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmadd231ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmadd231ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmadd231ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmadd132sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmadd132sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmadd213sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmadd213sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmadd231sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmadd231sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmadd132ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmadd132ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmadd213ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmadd213ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmadd231ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmadd231ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmaddsub132pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmaddsub132pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmaddsub132pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmaddsub132pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmaddsub213pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmaddsub213pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmaddsub213pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmaddsub213pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmaddsub231pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmaddsub231pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmaddsub231pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmaddsub231pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmaddsub132ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmaddsub132ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmaddsub132ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmaddsub132ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmaddsub213ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmaddsub213ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmaddsub213ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmaddsub213ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmaddsub231ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmaddsub231ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmaddsub231ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmaddsub231ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsub132pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsub132pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsub132pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsub132pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsub213pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsub213pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsub213pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsub213pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsub231pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsub231pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsub231pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsub231pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsub132ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsub132ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsub132ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsub132ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsub213ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsub213ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsub213ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsub213ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsub231ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsub231ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsub231ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsub231ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsub132sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsub132sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsub213sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsub213sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsub231sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsub231sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsub132ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsub132ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsub213ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsub213ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsub231ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsub231ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsubadd132pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsubadd132pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsubadd132pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsubadd132pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsubadd213pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsubadd213pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsubadd213pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsubadd213pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsubadd231pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsubadd231pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsubadd231pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsubadd231pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsubadd132ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsubadd132ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsubadd132ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsubadd132ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsubadd213ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsubadd213ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsubadd213ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsubadd213ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsubadd231ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsubadd231ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfmsubadd231ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfmsubadd231ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmadd132pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmadd132pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmadd132pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmadd132pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmadd213pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmadd213pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmadd213pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmadd213pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmadd231pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmadd231pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmadd231pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmadd231pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmadd132ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmadd132ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmadd132ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmadd132ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmadd213ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmadd213ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmadd213ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmadd213ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmadd231ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmadd231ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmadd231ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmadd231ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmadd132sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmadd132sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmadd213sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmadd213sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmadd231sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmadd231sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmadd132ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmadd132ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmadd213ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmadd213ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmadd231ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmadd231ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmsub132pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmsub132pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmsub132pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmsub132pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmsub213pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmsub213pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmsub213pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmsub213pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmsub231pd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmsub231pd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmsub231pd %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmsub231pd (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmsub132ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmsub132ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmsub132ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmsub132ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmsub213ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmsub213ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmsub213ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmsub213ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmsub231ps %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmsub231ps (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmsub231ps %ymm0, %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmsub231ps (%rax), %ymm1, %ymm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmsub132sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmsub132sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmsub213sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmsub213sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmsub231sd %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmsub231sd (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmsub132ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmsub132ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmsub213ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmsub213ss (%rax), %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - vfnmsub231ss %xmm0, %xmm1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - vfnmsub231ss (%rax), %xmm1, %xmm2
|
|
@ -0,0 +1,72 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
rdfsbase %eax
|
||||
rdfsbase %rax
|
||||
|
||||
rdgsbase %eax
|
||||
rdgsbase %rax
|
||||
|
||||
wrfsbase %edi
|
||||
wrfsbase %rdi
|
||||
|
||||
wrgsbase %edi
|
||||
wrgsbase %rdi
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 100 100 25.00 * * U rdfsbasel %eax
|
||||
# CHECK-NEXT: 100 100 25.00 * * U rdfsbaseq %rax
|
||||
# CHECK-NEXT: 100 100 25.00 * * U rdgsbasel %eax
|
||||
# CHECK-NEXT: 100 100 25.00 * * U rdgsbaseq %rax
|
||||
# CHECK-NEXT: 100 100 25.00 * * U wrfsbasel %edi
|
||||
# CHECK-NEXT: 100 100 25.00 * * U wrfsbaseq %rdi
|
||||
# CHECK-NEXT: 100 100 25.00 * * U wrgsbasel %edi
|
||||
# CHECK-NEXT: 100 100 25.00 * * U wrgsbaseq %rdi
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: - - - 200.00 200.00 200.00 200.00 - - - - - - - - - - - - - - - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - rdfsbasel %eax
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - rdfsbaseq %rax
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - rdgsbasel %eax
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - rdgsbaseq %rax
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - wrfsbasel %edi
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - wrfsbaseq %rdi
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - wrgsbasel %edi
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - wrgsbaseq %rdi
|
|
@ -0,0 +1,452 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
lea 0(), %cx
|
||||
lea 0(), %ecx
|
||||
lea 0(), %rcx
|
||||
lea (%eax), %cx
|
||||
lea (%eax), %ecx
|
||||
lea (%eax), %rcx
|
||||
lea (%rax), %cx
|
||||
lea (%rax), %ecx
|
||||
lea (%rax), %rcx
|
||||
lea (, %ebx), %cx
|
||||
lea (, %ebx), %ecx
|
||||
lea (, %ebx), %rcx
|
||||
lea (, %rbx), %cx
|
||||
lea (, %rbx), %ecx
|
||||
lea (, %rbx), %rcx
|
||||
lea (, %ebx, 1), %cx
|
||||
lea (, %ebx, 1), %ecx
|
||||
lea (, %ebx, 1), %rcx
|
||||
lea (, %rbx, 1), %cx
|
||||
lea (, %rbx, 1), %ecx
|
||||
lea (, %rbx, 1), %rcx
|
||||
lea (, %ebx, 2), %cx
|
||||
lea (, %ebx, 2), %ecx
|
||||
lea (, %ebx, 2), %rcx
|
||||
lea (, %rbx, 2), %cx
|
||||
lea (, %rbx, 2), %ecx
|
||||
lea (, %rbx, 2), %rcx
|
||||
lea (%eax, %ebx), %cx
|
||||
lea (%eax, %ebx), %ecx
|
||||
lea (%eax, %ebx), %rcx
|
||||
lea (%rax, %rbx), %cx
|
||||
lea (%rax, %rbx), %ecx
|
||||
lea (%rax, %rbx), %rcx
|
||||
lea (%eax, %ebx, 1), %cx
|
||||
lea (%eax, %ebx, 1), %ecx
|
||||
lea (%eax, %ebx, 1), %rcx
|
||||
lea (%rax, %rbx, 1), %cx
|
||||
lea (%rax, %rbx, 1), %ecx
|
||||
lea (%rax, %rbx, 1), %rcx
|
||||
lea (%eax, %ebx, 2), %cx
|
||||
lea (%eax, %ebx, 2), %ecx
|
||||
lea (%eax, %ebx, 2), %rcx
|
||||
lea (%rax, %rbx, 2), %cx
|
||||
lea (%rax, %rbx, 2), %ecx
|
||||
lea (%rax, %rbx, 2), %rcx
|
||||
|
||||
lea -16(), %cx
|
||||
lea -16(), %ecx
|
||||
lea -16(), %rcx
|
||||
lea -16(%eax), %cx
|
||||
lea -16(%eax), %ecx
|
||||
lea -16(%eax), %rcx
|
||||
lea -16(%rax), %cx
|
||||
lea -16(%rax), %ecx
|
||||
lea -16(%rax), %rcx
|
||||
lea -16(, %ebx), %cx
|
||||
lea -16(, %ebx), %ecx
|
||||
lea -16(, %ebx), %rcx
|
||||
lea -16(, %rbx), %cx
|
||||
lea -16(, %rbx), %ecx
|
||||
lea -16(, %rbx), %rcx
|
||||
lea -16(, %ebx, 1), %cx
|
||||
lea -16(, %ebx, 1), %ecx
|
||||
lea -16(, %ebx, 1), %rcx
|
||||
lea -16(, %rbx, 1), %cx
|
||||
lea -16(, %rbx, 1), %ecx
|
||||
lea -16(, %rbx, 1), %rcx
|
||||
lea -16(, %ebx, 2), %cx
|
||||
lea -16(, %ebx, 2), %ecx
|
||||
lea -16(, %ebx, 2), %rcx
|
||||
lea -16(, %rbx, 2), %cx
|
||||
lea -16(, %rbx, 2), %ecx
|
||||
lea -16(, %rbx, 2), %rcx
|
||||
lea -16(%eax, %ebx), %cx
|
||||
lea -16(%eax, %ebx), %ecx
|
||||
lea -16(%eax, %ebx), %rcx
|
||||
lea -16(%rax, %rbx), %cx
|
||||
lea -16(%rax, %rbx), %ecx
|
||||
lea -16(%rax, %rbx), %rcx
|
||||
lea -16(%eax, %ebx, 1), %cx
|
||||
lea -16(%eax, %ebx, 1), %ecx
|
||||
lea -16(%eax, %ebx, 1), %rcx
|
||||
lea -16(%rax, %rbx, 1), %cx
|
||||
lea -16(%rax, %rbx, 1), %ecx
|
||||
lea -16(%rax, %rbx, 1), %rcx
|
||||
lea -16(%eax, %ebx, 2), %cx
|
||||
lea -16(%eax, %ebx, 2), %ecx
|
||||
lea -16(%eax, %ebx, 2), %rcx
|
||||
lea -16(%rax, %rbx, 2), %cx
|
||||
lea -16(%rax, %rbx, 2), %ecx
|
||||
lea -16(%rax, %rbx, 2), %rcx
|
||||
|
||||
lea 1024(), %cx
|
||||
lea 1024(), %ecx
|
||||
lea 1024(), %rcx
|
||||
lea 1024(%eax), %cx
|
||||
lea 1024(%eax), %ecx
|
||||
lea 1024(%eax), %rcx
|
||||
lea 1024(%rax), %cx
|
||||
lea 1024(%rax), %ecx
|
||||
lea 1024(%rax), %rcx
|
||||
lea 1024(, %ebx), %cx
|
||||
lea 1024(, %ebx), %ecx
|
||||
lea 1024(, %ebx), %rcx
|
||||
lea 1024(, %rbx), %cx
|
||||
lea 1024(, %rbx), %ecx
|
||||
lea 1024(, %rbx), %rcx
|
||||
lea 1024(, %ebx, 1), %cx
|
||||
lea 1024(, %ebx, 1), %ecx
|
||||
lea 1024(, %ebx, 1), %rcx
|
||||
lea 1024(, %rbx, 1), %cx
|
||||
lea 1024(, %rbx, 1), %ecx
|
||||
lea 1024(, %rbx, 1), %rcx
|
||||
lea 1024(, %ebx, 2), %cx
|
||||
lea 1024(, %ebx, 2), %ecx
|
||||
lea 1024(, %ebx, 2), %rcx
|
||||
lea 1024(, %rbx, 2), %cx
|
||||
lea 1024(, %rbx, 2), %ecx
|
||||
lea 1024(, %rbx, 2), %rcx
|
||||
lea 1024(%eax, %ebx), %cx
|
||||
lea 1024(%eax, %ebx), %ecx
|
||||
lea 1024(%eax, %ebx), %rcx
|
||||
lea 1024(%rax, %rbx), %cx
|
||||
lea 1024(%rax, %rbx), %ecx
|
||||
lea 1024(%rax, %rbx), %rcx
|
||||
lea 1024(%eax, %ebx, 1), %cx
|
||||
lea 1024(%eax, %ebx, 1), %ecx
|
||||
lea 1024(%eax, %ebx, 1), %rcx
|
||||
lea 1024(%rax, %rbx, 1), %cx
|
||||
lea 1024(%rax, %rbx, 1), %ecx
|
||||
lea 1024(%rax, %rbx, 1), %rcx
|
||||
lea 1024(%eax, %ebx, 2), %cx
|
||||
lea 1024(%eax, %ebx, 2), %ecx
|
||||
lea 1024(%eax, %ebx, 2), %rcx
|
||||
lea 1024(%rax, %rbx, 2), %cx
|
||||
lea 1024(%rax, %rbx, 2), %ecx
|
||||
lea 1024(%rax, %rbx, 2), %rcx
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 2 2 1.00 leaw 0, %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal 0, %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq 0, %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw (%eax), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal (%eax), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq (%eax), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw (%rax), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal (%rax), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq (%rax), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw (,%ebx), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal (,%ebx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq (,%ebx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw (,%rbx), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal (,%rbx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq (,%rbx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw (,%ebx), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal (,%ebx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq (,%ebx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw (,%rbx), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal (,%rbx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq (,%rbx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw (,%ebx,2), %cx
|
||||
# CHECK-NEXT: 2 2 0.25 leal (,%ebx,2), %ecx
|
||||
# CHECK-NEXT: 2 2 0.25 leaq (,%ebx,2), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw (,%rbx,2), %cx
|
||||
# CHECK-NEXT: 2 2 0.25 leal (,%rbx,2), %ecx
|
||||
# CHECK-NEXT: 2 2 0.25 leaq (,%rbx,2), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw (%eax,%ebx), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal (%eax,%ebx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq (%eax,%ebx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw (%rax,%rbx), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal (%rax,%rbx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq (%rax,%rbx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw (%eax,%ebx), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal (%eax,%ebx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq (%eax,%ebx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw (%rax,%rbx), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal (%rax,%rbx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq (%rax,%rbx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw (%eax,%ebx,2), %cx
|
||||
# CHECK-NEXT: 2 2 0.25 leal (%eax,%ebx,2), %ecx
|
||||
# CHECK-NEXT: 2 2 0.25 leaq (%eax,%ebx,2), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw (%rax,%rbx,2), %cx
|
||||
# CHECK-NEXT: 2 2 0.25 leal (%rax,%rbx,2), %ecx
|
||||
# CHECK-NEXT: 2 2 0.25 leaq (%rax,%rbx,2), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw -16, %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal -16, %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq -16, %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw -16(%eax), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal -16(%eax), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq -16(%eax), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw -16(%rax), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal -16(%rax), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq -16(%rax), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw -16(,%ebx), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal -16(,%ebx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq -16(,%ebx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw -16(,%rbx), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal -16(,%rbx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq -16(,%rbx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw -16(,%ebx), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal -16(,%ebx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq -16(,%ebx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw -16(,%rbx), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal -16(,%rbx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq -16(,%rbx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw -16(,%ebx,2), %cx
|
||||
# CHECK-NEXT: 2 2 0.25 leal -16(,%ebx,2), %ecx
|
||||
# CHECK-NEXT: 2 2 0.25 leaq -16(,%ebx,2), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw -16(,%rbx,2), %cx
|
||||
# CHECK-NEXT: 2 2 0.25 leal -16(,%rbx,2), %ecx
|
||||
# CHECK-NEXT: 2 2 0.25 leaq -16(,%rbx,2), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw -16(%eax,%ebx), %cx
|
||||
# CHECK-NEXT: 2 2 0.25 leal -16(%eax,%ebx), %ecx
|
||||
# CHECK-NEXT: 2 2 0.25 leaq -16(%eax,%ebx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw -16(%rax,%rbx), %cx
|
||||
# CHECK-NEXT: 2 2 0.25 leal -16(%rax,%rbx), %ecx
|
||||
# CHECK-NEXT: 2 2 0.25 leaq -16(%rax,%rbx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw -16(%eax,%ebx), %cx
|
||||
# CHECK-NEXT: 2 2 0.25 leal -16(%eax,%ebx), %ecx
|
||||
# CHECK-NEXT: 2 2 0.25 leaq -16(%eax,%ebx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw -16(%rax,%rbx), %cx
|
||||
# CHECK-NEXT: 2 2 0.25 leal -16(%rax,%rbx), %ecx
|
||||
# CHECK-NEXT: 2 2 0.25 leaq -16(%rax,%rbx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw -16(%eax,%ebx,2), %cx
|
||||
# CHECK-NEXT: 2 2 0.25 leal -16(%eax,%ebx,2), %ecx
|
||||
# CHECK-NEXT: 2 2 0.25 leaq -16(%eax,%ebx,2), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw -16(%rax,%rbx,2), %cx
|
||||
# CHECK-NEXT: 2 2 0.25 leal -16(%rax,%rbx,2), %ecx
|
||||
# CHECK-NEXT: 2 2 0.25 leaq -16(%rax,%rbx,2), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw 1024, %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal 1024, %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq 1024, %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw 1024(%eax), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal 1024(%eax), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq 1024(%eax), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw 1024(%rax), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal 1024(%rax), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq 1024(%rax), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw 1024(,%ebx), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal 1024(,%ebx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq 1024(,%ebx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw 1024(,%rbx), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal 1024(,%rbx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq 1024(,%rbx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw 1024(,%ebx), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal 1024(,%ebx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq 1024(,%ebx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw 1024(,%rbx), %cx
|
||||
# CHECK-NEXT: 1 1 0.33 leal 1024(,%rbx), %ecx
|
||||
# CHECK-NEXT: 1 1 0.33 leaq 1024(,%rbx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw 1024(,%ebx,2), %cx
|
||||
# CHECK-NEXT: 2 2 0.25 leal 1024(,%ebx,2), %ecx
|
||||
# CHECK-NEXT: 2 2 0.25 leaq 1024(,%ebx,2), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw 1024(,%rbx,2), %cx
|
||||
# CHECK-NEXT: 2 2 0.25 leal 1024(,%rbx,2), %ecx
|
||||
# CHECK-NEXT: 2 2 0.25 leaq 1024(,%rbx,2), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw 1024(%eax,%ebx), %cx
|
||||
# CHECK-NEXT: 2 2 0.25 leal 1024(%eax,%ebx), %ecx
|
||||
# CHECK-NEXT: 2 2 0.25 leaq 1024(%eax,%ebx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw 1024(%rax,%rbx), %cx
|
||||
# CHECK-NEXT: 2 2 0.25 leal 1024(%rax,%rbx), %ecx
|
||||
# CHECK-NEXT: 2 2 0.25 leaq 1024(%rax,%rbx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw 1024(%eax,%ebx), %cx
|
||||
# CHECK-NEXT: 2 2 0.25 leal 1024(%eax,%ebx), %ecx
|
||||
# CHECK-NEXT: 2 2 0.25 leaq 1024(%eax,%ebx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw 1024(%rax,%rbx), %cx
|
||||
# CHECK-NEXT: 2 2 0.25 leal 1024(%rax,%rbx), %ecx
|
||||
# CHECK-NEXT: 2 2 0.25 leaq 1024(%rax,%rbx), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw 1024(%eax,%ebx,2), %cx
|
||||
# CHECK-NEXT: 2 2 0.25 leal 1024(%eax,%ebx,2), %ecx
|
||||
# CHECK-NEXT: 2 2 0.25 leaq 1024(%eax,%ebx,2), %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 leaw 1024(%rax,%rbx,2), %cx
|
||||
# CHECK-NEXT: 2 2 0.25 leal 1024(%rax,%rbx,2), %ecx
|
||||
# CHECK-NEXT: 2 2 0.25 leaq 1024(%rax,%rbx,2), %rcx
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: 16.67 16.67 16.67 55.00 55.00 55.00 55.00 - - - - - - - - - - - - - - - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw 0, %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal 0, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq 0, %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw (%eax), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal (%eax), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq (%eax), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw (%rax), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal (%rax), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq (%rax), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw (,%ebx), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal (,%ebx), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq (,%ebx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw (,%rbx), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal (,%rbx), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq (,%rbx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw (,%ebx), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal (,%ebx), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq (,%ebx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw (,%rbx), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal (,%rbx), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq (,%rbx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw (,%ebx,2), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leal (,%ebx,2), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leaq (,%ebx,2), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw (,%rbx,2), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leal (,%rbx,2), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leaq (,%rbx,2), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw (%eax,%ebx), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal (%eax,%ebx), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq (%eax,%ebx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw (%rax,%rbx), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal (%rax,%rbx), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq (%rax,%rbx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw (%eax,%ebx), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal (%eax,%ebx), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq (%eax,%ebx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw (%rax,%rbx), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal (%rax,%rbx), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq (%rax,%rbx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw (%eax,%ebx,2), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leal (%eax,%ebx,2), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leaq (%eax,%ebx,2), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw (%rax,%rbx,2), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leal (%rax,%rbx,2), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leaq (%rax,%rbx,2), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw -16, %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal -16, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq -16, %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw -16(%eax), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal -16(%eax), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq -16(%eax), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw -16(%rax), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal -16(%rax), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq -16(%rax), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw -16(,%ebx), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal -16(,%ebx), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq -16(,%ebx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw -16(,%rbx), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal -16(,%rbx), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq -16(,%rbx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw -16(,%ebx), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal -16(,%ebx), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq -16(,%ebx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw -16(,%rbx), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal -16(,%rbx), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq -16(,%rbx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw -16(,%ebx,2), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leal -16(,%ebx,2), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leaq -16(,%ebx,2), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw -16(,%rbx,2), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leal -16(,%rbx,2), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leaq -16(,%rbx,2), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw -16(%eax,%ebx), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leal -16(%eax,%ebx), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leaq -16(%eax,%ebx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw -16(%rax,%rbx), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leal -16(%rax,%rbx), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leaq -16(%rax,%rbx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw -16(%eax,%ebx), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leal -16(%eax,%ebx), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leaq -16(%eax,%ebx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw -16(%rax,%rbx), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leal -16(%rax,%rbx), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leaq -16(%rax,%rbx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw -16(%eax,%ebx,2), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leal -16(%eax,%ebx,2), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leaq -16(%eax,%ebx,2), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw -16(%rax,%rbx,2), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leal -16(%rax,%rbx,2), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leaq -16(%rax,%rbx,2), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw 1024, %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal 1024, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq 1024, %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw 1024(%eax), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal 1024(%eax), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq 1024(%eax), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw 1024(%rax), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal 1024(%rax), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq 1024(%rax), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw 1024(,%ebx), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal 1024(,%ebx), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq 1024(,%ebx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw 1024(,%rbx), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal 1024(,%rbx), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq 1024(,%rbx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw 1024(,%ebx), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal 1024(,%ebx), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq 1024(,%ebx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw 1024(,%rbx), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leal 1024(,%rbx), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - - - - - - - - - leaq 1024(,%rbx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw 1024(,%ebx,2), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leal 1024(,%ebx,2), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leaq 1024(,%ebx,2), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw 1024(,%rbx,2), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leal 1024(,%rbx,2), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leaq 1024(,%rbx,2), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw 1024(%eax,%ebx), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leal 1024(%eax,%ebx), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leaq 1024(%eax,%ebx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw 1024(%rax,%rbx), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leal 1024(%rax,%rbx), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leaq 1024(%rax,%rbx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw 1024(%eax,%ebx), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leal 1024(%eax,%ebx), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leaq 1024(%eax,%ebx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw 1024(%rax,%rbx), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leal 1024(%rax,%rbx), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leaq 1024(%rax,%rbx), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw 1024(%eax,%ebx,2), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leal 1024(%eax,%ebx,2), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leaq 1024(%eax,%ebx,2), %rcx
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - leaw 1024(%rax,%rbx,2), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leal 1024(%rax,%rbx,2), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leaq 1024(%rax,%rbx,2), %rcx
|
|
@ -0,0 +1,65 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
lzcntw %cx, %cx
|
||||
lzcntw (%rax), %cx
|
||||
|
||||
lzcntl %eax, %ecx
|
||||
lzcntl (%rax), %ecx
|
||||
|
||||
lzcntq %rax, %rcx
|
||||
lzcntq (%rax), %rcx
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 1 1.00 lzcntw %cx, %cx
|
||||
# CHECK-NEXT: 1 5 0.33 * lzcntw (%rax), %cx
|
||||
# CHECK-NEXT: 1 1 0.25 lzcntl %eax, %ecx
|
||||
# CHECK-NEXT: 1 5 0.33 * lzcntl (%rax), %ecx
|
||||
# CHECK-NEXT: 1 1 0.25 lzcntq %rax, %rcx
|
||||
# CHECK-NEXT: 1 5 0.33 * lzcntq (%rax), %rcx
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: 1.00 1.00 1.00 2.25 2.25 2.25 2.25 - - - - - - - - 1.00 1.00 1.00 1.00 1.00 1.00 - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - lzcntw %cx, %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - lzcntw (%rax), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - lzcntl %eax, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - lzcntl (%rax), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - lzcntq %rax, %rcx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - lzcntq (%rax), %rcx
|
|
@ -0,0 +1,408 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
emms
|
||||
|
||||
movd %eax, %mm2
|
||||
movd (%rax), %mm2
|
||||
|
||||
movd %mm0, %ecx
|
||||
movd %mm0, (%rax)
|
||||
|
||||
movq %rax, %mm2
|
||||
movq (%rax), %mm2
|
||||
|
||||
movq %mm0, %rcx
|
||||
movq %mm0, (%rax)
|
||||
|
||||
packsswb %mm0, %mm2
|
||||
packsswb (%rax), %mm2
|
||||
|
||||
packssdw %mm0, %mm2
|
||||
packssdw (%rax), %mm2
|
||||
|
||||
packuswb %mm0, %mm2
|
||||
packuswb (%rax), %mm2
|
||||
|
||||
paddb %mm0, %mm2
|
||||
paddb (%rax), %mm2
|
||||
|
||||
paddd %mm0, %mm2
|
||||
paddd (%rax), %mm2
|
||||
|
||||
paddsb %mm0, %mm2
|
||||
paddsb (%rax), %mm2
|
||||
|
||||
paddsw %mm0, %mm2
|
||||
paddsw (%rax), %mm2
|
||||
|
||||
paddusb %mm0, %mm2
|
||||
paddusb (%rax), %mm2
|
||||
|
||||
paddusw %mm0, %mm2
|
||||
paddusw (%rax), %mm2
|
||||
|
||||
paddw %mm0, %mm2
|
||||
paddw (%rax), %mm2
|
||||
|
||||
pand %mm0, %mm2
|
||||
pand (%rax), %mm2
|
||||
|
||||
pandn %mm0, %mm2
|
||||
pandn (%rax), %mm2
|
||||
|
||||
pcmpeqb %mm0, %mm2
|
||||
pcmpeqb (%rax), %mm2
|
||||
|
||||
pcmpeqd %mm0, %mm2
|
||||
pcmpeqd (%rax), %mm2
|
||||
|
||||
pcmpeqw %mm0, %mm2
|
||||
pcmpeqw (%rax), %mm2
|
||||
|
||||
pcmpgtb %mm0, %mm2
|
||||
pcmpgtb (%rax), %mm2
|
||||
|
||||
pcmpgtd %mm0, %mm2
|
||||
pcmpgtd (%rax), %mm2
|
||||
|
||||
pcmpgtw %mm0, %mm2
|
||||
pcmpgtw (%rax), %mm2
|
||||
|
||||
pmaddwd %mm0, %mm2
|
||||
pmaddwd (%rax), %mm2
|
||||
|
||||
pmulhw %mm0, %mm2
|
||||
pmulhw (%rax), %mm2
|
||||
|
||||
pmullw %mm0, %mm2
|
||||
pmullw (%rax), %mm2
|
||||
|
||||
por %mm0, %mm2
|
||||
por (%rax), %mm2
|
||||
|
||||
pslld $1, %mm2
|
||||
pslld %mm0, %mm2
|
||||
pslld (%rax), %mm2
|
||||
|
||||
psllq $1, %mm2
|
||||
psllq %mm0, %mm2
|
||||
psllq (%rax), %mm2
|
||||
|
||||
psllw $1, %mm2
|
||||
psllw %mm0, %mm2
|
||||
psllw (%rax), %mm2
|
||||
|
||||
psrad $1, %mm2
|
||||
psrad %mm0, %mm2
|
||||
psrad (%rax), %mm2
|
||||
|
||||
psraw $1, %mm2
|
||||
psraw %mm0, %mm2
|
||||
psraw (%rax), %mm2
|
||||
|
||||
psrld $1, %mm2
|
||||
psrld %mm0, %mm2
|
||||
psrld (%rax), %mm2
|
||||
|
||||
psrlq $1, %mm2
|
||||
psrlq %mm0, %mm2
|
||||
psrlq (%rax), %mm2
|
||||
|
||||
psrlw $1, %mm2
|
||||
psrlw %mm0, %mm2
|
||||
psrlw (%rax), %mm2
|
||||
|
||||
psubb %mm0, %mm2
|
||||
psubb (%rax), %mm2
|
||||
|
||||
psubd %mm0, %mm2
|
||||
psubd (%rax), %mm2
|
||||
|
||||
psubsb %mm0, %mm2
|
||||
psubsb (%rax), %mm2
|
||||
|
||||
psubsw %mm0, %mm2
|
||||
psubsw (%rax), %mm2
|
||||
|
||||
psubusb %mm0, %mm2
|
||||
psubusb (%rax), %mm2
|
||||
|
||||
psubusw %mm0, %mm2
|
||||
psubusw (%rax), %mm2
|
||||
|
||||
psubw %mm0, %mm2
|
||||
psubw (%rax), %mm2
|
||||
|
||||
punpckhbw %mm0, %mm2
|
||||
punpckhbw (%rax), %mm2
|
||||
|
||||
punpckhdq %mm0, %mm2
|
||||
punpckhdq (%rax), %mm2
|
||||
|
||||
punpckhwd %mm0, %mm2
|
||||
punpckhwd (%rax), %mm2
|
||||
|
||||
punpcklbw %mm0, %mm2
|
||||
punpcklbw (%rax), %mm2
|
||||
|
||||
punpckldq %mm0, %mm2
|
||||
punpckldq (%rax), %mm2
|
||||
|
||||
punpcklwd %mm0, %mm2
|
||||
punpcklwd (%rax), %mm2
|
||||
|
||||
pxor %mm0, %mm2
|
||||
pxor (%rax), %mm2
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 2 0.25 * * U emms
|
||||
# CHECK-NEXT: 2 1 1.00 movd %eax, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * movd (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 1.00 movd %mm0, %ecx
|
||||
# CHECK-NEXT: 1 1 1.00 * U movd %mm0, (%rax)
|
||||
# CHECK-NEXT: 2 1 1.00 movq %rax, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * movq (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 1.00 movq %mm0, %rcx
|
||||
# CHECK-NEXT: 1 1 1.00 * movq %mm0, (%rax)
|
||||
# CHECK-NEXT: 1 1 0.50 packsswb %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * packsswb (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 packssdw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * packssdw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 packuswb %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * packuswb (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 paddb %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * paddb (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 paddd %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * paddd (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 paddsb %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * paddsb (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 paddsw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * paddsw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 paddusb %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * paddusb (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 paddusw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * paddusw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 paddw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * paddw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 pand %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pand (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 pandn %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pandn (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 pcmpeqb %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pcmpeqb (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 pcmpeqd %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pcmpeqd (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 pcmpeqw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pcmpeqw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 pcmpgtb %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pcmpgtb (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 pcmpgtd %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pcmpgtd (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 pcmpgtw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pcmpgtw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 3 0.50 pmaddwd %mm0, %mm2
|
||||
# CHECK-NEXT: 1 10 0.50 * pmaddwd (%rax), %mm2
|
||||
# CHECK-NEXT: 1 3 0.50 pmulhw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 10 0.50 * pmulhw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 3 0.50 pmullw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 10 0.50 * pmullw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 por %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * por (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 pslld $1, %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 pslld %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pslld (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psllq $1, %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psllq %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psllq (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psllw $1, %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psllw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psllw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psrad $1, %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psrad %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psrad (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psraw $1, %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psraw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psraw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psrld $1, %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psrld %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psrld (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psrlq $1, %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psrlq %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psrlq (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psrlw $1, %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psrlw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psrlw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 psubb %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psubb (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 psubd %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psubd (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psubsb %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psubsb (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psubsw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psubsw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psubusb %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psubusb (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psubusw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psubusw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 psubw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psubw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 punpckhbw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * punpckhbw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 punpckhdq %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * punpckhdq (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 punpckhwd %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * punpckhwd (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 punpcklbw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * punpcklbw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 punpckldq %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * punpckldq (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 punpcklwd %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * punpcklwd (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 pxor %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pxor (%rax), %mm2
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - 19.00 37.00 33.00 15.00 27.00 27.00 2.00 16.00 16.00 16.00 15.33 15.33 15.33 1.00 1.00
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - emms
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 1.00 1.00 0.50 0.50 - - - - - - - - - movd %eax, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - movd (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.00 1.00 - - - - - - - - - movd %mm0, %ecx
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movd %mm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 1.00 1.00 0.50 0.50 - - - - - - - - - movq %rax, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - movq (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.00 1.00 - - - - - - - - - movq %mm0, %rcx
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movq %mm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - packsswb %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - packsswb (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - packssdw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - packssdw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - packuswb %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - packuswb (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - paddb %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - paddb (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - paddd %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - paddd (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - paddsb %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - paddsb (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - paddsw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - paddsw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - paddusb %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - paddusb (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - paddusw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - paddusw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - paddw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - paddw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pand %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pand (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pandn %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pandn (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pcmpeqb %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pcmpeqb (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pcmpeqd %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pcmpeqd (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pcmpeqw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pcmpeqw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pcmpgtb %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pcmpgtb (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pcmpgtd %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pcmpgtd (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pcmpgtw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pcmpgtw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmaddwd %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmaddwd (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmulhw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmulhw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmullw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmullw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - por %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - por (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pslld $1, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pslld %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pslld (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psllq $1, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psllq %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psllq (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psllw $1, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psllw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psllw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psrad $1, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psrad %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psrad (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psraw $1, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psraw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psraw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psrld $1, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psrld %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psrld (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psrlq $1, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psrlq %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psrlq (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psrlw $1, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psrlw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psrlw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - psubb %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psubb (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - psubd %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psubd (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - psubsb %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psubsb (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - psubsw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psubsw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - psubusb %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psubusb (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - psubusw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psubusw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - psubw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psubw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - punpckhbw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - punpckhbw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - punpckhdq %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - punpckhdq (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - punpckhwd %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - punpckhwd (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - punpcklbw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - punpcklbw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - punpckldq %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - punpckldq (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - punpcklwd %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - punpcklwd (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pxor %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pxor (%rax), %mm2
|
|
@ -0,0 +1,65 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
movbe %cx, (%rax)
|
||||
movbe (%rax), %cx
|
||||
|
||||
movbe %ecx, (%rax)
|
||||
movbe (%rax), %ecx
|
||||
|
||||
movbe %rcx, (%rax)
|
||||
movbe (%rax), %rcx
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 2 1 1.00 * movbew %cx, (%rax)
|
||||
# CHECK-NEXT: 1 4 1.00 * movbew (%rax), %cx
|
||||
# CHECK-NEXT: 2 1 1.00 * movbel %ecx, (%rax)
|
||||
# CHECK-NEXT: 1 5 0.33 * movbel (%rax), %ecx
|
||||
# CHECK-NEXT: 2 1 1.00 * movbeq %rcx, (%rax)
|
||||
# CHECK-NEXT: 1 5 0.33 * movbeq (%rax), %rcx
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: 2.00 2.00 2.00 4.50 4.50 4.50 4.50 - - - - - - - - 2.00 2.00 2.00 1.00 1.00 1.00 1.50 1.50
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 1.00 1.00 1.00 1.00 - - - - - - - - 0.33 0.33 0.33 - - - 0.50 0.50 movbew %cx, (%rax)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 1.00 1.00 1.00 1.00 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - movbew (%rax), %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 1.00 1.00 1.00 1.00 - - - - - - - - 0.33 0.33 0.33 - - - 0.50 0.50 movbel %ecx, (%rax)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - movbel (%rax), %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 1.00 1.00 1.00 1.00 - - - - - - - - 0.33 0.33 0.33 - - - 0.50 0.50 movbeq %rcx, (%rax)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - movbeq (%rax), %rcx
|
|
@ -0,0 +1,51 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
monitorx
|
||||
mwaitx
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 100 100 25.00 U monitorx
|
||||
# CHECK-NEXT: 100 100 25.00 U mwaitx
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: - - - 50.00 50.00 50.00 50.00 - - - - - - - - - - - - - - - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - monitorx
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - mwaitx
|
|
@ -0,0 +1,51 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
pclmulqdq $11, %xmm0, %xmm2
|
||||
pclmulqdq $11, (%rax), %xmm2
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 4 4 2.00 pclmulqdq $11, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 4 11 2.00 * pclmulqdq $11, (%rax), %xmm2
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: - - - - - - - - 4.00 4.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - - - - - - - - - - - - pclmulqdq $11, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 2.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pclmulqdq $11, (%rax), %xmm2
|
|
@ -0,0 +1,65 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
popcntw %cx, %cx
|
||||
popcntw (%rax), %cx
|
||||
|
||||
popcntl %eax, %ecx
|
||||
popcntl (%rax), %ecx
|
||||
|
||||
popcntq %rax, %rcx
|
||||
popcntq (%rax), %rcx
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 1 1.00 popcntw %cx, %cx
|
||||
# CHECK-NEXT: 1 5 0.33 * popcntw (%rax), %cx
|
||||
# CHECK-NEXT: 1 1 0.25 popcntl %eax, %ecx
|
||||
# CHECK-NEXT: 1 5 0.33 * popcntl (%rax), %ecx
|
||||
# CHECK-NEXT: 1 1 0.25 popcntq %rax, %rcx
|
||||
# CHECK-NEXT: 1 5 0.33 * popcntq (%rax), %rcx
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: 1.00 1.00 1.00 2.25 2.25 2.25 2.25 - - - - - - - - 1.00 1.00 1.00 1.00 1.00 1.00 - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - popcntw %cx, %cx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - popcntw (%rax), %cx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - popcntl %eax, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - popcntl (%rax), %ecx
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - popcntq %rax, %rcx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 0.25 0.25 0.25 0.25 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - popcntq (%rax), %rcx
|
|
@ -0,0 +1,51 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
prefetch (%rax)
|
||||
prefetchw (%rax)
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 5 0.33 * * prefetch (%rax)
|
||||
# CHECK-NEXT: 1 5 0.33 * * prefetchw (%rax)
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: 0.67 0.67 0.67 - - - - - - - - - - - - 0.67 0.67 0.67 0.67 0.67 0.67 - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - prefetch (%rax)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - prefetchw (%rax)
|
|
@ -0,0 +1,54 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
rdrand %ax
|
||||
rdrand %eax
|
||||
rdrand %rax
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 100 100 25.00 U rdrandw %ax
|
||||
# CHECK-NEXT: 100 100 25.00 U rdrandl %eax
|
||||
# CHECK-NEXT: 100 100 25.00 U rdrandq %rax
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: - - - 75.00 75.00 75.00 75.00 - - - - - - - - - - - - - - - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - rdrandw %ax
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - rdrandl %eax
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - rdrandq %rax
|
|
@ -0,0 +1,54 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
rdseed %ax
|
||||
rdseed %eax
|
||||
rdseed %rax
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 100 100 25.00 U rdseedw %ax
|
||||
# CHECK-NEXT: 100 100 25.00 U rdseedl %eax
|
||||
# CHECK-NEXT: 100 100 25.00 U rdseedq %rax
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: - - - 75.00 75.00 75.00 75.00 - - - - - - - - - - - - - - - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - rdseedw %ax
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - rdseedl %eax
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - rdseedq %rax
|
|
@ -0,0 +1,93 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
sha1msg1 %xmm0, %xmm2
|
||||
sha1msg1 (%rax), %xmm2
|
||||
|
||||
sha1msg2 %xmm0, %xmm2
|
||||
sha1msg2 (%rax), %xmm2
|
||||
|
||||
sha1nexte %xmm0, %xmm2
|
||||
sha1nexte (%rax), %xmm2
|
||||
|
||||
sha1rnds4 $3, %xmm0, %xmm2
|
||||
sha1rnds4 $3, (%rax), %xmm2
|
||||
|
||||
sha256msg1 %xmm0, %xmm2
|
||||
sha256msg1 (%rax), %xmm2
|
||||
|
||||
sha256msg2 %xmm0, %xmm2
|
||||
sha256msg2 (%rax), %xmm2
|
||||
|
||||
sha256rnds2 %xmm0, %xmm2
|
||||
sha256rnds2 (%rax), %xmm2
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 2 2 0.50 sha1msg1 %xmm0, %xmm2
|
||||
# CHECK-NEXT: 2 6 0.50 * sha1msg1 (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 sha1msg2 %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 5 0.50 * sha1msg2 (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 sha1nexte %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 5 0.50 * sha1nexte (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 6 2.00 sha1rnds4 $3, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * sha1rnds4 $3, (%rax), %xmm2
|
||||
# CHECK-NEXT: 2 2 0.75 sha256msg1 %xmm0, %xmm2
|
||||
# CHECK-NEXT: 2 6 0.75 * sha256msg1 (%rax), %xmm2
|
||||
# CHECK-NEXT: 4 3 2.00 sha256msg2 %xmm0, %xmm2
|
||||
# CHECK-NEXT: 5 7 2.00 * sha256msg2 (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 4 2.00 sha256rnds2 %xmm0, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * sha256rnds2 %xmm0, (%rax), %xmm2
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: 1.67 1.67 1.67 - - - - - 13.50 12.50 12.50 13.50 1.00 1.00 - 2.33 2.33 2.33 2.33 2.33 2.33 - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - sha1msg1 %xmm0, %xmm2
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - 0.50 0.50 0.50 0.50 - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - sha1msg1 (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - sha1msg2 %xmm0, %xmm2
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - 0.50 0.50 0.50 0.50 - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - sha1msg2 (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - sha1nexte %xmm0, %xmm2
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - 0.50 0.50 0.50 0.50 - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - sha1nexte (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 2.00 2.00 2.00 - - - - - - - - - - - sha1rnds4 $3, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - sha1rnds4 $3, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.75 0.75 0.75 0.75 - - - - - - - - - - - sha256msg1 %xmm0, %xmm2
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - 0.75 0.75 0.75 0.75 - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - sha256msg1 (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 2.00 2.00 2.00 - - - - - - - - - - - sha256msg2 %xmm0, %xmm2
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - 2.00 2.00 2.00 2.00 - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - sha256msg2 (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 2.00 2.00 2.00 - - - - - - - - - - - sha256rnds2 %xmm0, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - sha256rnds2 %xmm0, (%rax), %xmm2
|
|
@ -0,0 +1,476 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
addps %xmm0, %xmm2
|
||||
addps (%rax), %xmm2
|
||||
|
||||
addss %xmm0, %xmm2
|
||||
addss (%rax), %xmm2
|
||||
|
||||
andnps %xmm0, %xmm2
|
||||
andnps (%rax), %xmm2
|
||||
|
||||
andps %xmm0, %xmm2
|
||||
andps (%rax), %xmm2
|
||||
|
||||
cmpps $0, %xmm0, %xmm2
|
||||
cmpps $0, (%rax), %xmm2
|
||||
|
||||
cmpss $0, %xmm0, %xmm2
|
||||
cmpss $0, (%rax), %xmm2
|
||||
|
||||
comiss %xmm0, %xmm1
|
||||
comiss (%rax), %xmm1
|
||||
|
||||
cvtpi2ps %mm0, %xmm2
|
||||
cvtpi2ps (%rax), %xmm2
|
||||
|
||||
cvtps2pi %xmm0, %mm2
|
||||
cvtps2pi (%rax), %mm2
|
||||
|
||||
cvtsi2ss %ecx, %xmm2
|
||||
cvtsi2ss %rcx, %xmm2
|
||||
cvtsi2ss (%rax), %xmm2
|
||||
cvtsi2ss (%rax), %xmm2
|
||||
|
||||
cvtss2si %xmm0, %ecx
|
||||
cvtss2si %xmm0, %rcx
|
||||
cvtss2si (%rax), %ecx
|
||||
cvtss2si (%rax), %rcx
|
||||
|
||||
cvttps2pi %xmm0, %mm2
|
||||
cvttps2pi (%rax), %mm2
|
||||
|
||||
cvttss2si %xmm0, %ecx
|
||||
cvttss2si %xmm0, %rcx
|
||||
cvttss2si (%rax), %ecx
|
||||
cvttss2si (%rax), %rcx
|
||||
|
||||
divps %xmm0, %xmm2
|
||||
divps (%rax), %xmm2
|
||||
|
||||
divss %xmm0, %xmm2
|
||||
divss (%rax), %xmm2
|
||||
|
||||
ldmxcsr (%rax)
|
||||
|
||||
maskmovq %mm0, %mm1
|
||||
|
||||
maxps %xmm0, %xmm2
|
||||
maxps (%rax), %xmm2
|
||||
|
||||
maxss %xmm0, %xmm2
|
||||
maxss (%rax), %xmm2
|
||||
|
||||
minps %xmm0, %xmm2
|
||||
minps (%rax), %xmm2
|
||||
|
||||
minss %xmm0, %xmm2
|
||||
minss (%rax), %xmm2
|
||||
|
||||
movaps %xmm0, %xmm2
|
||||
movaps %xmm0, (%rax)
|
||||
movaps (%rax), %xmm2
|
||||
|
||||
movhlps %xmm0, %xmm2
|
||||
movlhps %xmm0, %xmm2
|
||||
|
||||
movhps %xmm0, (%rax)
|
||||
movhps (%rax), %xmm2
|
||||
|
||||
movlps %xmm0, (%rax)
|
||||
movlps (%rax), %xmm2
|
||||
|
||||
movmskps %xmm0, %rcx
|
||||
|
||||
movntps %xmm0, (%rax)
|
||||
movntq %mm0, (%rax)
|
||||
|
||||
movss %xmm0, %xmm2
|
||||
movss %xmm0, (%rax)
|
||||
movss (%rax), %xmm2
|
||||
|
||||
movups %xmm0, %xmm2
|
||||
movups %xmm0, (%rax)
|
||||
movups (%rax), %xmm2
|
||||
|
||||
mulps %xmm0, %xmm2
|
||||
mulps (%rax), %xmm2
|
||||
|
||||
mulss %xmm0, %xmm2
|
||||
mulss (%rax), %xmm2
|
||||
|
||||
orps %xmm0, %xmm2
|
||||
orps (%rax), %xmm2
|
||||
|
||||
pavgb %mm0, %mm2
|
||||
pavgb (%rax), %mm2
|
||||
|
||||
pavgw %mm0, %mm2
|
||||
pavgw (%rax), %mm2
|
||||
|
||||
pextrw $1, %mm0, %rcx
|
||||
|
||||
pinsrw $1, %rax, %mm2
|
||||
pinsrw $1, (%rax), %mm2
|
||||
|
||||
pmaxsw %mm0, %mm2
|
||||
pmaxsw (%rax), %mm2
|
||||
|
||||
pmaxub %mm0, %mm2
|
||||
pmaxub (%rax), %mm2
|
||||
|
||||
pminsw %mm0, %mm2
|
||||
pminsw (%rax), %mm2
|
||||
|
||||
pminub %mm0, %mm2
|
||||
pminub (%rax), %mm2
|
||||
|
||||
pmovmskb %mm0, %rcx
|
||||
|
||||
pmulhuw %mm0, %mm2
|
||||
pmulhuw (%rax), %mm2
|
||||
|
||||
prefetcht0 (%rax)
|
||||
prefetcht1 (%rax)
|
||||
prefetcht2 (%rax)
|
||||
prefetchnta (%rax)
|
||||
|
||||
psadbw %mm0, %mm2
|
||||
psadbw (%rax), %mm2
|
||||
|
||||
pshufw $1, %mm0, %mm2
|
||||
pshufw $1, (%rax), %mm2
|
||||
|
||||
rcpps %xmm0, %xmm2
|
||||
rcpps (%rax), %xmm2
|
||||
|
||||
rcpss %xmm0, %xmm2
|
||||
rcpss (%rax), %xmm2
|
||||
|
||||
rsqrtps %xmm0, %xmm2
|
||||
rsqrtps (%rax), %xmm2
|
||||
|
||||
rsqrtss %xmm0, %xmm2
|
||||
rsqrtss (%rax), %xmm2
|
||||
|
||||
sfence
|
||||
|
||||
shufps $1, %xmm0, %xmm2
|
||||
shufps $1, (%rax), %xmm2
|
||||
|
||||
sqrtps %xmm0, %xmm2
|
||||
sqrtps (%rax), %xmm2
|
||||
|
||||
sqrtss %xmm0, %xmm2
|
||||
sqrtss (%rax), %xmm2
|
||||
|
||||
stmxcsr (%rax)
|
||||
|
||||
subps %xmm0, %xmm2
|
||||
subps (%rax), %xmm2
|
||||
|
||||
subss %xmm0, %xmm2
|
||||
subss (%rax), %xmm2
|
||||
|
||||
ucomiss %xmm0, %xmm1
|
||||
ucomiss (%rax), %xmm1
|
||||
|
||||
unpckhps %xmm0, %xmm2
|
||||
unpckhps (%rax), %xmm2
|
||||
|
||||
unpcklps %xmm0, %xmm2
|
||||
unpcklps (%rax), %xmm2
|
||||
|
||||
xorps %xmm0, %xmm2
|
||||
xorps (%rax), %xmm2
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 3 0.50 addps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * addps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 addss %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * addss (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 andnps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * andnps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 andps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * andps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 cmpeqps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * cmpeqps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 cmpeqss %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * cmpeqss (%rax), %xmm2
|
||||
# CHECK-NEXT: 2 4 1.00 comiss %xmm0, %xmm1
|
||||
# CHECK-NEXT: 2 11 1.00 * comiss (%rax), %xmm1
|
||||
# CHECK-NEXT: 2 3 0.50 cvtpi2ps %mm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * cvtpi2ps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 cvtps2pi %xmm0, %mm2
|
||||
# CHECK-NEXT: 1 10 0.50 * cvtps2pi (%rax), %mm2
|
||||
# CHECK-NEXT: 2 4 1.00 cvtsi2ss %ecx, %xmm2
|
||||
# CHECK-NEXT: 2 4 1.00 cvtsi2ss %rcx, %xmm2
|
||||
# CHECK-NEXT: 1 10 1.00 * cvtsi2ssl (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 10 1.00 * cvtsi2ssl (%rax), %xmm2
|
||||
# CHECK-NEXT: 2 2 1.00 cvtss2si %xmm0, %ecx
|
||||
# CHECK-NEXT: 2 2 1.00 cvtss2si %xmm0, %rcx
|
||||
# CHECK-NEXT: 2 9 1.00 * cvtss2si (%rax), %ecx
|
||||
# CHECK-NEXT: 2 9 1.00 * cvtss2si (%rax), %rcx
|
||||
# CHECK-NEXT: 1 3 0.50 cvttps2pi %xmm0, %mm2
|
||||
# CHECK-NEXT: 1 10 0.50 * cvttps2pi (%rax), %mm2
|
||||
# CHECK-NEXT: 2 2 1.00 cvttss2si %xmm0, %ecx
|
||||
# CHECK-NEXT: 2 2 1.00 cvttss2si %xmm0, %rcx
|
||||
# CHECK-NEXT: 2 9 1.00 * cvttss2si (%rax), %ecx
|
||||
# CHECK-NEXT: 2 9 1.00 * cvttss2si (%rax), %rcx
|
||||
# CHECK-NEXT: 1 11 3.00 divps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 18 3.00 * divps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 11 3.00 divss %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 18 3.00 * divss (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 5 1.50 * * U ldmxcsr (%rax)
|
||||
# CHECK-NEXT: 1 1 0.50 * * U maskmovq %mm0, %mm1
|
||||
# CHECK-NEXT: 1 1 0.50 maxps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * maxps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 maxss %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * maxss (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 minps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * minps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 minss %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * minss (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 0 0.25 movaps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 1 1.00 * movaps %xmm0, (%rax)
|
||||
# CHECK-NEXT: 1 8 0.50 * movaps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 movhlps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 movlhps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 2 2 1.00 * movhps %xmm0, (%rax)
|
||||
# CHECK-NEXT: 1 8 0.50 * movhps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 1.00 * movlps %xmm0, (%rax)
|
||||
# CHECK-NEXT: 1 8 0.50 * movlps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 1.00 movmskps %xmm0, %ecx
|
||||
# CHECK-NEXT: 1 1 1.00 * movntps %xmm0, (%rax)
|
||||
# CHECK-NEXT: 1 1 1.00 * * U movntq %mm0, (%rax)
|
||||
# CHECK-NEXT: 1 1 0.50 movss %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 1 1.00 * movss %xmm0, (%rax)
|
||||
# CHECK-NEXT: 1 8 0.50 * movss (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 0 0.25 movups %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 1 1.00 * movups %xmm0, (%rax)
|
||||
# CHECK-NEXT: 1 8 0.50 * movups (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 mulps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * mulps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 mulss %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * mulss (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 orps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * orps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pavgb %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pavgb (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 pavgw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pavgw (%rax), %mm2
|
||||
# CHECK-NEXT: 2 1 1.00 pextrw $1, %mm0, %ecx
|
||||
# CHECK-NEXT: 2 2 1.00 pinsrw $1, %eax, %mm2
|
||||
# CHECK-NEXT: 1 8 1.50 * pinsrw $1, (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 pmaxsw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pmaxsw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 pmaxub %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pmaxub (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 pminsw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pminsw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 pminub %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pminub (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 1.00 pmovmskb %mm0, %ecx
|
||||
# CHECK-NEXT: 1 3 0.50 pmulhuw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 10 0.50 * pmulhuw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 5 0.33 * * prefetcht0 (%rax)
|
||||
# CHECK-NEXT: 1 5 0.33 * * prefetcht1 (%rax)
|
||||
# CHECK-NEXT: 1 5 0.33 * * prefetcht2 (%rax)
|
||||
# CHECK-NEXT: 1 5 0.33 * * prefetchnta (%rax)
|
||||
# CHECK-NEXT: 1 3 0.50 psadbw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 10 0.50 * psadbw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 pshufw $1, %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pshufw $1, (%rax), %mm2
|
||||
# CHECK-NEXT: 1 3 0.50 rcpps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * rcpps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 rcpss %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * rcpss (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 1.00 rsqrtps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 1.00 * rsqrtps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 1.00 rsqrtss %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 1.00 * rsqrtss (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.33 * * U sfence
|
||||
# CHECK-NEXT: 1 1 0.50 shufps $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * shufps $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 15 5.00 sqrtps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 22 5.00 * sqrtps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 15 5.00 sqrtss %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 22 5.00 * sqrtss (%rax), %xmm2
|
||||
# CHECK-NEXT: 2 2 15.00 * U stmxcsr (%rax)
|
||||
# CHECK-NEXT: 1 3 0.50 subps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * subps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 subss %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * subss (%rax), %xmm2
|
||||
# CHECK-NEXT: 2 4 1.00 ucomiss %xmm0, %xmm1
|
||||
# CHECK-NEXT: 2 11 1.00 * ucomiss (%rax), %xmm1
|
||||
# CHECK-NEXT: 1 1 0.50 unpckhps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * unpckhps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 unpcklps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * unpcklps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 xorps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * xorps (%rax), %xmm2
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: 2.00 2.00 2.00 16.50 16.50 16.50 16.50 - 22.00 64.00 34.00 26.00 33.00 33.00 7.00 22.33 22.33 22.33 19.33 19.33 19.33 4.00 4.00
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - addps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - addps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - addss %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - addss (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - andnps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - andnps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - andps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - andps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - cmpeqps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmpeqps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - cmpeqss %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmpeqss (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - comiss %xmm0, %xmm1
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - comiss (%rax), %xmm1
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - cvtpi2ps %mm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvtpi2ps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - cvtps2pi %xmm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvtps2pi (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 - - - - - - - - - - - cvtsi2ss %ecx, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 - - - - - - - - - - - cvtsi2ss %rcx, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvtsi2ssl (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvtsi2ssl (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 - - - - - - - - - - - cvtss2si %xmm0, %ecx
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 - - - - - - - - - - - cvtss2si %xmm0, %rcx
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvtss2si (%rax), %ecx
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvtss2si (%rax), %rcx
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - cvttps2pi %xmm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvttps2pi (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 - - - - - - - - - - - cvttss2si %xmm0, %ecx
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 - - - - - - - - - - - cvttss2si %xmm0, %rcx
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvttss2si (%rax), %ecx
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvttss2si (%rax), %rcx
|
||||
# CHECK-NEXT: - - - - - - - - - 3.00 - - - - - - - - - - - - - divps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 3.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - divps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 3.00 - - - - - - - - - - - - - divss %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 3.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - divss (%rax), %xmm2
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 1.50 1.50 1.50 1.50 - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - ldmxcsr (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - maskmovq %mm0, %mm1
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - maxps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - maxps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - maxss %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - maxss (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - minps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - minps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - minss %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - minss (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - movaps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movaps %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - movaps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - movhlps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - movlhps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movhps %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - movhps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movlps %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - movlps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 - - - - - - - - - - - - movmskps %xmm0, %ecx
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movntps %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movntq %mm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - movss %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movss %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - movss (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - movups %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movups %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - movups (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - mulps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - mulps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - mulss %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - mulss (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - orps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - orps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - pavgb %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pavgb (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - pavgw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pavgw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.00 1.00 - - - - - - - - - pextrw $1, %mm0, %ecx
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.00 1.00 - - - - - - - - - pinsrw $1, %eax, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.50 1.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pinsrw $1, (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pmaxsw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmaxsw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pmaxub %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmaxub (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pminsw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pminsw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pminub %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pminub (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 - - - - - - - - - - - - pmovmskb %mm0, %ecx
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmulhuw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmulhuw (%rax), %mm2
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - prefetcht0 (%rax)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - prefetcht1 (%rax)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - prefetcht2 (%rax)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - prefetchnta (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - psadbw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psadbw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pshufw $1, %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pshufw $1, (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - rcpps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - rcpps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - rcpss %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - rcpss (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 1.00 - - - - - - - - - - - - - rsqrtps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - rsqrtps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 1.00 - - - - - - - - - - - - - rsqrtss %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - rsqrtss (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - - - - 0.33 0.33 0.33 - - - - - sfence
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - shufps $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - shufps $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 5.00 - - - - - - - - - - - - - sqrtps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 5.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - sqrtps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 5.00 - - - - - - - - - - - - - sqrtss %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 5.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - sqrtss (%rax), %xmm2
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 15.00 15.00 15.00 15.00 - - - - - - - - 0.33 0.33 0.33 - - - 0.50 0.50 stmxcsr (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - subps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - subps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - subss %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - subss (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - ucomiss %xmm0, %xmm1
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - ucomiss (%rax), %xmm1
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - unpckhps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - unpckhps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - unpcklps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - unpcklps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - xorps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - xorps (%rax), %xmm2
|
|
@ -0,0 +1,975 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
addpd %xmm0, %xmm2
|
||||
addpd (%rax), %xmm2
|
||||
|
||||
addsd %xmm0, %xmm2
|
||||
addsd (%rax), %xmm2
|
||||
|
||||
andnpd %xmm0, %xmm2
|
||||
andnpd (%rax), %xmm2
|
||||
|
||||
andpd %xmm0, %xmm2
|
||||
andpd (%rax), %xmm2
|
||||
|
||||
clflush (%rax)
|
||||
|
||||
cmppd $0, %xmm0, %xmm2
|
||||
cmppd $0, (%rax), %xmm2
|
||||
|
||||
cmpsd $0, %xmm0, %xmm2
|
||||
cmpsd $0, (%rax), %xmm2
|
||||
|
||||
comisd %xmm0, %xmm1
|
||||
comisd (%rax), %xmm1
|
||||
|
||||
cvtdq2pd %xmm0, %xmm2
|
||||
cvtdq2pd (%rax), %xmm2
|
||||
|
||||
cvtdq2ps %xmm0, %xmm2
|
||||
cvtdq2ps (%rax), %xmm2
|
||||
|
||||
cvtpd2dq %xmm0, %xmm2
|
||||
cvtpd2dq (%rax), %xmm2
|
||||
|
||||
cvtpd2pi %xmm0, %mm2
|
||||
cvtpd2pi (%rax), %mm2
|
||||
|
||||
cvtpd2ps %xmm0, %xmm2
|
||||
cvtpd2ps (%rax), %xmm2
|
||||
|
||||
cvtpi2pd %mm0, %xmm2
|
||||
cvtpi2pd (%rax), %xmm2
|
||||
|
||||
cvtps2dq %xmm0, %xmm2
|
||||
cvtps2dq (%rax), %xmm2
|
||||
|
||||
cvtps2pd %xmm0, %xmm2
|
||||
cvtps2pd (%rax), %xmm2
|
||||
|
||||
cvtsd2si %xmm0, %ecx
|
||||
cvtsd2si %xmm0, %rcx
|
||||
cvtsd2si (%rax), %ecx
|
||||
cvtsd2si (%rax), %rcx
|
||||
|
||||
cvtsd2ss %xmm0, %xmm2
|
||||
cvtsd2ss (%rax), %xmm2
|
||||
|
||||
cvtsi2sd %ecx, %xmm2
|
||||
cvtsi2sd %rcx, %xmm2
|
||||
cvtsi2sd (%rax), %xmm2
|
||||
cvtsi2sd (%rax), %xmm2
|
||||
|
||||
cvtss2sd %xmm0, %xmm2
|
||||
cvtss2sd (%rax), %xmm2
|
||||
|
||||
cvttpd2dq %xmm0, %xmm2
|
||||
cvttpd2dq (%rax), %xmm2
|
||||
|
||||
cvttpd2pi %xmm0, %mm2
|
||||
cvttpd2pi (%rax), %mm2
|
||||
|
||||
cvttps2dq %xmm0, %xmm2
|
||||
cvttps2dq (%rax), %xmm2
|
||||
|
||||
cvttsd2si %xmm0, %ecx
|
||||
cvttsd2si %xmm0, %rcx
|
||||
cvttsd2si (%rax), %ecx
|
||||
cvttsd2si (%rax), %rcx
|
||||
|
||||
divpd %xmm0, %xmm2
|
||||
divpd (%rax), %xmm2
|
||||
|
||||
divsd %xmm0, %xmm2
|
||||
divsd (%rax), %xmm2
|
||||
|
||||
lfence
|
||||
|
||||
maskmovdqu %xmm0, %xmm1
|
||||
|
||||
maxpd %xmm0, %xmm2
|
||||
maxpd (%rax), %xmm2
|
||||
|
||||
maxsd %xmm0, %xmm2
|
||||
maxsd (%rax), %xmm2
|
||||
|
||||
mfence
|
||||
|
||||
minpd %xmm0, %xmm2
|
||||
minpd (%rax), %xmm2
|
||||
|
||||
minsd %xmm0, %xmm2
|
||||
minsd (%rax), %xmm2
|
||||
|
||||
movapd %xmm0, %xmm2
|
||||
movapd %xmm0, (%rax)
|
||||
movapd (%rax), %xmm2
|
||||
|
||||
movd %eax, %xmm2
|
||||
movd (%rax), %xmm2
|
||||
|
||||
movd %xmm0, %ecx
|
||||
movd %xmm0, (%rax)
|
||||
|
||||
movdqa %xmm0, %xmm2
|
||||
movdqa %xmm0, (%rax)
|
||||
movdqa (%rax), %xmm2
|
||||
|
||||
movdqu %xmm0, %xmm2
|
||||
movdqu %xmm0, (%rax)
|
||||
movdqu (%rax), %xmm2
|
||||
|
||||
movdq2q %xmm0, %mm2
|
||||
|
||||
movhpd %xmm0, (%rax)
|
||||
movhpd (%rax), %xmm2
|
||||
|
||||
movlpd %xmm0, (%rax)
|
||||
movlpd (%rax), %xmm2
|
||||
|
||||
movmskpd %xmm0, %rcx
|
||||
|
||||
movntil %eax, (%rax)
|
||||
movntiq %rax, (%rax)
|
||||
|
||||
movntdq %xmm0, (%rax)
|
||||
movntpd %xmm0, (%rax)
|
||||
|
||||
movq %xmm0, %xmm2
|
||||
|
||||
movq %rax, %xmm2
|
||||
movq (%rax), %xmm2
|
||||
|
||||
movq %xmm0, %rcx
|
||||
movq %xmm0, (%rax)
|
||||
|
||||
movq2dq %mm0, %xmm2
|
||||
|
||||
movsd %xmm0, %xmm2
|
||||
movsd %xmm0, (%rax)
|
||||
movsd (%rax), %xmm2
|
||||
|
||||
movupd %xmm0, %xmm2
|
||||
movupd %xmm0, (%rax)
|
||||
movupd (%rax), %xmm2
|
||||
|
||||
mulpd %xmm0, %xmm2
|
||||
mulpd (%rax), %xmm2
|
||||
|
||||
mulsd %xmm0, %xmm2
|
||||
mulsd (%rax), %xmm2
|
||||
|
||||
orpd %xmm0, %xmm2
|
||||
orpd (%rax), %xmm2
|
||||
|
||||
packssdw %xmm0, %xmm2
|
||||
packssdw (%rax), %xmm2
|
||||
|
||||
packsswb %xmm0, %xmm2
|
||||
packsswb (%rax), %xmm2
|
||||
|
||||
packuswb %xmm0, %xmm2
|
||||
packuswb (%rax), %xmm2
|
||||
|
||||
paddb %xmm0, %xmm2
|
||||
paddb (%rax), %xmm2
|
||||
|
||||
paddd %xmm0, %xmm2
|
||||
paddd (%rax), %xmm2
|
||||
|
||||
paddq %mm0, %mm2
|
||||
paddq (%rax), %mm2
|
||||
|
||||
paddq %xmm0, %xmm2
|
||||
paddq (%rax), %xmm2
|
||||
|
||||
paddsb %xmm0, %xmm2
|
||||
paddsb (%rax), %xmm2
|
||||
|
||||
paddsw %xmm0, %xmm2
|
||||
paddsw (%rax), %xmm2
|
||||
|
||||
paddusb %xmm0, %xmm2
|
||||
paddusb (%rax), %xmm2
|
||||
|
||||
paddusw %xmm0, %xmm2
|
||||
paddusw (%rax), %xmm2
|
||||
|
||||
paddw %xmm0, %xmm2
|
||||
paddw (%rax), %xmm2
|
||||
|
||||
pand %xmm0, %xmm2
|
||||
pand (%rax), %xmm2
|
||||
|
||||
pandn %xmm0, %xmm2
|
||||
pandn (%rax), %xmm2
|
||||
|
||||
pavgb %xmm0, %xmm2
|
||||
pavgb (%rax), %xmm2
|
||||
|
||||
pavgw %xmm0, %xmm2
|
||||
pavgw (%rax), %xmm2
|
||||
|
||||
pcmpeqb %xmm0, %xmm2
|
||||
pcmpeqb (%rax), %xmm2
|
||||
|
||||
pcmpeqd %xmm0, %xmm2
|
||||
pcmpeqd (%rax), %xmm2
|
||||
|
||||
pcmpeqw %xmm0, %xmm2
|
||||
pcmpeqw (%rax), %xmm2
|
||||
|
||||
pcmpgtb %xmm0, %xmm2
|
||||
pcmpgtb (%rax), %xmm2
|
||||
|
||||
pcmpgtd %xmm0, %xmm2
|
||||
pcmpgtd (%rax), %xmm2
|
||||
|
||||
pcmpgtw %xmm0, %xmm2
|
||||
pcmpgtw (%rax), %xmm2
|
||||
|
||||
pextrw $1, %xmm0, %rcx
|
||||
|
||||
pinsrw $1, %rax, %xmm0
|
||||
pinsrw $1, (%rax), %xmm0
|
||||
|
||||
pmaddwd %xmm0, %xmm2
|
||||
pmaddwd (%rax), %xmm2
|
||||
|
||||
pmaxsw %xmm0, %xmm2
|
||||
pmaxsw (%rax), %xmm2
|
||||
|
||||
pmaxub %xmm0, %xmm2
|
||||
pmaxub (%rax), %xmm2
|
||||
|
||||
pminsw %xmm0, %xmm2
|
||||
pminsw (%rax), %xmm2
|
||||
|
||||
pminub %xmm0, %xmm2
|
||||
pminub (%rax), %xmm2
|
||||
|
||||
pmovmskb %xmm0, %rcx
|
||||
|
||||
pmulhuw %xmm0, %xmm2
|
||||
pmulhuw (%rax), %xmm2
|
||||
|
||||
pmulhw %xmm0, %xmm2
|
||||
pmulhw (%rax), %xmm2
|
||||
|
||||
pmullw %xmm0, %xmm2
|
||||
pmullw (%rax), %xmm2
|
||||
|
||||
pmuludq %mm0, %mm2
|
||||
pmuludq (%rax), %mm2
|
||||
|
||||
pmuludq %xmm0, %xmm2
|
||||
pmuludq (%rax), %xmm2
|
||||
|
||||
por %xmm0, %xmm2
|
||||
por (%rax), %xmm2
|
||||
|
||||
psadbw %xmm0, %xmm2
|
||||
psadbw (%rax), %xmm2
|
||||
|
||||
pshufd $1, %xmm0, %xmm2
|
||||
pshufd $1, (%rax), %xmm2
|
||||
|
||||
pshufhw $1, %xmm0, %xmm2
|
||||
pshufhw $1, (%rax), %xmm2
|
||||
|
||||
pshuflw $1, %xmm0, %xmm2
|
||||
pshuflw $1, (%rax), %xmm2
|
||||
|
||||
pslld $1, %xmm2
|
||||
pslld %xmm0, %xmm2
|
||||
pslld (%rax), %xmm2
|
||||
|
||||
pslldq $1, %xmm2
|
||||
|
||||
psllq $1, %xmm2
|
||||
psllq %xmm0, %xmm2
|
||||
psllq (%rax), %xmm2
|
||||
|
||||
psllw $1, %xmm2
|
||||
psllw %xmm0, %xmm2
|
||||
psllw (%rax), %xmm2
|
||||
|
||||
psrad $1, %xmm2
|
||||
psrad %xmm0, %xmm2
|
||||
psrad (%rax), %xmm2
|
||||
|
||||
psraw $1, %xmm2
|
||||
psraw %xmm0, %xmm2
|
||||
psraw (%rax), %xmm2
|
||||
|
||||
psrld $1, %xmm2
|
||||
psrld %xmm0, %xmm2
|
||||
psrld (%rax), %xmm2
|
||||
|
||||
psrldq $1, %xmm2
|
||||
|
||||
psrlq $1, %xmm2
|
||||
psrlq %xmm0, %xmm2
|
||||
psrlq (%rax), %xmm2
|
||||
|
||||
psrlw $1, %xmm2
|
||||
psrlw %xmm0, %xmm2
|
||||
psrlw (%rax), %xmm2
|
||||
|
||||
psubb %xmm0, %xmm2
|
||||
psubb (%rax), %xmm2
|
||||
|
||||
psubd %xmm0, %xmm2
|
||||
psubd (%rax), %xmm2
|
||||
|
||||
psubq %mm0, %mm2
|
||||
psubq (%rax), %mm2
|
||||
|
||||
psubq %xmm0, %xmm2
|
||||
psubq (%rax), %xmm2
|
||||
|
||||
psubsb %xmm0, %xmm2
|
||||
psubsb (%rax), %xmm2
|
||||
|
||||
psubsw %xmm0, %xmm2
|
||||
psubsw (%rax), %xmm2
|
||||
|
||||
psubusb %xmm0, %xmm2
|
||||
psubusb (%rax), %xmm2
|
||||
|
||||
psubusw %xmm0, %xmm2
|
||||
psubusw (%rax), %xmm2
|
||||
|
||||
psubw %xmm0, %xmm2
|
||||
psubw (%rax), %xmm2
|
||||
|
||||
punpckhbw %xmm0, %xmm2
|
||||
punpckhbw (%rax), %xmm2
|
||||
|
||||
punpckhdq %xmm0, %xmm2
|
||||
punpckhdq (%rax), %xmm2
|
||||
|
||||
punpckhqdq %xmm0, %xmm2
|
||||
punpckhqdq (%rax), %xmm2
|
||||
|
||||
punpckhwd %xmm0, %xmm2
|
||||
punpckhwd (%rax), %xmm2
|
||||
|
||||
punpcklbw %xmm0, %xmm2
|
||||
punpcklbw (%rax), %xmm2
|
||||
|
||||
punpckldq %xmm0, %xmm2
|
||||
punpckldq (%rax), %xmm2
|
||||
|
||||
punpcklqdq %xmm0, %xmm2
|
||||
punpcklqdq (%rax), %xmm2
|
||||
|
||||
punpcklwd %xmm0, %xmm2
|
||||
punpcklwd (%rax), %xmm2
|
||||
|
||||
pxor %xmm0, %xmm2
|
||||
pxor (%rax), %xmm2
|
||||
|
||||
shufpd $1, %xmm0, %xmm2
|
||||
shufpd $1, (%rax), %xmm2
|
||||
|
||||
sqrtpd %xmm0, %xmm2
|
||||
sqrtpd (%rax), %xmm2
|
||||
|
||||
sqrtsd %xmm0, %xmm2
|
||||
sqrtsd (%rax), %xmm2
|
||||
|
||||
subpd %xmm0, %xmm2
|
||||
subpd (%rax), %xmm2
|
||||
|
||||
subsd %xmm0, %xmm2
|
||||
subsd (%rax), %xmm2
|
||||
|
||||
ucomisd %xmm0, %xmm1
|
||||
ucomisd (%rax), %xmm1
|
||||
|
||||
unpckhpd %xmm0, %xmm2
|
||||
unpckhpd (%rax), %xmm2
|
||||
|
||||
unpcklpd %xmm0, %xmm2
|
||||
unpcklpd (%rax), %xmm2
|
||||
|
||||
xorpd %xmm0, %xmm2
|
||||
xorpd (%rax), %xmm2
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 3 0.50 addpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * addpd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 addsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * addsd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 andnpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * andnpd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 andpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * andpd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 5 0.33 * * U clflush (%rax)
|
||||
# CHECK-NEXT: 1 1 0.50 cmpeqpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * cmpeqpd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 cmpeqsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * cmpeqsd (%rax), %xmm2
|
||||
# CHECK-NEXT: 2 4 1.00 comisd %xmm0, %xmm1
|
||||
# CHECK-NEXT: 2 11 1.00 * comisd (%rax), %xmm1
|
||||
# CHECK-NEXT: 1 3 0.50 cvtdq2pd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * cvtdq2pd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 cvtdq2ps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * cvtdq2ps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 cvtpd2dq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * cvtpd2dq (%rax), %xmm2
|
||||
# CHECK-NEXT: 2 1 1.00 cvtpd2pi %xmm0, %mm2
|
||||
# CHECK-NEXT: 2 1 1.00 * cvtpd2pi (%rax), %mm2
|
||||
# CHECK-NEXT: 1 3 0.50 cvtpd2ps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * cvtpd2ps (%rax), %xmm2
|
||||
# CHECK-NEXT: 2 2 3.00 cvtpi2pd %mm0, %xmm2
|
||||
# CHECK-NEXT: 2 2 3.00 * cvtpi2pd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 cvtps2dq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * cvtps2dq (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 cvtps2pd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * cvtps2pd (%rax), %xmm2
|
||||
# CHECK-NEXT: 2 2 1.00 cvtsd2si %xmm0, %ecx
|
||||
# CHECK-NEXT: 2 2 1.00 cvtsd2si %xmm0, %rcx
|
||||
# CHECK-NEXT: 2 9 1.00 * cvtsd2si (%rax), %ecx
|
||||
# CHECK-NEXT: 2 9 1.00 * cvtsd2si (%rax), %rcx
|
||||
# CHECK-NEXT: 1 3 0.50 cvtsd2ss %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * cvtsd2ss (%rax), %xmm2
|
||||
# CHECK-NEXT: 2 4 1.00 cvtsi2sd %ecx, %xmm2
|
||||
# CHECK-NEXT: 2 4 1.00 cvtsi2sd %rcx, %xmm2
|
||||
# CHECK-NEXT: 1 10 1.00 * cvtsi2sdl (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 10 1.00 * cvtsi2sdl (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 cvtss2sd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * cvtss2sd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 cvttpd2dq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * cvttpd2dq (%rax), %xmm2
|
||||
# CHECK-NEXT: 2 1 1.00 cvttpd2pi %xmm0, %mm2
|
||||
# CHECK-NEXT: 2 1 1.00 * cvttpd2pi (%rax), %mm2
|
||||
# CHECK-NEXT: 1 3 0.50 cvttps2dq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * cvttps2dq (%rax), %xmm2
|
||||
# CHECK-NEXT: 2 2 1.00 cvttsd2si %xmm0, %ecx
|
||||
# CHECK-NEXT: 2 2 1.00 cvttsd2si %xmm0, %rcx
|
||||
# CHECK-NEXT: 2 9 1.00 * cvttsd2si (%rax), %ecx
|
||||
# CHECK-NEXT: 2 9 1.00 * cvttsd2si (%rax), %rcx
|
||||
# CHECK-NEXT: 1 13 5.00 divpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 20 5.00 * divpd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 13 5.00 divsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 20 5.00 * divsd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 10.00 * * U lfence
|
||||
# CHECK-NEXT: 1 1 1.00 * * U maskmovdqu %xmm0, %xmm1
|
||||
# CHECK-NEXT: 1 1 0.50 maxpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * maxpd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 maxsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * maxsd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 25.00 * * U mfence
|
||||
# CHECK-NEXT: 1 1 0.50 minpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * minpd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 minsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * minsd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 0 0.25 movapd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 1 1.00 * movapd %xmm0, (%rax)
|
||||
# CHECK-NEXT: 1 8 0.50 * movapd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 1.00 movd %eax, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * movd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 1.00 movd %xmm0, %ecx
|
||||
# CHECK-NEXT: 1 1 1.00 * movd %xmm0, (%rax)
|
||||
# CHECK-NEXT: 1 0 0.25 movdqa %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 1 1.00 * movdqa %xmm0, (%rax)
|
||||
# CHECK-NEXT: 1 8 0.50 * movdqa (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 0 0.25 movdqu %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 1 1.00 * movdqu %xmm0, (%rax)
|
||||
# CHECK-NEXT: 1 8 0.50 * movdqu (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 0 0.25 movdq2q %xmm0, %mm2
|
||||
# CHECK-NEXT: 2 2 1.00 * movhpd %xmm0, (%rax)
|
||||
# CHECK-NEXT: 1 8 0.50 * movhpd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 1.00 * movlpd %xmm0, (%rax)
|
||||
# CHECK-NEXT: 1 8 0.50 * movlpd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 1.00 movmskpd %xmm0, %ecx
|
||||
# CHECK-NEXT: 1 1 1.00 * movntil %eax, (%rax)
|
||||
# CHECK-NEXT: 1 1 1.00 * movntiq %rax, (%rax)
|
||||
# CHECK-NEXT: 1 1 1.00 * movntdq %xmm0, (%rax)
|
||||
# CHECK-NEXT: 1 1 1.00 * movntpd %xmm0, (%rax)
|
||||
# CHECK-NEXT: 1 1 0.25 movq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 1 1.00 movq %rax, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * movq (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 1.00 movq %xmm0, %rcx
|
||||
# CHECK-NEXT: 1 1 1.00 * movq %xmm0, (%rax)
|
||||
# CHECK-NEXT: 2 1 0.50 movq2dq %mm0, %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 movsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 1 1.00 * movsd %xmm0, (%rax)
|
||||
# CHECK-NEXT: 1 8 0.50 * movsd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 0 0.25 movupd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 1 1.00 * movupd %xmm0, (%rax)
|
||||
# CHECK-NEXT: 1 8 0.50 * movupd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 mulpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * mulpd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 mulsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * mulsd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 orpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * orpd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 packssdw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * packssdw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 packsswb %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * packsswb (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 packuswb %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * packuswb (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 paddb %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * paddb (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 paddd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * paddd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 paddq %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * paddq (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 paddq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * paddq (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 paddsb %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * paddsb (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 paddsw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * paddsw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 paddusb %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * paddusb (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 paddusw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * paddusw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 paddw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * paddw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pand %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pand (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pandn %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pandn (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pavgb %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pavgb (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pavgw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pavgw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pcmpeqb %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pcmpeqb (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pcmpeqd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pcmpeqd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pcmpeqw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pcmpeqw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pcmpgtb %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pcmpgtb (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pcmpgtd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pcmpgtd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pcmpgtw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pcmpgtw (%rax), %xmm2
|
||||
# CHECK-NEXT: 2 1 1.00 pextrw $1, %xmm0, %ecx
|
||||
# CHECK-NEXT: 2 2 1.00 pinsrw $1, %eax, %xmm0
|
||||
# CHECK-NEXT: 1 8 1.50 * pinsrw $1, (%rax), %xmm0
|
||||
# CHECK-NEXT: 1 3 0.50 pmaddwd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * pmaddwd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pmaxsw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pmaxsw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pmaxub %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pmaxub (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pminsw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pminsw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pminub %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pminub (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 1.00 pmovmskb %xmm0, %ecx
|
||||
# CHECK-NEXT: 1 3 0.50 pmulhuw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * pmulhuw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 pmulhw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * pmulhw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 pmullw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * pmullw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 pmuludq %mm0, %mm2
|
||||
# CHECK-NEXT: 1 10 0.50 * pmuludq (%rax), %mm2
|
||||
# CHECK-NEXT: 1 3 0.50 pmuludq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * pmuludq (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 por %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * por (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 psadbw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * psadbw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pshufd $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pshufd $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pshufhw $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pshufhw $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pshuflw $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pshuflw $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pslld $1, %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pslld %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pslld (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pslldq $1, %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psllq $1, %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psllq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psllq (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psllw $1, %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psllw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psllw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psrad $1, %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psrad %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psrad (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psraw $1, %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psraw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psraw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psrld $1, %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psrld %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psrld (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psrldq $1, %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psrlq $1, %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psrlq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psrlq (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psrlw $1, %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psrlw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psrlw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 psubb %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psubb (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 psubd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psubd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 psubq %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psubq (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.25 psubq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psubq (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psubsb %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psubsb (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psubsw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psubsw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psubusb %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psubusb (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psubusw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psubusw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 psubw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psubw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 punpckhbw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * punpckhbw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 punpckhdq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * punpckhdq (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 punpckhqdq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * punpckhqdq (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 punpckhwd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * punpckhwd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 punpcklbw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * punpcklbw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 punpckldq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * punpckldq (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 punpcklqdq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * punpcklqdq (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 punpcklwd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * punpcklwd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pxor %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pxor (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 shufpd $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * shufpd $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 21 9.00 sqrtpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 28 9.00 * sqrtpd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 21 9.00 sqrtsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 28 9.00 * sqrtsd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 subpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * subpd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 subsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * subsd (%rax), %xmm2
|
||||
# CHECK-NEXT: 2 4 1.00 ucomisd %xmm0, %xmm1
|
||||
# CHECK-NEXT: 2 11 1.00 * ucomisd (%rax), %xmm1
|
||||
# CHECK-NEXT: 1 1 0.50 unpckhpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * unpckhpd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 unpcklpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * unpcklpd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 xorpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * xorpd (%rax), %xmm2
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: 1.00 1.00 1.00 25.00 25.00 25.00 25.00 - 42.50 124.00 89.00 61.50 70.50 70.50 12.00 53.67 53.67 53.67 38.33 38.33 38.33 8.00 8.00
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - addpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - addpd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - addsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - addsd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - andnpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - andnpd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - andpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - andpd (%rax), %xmm2
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - clflush (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - cmpeqpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmpeqpd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - cmpeqsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cmpeqsd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - comisd %xmm0, %xmm1
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - comisd (%rax), %xmm1
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - cvtdq2pd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvtdq2pd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - cvtdq2ps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvtdq2ps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - cvtpd2dq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvtpd2dq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 - - - - - - - - - - - cvtpd2pi %xmm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 - - - - - - - - - - - cvtpd2pi (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - cvtpd2ps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvtpd2ps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 3.00 3.00 - - - - - - - - - - - cvtpi2pd %mm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 3.00 3.00 - - - - - - - - - - - cvtpi2pd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - cvtps2dq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvtps2dq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - cvtps2pd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvtps2pd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 - - - - - - - - - - - cvtsd2si %xmm0, %ecx
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 - - - - - - - - - - - cvtsd2si %xmm0, %rcx
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvtsd2si (%rax), %ecx
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvtsd2si (%rax), %rcx
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - cvtsd2ss %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvtsd2ss (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 - - - - - - - - - - - cvtsi2sd %ecx, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 - - - - - - - - - - - cvtsi2sd %rcx, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvtsi2sdl (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvtsi2sdl (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - cvtss2sd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvtss2sd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - cvttpd2dq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvttpd2dq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 - - - - - - - - - - - cvttpd2pi %xmm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 - - - - - - - - - - - cvttpd2pi (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - cvttps2dq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvttps2dq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 - - - - - - - - - - - cvttsd2si %xmm0, %ecx
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 - - - - - - - - - - - cvttsd2si %xmm0, %rcx
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvttsd2si (%rax), %ecx
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 1.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - cvttsd2si (%rax), %rcx
|
||||
# CHECK-NEXT: - - - - - - - - - 5.00 - - - - - - - - - - - - - divpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 5.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - divpd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 5.00 - - - - - - - - - - - - - divsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 5.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - divsd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - - - - 10.00 10.00 10.00 - - - - - lfence
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 maskmovdqu %xmm0, %xmm1
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - maxpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - maxpd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - maxsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - maxsd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - mfence
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - minpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - minpd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - minsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - minsd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - movapd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movapd %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - movapd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.00 1.00 - - - - - - - - - movd %eax, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - movd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.00 1.00 - - - - - - - - - movd %xmm0, %ecx
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movd %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - movdqa %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movdqa %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - movdqa (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - movdqu %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movdqu %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - movdqu (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - movdq2q %xmm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movhpd %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - movhpd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movlpd %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - movlpd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 - - - - - - - - - - - - movmskpd %xmm0, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.67 0.67 0.67 - - - 1.00 1.00 movntil %eax, (%rax)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.67 0.67 0.67 - - - 1.00 1.00 movntiq %rax, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movntdq %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movntpd %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - movq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.00 1.00 - - - - - - - - - movq %rax, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - movq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.00 1.00 - - - - - - - - - movq %xmm0, %rcx
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movq %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - - - - - - - - - movq2dq %mm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - movsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movsd %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - movsd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - movupd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movupd %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - movupd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - mulpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - mulpd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - mulsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - mulsd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - orpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - orpd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - packssdw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - packssdw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - packsswb %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - packsswb (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - packuswb %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - packuswb (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - paddb %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - paddb (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - paddd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - paddd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - paddq %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - paddq (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - paddq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - paddq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - paddsb %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - paddsb (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - paddsw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - paddsw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - paddusb %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - paddusb (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - paddusw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - paddusw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - paddw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - paddw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pand %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pand (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pandn %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pandn (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - pavgb %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pavgb (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - pavgw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pavgw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pcmpeqb %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pcmpeqb (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pcmpeqd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pcmpeqd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pcmpeqw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pcmpeqw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pcmpgtb %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pcmpgtb (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pcmpgtd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pcmpgtd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pcmpgtw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pcmpgtw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.00 1.00 - - - - - - - - - pextrw $1, %xmm0, %ecx
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.00 1.00 - - - - - - - - - pinsrw $1, %eax, %xmm0
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.50 1.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pinsrw $1, (%rax), %xmm0
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmaddwd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmaddwd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pmaxsw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmaxsw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pmaxub %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmaxub (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pminsw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pminsw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pminub %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pminub (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 1.00 - - - - - - - - - - - - pmovmskb %xmm0, %ecx
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmulhuw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmulhuw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmulhw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmulhw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmullw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmullw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmuludq %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmuludq (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmuludq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmuludq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - por %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - por (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 - - - - - - - - - - - psadbw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psadbw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pshufd $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pshufd $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pshufhw $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pshufhw $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pshuflw $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pshuflw $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pslld $1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pslld %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pslld (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pslldq $1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psllq $1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psllq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psllq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psllw $1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psllw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psllw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psrad $1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psrad %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psrad (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psraw $1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psraw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psraw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psrld $1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psrld %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psrld (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psrldq $1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psrlq $1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psrlq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psrlq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psrlw $1, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - psrlw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psrlw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - psubb %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psubb (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - psubd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psubd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - psubq %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psubq (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - psubq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psubq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - psubsb %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psubsb (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - psubsw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psubsw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - psubusb %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psubusb (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - psubusw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psubusw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - psubw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psubw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - punpckhbw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - punpckhbw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - punpckhdq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - punpckhdq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - punpckhqdq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - punpckhqdq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - punpckhwd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - punpckhwd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - punpcklbw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - punpcklbw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - punpckldq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - punpckldq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - punpcklqdq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - punpcklqdq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - punpcklwd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - punpcklwd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pxor %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pxor (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - shufpd $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - shufpd $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 9.00 - - - - - - - - - - - - - sqrtpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 9.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - sqrtpd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 9.00 - - - - - - - - - - - - - sqrtsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 9.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - sqrtsd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - subpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - subpd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - subsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - subsd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - ucomisd %xmm0, %xmm1
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - ucomisd (%rax), %xmm1
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - unpckhpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - unpckhpd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - unpcklpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - unpcklpd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - xorpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - xorpd (%rax), %xmm2
|
|
@ -0,0 +1,119 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
addsubpd %xmm0, %xmm2
|
||||
addsubpd (%rax), %xmm2
|
||||
|
||||
addsubps %xmm0, %xmm2
|
||||
addsubps (%rax), %xmm2
|
||||
|
||||
haddpd %xmm0, %xmm2
|
||||
haddpd (%rax), %xmm2
|
||||
|
||||
haddps %xmm0, %xmm2
|
||||
haddps (%rax), %xmm2
|
||||
|
||||
hsubpd %xmm0, %xmm2
|
||||
hsubpd (%rax), %xmm2
|
||||
|
||||
hsubps %xmm0, %xmm2
|
||||
hsubps (%rax), %xmm2
|
||||
|
||||
lddqu (%rax), %xmm2
|
||||
|
||||
monitor
|
||||
|
||||
movddup %xmm0, %xmm2
|
||||
movddup (%rax), %xmm2
|
||||
|
||||
movshdup %xmm0, %xmm2
|
||||
movshdup (%rax), %xmm2
|
||||
|
||||
movsldup %xmm0, %xmm2
|
||||
movsldup (%rax), %xmm2
|
||||
|
||||
mwait
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 3 0.50 addsubpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * addsubpd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 addsubps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * addsubps (%rax), %xmm2
|
||||
# CHECK-NEXT: 4 6 2.00 haddpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 4 13 2.00 * haddpd (%rax), %xmm2
|
||||
# CHECK-NEXT: 4 6 2.00 haddps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 4 13 2.00 * haddps (%rax), %xmm2
|
||||
# CHECK-NEXT: 4 6 2.00 hsubpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 4 13 2.00 * hsubpd (%rax), %xmm2
|
||||
# CHECK-NEXT: 4 6 2.00 hsubps %xmm0, %xmm2
|
||||
# CHECK-NEXT: 4 13 2.00 * hsubps (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * lddqu (%rax), %xmm2
|
||||
# CHECK-NEXT: 100 100 25.00 U monitor
|
||||
# CHECK-NEXT: 1 1 0.50 movddup %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * movddup (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 movshdup %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * movshdup (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 movsldup %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * movsldup (%rax), %xmm2
|
||||
# CHECK-NEXT: 100 100 25.00 * * U mwait
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: - - - 50.00 50.00 50.00 50.00 - - 3.00 21.00 2.00 5.00 5.00 - 3.33 3.33 3.33 3.33 3.33 3.33 - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - addsubpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - addsubpd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - addsubps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - addsubps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 2.00 - - - - - - - - - - - - haddpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 2.00 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - haddpd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 2.00 - - - - - - - - - - - - haddps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 2.00 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - haddps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 2.00 - - - - - - - - - - - - hsubpd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 2.00 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - hsubpd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 2.00 - - - - - - - - - - - - hsubps %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 2.00 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - hsubps (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - lddqu (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - monitor
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - movddup %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - movddup (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - movshdup %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - movshdup (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - movsldup %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - movsldup (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - mwait
|
|
@ -0,0 +1,381 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
blendpd $11, %xmm0, %xmm2
|
||||
blendpd $11, (%rax), %xmm2
|
||||
|
||||
blendps $11, %xmm0, %xmm2
|
||||
blendps $11, (%rax), %xmm2
|
||||
|
||||
blendvpd %xmm0, %xmm2
|
||||
blendvpd (%rax), %xmm2
|
||||
|
||||
blendvps %xmm0, %xmm2
|
||||
blendvps (%rax), %xmm2
|
||||
|
||||
dppd $22, %xmm0, %xmm2
|
||||
dppd $22, (%rax), %xmm2
|
||||
|
||||
dpps $22, %xmm0, %xmm2
|
||||
dpps $22, (%rax), %xmm2
|
||||
|
||||
extractps $1, %xmm0, %rcx
|
||||
extractps $1, %xmm0, (%rax)
|
||||
|
||||
insertps $1, %xmm0, %xmm2
|
||||
insertps $1, (%rax), %xmm2
|
||||
|
||||
movntdqa (%rax), %xmm2
|
||||
|
||||
mpsadbw $1, %xmm0, %xmm2
|
||||
mpsadbw $1, (%rax), %xmm2
|
||||
|
||||
packusdw %xmm0, %xmm2
|
||||
packusdw (%rax), %xmm2
|
||||
|
||||
pblendvb %xmm0, %xmm2
|
||||
pblendvb (%rax), %xmm2
|
||||
|
||||
pblendw $11, %xmm0, %xmm2
|
||||
pblendw $11, (%rax), %xmm2
|
||||
|
||||
pcmpeqq %xmm0, %xmm2
|
||||
pcmpeqq (%rax), %xmm2
|
||||
|
||||
pextrb $1, %xmm0, %ecx
|
||||
pextrb $1, %xmm0, (%rax)
|
||||
|
||||
pextrd $1, %xmm0, %ecx
|
||||
pextrd $1, %xmm0, (%rax)
|
||||
|
||||
pextrq $1, %xmm0, %rcx
|
||||
pextrq $1, %xmm0, (%rax)
|
||||
|
||||
pextrw $1, %xmm0, (%rax)
|
||||
|
||||
phminposuw %xmm0, %xmm2
|
||||
phminposuw (%rax), %xmm2
|
||||
|
||||
pinsrb $1, %eax, %xmm1
|
||||
pinsrb $1, (%rax), %xmm1
|
||||
|
||||
pinsrd $1, %eax, %xmm1
|
||||
pinsrd $1, (%rax), %xmm1
|
||||
|
||||
pinsrq $1, %rax, %xmm1
|
||||
pinsrq $1, (%rax), %xmm1
|
||||
|
||||
pmaxsb %xmm0, %xmm2
|
||||
pmaxsb (%rax), %xmm2
|
||||
|
||||
pmaxsd %xmm0, %xmm2
|
||||
pmaxsd (%rax), %xmm2
|
||||
|
||||
pmaxud %xmm0, %xmm2
|
||||
pmaxud (%rax), %xmm2
|
||||
|
||||
pmaxuw %xmm0, %xmm2
|
||||
pmaxuw (%rax), %xmm2
|
||||
|
||||
pminsb %xmm0, %xmm2
|
||||
pminsb (%rax), %xmm2
|
||||
|
||||
pminsd %xmm0, %xmm2
|
||||
pminsd (%rax), %xmm2
|
||||
|
||||
pminud %xmm0, %xmm2
|
||||
pminud (%rax), %xmm2
|
||||
|
||||
pminuw %xmm0, %xmm2
|
||||
pminuw (%rax), %xmm2
|
||||
|
||||
pmovsxbd %xmm0, %xmm2
|
||||
pmovsxbd (%rax), %xmm2
|
||||
|
||||
pmovsxbq %xmm0, %xmm2
|
||||
pmovsxbq (%rax), %xmm2
|
||||
|
||||
pmovsxbw %xmm0, %xmm2
|
||||
pmovsxbw (%rax), %xmm2
|
||||
|
||||
pmovsxdq %xmm0, %xmm2
|
||||
pmovsxdq (%rax), %xmm2
|
||||
|
||||
pmovsxwd %xmm0, %xmm2
|
||||
pmovsxwd (%rax), %xmm2
|
||||
|
||||
pmovsxwq %xmm0, %xmm2
|
||||
pmovsxwq (%rax), %xmm2
|
||||
|
||||
pmovzxbd %xmm0, %xmm2
|
||||
pmovzxbd (%rax), %xmm2
|
||||
|
||||
pmovzxbq %xmm0, %xmm2
|
||||
pmovzxbq (%rax), %xmm2
|
||||
|
||||
pmovzxbw %xmm0, %xmm2
|
||||
pmovzxbw (%rax), %xmm2
|
||||
|
||||
pmovzxdq %xmm0, %xmm2
|
||||
pmovzxdq (%rax), %xmm2
|
||||
|
||||
pmovzxwd %xmm0, %xmm2
|
||||
pmovzxwd (%rax), %xmm2
|
||||
|
||||
pmovzxwq %xmm0, %xmm2
|
||||
pmovzxwq (%rax), %xmm2
|
||||
|
||||
pmuldq %xmm0, %xmm2
|
||||
pmuldq (%rax), %xmm2
|
||||
|
||||
pmulld %xmm0, %xmm2
|
||||
pmulld (%rax), %xmm2
|
||||
|
||||
ptest %xmm0, %xmm1
|
||||
ptest (%rax), %xmm1
|
||||
|
||||
roundpd $1, %xmm0, %xmm2
|
||||
roundpd $1, (%rax), %xmm2
|
||||
|
||||
roundps $1, %xmm0, %xmm2
|
||||
roundps $1, (%rax), %xmm2
|
||||
|
||||
roundsd $1, %xmm0, %xmm2
|
||||
roundsd $1, (%rax), %xmm2
|
||||
|
||||
roundss $1, %xmm0, %xmm2
|
||||
roundss $1, (%rax), %xmm2
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 1 0.50 blendpd $11, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * blendpd $11, (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 blendps $11, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * blendps $11, (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 blendvpd %xmm0, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * blendvpd %xmm0, (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 blendvps %xmm0, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * blendvps %xmm0, (%rax), %xmm2
|
||||
# CHECK-NEXT: 3 9 3.00 dppd $22, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 5 16 3.00 * dppd $22, (%rax), %xmm2
|
||||
# CHECK-NEXT: 8 15 4.00 dpps $22, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 10 22 4.00 * dpps $22, (%rax), %xmm2
|
||||
# CHECK-NEXT: 2 1 1.00 extractps $1, %xmm0, %ecx
|
||||
# CHECK-NEXT: 2 2 1.00 * extractps $1, %xmm0, (%rax)
|
||||
# CHECK-NEXT: 1 1 0.50 insertps $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * insertps $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * movntdqa (%rax), %xmm2
|
||||
# CHECK-NEXT: 4 4 2.00 mpsadbw $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 6 11 2.00 * mpsadbw $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 packusdw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * packusdw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pblendvb %xmm0, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pblendvb %xmm0, (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pblendw $11, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pblendw $11, (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pcmpeqq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pcmpeqq (%rax), %xmm2
|
||||
# CHECK-NEXT: 2 1 1.00 pextrb $1, %xmm0, %ecx
|
||||
# CHECK-NEXT: 2 2 1.00 * pextrb $1, %xmm0, (%rax)
|
||||
# CHECK-NEXT: 2 1 1.00 pextrd $1, %xmm0, %ecx
|
||||
# CHECK-NEXT: 2 2 1.00 * pextrd $1, %xmm0, (%rax)
|
||||
# CHECK-NEXT: 2 1 1.00 pextrq $1, %xmm0, %rcx
|
||||
# CHECK-NEXT: 2 2 1.00 * pextrq $1, %xmm0, (%rax)
|
||||
# CHECK-NEXT: 2 2 1.00 * pextrw $1, %xmm0, (%rax)
|
||||
# CHECK-NEXT: 1 3 0.50 phminposuw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * phminposuw (%rax), %xmm2
|
||||
# CHECK-NEXT: 2 2 1.00 pinsrb $1, %eax, %xmm1
|
||||
# CHECK-NEXT: 1 8 1.50 * pinsrb $1, (%rax), %xmm1
|
||||
# CHECK-NEXT: 2 2 1.00 pinsrd $1, %eax, %xmm1
|
||||
# CHECK-NEXT: 1 8 1.50 * pinsrd $1, (%rax), %xmm1
|
||||
# CHECK-NEXT: 2 2 1.00 pinsrq $1, %rax, %xmm1
|
||||
# CHECK-NEXT: 1 8 1.50 * pinsrq $1, (%rax), %xmm1
|
||||
# CHECK-NEXT: 1 1 0.25 pmaxsb %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pmaxsb (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pmaxsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pmaxsd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pmaxud %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pmaxud (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pmaxuw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pmaxuw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pminsb %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pminsb (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pminsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pminsd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pminud %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pminud (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pminuw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pminuw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pmovsxbd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pmovsxbd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pmovsxbq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pmovsxbq (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pmovsxbw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pmovsxbw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pmovsxdq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pmovsxdq (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pmovsxwd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pmovsxwd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pmovsxwq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pmovsxwq (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pmovzxbd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pmovzxbd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pmovzxbq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pmovzxbq (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pmovzxbw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pmovzxbw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pmovzxdq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pmovzxdq (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pmovzxwd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pmovzxwd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pmovzxwq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pmovzxwq (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 pmuldq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * pmuldq (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 pmulld %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * pmulld (%rax), %xmm2
|
||||
# CHECK-NEXT: 2 1 1.00 ptest %xmm0, %xmm1
|
||||
# CHECK-NEXT: 2 8 1.00 * ptest (%rax), %xmm1
|
||||
# CHECK-NEXT: 1 3 0.50 roundpd $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * roundpd $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 roundps $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * roundps $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 roundsd $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * roundsd $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 roundss $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * roundss $1, (%rax), %xmm2
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: - - - - - - - - 31.00 43.00 28.00 16.00 35.50 35.50 7.00 16.33 16.33 16.33 14.67 14.67 14.67 2.50 2.50
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - blendpd $11, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - blendpd $11, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - blendps $11, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - blendps $11, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - blendvpd %xmm0, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - blendvpd %xmm0, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - blendvps %xmm0, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - blendvps %xmm0, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 3.00 3.00 - - - - - - - - - - - - - dppd $22, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 3.00 3.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - dppd $22, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 4.00 4.00 - - - - - - - - - - - - - dpps $22, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 4.00 4.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - dpps $22, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.00 1.00 - - - - - - - - - extractps $1, %xmm0, %ecx
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 extractps $1, %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - insertps $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - insertps $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - movntdqa (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 2.00 2.00 2.00 - - - - - - - - - - - mpsadbw $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 2.00 2.00 2.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - mpsadbw $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - packusdw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - packusdw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pblendvb %xmm0, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pblendvb %xmm0, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pblendw $11, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pblendw $11, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pcmpeqq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pcmpeqq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.00 1.00 - - - - - - - - - pextrb $1, %xmm0, %ecx
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 pextrb $1, %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.00 1.00 - - - - - - - - - pextrd $1, %xmm0, %ecx
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 pextrd $1, %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.00 1.00 - - - - - - - - - pextrq $1, %xmm0, %rcx
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 pextrq $1, %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 pextrw $1, %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - phminposuw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phminposuw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.00 1.00 - - - - - - - - - pinsrb $1, %eax, %xmm1
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.50 1.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pinsrb $1, (%rax), %xmm1
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.00 1.00 - - - - - - - - - pinsrd $1, %eax, %xmm1
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.50 1.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pinsrd $1, (%rax), %xmm1
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.00 1.00 - - - - - - - - - pinsrq $1, %rax, %xmm1
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 1.50 1.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pinsrq $1, (%rax), %xmm1
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pmaxsb %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmaxsb (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pmaxsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmaxsd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pmaxud %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmaxud (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pmaxuw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmaxuw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pminsb %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pminsb (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pminsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pminsd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pminud %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pminud (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pminuw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pminuw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pmovsxbd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmovsxbd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pmovsxbq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmovsxbq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pmovsxbw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmovsxbw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pmovsxdq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmovsxdq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pmovsxwd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmovsxwd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pmovsxwq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmovsxwq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pmovzxbd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmovzxbd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pmovzxbq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmovzxbq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pmovzxbw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmovzxbw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pmovzxdq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmovzxdq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pmovzxwd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmovzxwd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pmovzxwq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmovzxwq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmuldq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmuldq (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmulld %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmulld (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 1.00 - - - - - - - - ptest %xmm0, %xmm1
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 1.00 1.00 1.00 0.33 0.33 0.33 0.33 0.33 0.33 - - ptest (%rax), %xmm1
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - roundpd $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - roundpd $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - roundps $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - roundps $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - roundsd $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - roundsd $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - roundss $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - roundss $1, (%rax), %xmm2
|
|
@ -0,0 +1,114 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
crc32b %al, %ecx
|
||||
crc32b (%rax), %ecx
|
||||
|
||||
crc32l %eax, %ecx
|
||||
crc32l (%rax), %ecx
|
||||
|
||||
crc32w %ax, %ecx
|
||||
crc32w (%rax), %ecx
|
||||
|
||||
crc32b %al, %rcx
|
||||
crc32b (%rax), %rcx
|
||||
|
||||
crc32q %rax, %rcx
|
||||
crc32q (%rax), %rcx
|
||||
|
||||
pcmpestri $1, %xmm0, %xmm2
|
||||
pcmpestri $1, (%rax), %xmm2
|
||||
|
||||
pcmpestrm $1, %xmm0, %xmm2
|
||||
pcmpestrm $1, (%rax), %xmm2
|
||||
|
||||
pcmpistri $1, %xmm0, %xmm2
|
||||
pcmpistri $1, (%rax), %xmm2
|
||||
|
||||
pcmpistrm $1, %xmm0, %xmm2
|
||||
pcmpistrm $1, (%rax), %xmm2
|
||||
|
||||
pcmpgtq %xmm0, %xmm2
|
||||
pcmpgtq (%rax), %xmm2
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 3 1.00 crc32b %al, %ecx
|
||||
# CHECK-NEXT: 1 7 1.00 * crc32b (%rax), %ecx
|
||||
# CHECK-NEXT: 1 3 1.00 crc32l %eax, %ecx
|
||||
# CHECK-NEXT: 1 7 1.00 * crc32l (%rax), %ecx
|
||||
# CHECK-NEXT: 1 3 1.00 crc32w %ax, %ecx
|
||||
# CHECK-NEXT: 1 7 1.00 * crc32w (%rax), %ecx
|
||||
# CHECK-NEXT: 1 3 1.00 crc32b %al, %rcx
|
||||
# CHECK-NEXT: 1 7 1.00 * crc32b (%rax), %rcx
|
||||
# CHECK-NEXT: 1 3 1.00 crc32q %rax, %rcx
|
||||
# CHECK-NEXT: 1 7 1.00 * crc32q (%rax), %rcx
|
||||
# CHECK-NEXT: 8 6 3.00 pcmpestri $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 12 13 3.00 * pcmpestri $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: 7 6 3.00 pcmpestrm $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 12 13 3.00 * pcmpestrm $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: 4 2 2.00 pcmpistri $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 4 9 2.00 * pcmpistri $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: 3 6 2.00 pcmpistrm $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 4 13 2.00 * pcmpistrm $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.25 pcmpgtq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pcmpgtq (%rax), %xmm2
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: 1.67 1.67 1.67 - 10.00 - - - 20.50 20.50 20.50 20.50 2.50 2.50 - 3.33 3.33 3.33 3.33 3.33 3.33 - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - crc32b %al, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 1.00 - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - crc32b (%rax), %ecx
|
||||
# CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - crc32l %eax, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 1.00 - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - crc32l (%rax), %ecx
|
||||
# CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - crc32w %ax, %ecx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 1.00 - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - crc32w (%rax), %ecx
|
||||
# CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - crc32b %al, %rcx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 1.00 - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - crc32b (%rax), %rcx
|
||||
# CHECK-NEXT: - - - - 1.00 - - - - - - - - - - - - - - - - - - crc32q %rax, %rcx
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - 1.00 - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - crc32q (%rax), %rcx
|
||||
# CHECK-NEXT: - - - - - - - - 3.00 3.00 3.00 3.00 - - - - - - - - - - - pcmpestri $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 3.00 3.00 3.00 3.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pcmpestri $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 3.00 3.00 3.00 3.00 - - - - - - - - - - - pcmpestrm $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 3.00 3.00 3.00 3.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pcmpestrm $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 2.00 2.00 2.00 - - - - - - - - - - - pcmpistri $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 2.00 2.00 2.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pcmpistri $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 2.00 2.00 2.00 - - - - - - - - - - - pcmpistrm $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 2.00 2.00 2.00 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pcmpistrm $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - pcmpgtq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pcmpgtq (%rax), %xmm2
|
|
@ -0,0 +1,65 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
extrq %xmm0, %xmm2
|
||||
extrq $22, $2, %xmm2
|
||||
|
||||
insertq %xmm0, %xmm2
|
||||
insertq $22, $22, %xmm0, %xmm2
|
||||
|
||||
movntsd %xmm0, (%rax)
|
||||
movntss %xmm0, (%rax)
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 3 0.50 extrq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 2 3 0.50 extrq $22, $2, %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 insertq %xmm0, %xmm2
|
||||
# CHECK-NEXT: 2 3 0.50 insertq $22, $22, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 1 1.00 * movntsd %xmm0, (%rax)
|
||||
# CHECK-NEXT: 1 1 1.00 * movntss %xmm0, (%rax)
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: - - - - - - - - - 2.00 2.00 - 3.00 3.00 2.00 0.67 0.67 0.67 - - - 1.00 1.00
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - - - - - - - - - extrq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - - - - - - - - - extrq $22, $2, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - - - - - - - - - insertq %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - - - - - - - - - insertq $22, $22, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movntsd %xmm0, (%rax)
|
||||
# CHECK-NEXT: - - - - - - - - - - - - 0.50 0.50 1.00 0.33 0.33 0.33 - - - 0.50 0.50 movntss %xmm0, (%rax)
|
|
@ -0,0 +1,268 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
pabsb %mm0, %mm2
|
||||
pabsb (%rax), %mm2
|
||||
|
||||
pabsb %xmm0, %xmm2
|
||||
pabsb (%rax), %xmm2
|
||||
|
||||
pabsd %mm0, %mm2
|
||||
pabsd (%rax), %mm2
|
||||
|
||||
pabsd %xmm0, %xmm2
|
||||
pabsd (%rax), %xmm2
|
||||
|
||||
pabsw %mm0, %mm2
|
||||
pabsw (%rax), %mm2
|
||||
|
||||
pabsw %xmm0, %xmm2
|
||||
pabsw (%rax), %xmm2
|
||||
|
||||
palignr $1, %mm0, %mm2
|
||||
palignr $1, (%rax), %mm2
|
||||
|
||||
palignr $1, %xmm0, %xmm2
|
||||
palignr $1, (%rax), %xmm2
|
||||
|
||||
phaddd %mm0, %mm2
|
||||
phaddd (%rax), %mm2
|
||||
|
||||
phaddd %xmm0, %xmm2
|
||||
phaddd (%rax), %xmm2
|
||||
|
||||
phaddsw %mm0, %mm2
|
||||
phaddsw (%rax), %mm2
|
||||
|
||||
phaddsw %xmm0, %xmm2
|
||||
phaddsw (%rax), %xmm2
|
||||
|
||||
phaddw %mm0, %mm2
|
||||
phaddw (%rax), %mm2
|
||||
|
||||
phaddw %xmm0, %xmm2
|
||||
phaddw (%rax), %xmm2
|
||||
|
||||
phsubd %mm0, %mm2
|
||||
phsubd (%rax), %mm2
|
||||
|
||||
phsubd %xmm0, %xmm2
|
||||
phsubd (%rax), %xmm2
|
||||
|
||||
phsubsw %mm0, %mm2
|
||||
phsubsw (%rax), %mm2
|
||||
|
||||
phsubsw %xmm0, %xmm2
|
||||
phsubsw (%rax), %xmm2
|
||||
|
||||
phsubw %mm0, %mm2
|
||||
phsubw (%rax), %mm2
|
||||
|
||||
phsubw %xmm0, %xmm2
|
||||
phsubw (%rax), %xmm2
|
||||
|
||||
pmaddubsw %mm0, %mm2
|
||||
pmaddubsw (%rax), %mm2
|
||||
|
||||
pmaddubsw %xmm0, %xmm2
|
||||
pmaddubsw (%rax), %xmm2
|
||||
|
||||
pmulhrsw %mm0, %mm2
|
||||
pmulhrsw (%rax), %mm2
|
||||
|
||||
pmulhrsw %xmm0, %xmm2
|
||||
pmulhrsw (%rax), %xmm2
|
||||
|
||||
pshufb %mm0, %mm2
|
||||
pshufb (%rax), %mm2
|
||||
|
||||
pshufb %xmm0, %xmm2
|
||||
pshufb (%rax), %xmm2
|
||||
|
||||
psignb %mm0, %mm2
|
||||
psignb (%rax), %mm2
|
||||
|
||||
psignb %xmm0, %xmm2
|
||||
psignb (%rax), %xmm2
|
||||
|
||||
psignd %mm0, %mm2
|
||||
psignd (%rax), %mm2
|
||||
|
||||
psignd %xmm0, %xmm2
|
||||
psignd (%rax), %xmm2
|
||||
|
||||
psignw %mm0, %mm2
|
||||
psignw (%rax), %mm2
|
||||
|
||||
psignw %xmm0, %xmm2
|
||||
psignw (%rax), %xmm2
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 1 1 0.50 pabsb %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pabsb (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 pabsb %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pabsb (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pabsd %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pabsd (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 pabsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pabsd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pabsw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pabsw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 pabsw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pabsw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 palignr $1, %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * palignr $1, (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 palignr $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * palignr $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: 3 2 2.00 phaddd %mm0, %mm2
|
||||
# CHECK-NEXT: 4 9 2.00 * phaddd (%rax), %mm2
|
||||
# CHECK-NEXT: 4 2 2.00 phaddd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 4 9 2.00 * phaddd (%rax), %xmm2
|
||||
# CHECK-NEXT: 3 2 2.00 phaddsw %mm0, %mm2
|
||||
# CHECK-NEXT: 4 9 2.00 * phaddsw (%rax), %mm2
|
||||
# CHECK-NEXT: 4 2 2.00 phaddsw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 4 9 2.00 * phaddsw (%rax), %xmm2
|
||||
# CHECK-NEXT: 3 2 2.00 phaddw %mm0, %mm2
|
||||
# CHECK-NEXT: 4 9 2.00 * phaddw (%rax), %mm2
|
||||
# CHECK-NEXT: 4 2 2.00 phaddw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 4 9 2.00 * phaddw (%rax), %xmm2
|
||||
# CHECK-NEXT: 3 2 2.00 phsubd %mm0, %mm2
|
||||
# CHECK-NEXT: 4 9 2.00 * phsubd (%rax), %mm2
|
||||
# CHECK-NEXT: 4 2 2.00 phsubd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 4 9 2.00 * phsubd (%rax), %xmm2
|
||||
# CHECK-NEXT: 3 2 2.00 phsubsw %mm0, %mm2
|
||||
# CHECK-NEXT: 4 9 2.00 * phsubsw (%rax), %mm2
|
||||
# CHECK-NEXT: 4 2 2.00 phsubsw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 4 9 2.00 * phsubsw (%rax), %xmm2
|
||||
# CHECK-NEXT: 3 2 2.00 phsubw %mm0, %mm2
|
||||
# CHECK-NEXT: 4 9 2.00 * phsubw (%rax), %mm2
|
||||
# CHECK-NEXT: 4 2 2.00 phsubw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 4 9 2.00 * phsubw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 pmaddubsw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 10 0.50 * pmaddubsw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 3 0.50 pmaddubsw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * pmaddubsw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 3 0.50 pmulhrsw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 10 0.50 * pmulhrsw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 3 0.50 pmulhrsw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 10 0.50 * pmulhrsw (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 pshufb %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pshufb (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 pshufb %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * pshufb (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psignb %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psignb (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psignb %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psignb (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psignd %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psignd (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psignd %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psignd (%rax), %xmm2
|
||||
# CHECK-NEXT: 1 1 0.50 psignw %mm0, %mm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psignw (%rax), %mm2
|
||||
# CHECK-NEXT: 1 1 0.50 psignw %xmm0, %xmm2
|
||||
# CHECK-NEXT: 1 8 0.50 * psignw (%rax), %xmm2
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: - - - - - - - - 61.00 13.00 7.00 7.00 16.00 16.00 - 10.67 10.67 10.67 10.67 10.67 10.67 - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - pabsb %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pabsb (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - pabsb %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pabsb (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - pabsd %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pabsd (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - pabsd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pabsd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - pabsw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pabsw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - pabsw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pabsw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - palignr $1, %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - palignr $1, (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - palignr $1, %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - palignr $1, (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phaddd %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phaddd (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phaddd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phaddd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phaddsw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phaddsw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phaddsw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phaddsw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phaddw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phaddw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phaddw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phaddw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phsubd %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phsubd (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phsubd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phsubd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phsubsw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phsubsw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phsubsw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phsubsw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phsubw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phsubw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - - - - - - - - - - - - phsubw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 2.00 - - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - phsubw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmaddubsw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmaddubsw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmaddubsw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmaddubsw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmulhrsw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmulhrsw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 - - - - - - - - - - - pmulhrsw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 - - 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pmulhrsw (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pshufb %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pshufb (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - - - - - - - - - - - - pshufb %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - - 0.50 0.50 - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - pshufb (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - psignb %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psignb (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - psignb %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psignb (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - psignd %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psignd (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - psignd %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psignd (%rax), %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - psignw %mm0, %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psignw (%rax), %mm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - psignw %xmm0, %xmm2
|
||||
# CHECK-NEXT: - - - - - - - - 0.25 0.25 0.25 0.25 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - psignw (%rax), %xmm2
|
|
@ -0,0 +1,93 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=i686-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
aaa
|
||||
|
||||
aad
|
||||
aad $7
|
||||
|
||||
aam
|
||||
aam $7
|
||||
|
||||
aas
|
||||
|
||||
bound %bx, (%eax)
|
||||
bound %ebx, (%eax)
|
||||
|
||||
daa
|
||||
|
||||
das
|
||||
|
||||
into
|
||||
|
||||
leave
|
||||
|
||||
salc
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 100 100 25.00 aaa
|
||||
# CHECK-NEXT: 100 100 25.00 aad
|
||||
# CHECK-NEXT: 100 100 25.00 aad $7
|
||||
# CHECK-NEXT: 100 100 25.00 aam
|
||||
# CHECK-NEXT: 100 100 25.00 aam $7
|
||||
# CHECK-NEXT: 100 100 25.00 aas
|
||||
# CHECK-NEXT: 100 100 25.00 U bound %bx, (%eax)
|
||||
# CHECK-NEXT: 100 100 25.00 U bound %ebx, (%eax)
|
||||
# CHECK-NEXT: 100 100 25.00 daa
|
||||
# CHECK-NEXT: 100 100 25.00 das
|
||||
# CHECK-NEXT: 100 100 25.00 U into
|
||||
# CHECK-NEXT: 1 1 0.25 * leave
|
||||
# CHECK-NEXT: 1 1 0.25 U salc
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: - - - 275.50 275.50 275.50 275.50 - - - - - - - - - - - - - - - -
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - aaa
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - aad
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - aad $7
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - aam
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - aam $7
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - aas
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - bound %bx, (%eax)
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - bound %ebx, (%eax)
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - daa
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - das
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - into
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - leave
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - salc
|
File diff suppressed because it is too large
Load Diff
|
@ -0,0 +1,536 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -instruction-tables < %s | FileCheck %s
|
||||
|
||||
f2xm1
|
||||
|
||||
fabs
|
||||
|
||||
fadd %st, %st(1)
|
||||
fadd %st(2)
|
||||
fadds (%ecx)
|
||||
faddl (%ecx)
|
||||
faddp %st(1)
|
||||
faddp %st(2)
|
||||
fiadds (%ecx)
|
||||
fiaddl (%ecx)
|
||||
|
||||
fbld (%ecx)
|
||||
fbstp (%eax)
|
||||
|
||||
fchs
|
||||
|
||||
fnclex
|
||||
|
||||
fcmovb %st(1), %st
|
||||
fcmovbe %st(1), %st
|
||||
fcmove %st(1), %st
|
||||
fcmovnb %st(1), %st
|
||||
fcmovnbe %st(1), %st
|
||||
fcmovne %st(1), %st
|
||||
fcmovnu %st(1), %st
|
||||
fcmovu %st(1), %st
|
||||
|
||||
fcom %st(1)
|
||||
fcom %st(3)
|
||||
fcoms (%ecx)
|
||||
fcoml (%eax)
|
||||
fcomp %st(1)
|
||||
fcomp %st(3)
|
||||
fcomps (%ecx)
|
||||
fcompl (%eax)
|
||||
fcompp
|
||||
|
||||
fcomi %st(3)
|
||||
fcompi %st(3)
|
||||
|
||||
fcos
|
||||
|
||||
fdecstp
|
||||
|
||||
fdiv %st, %st(1)
|
||||
fdiv %st(2)
|
||||
fdivs (%ecx)
|
||||
fdivl (%eax)
|
||||
fdivp %st(1)
|
||||
fdivp %st(2)
|
||||
fidivs (%ecx)
|
||||
fidivl (%eax)
|
||||
|
||||
fdivr %st, %st(1)
|
||||
fdivr %st(2)
|
||||
fdivrs (%ecx)
|
||||
fdivrl (%eax)
|
||||
fdivrp %st(1)
|
||||
fdivrp %st(2)
|
||||
fidivrs (%ecx)
|
||||
fidivrl (%eax)
|
||||
|
||||
ffree %st(0)
|
||||
|
||||
ficoms (%ecx)
|
||||
ficoml (%eax)
|
||||
ficomps (%ecx)
|
||||
ficompl (%eax)
|
||||
|
||||
filds (%edx)
|
||||
fildl (%ecx)
|
||||
fildll (%eax)
|
||||
|
||||
fincstp
|
||||
|
||||
fninit
|
||||
|
||||
fists (%edx)
|
||||
fistl (%ecx)
|
||||
fistps (%edx)
|
||||
fistpl (%ecx)
|
||||
fistpll (%eax)
|
||||
|
||||
fisttps (%edx)
|
||||
fisttpl (%ecx)
|
||||
fisttpll (%eax)
|
||||
|
||||
fld %st(0)
|
||||
flds (%edx)
|
||||
fldl (%ecx)
|
||||
fldt (%eax)
|
||||
|
||||
fldcw (%eax)
|
||||
fldenv (%eax)
|
||||
|
||||
fld1
|
||||
fldl2e
|
||||
fldl2t
|
||||
fldlg2
|
||||
fldln2
|
||||
fldpi
|
||||
fldz
|
||||
|
||||
fmul %st, %st(1)
|
||||
fmul %st(2)
|
||||
fmuls (%ecx)
|
||||
fmull (%eax)
|
||||
fmulp %st(1)
|
||||
fmulp %st(2)
|
||||
fimuls (%ecx)
|
||||
fimull (%eax)
|
||||
|
||||
fnop
|
||||
|
||||
fpatan
|
||||
|
||||
fprem
|
||||
fprem1
|
||||
|
||||
fptan
|
||||
|
||||
frndint
|
||||
|
||||
frstor (%eax)
|
||||
|
||||
fnsave (%eax)
|
||||
|
||||
fscale
|
||||
|
||||
fsin
|
||||
|
||||
fsincos
|
||||
|
||||
fsqrt
|
||||
|
||||
fst %st(0)
|
||||
fsts (%edx)
|
||||
fstl (%ecx)
|
||||
fstp %st(0)
|
||||
fstpl (%edx)
|
||||
fstpl (%ecx)
|
||||
fstpt (%eax)
|
||||
|
||||
fnstcw (%eax)
|
||||
fnstenv (%eax)
|
||||
fnstsw (%eax)
|
||||
|
||||
frstor (%eax)
|
||||
fsave (%eax)
|
||||
|
||||
fsub %st, %st(1)
|
||||
fsub %st(2)
|
||||
fsubs (%ecx)
|
||||
fsubl (%eax)
|
||||
fsubp %st(1)
|
||||
fsubp %st(2)
|
||||
fisubs (%ecx)
|
||||
fisubl (%eax)
|
||||
|
||||
fsubr %st, %st(1)
|
||||
fsubr %st(2)
|
||||
fsubrs (%ecx)
|
||||
fsubrl (%eax)
|
||||
fsubrp %st(1)
|
||||
fsubrp %st(2)
|
||||
fisubrs (%ecx)
|
||||
fisubrl (%eax)
|
||||
|
||||
ftst
|
||||
|
||||
fucom %st(1)
|
||||
fucom %st(3)
|
||||
fucomp %st(1)
|
||||
fucomp %st(3)
|
||||
fucompp
|
||||
|
||||
fucomi %st(3)
|
||||
fucompi %st(3)
|
||||
|
||||
fwait
|
||||
|
||||
fxam
|
||||
|
||||
fxch %st(1)
|
||||
fxch %st(3)
|
||||
|
||||
fxrstor (%eax)
|
||||
fxsave (%eax)
|
||||
|
||||
fxtract
|
||||
|
||||
fyl2x
|
||||
fyl2xp1
|
||||
|
||||
# CHECK: Instruction Info:
|
||||
# CHECK-NEXT: [1]: #uOps
|
||||
# CHECK-NEXT: [2]: Latency
|
||||
# CHECK-NEXT: [3]: RThroughput
|
||||
# CHECK-NEXT: [4]: MayLoad
|
||||
# CHECK-NEXT: [5]: MayStore
|
||||
# CHECK-NEXT: [6]: HasSideEffects (U)
|
||||
|
||||
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
|
||||
# CHECK-NEXT: 100 100 25.00 U f2xm1
|
||||
# CHECK-NEXT: 1 1 1.00 U fabs
|
||||
# CHECK-NEXT: 1 3 0.50 U fadd %st, %st(1)
|
||||
# CHECK-NEXT: 1 3 0.50 U fadd %st(2), %st
|
||||
# CHECK-NEXT: 1 10 0.50 * U fadds (%ecx)
|
||||
# CHECK-NEXT: 1 10 0.50 * U faddl (%ecx)
|
||||
# CHECK-NEXT: 1 3 0.50 U faddp %st, %st(1)
|
||||
# CHECK-NEXT: 1 3 0.50 U faddp %st, %st(2)
|
||||
# CHECK-NEXT: 2 5 6.00 * U fiadds (%ecx)
|
||||
# CHECK-NEXT: 2 5 6.00 * U fiaddl (%ecx)
|
||||
# CHECK-NEXT: 100 100 25.00 * U fbld (%ecx)
|
||||
# CHECK-NEXT: 100 100 25.00 * U fbstp (%eax)
|
||||
# CHECK-NEXT: 1 1 1.00 U fchs
|
||||
# CHECK-NEXT: 100 100 25.00 U fnclex
|
||||
# CHECK-NEXT: 7 7 7.00 U fcmovb %st(1), %st
|
||||
# CHECK-NEXT: 7 7 7.00 U fcmovbe %st(1), %st
|
||||
# CHECK-NEXT: 7 7 7.00 U fcmove %st(1), %st
|
||||
# CHECK-NEXT: 7 7 7.00 U fcmovnb %st(1), %st
|
||||
# CHECK-NEXT: 7 7 7.00 U fcmovnbe %st(1), %st
|
||||
# CHECK-NEXT: 7 7 7.00 U fcmovne %st(1), %st
|
||||
# CHECK-NEXT: 7 7 7.00 U fcmovnu %st(1), %st
|
||||
# CHECK-NEXT: 7 7 7.00 U fcmovu %st(1), %st
|
||||
# CHECK-NEXT: 1 3 1.00 U fcom %st(1)
|
||||
# CHECK-NEXT: 1 3 1.00 U fcom %st(3)
|
||||
# CHECK-NEXT: 1 10 1.00 * U fcoms (%ecx)
|
||||
# CHECK-NEXT: 1 10 1.00 * U fcoml (%eax)
|
||||
# CHECK-NEXT: 1 3 1.00 U fcomp %st(1)
|
||||
# CHECK-NEXT: 1 3 1.00 U fcomp %st(3)
|
||||
# CHECK-NEXT: 1 10 1.00 * U fcomps (%ecx)
|
||||
# CHECK-NEXT: 1 10 1.00 * U fcompl (%eax)
|
||||
# CHECK-NEXT: 100 100 25.00 U fcompp
|
||||
# CHECK-NEXT: 1 3 1.00 U fcomi %st(3), %st
|
||||
# CHECK-NEXT: 1 3 1.00 U fcompi %st(3), %st
|
||||
# CHECK-NEXT: 100 100 25.00 U fcos
|
||||
# CHECK-NEXT: 100 100 25.00 U fdecstp
|
||||
# CHECK-NEXT: 1 11 3.00 U fdiv %st, %st(1)
|
||||
# CHECK-NEXT: 1 11 3.00 U fdiv %st(2), %st
|
||||
# CHECK-NEXT: 1 18 3.00 * U fdivs (%ecx)
|
||||
# CHECK-NEXT: 1 18 3.00 * U fdivl (%eax)
|
||||
# CHECK-NEXT: 1 11 3.00 U fdivp %st, %st(1)
|
||||
# CHECK-NEXT: 1 11 3.00 U fdivp %st, %st(2)
|
||||
# CHECK-NEXT: 2 5 15.50 * U fidivs (%ecx)
|
||||
# CHECK-NEXT: 2 5 15.50 * U fidivl (%eax)
|
||||
# CHECK-NEXT: 1 11 3.00 U fdivr %st, %st(1)
|
||||
# CHECK-NEXT: 1 11 3.00 U fdivr %st(2), %st
|
||||
# CHECK-NEXT: 1 18 3.00 * U fdivrs (%ecx)
|
||||
# CHECK-NEXT: 1 18 3.00 * U fdivrl (%eax)
|
||||
# CHECK-NEXT: 1 11 3.00 U fdivrp %st, %st(1)
|
||||
# CHECK-NEXT: 1 11 3.00 U fdivrp %st, %st(2)
|
||||
# CHECK-NEXT: 2 5 15.50 * U fidivrs (%ecx)
|
||||
# CHECK-NEXT: 2 5 15.50 * U fidivrl (%eax)
|
||||
# CHECK-NEXT: 100 100 25.00 U ffree %st(0)
|
||||
# CHECK-NEXT: 1 10 1.00 * U ficoms (%ecx)
|
||||
# CHECK-NEXT: 1 10 1.00 * U ficoml (%eax)
|
||||
# CHECK-NEXT: 1 10 1.00 * U ficomps (%ecx)
|
||||
# CHECK-NEXT: 1 10 1.00 * U ficompl (%eax)
|
||||
# CHECK-NEXT: 1 5 0.33 * U filds (%edx)
|
||||
# CHECK-NEXT: 1 5 0.33 * U fildl (%ecx)
|
||||
# CHECK-NEXT: 1 5 0.33 * U fildll (%eax)
|
||||
# CHECK-NEXT: 100 100 25.00 U fincstp
|
||||
# CHECK-NEXT: 100 100 25.00 U fninit
|
||||
# CHECK-NEXT: 1 1 1.00 * U fists (%edx)
|
||||
# CHECK-NEXT: 1 1 1.00 * U fistl (%ecx)
|
||||
# CHECK-NEXT: 1 1 1.00 * U fistps (%edx)
|
||||
# CHECK-NEXT: 1 1 1.00 * U fistpl (%ecx)
|
||||
# CHECK-NEXT: 1 1 1.00 * U fistpll (%eax)
|
||||
# CHECK-NEXT: 1 1 1.00 * U fisttps (%edx)
|
||||
# CHECK-NEXT: 1 1 1.00 * U fisttpl (%ecx)
|
||||
# CHECK-NEXT: 1 1 1.00 * U fisttpll (%eax)
|
||||
# CHECK-NEXT: 1 1 1.00 U fld %st(0)
|
||||
# CHECK-NEXT: 1 5 0.33 * U flds (%edx)
|
||||
# CHECK-NEXT: 1 5 0.33 * U fldl (%ecx)
|
||||
# CHECK-NEXT: 1 5 0.33 * U fldt (%eax)
|
||||
# CHECK-NEXT: 1 5 0.33 * U fldcw (%eax)
|
||||
# CHECK-NEXT: 100 100 25.00 * U fldenv (%eax)
|
||||
# CHECK-NEXT: 1 11 1.00 U fld1
|
||||
# CHECK-NEXT: 1 11 1.00 U fldl2e
|
||||
# CHECK-NEXT: 1 11 1.00 U fldl2t
|
||||
# CHECK-NEXT: 1 11 1.00 U fldlg2
|
||||
# CHECK-NEXT: 1 11 1.00 U fldln2
|
||||
# CHECK-NEXT: 1 11 1.00 U fldpi
|
||||
# CHECK-NEXT: 1 8 1.00 U fldz
|
||||
# CHECK-NEXT: 1 3 0.50 U fmul %st, %st(1)
|
||||
# CHECK-NEXT: 1 3 0.50 U fmul %st(2), %st
|
||||
# CHECK-NEXT: 1 10 0.50 * U fmuls (%ecx)
|
||||
# CHECK-NEXT: 1 10 0.50 * U fmull (%eax)
|
||||
# CHECK-NEXT: 1 3 0.50 U fmulp %st, %st(1)
|
||||
# CHECK-NEXT: 1 3 0.50 U fmulp %st, %st(2)
|
||||
# CHECK-NEXT: 2 5 6.00 * U fimuls (%ecx)
|
||||
# CHECK-NEXT: 2 5 6.00 * U fimull (%eax)
|
||||
# CHECK-NEXT: 1 0 0.25 U fnop
|
||||
# CHECK-NEXT: 100 100 25.00 U fpatan
|
||||
# CHECK-NEXT: 100 100 25.00 U fprem
|
||||
# CHECK-NEXT: 100 100 25.00 U fprem1
|
||||
# CHECK-NEXT: 100 100 25.00 U fptan
|
||||
# CHECK-NEXT: 100 100 25.00 U frndint
|
||||
# CHECK-NEXT: 100 100 25.00 * U frstor (%eax)
|
||||
# CHECK-NEXT: 100 100 25.00 * U fnsave (%eax)
|
||||
# CHECK-NEXT: 100 100 25.00 U fscale
|
||||
# CHECK-NEXT: 100 100 25.00 U fsin
|
||||
# CHECK-NEXT: 100 100 25.00 U fsincos
|
||||
# CHECK-NEXT: 1 22 23.00 U fsqrt
|
||||
# CHECK-NEXT: 1 1 1.00 U fst %st(0)
|
||||
# CHECK-NEXT: 1 1 1.00 * U fsts (%edx)
|
||||
# CHECK-NEXT: 1 1 1.00 * U fstl (%ecx)
|
||||
# CHECK-NEXT: 1 1 1.00 U fstp %st(0)
|
||||
# CHECK-NEXT: 1 1 1.00 * U fstpl (%edx)
|
||||
# CHECK-NEXT: 1 1 1.00 * U fstpl (%ecx)
|
||||
# CHECK-NEXT: 1 1 1.00 * U fstpt (%eax)
|
||||
# CHECK-NEXT: 1 1 0.25 * U fnstcw (%eax)
|
||||
# CHECK-NEXT: 100 100 25.00 * U fnstenv (%eax)
|
||||
# CHECK-NEXT: 100 100 25.00 * U fnstsw (%eax)
|
||||
# CHECK-NEXT: 100 100 25.00 * U frstor (%eax)
|
||||
# CHECK-NEXT: 100 100 25.00 U wait
|
||||
# CHECK-NEXT: 100 100 25.00 * U fnsave (%eax)
|
||||
# CHECK-NEXT: 1 3 0.50 U fsub %st, %st(1)
|
||||
# CHECK-NEXT: 1 3 0.50 U fsub %st(2), %st
|
||||
# CHECK-NEXT: 1 10 0.50 * U fsubs (%ecx)
|
||||
# CHECK-NEXT: 1 10 0.50 * U fsubl (%eax)
|
||||
# CHECK-NEXT: 1 3 0.50 U fsubp %st, %st(1)
|
||||
# CHECK-NEXT: 1 3 0.50 U fsubp %st, %st(2)
|
||||
# CHECK-NEXT: 2 5 6.00 * U fisubs (%ecx)
|
||||
# CHECK-NEXT: 2 5 6.00 * U fisubl (%eax)
|
||||
# CHECK-NEXT: 1 3 0.50 U fsubr %st, %st(1)
|
||||
# CHECK-NEXT: 1 3 0.50 U fsubr %st(2), %st
|
||||
# CHECK-NEXT: 1 10 0.50 * U fsubrs (%ecx)
|
||||
# CHECK-NEXT: 1 10 0.50 * U fsubrl (%eax)
|
||||
# CHECK-NEXT: 1 3 0.50 U fsubrp %st, %st(1)
|
||||
# CHECK-NEXT: 1 3 0.50 U fsubrp %st, %st(2)
|
||||
# CHECK-NEXT: 2 5 6.00 * U fisubrs (%ecx)
|
||||
# CHECK-NEXT: 2 5 6.00 * U fisubrl (%eax)
|
||||
# CHECK-NEXT: 1 3 1.00 U ftst
|
||||
# CHECK-NEXT: 1 3 1.00 U fucom %st(1)
|
||||
# CHECK-NEXT: 1 3 1.00 U fucom %st(3)
|
||||
# CHECK-NEXT: 1 3 1.00 U fucomp %st(1)
|
||||
# CHECK-NEXT: 1 3 1.00 U fucomp %st(3)
|
||||
# CHECK-NEXT: 1 3 1.00 U fucompp
|
||||
# CHECK-NEXT: 1 3 1.00 U fucomi %st(3), %st
|
||||
# CHECK-NEXT: 1 3 1.00 U fucompi %st(3), %st
|
||||
# CHECK-NEXT: 100 100 25.00 U wait
|
||||
# CHECK-NEXT: 100 100 25.00 U fxam
|
||||
# CHECK-NEXT: 1 1 1.00 U fxch %st(1)
|
||||
# CHECK-NEXT: 1 1 1.00 U fxch %st(3)
|
||||
# CHECK-NEXT: 100 100 25.00 * * U fxrstor (%eax)
|
||||
# CHECK-NEXT: 100 100 25.00 * * U fxsave (%eax)
|
||||
# CHECK-NEXT: 100 100 25.00 U fxtract
|
||||
# CHECK-NEXT: 100 100 25.00 U fyl2x
|
||||
# CHECK-NEXT: 100 100 25.00 U fyl2xp1
|
||||
|
||||
# CHECK: Resources:
|
||||
# CHECK-NEXT: [0] - Zn3AGU0
|
||||
# CHECK-NEXT: [1] - Zn3AGU1
|
||||
# CHECK-NEXT: [2] - Zn3AGU2
|
||||
# CHECK-NEXT: [3] - Zn3ALU0
|
||||
# CHECK-NEXT: [4] - Zn3ALU1
|
||||
# CHECK-NEXT: [5] - Zn3ALU2
|
||||
# CHECK-NEXT: [6] - Zn3ALU3
|
||||
# CHECK-NEXT: [7] - Zn3BRU1
|
||||
# CHECK-NEXT: [8] - Zn3FPP0
|
||||
# CHECK-NEXT: [9] - Zn3FPP1
|
||||
# CHECK-NEXT: [10] - Zn3FPP2
|
||||
# CHECK-NEXT: [11] - Zn3FPP3
|
||||
# CHECK-NEXT: [12.0] - Zn3FPP45
|
||||
# CHECK-NEXT: [12.1] - Zn3FPP45
|
||||
# CHECK-NEXT: [13] - Zn3FPSt
|
||||
# CHECK-NEXT: [14.0] - Zn3LSU
|
||||
# CHECK-NEXT: [14.1] - Zn3LSU
|
||||
# CHECK-NEXT: [14.2] - Zn3LSU
|
||||
# CHECK-NEXT: [15.0] - Zn3Load
|
||||
# CHECK-NEXT: [15.1] - Zn3Load
|
||||
# CHECK-NEXT: [15.2] - Zn3Load
|
||||
# CHECK-NEXT: [16.0] - Zn3Store
|
||||
# CHECK-NEXT: [16.1] - Zn3Store
|
||||
|
||||
# CHECK: Resource pressure per iteration:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1]
|
||||
# CHECK-NEXT: 10.67 10.67 10.67 886.50 886.50 886.50 886.50 - 137.00 203.00 119.00 119.00 13.50 13.50 - 24.00 24.00 24.00 15.33 15.33 15.33 13.00 13.00
|
||||
|
||||
# CHECK: Resource pressure by instruction:
|
||||
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12.0] [12.1] [13] [14.0] [14.1] [14.2] [15.0] [15.1] [15.2] [16.0] [16.1] Instructions:
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - f2xm1
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - fabs
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - fadd %st, %st(1)
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - fadd %st(2), %st
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fadds (%ecx)
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - faddl (%ecx)
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - faddp %st, %st(1)
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - faddp %st, %st(2)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - 6.00 6.00 6.00 6.00 - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - fiadds (%ecx)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - 6.00 6.00 6.00 6.00 - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - fiaddl (%ecx)
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fbld (%ecx)
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fbstp (%eax)
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - fchs
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fnclex
|
||||
# CHECK-NEXT: - - - 7.00 7.00 7.00 7.00 - - - - - - - - - - - - - - - - fcmovb %st(1), %st
|
||||
# CHECK-NEXT: - - - 7.00 7.00 7.00 7.00 - - - - - - - - - - - - - - - - fcmovbe %st(1), %st
|
||||
# CHECK-NEXT: - - - 7.00 7.00 7.00 7.00 - - - - - - - - - - - - - - - - fcmove %st(1), %st
|
||||
# CHECK-NEXT: - - - 7.00 7.00 7.00 7.00 - - - - - - - - - - - - - - - - fcmovnb %st(1), %st
|
||||
# CHECK-NEXT: - - - 7.00 7.00 7.00 7.00 - - - - - - - - - - - - - - - - fcmovnbe %st(1), %st
|
||||
# CHECK-NEXT: - - - 7.00 7.00 7.00 7.00 - - - - - - - - - - - - - - - - fcmovne %st(1), %st
|
||||
# CHECK-NEXT: - - - 7.00 7.00 7.00 7.00 - - - - - - - - - - - - - - - - fcmovnu %st(1), %st
|
||||
# CHECK-NEXT: - - - 7.00 7.00 7.00 7.00 - - - - - - - - - - - - - - - - fcmovu %st(1), %st
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - fcom %st(1)
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - fcom %st(3)
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fcoms (%ecx)
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fcoml (%eax)
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - fcomp %st(1)
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - fcomp %st(3)
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fcomps (%ecx)
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fcompl (%eax)
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fcompp
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - fcomi %st(3), %st
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - fcompi %st(3), %st
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fcos
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fdecstp
|
||||
# CHECK-NEXT: - - - - - - - - - 3.00 - - - - - - - - - - - - - fdiv %st, %st(1)
|
||||
# CHECK-NEXT: - - - - - - - - - 3.00 - - - - - - - - - - - - - fdiv %st(2), %st
|
||||
# CHECK-NEXT: - - - - - - - - - 3.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fdivs (%ecx)
|
||||
# CHECK-NEXT: - - - - - - - - - 3.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fdivl (%eax)
|
||||
# CHECK-NEXT: - - - - - - - - - 3.00 - - - - - - - - - - - - - fdivp %st, %st(1)
|
||||
# CHECK-NEXT: - - - - - - - - - 3.00 - - - - - - - - - - - - - fdivp %st, %st(2)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - 15.50 15.50 15.50 15.50 - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - fidivs (%ecx)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - 15.50 15.50 15.50 15.50 - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - fidivl (%eax)
|
||||
# CHECK-NEXT: - - - - - - - - - 3.00 - - - - - - - - - - - - - fdivr %st, %st(1)
|
||||
# CHECK-NEXT: - - - - - - - - - 3.00 - - - - - - - - - - - - - fdivr %st(2), %st
|
||||
# CHECK-NEXT: - - - - - - - - - 3.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fdivrs (%ecx)
|
||||
# CHECK-NEXT: - - - - - - - - - 3.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fdivrl (%eax)
|
||||
# CHECK-NEXT: - - - - - - - - - 3.00 - - - - - - - - - - - - - fdivrp %st, %st(1)
|
||||
# CHECK-NEXT: - - - - - - - - - 3.00 - - - - - - - - - - - - - fdivrp %st, %st(2)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - 15.50 15.50 15.50 15.50 - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - fidivrs (%ecx)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - 15.50 15.50 15.50 15.50 - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - fidivrl (%eax)
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - ffree %st(0)
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - ficoms (%ecx)
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - ficoml (%eax)
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - ficomps (%ecx)
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - ficompl (%eax)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - filds (%edx)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - fildl (%ecx)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - fildll (%eax)
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fincstp
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fninit
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.67 0.67 0.67 - - - 1.00 1.00 fists (%edx)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.67 0.67 0.67 - - - 1.00 1.00 fistl (%ecx)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.67 0.67 0.67 - - - 1.00 1.00 fistps (%edx)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.67 0.67 0.67 - - - 1.00 1.00 fistpl (%ecx)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.67 0.67 0.67 - - - 1.00 1.00 fistpll (%eax)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.67 0.67 0.67 - - - 1.00 1.00 fisttps (%edx)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.67 0.67 0.67 - - - 1.00 1.00 fisttpl (%ecx)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.67 0.67 0.67 - - - 1.00 1.00 fisttpll (%eax)
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - fld %st(0)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - flds (%edx)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - fldl (%ecx)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - fldt (%eax)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - fldcw (%eax)
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fldenv (%eax)
|
||||
# CHECK-NEXT: - - - - - - - - - 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fld1
|
||||
# CHECK-NEXT: - - - - - - - - - 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fldl2e
|
||||
# CHECK-NEXT: - - - - - - - - - 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fldl2t
|
||||
# CHECK-NEXT: - - - - - - - - - 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fldlg2
|
||||
# CHECK-NEXT: - - - - - - - - - 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fldln2
|
||||
# CHECK-NEXT: - - - - - - - - - 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fldpi
|
||||
# CHECK-NEXT: - - - - - - - - - 1.00 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fldz
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - fmul %st, %st(1)
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - fmul %st(2), %st
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fmuls (%ecx)
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fmull (%eax)
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - fmulp %st, %st(1)
|
||||
# CHECK-NEXT: - - - - - - - - 0.50 0.50 - - - - - - - - - - - - - fmulp %st, %st(2)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - 6.00 6.00 6.00 6.00 - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - fimuls (%ecx)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - 6.00 6.00 6.00 6.00 - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - fimull (%eax)
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - fnop
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fpatan
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fprem
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fprem1
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fptan
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - frndint
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - frstor (%eax)
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fnsave (%eax)
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fscale
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fsin
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fsincos
|
||||
# CHECK-NEXT: - - - - - - - - - 23.00 - - - - - - - - - - - - - fsqrt
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - fst %st(0)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.67 0.67 0.67 - - - 1.00 1.00 fsts (%edx)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.67 0.67 0.67 - - - 1.00 1.00 fstl (%ecx)
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - fstp %st(0)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.67 0.67 0.67 - - - 1.00 1.00 fstpl (%edx)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.67 0.67 0.67 - - - 1.00 1.00 fstpl (%ecx)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - - - - - - - - 0.67 0.67 0.67 - - - 1.00 1.00 fstpt (%eax)
|
||||
# CHECK-NEXT: - - - 0.25 0.25 0.25 0.25 - - - - - - - - - - - - - - - - fnstcw (%eax)
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fnstenv (%eax)
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fnstsw (%eax)
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - frstor (%eax)
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - wait
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fnsave (%eax)
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - fsub %st, %st(1)
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - fsub %st(2), %st
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fsubs (%ecx)
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fsubl (%eax)
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - fsubp %st, %st(1)
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - fsubp %st, %st(2)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - 6.00 6.00 6.00 6.00 - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - fisubs (%ecx)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - 6.00 6.00 6.00 6.00 - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - fisubl (%eax)
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - fsubr %st, %st(1)
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - fsubr %st(2), %st
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fsubrs (%ecx)
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 0.50 0.50 - 0.33 0.33 0.33 0.33 0.33 0.33 - - fsubrl (%eax)
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - fsubrp %st, %st(1)
|
||||
# CHECK-NEXT: - - - - - - - - - - 0.50 0.50 - - - - - - - - - - - fsubrp %st, %st(2)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - 6.00 6.00 6.00 6.00 - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - fisubrs (%ecx)
|
||||
# CHECK-NEXT: 0.33 0.33 0.33 - - - - - 6.00 6.00 6.00 6.00 - - - 0.33 0.33 0.33 0.33 0.33 0.33 - - fisubrl (%eax)
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - ftst
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - fucom %st(1)
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - fucom %st(3)
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - fucomp %st(1)
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - fucomp %st(3)
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - fucompp
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - fucomi %st(3), %st
|
||||
# CHECK-NEXT: - - - - - - - - 1.00 1.00 - - - - - - - - - - - - - fucompi %st(3), %st
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - wait
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fxam
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - fxch %st(1)
|
||||
# CHECK-NEXT: - - - 1.00 1.00 1.00 1.00 - - - - - - - - - - - - - - - - fxch %st(3)
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fxrstor (%eax)
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fxsave (%eax)
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fxtract
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fyl2x
|
||||
# CHECK-NEXT: - - - 25.00 25.00 25.00 25.00 - - - - - - - - - - - - - - - - fyl2xp1
|
|
@ -4,6 +4,7 @@
|
|||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=btver2 -resource-pressure=false -instruction-info=false < %s | FileCheck --check-prefixes=ALL,BTVER2 %s
|
||||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=znver1 -resource-pressure=false -instruction-info=false < %s | FileCheck --check-prefixes=ALL,ZNVER1 %s
|
||||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=znver2 -resource-pressure=false -instruction-info=false < %s | FileCheck --check-prefixes=ALL,ZNVER2 %s
|
||||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=znver3 -resource-pressure=false -instruction-info=false < %s | FileCheck --check-prefixes=ALL,ZNVER3 %s
|
||||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=sandybridge -resource-pressure=false -instruction-info=false < %s | FileCheck --check-prefixes=ALL,SANDYBRIDGE %s
|
||||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=ivybridge -resource-pressure=false -instruction-info=false < %s | FileCheck --check-prefixes=ALL,IVYBRIDGE %s
|
||||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=haswell -resource-pressure=false -instruction-info=false < %s | FileCheck --check-prefixes=ALL,HASWELL %s
|
||||
|
@ -84,3 +85,8 @@ add %edi, %eax
|
|||
# ZNVER2-NEXT: uOps Per Cycle: 0.97
|
||||
# ZNVER2-NEXT: IPC: 0.97
|
||||
# ZNVER2-NEXT: Block RThroughput: 0.3
|
||||
|
||||
# ZNVER3: Dispatch Width: 6
|
||||
# ZNVER3-NEXT: uOps Per Cycle: 0.97
|
||||
# ZNVER3-NEXT: IPC: 0.97
|
||||
# ZNVER3-NEXT: Block RThroughput: 0.3
|
||||
|
|
|
@ -1,3 +1,5 @@
|
|||
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
||||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=atom -o /dev/null 2>&1 | FileCheck %s
|
||||
# CHECK: warning: support for in-order CPU 'atom' is experimental.
|
||||
movsbw %al, %di
|
||||
|
||||
# CHECK: warning: support for in-order CPU 'atom' is experimental.
|
||||
|
|
|
@ -8,6 +8,7 @@
|
|||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=btver2 -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,BTVER2
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver1 -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,ZNVER1
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver2 -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,ZNVER2
|
||||
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver3 -iterations=1 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefixes=ALL,ZNVER3
|
||||
|
||||
vdivps %xmm0, %xmm1, %xmm1
|
||||
vaddps (%rax), %xmm1, %xmm1
|
||||
|
@ -42,6 +43,9 @@ vaddps (%rax), %xmm1, %xmm1
|
|||
# ZNVER2-NEXT: Total Cycles: 21
|
||||
# ZNVER2-NEXT: Total uOps: 2
|
||||
|
||||
# ZNVER3-NEXT: Total Cycles: 17
|
||||
# ZNVER3-NEXT: Total uOps: 2
|
||||
|
||||
# BARCELONA: Dispatch Width: 4
|
||||
# BARCELONA-NEXT: uOps Per Cycle: 0.15
|
||||
# BARCELONA-NEXT: IPC: 0.10
|
||||
|
@ -87,6 +91,11 @@ vaddps (%rax), %xmm1, %xmm1
|
|||
# ZNVER2-NEXT: IPC: 0.10
|
||||
# ZNVER2-NEXT: Block RThroughput: 1.0
|
||||
|
||||
# ZNVER3: Dispatch Width: 6
|
||||
# ZNVER3-NEXT: uOps Per Cycle: 0.12
|
||||
# ZNVER3-NEXT: IPC: 0.12
|
||||
# ZNVER3-NEXT: Block RThroughput: 3.0
|
||||
|
||||
# ALL: Timeline view:
|
||||
|
||||
# BARCELONA-NEXT: 0123456789
|
||||
|
@ -116,6 +125,9 @@ vaddps (%rax), %xmm1, %xmm1
|
|||
# ZNVER2-NEXT: 0123456789
|
||||
# ZNVER2-NEXT: Index 0123456789 0
|
||||
|
||||
# ZNVER3-NEXT: 0123456
|
||||
# ZNVER3-NEXT: Index 0123456789
|
||||
|
||||
# BARCELONA: [0,0] DeeeeeeeeeeeeeeER . vdivps %xmm0, %xmm1, %xmm1
|
||||
# BARCELONA-NEXT: [0,1] D========eeeeeeeeeER vaddps (%rax), %xmm1, %xmm1
|
||||
|
||||
|
@ -143,6 +155,9 @@ vaddps (%rax), %xmm1, %xmm1
|
|||
# ZNVER2: [0,0] DeeeeeeeeeeeeeeeER . vdivps %xmm0, %xmm1, %xmm1
|
||||
# ZNVER2-NEXT: [0,1] D========eeeeeeeeeeER vaddps (%rax), %xmm1, %xmm1
|
||||
|
||||
# ZNVER3: [0,0] DeeeeeeeeeeeER .. vdivps %xmm0, %xmm1, %xmm1
|
||||
# ZNVER3-NEXT: [0,1] D====eeeeeeeeeeER vaddps (%rax), %xmm1, %xmm1
|
||||
|
||||
# ALL: Average Wait times (based on the timeline view):
|
||||
# ALL-NEXT: [0]: Executions
|
||||
# ALL-NEXT: [1]: Average time spent waiting in a scheduler's queue
|
||||
|
@ -178,3 +193,6 @@ vaddps (%rax), %xmm1, %xmm1
|
|||
|
||||
# ZNVER2-NEXT: 1. 1 9.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1
|
||||
# ZNVER2-NEXT: 1 5.0 0.5 0.0 <total>
|
||||
|
||||
# ZNVER3-NEXT: 1. 1 5.0 0.0 0.0 vaddps (%rax), %xmm1, %xmm1
|
||||
# ZNVER3-NEXT: 1 3.0 0.5 0.0 <total>
|
||||
|
|
|
@ -5,6 +5,7 @@
|
|||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=btver2 -iterations=1 -all-stats=false -all-views=false -register-file-stats < %s | FileCheck --check-prefixes=ALL,BTVER2 %s
|
||||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=znver1 -iterations=1 -all-stats=false -all-views=false -register-file-stats < %s | FileCheck --check-prefixes=ALL,ZNVER1 %s
|
||||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=znver2 -iterations=1 -all-stats=false -all-views=false -register-file-stats < %s | FileCheck --check-prefixes=ALL,ZNVER2 %s
|
||||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=znver3 -iterations=1 -all-stats=false -all-views=false -register-file-stats < %s | FileCheck --check-prefixes=ALL,ZNVER3 %s
|
||||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=sandybridge -iterations=1 -all-stats=false -all-views=false -register-file-stats < %s | FileCheck --check-prefixes=ALL %s
|
||||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=ivybridge -iterations=1 -all-stats=false -all-views=false -register-file-stats < %s | FileCheck --check-prefixes=ALL %s
|
||||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=haswell -iterations=1 -all-stats=false -all-views=false -register-file-stats < %s | FileCheck --check-prefixes=ALL %s
|
||||
|
@ -44,6 +45,11 @@ xor %eax, %ebx
|
|||
# ZNVER2-NEXT: Total number of mappings created: 0
|
||||
# ZNVER2-NEXT: Max number of mappings used: 0
|
||||
|
||||
# ZNVER3: * Register File #1 -- Zn3FpPRF:
|
||||
# ZNVER3-NEXT: Number of physical registers: 160
|
||||
# ZNVER3-NEXT: Total number of mappings created: 0
|
||||
# ZNVER3-NEXT: Max number of mappings used: 0
|
||||
|
||||
# BDVER2: * Register File #2 -- PdIntegerPRF:
|
||||
# BDVER2-NEXT: Number of physical registers: 96
|
||||
# BDVER2-NEXT: Total number of mappings created: 2
|
||||
|
@ -63,3 +69,8 @@ xor %eax, %ebx
|
|||
# ZNVER2-NEXT: Number of physical registers: 168
|
||||
# ZNVER2-NEXT: Total number of mappings created: 2
|
||||
# ZNVER2-NEXT: Max number of mappings used: 2
|
||||
|
||||
# ZNVER3: * Register File #2 -- Zn3IntegerPRF:
|
||||
# ZNVER3-NEXT: Number of physical registers: 192
|
||||
# ZNVER3-NEXT: Total number of mappings created: 2
|
||||
# ZNVER3-NEXT: Max number of mappings used: 2
|
||||
|
|
|
@ -4,6 +4,7 @@
|
|||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=btver2 -iterations=1 -all-stats=false -all-views=false -scheduler-stats < %s | FileCheck --check-prefixes=ALL,BTVER2 %s
|
||||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=znver1 -iterations=1 -all-stats=false -all-views=false -scheduler-stats < %s | FileCheck --check-prefixes=ALL,ZNVER1 %s
|
||||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=znver2 -iterations=1 -all-stats=false -all-views=false -scheduler-stats < %s | FileCheck --check-prefixes=ALL,ZNVER2 %s
|
||||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=znver3 -iterations=1 -all-stats=false -all-views=false -scheduler-stats < %s | FileCheck --check-prefixes=ALL,ZNVER3 %s
|
||||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=sandybridge -iterations=1 -all-stats=false -all-views=false -scheduler-stats < %s | FileCheck --check-prefixes=ALL,SNB %s
|
||||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=ivybridge -iterations=1 -all-stats=false -all-views=false -scheduler-stats < %s | FileCheck --check-prefixes=ALL,IVB %s
|
||||
# RUN: llvm-mca %s -mtriple=x86_64-unknown-unknown -mcpu=haswell -iterations=1 -all-stats=false -all-views=false -scheduler-stats < %s | FileCheck --check-prefixes=ALL,HSW %s
|
||||
|
@ -95,6 +96,12 @@ xor %eax, %ebx
|
|||
# ZNVER2-NEXT: [3] Maximum number of used buffer entries.
|
||||
# ZNVER2-NEXT: [4] Total number of buffer entries.
|
||||
|
||||
# ZNVER3: Scheduler's queue usage:
|
||||
# ZNVER3-NEXT: [1] Resource name.
|
||||
# ZNVER3-NEXT: [2] Average number of used buffer entries.
|
||||
# ZNVER3-NEXT: [3] Maximum number of used buffer entries.
|
||||
# ZNVER3-NEXT: [4] Total number of buffer entries.
|
||||
|
||||
# BARCELONA: [1] [2] [3] [4]
|
||||
# BARCELONA-NEXT: SBPortAny 0 1 54
|
||||
|
||||
|
@ -139,3 +146,9 @@ xor %eax, %ebx
|
|||
# ZNVER2-NEXT: Zn2AGU 0 0 28
|
||||
# ZNVER2-NEXT: Zn2ALU 0 1 64
|
||||
# ZNVER2-NEXT: Zn2FPU 0 0 36
|
||||
|
||||
# ZNVER3: [1] [2] [3] [4]
|
||||
# ZNVER3-NEXT: Zn3FP 0 0 64
|
||||
# ZNVER3-NEXT: Zn3Int 0 1 96
|
||||
# ZNVER3-NEXT: Zn3Load 0 0 72
|
||||
# ZNVER3-NEXT: Zn3Store 0 0 64
|
||||
|
|
Loading…
Reference in New Issue