forked from OSchip/llvm-project
256 lines
14 KiB
ArmAsm
256 lines
14 KiB
ArmAsm
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
|
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=haswell -iterations=100 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefix=ALL -check-prefix=HASWELL
|
|
|
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=broadwell -iterations=100 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefix=ALL -check-prefix=BDWELL
|
|
|
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=skylake -iterations=100 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefix=ALL -check-prefix=SKYLAKE
|
|
|
|
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=znver1 -iterations=100 -resource-pressure=false -instruction-info=false -timeline < %s | FileCheck %s -check-prefix=ALL -check-prefix=ZNVER1
|
|
|
|
# Code Snippet from "Ithemal: Accurate, Portable and Fast Basic Block Throughput Estimation using Deep Neural Networks"
|
|
# Charith Mendis, Saman Amarasinghe, Michael Carbin
|
|
add $1, %edx
|
|
vpaddd (%r8), %ymm0, %ymm0
|
|
add $32, %r8
|
|
cmp %edi, %edx
|
|
|
|
# ALL: Iterations: 100
|
|
# ALL-NEXT: Instructions: 400
|
|
|
|
# BDWELL-NEXT: Total Cycles: 142
|
|
# BDWELL-NEXT: Total uOps: 500
|
|
|
|
# HASWELL-NEXT: Total Cycles: 143
|
|
# HASWELL-NEXT: Total uOps: 500
|
|
|
|
# SKYLAKE-NEXT: Total Cycles: 110
|
|
# SKYLAKE-NEXT: Total uOps: 500
|
|
|
|
# ZNVER1-NEXT: Total Cycles: 110
|
|
# ZNVER1-NEXT: Total uOps: 400
|
|
|
|
# BDWELL: Dispatch Width: 4
|
|
# BDWELL-NEXT: uOps Per Cycle: 3.52
|
|
# BDWELL-NEXT: IPC: 2.82
|
|
# BDWELL-NEXT: Block RThroughput: 1.3
|
|
|
|
# HASWELL: Dispatch Width: 4
|
|
# HASWELL-NEXT: uOps Per Cycle: 3.50
|
|
# HASWELL-NEXT: IPC: 2.80
|
|
# HASWELL-NEXT: Block RThroughput: 1.3
|
|
|
|
# SKYLAKE: Dispatch Width: 6
|
|
# SKYLAKE-NEXT: uOps Per Cycle: 4.55
|
|
# SKYLAKE-NEXT: IPC: 3.64
|
|
# SKYLAKE-NEXT: Block RThroughput: 0.8
|
|
|
|
# ZNVER1: Dispatch Width: 4
|
|
# ZNVER1-NEXT: uOps Per Cycle: 3.64
|
|
# ZNVER1-NEXT: IPC: 3.64
|
|
# ZNVER1-NEXT: Block RThroughput: 1.0
|
|
|
|
# ALL: Timeline view:
|
|
|
|
# BDWELL-NEXT: 0123456789
|
|
# BDWELL-NEXT: Index 0123456789 01
|
|
|
|
# HASWELL-NEXT: 0123456789
|
|
# HASWELL-NEXT: Index 0123456789 012
|
|
|
|
# SKYLAKE-NEXT: 0123456789
|
|
# SKYLAKE-NEXT: Index 0123456789
|
|
|
|
# ZNVER1-NEXT: 0123456789
|
|
# ZNVER1-NEXT: Index 0123456789
|
|
|
|
# BDWELL: [0,0] DeER . . . .. addl $1, %edx
|
|
# BDWELL-NEXT: [0,1] DeeeeeeeER. . .. vpaddd (%r8), %ymm0, %ymm0
|
|
# BDWELL-NEXT: [0,2] DeE------R. . .. addq $32, %r8
|
|
# BDWELL-NEXT: [0,3] .DeE-----R. . .. cmpl %edi, %edx
|
|
# BDWELL-NEXT: [1,0] .DeE-----R. . .. addl $1, %edx
|
|
# BDWELL-NEXT: [1,1] .DeeeeeeeER . .. vpaddd (%r8), %ymm0, %ymm0
|
|
# BDWELL-NEXT: [1,2] . DeE-----R . .. addq $32, %r8
|
|
# BDWELL-NEXT: [1,3] . DeE-----R . .. cmpl %edi, %edx
|
|
# BDWELL-NEXT: [2,0] . DeE-----R . .. addl $1, %edx
|
|
# BDWELL-NEXT: [2,1] . DeeeeeeeER . .. vpaddd (%r8), %ymm0, %ymm0
|
|
# BDWELL-NEXT: [2,2] . DeE------R . .. addq $32, %r8
|
|
# BDWELL-NEXT: [2,3] . DeE------R . .. cmpl %edi, %edx
|
|
# BDWELL-NEXT: [3,0] . DeE-----R . .. addl $1, %edx
|
|
# BDWELL-NEXT: [3,1] . DeeeeeeeER . .. vpaddd (%r8), %ymm0, %ymm0
|
|
# BDWELL-NEXT: [3,2] . DeE------R . .. addq $32, %r8
|
|
# BDWELL-NEXT: [3,3] . DeE-----R . .. cmpl %edi, %edx
|
|
# BDWELL-NEXT: [4,0] . DeE-----R . .. addl $1, %edx
|
|
# BDWELL-NEXT: [4,1] . DeeeeeeeER. .. vpaddd (%r8), %ymm0, %ymm0
|
|
# BDWELL-NEXT: [4,2] . .DeE-----R. .. addq $32, %r8
|
|
# BDWELL-NEXT: [4,3] . .DeE-----R. .. cmpl %edi, %edx
|
|
# BDWELL-NEXT: [5,0] . .DeE-----R. .. addl $1, %edx
|
|
# BDWELL-NEXT: [5,1] . . DeeeeeeeER .. vpaddd (%r8), %ymm0, %ymm0
|
|
# BDWELL-NEXT: [5,2] . . DeE------R .. addq $32, %r8
|
|
# BDWELL-NEXT: [5,3] . . DeE------R .. cmpl %edi, %edx
|
|
# BDWELL-NEXT: [6,0] . . DeE-----R .. addl $1, %edx
|
|
# BDWELL-NEXT: [6,1] . . DeeeeeeeER .. vpaddd (%r8), %ymm0, %ymm0
|
|
# BDWELL-NEXT: [6,2] . . DeE------R .. addq $32, %r8
|
|
# BDWELL-NEXT: [6,3] . . DeE-----R .. cmpl %edi, %edx
|
|
# BDWELL-NEXT: [7,0] . . DeE-----R .. addl $1, %edx
|
|
# BDWELL-NEXT: [7,1] . . DeeeeeeeER .. vpaddd (%r8), %ymm0, %ymm0
|
|
# BDWELL-NEXT: [7,2] . . DeE-----R .. addq $32, %r8
|
|
# BDWELL-NEXT: [7,3] . . DeE-----R .. cmpl %edi, %edx
|
|
# BDWELL-NEXT: [8,0] . . DeE-----R .. addl $1, %edx
|
|
# BDWELL-NEXT: [8,1] . . .DeeeeeeeER. vpaddd (%r8), %ymm0, %ymm0
|
|
# BDWELL-NEXT: [8,2] . . .DeE------R. addq $32, %r8
|
|
# BDWELL-NEXT: [8,3] . . .DeE------R. cmpl %edi, %edx
|
|
# BDWELL-NEXT: [9,0] . . . DeE-----R. addl $1, %edx
|
|
# BDWELL-NEXT: [9,1] . . . DeeeeeeeER vpaddd (%r8), %ymm0, %ymm0
|
|
# BDWELL-NEXT: [9,2] . . . DeE------R addq $32, %r8
|
|
# BDWELL-NEXT: [9,3] . . . DeE-----R cmpl %edi, %edx
|
|
|
|
# HASWELL: [0,0] DeER . . . . . addl $1, %edx
|
|
# HASWELL-NEXT: [0,1] DeeeeeeeeER . . . vpaddd (%r8), %ymm0, %ymm0
|
|
# HASWELL-NEXT: [0,2] DeE-------R . . . addq $32, %r8
|
|
# HASWELL-NEXT: [0,3] .DeE------R . . . cmpl %edi, %edx
|
|
# HASWELL-NEXT: [1,0] .DeE------R . . . addl $1, %edx
|
|
# HASWELL-NEXT: [1,1] .DeeeeeeeeER . . . vpaddd (%r8), %ymm0, %ymm0
|
|
# HASWELL-NEXT: [1,2] . DeE------R . . . addq $32, %r8
|
|
# HASWELL-NEXT: [1,3] . DeE------R . . . cmpl %edi, %edx
|
|
# HASWELL-NEXT: [2,0] . DeE------R . . . addl $1, %edx
|
|
# HASWELL-NEXT: [2,1] . DeeeeeeeeER . . . vpaddd (%r8), %ymm0, %ymm0
|
|
# HASWELL-NEXT: [2,2] . DeE-------R . . . addq $32, %r8
|
|
# HASWELL-NEXT: [2,3] . DeE-------R . . . cmpl %edi, %edx
|
|
# HASWELL-NEXT: [3,0] . DeE------R . . . addl $1, %edx
|
|
# HASWELL-NEXT: [3,1] . DeeeeeeeeER. . . vpaddd (%r8), %ymm0, %ymm0
|
|
# HASWELL-NEXT: [3,2] . DeE-------R. . . addq $32, %r8
|
|
# HASWELL-NEXT: [3,3] . DeE------R. . . cmpl %edi, %edx
|
|
# HASWELL-NEXT: [4,0] . DeE------R. . . addl $1, %edx
|
|
# HASWELL-NEXT: [4,1] . DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0
|
|
# HASWELL-NEXT: [4,2] . .DeE------R . . addq $32, %r8
|
|
# HASWELL-NEXT: [4,3] . .DeE------R . . cmpl %edi, %edx
|
|
# HASWELL-NEXT: [5,0] . .DeE------R . . addl $1, %edx
|
|
# HASWELL-NEXT: [5,1] . . DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0
|
|
# HASWELL-NEXT: [5,2] . . DeE-------R . . addq $32, %r8
|
|
# HASWELL-NEXT: [5,3] . . DeE-------R . . cmpl %edi, %edx
|
|
# HASWELL-NEXT: [6,0] . . DeE------R . . addl $1, %edx
|
|
# HASWELL-NEXT: [6,1] . . DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0
|
|
# HASWELL-NEXT: [6,2] . . DeE-------R . . addq $32, %r8
|
|
# HASWELL-NEXT: [6,3] . . DeE------R . . cmpl %edi, %edx
|
|
# HASWELL-NEXT: [7,0] . . DeE------R . . addl $1, %edx
|
|
# HASWELL-NEXT: [7,1] . . DeeeeeeeeER. . vpaddd (%r8), %ymm0, %ymm0
|
|
# HASWELL-NEXT: [7,2] . . DeE------R. . addq $32, %r8
|
|
# HASWELL-NEXT: [7,3] . . DeE------R. . cmpl %edi, %edx
|
|
# HASWELL-NEXT: [8,0] . . DeE------R. . addl $1, %edx
|
|
# HASWELL-NEXT: [8,1] . . .DeeeeeeeeER. vpaddd (%r8), %ymm0, %ymm0
|
|
# HASWELL-NEXT: [8,2] . . .DeE-------R. addq $32, %r8
|
|
# HASWELL-NEXT: [8,3] . . .DeE-------R. cmpl %edi, %edx
|
|
# HASWELL-NEXT: [9,0] . . . DeE------R. addl $1, %edx
|
|
# HASWELL-NEXT: [9,1] . . . DeeeeeeeeER vpaddd (%r8), %ymm0, %ymm0
|
|
# HASWELL-NEXT: [9,2] . . . DeE-------R addq $32, %r8
|
|
# HASWELL-NEXT: [9,3] . . . DeE------R cmpl %edi, %edx
|
|
|
|
# SKYLAKE: [0,0] DeER . . . . addl $1, %edx
|
|
# SKYLAKE-NEXT: [0,1] DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0
|
|
# SKYLAKE-NEXT: [0,2] DeE-------R . . addq $32, %r8
|
|
# SKYLAKE-NEXT: [0,3] D=eE------R . . cmpl %edi, %edx
|
|
# SKYLAKE-NEXT: [1,0] D=eE------R . . addl $1, %edx
|
|
# SKYLAKE-NEXT: [1,1] .DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0
|
|
# SKYLAKE-NEXT: [1,2] .DeE-------R . . addq $32, %r8
|
|
# SKYLAKE-NEXT: [1,3] .D=eE------R . . cmpl %edi, %edx
|
|
# SKYLAKE-NEXT: [2,0] .D=eE------R . . addl $1, %edx
|
|
# SKYLAKE-NEXT: [2,1] . DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0
|
|
# SKYLAKE-NEXT: [2,2] . DeE-------R . . addq $32, %r8
|
|
# SKYLAKE-NEXT: [2,3] . D=eE------R . . cmpl %edi, %edx
|
|
# SKYLAKE-NEXT: [3,0] . D=eE------R . . addl $1, %edx
|
|
# SKYLAKE-NEXT: [3,1] . DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0
|
|
# SKYLAKE-NEXT: [3,2] . DeE-------R . . addq $32, %r8
|
|
# SKYLAKE-NEXT: [3,3] . D=eE------R . . cmpl %edi, %edx
|
|
# SKYLAKE-NEXT: [4,0] . D=eE------R . . addl $1, %edx
|
|
# SKYLAKE-NEXT: [4,1] . DeeeeeeeeER. . vpaddd (%r8), %ymm0, %ymm0
|
|
# SKYLAKE-NEXT: [4,2] . DeE-------R. . addq $32, %r8
|
|
# SKYLAKE-NEXT: [4,3] . D=eE------R. . cmpl %edi, %edx
|
|
# SKYLAKE-NEXT: [5,0] . D=eE------R. . addl $1, %edx
|
|
# SKYLAKE-NEXT: [5,1] . DeeeeeeeeER . vpaddd (%r8), %ymm0, %ymm0
|
|
# SKYLAKE-NEXT: [5,2] . DeE-------R . addq $32, %r8
|
|
# SKYLAKE-NEXT: [5,3] . D=eE------R . cmpl %edi, %edx
|
|
# SKYLAKE-NEXT: [6,0] . D=eE------R . addl $1, %edx
|
|
# SKYLAKE-NEXT: [6,1] . .DeeeeeeeeER . vpaddd (%r8), %ymm0, %ymm0
|
|
# SKYLAKE-NEXT: [6,2] . .DeE-------R . addq $32, %r8
|
|
# SKYLAKE-NEXT: [6,3] . .D=eE------R . cmpl %edi, %edx
|
|
# SKYLAKE-NEXT: [7,0] . .D=eE------R . addl $1, %edx
|
|
# SKYLAKE-NEXT: [7,1] . . DeeeeeeeeER . vpaddd (%r8), %ymm0, %ymm0
|
|
# SKYLAKE-NEXT: [7,2] . . DeE-------R . addq $32, %r8
|
|
# SKYLAKE-NEXT: [7,3] . . D=eE------R . cmpl %edi, %edx
|
|
# SKYLAKE-NEXT: [8,0] . . D=eE------R . addl $1, %edx
|
|
# SKYLAKE-NEXT: [8,1] . . DeeeeeeeeER. vpaddd (%r8), %ymm0, %ymm0
|
|
# SKYLAKE-NEXT: [8,2] . . DeE-------R. addq $32, %r8
|
|
# SKYLAKE-NEXT: [8,3] . . D=eE------R. cmpl %edi, %edx
|
|
# SKYLAKE-NEXT: [9,0] . . D=eE------R. addl $1, %edx
|
|
# SKYLAKE-NEXT: [9,1] . . DeeeeeeeeER vpaddd (%r8), %ymm0, %ymm0
|
|
# SKYLAKE-NEXT: [9,2] . . DeE-------R addq $32, %r8
|
|
# SKYLAKE-NEXT: [9,3] . . D=eE------R cmpl %edi, %edx
|
|
|
|
# ZNVER1: [0,0] DeER . . . . addl $1, %edx
|
|
# ZNVER1-NEXT: [0,1] DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0
|
|
# ZNVER1-NEXT: [0,2] DeE-------R . . addq $32, %r8
|
|
# ZNVER1-NEXT: [0,3] D=eE------R . . cmpl %edi, %edx
|
|
# ZNVER1-NEXT: [1,0] .DeE------R . . addl $1, %edx
|
|
# ZNVER1-NEXT: [1,1] .DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0
|
|
# ZNVER1-NEXT: [1,2] .DeE-------R . . addq $32, %r8
|
|
# ZNVER1-NEXT: [1,3] .D=eE------R . . cmpl %edi, %edx
|
|
# ZNVER1-NEXT: [2,0] . DeE------R . . addl $1, %edx
|
|
# ZNVER1-NEXT: [2,1] . DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0
|
|
# ZNVER1-NEXT: [2,2] . DeE-------R . . addq $32, %r8
|
|
# ZNVER1-NEXT: [2,3] . D=eE------R . . cmpl %edi, %edx
|
|
# ZNVER1-NEXT: [3,0] . DeE------R . . addl $1, %edx
|
|
# ZNVER1-NEXT: [3,1] . DeeeeeeeeER . . vpaddd (%r8), %ymm0, %ymm0
|
|
# ZNVER1-NEXT: [3,2] . DeE-------R . . addq $32, %r8
|
|
# ZNVER1-NEXT: [3,3] . D=eE------R . . cmpl %edi, %edx
|
|
# ZNVER1-NEXT: [4,0] . DeE------R . . addl $1, %edx
|
|
# ZNVER1-NEXT: [4,1] . DeeeeeeeeER. . vpaddd (%r8), %ymm0, %ymm0
|
|
# ZNVER1-NEXT: [4,2] . DeE-------R. . addq $32, %r8
|
|
# ZNVER1-NEXT: [4,3] . D=eE------R. . cmpl %edi, %edx
|
|
# ZNVER1-NEXT: [5,0] . DeE------R. . addl $1, %edx
|
|
# ZNVER1-NEXT: [5,1] . DeeeeeeeeER . vpaddd (%r8), %ymm0, %ymm0
|
|
# ZNVER1-NEXT: [5,2] . DeE-------R . addq $32, %r8
|
|
# ZNVER1-NEXT: [5,3] . D=eE------R . cmpl %edi, %edx
|
|
# ZNVER1-NEXT: [6,0] . .DeE------R . addl $1, %edx
|
|
# ZNVER1-NEXT: [6,1] . .DeeeeeeeeER . vpaddd (%r8), %ymm0, %ymm0
|
|
# ZNVER1-NEXT: [6,2] . .DeE-------R . addq $32, %r8
|
|
# ZNVER1-NEXT: [6,3] . .D=eE------R . cmpl %edi, %edx
|
|
# ZNVER1-NEXT: [7,0] . . DeE------R . addl $1, %edx
|
|
# ZNVER1-NEXT: [7,1] . . DeeeeeeeeER . vpaddd (%r8), %ymm0, %ymm0
|
|
# ZNVER1-NEXT: [7,2] . . DeE-------R . addq $32, %r8
|
|
# ZNVER1-NEXT: [7,3] . . D=eE------R . cmpl %edi, %edx
|
|
# ZNVER1-NEXT: [8,0] . . DeE------R . addl $1, %edx
|
|
# ZNVER1-NEXT: [8,1] . . DeeeeeeeeER. vpaddd (%r8), %ymm0, %ymm0
|
|
# ZNVER1-NEXT: [8,2] . . DeE-------R. addq $32, %r8
|
|
# ZNVER1-NEXT: [8,3] . . D=eE------R. cmpl %edi, %edx
|
|
# ZNVER1-NEXT: [9,0] . . DeE------R. addl $1, %edx
|
|
# ZNVER1-NEXT: [9,1] . . DeeeeeeeeER vpaddd (%r8), %ymm0, %ymm0
|
|
# ZNVER1-NEXT: [9,2] . . DeE-------R addq $32, %r8
|
|
# ZNVER1-NEXT: [9,3] . . D=eE------R cmpl %edi, %edx
|
|
|
|
# ALL: Average Wait times (based on the timeline view):
|
|
# ALL-NEXT: [0]: Executions
|
|
# ALL-NEXT: [1]: Average time spent waiting in a scheduler's queue
|
|
# ALL-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
|
|
# ALL-NEXT: [3]: Average time elapsed from WB until retire stage
|
|
|
|
# ALL: [0] [1] [2] [3]
|
|
|
|
# BDWELL-NEXT: 0. 10 1.0 0.4 4.5 addl $1, %edx
|
|
# HASWELL-NEXT: 0. 10 1.0 0.4 5.4 addl $1, %edx
|
|
# SKYLAKE-NEXT: 0. 10 1.9 0.1 5.4 addl $1, %edx
|
|
# ZNVER1-NEXT: 0. 10 1.0 0.1 5.4 addl $1, %edx
|
|
|
|
# ALL-NEXT: 1. 10 1.0 0.1 0.0 vpaddd (%r8), %ymm0, %ymm0
|
|
|
|
# BDWELL-NEXT: 2. 10 1.0 0.4 5.7 addq $32, %r8
|
|
# BDWELL-NEXT: 3. 10 1.0 0.0 5.3 cmpl %edi, %edx
|
|
|
|
# HASWELL-NEXT: 2. 10 1.0 0.4 6.7 addq $32, %r8
|
|
# HASWELL-NEXT: 3. 10 1.0 0.0 6.3 cmpl %edi, %edx
|
|
|
|
# SKYLAKE-NEXT: 2. 10 1.0 0.1 7.0 addq $32, %r8
|
|
# SKYLAKE-NEXT: 3. 10 2.0 0.0 6.0 cmpl %edi, %edx
|
|
|
|
# ZNVER1-NEXT: 2. 10 1.0 0.1 7.0 addq $32, %r8
|
|
# ZNVER1-NEXT: 3. 10 2.0 0.0 6.0 cmpl %edi, %edx
|