From 031abc2bd7f176548238dd9c83eb159e2dcd2563 Mon Sep 17 00:00:00 2001 From: Evandro Menezes Date: Tue, 18 Dec 2018 23:19:52 +0000 Subject: [PATCH] [llvm-mca] Improve test (NFC) Add more instruction variations for Exynos. llvm-svn: 349567 --- .../llvm-mca/AArch64/Exynos/register-offset.s | 76 ++++++++++++++----- 1 file changed, 57 insertions(+), 19 deletions(-) diff --git a/llvm/test/tools/llvm-mca/AArch64/Exynos/register-offset.s b/llvm/test/tools/llvm-mca/AArch64/Exynos/register-offset.s index 0c8ad2610076..4fc4cf48fdcc 100644 --- a/llvm/test/tools/llvm-mca/AArch64/Exynos/register-offset.s +++ b/llvm/test/tools/llvm-mca/AArch64/Exynos/register-offset.s @@ -2,25 +2,43 @@ # RUN: llvm-mca -march=aarch64 -mcpu=exynos-m1 -resource-pressure=false < %s | FileCheck %s -check-prefixes=ALL,EM1 # RUN: llvm-mca -march=aarch64 -mcpu=exynos-m3 -resource-pressure=false < %s | FileCheck %s -check-prefixes=ALL,EM3 - ldrb w0, [x1, w2, sxtw #0] - strh w3, [x4, x5, sxtx #1] + ldrb w0, [x1, x2, lsl #0] + ldrh w3, [x4, x5, sxtx #1] ldr w6, [x7, w8, uxtw #2] - str x9, [x10, x11, lsl #3] + ldr x9, [x10, w11, sxtw #3] + ldr b12, [x13, w14, sxtw #0] + ldr h15, [x16, w17, uxtw #1] + ldr s18, [x19, x20, sxtx #2] + ldr d21, [x22, x23, lsl #3] + ldr q24, [x25, x26, lsl #4] + + strb w0, [x1, x2, lsl #0] + strh w3, [x4, x5, sxtx #1] + str w6, [x7, w8, uxtw #2] + str x9, [x10, w11, sxtw #3] + str b12, [x13, w14, sxtw #0] + str h15, [x16, w17, uxtw #1] + str s18, [x19, x20, sxtx #2] + str d21, [x22, x23, lsl #3] + str q24, [x25, x26, lsl #4] # ALL: Iterations: 100 -# ALL-NEXT: Instructions: 400 -# ALL-NEXT: Total Cycles: 208 -# ALL-NEXT: Total uOps: 600 +# ALL-NEXT: Instructions: 1800 + +# EM1-NEXT: Total Cycles: 1719 +# EM3-NEXT: Total Cycles: 1713 + +# ALL-NEXT: Total uOps: 2800 # EM1: Dispatch Width: 4 -# EM1-NEXT: uOps Per Cycle: 2.88 -# EM1-NEXT: IPC: 1.92 -# EM1-NEXT: Block RThroughput: 2.0 +# EM1-NEXT: uOps Per Cycle: 1.63 +# EM1-NEXT: IPC: 1.05 +# EM1-NEXT: Block RThroughput: 12.0 # EM3: Dispatch Width: 6 -# EM3-NEXT: uOps Per Cycle: 2.88 -# EM3-NEXT: IPC: 1.92 -# EM3-NEXT: Block RThroughput: 2.0 +# EM3-NEXT: uOps Per Cycle: 1.63 +# EM3-NEXT: IPC: 1.05 +# EM3-NEXT: Block RThroughput: 9.0 # ALL: Instruction Info: # ALL-NEXT: [1]: #uOps @@ -32,12 +50,32 @@ # ALL: [1] [2] [3] [4] [5] [6] Instructions: -# EM1-NEXT: 2 5 1.00 * ldrb w0, [x1, w2, sxtw #0] -# EM3-NEXT: 2 5 0.50 * ldrb w0, [x1, w2, sxtw #0] - -# ALL-NEXT: 1 1 1.00 * strh w3, [x4, x5, sxtx #1] - +# EM1-NEXT: 1 5 1.00 * ldrb w0, [x1, x2, lsl #0] +# EM1-NEXT: 1 5 1.00 * ldrh w3, [x4, x5, sxtx #1] # EM1-NEXT: 2 5 1.00 * ldr w6, [x7, w8, uxtw #2] -# EM3-NEXT: 2 5 0.50 * ldr w6, [x7, w8, uxtw #2] +# EM1-NEXT: 2 5 1.00 * ldr x9, [x10, w11, sxtw #3] +# EM1-NEXT: 2 6 2.00 * ldr b12, [x13, w14, sxtw #0] +# EM1-NEXT: 2 6 2.00 * ldr h15, [x16, w17, uxtw #1] +# EM1-NEXT: 1 5 1.00 * ldr s18, [x19, x20, sxtx #2] +# EM1-NEXT: 1 5 1.00 * ldr d21, [x22, x23, lsl #3] +# EM1-NEXT: 2 6 2.00 * ldr q24, [x25, x26, lsl #4] -# ALL-NEXT: 1 1 1.00 * str x9, [x10, x11, lsl #3] +# EM3-NEXT: 1 5 0.50 * ldrb w0, [x1, x2, lsl #0] +# EM3-NEXT: 1 5 0.50 * ldrh w3, [x4, x5, sxtx #1] +# EM3-NEXT: 2 5 0.50 * ldr w6, [x7, w8, uxtw #2] +# EM3-NEXT: 2 5 0.50 * ldr x9, [x10, w11, sxtw #3] +# EM3-NEXT: 2 6 0.50 * ldr b12, [x13, w14, sxtw #0] +# EM3-NEXT: 2 6 0.50 * ldr h15, [x16, w17, uxtw #1] +# EM3-NEXT: 1 5 0.50 * ldr s18, [x19, x20, sxtx #2] +# EM3-NEXT: 1 5 0.50 * ldr d21, [x22, x23, lsl #3] +# EM3-NEXT: 2 6 0.50 * ldr q24, [x25, x26, lsl #4] + +# ALL-NEXT: 1 1 1.00 * strb w0, [x1, x2, lsl #0] +# ALL-NEXT: 1 1 1.00 * strh w3, [x4, x5, sxtx #1] +# ALL-NEXT: 2 2 1.00 * str w6, [x7, w8, uxtw #2] +# ALL-NEXT: 2 2 1.00 * str x9, [x10, w11, sxtw #3] +# ALL-NEXT: 2 3 1.00 * str b12, [x13, w14, sxtw #0] +# ALL-NEXT: 2 3 1.00 * str h15, [x16, w17, uxtw #1] +# ALL-NEXT: 1 1 1.00 * str s18, [x19, x20, sxtx #2] +# ALL-NEXT: 1 1 1.00 * str d21, [x22, x23, lsl #3] +# ALL-NEXT: 2 3 1.00 * str q24, [x25, x26, lsl #4]