llvm-project/bolt/test/X86/jump-table-icp.test

114 lines
4.6 KiB
Plaintext

RUN: llvm-mc -filetype=obj -triple x86_64-unknown-unknown \
RUN: %p/Inputs/jump_table_icp.s -o %t.o
RUN: link_fdata %p/Inputs/jump_table_icp.s %t.o %t.fdata
RUN: llvm-strip --strip-unneeded %t.o
RUN: %clang %cflags %t.o -o %t.exe -Wl,-q
RUN: (llvm-bolt %t.exe -data %t.fdata -o %t -relocs \
RUN: -reorder-blocks=cache -split-functions=3 -split-all-cold \
RUN: -use-gnu-stack -dyno-stats -indirect-call-promotion=jump-tables \
RUN: -print-icp -v=0 \
RUN: -icp-jt-remaining-percent-threshold=10 \
RUN: -icp-jt-total-percent-threshold=2 \
RUN: -indirect-call-promotion-topn=1 \
RUN: -icp-jump-tables-targets -align-functions-max-bytes=7 2>&1 && \
RUN: llvm-objdump -d %t --print-imm-hex) | FileCheck %s
BOLT-INFO: ICP total indirect callsites = 0
BOLT-INFO: ICP total jump table callsites = 2
BOLT-INFO: ICP total number of calls = 2137
BOLT-INFO: ICP percentage of calls that are indirect = 0.0%
BOLT-INFO: ICP percentage of indirect calls that can be optimized = 0.0%
BOLT-INFO: ICP percentage of indirect calls that are optimized = 0.0%
BOLT-INFO: ICP percentage of jump table calls that can be optimized = 17.7%
BOLT-INFO: ICP percentage of jump table calls that are optimized = 100.0%
CHECK: Binary Function "_Z3inci" after indirect-call-promotion
CHECK: .LBB{{.*}} (8 instructions, align : 1)
CHECK-NEXT: Entry Point
CHECK-NEXT: Exec Count : 1073
CHECK: Successors: .Ltmp{{.*}} (mispreds: 189, count: 189), .LFT{{.*}} (mispreds: 0, count: 881)
CHECK: .LFT{{.*}} (4 instructions, align : 1)
CHECK-NEXT: Exec Count : 881
CHECK: Predecessors: .LBB{{.*}}
CHECK: Successors: .Ltmp{{.*}} (mispreds: 138, count: 155), .Ltmp{{.*}} (mispreds: 0, count: 726)
CHECK: .Ltmp{{.*}} (1 instructions, align : 1)
CHECK-NEXT: Exec Count : 726
CHECK: Predecessors: .LFT{{.*}}
CHECK: Successors: .L{{.*}} (mispreds: 126, count: 157), .L{{.*}} (mispreds: 140, count: 156), .L{{.*}} (mispreds: 134, count: 152), .L{{.*}} (mispreds: 137, count: 150), .L{{.*}} (mispreds: 129, count: 148), .L{{.*}} (mispreds: 0, count: 0)
CHECK: .Ltmp{{.*}} (5 instructions, align : 1)
CHECK-NEXT: Exec Count : 167
CHECK: Predecessors: .Ltmp{{.*}}, .LFT{{.*}}
CHECK: .Ltmp{{.*}} (5 instructions, align : 1)
CHECK-NEXT: Exec Count : 156
CHECK: Predecessors: .Ltmp{{.*}}
CHECK: .Ltmp{{.*}} (5 instructions, align : 1)
CHECK-NEXT: Exec Count : 157
CHECK: Predecessors: .Ltmp{{.*}}
CHECK: .Ltmp{{.*}} (5 instructions, align : 1)
CHECK-NEXT: Exec Count : 148
CHECK: Predecessors: .Ltmp{{.*}}
CHECK: .Ltmp{{.*}} (5 instructions, align : 1)
CHECK-NEXT: Exec Count : 150
CHECK: Predecessors: .Ltmp{{.*}}
CHECK: Binary Function "_Z7inc_dupi" after indirect-call-promotion
CHECK: .LBB{{.*}} (8 instructions, align : 1)
CHECK-NEXT: Entry Point
CHECK-NEXT: Exec Count : 1064
CHECK: Successors: .Ltmp{{.*}} (mispreds: 143, count: 144), .LFT{{.*}} (mispreds: 0, count: 777)
CHECK: .LFT{{.*}} (4 instructions, align : 1)
CHECK-NEXT: Exec Count : 777
CHECK: Predecessors: .LBB{{.*}}
CHECK: Successors: .Ltmp{{.*}} (mispreds: 120, count: 138), .Ltmp{{.*}} (mispreds: 0, count: 639)
CHECK: .Ltmp{{.*}} (1 instructions, align : 1)
CHECK-NEXT: Exec Count : 639
CHECK: Predecessors: .LFT{{.*}}
CHECK: Successors: .L{{.*}} (mispreds: 130, count: 137), .L{{.*}} (mispreds: 126, count: 136), .L{{.*}} (mispreds: 122, count: 130), .L{{.*}} (mispreds: 111, count: 130), .L{{.*}} (mispreds: 104, count: 114), .L{{.*}} (mispreds: 0, count: 0)
CHECK: .Ltmp{{.*}} (5 instructions, align : 1)
CHECK-NEXT: Exec Count : 137
CHECK: Predecessors: .Ltmp{{.*}}
CHECK: Successors: .Ltmp{{.*}} (mispreds: 0, count: 106)
CHECK: .Ltmp{{.*}} (5 instructions, align : 1)
CHECK-NEXT: Exec Count : 136
CHECK: Predecessors: .Ltmp{{.*}}
CHECK: Successors: .Ltmp{{.*}} (mispreds: 0, count: 113)
CHECK: .Ltmp{{.*}} (5 instructions, align : 1)
CHECK-NEXT: Exec Count : 130
CHECK: Predecessors: .Ltmp{{.*}}
CHECK: Successors: .Ltmp{{.*}} (mispreds: 0, count: 97)
CHECK: .Ltmp{{.*}} (5 instructions, align : 1)
CHECK-NEXT: Exec Count : 130
CHECK: Predecessors: .Ltmp{{.*}}
CHECK: Successors: .Ltmp{{.*}} (mispreds: 0, count: 105)
CHECK: .Ltmp{{.*}} (5 instructions, align : 1)
CHECK-NEXT: Exec Count : 140
CHECK: Predecessors: .Ltmp{{.*}}, .LFT{{.*}}
CHECK: Successors: .Ltmp{{.*}} (mispreds: 0, count: 98)
CHECK: <_Z3inci>:
CHECK: movq 0x{{.*}}(,%rax,8), %rax
CHECK-NEXT: cmpq $0x{{.*}}, %rax
CHECK-NEXT: je {{.*}} <_Z3inci+0x{{.*}}>
CHECK-NEXT: jmpq *%rax
CHECK: <_Z7inc_dupi>:
CHECK: movq 0x{{.*}}(,%rax,8), %rax
CHECK-NEXT: cmpq $0x{{.*}}, %rax
CHECK-NEXT: je {{.*}} <_Z7inc_dupi+0x{{.*}}>
CHECK-NEXT: jmpq *%rax