llvm-project/llvm/test/MC/X86/align-via-relaxation.s

76 lines
2.5 KiB
ArmAsm

# RUN: llvm-mc -mcpu=skylake -filetype=obj -triple x86_64-pc-linux-gnu -x86-pad-max-prefix-size=0 %s | llvm-objdump -d --section=.text - | FileCheck %s
# This test exercises only the padding via relaxation logic. The interaction
# etween prefix padding and relaxation logic can be seen in align-via-padding.s
.file "test.c"
.text
.section .text
# Demonstrate that we can relax instructions to provide padding, not
# just insert nops. jmps are being used for ease of demonstration.
# CHECK: .text
# CHECK: 0: eb 1f jmp 0x21 <foo>
# CHECK: 2: e9 1a 00 00 00 jmp 0x21 <foo>
# CHECK: 7: e9 15 00 00 00 jmp 0x21 <foo>
# CHECK: c: e9 10 00 00 00 jmp 0x21 <foo>
# CHECK: 11: e9 0b 00 00 00 jmp 0x21 <foo>
# CHECK: 16: e9 06 00 00 00 jmp 0x21 <foo>
# CHECK: 1b: e9 01 00 00 00 jmp 0x21 <foo>
# CHECK: 20: cc int3
.p2align 4
jmp foo
jmp foo
jmp foo
jmp foo
jmp foo
jmp foo
jmp foo
.p2align 5
int3
foo:
ret
# Check that we're not shifting aroudn the offsets of labels - doing
# that would require a further round of relaxation
# CHECK: <bar>:
# CHECK: 22: eb fe jmp 0x22 <bar>
# CHECK: 24: 66 66 66 2e 0f 1f 84 00 00 00 00 00 nopw %cs:(%rax,%rax)
# CHECK: 30: 0f 0b ud2
bar:
jmp bar
nobypass:
.p2align 4
ud2
# Canonical toy loop to show benefit - we can align the loop header with
# fewer nops by relaxing the branch, even though we don't need to
# CHECK: <loop_preheader>:
# CHECK: 45: 48 85 c0 testq %rax, %rax
# CHECK: 48: 0f 8e 22 00 00 00 jle 0x70 <loop_exit>
# CHECK: 4e: 66 66 66 66 66 66 2e 0f 1f 84 00 00 00 00 00 nopw %cs:(%rax,%rax)
# CHECK: 5d: 0f 1f 00 nopl (%rax)
# CHECK: <loop_header>:
# CHECK: 60: 48 83 e8 01 subq $1, %rax
# CHECK: 64: 48 85 c0 testq %rax, %rax
# CHECK: 67: 7e 07 jle 0x70 <loop_exit>
# CHECK: 69: e9 f2 ff ff ff jmp 0x60 <loop_header>
# CHECK: 6e: 66 90 nop
# CHECK: <loop_exit>:
# CHECK: 70: c3 retq
.p2align 5
.skip 5
loop_preheader:
testq %rax, %rax
jle loop_exit
.p2align 5
loop_header:
subq $1, %rax
testq %rax, %rax
jle loop_exit
jmp loop_header
.p2align 4
loop_exit:
ret