# RUN: llvm-mc -mcpu=skylake -filetype=obj -triple x86_64-pc-linux-gnu %s -x86-pad-max-prefix-size=5 -x86-pad-for-align=1 | llvm-objdump --no-print-imm-hex -d - | FileCheck %s
# This test file highlights the interactions between prefix padding and
# relaxation padding.
.file "test.c"
.text
.section .text
# We can both relax and prefix for padding purposes, but the moment, we
# can't prefix without first having relaxed.
# CHECK: .text
# CHECK: 0: eb 1f jmp
# CHECK: 2: eb 1d jmp
# CHECK: 4: eb 1b jmp
# CHECK: 6: eb 19 jmp
# CHECK: 8: eb 17 jmp
# CHECK: a: 2e 2e 2e 2e 2e e9 0d 00 00 00 jmp
# CHECK: 14: 2e 2e 2e 2e 2e e9 03 00 00 00 jmp
# CHECK: 1e: 66 90 nop
# CHECK: 20: cc int3
.p2align 4
jmp foo
jmp foo
jmp foo
jmp foo
jmp foo
jmp foo
jmp foo
.p2align 5
int3
foo:
ret
# Canonical toy loop to show benefit - we can align the loop header with
# fewer nops by relaxing the branch, even though we don't need to
# CHECK: <loop_preheader>:
# CHECK: 45: 48 85 c0 testq %rax, %rax
# CHECK: 48: 2e 2e 2e 2e 0f 8e 1e 00 00 00 jle 0x70 <loop_exit>
# CHECK: 52: 66 66 66 66 66 2e 0f 1f 84 00 00 00 00 00 nopw %cs:(%rax,%rax)
# CHECK: <loop_header>:
# CHECK: 60: 48 83 e8 01 subq $1, %rax
# CHECK: 64: 48 85 c0 testq %rax, %rax
# CHECK: 67: 7e 07 jle 0x70 <loop_exit>
# CHECK: 69: 2e 2e e9 f0 ff ff ff jmp
# CHECK: <loop_exit>:
# CHECK: 70: c3 retq
.p2align 5
.skip 5
loop_preheader:
testq %rax, %rax
jle loop_exit
.p2align 5
loop_header:
subq $1, %rax
testq %rax, %rax
jle loop_exit
jmp loop_header
.p2align 4
loop_exit:
ret
# Correctness cornercase - can't prefix pad jmp without having relaxed it
# first as doing so would make the relative offset too large
# CHECK: fd: cc int3
# CHECK: fe: eb 80 jmp 0x80 <loop_exit+0x10>
# CHECK: 100: cc int3
.p2align 5
.L1:
.rept 126
int3
.endr
jmp .L1
.rept 30
int3
.endr
.p2align 5