; RUN: llc %s -o - -filetype=obj --mcpu=znver2 | llvm-objdump -dr - | FileCheck %s
; RUN: llc %s -o - -filetype=asm --mcpu=znver2 | llvm-mc - -o - --mcpu=znver2 -filetype=obj -triple x86_64-unknown-linux-gnu | llvm-objdump -dr - | FileCheck %s
; RUN: llc %s -o - -filetype=asm --mcpu=znver2 | FileCheck %s --check-prefix=ASM
;; Check that we produce a push, then an align-to-16-bytes p2align.
;
; ASM: # %bb.0:
; ASM-NEXT: pushq %rax
; ASM-NEXT: .cfi_def_cfa_offset 16
; ASM-NEXT: .p2align 4{{$}}
;; When we assemble the file, either using the built-in asssembler or going
;; via a textual assembly file, we should get the same padding between the
;; initial push and the next block for alignment. It's a single 15 byte
;; nop.
; CHECK: 0: 50
; CHECK-NEXT: 66 66 66 66 66 66 2e 0f 1f 84 00 00 00 00 00 nopw %cs:(%rax,%rax)
;; Note that we specify a CPU to ensure the same nop patterns are selected
;; between llvm-mc and llc, just in case defaults changed, which one isn't
;; important.
target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-i128:128-f80:128-n8:16:32:64-S128"
target triple = "x86_64-unknown-linux-gnu"
; Function Attrs: noreturn nounwind uwtable
define dso_local void @b() local_unnamed_addr {
entry:
br label %for.cond
for.cond:
tail call void (...) @a()
br label %for.cond
}
declare void @a(...) local_unnamed_addr
!llvm.module.flags = !{!0, !1, !2, !3}
!llvm.ident = !{!4}
!0 = !{i32 1, !"wchar_size", i32 4}
!1 = !{i32 8, !"PIC Level", i32 2}
!2 = !{i32 7, !"PIE Level", i32 2}
!3 = !{i32 7, !"uwtable", i32 2}
!4 = !{!"clang"}