; RUN: llc < %s -mtriple=nvptx64-unknown-unknown | FileCheck %s
; RUN: %if ptxas %{ llc < %s -mtriple=nvptx64-unknown-unknown | %ptxas-verify %}
;
; NVPTXTargetLowering::getFunctionParamOptimizedAlign, which was introduces in
; D120129, contained a poorly designed assertion checking that a function with
; internal or private linkage is not a kernel. It relied on invariants that
; were not actually guaranteed, and that resulted in compiler crash with some
; CUDA versions (see discussion with @jdoerfert in D120129). This test contains
; metadata that caused compiler crash and a function with internal linkage
; which purpose is to let compiler run on path where the crash happened.
; Metadata was obtained from libdevice.10.bc shipped with cuda-11-0.
define internal i32 @foo() {
; CHECK-LABEL: .func (.param .b32 func_retval0) foo()
ret i32 42
}
define i32 @bar() {
; CHECK-LABEL: .visible .func (.param .b32 func_retval0) bar()
%x = call i32 @foo()
ret i32 %x
}
!nvvmir.version = !{!0}
!nvvm.annotations = !{!1, !2, !1, !3, !3, !3, !3, !4, !4, !3}
!0 = !{i32 1, i32 4}
!1 = !{null, !"align", i32 8}
!2 = !{null, !"align", i32 8, !"align", i32 65544, !"align", i32 131080}
!3 = !{null, !"align", i32 16}
!4 = !{null, !"align", i32 16, !"align", i32 65552, !"align", i32 131088}
!5 = distinct !{!5, !6}
!6 = !{!"llvm.loop.unroll.count", i32 1}
!7 = distinct !{!7, !6}