; RUN: llvm-split -o %t %s -j 3 -mtriple amdgcn-amd-amdhsa
; RUN: llvm-dis -o - %t0 | FileCheck --check-prefix=CHECK0 --implicit-check-not=define %s
; RUN: llvm-dis -o - %t1 | FileCheck --check-prefix=CHECK1 --implicit-check-not=define %s
; RUN: llvm-dis -o - %t2 | FileCheck --check-prefix=CHECK2 --implicit-check-not=define %s
; We have 4 kernels:
; - Each kernel has an internal helper
; - @A and @B's helpers does an indirect call.
;
; We default to putting A/B in P0, alongside a copy
; of all helpers who have their address taken.
; The other kernels can still go into separate partitions.
;
; Note that dependency discovery shouldn't stop upon finding an
; indirect call. HelperC/D should also end up in P0 as they
; are dependencies of HelperB.
; CHECK0: define internal void @HelperD
; CHECK0: define amdgpu_kernel void @D
; CHECK1: define internal void @HelperC
; CHECK1: define amdgpu_kernel void @C
; CHECK2: define hidden void @HelperA
; CHECK2: define hidden void @HelperB
; CHECK2: define hidden void @CallCandidate
; CHECK2: define internal void @HelperC
; CHECK2: define internal void @HelperD
; CHECK2: define amdgpu_kernel void @A
; CHECK2: define amdgpu_kernel void @B
@addrthief = global [3 x ptr] [ptr @HelperA, ptr @HelperB, ptr @CallCandidate]
define internal void @HelperA(ptr %call) {
call void %call()
ret void
}
define internal void @HelperB(ptr %call) {
call void @HelperC()
call void %call()
call void @HelperD()
ret void
}
define internal void @CallCandidate() {
ret void
}
define internal void @HelperC() {
ret void
}
define internal void @HelperD() {
ret void
}
define amdgpu_kernel void @A(ptr %call) {
call void @HelperA(ptr %call)
ret void
}
define amdgpu_kernel void @B(ptr %call) {
call void @HelperB(ptr %call)
ret void
}
define amdgpu_kernel void @C() {
call void @HelperC()
ret void
}
define amdgpu_kernel void @D() {
call void @HelperD()
ret void
}