llvm/llvm/test/Transforms/PGOProfile/icp_vtable_cmp.ll

; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5

; Tests that ICP compares vtables by checking IR.
; RUN: opt < %s -passes='pgo-icall-prom' -pass-remarks=pgo-icall-prom -enable-vtable-profile-use -icp-max-num-vtable-last-candidate=2 -S 2>&1 | FileCheck %s --check-prefixes=VTABLE-COMMON,VTABLE-CMP
; Require exactly one vtable candidate for each function candidate. Tests that ICP compares function by checking IR.
; RUN: opt < %s -passes='pgo-icall-prom' -pass-remarks=pgo-icall-prom -enable-vtable-profile-use -icp-max-num-vtable-last-candidate=1 -S 2>&1 | FileCheck %s --check-prefixes=VTABLE-COMMON,FUNC-CMP
; On top of line 4, ignore 'Base1' and its derived types for vtable-based comparison. Tests that ICP compares functions.
; RUN: opt < %s -passes='pgo-icall-prom' -pass-remarks=pgo-icall-prom -enable-vtable-profile-use -icp-max-num-vtable-last-candidate=2 -icp-ignored-base-types='Base1' -S 2>&1 | FileCheck %s --check-prefixes=VTABLE-COMMON,FUNC-CMP

target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128"
target triple = "x86_64-unknown-linux-gnu"

@Base1 = constant { [4 x ptr] } { [4 x ptr] [ptr null, ptr null, ptr @Base1_foo, ptr @Base1_bar] }, !type !0
@Base2 = constant { [3 x ptr] } { [3 x ptr] [ptr null, ptr null, ptr @Base2_foo] }, !type !2
@Base3 = constant { [3 x ptr] } { [3 x ptr] [ptr null, ptr null, ptr @Base3_foo] }, !type !6

@Derived1 = constant { [3 x ptr], [4 x ptr] } { [3 x ptr] [ptr null, ptr null, ptr @Base2_foo], [4 x ptr] [ptr null, ptr null, ptr @Base1_foo, ptr @Derived1_bar] }, !type !1, !type !2, !type !3
@Derived2 = constant { [3 x ptr], [3 x ptr], [4 x ptr] } { [3 x ptr] [ptr null, ptr null, ptr @Base3_foo], [3 x ptr] [ptr null, ptr null, ptr @Base2_foo], [4 x ptr] [ptr null, ptr null, ptr @Base1_foo, ptr @Derived2_bar] }, !type !4, !type !5, !type !6, !type !7
@Derived3 = constant { [4 x ptr] } { [4 x ptr] [ptr null, ptr null, ptr @Base1_foo, ptr @Base1_bar] }, !type !0, !type !8

; VTABLE-CMP: remark: <unknown>:0:0: Promote indirect call to Derived1_bar with count 600 out of 1600, sink 2 instruction(s) and compare 1 vtable(s): {Derived1}
; VTABLE-CMP: remark: <unknown>:0:0: Promote indirect call to Derived2_bar with count 500 out of 1000, sink 2 instruction(s) and compare 1 vtable(s): {Derived2}
; VTABLE-CMP: remark: <unknown>:0:0: Promote indirect call to Base1_bar with count 400 out of 500, sink 2 instruction(s) and compare 2 vtable(s): {Derived3, Base1}

define void @test(ptr %d) {
; VTABLE-CMP-LABEL: define void @test(
; VTABLE-CMP-SAME: ptr [[D:%.*]]) {
; VTABLE-CMP-NEXT:  [[ENTRY:.*:]]
; VTABLE-CMP-NEXT:    [[VTABLE:%.*]] = load ptr, ptr [[D]], align 8, !prof [[PROF9:![0-9]+]]
; VTABLE-CMP-NEXT:    [[TMP0:%.*]] = tail call i1 @llvm.type.test(ptr [[VTABLE]], metadata !"Base1")
; VTABLE-CMP-NEXT:    tail call void @llvm.assume(i1 [[TMP0]])
; VTABLE-CMP-NEXT:    [[TMP1:%.*]] = icmp eq ptr [[VTABLE]], getelementptr inbounds (i8, ptr @Derived1, i32 40)
; VTABLE-CMP-NEXT:    br i1 [[TMP1]], label %[[IF_TRUE_DIRECT_TARG:.*]], label %[[IF_FALSE_ORIG_INDIRECT:.*]], !prof [[PROF10:![0-9]+]]
; VTABLE-CMP:       [[IF_TRUE_DIRECT_TARG]]:
; VTABLE-CMP-NEXT:    call void @Derived1_bar(ptr [[D]])
; VTABLE-CMP-NEXT:    br label %[[IF_END_ICP:.*]]
; VTABLE-CMP:       [[IF_FALSE_ORIG_INDIRECT]]:
; VTABLE-CMP-NEXT:    [[TMP2:%.*]] = icmp eq ptr [[VTABLE]], getelementptr inbounds (i8, ptr @Derived2, i32 64)
; VTABLE-CMP-NEXT:    br i1 [[TMP2]], label %[[IF_TRUE_DIRECT_TARG1:.*]], label %[[IF_FALSE_ORIG_INDIRECT2:.*]], !prof [[PROF11:![0-9]+]]
; VTABLE-CMP:       [[IF_TRUE_DIRECT_TARG1]]:
; VTABLE-CMP-NEXT:    call void @Derived2_bar(ptr [[D]])
; VTABLE-CMP-NEXT:    br label %[[IF_END_ICP3:.*]]
; VTABLE-CMP:       [[IF_FALSE_ORIG_INDIRECT2]]:
; VTABLE-CMP-NEXT:    [[TMP3:%.*]] = icmp eq ptr [[VTABLE]], getelementptr inbounds (i8, ptr @Base1, i32 16)
; VTABLE-CMP-NEXT:    [[TMP4:%.*]] = icmp eq ptr [[VTABLE]], getelementptr inbounds (i8, ptr @Derived3, i32 16)
; VTABLE-CMP-NEXT:    [[TMP5:%.*]] = or i1 [[TMP3]], [[TMP4]]
; VTABLE-CMP-NEXT:    br i1 [[TMP5]], label %[[IF_TRUE_DIRECT_TARG4:.*]], label %[[IF_FALSE_ORIG_INDIRECT5:.*]], !prof [[PROF12:![0-9]+]]
; VTABLE-CMP:       [[IF_TRUE_DIRECT_TARG4]]:
; VTABLE-CMP-NEXT:    call void @Base1_bar(ptr [[D]])
; VTABLE-CMP-NEXT:    br label %[[IF_END_ICP6:.*]]
; VTABLE-CMP:       [[IF_FALSE_ORIG_INDIRECT5]]:
; VTABLE-CMP-NEXT:    [[VFN:%.*]] = getelementptr inbounds ptr, ptr [[VTABLE]], i64 1
; VTABLE-CMP-NEXT:    [[TMP6:%.*]] = load ptr, ptr [[VFN]], align 8
; VTABLE-CMP-NEXT:    call void [[TMP6]](ptr [[D]])
; VTABLE-CMP-NEXT:    br label %[[IF_END_ICP6]]
; VTABLE-CMP:       [[IF_END_ICP6]]:
; VTABLE-CMP-NEXT:    br label %[[IF_END_ICP3]]
; VTABLE-CMP:       [[IF_END_ICP3]]:
; VTABLE-CMP-NEXT:    br label %[[IF_END_ICP]]
; VTABLE-CMP:       [[IF_END_ICP]]:
; VTABLE-CMP-NEXT:    ret void
;
; FUNC-CMP-LABEL: define void @test(
; FUNC-CMP-SAME: ptr [[D:%.*]]) {
; FUNC-CMP-NEXT:  [[ENTRY:.*:]]
; FUNC-CMP-NEXT:    [[VTABLE:%.*]] = load ptr, ptr [[D]], align 8, !prof [[PROF9:![0-9]+]]
; FUNC-CMP-NEXT:    [[TMP0:%.*]] = tail call i1 @llvm.type.test(ptr [[VTABLE]], metadata !"Base1")
; FUNC-CMP-NEXT:    tail call void @llvm.assume(i1 [[TMP0]])
; FUNC-CMP-NEXT:    [[VFN:%.*]] = getelementptr inbounds ptr, ptr [[VTABLE]], i64 1
; FUNC-CMP-NEXT:    [[TMP1:%.*]] = load ptr, ptr [[VFN]], align 8
; FUNC-CMP-NEXT:    [[TMP2:%.*]] = icmp eq ptr [[TMP1]], @Derived1_bar
; FUNC-CMP-NEXT:    br i1 [[TMP2]], label %[[IF_TRUE_DIRECT_TARG:.*]], label %[[IF_FALSE_ORIG_INDIRECT:.*]], !prof [[PROF10:![0-9]+]]
; FUNC-CMP:       [[IF_TRUE_DIRECT_TARG]]:
; FUNC-CMP-NEXT:    call void @Derived1_bar(ptr [[D]])
; FUNC-CMP-NEXT:    br label %[[IF_END_ICP:.*]]
; FUNC-CMP:       [[IF_FALSE_ORIG_INDIRECT]]:
; FUNC-CMP-NEXT:    [[TMP3:%.*]] = icmp eq ptr [[TMP1]], @Derived2_bar
; FUNC-CMP-NEXT:    br i1 [[TMP3]], label %[[IF_TRUE_DIRECT_TARG1:.*]], label %[[IF_FALSE_ORIG_INDIRECT2:.*]], !prof [[PROF11:![0-9]+]]
; FUNC-CMP:       [[IF_TRUE_DIRECT_TARG1]]:
; FUNC-CMP-NEXT:    call void @Derived2_bar(ptr [[D]])
; FUNC-CMP-NEXT:    br label %[[IF_END_ICP3:.*]]
; FUNC-CMP:       [[IF_FALSE_ORIG_INDIRECT2]]:
; FUNC-CMP-NEXT:    [[TMP4:%.*]] = icmp eq ptr [[TMP1]], @Base1_bar
; FUNC-CMP-NEXT:    br i1 [[TMP4]], label %[[IF_TRUE_DIRECT_TARG4:.*]], label %[[IF_FALSE_ORIG_INDIRECT5:.*]], !prof [[PROF12:![0-9]+]]
; FUNC-CMP:       [[IF_TRUE_DIRECT_TARG4]]:
; FUNC-CMP-NEXT:    call void @Base1_bar(ptr [[D]])
; FUNC-CMP-NEXT:    br label %[[IF_END_ICP6:.*]]
; FUNC-CMP:       [[IF_FALSE_ORIG_INDIRECT5]]:
; FUNC-CMP-NEXT:    call void [[TMP1]](ptr [[D]])
; FUNC-CMP-NEXT:    br label %[[IF_END_ICP6]]
; FUNC-CMP:       [[IF_END_ICP6]]:
; FUNC-CMP-NEXT:    br label %[[IF_END_ICP3]]
; FUNC-CMP:       [[IF_END_ICP3]]:
; FUNC-CMP-NEXT:    br label %[[IF_END_ICP]]
; FUNC-CMP:       [[IF_END_ICP]]:
; FUNC-CMP-NEXT:    ret void
;
entry:
  %vtable = load ptr, ptr %d, !prof !9
  %0 = tail call i1 @llvm.type.test(ptr %vtable, metadata !"Base1")
  tail call void @llvm.assume(i1 %0)
  %vfn = getelementptr inbounds ptr, ptr %vtable, i64 1
  %1 = load ptr, ptr %vfn
  call void %1(ptr %d), !prof !10
  ret void
}

define void @Base1_bar(ptr %this) {
  ret void
}

define void @Derived1_bar(ptr %this) {
  ret void
}

define void @Derived2_bar(ptr %this) {
  ret void
}


declare i1 @llvm.type.test(ptr, metadata)
declare void @llvm.assume(i1)
declare i32 @Base2_foo(ptr)
declare i32 @Base1_foo(ptr)
declare void @Base3_foo(ptr)

!llvm.module.flags = !{!11}
!0 = !{i64 16, !"Base1"}
!1 = !{i64 40, !"Base1"}
!2 = !{i64 16, !"Base2"}
!3 = !{i64 16, !"Derived1"}
!4 = !{i64 64, !"Base1"}
!5 = !{i64 40, !"Base2"}
!6 = !{i64 16, !"Base3"}
!7 = !{i64 16, !"Derived2"}
!8 = !{i64 16, !"Derived3"}
!9 = !{!"VP", i32 2, i64 1600, i64 -4123858694673519054, i64 600, i64 -7211198353767973908, i64 500, i64 -3574436251470806727, i64 200, i64 6288809125658696740, i64 200, i64 12345678, i64 100}
!10 = !{!"VP", i32 0, i64 1600, i64 3827408714133779784, i64 600, i64 5837445539218476403, i64 500, i64 -9064955852395570538, i64 400,  i64 56781234, i64 100}

!11 = !{i32 1, !"ProfileSummary", !12}
!12 = !{!13, !14, !15, !16, !17, !18, !19, !20}
!13 = !{!"ProfileFormat", !"InstrProf"}
!14 = !{!"TotalCount", i64 10000}
!15 = !{!"MaxCount", i64 10}
!16 = !{!"MaxInternalCount", i64 1}
!17 = !{!"MaxFunctionCount", i64 1000}
!18 = !{!"NumCounts", i64 3}
!19 = !{!"NumFunctions", i64 3}
!20 = !{!"DetailedSummary", !21}
!21 = !{!22, !23, !24}
!22 = !{i32 10000, i64 101, i32 1}
!23 = !{i32 990000, i64 101, i32 1}
!24 = !{i32 999999, i64 1, i32 2}


;.
; VTABLE-COMMON: [[PROF9]] = !{!"VP", i32 2, i64 100, i64 12345678, i64 100}
; VTABLE-COMMON: [[PROF10]] = !{!"branch_weights", i32 600, i32 1000}
; VTABLE-COMMON: [[PROF11]] = !{!"branch_weights", i32 500, i32 500}
; VTABLE-COMMON: [[PROF12]] = !{!"branch_weights", i32 400, i32 100}