# RUN: llc -mtriple=aarch64 -run-pass=machine-outliner -machine-outliner-reruns=1 -verify-machineinstrs %s -o - | FileCheck %s --check-prefix TWO-RUNS
# RUN: llc -mtriple=aarch64 -run-pass=machine-outliner -machine-outliner-reruns=0 -verify-machineinstrs %s -o - | FileCheck %s --check-prefix ONE-RUN
# RUN: llc -mtriple=aarch64 -run-pass=machine-outliner -machine-outliner-reruns=3 -verify-machineinstrs %s -o - | FileCheck %s --check-prefix FOUR-RUNS
# Example of Repeated Instruction Sequence - Iterative Machine Outlining
#
# define void @"$s12"(...) { define i64 @"$s5"(...) { define void @"$s13"(...) {
# ... ... ...
# %8 = load i1, i1* %7 %8 = load i1, i1* %7
# %9 = load i4, i4* %6 %9 = load i4, i4* %6 %9 = load i4, i4* %6
# store i4 %9, i4* %5 store i4 %9, i4* %5 store i4 %9, i4* %5
# ... ... ...
# } } }
#
# After machine outliner (1st time)
#
# define void @"$s12"(...) { define i64 @"$s5"(...) { define void @"$s13"(...) {
# ... ... ...
# %8 = load i1, i1* %7 %8 = load i1, i1* %7
# call void @outlined_function_1_1 call void @outlined_function_1_1 call void @outlined_function_1_1
# ... ... ...
# } } }
#
# After machine outliner (2nd time)
#
# define void @"$s12"(...) { define i64 @"$s5"(...) { define void @"$s13"(...) {
# ... ... ...
# call void @outlined_function_2_1 call void @outlined_function_1_1 call void @outlined_function_2_1
# ... ... ...
# } } }
#
# Check whether the machine outliner can find further outlining opportunities after
# machine outlining has already been performed.
#
# Embedded LLVM IR module: declares the two callees used by the MIR bodies and
# provides an empty IR stub for each of the three MIR functions defined below.
--- |
; External callees referenced by the BL instructions in the MIR bodies.
declare void @foo() local_unnamed_addr
declare void @widget() local_unnamed_addr
; IR stub for the MIR function baz.14.
; Function Attrs: minsize noredzone optsize
define void @baz.14() #0 {
ret void
}
; IR stub for the MIR function baz.15.
; Function Attrs: minsize noredzone optsize
define void @baz.15() #0 {
ret void
}
; IR stub for the MIR function baz.16.
; Function Attrs: minsize noredzone optsize
define void @baz.16() #0 {
ret void
}
; Attribute group shared by all three stubs.
attributes #0 = { minsize noredzone optsize }
...
---
# baz.14: saves $lr/$x19, sets up $x0-$x3, calls @foo and then @widget,
# restores the saved registers and returns. Its body is textually identical to
# baz.16; baz.15 differs only in the ADDXri immediate and some kill flags.
name: baz.14
tracksRegLiveness: true
stack:
- { id: 0, offset: -8, size: 8 }
- { id: 1, offset: -16, size: 8 }
body: |
bb.0:
liveins: $x0, $x19, $lr
; Prologue: store $lr and $x19 with a pre-indexed store pair, then emit CFI.
early-clobber $sp = frame-setup STPXpre killed $lr, killed $x19, $sp, -2 :: (store (s64) into %stack.1), (store (s64) into %stack.0)
frame-setup CFI_INSTRUCTION def_cfa_offset 16
frame-setup CFI_INSTRUCTION offset $w19, -8
frame-setup CFI_INSTRUCTION offset $w30, -16
; Keep the incoming $x0 in $x19 and advance $x0 by 48. This COPY/ADDXri pair
; is the sequence the TWO-RUNS checks expect inside OUTLINED_FUNCTION_2_0.
renamable $x19 = COPY $x0
renamable $x0 = nuw ADDXri $x0, 48, 0
; Remaining arguments for @foo: $x1 = $sp, $w2 = 33, $x3 = $xzr.
$x1 = ADDXri $sp, 0, 0
dead $w2 = MOVi32imm 33, implicit-def $x2
$x3 = COPY $xzr
BL @foo, csr_aarch64_aapcs, implicit-def dead $lr, implicit $sp, implicit $x0, implicit killed $x1, implicit killed $x2, implicit killed $x3, implicit-def $sp
; Move the value kept in $x19 back into $x0 and call @widget.
$x0 = COPY killed renamable $x19
BL @widget, csr_aarch64_aapcs, implicit-def dead $lr, implicit $sp, implicit $x0, implicit-def $sp
; Epilogue: reload $lr and $x19 with a post-indexed load pair and return.
early-clobber $sp, $lr, $x19 = frame-destroy LDPXpost $sp, 2 :: (load (s64) from %stack.1), (load (s64) from %stack.0)
RET_ReallyLR
...
---
# baz.15: same shape as baz.14/baz.16, but the ADDXri uses immediate 16
# (instead of 48) with a killed source operand, and $x1 is not marked killed
# on the call to @foo.
# NOTE(review): presumably these differences keep the COPY/ADDXri prefix of
# this function out of the second-round outlined function - confirm.
name: baz.15
tracksRegLiveness: true
stack:
- { id: 0, offset: -8, size: 8 }
- { id: 1, offset: -16, size: 8 }
body: |
bb.0:
liveins: $x0, $x19, $lr
; Prologue: store $lr and $x19 with a pre-indexed store pair, then emit CFI.
early-clobber $sp = frame-setup STPXpre killed $lr, killed $x19, $sp, -2 :: (store (s64) into %stack.1), (store (s64) into %stack.0)
frame-setup CFI_INSTRUCTION def_cfa_offset 16
frame-setup CFI_INSTRUCTION offset $w19, -8
frame-setup CFI_INSTRUCTION offset $w30, -16
; Keep the incoming $x0 in $x19 and advance $x0 by 16 (48 in the siblings).
renamable $x19 = COPY $x0
renamable $x0 = nuw ADDXri killed renamable $x0, 16, 0
; Remaining arguments for @foo: $x1 = $sp, $w2 = 33, $x3 = $xzr.
$x1 = ADDXri $sp, 0, 0
dead $w2 = MOVi32imm 33, implicit-def $x2
$x3 = COPY $xzr
BL @foo, csr_aarch64_aapcs, implicit-def dead $lr, implicit $sp, implicit $x0, implicit $x1, implicit killed $x2, implicit killed $x3, implicit-def $sp
; Move the value kept in $x19 back into $x0 and call @widget.
$x0 = COPY killed renamable $x19
BL @widget, csr_aarch64_aapcs, implicit-def dead $lr, implicit $sp, implicit $x0, implicit-def $sp
; Epilogue: reload $lr and $x19 with a post-indexed load pair and return.
early-clobber $sp, $lr, $x19 = frame-destroy LDPXpost $sp, 2 :: (load (s64) from %stack.1), (load (s64) from %stack.0)
RET_ReallyLR
...
---
# baz.16: textually identical body to baz.14 (ADDXri immediate 48, same kill
# flags), giving the outliner a second occurrence of the same sequence.
name: baz.16
tracksRegLiveness: true
stack:
- { id: 0, offset: -8, size: 8 }
- { id: 1, offset: -16, size: 8 }
body: |
bb.0:
liveins: $x0, $x19, $lr
; Prologue: store $lr and $x19 with a pre-indexed store pair, then emit CFI.
early-clobber $sp = frame-setup STPXpre killed $lr, killed $x19, $sp, -2 :: (store (s64) into %stack.1), (store (s64) into %stack.0)
frame-setup CFI_INSTRUCTION def_cfa_offset 16
frame-setup CFI_INSTRUCTION offset $w19, -8
frame-setup CFI_INSTRUCTION offset $w30, -16
; Keep the incoming $x0 in $x19 and advance $x0 by 48. This COPY/ADDXri pair
; is the sequence the TWO-RUNS checks expect inside OUTLINED_FUNCTION_2_0.
renamable $x19 = COPY $x0
renamable $x0 = nuw ADDXri $x0, 48, 0
; Remaining arguments for @foo: $x1 = $sp, $w2 = 33, $x3 = $xzr.
$x1 = ADDXri $sp, 0, 0
dead $w2 = MOVi32imm 33, implicit-def $x2
$x3 = COPY $xzr
BL @foo, csr_aarch64_aapcs, implicit-def dead $lr, implicit $sp, implicit $x0, implicit killed $x1, implicit killed $x2, implicit killed $x3, implicit-def $sp
; Move the value kept in $x19 back into $x0 and call @widget.
$x0 = COPY killed renamable $x19
BL @widget, csr_aarch64_aapcs, implicit-def dead $lr, implicit $sp, implicit $x0, implicit-def $sp
; Epilogue: reload $lr and $x19 with a post-indexed load pair and return.
early-clobber $sp, $lr, $x19 = frame-destroy LDPXpost $sp, 2 :: (load (s64) from %stack.1), (load (s64) from %stack.0)
RET_ReallyLR
...
# TWO-RUNS: name: OUTLINED_FUNCTION_2_0
# TWO-RUNS-DAG: bb.0:
# TWO-RUNS-DAG: renamable $x19 = COPY $x0
# TWO-RUNS-NEXT: renamable $x0 = nuw ADDXri $x0, 48, 0
# TWO-RUNS-NEXT: TCRETURNdi @OUTLINED_FUNCTION_0, 0, implicit $sp
#
# The machine outliner is expected to stop after the 1st iteration for case ONE-RUN
# since -machine-outliner-reruns is specified as 0.
# ONE-RUN-NOT: [[OUTLINED:OUTLINED_FUNCTION_2_[0-9]+]]
#
# The machine outliner is expected to stop at the 3rd iteration for case FOUR-RUNS
# since the MIR has no change at the 3rd iteration.
# FOUR-RUNS-NOT: [[OUTLINED:OUTLINED_FUNCTION_3_[0-9]+]]
# FOUR-RUNS-NOT: [[OUTLINED:OUTLINED_FUNCTION_4_[0-9]+]]