; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
; RUN: opt < %s -passes=loop-unroll -unroll-runtime -unroll-allow-partial -S | FileCheck %s
declare void @f() convergent
declare void @g()
; Although this loop contains a convergent instruction, it should be
; fully unrolled.
define i32 @full_unroll() {
; CHECK-LABEL: @full_unroll(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[ANCHOR:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: br label [[L3:%.*]]
; CHECK: l3:
; CHECK-NEXT: [[TOK_LOOP:%.*]] = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token [[ANCHOR]]) ]
; CHECK-NEXT: br label [[A:%.*]]
; CHECK: a:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: br label [[A_1:%.*]]
; CHECK: a.1:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: br label [[A_2:%.*]]
; CHECK: a.2:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: ret i32 0
;
entry:
%anchor = call token @llvm.experimental.convergence.anchor()
br label %l3
l3:
%x.0 = phi i32 [ 0, %entry ], [ %inc, %a ]
%tok.loop = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token %anchor) ]
%inc = add nsw i32 %x.0, 1
%exitcond = icmp eq i32 %inc, 3
br label %a
a:
call void @f() [ "convergencectrl"(token %tok.loop) ]
br i1 %exitcond, label %exit, label %l3
exit:
ret i32 0
}
; This loop contains a convergent instruction, but it should be partially
; unrolled. The unroll count is the largest power of 2 that divides the
; multiple -- 4, in this case.
define i32 @runtime_unroll(i32 %n) {
; CHECK-LABEL: @runtime_unroll(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[ANCHOR:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: [[LOOP_CTL:%.*]] = mul nsw i32 [[N:%.*]], 12
; CHECK-NEXT: br label [[L3:%.*]]
; CHECK: l3:
; CHECK-NEXT: [[X_0:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC_3:%.*]], [[A_3:%.*]] ]
; CHECK-NEXT: [[TOK_LOOP:%.*]] = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token [[ANCHOR]]) ]
; CHECK-NEXT: br label [[A:%.*]]
; CHECK: a:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: br label [[A_1:%.*]]
; CHECK: a.1:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: br label [[A_2:%.*]]
; CHECK: a.2:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: br label [[A_3]]
; CHECK: a.3:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: [[INC_3]] = add nsw i32 [[X_0]], 4
; CHECK-NEXT: [[EXITCOND_3:%.*]] = icmp eq i32 [[INC_3]], [[LOOP_CTL]]
; CHECK-NEXT: br i1 [[EXITCOND_3]], label [[EXIT:%.*]], label [[L3]]
; CHECK: exit:
; CHECK-NEXT: ret i32 0
;
entry:
%anchor = call token @llvm.experimental.convergence.anchor()
%loop_ctl = mul nsw i32 %n, 12
br label %l3
l3:
%x.0 = phi i32 [ 0, %entry ], [ %inc, %a ]
%tok.loop = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token %anchor) ]
br label %a
a:
call void @f() [ "convergencectrl"(token %tok.loop) ]
%inc = add nsw i32 %x.0, 1
%exitcond = icmp eq i32 %inc, %loop_ctl
br i1 %exitcond, label %exit, label %l3
exit:
ret i32 0
}
; This loop contains a convergent instruction, so its partial unroll
; count must divide its trip multiple. This overrides its unroll
; pragma -- we unroll exactly 8 times, even though 16 is requested.
define i32 @pragma_unroll(i32 %n) {
; CHECK-LABEL: @pragma_unroll(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[ANCHOR:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: [[LOOP_CTL:%.*]] = mul nsw i32 [[N:%.*]], 24
; CHECK-NEXT: br label [[L3:%.*]], !llvm.loop [[LOOP0:![0-9]+]]
; CHECK: l3:
; CHECK-NEXT: [[X_0:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC_7:%.*]], [[A_7:%.*]] ]
; CHECK-NEXT: [[TOK_LOOP:%.*]] = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token [[ANCHOR]]) ]
; CHECK-NEXT: br label [[A:%.*]]
; CHECK: a:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: br label [[A_1:%.*]]
; CHECK: a.1:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: br label [[A_2:%.*]]
; CHECK: a.2:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: br label [[A_3:%.*]]
; CHECK: a.3:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: br label [[A_4:%.*]]
; CHECK: a.4:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: br label [[A_5:%.*]]
; CHECK: a.5:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: br label [[A_6:%.*]]
; CHECK: a.6:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: br label [[A_7]]
; CHECK: a.7:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: [[INC_7]] = add nsw i32 [[X_0]], 8
; CHECK-NEXT: [[EXITCOND_7:%.*]] = icmp eq i32 [[INC_7]], [[LOOP_CTL]]
; CHECK-NEXT: br i1 [[EXITCOND_7]], label [[EXIT:%.*]], label [[L3]], !llvm.loop [[LOOP2:![0-9]+]]
; CHECK: exit:
; CHECK-NEXT: ret i32 0
;
entry:
%anchor = call token @llvm.experimental.convergence.anchor()
%loop_ctl = mul nsw i32 %n, 24
br label %l3, !llvm.loop !0
l3:
%x.0 = phi i32 [ 0, %entry ], [ %inc, %a ]
%tok.loop = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token %anchor) ]
br label %a
a:
call void @f() [ "convergencectrl"(token %tok.loop) ]
%inc = add nsw i32 %x.0, 1
%exitcond = icmp eq i32 %inc, %loop_ctl
br i1 %exitcond, label %exit, label %l3, !llvm.loop !0
exit:
ret i32 0
}
; This loop contains a convergent instruction. Since the pragma loop unroll
; count 2 divides trip count 4. The loop unroll should respect the pragma.
define void @pragma_unroll_divisible_trip_count() {
; CHECK-LABEL: @pragma_unroll_divisible_trip_count(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[ANCHOR:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: br label [[L3:%.*]], !llvm.loop [[LOOP4:![0-9]+]]
; CHECK: l3:
; CHECK-NEXT: [[X_0:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC_1:%.*]], [[L3]] ]
; CHECK-NEXT: [[TOK_LOOP:%.*]] = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token [[ANCHOR]]) ]
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: [[INC_1]] = add nuw nsw i32 [[X_0]], 2
; CHECK-NEXT: [[EXITCOND_1:%.*]] = icmp eq i32 [[INC_1]], 4
; CHECK-NEXT: br i1 [[EXITCOND_1]], label [[EXIT:%.*]], label [[L3]], !llvm.loop [[LOOP6:![0-9]+]]
; CHECK: exit:
; CHECK-NEXT: ret void
;
entry:
%anchor = call token @llvm.experimental.convergence.anchor()
br label %l3, !llvm.loop !1
l3:
%x.0 = phi i32 [ 0, %entry ], [ %inc, %l3 ]
%tok.loop = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token %anchor) ]
call void @f() [ "convergencectrl"(token %tok.loop) ]
%inc = add nsw i32 %x.0, 1
%exitcond = icmp eq i32 %inc, 4
br i1 %exitcond, label %exit, label %l3, !llvm.loop !1
exit:
ret void
}
; This loop contains a convergent instruction. Since the pragma loop unroll
; count 2 divides trip multiple 2. The loop unroll should respect the pragma.
define i32 @pragma_unroll_divisible_trip_multiple(i32 %n) {
; CHECK-LABEL: @pragma_unroll_divisible_trip_multiple(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[ANCHOR:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: [[LOOP_CTL:%.*]] = mul nsw i32 [[N:%.*]], 2
; CHECK-NEXT: br label [[L3:%.*]], !llvm.loop [[LOOP4]]
; CHECK: l3:
; CHECK-NEXT: [[X_0:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC_1:%.*]], [[L3]] ]
; CHECK-NEXT: [[TOK_LOOP:%.*]] = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token [[ANCHOR]]) ]
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: [[INC_1]] = add nsw i32 [[X_0]], 2
; CHECK-NEXT: [[EXITCOND_1:%.*]] = icmp eq i32 [[INC_1]], [[LOOP_CTL]]
; CHECK-NEXT: br i1 [[EXITCOND_1]], label [[EXIT:%.*]], label [[L3]], !llvm.loop [[LOOP7:![0-9]+]]
; CHECK: exit:
; CHECK-NEXT: ret i32 0
;
entry:
%anchor = call token @llvm.experimental.convergence.anchor()
%loop_ctl = mul nsw i32 %n, 2
br label %l3, !llvm.loop !1
l3:
%x.0 = phi i32 [ 0, %entry ], [ %inc, %l3 ]
%tok.loop = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token %anchor) ]
call void @f() [ "convergencectrl"(token %tok.loop) ]
%inc = add nsw i32 %x.0, 1
%exitcond = icmp eq i32 %inc, %loop_ctl
br i1 %exitcond, label %exit, label %l3, !llvm.loop !1
exit:
ret i32 0
}
; This loop contains a convergent instruction. Since the pragma loop unroll
; count 2 is unknown to divide runtime trip count, the loop is not unrolled
; since remainder is forbidden for unrolling convergent loop.
define i32 @pragma_unroll_indivisible_runtime_trip_count(i32 %n) {
; CHECK-LABEL: @pragma_unroll_indivisible_runtime_trip_count(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[ANCHOR:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: br label [[L3:%.*]], !llvm.loop [[LOOP4]]
; CHECK: l3:
; CHECK-NEXT: [[X_0:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC:%.*]], [[L3]] ]
; CHECK-NEXT: [[TOK_LOOP:%.*]] = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token [[ANCHOR]]) ]
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: [[INC]] = add nsw i32 [[X_0]], 1
; CHECK-NEXT: [[EXITCOND:%.*]] = icmp eq i32 [[INC]], [[N:%.*]]
; CHECK-NEXT: br i1 [[EXITCOND]], label [[EXIT:%.*]], label [[L3]], !llvm.loop [[LOOP4]]
; CHECK: exit:
; CHECK-NEXT: ret i32 0
;
entry:
%anchor = call token @llvm.experimental.convergence.anchor()
br label %l3, !llvm.loop !1
l3:
%x.0 = phi i32 [ 0, %entry ], [ %inc, %l3 ]
%tok.loop = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token %anchor) ]
call void @f() [ "convergencectrl"(token %tok.loop) ]
%inc = add nsw i32 %x.0, 1
%exitcond = icmp eq i32 %inc, %n
br i1 %exitcond, label %exit, label %l3, !llvm.loop !1
exit:
ret i32 0
}
; This loop contains a convergent instruction. Since the pragma loop unroll
; count 2 does not divide trip count 5, the loop is not unrolled by 2
; since remainder is forbidden for unrolling convergent loop. Instead, the
; loop gets fully unrolled.
define i32 @pragma_unroll_indivisible_trip_count() {
; CHECK-LABEL: @pragma_unroll_indivisible_trip_count(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[ANCHOR:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: br label [[L3:%.*]], !llvm.loop [[LOOP4]]
; CHECK: l3:
; CHECK-NEXT: [[TOK_LOOP:%.*]] = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token [[ANCHOR]]) ]
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: ret i32 0
;
entry:
%anchor = call token @llvm.experimental.convergence.anchor()
br label %l3, !llvm.loop !1
l3:
%x.0 = phi i32 [ 0, %entry ], [ %inc, %l3 ]
%tok.loop = call token @llvm.experimental.convergence.loop() [ "convergencectrl"(token %anchor) ]
call void @f() [ "convergencectrl"(token %tok.loop) ]
%inc = add nsw i32 %x.0, 1
%exitcond = icmp eq i32 %inc, 5
br i1 %exitcond, label %exit, label %l3, !llvm.loop !1
exit:
ret i32 0
}
; This loop contains a convergent instruction that is anchored inside the loop
; itself. It is unrolled by 2 with remainder, as requested by the loop metadata.
define i32 @pragma_unroll_with_remainder(i32 %n) {
; CHECK-LABEL: @pragma_unroll_with_remainder(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[TMP0:%.*]] = freeze i32 [[N:%.*]]
; CHECK-NEXT: [[TMP1:%.*]] = add i32 [[TMP0]], -1
; CHECK-NEXT: [[XTRAITER:%.*]] = and i32 [[TMP0]], 1
; CHECK-NEXT: [[TMP2:%.*]] = icmp ult i32 [[TMP1]], 1
; CHECK-NEXT: br i1 [[TMP2]], label [[EXIT_UNR_LCSSA:%.*]], label [[ENTRY_NEW:%.*]]
; CHECK: entry.new:
; CHECK-NEXT: [[UNROLL_ITER:%.*]] = sub i32 [[TMP0]], [[XTRAITER]]
; CHECK-NEXT: br label [[L3:%.*]], !llvm.loop [[LOOP4]]
; CHECK: l3:
; CHECK-NEXT: [[X_0:%.*]] = phi i32 [ 0, [[ENTRY_NEW]] ], [ [[INC_1:%.*]], [[L3]] ]
; CHECK-NEXT: [[NITER:%.*]] = phi i32 [ 0, [[ENTRY_NEW]] ], [ [[NITER_NEXT_1:%.*]], [[L3]] ]
; CHECK-NEXT: [[TOK_LOOP:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: [[TOK_LOOP_1:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP_1]]) ]
; CHECK-NEXT: [[INC_1]] = add nsw i32 [[X_0]], 2
; CHECK-NEXT: [[NITER_NEXT_1]] = add i32 [[NITER]], 2
; CHECK-NEXT: [[NITER_NCMP_1:%.*]] = icmp eq i32 [[NITER_NEXT_1]], [[UNROLL_ITER]]
; CHECK-NEXT: br i1 [[NITER_NCMP_1]], label [[EXIT_UNR_LCSSA_LOOPEXIT:%.*]], label [[L3]], !llvm.loop [[LOOP8:![0-9]+]]
; CHECK: exit.unr-lcssa.loopexit:
; CHECK-NEXT: br label [[EXIT_UNR_LCSSA]]
; CHECK: exit.unr-lcssa:
; CHECK-NEXT: [[LCMP_MOD:%.*]] = icmp ne i32 [[XTRAITER]], 0
; CHECK-NEXT: br i1 [[LCMP_MOD]], label [[L3_EPIL_PREHEADER:%.*]], label [[EXIT:%.*]]
; CHECK: l3.epil.preheader:
; CHECK-NEXT: br label [[L3_EPIL:%.*]]
; CHECK: l3.epil:
; CHECK-NEXT: [[TOK_LOOP_EPIL:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP_EPIL]]) ]
; CHECK-NEXT: br label [[EXIT]]
; CHECK: exit:
; CHECK-NEXT: ret i32 0
;
entry:
br label %l3, !llvm.loop !1
l3:
%x.0 = phi i32 [ 0, %entry ], [ %inc, %l3 ]
%tok.loop = call token @llvm.experimental.convergence.anchor()
call void @f() [ "convergencectrl"(token %tok.loop) ]
%inc = add nsw i32 %x.0, 1
%exitcond = icmp eq i32 %inc, %n
br i1 %exitcond, label %exit, label %l3, !llvm.loop !1
exit:
ret i32 0
}
; Don't unroll a loop that is extended by convergence controls.
;
; We could theoretically duplicate the extension part, but this is not
; implemented.
define i32 @extended_loop(i32 %n) {
; CHECK-LABEL: @extended_loop(
; CHECK-NEXT: entry:
; CHECK-NEXT: br label [[L3:%.*]], !llvm.loop [[LOOP4]]
; CHECK: l3:
; CHECK-NEXT: [[X_0:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC:%.*]], [[L3]] ]
; CHECK-NEXT: [[TOK_LOOP:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: [[INC]] = add nsw i32 [[X_0]], 1
; CHECK-NEXT: [[EXITCOND:%.*]] = icmp eq i32 [[INC]], [[N:%.*]]
; CHECK-NEXT: br i1 [[EXITCOND]], label [[EXIT:%.*]], label [[L3]], !llvm.loop [[LOOP4]]
; CHECK: exit:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_LOOP]]) ]
; CHECK-NEXT: ret i32 0
;
entry:
br label %l3, !llvm.loop !1
l3:
%x.0 = phi i32 [ 0, %entry ], [ %inc, %l3 ]
%tok.loop = call token @llvm.experimental.convergence.anchor()
%inc = add nsw i32 %x.0, 1
%exitcond = icmp eq i32 %inc, %n
br i1 %exitcond, label %exit, label %l3, !llvm.loop !1
exit:
call void @f() [ "convergencectrl"(token %tok.loop) ]
ret i32 0
}
; Inner loop is extended beyond the outer loop. No unrolling possible.
define i32 @extended_inner_loop_1(i32 %n, i1 %cond) {
; CHECK-LABEL: @extended_inner_loop_1(
; CHECK-NEXT: entry:
; CHECK-NEXT: br label [[L3:%.*]]
; CHECK: l3:
; CHECK-NEXT: [[X_0:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC:%.*]], [[LATCH:%.*]] ]
; CHECK-NEXT: [[TOK_LOOP:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: [[INC]] = add nsw i32 [[X_0]], 1
; CHECK-NEXT: [[EXITCOND:%.*]] = icmp eq i32 [[INC]], 4
; CHECK-NEXT: br label [[L2:%.*]], !llvm.loop [[LOOP4]]
; CHECK: l2:
; CHECK-NEXT: [[TOK_L2:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2]]) ]
; CHECK-NEXT: br i1 [[COND:%.*]], label [[L2]], label [[LATCH]], !llvm.loop [[LOOP4]]
; CHECK: latch:
; CHECK-NEXT: br i1 [[EXITCOND]], label [[EXIT:%.*]], label [[L3]]
; CHECK: exit:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2]]) ]
; CHECK-NEXT: ret i32 0
;
entry:
br label %l3
l3:
%x.0 = phi i32 [ 0, %entry ], [ %inc, %latch ]
%tok.loop = call token @llvm.experimental.convergence.anchor()
%inc = add nsw i32 %x.0, 1
%exitcond = icmp eq i32 %inc, 4
br label %l2, !llvm.loop !1
l2:
%tok.l2 = call token @llvm.experimental.convergence.anchor()
call void @f() [ "convergencectrl"(token %tok.l2) ]
br i1 %cond, label %l2, label %latch, !llvm.loop !1
latch:
br i1 %exitcond, label %exit, label %l3
exit:
call void @f() [ "convergencectrl"(token %tok.l2) ]
ret i32 0
}
; Inner loop is extended inside the outer loop. Outer loop is unrolled.
define i32 @extended_inner_loop_2(i32 %n, i1 %cond) {
; CHECK-LABEL: @extended_inner_loop_2(
; CHECK-NEXT: entry:
; CHECK-NEXT: br label [[L3:%.*]]
; CHECK: l3:
; CHECK-NEXT: br label [[L2:%.*]], !llvm.loop [[LOOP4]]
; CHECK: l2:
; CHECK-NEXT: [[TOK_L2:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2]]) ]
; CHECK-NEXT: br i1 [[COND:%.*]], label [[L2]], label [[LATCH:%.*]], !llvm.loop [[LOOP4]]
; CHECK: latch:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2]]) ]
; CHECK-NEXT: br label [[L2_1:%.*]], !llvm.loop [[LOOP4]]
; CHECK: l2.1:
; CHECK-NEXT: [[TOK_L2_1:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_1]]) ]
; CHECK-NEXT: br i1 [[COND]], label [[L2_1]], label [[LATCH_1:%.*]], !llvm.loop [[LOOP4]]
; CHECK: latch.1:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_1]]) ]
; CHECK-NEXT: br label [[L2_2:%.*]], !llvm.loop [[LOOP4]]
; CHECK: l2.2:
; CHECK-NEXT: [[TOK_L2_2:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_2]]) ]
; CHECK-NEXT: br i1 [[COND]], label [[L2_2]], label [[LATCH_2:%.*]], !llvm.loop [[LOOP4]]
; CHECK: latch.2:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_2]]) ]
; CHECK-NEXT: br label [[L2_3:%.*]], !llvm.loop [[LOOP4]]
; CHECK: l2.3:
; CHECK-NEXT: [[TOK_L2_3:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_3]]) ]
; CHECK-NEXT: br i1 [[COND]], label [[L2_3]], label [[LATCH_3:%.*]], !llvm.loop [[LOOP4]]
; CHECK: latch.3:
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_3]]) ]
; CHECK-NEXT: ret i32 0
;
entry:
br label %l3
l3:
%x.0 = phi i32 [ 0, %entry ], [ %inc, %latch ]
%tok.loop = call token @llvm.experimental.convergence.anchor()
%inc = add nsw i32 %x.0, 1
%exitcond = icmp eq i32 %inc, 4
br label %l2, !llvm.loop !1
l2:
%tok.l2 = call token @llvm.experimental.convergence.anchor()
call void @f() [ "convergencectrl"(token %tok.l2) ]
br i1 %cond, label %l2, label %latch, !llvm.loop !1
latch:
call void @f() [ "convergencectrl"(token %tok.l2) ]
br i1 %exitcond, label %exit, label %l3
exit:
ret i32 0
}
; No extension. Both loops unrolled.
define i32 @unroll_nest(i32 %n, i1 %cond) {
; CHECK-LABEL: @unroll_nest(
; CHECK-NEXT: entry:
; CHECK-NEXT: br label [[L3:%.*]]
; CHECK: l3:
; CHECK-NEXT: br label [[L2:%.*]], !llvm.loop [[LOOP4]]
; CHECK: l2:
; CHECK-NEXT: [[TOK_L2:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2]]) ]
; CHECK-NEXT: br i1 [[COND:%.*]], label [[L2_1:%.*]], label [[LATCH:%.*]], !llvm.loop [[LOOP4]]
; CHECK: l2.1:
; CHECK-NEXT: [[TOK_L2_1:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_1]]) ]
; CHECK-NEXT: br i1 [[COND]], label [[L2]], label [[LATCH]], !llvm.loop [[LOOP9:![0-9]+]]
; CHECK: latch:
; CHECK-NEXT: br label [[L2_12:%.*]], !llvm.loop [[LOOP4]]
; CHECK: l2.12:
; CHECK-NEXT: [[TOK_L2_11:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_11]]) ]
; CHECK-NEXT: br i1 [[COND]], label [[L2_1_1:%.*]], label [[LATCH_1:%.*]], !llvm.loop [[LOOP4]]
; CHECK: l2.1.1:
; CHECK-NEXT: [[TOK_L2_1_1:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_1_1]]) ]
; CHECK-NEXT: br i1 [[COND]], label [[L2_12]], label [[LATCH_1]], !llvm.loop [[LOOP9]]
; CHECK: latch.1:
; CHECK-NEXT: br label [[L2_2:%.*]], !llvm.loop [[LOOP4]]
; CHECK: l2.2:
; CHECK-NEXT: [[TOK_L2_2:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_2]]) ]
; CHECK-NEXT: br i1 [[COND]], label [[L2_1_2:%.*]], label [[LATCH_2:%.*]], !llvm.loop [[LOOP4]]
; CHECK: l2.1.2:
; CHECK-NEXT: [[TOK_L2_1_2:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_1_2]]) ]
; CHECK-NEXT: br i1 [[COND]], label [[L2_2]], label [[LATCH_2]], !llvm.loop [[LOOP9]]
; CHECK: latch.2:
; CHECK-NEXT: br label [[L2_3:%.*]], !llvm.loop [[LOOP4]]
; CHECK: l2.3:
; CHECK-NEXT: [[TOK_L2_3:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_3]]) ]
; CHECK-NEXT: br i1 [[COND]], label [[L2_1_3:%.*]], label [[LATCH_3:%.*]], !llvm.loop [[LOOP4]]
; CHECK: l2.1.3:
; CHECK-NEXT: [[TOK_L2_1_3:%.*]] = call token @llvm.experimental.convergence.anchor()
; CHECK-NEXT: call void @f() [ "convergencectrl"(token [[TOK_L2_1_3]]) ]
; CHECK-NEXT: br i1 [[COND]], label [[L2_3]], label [[LATCH_3]], !llvm.loop [[LOOP9]]
; CHECK: latch.3:
; CHECK-NEXT: ret i32 0
;
entry:
br label %l3
l3:
%x.0 = phi i32 [ 0, %entry ], [ %inc, %latch ]
%tok.loop = call token @llvm.experimental.convergence.anchor()
%inc = add nsw i32 %x.0, 1
%exitcond = icmp eq i32 %inc, 4
br label %l2, !llvm.loop !1
l2:
%tok.l2 = call token @llvm.experimental.convergence.anchor()
call void @f() [ "convergencectrl"(token %tok.l2) ]
br i1 %cond, label %l2, label %latch, !llvm.loop !1
latch:
br i1 %exitcond, label %exit, label %l3
exit:
ret i32 0
}
declare token @llvm.experimental.convergence.anchor()
declare token @llvm.experimental.convergence.loop()
!0 = !{!0, !{!"llvm.loop.unroll.count", i32 16}}
!1 = !{!1, !{!"llvm.loop.unroll.count", i32 2}}