; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
; RUN: opt -S < %s -passes=loop-idiom | FileCheck %s
; CHECK-NOT: memset
; Check that no memset is generated for the stores below, because generating
; one would result in the udiv being hoisted out of the loop by the SCEV
; expander.
; TODO: Ideally we should be able to generate the memset once the SCEV
; expander is taught to emit the dependencies at the right point.
@a = global i32 0, align 4
@b = global i32 0, align 4
@c = external local_unnamed_addr global [1 x i8], align 1
; @e: a two-level loop nest with no exit. The outer-loop header computes
; udiv(@a, @b) from values loaded once in the entry block, and the inner loop
; stores a zero byte to @c at index sext(div) + iv on every iteration.
define void @e() local_unnamed_addr {
; CHECK-LABEL: @e(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[D0:%.*]] = load i32, ptr @a, align 4
; CHECK-NEXT: [[D1:%.*]] = load i32, ptr @b, align 4
; CHECK-NEXT: br label [[FOR_COND1THREAD_PRE_SPLIT:%.*]]
; CHECK: for.cond1thread-pre-split.loopexit:
; CHECK-NEXT: br label [[FOR_COND1THREAD_PRE_SPLIT]]
; CHECK: for.cond1thread-pre-split:
; CHECK-NEXT: [[DIV:%.*]] = udiv i32 [[D0]], [[D1]]
; CHECK-NEXT: br label [[FOR_BODY5:%.*]]
; CHECK: for.body5:
; CHECK-NEXT: [[INDVARS_IV:%.*]] = phi i64 [ 0, [[FOR_COND1THREAD_PRE_SPLIT]] ], [ [[INDVARS_IV_NEXT:%.*]], [[FOR_BODY5]] ]
; CHECK-NEXT: [[DIVX:%.*]] = sext i32 [[DIV]] to i64
; CHECK-NEXT: [[TMP0:%.*]] = add nsw i64 [[DIVX]], [[INDVARS_IV]]
; CHECK-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds [1 x i8], ptr @c, i64 0, i64 [[TMP0]]
; CHECK-NEXT: store i8 0, ptr [[ARRAYIDX]], align 1
; CHECK-NEXT: [[INDVARS_IV_NEXT]] = add nsw i64 [[INDVARS_IV]], 1
; CHECK-NEXT: [[TMP1:%.*]] = trunc i64 [[INDVARS_IV_NEXT]] to i32
; CHECK-NEXT: [[TOBOOL4:%.*]] = icmp eq i32 [[TMP1]], 0
; CHECK-NEXT: br i1 [[TOBOOL4]], label [[FOR_COND1THREAD_PRE_SPLIT_LOOPEXIT:%.*]], label [[FOR_BODY5]]
;
entry:
; Both operands of the division are loaded once, before the loop nest.
%d0 = load i32, ptr @a, align 4
%d1 = load i32, ptr @b, align 4
br label %for.cond1thread-pre-split
for.cond1thread-pre-split: ; preds = %for.body5, %entry
; The division sits in the outer-loop header; the assertions above expect it
; to remain in this block after the pass runs.
%div = udiv i32 %d0, %d1
br label %for.body5
for.body5: ; preds = %for.body5, %for.cond1thread-pre-split
; Induction variable: starts at 0 on every entry from the outer header.
%indvars.iv = phi i64 [ 0, %for.cond1thread-pre-split ], [ %indvars.iv.next, %for.body5 ]
; The store address is @c[sext(%div) + %indvars.iv], so it depends on the udiv.
%divx = sext i32 %div to i64
%0 = add nsw i64 %divx, %indvars.iv
%arrayidx = getelementptr inbounds [1 x i8], ptr @c, i64 0, i64 %0
store i8 0, ptr %arrayidx, align 1
%indvars.iv.next = add nsw i64 %indvars.iv, 1
; The inner loop is left once the low 32 bits of the incremented induction
; variable are zero; control then returns to the outer header.
%1 = trunc i64 %indvars.iv.next to i32
%tobool4 = icmp eq i32 %1, 0
br i1 %tobool4, label %for.cond1thread-pre-split, label %for.body5
}
; The loop's trip count depends on an unsafe operation (udiv).
; The SCEV expander hoists it out of the loop, so loop-idiom
; should make sure that no memset is generated in this case.
; @f: a two-level loop nest with no exit. The outer-loop header computes
; udiv(%a, %b) and zero-extends it to i64; the inner loop stores a zero byte to
; %x[i] for i = 0, 1, ... and repeats while i + 1 is signed-less-than that value.
define void @f(i32 %a, i32 %b, ptr nocapture %x) local_unnamed_addr {
; CHECK-LABEL: @f(
; CHECK-NEXT: entry:
; CHECK-NEXT: br label [[FOR_BODY:%.*]]
; CHECK: for.body.loopexit:
; CHECK-NEXT: br label [[FOR_BODY]]
; CHECK: for.body:
; CHECK-NEXT: [[DIV:%.*]] = udiv i32 [[A:%.*]], [[B:%.*]]
; CHECK-NEXT: [[CONV:%.*]] = zext i32 [[DIV]] to i64
; CHECK-NEXT: br label [[FOR_BODY6:%.*]]
; CHECK: for.body6:
; CHECK-NEXT: [[I_09:%.*]] = phi i64 [ [[INC:%.*]], [[FOR_BODY6]] ], [ 0, [[FOR_BODY]] ]
; CHECK-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i8, ptr [[X:%.*]], i64 [[I_09]]
; CHECK-NEXT: store i8 0, ptr [[ARRAYIDX]], align 1
; CHECK-NEXT: [[INC]] = add nuw nsw i64 [[I_09]], 1
; CHECK-NEXT: [[CMP3:%.*]] = icmp slt i64 [[INC]], [[CONV]]
; CHECK-NEXT: br i1 [[CMP3]], label [[FOR_BODY6]], label [[FOR_BODY_LOOPEXIT:%.*]]
;
entry:
br label %for.body
for.body: ; preds = %for.body6, %entry
; The quotient, widened to i64, is the bound tested by the inner loop's exit
; compare, so the inner loop's iteration count depends on the udiv.
%div = udiv i32 %a, %b
%conv = zext i32 %div to i64
br label %for.body6
for.body6: ; preds = %for.body6, %for.body
; Byte index into %x; starts at 0 on every entry from the outer header.
%i.09 = phi i64 [ %inc, %for.body6 ], [ 0, %for.body ]
%arrayidx = getelementptr inbounds i8, ptr %x, i64 %i.09
store i8 0, ptr %arrayidx, align 1
%inc = add nuw nsw i64 %i.09, 1
; Bottom-tested loop: the store above runs before the bound is compared.
%cmp3 = icmp slt i64 %inc, %conv
br i1 %cmp3, label %for.body6, label %for.body
}