; RUN: opt < %s -passes=loop-interchange -cache-line-size=64 -pass-remarks-missed='loop-interchange' -pass-remarks-output=%t -S \
; RUN: -verify-dom-info -verify-loop-info -verify-loop-lcssa -stats 2>&1
; RUN: FileCheck --input-file=%t --check-prefix=REMARKS %s
; Triply nested loop, should be able to do interchange three times
; to get the ideal access pattern.
; void f(int e[10][10][10], int f[10][10][10]) {
; for (int a = 0; a < 10; a++) {
; for (int b = 0; b < 10; b++) {
; for (int c = 0; c < 10; c++) {
; f[c][b][a] = e[c][b][a];
; }
; }
; }
; }
; REMARKS: --- !Passed
; REMARKS-NEXT: Pass: loop-interchange
; REMARKS-NEXT: Name: Interchanged
; REMARKS-NEXT: Function: pr43326-triply-nested
; REMARKS: --- !Passed
; REMARKS-NEXT: Pass: loop-interchange
; REMARKS-NEXT: Name: Interchanged
; REMARKS-NEXT: Function: pr43326-triply-nested
; REMARKS: --- !Passed
; REMARKS-NEXT: Pass: loop-interchange
; REMARKS-NEXT: Name: Interchanged
; REMARKS-NEXT: Function: pr43326-triply-nested
define void @pr43326-triply-nested(ptr %e, ptr %f) {
entry:
br label %for.outermost.header
for.outermost.header: ; preds = %entry, %for.outermost.latch
%indvars.outermost = phi i64 [ 0, %entry ], [ %indvars.outermost.next, %for.outermost.latch ]
br label %for.middle.header
for.cond.cleanup: ; preds = %for.outermost.latch
ret void
for.middle.header: ; preds = %for.outermost.header, %for.middle.latch
%indvars.middle = phi i64 [ 0, %for.outermost.header ], [ %indvars.middle.next, %for.middle.latch ]
br label %for.innermost
for.outermost.latch: ; preds = %for.middle.latch
%indvars.outermost.next = add nuw nsw i64 %indvars.outermost, 1
%exitcond.outermost = icmp ne i64 %indvars.outermost.next, 10
br i1 %exitcond.outermost, label %for.outermost.header, label %for.cond.cleanup
for.middle.latch: ; preds = %for.innermost
%indvars.middle.next = add nuw nsw i64 %indvars.middle, 1
%exitcond.middle = icmp ne i64 %indvars.middle.next, 10
br i1 %exitcond.middle, label %for.middle.header, label %for.outermost.latch
for.innermost: ; preds = %for.middle.header, %for.innermost
%indvars.innermost = phi i64 [ 0, %for.middle.header ], [ %indvars.innermost.next, %for.innermost ]
%arrayidx12 = getelementptr inbounds [10 x [10 x i32]], ptr %e, i64 %indvars.innermost, i64 %indvars.middle, i64 %indvars.outermost
%0 = load i32, ptr %arrayidx12
%arrayidx18 = getelementptr inbounds [10 x [10 x i32]], ptr %f, i64 %indvars.innermost, i64 %indvars.middle, i64 %indvars.outermost
store i32 %0, ptr %arrayidx18
%indvars.innermost.next = add nuw nsw i64 %indvars.innermost, 1
%exitcond.innermost = icmp ne i64 %indvars.innermost.next, 10
br i1 %exitcond.innermost, label %for.innermost, label %for.middle.latch
}