; RUN: opt %loadNPMPolly '-passes=print<polly-function-scops>' -polly-invariant-load-hoisting=true -disable-output < %s 2>&1 | FileCheck %s
; RUN: opt %loadNPMPolly -passes=polly-codegen -polly-invariant-load-hoisting=true -S < %s 2>&1 | FileCheck %s --check-prefix=CODEGEN
;
; struct {
; int a;
; float b;
; } S;
;
; float f(int *A) {
; int x;
; float y;
; int i = 0;
; do {
; x = S.a;
; y = S.b;
; A[i] = x + y;
; } while (i++ < 1000);
; return x + y;
; }
;
; CHECK: Invariant Accesses: {
; CHECK-NEXT: ReadAccess := [Reduction Type: NONE] [Scalar: 0]
; CHECK-NEXT: { Stmt_do_body[i0] -> MemRef_S[0] };
; CHECK-NEXT: Execution Context: { : }
; CHECK-NEXT: ReadAccess := [Reduction Type: NONE] [Scalar: 0]
; CHECK-NEXT: { Stmt_do_body[i0] -> MemRef_S[1] };
; CHECK-NEXT: Execution Context: { : }
; CHECK-NEXT: }
;
; CHECK: Statements {
; CHECK-NEXT: Stmt_do_body
; CHECK-NEXT: Domain :=
; CHECK-NEXT: { Stmt_do_body[i0] : 0 <= i0 <= 1000 };
; CHECK-NEXT: Schedule :=
; CHECK-NEXT: { Stmt_do_body[i0] -> [i0] };
; CHECK-NEXT: MustWriteAccess := [Reduction Type: NONE] [Scalar: 0]
; CHECK-NEXT: { Stmt_do_body[i0] -> MemRef_A[i0] };
; CHECK-NEXT: }
;
; CODEGEN: entry:
; CODEGEN: %S.b.preload.s2a = alloca float
; CODEGEN: %S.a.preload.s2a = alloca i32
;
; CODEGEN: polly.preload.begin:
; CODEGEN: %S.load = load i32, ptr @S
; CODEGEN: store i32 %S.load, ptr %S.a.preload.s2a
; CODEGEN: %.load = load float, ptr getelementptr (i32, ptr @S, i64 1)
; CODEGEN: store float %.load, ptr %S.b.preload.s2a
;
; CODEGEN: polly.merge_new_and_old:
; CODEGEN-DAG: %S.b.merge = phi float [ %S.b.final_reload, %polly.exiting ], [ %S.b, %do.cond ]
; CODEGEN-DAG: %S.a.merge = phi i32 [ %S.a.final_reload, %polly.exiting ], [ %S.a, %do.cond ]
;
; CODEGEN: do.end:
; CODEGEN: %conv3 = sitofp i32 %S.a.merge to float
; CODEGEN: %add4 = fadd float %conv3, %S.b.merge
; CODEGEN: ret float %add4
;
; CODEGEN: polly.loop_exit:
; CODEGEN-DAG: %S.b.final_reload = load float, ptr %S.b.preload.s2a
; CODEGEN-DAG: %S.a.final_reload = load i32, ptr %S.a.preload.s2a
;
target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
%struct.anon = type { i32, float }
@S = common global %struct.anon zeroinitializer, align 4
define float @f(ptr %A) {
entry:
br label %do.body
do.body: ; preds = %do.cond, %entry
%indvars.iv = phi i64 [ %indvars.iv.next, %do.cond ], [ 0, %entry ]
%S.a = load i32, ptr @S, align 4
%S.b = load float, ptr getelementptr inbounds (%struct.anon, ptr @S, i64 0, i32 1), align 4
%conv = sitofp i32 %S.a to float
%add = fadd float %conv, %S.b
%conv1 = fptosi float %add to i32
%arrayidx = getelementptr inbounds i32, ptr %A, i64 %indvars.iv
store i32 %conv1, ptr %arrayidx, align 4
br label %do.cond
do.cond: ; preds = %do.body
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
%exitcond = icmp ne i64 %indvars.iv.next, 1001
br i1 %exitcond, label %do.body, label %do.end
do.end: ; preds = %do.cond
%conv3 = sitofp i32 %S.a to float
%add4 = fadd float %conv3, %S.b
ret float %add4
}