llvm/llvm/test/CodeGen/AArch64/arm64-prefetch.ll

; RUN: llc < %s -mtriple=arm64-eabi | FileCheck %s
; RUN: llc -O0 --global-isel-abort=1 < %s -mtriple=arm64-eabi | FileCheck %s

@a = common global ptr null, align 8

define void @test(i32 %i, i32 %j) nounwind ssp {
entry:
  ; CHECK: @test
  %j.addr = alloca i32, align 4
  store i32 %j, ptr %j.addr, align 4, !tbaa !0
  ; CHECK: prfum pldl1strm
  call void @llvm.prefetch(ptr %j.addr, i32 0, i32 0, i32 1)
  ; CHECK: prfum pldl3keep
  call void @llvm.prefetch(ptr %j.addr, i32 0, i32 1, i32 1)
  ; CHECK: prfum pldl2keep
  call void @llvm.prefetch(ptr %j.addr, i32 0, i32 2, i32 1)
  ; CHECK: prfum pldl1keep
  call void @llvm.prefetch(ptr %j.addr, i32 0, i32 3, i32 1)

  ; CHECK: prfum plil1strm
  call void @llvm.prefetch(ptr %j.addr, i32 0, i32 0, i32 0)
  ; CHECK: prfum plil3keep
  call void @llvm.prefetch(ptr %j.addr, i32 0, i32 1, i32 0)
  ; CHECK: prfum plil2keep
  call void @llvm.prefetch(ptr %j.addr, i32 0, i32 2, i32 0)
  ; CHECK: prfum plil1keep
  call void @llvm.prefetch(ptr %j.addr, i32 0, i32 3, i32 0)

  ; CHECK: prfum pstl1strm
  call void @llvm.prefetch(ptr %j.addr, i32 1, i32 0, i32 1)
  ; CHECK: prfum pstl3keep
  call void @llvm.prefetch(ptr %j.addr, i32 1, i32 1, i32 1)
  ; CHECK: prfum pstl2keep
  call void @llvm.prefetch(ptr %j.addr, i32 1, i32 2, i32 1)
  ; CHECK: prfum pstl1keep
  call void @llvm.prefetch(ptr %j.addr, i32 1, i32 3, i32 1)

  %tmp1 = load i32, ptr %j.addr, align 4, !tbaa !0
  %add = add nsw i32 %tmp1, %i
  %idxprom = sext i32 %add to i64
  %tmp2 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx = getelementptr inbounds i32, ptr %tmp2, i64 %idxprom

  ; CHECK: prfm pldl1strm
  call void @llvm.prefetch(ptr %arrayidx, i32 0, i32 0, i32 1)
  %tmp4 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx3 = getelementptr inbounds i32, ptr %tmp4, i64 %idxprom

  ; CHECK: prfm pldl3keep
  call void @llvm.prefetch(ptr %arrayidx3, i32 0, i32 1, i32 1)
  %tmp6 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx6 = getelementptr inbounds i32, ptr %tmp6, i64 %idxprom

  ; CHECK: prfm pldl2keep
  call void @llvm.prefetch(ptr %arrayidx6, i32 0, i32 2, i32 1)
  %tmp8 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx9 = getelementptr inbounds i32, ptr %tmp8, i64 %idxprom

  ; CHECK: prfm pldl1keep
  call void @llvm.prefetch(ptr %arrayidx9, i32 0, i32 3, i32 1)
  %tmp10 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx12 = getelementptr inbounds i32, ptr %tmp10, i64 %idxprom


  ; CHECK: prfm plil1strm
  call void @llvm.prefetch(ptr %arrayidx12, i32 0, i32 0, i32 0)
  %tmp12 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx15 = getelementptr inbounds i32, ptr %tmp12, i64 %idxprom

  ; CHECK: prfm plil3keep
  call void @llvm.prefetch(ptr %arrayidx3, i32 0, i32 1, i32 0)
  %tmp14 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx18 = getelementptr inbounds i32, ptr %tmp14, i64 %idxprom

  ; CHECK: prfm plil2keep
  call void @llvm.prefetch(ptr %arrayidx6, i32 0, i32 2, i32 0)
  %tmp16 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx21 = getelementptr inbounds i32, ptr %tmp16, i64 %idxprom

  ; CHECK: prfm plil1keep
  call void @llvm.prefetch(ptr %arrayidx9, i32 0, i32 3, i32 0)
  %tmp18 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx24 = getelementptr inbounds i32, ptr %tmp18, i64 %idxprom


  ; CHECK: prfm pstl1strm
  call void @llvm.prefetch(ptr %arrayidx12, i32 1, i32 0, i32 1)
  %tmp20 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx27 = getelementptr inbounds i32, ptr %tmp20, i64 %idxprom

  ; CHECK: prfm pstl3keep
  call void @llvm.prefetch(ptr %arrayidx15, i32 1, i32 1, i32 1)
  %tmp22 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx30 = getelementptr inbounds i32, ptr %tmp22, i64 %idxprom

  ; CHECK: prfm pstl2keep
  call void @llvm.prefetch(ptr %arrayidx18, i32 1, i32 2, i32 1)
  %tmp24 = load ptr, ptr @a, align 8, !tbaa !3
  %arrayidx33 = getelementptr inbounds i32, ptr %tmp24, i64 %idxprom

  ; CHECK: prfm pstl1keep
  call void @llvm.prefetch(ptr %arrayidx21, i32 1, i32 3, i32 1)
  ret void
}

declare void @llvm.prefetch(ptr nocapture, i32, i32, i32) nounwind

!0 = !{!"int", !1}
!1 = !{!"omnipotent char", !2}
!2 = !{!"Simple C/C++ TBAA"}
!3 = !{!"any pointer", !1}