# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
# RUN: llc -mtriple=amdgcn -mcpu=gfx1200 -verify-machineinstrs -run-pass si-insert-waitcnts -o - %s | FileCheck -check-prefix=GFX12 %s
# Check that we correctly track that GLOBAL_INV increases LOAD_cnt.
# We use a straightforward dependency between a GLOBAL_LOAD and an instruction
# that uses its result - the S_WAIT_LOADCNT introduced before the use should
# reflect the fact that there is a GLOBAL_INV between them.
# FIXME: An S_WAIT_LOADCNT 1 should be sufficient here, since only the
# GLOBAL_INV issued after the load would need to remain outstanding.
---
# Entry function containing a global load, a GLOBAL_INV, and then a use of the
# loaded register; si-insert-waitcnts must place a wait before that use.
name: waitcnt-global-inv
machineFunctionInfo:
  isEntryFunction: true
body: |
  bb.0:
    liveins: $vgpr0, $vgpr1, $sgpr2_sgpr3

    ; Expected output: the pass inserts S_WAIT_LOADCNT after the GLOBAL_INV and
    ; directly before the first instruction that reads the loaded $vgpr0.
    ; GFX12-LABEL: name: waitcnt-global-inv
    ; GFX12: liveins: $vgpr0, $vgpr1, $sgpr2_sgpr3
    ; GFX12-NEXT: {{ $}}
    ; GFX12-NEXT: renamable $vgpr0 = GLOBAL_LOAD_DWORD_SADDR renamable $sgpr2_sgpr3, killed $vgpr0, 0, 0, implicit $exec :: (load (s32), addrspace 1)
    ; GFX12-NEXT: GLOBAL_INV 16, implicit $exec
    ; GFX12-NEXT: S_WAIT_LOADCNT 0
    ; GFX12-NEXT: $vgpr2 = V_MOV_B32_e32 $vgpr0, implicit $exec

    ; Load whose result ($vgpr0) is consumed below.
    renamable $vgpr0 = GLOBAL_LOAD_DWORD_SADDR renamable $sgpr2_sgpr3, killed $vgpr0, 0, 0, implicit $exec :: (load (s32), addrspace 1)
    ; Intervening GLOBAL_INV between the load and the use of its result.
    GLOBAL_INV 16, implicit $exec
    ; First use of the loaded value; the wait must precede this instruction.
    $vgpr2 = V_MOV_B32_e32 $vgpr0, implicit $exec
...
# TODO: Add equivalent tests for GLOBAL_WB and GLOBAL_WBINV.