# llvm/llvm/test/CodeGen/AMDGPU/waitcnt-permute.mir

# RUN: llc -mtriple=amdgcn -mcpu=fiji -verify-machineinstrs -run-pass si-insert-waitcnts -o - %s | FileCheck %s

...
# CHECK-LABEL: name: waitcnt-permute{{$}}
# CHECK: DS_BPERMUTE_B32
# CHECK-NEXT: S_WAITCNT 127

# Machine function under test. The value produced by DS_BPERMUTE_B32 is read by
# the instruction that immediately follows it, and the FileCheck directives
# above expect an S_WAITCNT to appear directly after the permute in the output
# of the si-insert-waitcnts pass.
# NOTE(review): the expected operand 127 presumably encodes "lgkmcnt(0)" with
# the other counters left at their no-wait maximum on this target -- confirm
# against the S_WAITCNT encoding for the selected -mcpu.
name:            waitcnt-permute
# Registers declared live on entry to the function.
liveins:
  - { reg: '$vgpr0' }
  - { reg: '$vgpr1' }
  - { reg: '$sgpr30_sgpr31' }
body:             |
  bb.0:
    liveins: $vgpr0, $vgpr1, $sgpr30_sgpr31

    ; The permute overwrites $vgpr0; both register sources are killed here.
    $vgpr0 = DS_BPERMUTE_B32 killed $vgpr0, killed $vgpr1, 0, implicit $exec
    ; Reads the $vgpr0 written by the permute above. The immediate 1065353216
    ; is 0x3F800000, the IEEE-754 single-precision bit pattern of 1.0.
    $vgpr0 = V_ADD_F32_e32 1065353216, killed $vgpr0, implicit $mode, implicit $exec
    ; Return through the address in $sgpr30_sgpr31; $vgpr0 is carried as an
    ; implicit use on the return instruction.
    S_SETPC_B64_return killed $sgpr30_sgpr31, implicit killed $vgpr0

...