# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
# RUN: llc -mtriple=amdgcn -mcpu=gfx1200 -verify-machineinstrs -run-pass si-insert-waitcnts -o - %s | FileCheck -check-prefix=GFX12 %s

# Check that we correctly track that GLOBAL_INV increases LOAD_cnt.
# We use a straightforward dependency between a GLOBAL_LOAD and an instruction
# that uses its result - the S_WAIT_LOADCNT introduced before the use should
# reflect the fact that there is a GLOBAL_INV between them.
# FIXME: We could get away with a S_WAIT_LOADCNT 1 here.
---
name: waitcnt-global-inv
machineFunctionInfo:
  isEntryFunction: true
body: |
  bb.0:
    liveins: $vgpr0, $vgpr1, $sgpr2_sgpr3

    ; GFX12-LABEL: name: waitcnt-global-inv
    ; GFX12: liveins: $vgpr0, $vgpr1, $sgpr2_sgpr3
    ; GFX12-NEXT: {{ $}}
    ; GFX12-NEXT: renamable $vgpr0 = GLOBAL_LOAD_DWORD_SADDR renamable $sgpr2_sgpr3, killed $vgpr0, 0, 0, implicit $exec :: (load (s32), addrspace 1)
    ; GFX12-NEXT: GLOBAL_INV 16, implicit $exec
    ; GFX12-NEXT: S_WAIT_LOADCNT 0
    ; GFX12-NEXT: $vgpr2 = V_MOV_B32_e32 $vgpr0, implicit $exec, implicit $exec
    renamable $vgpr0 = GLOBAL_LOAD_DWORD_SADDR renamable $sgpr2_sgpr3, killed $vgpr0, 0, 0, implicit $exec :: (load (s32), addrspace 1)
    GLOBAL_INV 16, implicit $exec
    $vgpr2 = V_MOV_B32_e32 $vgpr0, implicit $exec, implicit $exec
...

# TODO: Test for GLOBAL_WB, GLOBAL_WBINV