43 lines
1.6 KiB
LLVM
43 lines
1.6 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
; RUN: llc -mtriple=amdgcn -mcpu=gfx900 -sgpr-regalloc=fast -vgpr-regalloc=fast -verify-machineinstrs < %s | FileCheck -check-prefix=GCN %s
|
|
|
|
; Make sure there's no verifier error from improperly updated
|
|
; SlotIndexes if regalloc fast is manually used.
|
|
|
|
; External callee for @kernel. Only the declaration is given here (no body),
; so the test exercises a call to a function whose definition is not visible.
declare void @foo()
|
|
|
|
; @kernel: an amdgpu_kernel entry point whose entire IR body is a single call
; to @foo followed by `ret void`.
;
; The assertion lines that follow were autogenerated by
; utils/update_llc_test_checks.py and pin the exact instruction sequence llc
; emits for gfx900 when both -sgpr-regalloc=fast and -vgpr-regalloc=fast are
; passed (see the RUN line). Regenerate them with that script instead of
; editing them by hand; they are matched strictly in order.
define amdgpu_kernel void @kernel() {
|
|
; GCN-LABEL: kernel:
|
|
; GCN: ; %bb.0:
|
|
; GCN-NEXT: s_mov_b32 s36, SCRATCH_RSRC_DWORD0
|
|
; GCN-NEXT: s_mov_b32 s37, SCRATCH_RSRC_DWORD1
|
|
; GCN-NEXT: s_mov_b32 s38, -1
|
|
; GCN-NEXT: s_mov_b32 s39, 0xe00000
|
|
; GCN-NEXT: s_add_u32 s36, s36, s9
|
|
; GCN-NEXT: s_addc_u32 s37, s37, 0
|
|
; GCN-NEXT: s_mov_b32 s14, s8
|
|
; GCN-NEXT: s_add_u32 s8, s2, 36
|
|
; GCN-NEXT: s_addc_u32 s9, s3, 0
|
|
; GCN-NEXT: s_mov_b64 s[10:11], s[4:5]
|
|
; GCN-NEXT: s_mov_b64 s[4:5], s[0:1]
|
|
; GCN-NEXT: s_getpc_b64 s[0:1]
|
|
; GCN-NEXT: s_add_u32 s0, s0, foo@gotpcrel32@lo+4
|
|
; GCN-NEXT: s_addc_u32 s1, s1, foo@gotpcrel32@hi+12
|
|
; GCN-NEXT: s_mov_b32 s13, s7
|
|
; GCN-NEXT: s_mov_b32 s12, s6
|
|
; GCN-NEXT: s_load_dwordx2 s[6:7], s[0:1], 0x0
|
|
; GCN-NEXT: v_lshlrev_b32_e32 v2, 20, v2
|
|
; GCN-NEXT: v_lshlrev_b32_e32 v1, 10, v1
|
|
; GCN-NEXT: s_mov_b64 s[0:1], s[36:37]
|
|
; GCN-NEXT: v_or3_b32 v31, v0, v1, v2
|
|
; GCN-NEXT: s_mov_b64 s[2:3], s[38:39]
|
|
; GCN-NEXT: s_mov_b32 s32, 0
|
|
; GCN-NEXT: s_waitcnt lgkmcnt(0)
|
|
; GCN-NEXT: s_swappc_b64 s[30:31], s[6:7]
|
|
; GCN-NEXT: s_endpgm
|
|
; The only operation in the kernel. In the expected output above, this call
; appears as a PC-relative foo@gotpcrel32 address computation, an
; s_load_dwordx2 of the callee address, and an s_swappc_b64 to it.
call void @foo()
|
|
ret void
|
|
}
|
|
|
|
; Module flags: a single entry, !0, which sets "amdgpu_code_object_version"
; to 500 for this test module.
; NOTE(review): 500 presumably selects AMDGPU code object v5, and the leading
; `i32 1` is presumably the module-flag merge behavior -- confirm both against
; the LLVM LangRef / AMDGPU usage documentation.
!llvm.module.flags = !{!0}
|
|
!0 = !{i32 1, !"amdgpu_code_object_version", i32 500}
|