forked from OSchip/llvm-project
44 lines
1.7 KiB
LLVM
44 lines
1.7 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -global-isel -mattr=+enable-flat-scratch -mtriple=amdgcn-mesa-mesa3d -mcpu=gfx900 < %s | FileCheck -check-prefix=MESA %s
; RUN: llc -global-isel -mattr=+enable-flat-scratch -mtriple=amdgcn-amd-amdpal -mcpu=gfx900 < %s | FileCheck -check-prefix=PAL %s

; Test that the initialization for flat_scratch doesn't crash. PAL
; doesn't add a user SGPR for initializing flat_scratch, mesa does
; (although this probably isn't actually defined).

; Pixel-shader entry point (amdgpu_ps calling convention) that performs one
; volatile store through a generic pointer derived from a private alloca.
;
; The expected output for both check prefixes writes flat_scratch_lo and
; flat_scratch_hi before the flat_store_dword:
;   - the mesa3d expectations add s4 to the pair s[2:3];
;   - the amdpal expectations first load a 64-bit value (s_getpc_b64 with the
;     low half replaced by s0), mask s3 with 0xffff, and then add s0.
;
; The assertion lines below are autogenerated; regenerate them with
; utils/update_llc_test_checks.py instead of editing them by hand.
define amdgpu_ps void @amdgpu_ps() {
; MESA-LABEL: amdgpu_ps:
; MESA:       ; %bb.0:
; MESA-NEXT:    s_add_u32 flat_scratch_lo, s2, s4
; MESA-NEXT:    s_mov_b64 s[0:1], src_private_base
; MESA-NEXT:    s_addc_u32 flat_scratch_hi, s3, 0
; MESA-NEXT:    v_mov_b32_e32 v0, 4
; MESA-NEXT:    v_mov_b32_e32 v1, s1
; MESA-NEXT:    v_mov_b32_e32 v2, 0
; MESA-NEXT:    flat_store_dword v[0:1], v2
; MESA-NEXT:    s_waitcnt vmcnt(0)
; MESA-NEXT:    s_endpgm
;
; PAL-LABEL: amdgpu_ps:
; PAL:       ; %bb.0:
; PAL-NEXT:    s_getpc_b64 s[2:3]
; PAL-NEXT:    s_mov_b32 s2, s0
; PAL-NEXT:    s_load_dwordx2 s[2:3], s[2:3], 0x0
; PAL-NEXT:    v_mov_b32_e32 v0, 4
; PAL-NEXT:    v_mov_b32_e32 v2, 0
; PAL-NEXT:    s_waitcnt lgkmcnt(0)
; PAL-NEXT:    s_and_b32 s3, s3, 0xffff
; PAL-NEXT:    s_add_u32 flat_scratch_lo, s2, s0
; PAL-NEXT:    s_mov_b64 s[0:1], src_private_base
; PAL-NEXT:    s_addc_u32 flat_scratch_hi, s3, 0
; PAL-NEXT:    v_mov_b32_e32 v1, s1
; PAL-NEXT:    flat_store_dword v[0:1], v2
; PAL-NEXT:    s_waitcnt vmcnt(0)
; PAL-NEXT:    s_endpgm
  ; One i32 slot in address space 5 (presumably AMDGPU private/scratch; the
  ; expected code takes the high address half from src_private_base).
  %alloca = alloca i32, addrspace(5)
  ; Cast to a generic pointer so the store is emitted as a flat access
  ; (flat_store_dword in the expected output).
  %cast = addrspacecast ptr addrspace(5) %alloca to ptr
  ; volatile keeps the store from being removed as dead.
  store volatile i32 0, ptr %cast
  ret void
}
|
|
|