| ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py |
| ; RUN: llc -global-isel -mattr=+enable-flat-scratch -mtriple=amdgcn-mesa-mesa3d -mcpu=gfx900 < %s | FileCheck -check-prefix=MESA %s |
| ; RUN: llc -global-isel -mattr=+enable-flat-scratch -mtriple=amdgcn-amd-amdpal -mcpu=gfx900 < %s | FileCheck -check-prefix=PAL %s |
| |
| ; Test that the initialization for flat_scratch doesn't crash. PAL |
| ; doesn't add a user SGPR for initializing flat_scratch, mesa does |
| ; (although this probably isn't actually defined). |
| |
| define amdgpu_ps void @amdgpu_ps() { |
| ; MESA-LABEL: amdgpu_ps: |
| ; MESA: ; %bb.0: |
| ; MESA-NEXT: s_add_u32 flat_scratch_lo, s2, s4 |
| ; MESA-NEXT: s_addc_u32 flat_scratch_hi, s3, 0 |
| ; MESA-NEXT: s_mov_b32 s0, 0 |
| ; MESA-NEXT: s_mov_b64 s[2:3], src_private_base |
| ; MESA-NEXT: s_mov_b32 s1, s3 |
| ; MESA-NEXT: v_mov_b32_e32 v0, s0 |
| ; MESA-NEXT: v_mov_b32_e32 v2, 0 |
| ; MESA-NEXT: v_mov_b32_e32 v1, s1 |
| ; MESA-NEXT: flat_store_dword v[0:1], v2 |
| ; MESA-NEXT: s_waitcnt vmcnt(0) |
| ; MESA-NEXT: s_endpgm |
| ; |
| ; PAL-LABEL: amdgpu_ps: |
| ; PAL: ; %bb.0: |
| ; PAL-NEXT: s_getpc_b64 s[2:3] |
| ; PAL-NEXT: s_mov_b32 s2, s0 |
| ; PAL-NEXT: s_load_dwordx2 s[2:3], s[2:3], 0x0 |
| ; PAL-NEXT: v_mov_b32_e32 v2, 0 |
| ; PAL-NEXT: s_waitcnt lgkmcnt(0) |
| ; PAL-NEXT: s_and_b32 s3, s3, 0xffff |
| ; PAL-NEXT: s_add_u32 flat_scratch_lo, s2, s0 |
| ; PAL-NEXT: s_addc_u32 flat_scratch_hi, s3, 0 |
| ; PAL-NEXT: s_mov_b32 s0, 0 |
| ; PAL-NEXT: s_mov_b64 s[2:3], src_private_base |
| ; PAL-NEXT: s_mov_b32 s1, s3 |
| ; PAL-NEXT: v_mov_b32_e32 v0, s0 |
| ; PAL-NEXT: v_mov_b32_e32 v1, s1 |
| ; PAL-NEXT: flat_store_dword v[0:1], v2 |
| ; PAL-NEXT: s_waitcnt vmcnt(0) |
| ; PAL-NEXT: s_endpgm |
| %alloca = alloca i32, addrspace(5) |
| %cast = addrspacecast ptr addrspace(5) %alloca to ptr |
| store volatile i32 0, ptr %cast |
| ret void |
| } |
| |