llvm/test/CodeGen/AMDGPU/GlobalISel/flat-scratch-init.gfx.ll

   1 ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
   2 ; RUN: llc -global-isel -mattr=+enable-flat-scratch -mtriple=amdgcn-mesa-mesa3d -mcpu=gfx900 < %s | FileCheck -check-prefix=MESA %s
   3 ; RUN: llc -global-isel -mattr=+enable-flat-scratch -mtriple=amdgcn-amd-amdpal -mcpu=gfx900 < %s | FileCheck -check-prefix=PAL %s
   4
   5 ; Test that the initialization for flat_scratch doesn't crash.  PAL
   6 ; doesn't add a user SGPR for initializing flat_scratch; Mesa does
   7 ; (although this probably isn't actually defined).
   8
   9 define amdgpu_ps void @amdgpu_ps() {
  10 ; MESA-LABEL: amdgpu_ps:
  11 ; MESA:       ; %bb.0:
  12 ; MESA-NEXT:    s_add_u32 flat_scratch_lo, s2, s4
  13 ; MESA-NEXT:    s_mov_b64 s[0:1], src_private_base
  14 ; MESA-NEXT:    s_addc_u32 flat_scratch_hi, s3, 0
  15 ; MESA-NEXT:    v_mov_b32_e32 v0, 4
  16 ; MESA-NEXT:    v_mov_b32_e32 v1, s1
  17 ; MESA-NEXT:    v_mov_b32_e32 v2, 0
  18 ; MESA-NEXT:    flat_store_dword v[0:1], v2
  19 ; MESA-NEXT:    s_waitcnt vmcnt(0)
  20 ; MESA-NEXT:    s_endpgm
  21 ;
  22 ; PAL-LABEL: amdgpu_ps:
  23 ; PAL:       ; %bb.0:
  24 ; PAL-NEXT:    s_getpc_b64 s[2:3]
  25 ; PAL-NEXT:    s_mov_b32 s2, s0
  26 ; PAL-NEXT:    s_load_dwordx2 s[2:3], s[2:3], 0x0
  27 ; PAL-NEXT:    v_mov_b32_e32 v0, 4
  28 ; PAL-NEXT:    v_mov_b32_e32 v2, 0
  29 ; PAL-NEXT:    s_waitcnt lgkmcnt(0)
  30 ; PAL-NEXT:    s_and_b32 s3, s3, 0xffff
  31 ; PAL-NEXT:    s_add_u32 flat_scratch_lo, s2, s0
  32 ; PAL-NEXT:    s_mov_b64 s[0:1], src_private_base
  33 ; PAL-NEXT:    s_addc_u32 flat_scratch_hi, s3, 0
  34 ; PAL-NEXT:    v_mov_b32_e32 v1, s1
  35 ; PAL-NEXT:    flat_store_dword v[0:1], v2
  36 ; PAL-NEXT:    s_waitcnt vmcnt(0)
  37 ; PAL-NEXT:    s_endpgm
  38   %alloca = alloca i32, addrspace(5) ; i32 stack slot allocated in addrspace(5)
  39   %cast = addrspacecast ptr addrspace(5) %alloca to ptr ; cast to a pointer with no explicit address space
  40   store volatile i32 0, ptr %cast ; volatile store of 0 via the cast pointer; the assertions above expect flat_store_dword
  41   ret void
  42 }
  43