1 ; RUN: not llc -mtriple=amdgcn-- < %s 2>&1 | FileCheck -check-prefix=ERROR %s
2 ; RUN: not llc -mtriple=amdgcn-- < %s | FileCheck -check-prefix=GCN %s
; Declaration of the memset intrinsic variant that takes an addrspace(5)
; destination pointer and a 32-bit length. The kernels in this file call it to
; fill their stack allocations.
; NOTE(review): the five-operand form (ptr, i8, i32, i32, i1) looks like the
; legacy signature with an explicit alignment operand before the final i1 flag
; -- confirm against the LangRef before changing the operand list.
4 declare void @llvm.memset.p5.i32(ptr addrspace(5) nocapture, i8, i32, i32, i1) #1
; Over-limit case using attribute group #0.
; The kernel allocates a 131057-element i8 array in addrspace(5) with align 1
; and passes it to the memset intrinsic with fill value 9 and length 131057.
; The first check line below expects the diagnostic for a 131061-byte stack
; frame against a limit of 131056; the second expects the emitted assembly to
; report a scratch size of 131061.
; NOTE(review): the expected frame size is 4 bytes larger than the alloca; the
; origin of those extra bytes is not visible in this test -- confirm before
; changing the array length or the expected numbers.
6 ; ERROR: error: <unknown>:0:0: stack frame size (131061) exceeds limit (131056) in function 'stack_size_limit_wave64'
7 ; GCN: ; ScratchSize: 131061
8 define amdgpu_kernel void @stack_size_limit_wave64() #0 {
10 %alloca = alloca [131057 x i8], align 1, addrspace(5)
11 call void @llvm.memset.p5.i32(ptr addrspace(5) %alloca, i8 9, i32 131057, i32 1, i1 true)
; Over-limit case using attribute group #1.
; The kernel allocates a 262113-element i8 array in addrspace(5) with align 1
; and passes it to the memset intrinsic with fill value 9 and length 262113.
; The first check line below expects the diagnostic for a 262117-byte stack
; frame against a limit of 262112; the second expects the emitted assembly to
; report a scratch size of 262117.
; NOTE(review): the expected frame size is 4 bytes larger than the alloca; the
; origin of those extra bytes is not visible in this test -- confirm before
; changing the array length or the expected numbers.
15 ; ERROR: error: <unknown>:0:0: stack frame size (262117) exceeds limit (262112) in function 'stack_size_limit_wave32'
16 ; GCN: ; ScratchSize: 262117
17 define amdgpu_kernel void @stack_size_limit_wave32() #1 {
19 %alloca = alloca [262113 x i8], align 1, addrspace(5)
20 call void @llvm.memset.p5.i32(ptr addrspace(5) %alloca, i8 9, i32 262113, i32 1, i1 true)
; At-limit case using attribute group #0.
; The kernel allocates a 131052-element i8 array in addrspace(5) with align 1
; and passes it to the memset intrinsic with fill value 9 and length 131052.
; Only an assembly-output check is attached: the scratch size is expected to be
; 131056, which equals the limit quoted in the diagnostic expected for
; stack_size_limit_wave64. No diagnostic check is attached to this kernel.
; NOTE(review): the expected scratch size is 4 bytes larger than the alloca;
; the origin of those extra bytes is not visible in this test -- confirm before
; changing the array length.
25 ; GCN: ; ScratchSize: 131056
26 define amdgpu_kernel void @max_stack_size_wave64() #0 {
28 %alloca = alloca [131052 x i8], align 1, addrspace(5)
29 call void @llvm.memset.p5.i32(ptr addrspace(5) %alloca, i8 9, i32 131052, i32 1, i1 true)
; At-limit case using attribute group #1.
; The kernel allocates a 262108-element i8 array in addrspace(5) with align 1
; and passes it to the memset intrinsic with fill value 9 and length 262108.
; Only an assembly-output check is attached: the scratch size is expected to be
; 262112, which equals the limit quoted in the diagnostic expected for
; stack_size_limit_wave32. No diagnostic check is attached to this kernel.
; NOTE(review): the expected scratch size is 4 bytes larger than the alloca;
; the origin of those extra bytes is not visible in this test -- confirm before
; changing the array length.
34 ; GCN: ; ScratchSize: 262112
35 define amdgpu_kernel void @max_stack_size_wave32() #1 {
37 %alloca = alloca [262108 x i8], align 1, addrspace(5)
38 call void @llvm.memset.p5.i32(ptr addrspace(5) %alloca, i8 9, i32 262108, i32 1, i1 true)
; Attribute groups that pick the target CPU for each kernel:
;   #0 -> gfx900, attached to the *_wave64 kernels
;   #1 -> gfx1010, attached to the *_wave32 kernels (and to the memset
;         declaration)
; NOTE(review): the kernel names suggest these CPUs were chosen for their
; default wavefront size (64 vs 32) -- confirm against the AMDGPU target docs.
42 attributes #0 = { "target-cpu" = "gfx900" }
43 attributes #1 = { "target-cpu" = "gfx1010" }