1 ; RUN: llc -mtriple=amdgcn--amdpal -mcpu=gfx1100 <%s | FileCheck %s
3 ; CHECK-LABEL: {{^}}_amdgpu_cs_main:
6 ; CHECK: .amdgpu_pal_metadata
8 ; CHECK-NEXT: amdpal.pipelines:
9 ; CHECK-NEXT: - .api: Vulkan
10 ; CHECK-NEXT: .compute_registers:
11 ; CHECK-NEXT: .tg_size_en: true
12 ; CHECK-NEXT: .tgid_x_en: false
13 ; CHECK-NEXT: .tgid_y_en: false
14 ; CHECK-NEXT: .tgid_z_en: false
15 ; CHECK-NEXT: .tidig_comp_cnt: 0x1
16 ; CHECK-NEXT: .graphics_registers:
17 ; CHECK-NEXT: .ps_extra_lds_size: 0
18 ; CHECK-NEXT: .spi_ps_input_addr:
19 ; CHECK-NEXT: .ancillary_ena: false
20 ; CHECK-NEXT: .front_face_ena: true
21 ; CHECK-NEXT: .line_stipple_tex_ena: false
22 ; CHECK-NEXT: .linear_center_ena: true
23 ; CHECK-NEXT: .linear_centroid_ena: true
24 ; CHECK-NEXT: .linear_sample_ena: true
25 ; CHECK-NEXT: .persp_center_ena: true
26 ; CHECK-NEXT: .persp_centroid_ena: true
27 ; CHECK-NEXT: .persp_pull_model_ena: false
28 ; CHECK-NEXT: .persp_sample_ena: true
29 ; CHECK-NEXT: .pos_fixed_pt_ena: true
30 ; CHECK-NEXT: .pos_w_float_ena: false
31 ; CHECK-NEXT: .pos_x_float_ena: false
32 ; CHECK-NEXT: .pos_y_float_ena: false
33 ; CHECK-NEXT: .pos_z_float_ena: false
34 ; CHECK-NEXT: .sample_coverage_ena: false
35 ; CHECK-NEXT: .spi_ps_input_ena:
36 ; CHECK-NEXT: .ancillary_ena: false
37 ; CHECK-NEXT: .front_face_ena: false
38 ; CHECK-NEXT: .line_stipple_tex_ena: false
39 ; CHECK-NEXT: .linear_center_ena: false
40 ; CHECK-NEXT: .linear_centroid_ena: false
41 ; CHECK-NEXT: .linear_sample_ena: false
42 ; CHECK-NEXT: .persp_center_ena: false
43 ; CHECK-NEXT: .persp_centroid_ena: false
44 ; CHECK-NEXT: .persp_pull_model_ena: false
45 ; CHECK-NEXT: .persp_sample_ena: true
46 ; CHECK-NEXT: .pos_fixed_pt_ena: false
47 ; CHECK-NEXT: .pos_w_float_ena: false
48 ; CHECK-NEXT: .pos_x_float_ena: false
49 ; CHECK-NEXT: .pos_y_float_ena: false
50 ; CHECK-NEXT: .pos_z_float_ena: false
51 ; CHECK-NEXT: .sample_coverage_ena: false
52 ; CHECK-NEXT: .hardware_stages:
54 ; CHECK-NEXT: .checksum_value: 0x9444d7d0
55 ; CHECK-NEXT: .debug_mode: false
56 ; CHECK-NEXT: .entry_point: _amdgpu_cs_main
57 ; CHECK-NEXT: .excp_en: 0
58 ; CHECK-NEXT: .float_mode: 0xc0
59 ; CHECK-NEXT: .ieee_mode: false
60 ; CHECK-NEXT: .image_op: false
61 ; CHECK-NEXT: .lds_size: 0
62 ; CHECK-NEXT: .mem_ordered: true
63 ; CHECK-NEXT: .scratch_en: false
64 ; CHECK-NEXT: .scratch_memory_size: 0
65 ; CHECK-NEXT: .sgpr_count: 0x4
66 ; CHECK-NEXT: .sgpr_limit: 0x6a
67 ; CHECK-NEXT: .threadgroup_dimensions:
71 ; CHECK-NEXT: .trap_present: false
72 ; CHECK-NEXT: .user_data_reg_map:
73 ; CHECK-NEXT: - 0x10000000
74 ; CHECK-NEXT: - 0xffffffff
76 ; CHECK-NEXT: - 0xffffffff
77 ; CHECK-NEXT: - 0xffffffff
78 ; CHECK-NEXT: - 0xffffffff
79 ; CHECK-NEXT: - 0xffffffff
80 ; CHECK-NEXT: - 0xffffffff
81 ; CHECK-NEXT: - 0xffffffff
82 ; CHECK-NEXT: - 0xffffffff
83 ; CHECK-NEXT: - 0xffffffff
84 ; CHECK-NEXT: - 0xffffffff
85 ; CHECK-NEXT: - 0xffffffff
86 ; CHECK-NEXT: - 0xffffffff
87 ; CHECK-NEXT: - 0xffffffff
88 ; CHECK-NEXT: - 0xffffffff
89 ; CHECK-NEXT: - 0xffffffff
90 ; CHECK-NEXT: - 0xffffffff
91 ; CHECK-NEXT: - 0xffffffff
92 ; CHECK-NEXT: - 0xffffffff
93 ; CHECK-NEXT: - 0xffffffff
94 ; CHECK-NEXT: - 0xffffffff
95 ; CHECK-NEXT: - 0xffffffff
96 ; CHECK-NEXT: - 0xffffffff
97 ; CHECK-NEXT: - 0xffffffff
98 ; CHECK-NEXT: - 0xffffffff
99 ; CHECK-NEXT: - 0xffffffff
100 ; CHECK-NEXT: - 0xffffffff
101 ; CHECK-NEXT: - 0xffffffff
102 ; CHECK-NEXT: - 0xffffffff
103 ; CHECK-NEXT: - 0xffffffff
104 ; CHECK-NEXT: - 0xffffffff
105 ; CHECK-NEXT: .user_sgprs: 0x3
106 ; CHECK-NEXT: .vgpr_count: 0x2
107 ; CHECK-NEXT: .vgpr_limit: 0x100
108 ; CHECK-NEXT: .wavefront_size: 0x40
109 ; CHECK-NEXT: .wgp_mode: false
111 ; CHECK-NEXT: .debug_mode: false
112 ; CHECK-NEXT: .entry_point: ps_shader
113 ; CHECK-NEXT: .ieee_mode: false
114 ; CHECK-NEXT: .mem_ordered: true
115 ; CHECK-NEXT: .scratch_en: false
116 ; CHECK-NEXT: .scratch_memory_size: 0
117 ; CHECK-NEXT: .sgpr_count: 0x1
118 ; CHECK-NEXT: .vgpr_count: 0x1
119 ; CHECK-NEXT: .wgp_mode: true
120 ; CHECK: .registers: {}
121 ; CHECK:amdpal.version:
125 ; CHECK-NEXT: .end_amdgpu_pal_metadata
127 define dllexport amdgpu_cs void @_amdgpu_cs_main(i32 inreg %arg1, i32 %arg2) #0 !lgc.shaderstage !1 {
129 %i = call i64 @llvm.amdgcn.s.getpc()
130 %i1 = and i64 %i, -4294967296
131 %i2 = zext i32 %arg1 to i64
132 %i3 = or i64 %i1, %i2
133 %i4 = inttoptr i64 %i3 to ptr addrspace(4)
134 %i5 = and i32 %arg2, 1023
135 %i6 = lshr i32 %arg2, 10
136 %i7 = and i32 %i6, 1023
137 %i8 = add nuw nsw i32 %i7, %i5
138 %i9 = load <4 x i32>, ptr addrspace(4) %i4, align 16
139 %.idx = shl nuw nsw i32 %i8, 2
140 call void @llvm.amdgcn.raw.buffer.store.i32(i32 1, <4 x i32> %i9, i32 %.idx, i32 0, i32 0)
144 define dllexport amdgpu_ps void @ps_shader() #1 {
148 !amdgpu.pal.metadata.msgpack = !{!0}
150 ; Function Attrs: nounwind willreturn memory(none)
151 declare ptr addrspace(7) @lgc.buffer.desc.to.ptr(<4 x i32>) #1
153 ; Function Attrs: nocallback nofree nosync nounwind speculatable willreturn memory(none)
154 declare i64 @llvm.amdgcn.s.getpc() #2
156 ; Function Attrs: nocallback nofree nosync nounwind willreturn memory(write)
157 declare void @llvm.amdgcn.raw.buffer.store.i32(i32, <4 x i32>, i32, i32, i32 immarg) #3
159 attributes #0 = { nounwind memory(readwrite) "amdgpu-flat-work-group-size"="1024,1024" "amdgpu-memory-bound"="false" "amdgpu-unroll-threshold"="700" "amdgpu-wave-limiter"="false" "amdgpu-work-group-info-arg-no"="4" "denormal-fp-math-f32"="preserve-sign" "target-features"=",+wavefrontsize64,+cumode" }
161 attributes #1 = { nounwind memory(readwrite) "InitialPSInputAddr"="36983" }
163 !0 = !{!"\82\B0amdpal.pipelines\91\8A\A4.api\A6Vulkan\B2.compute_registers\85\AB.tg_size_en\C3\AA.tgid_x_en\C2\AA.tgid_y_en\C2\AA.tgid_z_en\C2\AF.tidig_comp_cnt\01\B0.hardware_stages\81\A3.cs\8C\AF.checksum_value\CE\94D\D7\D0\AB.debug_mode\00\AB.float_mode\CC\C0\A9.image_op\C2\AC.mem_ordered\C3\AB.sgpr_limitj\B7.threadgroup_dimensions\93\01\CD\04\00\01\AD.trap_present\00\B2.user_data_reg_map\DC\00 \CE\10\00\00\00\CE\FF\FF\FF\FF\00\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\CE\FF\FF\FF\FF\AB.user_sgprs\03\AB.vgpr_limit\CD\01\00\AF.wavefront_size@\B7.internal_pipeline_hash\92\CF\E7\10k\A6:\A6%\F7\CF\B2\1F\1A\D4{\DA\E1T\AA.registers\80\A8.shaders\81\A8.compute\82\B0.api_shader_hash\92\CF\E9Zn7}\1E\B9\E7\00\B1.hardware_mapping\91\A3.cs\B0.spill_threshold\CE\FF\FF\FF\FF\A5.type\A2Cs\B0.user_data_limit\01\AF.xgl_cache_info\82\B3.128_bit_cache_hash\92\CF\B4X\B8\11[\A4\88P\CF\A0;\B0\AF\FF\B4\BE\C0\AD.llpc_version\A461.1\AEamdpal.version\92\03\00"}