1 // RUN
: llvm-mc
-triple amdgcn-
-amdhsa
-mcpu
=gfx1010
--amdhsa-code-object-version
=2 -mattr
=-wavefrontsize32
,+wavefrontsize64
-show-encoding
%s | FileCheck
%s
--check-prefix
=ASM
2 // RUN
: llvm-mc
-filetype
=obj
-triple amdgcn-
-amdhsa
-mcpu
=gfx1010
--amdhsa-code-object-version
=2 -mattr
=-wavefrontsize32
,+wavefrontsize64
-show-encoding
%s | llvm-readobj
-S
--sd
--syms
- | FileCheck
%s
--check-prefix
=ELF
6 // ELF
: Type
: SHT_PROGBITS
(0x1)
8 // ELF
: SHF_ALLOC
(0x2)
9 // ELF
: SHF_EXECINSTR
(0x4)
12 // ELF
: 0000: 04000000 08000000 01000000 414D4400
13 // ELF
: 0010: 02000000 00000000 04000000 1B000000
14 // ELF
: 0020: 03000000 414D4400
04000700 07000000
15 // ELF
: 0030: 00000000 00000000 414D4400
414D4447
16 // ELF
: 0040: 50550000
17 // We can
't check binary representation of metadata note: it is different on
18 // Windows and Linux because of carriage return on Windows
21 // ELF: Name: amd_kernel_code_t_test_all
22 // ELF: Type: AMDGPU_HSA_KERNEL (0xA)
23 // ELF: Section: .text
26 // ELF: Name: amd_kernel_code_t_minimal
27 // ELF: Type: AMDGPU_HSA_KERNEL (0xA)
28 // ELF: Section: .text
34 .hsa_code_object_version 2,0
35 // ASM: .hsa_code_object_version 2,0
37 .hsa_code_object_isa 7,0,0,"AMD","AMDGPU"
38 // ASM: .hsa_code_object_isa 7,0,0,"AMD","AMDGPU"
40 .amd_amdgpu_hsa_metadata
43 - Name: amd_kernel_code_t_test_all
44 SymbolName: amd_kernel_code_t_test_all@kd
45 - Name: amd_kernel_code_t_minimal
46 SymbolName: amd_kernel_code_t_minimal@kd
47 .end_amd_amdgpu_hsa_metadata
49 // ASM: .amd_amdgpu_hsa_metadata
50 // ASM: Version: [ 3, 0 ]
52 // ASM: - Name: amd_kernel_code_t_test_all
53 // ASM: SymbolName: 'amd_kernel_code_t_test_all@kd
'
54 // ASM: - Name: amd_kernel_code_t_minimal
55 // ASM: SymbolName: 'amd_kernel_code_t_minimal@kd
'
56 // ASM: .end_amd_amdgpu_hsa_metadata
58 .amdgpu_hsa_kernel amd_kernel_code_t_test_all
59 .amdgpu_hsa_kernel amd_kernel_code_t_minimal
61 amd_kernel_code_t_test_all:
62 ; Test all amd_kernel_code_t members with non-default values.
64 kernel_code_version_major = 100
65 kernel_code_version_minor = 100
67 machine_version_major = 5
68 machine_version_minor = 5
69 machine_version_stepping = 5
70 kernel_code_entry_byte_offset = 512
71 kernel_code_prefetch_byte_size = 1
72 max_scratch_backing_memory_byte_size = 1
73 compute_pgm_rsrc1_vgprs = 1
74 compute_pgm_rsrc1_sgprs = 1
75 compute_pgm_rsrc1_priority = 1
76 compute_pgm_rsrc1_float_mode = 1
77 compute_pgm_rsrc1_priv = 1
78 compute_pgm_rsrc1_dx10_clamp = 1
79 compute_pgm_rsrc1_debug_mode = 1
80 compute_pgm_rsrc1_ieee_mode = 1
81 compute_pgm_rsrc1_wgp_mode = 0
82 compute_pgm_rsrc1_mem_ordered = 0
83 compute_pgm_rsrc1_fwd_progress = 1
84 compute_pgm_rsrc2_scratch_en = 1
85 compute_pgm_rsrc2_user_sgpr = 1
86 compute_pgm_rsrc2_tgid_x_en = 1
87 compute_pgm_rsrc2_tgid_y_en = 1
88 compute_pgm_rsrc2_tgid_z_en = 1
89 compute_pgm_rsrc2_tg_size_en = 1
90 compute_pgm_rsrc2_tidig_comp_cnt = 1
91 compute_pgm_rsrc2_excp_en_msb = 1
92 compute_pgm_rsrc2_lds_size = 1
93 compute_pgm_rsrc2_excp_en = 1
94 enable_sgpr_private_segment_buffer = 1
95 enable_sgpr_dispatch_ptr = 1
96 enable_sgpr_queue_ptr = 1
97 enable_sgpr_kernarg_segment_ptr = 1
98 enable_sgpr_dispatch_id = 1
99 enable_sgpr_flat_scratch_init = 1
100 enable_sgpr_private_segment_size = 1
101 enable_sgpr_grid_workgroup_count_x = 1
102 enable_sgpr_grid_workgroup_count_y = 1
103 enable_sgpr_grid_workgroup_count_z = 1
104 enable_ordered_append_gds = 1
105 private_element_size = 1
107 is_dynamic_callstack = 1
110 workitem_private_segment_byte_size = 1
111 workgroup_group_segment_byte_size = 1
112 gds_segment_byte_size = 1
113 kernarg_segment_byte_size = 1
114 workgroup_fbarrier_count = 1
115 wavefront_sgpr_count = 1
116 workitem_vgpr_count = 1
117 reserved_vgpr_first = 1
118 reserved_vgpr_count = 1
119 reserved_sgpr_first = 1
120 reserved_sgpr_count = 1
121 debug_wavefront_private_segment_offset_sgpr = 1
122 debug_private_segment_buffer_sgpr = 1
123 kernarg_segment_alignment = 5
124 group_segment_alignment = 5
125 private_segment_alignment = 5
128 runtime_loader_kernel_symbol = 1
129 .end_amd_kernel_code_t
131 // ASM-LABEL: {{^}}amd_kernel_code_t_test_all:
132 // ASM: .amd_kernel_code_t
133 // ASM: amd_code_version_major = 100
134 // ASM: amd_code_version_minor = 100
135 // ASM: amd_machine_kind = 0
136 // ASM: amd_machine_version_major = 5
137 // ASM: amd_machine_version_minor = 5
138 // ASM: amd_machine_version_stepping = 5
139 // ASM: kernel_code_entry_byte_offset = 512
140 // ASM: kernel_code_prefetch_byte_size = 1
141 // ASM: granulated_workitem_vgpr_count = 1
142 // ASM: granulated_wavefront_sgpr_count = 1
144 // ASM: float_mode = 1
146 // ASM: enable_dx10_clamp = 1
147 // ASM: debug_mode = 1
148 // ASM: enable_ieee_mode = 1
149 // ASM: enable_wgp_mode = 0
150 // ASM: enable_mem_ordered = 0
151 // ASM: enable_fwd_progress = 1
152 // ASM: enable_sgpr_private_segment_wave_byte_offset = 1
153 // ASM: user_sgpr_count = 1
154 // ASM: enable_sgpr_workgroup_id_x = 1
155 // ASM: enable_sgpr_workgroup_id_y = 1
156 // ASM: enable_sgpr_workgroup_id_z = 1
157 // ASM: enable_sgpr_workgroup_info = 1
158 // ASM: enable_vgpr_workitem_id = 1
159 // ASM: enable_exception_msb = 1
160 // ASM: granulated_lds_size = 1
161 // ASM: enable_exception = 1
162 // ASM: enable_sgpr_private_segment_buffer = 1
163 // ASM: enable_sgpr_dispatch_ptr = 1
164 // ASM: enable_sgpr_queue_ptr = 1
165 // ASM: enable_sgpr_kernarg_segment_ptr = 1
166 // ASM: enable_sgpr_dispatch_id = 1
167 // ASM: enable_sgpr_flat_scratch_init = 1
168 // ASM: enable_sgpr_private_segment_size = 1
169 // ASM: enable_sgpr_grid_workgroup_count_x = 1
170 // ASM: enable_sgpr_grid_workgroup_count_y = 1
171 // ASM: enable_sgpr_grid_workgroup_count_z = 1
172 // ASM: enable_ordered_append_gds = 1
173 // ASM: private_element_size = 1
175 // ASM: is_dynamic_callstack = 1
176 // ASM: is_debug_enabled = 1
177 // ASM: is_xnack_enabled = 1
178 // ASM: workitem_private_segment_byte_size = 1
179 // ASM: workgroup_group_segment_byte_size = 1
180 // ASM: gds_segment_byte_size = 1
181 // ASM: kernarg_segment_byte_size = 1
182 // ASM: workgroup_fbarrier_count = 1
183 // ASM: wavefront_sgpr_count = 1
184 // ASM: workitem_vgpr_count = 1
185 // ASM: reserved_vgpr_first = 1
186 // ASM: reserved_vgpr_count = 1
187 // ASM: reserved_sgpr_first = 1
188 // ASM: reserved_sgpr_count = 1
189 // ASM: debug_wavefront_private_segment_offset_sgpr = 1
190 // ASM: debug_private_segment_buffer_sgpr = 1
191 // ASM: kernarg_segment_alignment = 5
192 // ASM: group_segment_alignment = 5
193 // ASM: private_segment_alignment = 5
194 // ASM: wavefront_size = 6
195 // ASM: call_convention = 1
196 // ASM: runtime_loader_kernel_symbol = 1
197 // ASM: .end_amd_kernel_code_t
199 amd_kernel_code_t_minimal:
201 enable_sgpr_kernarg_segment_ptr = 1
203 granulated_workitem_vgpr_count = 1
204 granulated_wavefront_sgpr_count = 1
206 kernarg_segment_byte_size = 16
207 wavefront_sgpr_count = 8
208 // wavefront_sgpr_count = 7
209 ; wavefront_sgpr_count = 7
210 // Make sure a blank line won't break anything
:
212 // Make sure
a line with whitespace won
't break anything:
214 workitem_vgpr_count = 16
215 .end_amd_kernel_code_t
217 // ASM-LABEL: {{^}}amd_kernel_code_t_minimal:
218 // ASM: .amd_kernel_code_t
219 // ASM: amd_code_version_major = 1
220 // ASM: amd_code_version_minor = 2
221 // ASM: amd_machine_kind = 1
222 // ASM: amd_machine_version_major = 10
223 // ASM: amd_machine_version_minor = 1
224 // ASM: amd_machine_version_stepping = 0
225 // ASM: kernel_code_entry_byte_offset = 256
226 // ASM: kernel_code_prefetch_byte_size = 0
227 // ASM: granulated_workitem_vgpr_count = 1
228 // ASM: granulated_wavefront_sgpr_count = 1
230 // ASM: float_mode = 0
232 // ASM: enable_dx10_clamp = 0
233 // ASM: debug_mode = 0
234 // ASM: enable_ieee_mode = 0
235 // ASM: enable_wgp_mode = 1
236 // ASM: enable_mem_ordered = 1
237 // ASM: enable_fwd_progress = 0
238 // ASM: enable_sgpr_private_segment_wave_byte_offset = 0
239 // ASM: user_sgpr_count = 2
240 // ASM: enable_sgpr_workgroup_id_x = 0
241 // ASM: enable_sgpr_workgroup_id_y = 0
242 // ASM: enable_sgpr_workgroup_id_z = 0
243 // ASM: enable_sgpr_workgroup_info = 0
244 // ASM: enable_vgpr_workitem_id = 0
245 // ASM: enable_exception_msb = 0
246 // ASM: granulated_lds_size = 0
247 // ASM: enable_exception = 0
248 // ASM: enable_sgpr_private_segment_buffer = 0
249 // ASM: enable_sgpr_dispatch_ptr = 0
250 // ASM: enable_sgpr_queue_ptr = 0
251 // ASM: enable_sgpr_kernarg_segment_ptr = 1
252 // ASM: enable_sgpr_dispatch_id = 0
253 // ASM: enable_sgpr_flat_scratch_init = 0
254 // ASM: enable_sgpr_private_segment_size = 0
255 // ASM: enable_sgpr_grid_workgroup_count_x = 0
256 // ASM: enable_sgpr_grid_workgroup_count_y = 0
257 // ASM: enable_sgpr_grid_workgroup_count_z = 0
258 // ASM: enable_wavefront_size32 = 0
259 // ASM: enable_ordered_append_gds = 0
260 // ASM: private_element_size = 0
262 // ASM: is_dynamic_callstack = 0
263 // ASM: is_debug_enabled = 0
264 // ASM: is_xnack_enabled = 0
265 // ASM: workitem_private_segment_byte_size = 0
266 // ASM: workgroup_group_segment_byte_size = 0
267 // ASM: gds_segment_byte_size = 0
268 // ASM: kernarg_segment_byte_size = 16
269 // ASM: workgroup_fbarrier_count = 0
270 // ASM: wavefront_sgpr_count = 8
271 // ASM: workitem_vgpr_count = 16
272 // ASM: reserved_vgpr_first = 0
273 // ASM: reserved_vgpr_count = 0
274 // ASM: reserved_sgpr_first = 0
275 // ASM: reserved_sgpr_count = 0
276 // ASM: debug_wavefront_private_segment_offset_sgpr = 0
277 // ASM: debug_private_segment_buffer_sgpr = 0
278 // ASM: kernarg_segment_alignment = 4
279 // ASM: group_segment_alignment = 4
280 // ASM: private_segment_alignment = 4
281 // ASM: wavefront_size = 6
282 // ASM: call_convention = -1
283 // ASM: runtime_loader_kernel_symbol = 0
284 // ASM: .end_amd_kernel_code_t