1 // REQUIRES
: amdgpu-registered-target
2 // RUN
: %clang_cc1 -triple amdgcn-unknown-unknown -S -emit-llvm -o - %s | FileCheck %s
3 // RUN
: %clang_cc1 -triple r600-unknown-unknown -S -emit-llvm -o - %s | FileCheck %s
5 typedef __attribute__
(( ext_vector_type
(2) )) char char2
;
6 typedef __attribute__
(( ext_vector_type
(3) )) char char3
;
7 typedef __attribute__
(( ext_vector_type
(4) )) char char4
;
9 typedef __attribute__
(( ext_vector_type
(2) )) short short2
;
10 typedef __attribute__
(( ext_vector_type
(3) )) short short3
;
11 typedef __attribute__
(( ext_vector_type
(4) )) short short4
;
13 typedef __attribute__
(( ext_vector_type
(2) )) int int2
;
14 typedef __attribute__
(( ext_vector_type
(3) )) int int3
;
15 typedef __attribute__
(( ext_vector_type
(4) )) int int4
;
16 typedef __attribute__
(( ext_vector_type
(16) )) int int16
;
17 typedef __attribute__
(( ext_vector_type
(32) )) int int32
;
19 // CHECK
: %struct.empty_struct
= type
{}
20 typedef struct empty_struct
24 // CHECK-NOT
: %struct.single_element_struct_arg
25 typedef struct single_element_struct_arg
28 } single_element_struct_arg_t
;
30 // CHECK-NOT
: %struct.nested_single_element_struct_arg
31 typedef struct nested_single_element_struct_arg
33 single_element_struct_arg_t i
;
34 } nested_single_element_struct_arg_t
;
36 // CHECK
: %struct.struct_arg
= type
{ i32
, float
, i32
}
37 typedef struct struct_arg
44 // CHECK
: %struct.struct_padding_arg
= type
{ i8
, i64
}
45 typedef struct struct_padding_arg
51 // CHECK
: %struct.struct_of_arrays_arg
= type
{ [2 x i32
], float
, [4 x i32
], [3 x float
], i32
}
52 typedef struct struct_of_arrays_arg
59 } struct_of_arrays_arg_t;
61 // CHECK: %struct.struct_of_structs_arg = type { i32, float, %struct.struct_arg, i32 }
62 typedef struct struct_of_structs_arg
68 } struct_of_structs_arg_t;
74 } transparent_u __attribute__((__transparent_union__));
76 // CHECK: %struct.single_array_element_struct_arg = type { [4 x i32] }
77 typedef struct single_array_element_struct_arg
80 } single_array_element_struct_arg_t;
82 // CHECK: %struct.single_struct_element_struct_arg = type { %struct.inner }
83 // CHECK: %struct.inner = type { i32, i64 }
84 typedef struct single_struct_element_struct_arg
90 } single_struct_element_struct_arg_t;
92 // CHECK: %struct.different_size_type_pair
93 typedef struct different_size_type_pair {
96 } different_size_type_pair;
98 // CHECK: %struct.flexible_array = type { i32, [0 x i32] }
99 typedef struct flexible_array
105 // CHECK: %struct.struct_arr16 = type { [16 x i32] }
106 typedef struct struct_arr16
111 // CHECK: %struct.struct_arr32 = type { [32 x i32] }
112 typedef struct struct_arr32
117 // CHECK: %struct.struct_arr33 = type { [33 x i32] }
118 typedef struct struct_arr33
123 // CHECK: %struct.struct_char_arr32 = type { [32 x i8] }
124 typedef struct struct_char_arr32
129 // CHECK-NOT: %struct.struct_char_x8
130 typedef struct struct_char_x8 {
135 // CHECK-NOT: %struct.struct_char_x4
136 typedef struct struct_char_x4 {
140 // CHECK-NOT: %struct.struct_char_x3
141 typedef struct struct_char_x3 {
145 // CHECK-NOT: %struct.struct_char_x2
146 typedef struct struct_char_x2 {
150 // CHECK-NOT: %struct.struct_char_x1
151 typedef struct struct_char_x1 {
155 // 4 registers from fields, 5 if padding included.
156 // CHECK: %struct.nested = type { i8, i64 }
157 // CHECK: %struct.num_regs_nested_struct = type { i32, %struct.nested }
158 typedef struct num_regs_nested_struct {
164 } num_regs_nested_struct;
166 // CHECK: %struct.double_nested = type { %struct.inner_inner }
167 // CHECK: %struct.inner_inner = type { i8, i32, i8 }
168 // CHECK: %struct.double_nested_struct = type { i32, %struct.double_nested, i16 }
169 typedef struct double_nested_struct {
171 struct double_nested {
180 } double_nested_struct;
182 // This is a large struct, but uses fewer registers than the limit.
183 // CHECK: %struct.large_struct_padding = type { i8, i32, i8, i32, i8, i8, i16, i16, [3 x i8], i64, i32, i8, i32, i16, i8 }
184 typedef struct large_struct_padding {
200 } large_struct_padding;
202 // The number of registers computed should be 6, not 8.
203 typedef struct int3_pair {
208 // CHECK: %struct.struct_4regs = type { i32, i32, i32, i32 }
209 typedef struct struct_4regs
217 // CHECK: void @kernel_empty_struct_arg(%struct.empty_struct %s.coerce)
218 __kernel void kernel_empty_struct_arg(empty_struct s) { }
220 // CHECK: void @kernel_single_element_struct_arg(i32 %arg1.coerce)
221 __kernel void kernel_single_element_struct_arg(single_element_struct_arg_t arg1) { }
223 // CHECK: void @kernel_nested_single_element_struct_arg(i32 %arg1.coerce)
224 __kernel void kernel_nested_single_element_struct_arg(nested_single_element_struct_arg_t arg1) { }
226 // CHECK: void @kernel_struct_arg(%struct.struct_arg %arg1.coerce)
227 __kernel void kernel_struct_arg(struct_arg_t arg1) { }
229 // CHECK: void @kernel_struct_padding_arg(%struct.struct_padding_arg %arg1.coerce)
230 __kernel void kernel_struct_padding_arg(struct_padding_arg arg1) { }
232 // CHECK: void @kernel_test_struct_of_arrays_arg(%struct.struct_of_arrays_arg %arg1.coerce)
233 __kernel void kernel_test_struct_of_arrays_arg(struct_of_arrays_arg_t arg1) { }
235 // CHECK: void @kernel_struct_of_structs_arg(%struct.struct_of_structs_arg %arg1.coerce)
236 __kernel void kernel_struct_of_structs_arg(struct_of_structs_arg_t arg1) { }
238 // CHECK: void @test_kernel_transparent_union_arg(i32 %u.coerce)
239 __kernel void test_kernel_transparent_union_arg(transparent_u u) { }
241 // CHECK: void @kernel_single_array_element_struct_arg(%struct.single_array_element_struct_arg %arg1.coerce)
242 __kernel void kernel_single_array_element_struct_arg(single_array_element_struct_arg_t arg1) { }
244 // CHECK: void @kernel_single_struct_element_struct_arg(%struct.single_struct_element_struct_arg %arg1.coerce)
245 __kernel void kernel_single_struct_element_struct_arg(single_struct_element_struct_arg_t arg1) { }
247 // CHECK: void @kernel_different_size_type_pair_arg(%struct.different_size_type_pair %arg1.coerce)
248 __kernel void kernel_different_size_type_pair_arg(different_size_type_pair arg1) { }
250 // CHECK: define{{.*}} void @func_f32_arg(float noundef %arg)
251 void func_f32_arg(float arg) { }
253 // CHECK: define{{.*}} void @func_v2i16_arg(<2 x i16> noundef %arg)
254 void func_v2i16_arg(short2 arg) { }
256 // CHECK: define{{.*}} void @func_v3i32_arg(<3 x i32> noundef %arg)
257 void func_v3i32_arg(int3 arg) { }
259 // CHECK: define{{.*}} void @func_v4i32_arg(<4 x i32> noundef %arg)
260 void func_v4i32_arg(int4 arg) { }
262 // CHECK: define{{.*}} void @func_v16i32_arg(<16 x i32> noundef %arg)
263 void func_v16i32_arg(int16 arg) { }
265 // CHECK: define{{.*}} void @func_v32i32_arg(<32 x i32> noundef %arg)
266 void func_v32i32_arg(int32 arg) { }
268 // CHECK: define{{.*}} void @func_empty_struct_arg()
269 void func_empty_struct_arg(empty_struct empty) { }
271 // CHECK: void @func_single_element_struct_arg(i32 %arg1.coerce)
272 void func_single_element_struct_arg(single_element_struct_arg_t arg1) { }
274 // CHECK: void @func_nested_single_element_struct_arg(i32 %arg1.coerce)
275 void func_nested_single_element_struct_arg(nested_single_element_struct_arg_t arg1) { }
277 // CHECK: void @func_struct_arg(i32 %arg1.coerce0, float %arg1.coerce1, i32 %arg1.coerce2)
278 void func_struct_arg(struct_arg_t arg1) { }
280 // CHECK: void @func_struct_padding_arg(i8 %arg1.coerce0, i64 %arg1.coerce1)
281 void func_struct_padding_arg(struct_padding_arg arg1) { }
283 // CHECK: define{{.*}} void @func_struct_char_x8([2 x i32] %arg.coerce)
284 void func_struct_char_x8(struct_char_x8 arg) { }
286 // CHECK: define{{.*}} void @func_struct_char_x4(i32 %arg.coerce)
287 void func_struct_char_x4(struct_char_x4 arg) { }
289 // CHECK: define{{.*}} void @func_struct_char_x3(i32 %arg.coerce)
290 void func_struct_char_x3(struct_char_x3 arg) { }
292 // CHECK: define{{.*}} void @func_struct_char_x2(i16 %arg.coerce)
293 void func_struct_char_x2(struct_char_x2 arg) { }
295 // CHECK: define{{.*}} void @func_struct_char_x1(i8 %arg.coerce)
296 void func_struct_char_x1(struct_char_x1 arg) { }
298 // CHECK: void @func_transparent_union_arg(i32 %u.coerce)
299 void func_transparent_union_arg(transparent_u u) { }
301 // CHECK: void @func_single_array_element_struct_arg([4 x i32] %arg1.coerce)
302 void func_single_array_element_struct_arg(single_array_element_struct_arg_t arg1) { }
304 // CHECK: void @func_single_struct_element_struct_arg(%struct.inner %arg1.coerce)
305 void func_single_struct_element_struct_arg(single_struct_element_struct_arg_t arg1) { }
307 // CHECK: void @func_different_size_type_pair_arg(i64 %arg1.coerce0, i32 %arg1.coerce1)
308 void func_different_size_type_pair_arg(different_size_type_pair arg1) { }
310 // CHECK: void @func_flexible_array_arg(ptr addrspace(5) nocapture noundef readnone byval(%struct.flexible_array) align 4 %arg)
311 void func_flexible_array_arg(flexible_array arg) { }
313 // CHECK: define{{.*}} float @func_f32_ret()
319 // CHECK: define{{.*}} void @func_empty_struct_ret()
320 empty_struct func_empty_struct_ret()
326 // CHECK: define{{.*}} i32 @single_element_struct_ret()
328 single_element_struct_arg_t single_element_struct_ret()
330 single_element_struct_arg_t s = { 0 };
334 // CHECK: define{{.*}} i32 @nested_single_element_struct_ret()
336 nested_single_element_struct_arg_t nested_single_element_struct_ret()
338 nested_single_element_struct_arg_t s = { 0 };
342 // CHECK: define{{.*}} %struct.struct_arg @func_struct_ret()
343 // CHECK: ret %struct.struct_arg zeroinitializer
344 struct_arg_t func_struct_ret()
346 struct_arg_t s = { 0 };
350 // CHECK: define{{.*}} %struct.struct_padding_arg @func_struct_padding_ret()
351 // CHECK: ret %struct.struct_padding_arg zeroinitializer
352 struct_padding_arg func_struct_padding_ret()
354 struct_padding_arg s = { 0 };
358 // CHECK: define{{.*}} [2 x i32] @func_struct_char_x8_ret()
359 // CHECK: ret [2 x i32] zeroinitializer
360 struct_char_x8 func_struct_char_x8_ret()
362 struct_char_x8 s = { 0 };
366 // CHECK: define{{.*}} i32 @func_struct_char_x4_ret()
368 struct_char_x4 func_struct_char_x4_ret()
370 struct_char_x4 s = { 0 };
374 // CHECK: define{{.*}} i32 @func_struct_char_x3_ret()
376 struct_char_x3 func_struct_char_x3_ret()
378 struct_char_x3 s = { 0 };
382 // CHECK: define{{.*}} i16 @func_struct_char_x2_ret()
383 struct_char_x2 func_struct_char_x2_ret()
385 struct_char_x2 s = { 0 };
389 // CHECK: define{{.*}} i8 @func_struct_char_x1_ret()
391 struct_char_x1 func_struct_char_x1_ret()
393 struct_char_x1 s = { 0 };
397 // CHECK: define{{.*}} %struct.struct_arr16 @func_ret_struct_arr16()
398 // CHECK: ret %struct.struct_arr16 zeroinitializer
399 struct_arr16 func_ret_struct_arr16()
401 struct_arr16 s = { 0 };
405 // CHECK: define{{.*}} void @func_ret_struct_arr32(ptr addrspace(5) noalias nocapture writeonly sret(%struct.struct_arr32) align 4 %agg.result)
406 struct_arr32 func_ret_struct_arr32()
408 struct_arr32 s = { 0 };
412 // CHECK: define{{.*}} void @func_ret_struct_arr33(ptr addrspace(5) noalias nocapture writeonly sret(%struct.struct_arr33) align 4 %agg.result)
413 struct_arr33 func_ret_struct_arr33()
415 struct_arr33 s = { 0 };
419 // CHECK: define{{.*}} %struct.struct_char_arr32 @func_ret_struct_char_arr32()
420 struct_char_arr32 func_ret_struct_char_arr32()
422 struct_char_arr32 s = { 0 };
426 // CHECK: define{{.*}} i32 @func_transparent_union_ret() local_unnamed_addr #1 {
428 transparent_u func_transparent_union_ret()
430 transparent_u u = { 0 };
434 // CHECK: define{{.*}} %struct.different_size_type_pair @func_different_size_type_pair_ret()
435 different_size_type_pair func_different_size_type_pair_ret()
437 different_size_type_pair s = { 0 };
441 // CHECK: define{{.*}} void @func_flexible_array_ret(ptr addrspace(5) noalias nocapture writeonly sret(%struct.flexible_array) align 4 %agg.result)
442 flexible_array func_flexible_array_ret()
444 flexible_array s = { 0 };
448 // CHECK: define{{.*}} void @func_reg_state_lo(<4 x i32> noundef %arg0, <4 x i32> noundef %arg1, <4 x i32> noundef %arg2, i32 noundef %arg3, i32 %s.coerce0, float %s.coerce1, i32 %s.coerce2)
449 void func_reg_state_lo(int4 arg0, int4 arg1, int4 arg2, int arg3, struct_arg_t s) { }
451 // CHECK: define{{.*}} void @func_reg_state_hi(<4 x i32> noundef %arg0, <4 x i32> noundef %arg1, <4 x i32> noundef %arg2, i32 noundef %arg3, i32 noundef %arg4, ptr addrspace(5) nocapture noundef readnone byref(%struct.struct_arg) align 4 %{{.*}})
452 void func_reg_state_hi(int4 arg0, int4 arg1, int4 arg2, int arg3, int arg4, struct_arg_t s) { }
454 // XXX - Why don't the inner structs flatten?
455 // CHECK: define{{.*}} void @func_reg_state_num_regs_nested_struct(<4 x i32> noundef %arg0, i32 noundef %arg1, i32 %arg2.coerce0, %struct.nested %arg2.coerce1, i32 %arg3.coerce0, %struct.nested %arg3.coerce1, ptr addrspace(5) nocapture noundef readnone byref(%struct.num_regs_nested_struct) align 8 %{{.*}})
456 void func_reg_state_num_regs_nested_struct(int4 arg0, int arg1, num_regs_nested_struct arg2, num_regs_nested_struct arg3, num_regs_nested_struct arg4) { }
458 // CHECK: define{{.*}} void @func_double_nested_struct_arg(<4 x i32> noundef %arg0, i32 noundef %arg1, i32 %arg2.coerce0, %struct.double_nested %arg2.coerce1, i16 %arg2.coerce2)
459 void func_double_nested_struct_arg(int4 arg0, int arg1, double_nested_struct arg2) { }
461 // CHECK: define{{.*}} %struct.double_nested_struct @func_double_nested_struct_ret(<4 x i32> noundef %arg0, i32 noundef %arg1)
462 double_nested_struct func_double_nested_struct_ret(int4 arg0, int arg1) {
463 double_nested_struct s = { 0 };
467 // CHECK: define{{.*}} void @func_large_struct_padding_arg_direct(i8 %arg.coerce0, i32 %arg.coerce1, i8 %arg.coerce2, i32 %arg.coerce3, i8 %arg.coerce4, i8 %arg.coerce5, i16 %arg.coerce6, i16 %arg.coerce7, [3 x i8] %arg.coerce8, i64 %arg.coerce9, i32 %arg.coerce10, i8 %arg.coerce11, i32 %arg.coerce12, i16 %arg.coerce13, i8 %arg.coerce14)
468 void func_large_struct_padding_arg_direct(large_struct_padding arg) { }
470 // CHECK: define{{.*}} void @func_large_struct_padding_arg_store(ptr addrspace(1) nocapture noundef writeonly %out, ptr addrspace(5) nocapture noundef readonly byref(%struct.large_struct_padding) align 8 %{{.*}})
471 void func_large_struct_padding_arg_store(global large_struct_padding* out, large_struct_padding arg) {
475 // CHECK: define{{.*}} void @v3i32_reg_count(<3 x i32> noundef %arg1, <3 x i32> noundef %arg2, <3 x i32> noundef %arg3, <3 x i32> noundef %arg4, i32 %arg5.coerce0, float %arg5.coerce1, i32 %arg5.coerce2)
476 void v3i32_reg_count(int3 arg1, int3 arg2, int3 arg3, int3 arg4, struct_arg_t arg5) { }
478 // Function signature from blender, nothing should be passed byval. The v3i32
479 // should not count as 4 passed registers.
480 // CHECK: define{{.*}} void @v3i32_pair_reg_count(ptr addrspace(5) nocapture noundef readnone %arg0, <3 x i32> %arg1.coerce0, <3 x i32> %arg1.coerce1, <3 x i32> noundef %arg2, <3 x i32> %arg3.coerce0, <3 x i32> %arg3.coerce1, <3 x i32> noundef %arg4, float noundef %arg5)
481 void v3i32_pair_reg_count(int3_pair *arg0, int3_pair arg1, int3 arg2, int3_pair arg3, int3 arg4, float arg5) { }
483 // Each short4 should fit pack into 2 registers.
484 // CHECK: define{{.*}} void @v4i16_reg_count(<4 x i16> noundef %arg0, <4 x i16> noundef %arg1, <4 x i16> noundef %arg2, <4 x i16> noundef %arg3, <4 x i16> noundef %arg4, <4 x i16> noundef %arg5, i32 %arg6.coerce0, i32 %arg6.coerce1, i32 %arg6.coerce2, i32 %arg6.coerce3)
485 void v4i16_reg_count(short4 arg0, short4 arg1, short4 arg2, short4 arg3,
486 short4 arg4, short4 arg5, struct_4regs arg6) { }
488 // CHECK: define{{.*}} void @v4i16_pair_reg_count_over(<4 x i16> noundef %arg0, <4 x i16> noundef %arg1, <4 x i16> noundef %arg2, <4 x i16> noundef %arg3, <4 x i16> noundef %arg4, <4 x i16> noundef %arg5, <4 x i16> noundef %arg6, ptr addrspace(5) nocapture noundef readnone byref(%struct.struct_4regs) align 4 %{{.*}})
489 void v4i16_pair_reg_count_over(short4 arg0, short4 arg1, short4 arg2, short4 arg3,
490 short4 arg4, short4 arg5, short4 arg6, struct_4regs arg7) { }
492 // CHECK: define{{.*}} void @v3i16_reg_count(<3 x i16> noundef %arg0, <3 x i16> noundef %arg1, <3 x i16> noundef %arg2, <3 x i16> noundef %arg3, <3 x i16> noundef %arg4, <3 x i16> noundef %arg5, i32 %arg6.coerce0, i32 %arg6.coerce1, i32 %arg6.coerce2, i32 %arg6.coerce3)
493 void v3i16_reg_count(short3 arg0, short3 arg1, short3 arg2, short3 arg3,
494 short3 arg4, short3 arg5, struct_4regs arg6) { }
496 // CHECK: define{{.*}} void @v3i16_reg_count_over(<3 x i16> noundef %arg0, <3 x i16> noundef %arg1, <3 x i16> noundef %arg2, <3 x i16> noundef %arg3, <3 x i16> noundef %arg4, <3 x i16> noundef %arg5, <3 x i16> noundef %arg6, ptr addrspace(5) nocapture noundef readnone byref(%struct.struct_4regs) align 4 %{{.*}})
497 void v3i16_reg_count_over(short3 arg0, short3 arg1, short3 arg2, short3 arg3,
498 short3 arg4, short3 arg5, short3 arg6, struct_4regs arg7) { }
500 // CHECK: define{{.*}} void @v2i16_reg_count(<2 x i16> noundef %arg0, <2 x i16> noundef %arg1, <2 x i16> noundef %arg2, <2 x i16> noundef %arg3, <2 x i16> noundef %arg4, <2 x i16> noundef %arg5, <2 x i16> noundef %arg6, <2 x i16> noundef %arg7, <2 x i16> noundef %arg8, <2 x i16> noundef %arg9, <2 x i16> noundef %arg10, <2 x i16> noundef %arg11, i32 %arg13.coerce0, i32 %arg13.coerce1, i32 %arg13.coerce2, i32 %arg13.coerce3)
501 void v2i16_reg_count(short2 arg0, short2 arg1, short2 arg2, short2 arg3,
502 short2 arg4, short2 arg5, short2 arg6, short2 arg7,
503 short2 arg8, short2 arg9, short2 arg10, short2 arg11,
504 struct_4regs arg13) { }
506 // CHECK: define{{.*}} void @v2i16_reg_count_over(<2 x i16> noundef %arg0, <2 x i16> noundef %arg1, <2 x i16> noundef %arg2, <2 x i16> noundef %arg3, <2 x i16> noundef %arg4, <2 x i16> noundef %arg5, <2 x i16> noundef %arg6, <2 x i16> noundef %arg7, <2 x i16> noundef %arg8, <2 x i16> noundef %arg9, <2 x i16> noundef %arg10, <2 x i16> noundef %arg11, <2 x i16> noundef %arg12, ptr addrspace(5) nocapture noundef readnone byref(%struct.struct_4regs) align 4 %{{.*}})
507 void v2i16_reg_count_over(short2 arg0, short2 arg1, short2 arg2, short2 arg3,
508 short2 arg4, short2 arg5, short2 arg6, short2 arg7,
509 short2 arg8, short2 arg9, short2 arg10, short2 arg11,
510 short2 arg12, struct_4regs arg13) { }
512 // CHECK: define{{.*}} void @v2i8_reg_count(<2 x i8> noundef %arg0, <2 x i8> noundef %arg1, <2 x i8> noundef %arg2, <2 x i8> noundef %arg3, <2 x i8> noundef %arg4, <2 x i8> noundef %arg5, i32 %arg6.coerce0, i32 %arg6.coerce1, i32 %arg6.coerce2, i32 %arg6.coerce3)
513 void v2i8_reg_count(char2 arg0, char2 arg1, char2 arg2, char2 arg3,
514 char2 arg4, char2 arg5, struct_4regs arg6) { }
516 // CHECK: define{{.*}} void @v2i8_reg_count_over(<2 x i8> noundef %arg0, <2 x i8> noundef %arg1, <2 x i8> noundef %arg2, <2 x i8> noundef %arg3, <2 x i8> noundef %arg4, <2 x i8> noundef %arg5, i32 noundef %arg6, ptr addrspace(5) nocapture noundef readnone byref(%struct.struct_4regs) align 4 %{{.*}})
517 void v2i8_reg_count_over(char2 arg0, char2 arg1, char2 arg2, char2 arg3,
518 char2 arg4, char2 arg5, int arg6, struct_4regs arg7) { }
520 // CHECK: define{{.*}} void @num_regs_left_64bit_aggregate(<4 x i32> noundef %arg0, <4 x i32> noundef %arg1, <4 x i32> noundef %arg2, <3 x i32> noundef %arg3, [2 x i32] %arg4.coerce, i32 noundef %arg5)
521 void num_regs_left_64bit_aggregate(int4 arg0, int4 arg1, int4 arg2, int3 arg3, struct_char_x8 arg4, int arg5) { }