// RUN: %clang_cc1 -O0 -cl-std=CL2.0 -triple amdgcn-amd-amdhsa -target-cpu gfx1200 -target-feature +wavefrontsize32 \
// RUN:   -verify -S -o - %s
// REQUIRES: amdgpu-registered-target
// Four-element vector types; pointers to these are the arguments of the
// b128 transpose-load builtins exercised by amdgcn_global_load_tr.
typedef short v4s __attribute__((ext_vector_type(4)));
typedef half v4h __attribute__((ext_vector_type(4)));
typedef __bf16 v4y __attribute__((ext_vector_type(4)));
// Negative test: the RUN line compiles for gfx1200 with +wavefrontsize32, so
// every builtin call below must be rejected with a diagnostic stating that it
// needs gfx12-insts together with wavefrontsize64. Each verification directive
// is kept on the same source line as the call it checks, because the verifier
// matches a directive against diagnostics reported on its own line.
void amdgcn_global_load_tr(global int *int_inptr, global v4s *v4s_inptr,
                           global v4h *v4h_inptr, global v4y *v4y_inptr)
{
  int out_1 = __builtin_amdgcn_global_load_tr_b64_i32(int_inptr); // expected-error{{'__builtin_amdgcn_global_load_tr_b64_i32' needs target feature gfx12-insts,wavefrontsize64}}
  v4s out_2 = __builtin_amdgcn_global_load_tr_b128_v4i16(v4s_inptr); // expected-error{{'__builtin_amdgcn_global_load_tr_b128_v4i16' needs target feature gfx12-insts,wavefrontsize64}}
  v4h out_3 = __builtin_amdgcn_global_load_tr_b128_v4f16(v4h_inptr); // expected-error{{'__builtin_amdgcn_global_load_tr_b128_v4f16' needs target feature gfx12-insts,wavefrontsize64}}
  v4y out_4 = __builtin_amdgcn_global_load_tr_b128_v4bf16(v4y_inptr); // expected-error{{'__builtin_amdgcn_global_load_tr_b128_v4bf16' needs target feature gfx12-insts,wavefrontsize64}}
}