[MLIR][NVVM] Add TMA Bulk Copy Ops (#123186)
[llvm-project.git] / llvm / test / MC / AMDGPU / gfx11_asm_vop1-fake16.s
blobc590d42c0dc663098b87993822aa4aec377e158c
// Test driver: both llvm-mc invocations below assemble this file for gfx1100
// with real-true16 disabled (-mattr=-real-true16) and print encodings. They
// differ only in wavefront size (32 vs 64) and are verified against the same
// FileCheck prefix, so every expected encoding must hold in both modes.
1 // RUN: llvm-mc -triple=amdgcn -mcpu=gfx1100 -mattr=-real-true16,+wavefrontsize32 -show-encoding %s | FileCheck --check-prefix=GFX11 %s
2 // RUN: llvm-mc -triple=amdgcn -mcpu=gfx1100 -mattr=-real-true16,+wavefrontsize64 -show-encoding %s | FileCheck --check-prefix=GFX11 %s
// v_floor_f16: encoding checks with destination v5 and each kind of source
// operand in turn: VGPRs (v1, v127), SGPRs (s1, s105), vcc_lo/vcc_hi, ttmp15,
// m0, exec_lo/exec_hi, null, inline constants (-1, 0.5) and src_scc.
// In the expected bytes the second byte is 0xb7 for VGPR sources and 0xb6 for
// every other source. The final case uses destination v127 with the literal
// 0xfe0b, which yields an 8-byte encoding whose trailing four bytes carry the
// literal (0x0b,0xfe,0x00,0x00).
4 v_floor_f16 v5, v1
5 // GFX11: encoding: [0x01,0xb7,0x0a,0x7e]
7 v_floor_f16 v5, v127
8 // GFX11: encoding: [0x7f,0xb7,0x0a,0x7e]
10 v_floor_f16 v5, s1
11 // GFX11: encoding: [0x01,0xb6,0x0a,0x7e]
13 v_floor_f16 v5, s105
14 // GFX11: encoding: [0x69,0xb6,0x0a,0x7e]
16 v_floor_f16 v5, vcc_lo
17 // GFX11: encoding: [0x6a,0xb6,0x0a,0x7e]
19 v_floor_f16 v5, vcc_hi
20 // GFX11: encoding: [0x6b,0xb6,0x0a,0x7e]
22 v_floor_f16 v5, ttmp15
23 // GFX11: encoding: [0x7b,0xb6,0x0a,0x7e]
25 v_floor_f16 v5, m0
26 // GFX11: encoding: [0x7d,0xb6,0x0a,0x7e]
28 v_floor_f16 v5, exec_lo
29 // GFX11: encoding: [0x7e,0xb6,0x0a,0x7e]
31 v_floor_f16 v5, exec_hi
32 // GFX11: encoding: [0x7f,0xb6,0x0a,0x7e]
34 v_floor_f16 v5, null
35 // GFX11: encoding: [0x7c,0xb6,0x0a,0x7e]
37 v_floor_f16 v5, -1
38 // GFX11: encoding: [0xc1,0xb6,0x0a,0x7e]
40 v_floor_f16 v5, 0.5
41 // GFX11: encoding: [0xf0,0xb6,0x0a,0x7e]
43 v_floor_f16 v5, src_scc
44 // GFX11: encoding: [0xfd,0xb6,0x0a,0x7e]
46 v_floor_f16 v127, 0xfe0b
47 // GFX11: encoding: [0xff,0xb6,0xfe,0x7e,0x0b,0xfe,0x00,0x00]
// v_floor_f32 with a VGPR source: the only 32-bit float instruction among the
// f16 groups in this part of the file.
// NOTE(review): presumably kept here to confirm the f32 floor encoding is
// unaffected when real-true16 is disabled; confirm the intent.
49 v_floor_f32 v5, v1
50 // GFX11: encoding: [0x01,0x49,0x0a,0x7e]
// v_ceil_f16: same operand sweep as the other f16 groups in this file.
// Destination v5 with sources v1, v127, s1, s105, vcc_lo, vcc_hi, ttmp15, m0,
// exec_lo, exec_hi, null, -1, 0.5 and src_scc; the second encoding byte is
// 0xb9 for VGPR sources and 0xb8 otherwise. The last case (destination v127,
// literal 0xfe0b) expects an 8-byte encoding ending in the literal bytes.
52 v_ceil_f16 v5, v1
53 // GFX11: encoding: [0x01,0xb9,0x0a,0x7e]
55 v_ceil_f16 v5, v127
56 // GFX11: encoding: [0x7f,0xb9,0x0a,0x7e]
58 v_ceil_f16 v5, s1
59 // GFX11: encoding: [0x01,0xb8,0x0a,0x7e]
61 v_ceil_f16 v5, s105
62 // GFX11: encoding: [0x69,0xb8,0x0a,0x7e]
64 v_ceil_f16 v5, vcc_lo
65 // GFX11: encoding: [0x6a,0xb8,0x0a,0x7e]
67 v_ceil_f16 v5, vcc_hi
68 // GFX11: encoding: [0x6b,0xb8,0x0a,0x7e]
70 v_ceil_f16 v5, ttmp15
71 // GFX11: encoding: [0x7b,0xb8,0x0a,0x7e]
73 v_ceil_f16 v5, m0
74 // GFX11: encoding: [0x7d,0xb8,0x0a,0x7e]
76 v_ceil_f16 v5, exec_lo
77 // GFX11: encoding: [0x7e,0xb8,0x0a,0x7e]
79 v_ceil_f16 v5, exec_hi
80 // GFX11: encoding: [0x7f,0xb8,0x0a,0x7e]
82 v_ceil_f16 v5, null
83 // GFX11: encoding: [0x7c,0xb8,0x0a,0x7e]
85 v_ceil_f16 v5, -1
86 // GFX11: encoding: [0xc1,0xb8,0x0a,0x7e]
88 v_ceil_f16 v5, 0.5
89 // GFX11: encoding: [0xf0,0xb8,0x0a,0x7e]
91 v_ceil_f16 v5, src_scc
92 // GFX11: encoding: [0xfd,0xb8,0x0a,0x7e]
94 v_ceil_f16 v127, 0xfe0b
95 // GFX11: encoding: [0xff,0xb8,0xfe,0x7e,0x0b,0xfe,0x00,0x00]
// v_rcp_f16: encoding checks over the standard source-operand sweep
// (VGPRs, SGPRs, vcc halves, ttmp15, m0, exec halves, null, inline constants
// -1 and 0.5, src_scc) with destination v5. Expected second byte is 0xa9 for
// VGPR sources and 0xa8 for all others. The closing case writes v127 from the
// literal 0xfe0b and expects the literal appended as four extra bytes.
97 v_rcp_f16 v5, v1
98 // GFX11: encoding: [0x01,0xa9,0x0a,0x7e]
100 v_rcp_f16 v5, v127
101 // GFX11: encoding: [0x7f,0xa9,0x0a,0x7e]
103 v_rcp_f16 v5, s1
104 // GFX11: encoding: [0x01,0xa8,0x0a,0x7e]
106 v_rcp_f16 v5, s105
107 // GFX11: encoding: [0x69,0xa8,0x0a,0x7e]
109 v_rcp_f16 v5, vcc_lo
110 // GFX11: encoding: [0x6a,0xa8,0x0a,0x7e]
112 v_rcp_f16 v5, vcc_hi
113 // GFX11: encoding: [0x6b,0xa8,0x0a,0x7e]
115 v_rcp_f16 v5, ttmp15
116 // GFX11: encoding: [0x7b,0xa8,0x0a,0x7e]
118 v_rcp_f16 v5, m0
119 // GFX11: encoding: [0x7d,0xa8,0x0a,0x7e]
121 v_rcp_f16 v5, exec_lo
122 // GFX11: encoding: [0x7e,0xa8,0x0a,0x7e]
124 v_rcp_f16 v5, exec_hi
125 // GFX11: encoding: [0x7f,0xa8,0x0a,0x7e]
127 v_rcp_f16 v5, null
128 // GFX11: encoding: [0x7c,0xa8,0x0a,0x7e]
130 v_rcp_f16 v5, -1
131 // GFX11: encoding: [0xc1,0xa8,0x0a,0x7e]
133 v_rcp_f16 v5, 0.5
134 // GFX11: encoding: [0xf0,0xa8,0x0a,0x7e]
136 v_rcp_f16 v5, src_scc
137 // GFX11: encoding: [0xfd,0xa8,0x0a,0x7e]
139 v_rcp_f16 v127, 0xfe0b
140 // GFX11: encoding: [0xff,0xa8,0xfe,0x7e,0x0b,0xfe,0x00,0x00]
// v_sqrt_f16: one check per source-operand kind with destination v5
// (v1, v127, s1, s105, vcc_lo, vcc_hi, ttmp15, m0, exec_lo, exec_hi, null,
// -1, 0.5, src_scc). The second expected byte is 0xab when the source is a
// VGPR and 0xaa otherwise. The last case pairs destination v127 with the
// literal 0xfe0b and expects an 8-byte encoding that ends with the literal.
142 v_sqrt_f16 v5, v1
143 // GFX11: encoding: [0x01,0xab,0x0a,0x7e]
145 v_sqrt_f16 v5, v127
146 // GFX11: encoding: [0x7f,0xab,0x0a,0x7e]
148 v_sqrt_f16 v5, s1
149 // GFX11: encoding: [0x01,0xaa,0x0a,0x7e]
151 v_sqrt_f16 v5, s105
152 // GFX11: encoding: [0x69,0xaa,0x0a,0x7e]
154 v_sqrt_f16 v5, vcc_lo
155 // GFX11: encoding: [0x6a,0xaa,0x0a,0x7e]
157 v_sqrt_f16 v5, vcc_hi
158 // GFX11: encoding: [0x6b,0xaa,0x0a,0x7e]
160 v_sqrt_f16 v5, ttmp15
161 // GFX11: encoding: [0x7b,0xaa,0x0a,0x7e]
163 v_sqrt_f16 v5, m0
164 // GFX11: encoding: [0x7d,0xaa,0x0a,0x7e]
166 v_sqrt_f16 v5, exec_lo
167 // GFX11: encoding: [0x7e,0xaa,0x0a,0x7e]
169 v_sqrt_f16 v5, exec_hi
170 // GFX11: encoding: [0x7f,0xaa,0x0a,0x7e]
172 v_sqrt_f16 v5, null
173 // GFX11: encoding: [0x7c,0xaa,0x0a,0x7e]
175 v_sqrt_f16 v5, -1
176 // GFX11: encoding: [0xc1,0xaa,0x0a,0x7e]
178 v_sqrt_f16 v5, 0.5
179 // GFX11: encoding: [0xf0,0xaa,0x0a,0x7e]
181 v_sqrt_f16 v5, src_scc
182 // GFX11: encoding: [0xfd,0xaa,0x0a,0x7e]
184 v_sqrt_f16 v127, 0xfe0b
185 // GFX11: encoding: [0xff,0xaa,0xfe,0x7e,0x0b,0xfe,0x00,0x00]
// v_rsq_f16: encoding checks with destination v5 across the standard source
// sweep (v1, v127, s1, s105, vcc_lo, vcc_hi, ttmp15, m0, exec_lo, exec_hi,
// null, -1, 0.5, src_scc). The second expected byte is 0xad for VGPR sources
// and 0xac for every other source. The final case covers the highest
// destination register (v127) together with a 32-bit literal source, matching
// the coverage of the other f16 groups in this file; its expected bytes follow
// the same layout as theirs with this instruction's 0xac opcode byte.
187 v_rsq_f16 v5, v1
188 // GFX11: encoding: [0x01,0xad,0x0a,0x7e]
190 v_rsq_f16 v5, v127
191 // GFX11: encoding: [0x7f,0xad,0x0a,0x7e]
193 v_rsq_f16 v5, s1
194 // GFX11: encoding: [0x01,0xac,0x0a,0x7e]
196 v_rsq_f16 v5, s105
197 // GFX11: encoding: [0x69,0xac,0x0a,0x7e]
199 v_rsq_f16 v5, vcc_lo
200 // GFX11: encoding: [0x6a,0xac,0x0a,0x7e]
202 v_rsq_f16 v5, vcc_hi
203 // GFX11: encoding: [0x6b,0xac,0x0a,0x7e]
205 v_rsq_f16 v5, ttmp15
206 // GFX11: encoding: [0x7b,0xac,0x0a,0x7e]
208 v_rsq_f16 v5, m0
209 // GFX11: encoding: [0x7d,0xac,0x0a,0x7e]
211 v_rsq_f16 v5, exec_lo
212 // GFX11: encoding: [0x7e,0xac,0x0a,0x7e]
214 v_rsq_f16 v5, exec_hi
215 // GFX11: encoding: [0x7f,0xac,0x0a,0x7e]
217 v_rsq_f16 v5, null
218 // GFX11: encoding: [0x7c,0xac,0x0a,0x7e]
220 v_rsq_f16 v5, -1
221 // GFX11: encoding: [0xc1,0xac,0x0a,0x7e]
223 v_rsq_f16 v5, 0.5
224 // GFX11: encoding: [0xf0,0xac,0x0a,0x7e]
226 v_rsq_f16 v5, src_scc
227 // GFX11: encoding: [0xfd,0xac,0x0a,0x7e]
v_rsq_f16 v127, 0xfe0b
// GFX11: encoding: [0xff,0xac,0xfe,0x7e,0x0b,0xfe,0x00,0x00]
// v_log_f16: encoding checks with destination v5 and sources v1, v127, s1,
// s105, vcc_lo, vcc_hi, ttmp15, m0, exec_lo, exec_hi, null, -1, 0.5 and
// src_scc. VGPR sources expect 0xaf as the second byte; all other sources
// expect 0xae. The last case (destination v127, literal 0xfe0b) expects an
// 8-byte encoding whose final four bytes are the literal.
229 v_log_f16 v5, v1
230 // GFX11: encoding: [0x01,0xaf,0x0a,0x7e]
232 v_log_f16 v5, v127
233 // GFX11: encoding: [0x7f,0xaf,0x0a,0x7e]
235 v_log_f16 v5, s1
236 // GFX11: encoding: [0x01,0xae,0x0a,0x7e]
238 v_log_f16 v5, s105
239 // GFX11: encoding: [0x69,0xae,0x0a,0x7e]
241 v_log_f16 v5, vcc_lo
242 // GFX11: encoding: [0x6a,0xae,0x0a,0x7e]
244 v_log_f16 v5, vcc_hi
245 // GFX11: encoding: [0x6b,0xae,0x0a,0x7e]
247 v_log_f16 v5, ttmp15
248 // GFX11: encoding: [0x7b,0xae,0x0a,0x7e]
250 v_log_f16 v5, m0
251 // GFX11: encoding: [0x7d,0xae,0x0a,0x7e]
253 v_log_f16 v5, exec_lo
254 // GFX11: encoding: [0x7e,0xae,0x0a,0x7e]
256 v_log_f16 v5, exec_hi
257 // GFX11: encoding: [0x7f,0xae,0x0a,0x7e]
259 v_log_f16 v5, null
260 // GFX11: encoding: [0x7c,0xae,0x0a,0x7e]
262 v_log_f16 v5, -1
263 // GFX11: encoding: [0xc1,0xae,0x0a,0x7e]
265 v_log_f16 v5, 0.5
266 // GFX11: encoding: [0xf0,0xae,0x0a,0x7e]
268 v_log_f16 v5, src_scc
269 // GFX11: encoding: [0xfd,0xae,0x0a,0x7e]
271 v_log_f16 v127, 0xfe0b
272 // GFX11: encoding: [0xff,0xae,0xfe,0x7e,0x0b,0xfe,0x00,0x00]
// v_exp_f16: the same source-operand sweep as the preceding f16 groups, with
// destination v5 (VGPRs, SGPRs, vcc halves, ttmp15, m0, exec halves, null,
// inline constants -1 and 0.5, src_scc). The second expected byte is 0xb1 for
// VGPR sources and 0xb0 otherwise. The final case uses destination v127 and
// the literal 0xfe0b, giving an 8-byte encoding with the literal at the end.
274 v_exp_f16 v5, v1
275 // GFX11: encoding: [0x01,0xb1,0x0a,0x7e]
277 v_exp_f16 v5, v127
278 // GFX11: encoding: [0x7f,0xb1,0x0a,0x7e]
280 v_exp_f16 v5, s1
281 // GFX11: encoding: [0x01,0xb0,0x0a,0x7e]
283 v_exp_f16 v5, s105
284 // GFX11: encoding: [0x69,0xb0,0x0a,0x7e]
286 v_exp_f16 v5, vcc_lo
287 // GFX11: encoding: [0x6a,0xb0,0x0a,0x7e]
289 v_exp_f16 v5, vcc_hi
290 // GFX11: encoding: [0x6b,0xb0,0x0a,0x7e]
292 v_exp_f16 v5, ttmp15
293 // GFX11: encoding: [0x7b,0xb0,0x0a,0x7e]
295 v_exp_f16 v5, m0
296 // GFX11: encoding: [0x7d,0xb0,0x0a,0x7e]
298 v_exp_f16 v5, exec_lo
299 // GFX11: encoding: [0x7e,0xb0,0x0a,0x7e]
301 v_exp_f16 v5, exec_hi
302 // GFX11: encoding: [0x7f,0xb0,0x0a,0x7e]
304 v_exp_f16 v5, null
305 // GFX11: encoding: [0x7c,0xb0,0x0a,0x7e]
307 v_exp_f16 v5, -1
308 // GFX11: encoding: [0xc1,0xb0,0x0a,0x7e]
310 v_exp_f16 v5, 0.5
311 // GFX11: encoding: [0xf0,0xb0,0x0a,0x7e]
313 v_exp_f16 v5, src_scc
314 // GFX11: encoding: [0xfd,0xb0,0x0a,0x7e]
316 v_exp_f16 v127, 0xfe0b
317 // GFX11: encoding: [0xff,0xb0,0xfe,0x7e,0x0b,0xfe,0x00,0x00]