[Frontend] Remove unused includes (NFC) (#116927)
[llvm-project.git] / llvm / test / MC / AMDGPU / gfx12_asm_vop3p.s
blobdb9ad3d2a8418d778561e4670e24d48efce57215
1 // RUN: llvm-mc -triple=amdgcn -show-encoding -mcpu=gfx1200 %s | FileCheck --check-prefix=GFX12 %s
// v_dot2_f32_bf16: all expected encodings share 0x1a,0xcc as their third and
// fourth bytes. The cases vary the three sources across VGPRs, SGPRs, special
// registers (vcc, ttmp15, m0, exec, null, src_scc), inline constants and
// literals; a literal operand grows the expected encoding from 8 to 12 bytes,
// with the literal appended least-significant byte first.
3 v_dot2_f32_bf16 v5, v1, v2, v3
4 // GFX12: [0x05,0x40,0x1a,0xcc,0x01,0x05,0x0e,0x1c]
6 v_dot2_f32_bf16 v5, v1, v2, s3
7 // GFX12: [0x05,0x40,0x1a,0xcc,0x01,0x05,0x0e,0x18]
9 v_dot2_f32_bf16 v5, v255, v255, s105
10 // GFX12: [0x05,0x40,0x1a,0xcc,0xff,0xff,0xa7,0x19]
12 v_dot2_f32_bf16 v5, s1, s2, v255
13 // GFX12: [0x05,0x40,0x1a,0xcc,0x01,0x04,0xfc,0x1f]
15 v_dot2_f32_bf16 v5, s105, s105, m0
16 // GFX12: [0x05,0x40,0x1a,0xcc,0x69,0xd2,0xf4,0x19]
18 v_dot2_f32_bf16 v5, vcc_lo, ttmp15, vcc_lo
19 // GFX12: [0x05,0x40,0x1a,0xcc,0x6a,0xf6,0xa8,0x19]
21 v_dot2_f32_bf16 v5, vcc_hi, 0xfe0b, vcc_hi
22 // GFX12: [0x05,0x40,0x1a,0xcc,0x6b,0xfe,0xad,0x19,0x0b,0xfe,0x00,0x00]
24 v_dot2_f32_bf16 v5, ttmp15, src_scc, ttmp15
25 // GFX12: [0x05,0x40,0x1a,0xcc,0x7b,0xfa,0xed,0x19]
27 v_dot2_f32_bf16 v5, m0, -1, exec_hi
28 // GFX12: [0x05,0x40,0x1a,0xcc,0x7d,0x82,0xfd,0x19]
30 v_dot2_f32_bf16 v5, exec_lo, null, exec_lo
31 // GFX12: [0x05,0x40,0x1a,0xcc,0x7e,0xf8,0xf8,0x19]
33 v_dot2_f32_bf16 v5, exec_hi, exec_lo, null
34 // GFX12: [0x05,0x40,0x1a,0xcc,0x7f,0xfc,0xf0,0x19]
36 v_dot2_f32_bf16 v5, null, exec_hi, -1
37 // GFX12: [0x05,0x40,0x1a,0xcc,0x7c,0xfe,0x04,0x1b]
39 v_dot2_f32_bf16 v5, -1, m0, 0xaf123456
40 // GFX12: [0x05,0x40,0x1a,0xcc,0xc1,0xfa,0xfc,0x1b,0x56,0x34,0x12,0xaf]
// Modifier cases: neg_lo/neg_hi on the first source, then explicit all-zero
// neg masks combined with clamp and the v255 destination.
42 v_dot2_f32_bf16 v5, src_scc, vcc_lo, src_scc neg_lo:[1,0,0] neg_hi:[1,0,0]
43 // GFX12: [0x05,0x41,0x1a,0xcc,0xfd,0xd4,0xf4,0x3b]
45 v_dot2_f32_bf16 v255, 0xfe0b, vcc_hi, 0.5 neg_lo:[0,0,0] neg_hi:[0,0,0] clamp
46 // GFX12: [0xff,0xc0,0x1a,0xcc,0xff,0xd6,0xc0,0x1b,0x0b,0xfe,0x00,0x00]
// v_dot2_f32_f16: expected encodings carry 0x13,0xcc as their third and
// fourth bytes. Same operand sweep as the other three-source groups: VGPRs,
// SGPRs, special registers, inline constants (-1, 0.5) and 16-/32-bit
// literals (literal cases expect 12 bytes instead of 8).
48 v_dot2_f32_f16 v5, v1, v2, s3
49 // GFX12: [0x05,0x40,0x13,0xcc,0x01,0x05,0x0e,0x18]
51 v_dot2_f32_f16 v5, v255, s2, s105
52 // GFX12: [0x05,0x40,0x13,0xcc,0xff,0x05,0xa4,0x19]
54 v_dot2_f32_f16 v5, s1, v255, exec_hi
55 // GFX12: [0x05,0x40,0x13,0xcc,0x01,0xfe,0xff,0x19]
57 v_dot2_f32_f16 v5, s105, s105, exec_lo
58 // GFX12: [0x05,0x40,0x13,0xcc,0x69,0xd2,0xf8,0x19]
60 v_dot2_f32_f16 v5, vcc_lo, ttmp15, v3
61 // GFX12: [0x05,0x40,0x13,0xcc,0x6a,0xf6,0x0c,0x1c]
63 v_dot2_f32_f16 v5, vcc_hi, 0xfe0b, v255
64 // GFX12: [0x05,0x40,0x13,0xcc,0x6b,0xfe,0xfd,0x1f,0x0b,0xfe,0x00,0x00]
66 v_dot2_f32_f16 v5, ttmp15, src_scc, ttmp15
67 // GFX12: [0x05,0x40,0x13,0xcc,0x7b,0xfa,0xed,0x19]
69 v_dot2_f32_f16 v5, m0, 0.5, m0
70 // GFX12: [0x05,0x40,0x13,0xcc,0x7d,0xe0,0xf5,0x19]
72 v_dot2_f32_f16 v5, exec_lo, -1, vcc_hi
73 // GFX12: [0x05,0x40,0x13,0xcc,0x7e,0x82,0xad,0x19]
75 v_dot2_f32_f16 v5, exec_hi, null, vcc_lo
76 // GFX12: [0x05,0x40,0x13,0xcc,0x7f,0xf8,0xa8,0x19]
78 v_dot2_f32_f16 v5, null, exec_lo, 0xaf123456
79 // GFX12: [0x05,0x40,0x13,0xcc,0x7c,0xfc,0xfc,0x1b,0x56,0x34,0x12,0xaf]
81 v_dot2_f32_f16 v5, -1, exec_hi, src_scc
82 // GFX12: [0x05,0x40,0x13,0xcc,0xc1,0xfe,0xf4,0x1b]
// Modifier cases: neg_lo/neg_hi on the first source, on the second source,
// and explicit all-zero masks together with clamp.
84 v_dot2_f32_f16 v5, 0.5, m0, 0.5 neg_lo:[1,0,0] neg_hi:[1,0,0]
85 // GFX12: [0x05,0x41,0x13,0xcc,0xf0,0xfa,0xc0,0x3b]
87 v_dot2_f32_f16 v5, src_scc, vcc_lo, -1 neg_lo:[0,1,0] neg_hi:[0,1,0]
88 // GFX12: [0x05,0x42,0x13,0xcc,0xfd,0xd4,0x04,0x5b]
90 v_dot2_f32_f16 v255, 0xfe0b, vcc_hi, null neg_lo:[0,0,0] neg_hi:[0,0,0] clamp
91 // GFX12: [0xff,0xc0,0x13,0xcc,0xff,0xd6,0xf0,0x19,0x0b,0xfe,0x00,0x00]
// v_dot4_i32_iu8: expected encodings carry 0x16,0xcc as their third and
// fourth bytes. Sources are swept across VGPRs, SGPRs, special registers,
// inline constants and the 32-bit literal 0xaf123456. The only modifier used
// in this group is neg_lo; no case here uses neg_hi or clamp.
93 v_dot4_i32_iu8 v5, v1, v2, s3
94 // GFX12: [0x05,0x40,0x16,0xcc,0x01,0x05,0x0e,0x18]
96 v_dot4_i32_iu8 v5, v255, s2, s105
97 // GFX12: [0x05,0x40,0x16,0xcc,0xff,0x05,0xa4,0x19]
99 v_dot4_i32_iu8 v5, s1, v255, exec_hi
100 // GFX12: [0x05,0x40,0x16,0xcc,0x01,0xfe,0xff,0x19]
102 v_dot4_i32_iu8 v5, s105, s105, exec_lo
103 // GFX12: [0x05,0x40,0x16,0xcc,0x69,0xd2,0xf8,0x19]
105 v_dot4_i32_iu8 v5, vcc_lo, ttmp15, v3
106 // GFX12: [0x05,0x40,0x16,0xcc,0x6a,0xf6,0x0c,0x1c]
108 v_dot4_i32_iu8 v5, vcc_hi, 0xaf123456, v255
109 // GFX12: [0x05,0x40,0x16,0xcc,0x6b,0xfe,0xfd,0x1f,0x56,0x34,0x12,0xaf]
111 v_dot4_i32_iu8 v5, ttmp15, src_scc, ttmp15
112 // GFX12: [0x05,0x40,0x16,0xcc,0x7b,0xfa,0xed,0x19]
114 v_dot4_i32_iu8 v5, m0, 0.5, m0
115 // GFX12: [0x05,0x40,0x16,0xcc,0x7d,0xe0,0xf5,0x19]
117 v_dot4_i32_iu8 v5, exec_lo, -1, vcc_hi
118 // GFX12: [0x05,0x40,0x16,0xcc,0x7e,0x82,0xad,0x19]
120 v_dot4_i32_iu8 v5, exec_hi, null, vcc_lo
121 // GFX12: [0x05,0x40,0x16,0xcc,0x7f,0xf8,0xa8,0x19]
123 v_dot4_i32_iu8 v5, null, exec_lo, 0xaf123456
124 // GFX12: [0x05,0x40,0x16,0xcc,0x7c,0xfc,0xfc,0x1b,0x56,0x34,0x12,0xaf]
126 v_dot4_i32_iu8 v5, -1, exec_hi, src_scc
127 // GFX12: [0x05,0x40,0x16,0xcc,0xc1,0xfe,0xf4,0x1b]
// neg_lo cases: the second expected byte stays 0x40 and only the last byte
// differs from what the unmodified form would give.
129 v_dot4_i32_iu8 v5, 0.5, m0, 0.5 neg_lo:[1,0,0]
130 // GFX12: [0x05,0x40,0x16,0xcc,0xf0,0xfa,0xc0,0x3b]
132 v_dot4_i32_iu8 v5, src_scc, vcc_lo, -1 neg_lo:[0,1,0]
133 // GFX12: [0x05,0x40,0x16,0xcc,0xfd,0xd4,0x04,0x5b]
135 v_dot4_i32_iu8 v255, 0xaf123456, vcc_hi, null neg_lo:[0,0,0]
136 // GFX12: [0xff,0x40,0x16,0xcc,0xff,0xd6,0xf0,0x19,0x56,0x34,0x12,0xaf]
// v_dot4_u32_u8: expected encodings carry 0x17,0xcc as their third and
// fourth bytes. Operand sweep only (VGPRs, SGPRs, special registers, inline
// constants, 32-bit literal); no case in this group uses a modifier.
138 v_dot4_u32_u8 v5, v1, v2, s3
139 // GFX12: [0x05,0x40,0x17,0xcc,0x01,0x05,0x0e,0x18]
141 v_dot4_u32_u8 v5, v255, s2, s105
142 // GFX12: [0x05,0x40,0x17,0xcc,0xff,0x05,0xa4,0x19]
144 v_dot4_u32_u8 v5, s1, v255, exec_hi
145 // GFX12: [0x05,0x40,0x17,0xcc,0x01,0xfe,0xff,0x19]
147 v_dot4_u32_u8 v5, s105, s105, exec_lo
148 // GFX12: [0x05,0x40,0x17,0xcc,0x69,0xd2,0xf8,0x19]
150 v_dot4_u32_u8 v5, vcc_lo, ttmp15, v3
151 // GFX12: [0x05,0x40,0x17,0xcc,0x6a,0xf6,0x0c,0x1c]
153 v_dot4_u32_u8 v5, vcc_hi, 0xaf123456, v255
154 // GFX12: [0x05,0x40,0x17,0xcc,0x6b,0xfe,0xfd,0x1f,0x56,0x34,0x12,0xaf]
156 v_dot4_u32_u8 v5, ttmp15, src_scc, ttmp15
157 // GFX12: [0x05,0x40,0x17,0xcc,0x7b,0xfa,0xed,0x19]
159 v_dot4_u32_u8 v5, m0, 0.5, m0
160 // GFX12: [0x05,0x40,0x17,0xcc,0x7d,0xe0,0xf5,0x19]
162 v_dot4_u32_u8 v5, exec_lo, -1, vcc_hi
163 // GFX12: [0x05,0x40,0x17,0xcc,0x7e,0x82,0xad,0x19]
165 v_dot4_u32_u8 v5, exec_hi, null, vcc_lo
166 // GFX12: [0x05,0x40,0x17,0xcc,0x7f,0xf8,0xa8,0x19]
168 v_dot4_u32_u8 v5, null, exec_lo, 0xaf123456
169 // GFX12: [0x05,0x40,0x17,0xcc,0x7c,0xfc,0xfc,0x1b,0x56,0x34,0x12,0xaf]
171 v_dot4_u32_u8 v5, -1, exec_hi, src_scc
172 // GFX12: [0x05,0x40,0x17,0xcc,0xc1,0xfe,0xf4,0x1b]
174 v_dot4_u32_u8 v5, 0.5, m0, 0.5
175 // GFX12: [0x05,0x40,0x17,0xcc,0xf0,0xfa,0xc0,0x1b]
177 v_dot4_u32_u8 v5, src_scc, vcc_lo, -1
178 // GFX12: [0x05,0x40,0x17,0xcc,0xfd,0xd4,0x04,0x1b]
180 v_dot4_u32_u8 v255, 0xaf123456, vcc_hi, null
181 // GFX12: [0xff,0x40,0x17,0xcc,0xff,0xd6,0xf0,0x19,0x56,0x34,0x12,0xaf]
// v_dot8_i32_iu4: expected encodings carry 0x18,0xcc as their third and
// fourth bytes. Operand sweep over VGPRs, SGPRs, special registers, inline
// constants and the 32-bit literal 0xaf123456, followed by neg_lo cases and
// one clamp case.
183 v_dot8_i32_iu4 v5, v1, v2, s3
184 // GFX12: [0x05,0x40,0x18,0xcc,0x01,0x05,0x0e,0x18]
186 v_dot8_i32_iu4 v5, v255, s2, s105
187 // GFX12: [0x05,0x40,0x18,0xcc,0xff,0x05,0xa4,0x19]
189 v_dot8_i32_iu4 v5, s1, v255, exec_hi
190 // GFX12: [0x05,0x40,0x18,0xcc,0x01,0xfe,0xff,0x19]
192 v_dot8_i32_iu4 v5, s105, s105, exec_lo
193 // GFX12: [0x05,0x40,0x18,0xcc,0x69,0xd2,0xf8,0x19]
195 v_dot8_i32_iu4 v5, vcc_lo, ttmp15, v3
196 // GFX12: [0x05,0x40,0x18,0xcc,0x6a,0xf6,0x0c,0x1c]
198 v_dot8_i32_iu4 v5, vcc_hi, 0xaf123456, v255
199 // GFX12: [0x05,0x40,0x18,0xcc,0x6b,0xfe,0xfd,0x1f,0x56,0x34,0x12,0xaf]
201 v_dot8_i32_iu4 v5, ttmp15, src_scc, ttmp15
202 // GFX12: [0x05,0x40,0x18,0xcc,0x7b,0xfa,0xed,0x19]
204 v_dot8_i32_iu4 v5, m0, 0.5, m0
205 // GFX12: [0x05,0x40,0x18,0xcc,0x7d,0xe0,0xf5,0x19]
207 v_dot8_i32_iu4 v5, exec_lo, -1, vcc_hi
208 // GFX12: [0x05,0x40,0x18,0xcc,0x7e,0x82,0xad,0x19]
210 v_dot8_i32_iu4 v5, exec_hi, null, vcc_lo
211 // GFX12: [0x05,0x40,0x18,0xcc,0x7f,0xf8,0xa8,0x19]
213 v_dot8_i32_iu4 v5, null, exec_lo, 0xaf123456
214 // GFX12: [0x05,0x40,0x18,0xcc,0x7c,0xfc,0xfc,0x1b,0x56,0x34,0x12,0xaf]
216 v_dot8_i32_iu4 v5, -1, exec_hi, src_scc
217 // GFX12: [0x05,0x40,0x18,0xcc,0xc1,0xfe,0xf4,0x1b]
// neg_lo cases; the final case also adds clamp, where the second expected
// byte is 0xc0 instead of 0x40.
219 v_dot8_i32_iu4 v5, 0.5, m0, 0.5 neg_lo:[1,0,0]
220 // GFX12: [0x05,0x40,0x18,0xcc,0xf0,0xfa,0xc0,0x3b]
222 v_dot8_i32_iu4 v5, src_scc, vcc_lo, -1 neg_lo:[0,1,0]
223 // GFX12: [0x05,0x40,0x18,0xcc,0xfd,0xd4,0x04,0x5b]
225 v_dot8_i32_iu4 v255, 0xaf123456, vcc_hi, null neg_lo:[0,0,0] clamp
226 // GFX12: [0xff,0xc0,0x18,0xcc,0xff,0xd6,0xf0,0x19,0x56,0x34,0x12,0xaf]
// v_dot8_u32_u4: expected encodings carry 0x19,0xcc as their third and
// fourth bytes. Operand sweep over VGPRs, SGPRs, special registers, inline
// constants and the 32-bit literal 0xaf123456; the only modifier used is
// clamp, on the final case.
228 v_dot8_u32_u4 v5, v1, v2, s3
229 // GFX12: [0x05,0x40,0x19,0xcc,0x01,0x05,0x0e,0x18]
231 v_dot8_u32_u4 v5, v255, s2, s105
232 // GFX12: [0x05,0x40,0x19,0xcc,0xff,0x05,0xa4,0x19]
234 v_dot8_u32_u4 v5, s1, v255, exec_hi
235 // GFX12: [0x05,0x40,0x19,0xcc,0x01,0xfe,0xff,0x19]
237 v_dot8_u32_u4 v5, s105, s105, exec_lo
238 // GFX12: [0x05,0x40,0x19,0xcc,0x69,0xd2,0xf8,0x19]
240 v_dot8_u32_u4 v5, vcc_lo, ttmp15, v3
241 // GFX12: [0x05,0x40,0x19,0xcc,0x6a,0xf6,0x0c,0x1c]
243 v_dot8_u32_u4 v5, vcc_hi, 0xaf123456, v255
244 // GFX12: [0x05,0x40,0x19,0xcc,0x6b,0xfe,0xfd,0x1f,0x56,0x34,0x12,0xaf]
246 v_dot8_u32_u4 v5, ttmp15, src_scc, ttmp15
247 // GFX12: [0x05,0x40,0x19,0xcc,0x7b,0xfa,0xed,0x19]
249 v_dot8_u32_u4 v5, m0, 0.5, m0
250 // GFX12: [0x05,0x40,0x19,0xcc,0x7d,0xe0,0xf5,0x19]
252 v_dot8_u32_u4 v5, exec_lo, -1, vcc_hi
253 // GFX12: [0x05,0x40,0x19,0xcc,0x7e,0x82,0xad,0x19]
255 v_dot8_u32_u4 v5, exec_hi, null, vcc_lo
256 // GFX12: [0x05,0x40,0x19,0xcc,0x7f,0xf8,0xa8,0x19]
258 v_dot8_u32_u4 v5, null, exec_lo, 0xaf123456
259 // GFX12: [0x05,0x40,0x19,0xcc,0x7c,0xfc,0xfc,0x1b,0x56,0x34,0x12,0xaf]
261 v_dot8_u32_u4 v5, -1, exec_hi, src_scc
262 // GFX12: [0x05,0x40,0x19,0xcc,0xc1,0xfe,0xf4,0x1b]
264 v_dot8_u32_u4 v5, 0.5, m0, 0.5
265 // GFX12: [0x05,0x40,0x19,0xcc,0xf0,0xfa,0xc0,0x1b]
267 v_dot8_u32_u4 v5, src_scc, vcc_lo, -1
268 // GFX12: [0x05,0x40,0x19,0xcc,0xfd,0xd4,0x04,0x1b]
270 v_dot8_u32_u4 v255, 0xaf123456, vcc_hi, null clamp
271 // GFX12: [0xff,0xc0,0x19,0xcc,0xff,0xd6,0xf0,0x19,0x56,0x34,0x12,0xaf]
// v_fma_mix_f32: expected encodings carry 0x20,0xcc as their third and
// fourth bytes. The first cases are a plain operand sweep (second expected
// byte 0x00); the remainder exercise per-source |x| and -x modifiers,
// op_sel/op_sel_hi and clamp. No literal operands appear in this group.
273 v_fma_mix_f32 v5, v1, v2, s3
274 // GFX12: [0x05,0x00,0x20,0xcc,0x01,0x05,0x0e,0x00]
276 v_fma_mix_f32 v5, v255, v255, s105
277 // GFX12: [0x05,0x00,0x20,0xcc,0xff,0xff,0xa7,0x01]
279 v_fma_mix_f32 v5, s1, s2, v3
280 // GFX12: [0x05,0x00,0x20,0xcc,0x01,0x04,0x0c,0x04]
282 v_fma_mix_f32 v5, s105, s105, m0
283 // GFX12: [0x05,0x00,0x20,0xcc,0x69,0xd2,0xf4,0x01]
285 v_fma_mix_f32 v5, vcc_lo, ttmp15, ttmp15
286 // GFX12: [0x05,0x00,0x20,0xcc,0x6a,0xf6,0xec,0x01]
288 v_fma_mix_f32 v5, vcc_hi, src_scc, v255
289 // GFX12: [0x05,0x00,0x20,0xcc,0x6b,0xfa,0xfd,0x07]
// Source-modifier cases: |x|, -x and -|x| on individual sources.
291 v_fma_mix_f32 v5, |ttmp15|, 0.5, -vcc_hi
292 // GFX12: [0x05,0x01,0x20,0xcc,0x7b,0xe0,0xad,0x81]
294 v_fma_mix_f32 v5, -m0, -1, |vcc_lo|
295 // GFX12: [0x05,0x04,0x20,0xcc,0x7d,0x82,0xa9,0x21]
297 v_fma_mix_f32 v5, -|exec_lo|, null, -|src_scc|
298 // GFX12: [0x05,0x05,0x20,0xcc,0x7e,0xf8,0xf4,0xa3]
// op_sel / op_sel_hi combinations layered on top of the source modifiers;
// the final case adds clamp and the v255 destination.
300 v_fma_mix_f32 v5, -|exec_hi|, -|exec_lo|, -|exec_lo| op_sel:[1,1,1] op_sel_hi:[1,1,1]
301 // GFX12: [0x05,0x7f,0x20,0xcc,0x7f,0xfc,0xf8,0xf9]
303 v_fma_mix_f32 v5, null, exec_hi, 0.5 op_sel:[0,0,0] op_sel_hi:[0,0,1]
304 // GFX12: [0x05,0x40,0x20,0xcc,0x7c,0xfe,0xc0,0x03]
306 v_fma_mix_f32 v5, -1, -|m0|, -1 op_sel:[1,0,0] op_sel_hi:[0,1,0]
307 // GFX12: [0x05,0x0a,0x20,0xcc,0xc1,0xfa,0x04,0x53]
309 v_fma_mix_f32 v5, 0.5, -|vcc_lo|, -|exec_hi| op_sel:[0,1,0] op_sel_hi:[1,0,0]
310 // GFX12: [0x05,0x16,0x20,0xcc,0xf0,0xd4,0xfc,0xc9]
312 v_fma_mix_f32 v255, -|src_scc|, -|vcc_hi|, null op_sel:[0,0,1] op_sel_hi:[0,0,0] clamp
313 // GFX12: [0xff,0xa3,0x20,0xcc,0xfd,0xd6,0xf0,0x61]
// v_fma_mixhi_f16: expected encodings carry 0x22,0xcc as their third and
// fourth bytes. Plain operand sweep first, then |x| / -x source modifiers,
// op_sel/op_sel_hi combinations and a final clamp case. No literal operands
// appear in this group.
315 v_fma_mixhi_f16 v5, v1, v2, s3
316 // GFX12: [0x05,0x00,0x22,0xcc,0x01,0x05,0x0e,0x00]
318 v_fma_mixhi_f16 v5, v255, v255, s105
319 // GFX12: [0x05,0x00,0x22,0xcc,0xff,0xff,0xa7,0x01]
321 v_fma_mixhi_f16 v5, s1, s2, v3
322 // GFX12: [0x05,0x00,0x22,0xcc,0x01,0x04,0x0c,0x04]
324 v_fma_mixhi_f16 v5, s105, s105, m0
325 // GFX12: [0x05,0x00,0x22,0xcc,0x69,0xd2,0xf4,0x01]
327 v_fma_mixhi_f16 v5, vcc_lo, ttmp15, ttmp15
328 // GFX12: [0x05,0x00,0x22,0xcc,0x6a,0xf6,0xec,0x01]
330 v_fma_mixhi_f16 v5, vcc_hi, src_scc, v255
331 // GFX12: [0x05,0x00,0x22,0xcc,0x6b,0xfa,0xfd,0x07]
// Source-modifier cases: |x|, -x and -|x| on individual sources.
333 v_fma_mixhi_f16 v5, |ttmp15|, 0.5, -vcc_hi
334 // GFX12: [0x05,0x01,0x22,0xcc,0x7b,0xe0,0xad,0x81]
336 v_fma_mixhi_f16 v5, -m0, -1, |vcc_lo|
337 // GFX12: [0x05,0x04,0x22,0xcc,0x7d,0x82,0xa9,0x21]
339 v_fma_mixhi_f16 v5, -|exec_lo|, null, -|src_scc|
340 // GFX12: [0x05,0x05,0x22,0xcc,0x7e,0xf8,0xf4,0xa3]
// op_sel / op_sel_hi combinations; the final case adds clamp.
342 v_fma_mixhi_f16 v5, -|exec_hi|, -|exec_lo|, -|exec_lo| op_sel:[1,1,1] op_sel_hi:[1,1,1]
343 // GFX12: [0x05,0x7f,0x22,0xcc,0x7f,0xfc,0xf8,0xf9]
345 v_fma_mixhi_f16 v5, null, exec_hi, 0.5 op_sel:[0,0,0] op_sel_hi:[0,0,1]
346 // GFX12: [0x05,0x40,0x22,0xcc,0x7c,0xfe,0xc0,0x03]
348 v_fma_mixhi_f16 v5, -1, -|m0|, -1 op_sel:[1,0,0] op_sel_hi:[0,1,0]
349 // GFX12: [0x05,0x0a,0x22,0xcc,0xc1,0xfa,0x04,0x53]
351 v_fma_mixhi_f16 v5, 0.5, -|vcc_lo|, -|exec_hi| op_sel:[0,1,0] op_sel_hi:[1,0,0]
352 // GFX12: [0x05,0x16,0x22,0xcc,0xf0,0xd4,0xfc,0xc9]
354 v_fma_mixhi_f16 v255, -|src_scc|, -|vcc_hi|, null op_sel:[0,0,1] op_sel_hi:[0,0,0] clamp
355 // GFX12: [0xff,0xa3,0x22,0xcc,0xfd,0xd6,0xf0,0x61]
// v_fma_mixlo_f16: expected encodings carry 0x21,0xcc as their third and
// fourth bytes. Plain operand sweep first, then |x| / -x source modifiers,
// op_sel/op_sel_hi combinations and a final clamp case. No literal operands
// appear in this group.
357 v_fma_mixlo_f16 v5, v1, v2, s3
358 // GFX12: [0x05,0x00,0x21,0xcc,0x01,0x05,0x0e,0x00]
360 v_fma_mixlo_f16 v5, v255, v255, s105
361 // GFX12: [0x05,0x00,0x21,0xcc,0xff,0xff,0xa7,0x01]
363 v_fma_mixlo_f16 v5, s1, s2, v3
364 // GFX12: [0x05,0x00,0x21,0xcc,0x01,0x04,0x0c,0x04]
366 v_fma_mixlo_f16 v5, s105, s105, m0
367 // GFX12: [0x05,0x00,0x21,0xcc,0x69,0xd2,0xf4,0x01]
369 v_fma_mixlo_f16 v5, vcc_lo, ttmp15, ttmp15
370 // GFX12: [0x05,0x00,0x21,0xcc,0x6a,0xf6,0xec,0x01]
372 v_fma_mixlo_f16 v5, vcc_hi, src_scc, v255
373 // GFX12: [0x05,0x00,0x21,0xcc,0x6b,0xfa,0xfd,0x07]
// Source-modifier cases: |x|, -x and -|x| on individual sources.
375 v_fma_mixlo_f16 v5, |ttmp15|, 0.5, -vcc_hi
376 // GFX12: [0x05,0x01,0x21,0xcc,0x7b,0xe0,0xad,0x81]
378 v_fma_mixlo_f16 v5, -m0, -1, |vcc_lo|
379 // GFX12: [0x05,0x04,0x21,0xcc,0x7d,0x82,0xa9,0x21]
381 v_fma_mixlo_f16 v5, -|exec_lo|, null, -|src_scc|
382 // GFX12: [0x05,0x05,0x21,0xcc,0x7e,0xf8,0xf4,0xa3]
// op_sel / op_sel_hi combinations; the final case adds clamp.
384 v_fma_mixlo_f16 v5, -|exec_hi|, -|exec_lo|, -|exec_lo| op_sel:[1,1,1] op_sel_hi:[1,1,1]
385 // GFX12: [0x05,0x7f,0x21,0xcc,0x7f,0xfc,0xf8,0xf9]
387 v_fma_mixlo_f16 v5, null, exec_hi, 0.5 op_sel:[0,0,0] op_sel_hi:[0,0,1]
388 // GFX12: [0x05,0x40,0x21,0xcc,0x7c,0xfe,0xc0,0x03]
390 v_fma_mixlo_f16 v5, -1, -|m0|, -1 op_sel:[1,0,0] op_sel_hi:[0,1,0]
391 // GFX12: [0x05,0x0a,0x21,0xcc,0xc1,0xfa,0x04,0x53]
393 v_fma_mixlo_f16 v5, 0.5, -|vcc_lo|, -|exec_hi| op_sel:[0,1,0] op_sel_hi:[1,0,0]
394 // GFX12: [0x05,0x16,0x21,0xcc,0xf0,0xd4,0xfc,0xc9]
396 v_fma_mixlo_f16 v255, -|src_scc|, -|vcc_hi|, null op_sel:[0,0,1] op_sel_hi:[0,0,0] clamp
397 // GFX12: [0xff,0xa3,0x21,0xcc,0xfd,0xd6,0xf0,0x61]
// v_pk_add_f16 (two sources): expected encodings carry 0x0f,0xcc as their
// third and fourth bytes. Operand sweep over VGPRs, SGPRs, special registers,
// inline constants and the literal 0xfe0b (12-byte encoding), followed by
// op_sel/op_sel_hi, neg_lo/neg_hi and clamp combinations.
399 v_pk_add_f16 v5, v1, v2
400 // GFX12: [0x05,0x40,0x0f,0xcc,0x01,0x05,0x02,0x18]
402 v_pk_add_f16 v5, v255, v255
403 // GFX12: [0x05,0x40,0x0f,0xcc,0xff,0xff,0x03,0x18]
405 v_pk_add_f16 v5, s1, s2
406 // GFX12: [0x05,0x40,0x0f,0xcc,0x01,0x04,0x00,0x18]
408 v_pk_add_f16 v5, s105, s105
409 // GFX12: [0x05,0x40,0x0f,0xcc,0x69,0xd2,0x00,0x18]
411 v_pk_add_f16 v5, vcc_lo, ttmp15
412 // GFX12: [0x05,0x40,0x0f,0xcc,0x6a,0xf6,0x00,0x18]
414 v_pk_add_f16 v5, vcc_hi, 0xfe0b
415 // GFX12: [0x05,0x40,0x0f,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00]
417 v_pk_add_f16 v5, ttmp15, src_scc
418 // GFX12: [0x05,0x40,0x0f,0xcc,0x7b,0xfa,0x01,0x18]
420 v_pk_add_f16 v5, m0, 0.5
421 // GFX12: [0x05,0x40,0x0f,0xcc,0x7d,0xe0,0x01,0x18]
423 v_pk_add_f16 v5, exec_lo, -1
424 // GFX12: [0x05,0x40,0x0f,0xcc,0x7e,0x82,0x01,0x18]
426 v_pk_add_f16 v5, exec_hi, null
427 // GFX12: [0x05,0x40,0x0f,0xcc,0x7f,0xf8,0x00,0x18]
429 v_pk_add_f16 v5, null, exec_lo
430 // GFX12: [0x05,0x40,0x0f,0xcc,0x7c,0xfc,0x00,0x18]
// Modifier cases: each of the four op_sel / op_sel_hi pairings, combined with
// neg_lo/neg_hi on the first source, the second source, neither, and both;
// the last case also sets clamp.
432 v_pk_add_f16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] neg_lo:[1,0] neg_hi:[1,0]
433 // GFX12: [0x05,0x59,0x0f,0xcc,0xc1,0xfe,0x00,0x20]
435 v_pk_add_f16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] neg_lo:[0,1] neg_hi:[0,1]
436 // GFX12: [0x05,0x42,0x0f,0xcc,0xf0,0xfa,0x00,0x58]
438 v_pk_add_f16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] neg_lo:[0,0] neg_hi:[0,0]
439 // GFX12: [0x05,0x48,0x0f,0xcc,0xfd,0xd4,0x00,0x10]
441 v_pk_add_f16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] neg_lo:[1,1] neg_hi:[1,1] clamp
442 // GFX12: [0xff,0xd3,0x0f,0xcc,0xff,0xd6,0x00,0x68,0x0b,0xfe,0x00,0x00]
// v_pk_add_i16 (two sources): expected encodings carry 0x02,0xcc as their
// third and fourth bytes. Operand sweep over VGPRs, SGPRs, special registers,
// inline constants and the literal 0xfe0b, followed by op_sel/op_sel_hi
// combinations; the last case also sets clamp.
444 v_pk_add_i16 v5, v1, v2
445 // GFX12: [0x05,0x40,0x02,0xcc,0x01,0x05,0x02,0x18]
447 v_pk_add_i16 v5, v255, v255
448 // GFX12: [0x05,0x40,0x02,0xcc,0xff,0xff,0x03,0x18]
450 v_pk_add_i16 v5, s1, s2
451 // GFX12: [0x05,0x40,0x02,0xcc,0x01,0x04,0x00,0x18]
453 v_pk_add_i16 v5, s105, s105
454 // GFX12: [0x05,0x40,0x02,0xcc,0x69,0xd2,0x00,0x18]
456 v_pk_add_i16 v5, vcc_lo, ttmp15
457 // GFX12: [0x05,0x40,0x02,0xcc,0x6a,0xf6,0x00,0x18]
459 v_pk_add_i16 v5, vcc_hi, 0xfe0b
460 // GFX12: [0x05,0x40,0x02,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00]
462 v_pk_add_i16 v5, ttmp15, src_scc
463 // GFX12: [0x05,0x40,0x02,0xcc,0x7b,0xfa,0x01,0x18]
465 v_pk_add_i16 v5, m0, 0.5
466 // GFX12: [0x05,0x40,0x02,0xcc,0x7d,0xe0,0x01,0x18]
468 v_pk_add_i16 v5, exec_lo, -1
469 // GFX12: [0x05,0x40,0x02,0xcc,0x7e,0x82,0x01,0x18]
471 v_pk_add_i16 v5, exec_hi, null
472 // GFX12: [0x05,0x40,0x02,0xcc,0x7f,0xf8,0x00,0x18]
474 v_pk_add_i16 v5, null, exec_lo
475 // GFX12: [0x05,0x40,0x02,0xcc,0x7c,0xfc,0x00,0x18]
// op_sel / op_sel_hi cases. Explicit op_sel:[0,0] op_sel_hi:[1,1] is expected
// to give the same modifier bytes (0x40 ... 0x18) as the unmodified forms.
477 v_pk_add_i16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0]
478 // GFX12: [0x05,0x58,0x02,0xcc,0xc1,0xfe,0x00,0x00]
480 v_pk_add_i16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1]
481 // GFX12: [0x05,0x40,0x02,0xcc,0xf0,0xfa,0x00,0x18]
483 v_pk_add_i16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1]
484 // GFX12: [0x05,0x48,0x02,0xcc,0xfd,0xd4,0x00,0x10]
486 v_pk_add_i16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] clamp
487 // GFX12: [0xff,0xd0,0x02,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00]
// v_pk_add_u16 (two sources): expected encodings carry 0x0a,0xcc as their
// third and fourth bytes. Operand sweep over VGPRs, SGPRs, special registers,
// inline constants and the literal 0xfe0b, followed by op_sel/op_sel_hi
// combinations; the last case also sets clamp.
489 v_pk_add_u16 v5, v1, v2
490 // GFX12: [0x05,0x40,0x0a,0xcc,0x01,0x05,0x02,0x18]
492 v_pk_add_u16 v5, v255, v255
493 // GFX12: [0x05,0x40,0x0a,0xcc,0xff,0xff,0x03,0x18]
495 v_pk_add_u16 v5, s1, s2
496 // GFX12: [0x05,0x40,0x0a,0xcc,0x01,0x04,0x00,0x18]
498 v_pk_add_u16 v5, s105, s105
499 // GFX12: [0x05,0x40,0x0a,0xcc,0x69,0xd2,0x00,0x18]
501 v_pk_add_u16 v5, vcc_lo, ttmp15
502 // GFX12: [0x05,0x40,0x0a,0xcc,0x6a,0xf6,0x00,0x18]
504 v_pk_add_u16 v5, vcc_hi, 0xfe0b
505 // GFX12: [0x05,0x40,0x0a,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00]
507 v_pk_add_u16 v5, ttmp15, src_scc
508 // GFX12: [0x05,0x40,0x0a,0xcc,0x7b,0xfa,0x01,0x18]
510 v_pk_add_u16 v5, m0, 0.5
511 // GFX12: [0x05,0x40,0x0a,0xcc,0x7d,0xe0,0x01,0x18]
513 v_pk_add_u16 v5, exec_lo, -1
514 // GFX12: [0x05,0x40,0x0a,0xcc,0x7e,0x82,0x01,0x18]
516 v_pk_add_u16 v5, exec_hi, null
517 // GFX12: [0x05,0x40,0x0a,0xcc,0x7f,0xf8,0x00,0x18]
519 v_pk_add_u16 v5, null, exec_lo
520 // GFX12: [0x05,0x40,0x0a,0xcc,0x7c,0xfc,0x00,0x18]
// op_sel / op_sel_hi cases; the final one adds clamp and the v255 destination.
522 v_pk_add_u16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0]
523 // GFX12: [0x05,0x58,0x0a,0xcc,0xc1,0xfe,0x00,0x00]
525 v_pk_add_u16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1]
526 // GFX12: [0x05,0x40,0x0a,0xcc,0xf0,0xfa,0x00,0x18]
528 v_pk_add_u16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1]
529 // GFX12: [0x05,0x48,0x0a,0xcc,0xfd,0xd4,0x00,0x10]
531 v_pk_add_u16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] clamp
532 // GFX12: [0xff,0xd0,0x0a,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00]
// v_pk_ashrrev_i16 (two sources): expected encodings carry 0x06,0xcc as their
// third and fourth bytes. Operand sweep over VGPRs, SGPRs, special registers,
// inline constants and the literal 0xfe0b, followed by op_sel/op_sel_hi
// combinations. No case in this group uses clamp or neg modifiers.
534 v_pk_ashrrev_i16 v5, v1, v2
535 // GFX12: [0x05,0x40,0x06,0xcc,0x01,0x05,0x02,0x18]
537 v_pk_ashrrev_i16 v5, v255, v255
538 // GFX12: [0x05,0x40,0x06,0xcc,0xff,0xff,0x03,0x18]
540 v_pk_ashrrev_i16 v5, s1, s2
541 // GFX12: [0x05,0x40,0x06,0xcc,0x01,0x04,0x00,0x18]
543 v_pk_ashrrev_i16 v5, s105, s105
544 // GFX12: [0x05,0x40,0x06,0xcc,0x69,0xd2,0x00,0x18]
546 v_pk_ashrrev_i16 v5, vcc_lo, ttmp15
547 // GFX12: [0x05,0x40,0x06,0xcc,0x6a,0xf6,0x00,0x18]
549 v_pk_ashrrev_i16 v5, vcc_hi, 0xfe0b
550 // GFX12: [0x05,0x40,0x06,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00]
552 v_pk_ashrrev_i16 v5, ttmp15, src_scc
553 // GFX12: [0x05,0x40,0x06,0xcc,0x7b,0xfa,0x01,0x18]
555 v_pk_ashrrev_i16 v5, m0, 0.5
556 // GFX12: [0x05,0x40,0x06,0xcc,0x7d,0xe0,0x01,0x18]
558 v_pk_ashrrev_i16 v5, exec_lo, -1
559 // GFX12: [0x05,0x40,0x06,0xcc,0x7e,0x82,0x01,0x18]
561 v_pk_ashrrev_i16 v5, exec_hi, null
562 // GFX12: [0x05,0x40,0x06,0xcc,0x7f,0xf8,0x00,0x18]
564 v_pk_ashrrev_i16 v5, null, exec_lo
565 // GFX12: [0x05,0x40,0x06,0xcc,0x7c,0xfc,0x00,0x18]
// op_sel / op_sel_hi cases covering all four per-source pairings.
567 v_pk_ashrrev_i16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0]
568 // GFX12: [0x05,0x58,0x06,0xcc,0xc1,0xfe,0x00,0x00]
570 v_pk_ashrrev_i16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1]
571 // GFX12: [0x05,0x40,0x06,0xcc,0xf0,0xfa,0x00,0x18]
573 v_pk_ashrrev_i16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1]
574 // GFX12: [0x05,0x48,0x06,0xcc,0xfd,0xd4,0x00,0x10]
576 v_pk_ashrrev_i16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0]
577 // GFX12: [0xff,0x50,0x06,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00]
// v_pk_fma_f16 (three sources): expected encodings carry 0x0e,0xcc as their
// third and fourth bytes. Operand sweep over VGPRs, SGPRs, special registers,
// inline constants and the literal 0xfe0b, followed by op_sel_hi on its own
// and then op_sel/op_sel_hi with neg_lo/neg_hi and clamp.
579 v_pk_fma_f16 v5, v1, v2, s3
580 // GFX12: [0x05,0x40,0x0e,0xcc,0x01,0x05,0x0e,0x18]
582 v_pk_fma_f16 v5, v255, s2, s105
583 // GFX12: [0x05,0x40,0x0e,0xcc,0xff,0x05,0xa4,0x19]
585 v_pk_fma_f16 v5, s1, v255, exec_hi
586 // GFX12: [0x05,0x40,0x0e,0xcc,0x01,0xfe,0xff,0x19]
588 v_pk_fma_f16 v5, s105, s105, exec_lo
589 // GFX12: [0x05,0x40,0x0e,0xcc,0x69,0xd2,0xf8,0x19]
591 v_pk_fma_f16 v5, vcc_lo, ttmp15, v3
592 // GFX12: [0x05,0x40,0x0e,0xcc,0x6a,0xf6,0x0c,0x1c]
594 v_pk_fma_f16 v5, vcc_hi, 0xfe0b, v255
595 // GFX12: [0x05,0x40,0x0e,0xcc,0x6b,0xfe,0xfd,0x1f,0x0b,0xfe,0x00,0x00]
597 v_pk_fma_f16 v5, ttmp15, src_scc, ttmp15
598 // GFX12: [0x05,0x40,0x0e,0xcc,0x7b,0xfa,0xed,0x19]
// op_sel_hi given on its own: all clear, third source only, second source only.
600 v_pk_fma_f16 v5, m0, 0.5, m0 op_sel_hi:[0,0,0]
601 // GFX12: [0x05,0x00,0x0e,0xcc,0x7d,0xe0,0xf5,0x01]
603 v_pk_fma_f16 v5, exec_lo, -1, vcc_hi op_sel_hi:[0,0,1]
604 // GFX12: [0x05,0x40,0x0e,0xcc,0x7e,0x82,0xad,0x01]
606 v_pk_fma_f16 v5, exec_hi, null, vcc_lo op_sel_hi:[0,1,0]
607 // GFX12: [0x05,0x00,0x0e,0xcc,0x7f,0xf8,0xa8,0x11]
// Full modifier combinations: op_sel + op_sel_hi + neg_lo/neg_hi, with clamp
// on the final case.
609 v_pk_fma_f16 v5, null, exec_lo, 0xfe0b op_sel:[1,1,1] op_sel_hi:[1,0,0] neg_lo:[1,0,0] neg_hi:[1,0,0]
610 // GFX12: [0x05,0x39,0x0e,0xcc,0x7c,0xfc,0xfc,0x2b,0x0b,0xfe,0x00,0x00]
612 v_pk_fma_f16 v5, -1, exec_hi, src_scc op_sel:[0,0,0] op_sel_hi:[1,1,1] neg_lo:[0,1,0] neg_hi:[0,1,0]
613 // GFX12: [0x05,0x42,0x0e,0xcc,0xc1,0xfe,0xf4,0x5b]
615 v_pk_fma_f16 v5, 0.5, m0, 0.5 op_sel:[1,0,0] op_sel_hi:[0,1,1] neg_lo:[0,0,1] neg_hi:[0,0,1]
616 // GFX12: [0x05,0x4c,0x0e,0xcc,0xf0,0xfa,0xc0,0x93]
618 v_pk_fma_f16 v5, src_scc, vcc_lo, -1 op_sel:[0,1,0] op_sel_hi:[1,0,1] neg_lo:[0,0,0] neg_hi:[0,0,0]
619 // GFX12: [0x05,0x50,0x0e,0xcc,0xfd,0xd4,0x04,0x0b]
621 v_pk_fma_f16 v255, 0xfe0b, vcc_hi, null op_sel:[0,0,1] op_sel_hi:[1,1,0] neg_lo:[1,1,1] neg_hi:[1,1,1] clamp
622 // GFX12: [0xff,0xa7,0x0e,0xcc,0xff,0xd6,0xf0,0xf9,0x0b,0xfe,0x00,0x00]
// v_pk_lshlrev_b16 (two sources): expected encodings carry 0x04,0xcc as their
// third and fourth bytes. Operand sweep over VGPRs, SGPRs, special registers,
// inline constants and literals, followed by op_sel/op_sel_hi combinations.
// No case in this group uses clamp or neg modifiers.
624 v_pk_lshlrev_b16 v5, v1, v2
625 // GFX12: [0x05,0x40,0x04,0xcc,0x01,0x05,0x02,0x18]
627 v_pk_lshlrev_b16 v5, v255, v255
628 // GFX12: [0x05,0x40,0x04,0xcc,0xff,0xff,0x03,0x18]
630 v_pk_lshlrev_b16 v5, s1, s2
631 // GFX12: [0x05,0x40,0x04,0xcc,0x01,0x04,0x00,0x18]
633 v_pk_lshlrev_b16 v5, s105, s105
634 // GFX12: [0x05,0x40,0x04,0xcc,0x69,0xd2,0x00,0x18]
636 v_pk_lshlrev_b16 v5, vcc_lo, ttmp15
637 // GFX12: [0x05,0x40,0x04,0xcc,0x6a,0xf6,0x00,0x18]
639 v_pk_lshlrev_b16 v5, vcc_hi, 0xfe0b
640 // GFX12: [0x05,0x40,0x04,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00]
642 v_pk_lshlrev_b16 v5, ttmp15, src_scc
643 // GFX12: [0x05,0x40,0x04,0xcc,0x7b,0xfa,0x01,0x18]
645 v_pk_lshlrev_b16 v5, m0, 0.5
646 // GFX12: [0x05,0x40,0x04,0xcc,0x7d,0xe0,0x01,0x18]
648 v_pk_lshlrev_b16 v5, exec_lo, -1
649 // GFX12: [0x05,0x40,0x04,0xcc,0x7e,0x82,0x01,0x18]
651 v_pk_lshlrev_b16 v5, exec_hi, null
652 // GFX12: [0x05,0x40,0x04,0xcc,0x7f,0xf8,0x00,0x18]
654 v_pk_lshlrev_b16 v5, null, exec_lo
655 // GFX12: [0x05,0x40,0x04,0xcc,0x7c,0xfc,0x00,0x18]
// op_sel / op_sel_hi cases.
657 v_pk_lshlrev_b16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0]
658 // GFX12: [0x05,0x58,0x04,0xcc,0xc1,0xfe,0x00,0x00]
660 v_pk_lshlrev_b16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1]
661 // GFX12: [0x05,0x40,0x04,0xcc,0xf0,0xfa,0x00,0x18]
// 0x3800 is the IEEE half-precision bit pattern of 0.5. The expected encoding
// keeps it as a literal (source byte 0xff plus four trailing bytes) rather
// than the 0xf0 inline-constant byte used by the 0.5 case just above.
663 v_pk_lshlrev_b16 v5, 0x3800, m0 op_sel:[0,0] op_sel_hi:[1,1]
664 // GFX12: [0x05,0x40,0x04,0xcc,0xff,0xfa,0x00,0x18,0x00,0x38,0x00,0x00]
666 v_pk_lshlrev_b16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1]
667 // GFX12: [0x05,0x48,0x04,0xcc,0xfd,0xd4,0x00,0x10]
669 v_pk_lshlrev_b16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0]
670 // GFX12: [0xff,0x50,0x04,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00]
// v_pk_lshrrev_b16 (two sources): expected encodings carry 0x05,0xcc as their
// third and fourth bytes. Operand sweep over VGPRs, SGPRs, special registers,
// inline constants and the literal 0xfe0b, followed by op_sel/op_sel_hi
// combinations. No case in this group uses clamp or neg modifiers.
672 v_pk_lshrrev_b16 v5, v1, v2
673 // GFX12: [0x05,0x40,0x05,0xcc,0x01,0x05,0x02,0x18]
675 v_pk_lshrrev_b16 v5, v255, v255
676 // GFX12: [0x05,0x40,0x05,0xcc,0xff,0xff,0x03,0x18]
678 v_pk_lshrrev_b16 v5, s1, s2
679 // GFX12: [0x05,0x40,0x05,0xcc,0x01,0x04,0x00,0x18]
681 v_pk_lshrrev_b16 v5, s105, s105
682 // GFX12: [0x05,0x40,0x05,0xcc,0x69,0xd2,0x00,0x18]
684 v_pk_lshrrev_b16 v5, vcc_lo, ttmp15
685 // GFX12: [0x05,0x40,0x05,0xcc,0x6a,0xf6,0x00,0x18]
687 v_pk_lshrrev_b16 v5, vcc_hi, 0xfe0b
688 // GFX12: [0x05,0x40,0x05,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00]
690 v_pk_lshrrev_b16 v5, ttmp15, src_scc
691 // GFX12: [0x05,0x40,0x05,0xcc,0x7b,0xfa,0x01,0x18]
693 v_pk_lshrrev_b16 v5, m0, 0.5
694 // GFX12: [0x05,0x40,0x05,0xcc,0x7d,0xe0,0x01,0x18]
696 v_pk_lshrrev_b16 v5, exec_lo, -1
697 // GFX12: [0x05,0x40,0x05,0xcc,0x7e,0x82,0x01,0x18]
699 v_pk_lshrrev_b16 v5, exec_hi, null
700 // GFX12: [0x05,0x40,0x05,0xcc,0x7f,0xf8,0x00,0x18]
702 v_pk_lshrrev_b16 v5, null, exec_lo
703 // GFX12: [0x05,0x40,0x05,0xcc,0x7c,0xfc,0x00,0x18]
// op_sel / op_sel_hi cases covering all four per-source pairings.
705 v_pk_lshrrev_b16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0]
706 // GFX12: [0x05,0x58,0x05,0xcc,0xc1,0xfe,0x00,0x00]
708 v_pk_lshrrev_b16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1]
709 // GFX12: [0x05,0x40,0x05,0xcc,0xf0,0xfa,0x00,0x18]
711 v_pk_lshrrev_b16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1]
712 // GFX12: [0x05,0x48,0x05,0xcc,0xfd,0xd4,0x00,0x10]
714 v_pk_lshrrev_b16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0]
715 // GFX12: [0xff,0x50,0x05,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00]
// v_pk_mad_i16 (three sources): expected encodings carry 0x00,0xcc as their
// third and fourth bytes. Operand sweep over VGPRs, SGPRs, special registers,
// inline constants and the literal 0xfe0b, followed by op_sel_hi on its own,
// op_sel/op_sel_hi combinations, and a final clamp case.
717 v_pk_mad_i16 v5, v1, v2, s3
718 // GFX12: [0x05,0x40,0x00,0xcc,0x01,0x05,0x0e,0x18]
720 v_pk_mad_i16 v5, v255, s2, s105
721 // GFX12: [0x05,0x40,0x00,0xcc,0xff,0x05,0xa4,0x19]
723 v_pk_mad_i16 v5, s1, v255, exec_hi
724 // GFX12: [0x05,0x40,0x00,0xcc,0x01,0xfe,0xff,0x19]
726 v_pk_mad_i16 v5, s105, s105, exec_lo
727 // GFX12: [0x05,0x40,0x00,0xcc,0x69,0xd2,0xf8,0x19]
729 v_pk_mad_i16 v5, vcc_lo, ttmp15, v3
730 // GFX12: [0x05,0x40,0x00,0xcc,0x6a,0xf6,0x0c,0x1c]
732 v_pk_mad_i16 v5, vcc_hi, 0xfe0b, v255
733 // GFX12: [0x05,0x40,0x00,0xcc,0x6b,0xfe,0xfd,0x1f,0x0b,0xfe,0x00,0x00]
735 v_pk_mad_i16 v5, ttmp15, src_scc, ttmp15
736 // GFX12: [0x05,0x40,0x00,0xcc,0x7b,0xfa,0xed,0x19]
// op_sel_hi given on its own: all clear, third source only, second source only.
738 v_pk_mad_i16 v5, m0, 0.5, m0 op_sel_hi:[0,0,0]
739 // GFX12: [0x05,0x00,0x00,0xcc,0x7d,0xe0,0xf5,0x01]
741 v_pk_mad_i16 v5, exec_lo, -1, vcc_hi op_sel_hi:[0,0,1]
742 // GFX12: [0x05,0x40,0x00,0xcc,0x7e,0x82,0xad,0x01]
744 v_pk_mad_i16 v5, exec_hi, null, vcc_lo op_sel_hi:[0,1,0]
745 // GFX12: [0x05,0x00,0x00,0xcc,0x7f,0xf8,0xa8,0x11]
// op_sel combined with op_sel_hi; the final case adds clamp.
747 v_pk_mad_i16 v5, null, exec_lo, 0xfe0b op_sel:[1,1,1] op_sel_hi:[1,0,0]
748 // GFX12: [0x05,0x38,0x00,0xcc,0x7c,0xfc,0xfc,0x0b,0x0b,0xfe,0x00,0x00]
750 v_pk_mad_i16 v5, -1, exec_hi, src_scc op_sel:[0,0,0] op_sel_hi:[1,1,1]
751 // GFX12: [0x05,0x40,0x00,0xcc,0xc1,0xfe,0xf4,0x1b]
753 v_pk_mad_i16 v5, 0.5, m0, 0.5 op_sel:[1,0,0] op_sel_hi:[0,1,1]
754 // GFX12: [0x05,0x48,0x00,0xcc,0xf0,0xfa,0xc0,0x13]
756 v_pk_mad_i16 v5, src_scc, vcc_lo, -1 op_sel:[0,1,0] op_sel_hi:[1,0,1]
757 // GFX12: [0x05,0x50,0x00,0xcc,0xfd,0xd4,0x04,0x0b]
759 v_pk_mad_i16 v255, 0xfe0b, vcc_hi, null op_sel:[0,0,1] op_sel_hi:[1,1,0] clamp
760 // GFX12: [0xff,0xa0,0x00,0xcc,0xff,0xd6,0xf0,0x19,0x0b,0xfe,0x00,0x00]
// v_pk_mad_u16 (three sources): expected encodings carry 0x09,0xcc as their
// third and fourth bytes. Operand sweep over VGPRs, SGPRs, special registers,
// inline constants and the literal 0xfe0b, followed by op_sel_hi on its own,
// op_sel/op_sel_hi combinations, and a final clamp case.
762 v_pk_mad_u16 v5, v1, v2, s3
763 // GFX12: [0x05,0x40,0x09,0xcc,0x01,0x05,0x0e,0x18]
765 v_pk_mad_u16 v5, v255, s2, s105
766 // GFX12: [0x05,0x40,0x09,0xcc,0xff,0x05,0xa4,0x19]
768 v_pk_mad_u16 v5, s1, v255, exec_hi
769 // GFX12: [0x05,0x40,0x09,0xcc,0x01,0xfe,0xff,0x19]
771 v_pk_mad_u16 v5, s105, s105, exec_lo
772 // GFX12: [0x05,0x40,0x09,0xcc,0x69,0xd2,0xf8,0x19]
774 v_pk_mad_u16 v5, vcc_lo, ttmp15, v3
775 // GFX12: [0x05,0x40,0x09,0xcc,0x6a,0xf6,0x0c,0x1c]
777 v_pk_mad_u16 v5, vcc_hi, 0xfe0b, v255
778 // GFX12: [0x05,0x40,0x09,0xcc,0x6b,0xfe,0xfd,0x1f,0x0b,0xfe,0x00,0x00]
780 v_pk_mad_u16 v5, ttmp15, src_scc, ttmp15
781 // GFX12: [0x05,0x40,0x09,0xcc,0x7b,0xfa,0xed,0x19]
// op_sel_hi given on its own: all clear, third source only, second source only.
783 v_pk_mad_u16 v5, m0, 0.5, m0 op_sel_hi:[0,0,0]
784 // GFX12: [0x05,0x00,0x09,0xcc,0x7d,0xe0,0xf5,0x01]
786 v_pk_mad_u16 v5, exec_lo, -1, vcc_hi op_sel_hi:[0,0,1]
787 // GFX12: [0x05,0x40,0x09,0xcc,0x7e,0x82,0xad,0x01]
789 v_pk_mad_u16 v5, exec_hi, null, vcc_lo op_sel_hi:[0,1,0]
790 // GFX12: [0x05,0x00,0x09,0xcc,0x7f,0xf8,0xa8,0x11]
// op_sel combined with op_sel_hi; the final case adds clamp.
792 v_pk_mad_u16 v5, null, exec_lo, 0xfe0b op_sel:[1,1,1] op_sel_hi:[1,0,0]
793 // GFX12: [0x05,0x38,0x09,0xcc,0x7c,0xfc,0xfc,0x0b,0x0b,0xfe,0x00,0x00]
795 v_pk_mad_u16 v5, -1, exec_hi, src_scc op_sel:[0,0,0] op_sel_hi:[1,1,1]
796 // GFX12: [0x05,0x40,0x09,0xcc,0xc1,0xfe,0xf4,0x1b]
798 v_pk_mad_u16 v5, 0.5, m0, 0.5 op_sel:[1,0,0] op_sel_hi:[0,1,1]
799 // GFX12: [0x05,0x48,0x09,0xcc,0xf0,0xfa,0xc0,0x13]
801 v_pk_mad_u16 v5, src_scc, vcc_lo, -1 op_sel:[0,1,0] op_sel_hi:[1,0,1]
802 // GFX12: [0x05,0x50,0x09,0xcc,0xfd,0xd4,0x04,0x0b]
804 v_pk_mad_u16 v255, 0xfe0b, vcc_hi, null op_sel:[0,0,1] op_sel_hi:[1,1,0] clamp
805 // GFX12: [0xff,0xa0,0x09,0xcc,0xff,0xd6,0xf0,0x19,0x0b,0xfe,0x00,0x00]
// v_pk_max_num_f16 (two sources): expected encodings carry 0x1c,0xcc as their
// third and fourth bytes. Operand sweep over VGPRs, SGPRs, special registers,
// inline constants and the literal 0xfe0b (12-byte encoding), followed by
// op_sel/op_sel_hi, neg_lo/neg_hi and clamp combinations.
807 v_pk_max_num_f16 v5, v1, v2
808 // GFX12: [0x05,0x40,0x1c,0xcc,0x01,0x05,0x02,0x18]
810 v_pk_max_num_f16 v5, v255, v255
811 // GFX12: [0x05,0x40,0x1c,0xcc,0xff,0xff,0x03,0x18]
813 v_pk_max_num_f16 v5, s1, s2
814 // GFX12: [0x05,0x40,0x1c,0xcc,0x01,0x04,0x00,0x18]
816 v_pk_max_num_f16 v5, s105, s105
817 // GFX12: [0x05,0x40,0x1c,0xcc,0x69,0xd2,0x00,0x18]
819 v_pk_max_num_f16 v5, vcc_lo, ttmp15
820 // GFX12: [0x05,0x40,0x1c,0xcc,0x6a,0xf6,0x00,0x18]
822 v_pk_max_num_f16 v5, vcc_hi, 0xfe0b
823 // GFX12: [0x05,0x40,0x1c,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00]
825 v_pk_max_num_f16 v5, ttmp15, src_scc
826 // GFX12: [0x05,0x40,0x1c,0xcc,0x7b,0xfa,0x01,0x18]
828 v_pk_max_num_f16 v5, m0, 0.5
829 // GFX12: [0x05,0x40,0x1c,0xcc,0x7d,0xe0,0x01,0x18]
831 v_pk_max_num_f16 v5, exec_lo, -1
832 // GFX12: [0x05,0x40,0x1c,0xcc,0x7e,0x82,0x01,0x18]
834 v_pk_max_num_f16 v5, exec_hi, null
835 // GFX12: [0x05,0x40,0x1c,0xcc,0x7f,0xf8,0x00,0x18]
837 v_pk_max_num_f16 v5, null, exec_lo
838 // GFX12: [0x05,0x40,0x1c,0xcc,0x7c,0xfc,0x00,0x18]
// Modifier cases: op_sel / op_sel_hi pairings combined with neg_lo/neg_hi on
// the first source, the second source, neither, and both; the last case also
// sets clamp.
840 v_pk_max_num_f16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] neg_lo:[1,0] neg_hi:[1,0]
841 // GFX12: [0x05,0x59,0x1c,0xcc,0xc1,0xfe,0x00,0x20]
843 v_pk_max_num_f16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] neg_lo:[0,1] neg_hi:[0,1]
844 // GFX12: [0x05,0x42,0x1c,0xcc,0xf0,0xfa,0x00,0x58]
846 v_pk_max_num_f16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] neg_lo:[0,0] neg_hi:[0,0]
847 // GFX12: [0x05,0x48,0x1c,0xcc,0xfd,0xd4,0x00,0x10]
849 v_pk_max_num_f16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] neg_lo:[1,1] neg_hi:[1,1] clamp
850 // GFX12: [0xff,0xd3,0x1c,0xcc,0xff,0xd6,0x00,0x68,0x0b,0xfe,0x00,0x00]
// v_pk_max_i16 (two sources): expected encodings carry 0x07,0xcc as their
// third and fourth bytes. Operand sweep over VGPRs, SGPRs, special registers,
// inline constants and the literal 0xfe0b, followed by op_sel/op_sel_hi
// combinations. No case in this group uses clamp or neg modifiers.
852 v_pk_max_i16 v5, v1, v2
853 // GFX12: [0x05,0x40,0x07,0xcc,0x01,0x05,0x02,0x18]
855 v_pk_max_i16 v5, v255, v255
856 // GFX12: [0x05,0x40,0x07,0xcc,0xff,0xff,0x03,0x18]
858 v_pk_max_i16 v5, s1, s2
859 // GFX12: [0x05,0x40,0x07,0xcc,0x01,0x04,0x00,0x18]
861 v_pk_max_i16 v5, s105, s105
862 // GFX12: [0x05,0x40,0x07,0xcc,0x69,0xd2,0x00,0x18]
864 v_pk_max_i16 v5, vcc_lo, ttmp15
865 // GFX12: [0x05,0x40,0x07,0xcc,0x6a,0xf6,0x00,0x18]
867 v_pk_max_i16 v5, vcc_hi, 0xfe0b
868 // GFX12: [0x05,0x40,0x07,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00]
870 v_pk_max_i16 v5, ttmp15, src_scc
871 // GFX12: [0x05,0x40,0x07,0xcc,0x7b,0xfa,0x01,0x18]
873 v_pk_max_i16 v5, m0, 0.5
874 // GFX12: [0x05,0x40,0x07,0xcc,0x7d,0xe0,0x01,0x18]
876 v_pk_max_i16 v5, exec_lo, -1
877 // GFX12: [0x05,0x40,0x07,0xcc,0x7e,0x82,0x01,0x18]
879 v_pk_max_i16 v5, exec_hi, null
880 // GFX12: [0x05,0x40,0x07,0xcc,0x7f,0xf8,0x00,0x18]
882 v_pk_max_i16 v5, null, exec_lo
883 // GFX12: [0x05,0x40,0x07,0xcc,0x7c,0xfc,0x00,0x18]
// op_sel / op_sel_hi cases covering all four per-source pairings.
885 v_pk_max_i16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0]
886 // GFX12: [0x05,0x58,0x07,0xcc,0xc1,0xfe,0x00,0x00]
888 v_pk_max_i16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1]
889 // GFX12: [0x05,0x40,0x07,0xcc,0xf0,0xfa,0x00,0x18]
891 v_pk_max_i16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1]
892 // GFX12: [0x05,0x48,0x07,0xcc,0xfd,0xd4,0x00,0x10]
894 v_pk_max_i16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0]
895 // GFX12: [0xff,0x50,0x07,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00]
// v_pk_max_u16: every expected encoding below carries 0x0c in its third byte.
// The first eleven cases vary only the two source operands; the last four add
// op_sel/op_sel_hi modifiers.
// The 0xfe0b literal cases append the bytes 0x0b,0xfe,0x00,0x00.
897 v_pk_max_u16 v5, v1, v2
898 // GFX12: [0x05,0x40,0x0c,0xcc,0x01,0x05,0x02,0x18]
900 v_pk_max_u16 v5, v255, v255
901 // GFX12: [0x05,0x40,0x0c,0xcc,0xff,0xff,0x03,0x18]
903 v_pk_max_u16 v5, s1, s2
904 // GFX12: [0x05,0x40,0x0c,0xcc,0x01,0x04,0x00,0x18]
906 v_pk_max_u16 v5, s105, s105
907 // GFX12: [0x05,0x40,0x0c,0xcc,0x69,0xd2,0x00,0x18]
909 v_pk_max_u16 v5, vcc_lo, ttmp15
910 // GFX12: [0x05,0x40,0x0c,0xcc,0x6a,0xf6,0x00,0x18]
912 v_pk_max_u16 v5, vcc_hi, 0xfe0b
913 // GFX12: [0x05,0x40,0x0c,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00]
915 v_pk_max_u16 v5, ttmp15, src_scc
916 // GFX12: [0x05,0x40,0x0c,0xcc,0x7b,0xfa,0x01,0x18]
918 v_pk_max_u16 v5, m0, 0.5
919 // GFX12: [0x05,0x40,0x0c,0xcc,0x7d,0xe0,0x01,0x18]
921 v_pk_max_u16 v5, exec_lo, -1
922 // GFX12: [0x05,0x40,0x0c,0xcc,0x7e,0x82,0x01,0x18]
924 v_pk_max_u16 v5, exec_hi, null
925 // GFX12: [0x05,0x40,0x0c,0xcc,0x7f,0xf8,0x00,0x18]
927 v_pk_max_u16 v5, null, exec_lo
928 // GFX12: [0x05,0x40,0x0c,0xcc,0x7c,0xfc,0x00,0x18]
930 v_pk_max_u16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0]
931 // GFX12: [0x05,0x58,0x0c,0xcc,0xc1,0xfe,0x00,0x00]
933 v_pk_max_u16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1]
934 // GFX12: [0x05,0x40,0x0c,0xcc,0xf0,0xfa,0x00,0x18]
936 v_pk_max_u16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1]
937 // GFX12: [0x05,0x48,0x0c,0xcc,0xfd,0xd4,0x00,0x10]
939 v_pk_max_u16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0]
940 // GFX12: [0xff,0x50,0x0c,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00]
// v_pk_min_num_f16: every expected encoding below carries 0x1b in its third byte.
// The first eleven cases vary only the two source operands; the last four add
// op_sel/op_sel_hi/neg_lo/neg_hi modifiers, and the final one also sets clamp.
// The 0xfe0b literal cases append the bytes 0x0b,0xfe,0x00,0x00.
942 v_pk_min_num_f16 v5, v1, v2
943 // GFX12: [0x05,0x40,0x1b,0xcc,0x01,0x05,0x02,0x18]
945 v_pk_min_num_f16 v5, v255, v255
946 // GFX12: [0x05,0x40,0x1b,0xcc,0xff,0xff,0x03,0x18]
948 v_pk_min_num_f16 v5, s1, s2
949 // GFX12: [0x05,0x40,0x1b,0xcc,0x01,0x04,0x00,0x18]
951 v_pk_min_num_f16 v5, s105, s105
952 // GFX12: [0x05,0x40,0x1b,0xcc,0x69,0xd2,0x00,0x18]
954 v_pk_min_num_f16 v5, vcc_lo, ttmp15
955 // GFX12: [0x05,0x40,0x1b,0xcc,0x6a,0xf6,0x00,0x18]
957 v_pk_min_num_f16 v5, vcc_hi, 0xfe0b
958 // GFX12: [0x05,0x40,0x1b,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00]
960 v_pk_min_num_f16 v5, ttmp15, src_scc
961 // GFX12: [0x05,0x40,0x1b,0xcc,0x7b,0xfa,0x01,0x18]
963 v_pk_min_num_f16 v5, m0, 0.5
964 // GFX12: [0x05,0x40,0x1b,0xcc,0x7d,0xe0,0x01,0x18]
966 v_pk_min_num_f16 v5, exec_lo, -1
967 // GFX12: [0x05,0x40,0x1b,0xcc,0x7e,0x82,0x01,0x18]
969 v_pk_min_num_f16 v5, exec_hi, null
970 // GFX12: [0x05,0x40,0x1b,0xcc,0x7f,0xf8,0x00,0x18]
972 v_pk_min_num_f16 v5, null, exec_lo
973 // GFX12: [0x05,0x40,0x1b,0xcc,0x7c,0xfc,0x00,0x18]
975 v_pk_min_num_f16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] neg_lo:[1,0] neg_hi:[1,0]
976 // GFX12: [0x05,0x59,0x1b,0xcc,0xc1,0xfe,0x00,0x20]
978 v_pk_min_num_f16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] neg_lo:[0,1] neg_hi:[0,1]
979 // GFX12: [0x05,0x42,0x1b,0xcc,0xf0,0xfa,0x00,0x58]
981 v_pk_min_num_f16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] neg_lo:[0,0] neg_hi:[0,0]
982 // GFX12: [0x05,0x48,0x1b,0xcc,0xfd,0xd4,0x00,0x10]
984 v_pk_min_num_f16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] neg_lo:[1,1] neg_hi:[1,1] clamp
985 // GFX12: [0xff,0xd3,0x1b,0xcc,0xff,0xd6,0x00,0x68,0x0b,0xfe,0x00,0x00]
// v_pk_min_i16: every expected encoding below carries 0x08 in its third byte.
// The first eleven cases vary only the two source operands; the last four add
// op_sel/op_sel_hi modifiers.
// The 0xfe0b literal cases append the bytes 0x0b,0xfe,0x00,0x00.
987 v_pk_min_i16 v5, v1, v2
988 // GFX12: [0x05,0x40,0x08,0xcc,0x01,0x05,0x02,0x18]
990 v_pk_min_i16 v5, v255, v255
991 // GFX12: [0x05,0x40,0x08,0xcc,0xff,0xff,0x03,0x18]
993 v_pk_min_i16 v5, s1, s2
994 // GFX12: [0x05,0x40,0x08,0xcc,0x01,0x04,0x00,0x18]
996 v_pk_min_i16 v5, s105, s105
997 // GFX12: [0x05,0x40,0x08,0xcc,0x69,0xd2,0x00,0x18]
999 v_pk_min_i16 v5, vcc_lo, ttmp15
1000 // GFX12: [0x05,0x40,0x08,0xcc,0x6a,0xf6,0x00,0x18]
1002 v_pk_min_i16 v5, vcc_hi, 0xfe0b
1003 // GFX12: [0x05,0x40,0x08,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00]
1005 v_pk_min_i16 v5, ttmp15, src_scc
1006 // GFX12: [0x05,0x40,0x08,0xcc,0x7b,0xfa,0x01,0x18]
1008 v_pk_min_i16 v5, m0, 0.5
1009 // GFX12: [0x05,0x40,0x08,0xcc,0x7d,0xe0,0x01,0x18]
1011 v_pk_min_i16 v5, exec_lo, -1
1012 // GFX12: [0x05,0x40,0x08,0xcc,0x7e,0x82,0x01,0x18]
1014 v_pk_min_i16 v5, exec_hi, null
1015 // GFX12: [0x05,0x40,0x08,0xcc,0x7f,0xf8,0x00,0x18]
1017 v_pk_min_i16 v5, null, exec_lo
1018 // GFX12: [0x05,0x40,0x08,0xcc,0x7c,0xfc,0x00,0x18]
1020 v_pk_min_i16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0]
1021 // GFX12: [0x05,0x58,0x08,0xcc,0xc1,0xfe,0x00,0x00]
1023 v_pk_min_i16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1]
1024 // GFX12: [0x05,0x40,0x08,0xcc,0xf0,0xfa,0x00,0x18]
1026 v_pk_min_i16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1]
1027 // GFX12: [0x05,0x48,0x08,0xcc,0xfd,0xd4,0x00,0x10]
1029 v_pk_min_i16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0]
1030 // GFX12: [0xff,0x50,0x08,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00]
// v_pk_min_u16: every expected encoding below carries 0x0d in its third byte.
// The first eleven cases vary only the two source operands; the last four add
// op_sel/op_sel_hi modifiers.
// The 0xfe0b literal cases append the bytes 0x0b,0xfe,0x00,0x00.
1032 v_pk_min_u16 v5, v1, v2
1033 // GFX12: [0x05,0x40,0x0d,0xcc,0x01,0x05,0x02,0x18]
1035 v_pk_min_u16 v5, v255, v255
1036 // GFX12: [0x05,0x40,0x0d,0xcc,0xff,0xff,0x03,0x18]
1038 v_pk_min_u16 v5, s1, s2
1039 // GFX12: [0x05,0x40,0x0d,0xcc,0x01,0x04,0x00,0x18]
1041 v_pk_min_u16 v5, s105, s105
1042 // GFX12: [0x05,0x40,0x0d,0xcc,0x69,0xd2,0x00,0x18]
1044 v_pk_min_u16 v5, vcc_lo, ttmp15
1045 // GFX12: [0x05,0x40,0x0d,0xcc,0x6a,0xf6,0x00,0x18]
1047 v_pk_min_u16 v5, vcc_hi, 0xfe0b
1048 // GFX12: [0x05,0x40,0x0d,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00]
1050 v_pk_min_u16 v5, ttmp15, src_scc
1051 // GFX12: [0x05,0x40,0x0d,0xcc,0x7b,0xfa,0x01,0x18]
1053 v_pk_min_u16 v5, m0, 0.5
1054 // GFX12: [0x05,0x40,0x0d,0xcc,0x7d,0xe0,0x01,0x18]
1056 v_pk_min_u16 v5, exec_lo, -1
1057 // GFX12: [0x05,0x40,0x0d,0xcc,0x7e,0x82,0x01,0x18]
1059 v_pk_min_u16 v5, exec_hi, null
1060 // GFX12: [0x05,0x40,0x0d,0xcc,0x7f,0xf8,0x00,0x18]
1062 v_pk_min_u16 v5, null, exec_lo
1063 // GFX12: [0x05,0x40,0x0d,0xcc,0x7c,0xfc,0x00,0x18]
1065 v_pk_min_u16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0]
1066 // GFX12: [0x05,0x58,0x0d,0xcc,0xc1,0xfe,0x00,0x00]
1068 v_pk_min_u16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1]
1069 // GFX12: [0x05,0x40,0x0d,0xcc,0xf0,0xfa,0x00,0x18]
1071 v_pk_min_u16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1]
1072 // GFX12: [0x05,0x48,0x0d,0xcc,0xfd,0xd4,0x00,0x10]
1074 v_pk_min_u16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0]
1075 // GFX12: [0xff,0x50,0x0d,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00]
// v_pk_mul_f16: every expected encoding below carries 0x10 in its third byte.
// The first eleven cases vary only the two source operands; the last four add
// op_sel/op_sel_hi/neg_lo/neg_hi modifiers, and the final one also sets clamp.
// The 0xfe0b literal cases append the bytes 0x0b,0xfe,0x00,0x00.
1077 v_pk_mul_f16 v5, v1, v2
1078 // GFX12: [0x05,0x40,0x10,0xcc,0x01,0x05,0x02,0x18]
1080 v_pk_mul_f16 v5, v255, v255
1081 // GFX12: [0x05,0x40,0x10,0xcc,0xff,0xff,0x03,0x18]
1083 v_pk_mul_f16 v5, s1, s2
1084 // GFX12: [0x05,0x40,0x10,0xcc,0x01,0x04,0x00,0x18]
1086 v_pk_mul_f16 v5, s105, s105
1087 // GFX12: [0x05,0x40,0x10,0xcc,0x69,0xd2,0x00,0x18]
1089 v_pk_mul_f16 v5, vcc_lo, ttmp15
1090 // GFX12: [0x05,0x40,0x10,0xcc,0x6a,0xf6,0x00,0x18]
1092 v_pk_mul_f16 v5, vcc_hi, 0xfe0b
1093 // GFX12: [0x05,0x40,0x10,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00]
1095 v_pk_mul_f16 v5, ttmp15, src_scc
1096 // GFX12: [0x05,0x40,0x10,0xcc,0x7b,0xfa,0x01,0x18]
1098 v_pk_mul_f16 v5, m0, 0.5
1099 // GFX12: [0x05,0x40,0x10,0xcc,0x7d,0xe0,0x01,0x18]
1101 v_pk_mul_f16 v5, exec_lo, -1
1102 // GFX12: [0x05,0x40,0x10,0xcc,0x7e,0x82,0x01,0x18]
1104 v_pk_mul_f16 v5, exec_hi, null
1105 // GFX12: [0x05,0x40,0x10,0xcc,0x7f,0xf8,0x00,0x18]
1107 v_pk_mul_f16 v5, null, exec_lo
1108 // GFX12: [0x05,0x40,0x10,0xcc,0x7c,0xfc,0x00,0x18]
1110 v_pk_mul_f16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] neg_lo:[1,0] neg_hi:[1,0]
1111 // GFX12: [0x05,0x59,0x10,0xcc,0xc1,0xfe,0x00,0x20]
1113 v_pk_mul_f16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] neg_lo:[0,1] neg_hi:[0,1]
1114 // GFX12: [0x05,0x42,0x10,0xcc,0xf0,0xfa,0x00,0x58]
1116 v_pk_mul_f16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] neg_lo:[0,0] neg_hi:[0,0]
1117 // GFX12: [0x05,0x48,0x10,0xcc,0xfd,0xd4,0x00,0x10]
1119 v_pk_mul_f16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] neg_lo:[1,1] neg_hi:[1,1] clamp
1120 // GFX12: [0xff,0xd3,0x10,0xcc,0xff,0xd6,0x00,0x68,0x0b,0xfe,0x00,0x00]
// v_pk_mul_lo_u16: every expected encoding below carries 0x01 in its third byte.
// The first eleven cases vary only the two source operands; the last four add
// op_sel/op_sel_hi modifiers.
// The 0xfe0b literal cases append the bytes 0x0b,0xfe,0x00,0x00.
1122 v_pk_mul_lo_u16 v5, v1, v2
1123 // GFX12: [0x05,0x40,0x01,0xcc,0x01,0x05,0x02,0x18]
1125 v_pk_mul_lo_u16 v5, v255, v255
1126 // GFX12: [0x05,0x40,0x01,0xcc,0xff,0xff,0x03,0x18]
1128 v_pk_mul_lo_u16 v5, s1, s2
1129 // GFX12: [0x05,0x40,0x01,0xcc,0x01,0x04,0x00,0x18]
1131 v_pk_mul_lo_u16 v5, s105, s105
1132 // GFX12: [0x05,0x40,0x01,0xcc,0x69,0xd2,0x00,0x18]
1134 v_pk_mul_lo_u16 v5, vcc_lo, ttmp15
1135 // GFX12: [0x05,0x40,0x01,0xcc,0x6a,0xf6,0x00,0x18]
1137 v_pk_mul_lo_u16 v5, vcc_hi, 0xfe0b
1138 // GFX12: [0x05,0x40,0x01,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00]
1140 v_pk_mul_lo_u16 v5, ttmp15, src_scc
1141 // GFX12: [0x05,0x40,0x01,0xcc,0x7b,0xfa,0x01,0x18]
1143 v_pk_mul_lo_u16 v5, m0, 0.5
1144 // GFX12: [0x05,0x40,0x01,0xcc,0x7d,0xe0,0x01,0x18]
1146 v_pk_mul_lo_u16 v5, exec_lo, -1
1147 // GFX12: [0x05,0x40,0x01,0xcc,0x7e,0x82,0x01,0x18]
1149 v_pk_mul_lo_u16 v5, exec_hi, null
1150 // GFX12: [0x05,0x40,0x01,0xcc,0x7f,0xf8,0x00,0x18]
1152 v_pk_mul_lo_u16 v5, null, exec_lo
1153 // GFX12: [0x05,0x40,0x01,0xcc,0x7c,0xfc,0x00,0x18]
1155 v_pk_mul_lo_u16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0]
1156 // GFX12: [0x05,0x58,0x01,0xcc,0xc1,0xfe,0x00,0x00]
1158 v_pk_mul_lo_u16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1]
1159 // GFX12: [0x05,0x40,0x01,0xcc,0xf0,0xfa,0x00,0x18]
1161 v_pk_mul_lo_u16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1]
1162 // GFX12: [0x05,0x48,0x01,0xcc,0xfd,0xd4,0x00,0x10]
1164 v_pk_mul_lo_u16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0]
1165 // GFX12: [0xff,0x50,0x01,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00]
// v_pk_sub_i16: every expected encoding below carries 0x03 in its third byte.
// The first eleven cases vary only the two source operands; the last four add
// op_sel/op_sel_hi modifiers, and the final one also sets clamp.
// The 0xfe0b literal cases append the bytes 0x0b,0xfe,0x00,0x00.
1167 v_pk_sub_i16 v5, v1, v2
1168 // GFX12: [0x05,0x40,0x03,0xcc,0x01,0x05,0x02,0x18]
1170 v_pk_sub_i16 v5, v255, v255
1171 // GFX12: [0x05,0x40,0x03,0xcc,0xff,0xff,0x03,0x18]
1173 v_pk_sub_i16 v5, s1, s2
1174 // GFX12: [0x05,0x40,0x03,0xcc,0x01,0x04,0x00,0x18]
1176 v_pk_sub_i16 v5, s105, s105
1177 // GFX12: [0x05,0x40,0x03,0xcc,0x69,0xd2,0x00,0x18]
1179 v_pk_sub_i16 v5, vcc_lo, ttmp15
1180 // GFX12: [0x05,0x40,0x03,0xcc,0x6a,0xf6,0x00,0x18]
1182 v_pk_sub_i16 v5, vcc_hi, 0xfe0b
1183 // GFX12: [0x05,0x40,0x03,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00]
1185 v_pk_sub_i16 v5, ttmp15, src_scc
1186 // GFX12: [0x05,0x40,0x03,0xcc,0x7b,0xfa,0x01,0x18]
1188 v_pk_sub_i16 v5, m0, 0.5
1189 // GFX12: [0x05,0x40,0x03,0xcc,0x7d,0xe0,0x01,0x18]
1191 v_pk_sub_i16 v5, exec_lo, -1
1192 // GFX12: [0x05,0x40,0x03,0xcc,0x7e,0x82,0x01,0x18]
1194 v_pk_sub_i16 v5, exec_hi, null
1195 // GFX12: [0x05,0x40,0x03,0xcc,0x7f,0xf8,0x00,0x18]
1197 v_pk_sub_i16 v5, null, exec_lo
1198 // GFX12: [0x05,0x40,0x03,0xcc,0x7c,0xfc,0x00,0x18]
1200 v_pk_sub_i16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0]
1201 // GFX12: [0x05,0x58,0x03,0xcc,0xc1,0xfe,0x00,0x00]
1203 v_pk_sub_i16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1]
1204 // GFX12: [0x05,0x40,0x03,0xcc,0xf0,0xfa,0x00,0x18]
1206 v_pk_sub_i16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1]
1207 // GFX12: [0x05,0x48,0x03,0xcc,0xfd,0xd4,0x00,0x10]
1209 v_pk_sub_i16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] clamp
1210 // GFX12: [0xff,0xd0,0x03,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00]
// v_pk_sub_u16: every expected encoding below carries 0x0b in its third byte.
// The first eleven cases vary only the two source operands; the last four add
// op_sel/op_sel_hi modifiers, and the final one also sets clamp.
// The 0xfe0b literal cases append the bytes 0x0b,0xfe,0x00,0x00.
1212 v_pk_sub_u16 v5, v1, v2
1213 // GFX12: [0x05,0x40,0x0b,0xcc,0x01,0x05,0x02,0x18]
1215 v_pk_sub_u16 v5, v255, v255
1216 // GFX12: [0x05,0x40,0x0b,0xcc,0xff,0xff,0x03,0x18]
1218 v_pk_sub_u16 v5, s1, s2
1219 // GFX12: [0x05,0x40,0x0b,0xcc,0x01,0x04,0x00,0x18]
1221 v_pk_sub_u16 v5, s105, s105
1222 // GFX12: [0x05,0x40,0x0b,0xcc,0x69,0xd2,0x00,0x18]
1224 v_pk_sub_u16 v5, vcc_lo, ttmp15
1225 // GFX12: [0x05,0x40,0x0b,0xcc,0x6a,0xf6,0x00,0x18]
1227 v_pk_sub_u16 v5, vcc_hi, 0xfe0b
1228 // GFX12: [0x05,0x40,0x0b,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00]
1230 v_pk_sub_u16 v5, ttmp15, src_scc
1231 // GFX12: [0x05,0x40,0x0b,0xcc,0x7b,0xfa,0x01,0x18]
1233 v_pk_sub_u16 v5, m0, 0.5
1234 // GFX12: [0x05,0x40,0x0b,0xcc,0x7d,0xe0,0x01,0x18]
1236 v_pk_sub_u16 v5, exec_lo, -1
1237 // GFX12: [0x05,0x40,0x0b,0xcc,0x7e,0x82,0x01,0x18]
1239 v_pk_sub_u16 v5, exec_hi, null
1240 // GFX12: [0x05,0x40,0x0b,0xcc,0x7f,0xf8,0x00,0x18]
1242 v_pk_sub_u16 v5, null, exec_lo
1243 // GFX12: [0x05,0x40,0x0b,0xcc,0x7c,0xfc,0x00,0x18]
1245 v_pk_sub_u16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0]
1246 // GFX12: [0x05,0x58,0x0b,0xcc,0xc1,0xfe,0x00,0x00]
1248 v_pk_sub_u16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1]
1249 // GFX12: [0x05,0x40,0x0b,0xcc,0xf0,0xfa,0x00,0x18]
1251 v_pk_sub_u16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1]
1252 // GFX12: [0x05,0x48,0x0b,0xcc,0xfd,0xd4,0x00,0x10]
1254 v_pk_sub_u16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] clamp
1255 // GFX12: [0xff,0xd0,0x0b,0xcc,0xff,0xd6,0x00,0x08,0x0b,0xfe,0x00,0x00]
// v_pk_minimum_f16: every expected encoding below carries 0x1d in its third byte.
// The first eleven cases vary only the two source operands; the last four add
// op_sel/op_sel_hi/neg_lo/neg_hi modifiers, and the final one also sets clamp.
// The 0xfe0b literal cases append the bytes 0x0b,0xfe,0x00,0x00.
1257 v_pk_minimum_f16 v5, v1, v2
1258 // GFX12: [0x05,0x40,0x1d,0xcc,0x01,0x05,0x02,0x18]
1260 v_pk_minimum_f16 v5, v255, v255
1261 // GFX12: [0x05,0x40,0x1d,0xcc,0xff,0xff,0x03,0x18]
1263 v_pk_minimum_f16 v5, s1, s2
1264 // GFX12: [0x05,0x40,0x1d,0xcc,0x01,0x04,0x00,0x18]
1266 v_pk_minimum_f16 v5, s105, s105
1267 // GFX12: [0x05,0x40,0x1d,0xcc,0x69,0xd2,0x00,0x18]
1269 v_pk_minimum_f16 v5, vcc_lo, ttmp15
1270 // GFX12: [0x05,0x40,0x1d,0xcc,0x6a,0xf6,0x00,0x18]
1272 v_pk_minimum_f16 v5, vcc_hi, 0xfe0b
1273 // GFX12: [0x05,0x40,0x1d,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00]
1275 v_pk_minimum_f16 v5, ttmp15, src_scc
1276 // GFX12: [0x05,0x40,0x1d,0xcc,0x7b,0xfa,0x01,0x18]
1278 v_pk_minimum_f16 v5, m0, 0.5
1279 // GFX12: [0x05,0x40,0x1d,0xcc,0x7d,0xe0,0x01,0x18]
1281 v_pk_minimum_f16 v5, exec_lo, -1
1282 // GFX12: [0x05,0x40,0x1d,0xcc,0x7e,0x82,0x01,0x18]
1284 v_pk_minimum_f16 v5, exec_hi, null
1285 // GFX12: [0x05,0x40,0x1d,0xcc,0x7f,0xf8,0x00,0x18]
1287 v_pk_minimum_f16 v5, null, exec_lo
1288 // GFX12: [0x05,0x40,0x1d,0xcc,0x7c,0xfc,0x00,0x18]
1290 v_pk_minimum_f16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] neg_lo:[1,0] neg_hi:[1,0]
1291 // GFX12: [0x05,0x59,0x1d,0xcc,0xc1,0xfe,0x00,0x20]
1293 v_pk_minimum_f16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] neg_lo:[0,1] neg_hi:[0,1]
1294 // GFX12: [0x05,0x42,0x1d,0xcc,0xf0,0xfa,0x00,0x58]
1296 v_pk_minimum_f16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] neg_lo:[0,0] neg_hi:[0,0]
1297 // GFX12: [0x05,0x48,0x1d,0xcc,0xfd,0xd4,0x00,0x10]
1299 v_pk_minimum_f16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] neg_lo:[1,1] neg_hi:[1,1] clamp
1300 // GFX12: [0xff,0xd3,0x1d,0xcc,0xff,0xd6,0x00,0x68,0x0b,0xfe,0x00,0x00]
// v_pk_maximum_f16: every expected encoding below carries 0x1e in its third byte.
// The first eleven cases vary only the two source operands; the last four add
// op_sel/op_sel_hi/neg_lo/neg_hi modifiers, and the final one also sets clamp.
// The 0xfe0b literal cases append the bytes 0x0b,0xfe,0x00,0x00.
1302 v_pk_maximum_f16 v5, v1, v2
1303 // GFX12: [0x05,0x40,0x1e,0xcc,0x01,0x05,0x02,0x18]
1305 v_pk_maximum_f16 v5, v255, v255
1306 // GFX12: [0x05,0x40,0x1e,0xcc,0xff,0xff,0x03,0x18]
1308 v_pk_maximum_f16 v5, s1, s2
1309 // GFX12: [0x05,0x40,0x1e,0xcc,0x01,0x04,0x00,0x18]
1311 v_pk_maximum_f16 v5, s105, s105
1312 // GFX12: [0x05,0x40,0x1e,0xcc,0x69,0xd2,0x00,0x18]
1314 v_pk_maximum_f16 v5, vcc_lo, ttmp15
1315 // GFX12: [0x05,0x40,0x1e,0xcc,0x6a,0xf6,0x00,0x18]
1317 v_pk_maximum_f16 v5, vcc_hi, 0xfe0b
1318 // GFX12: [0x05,0x40,0x1e,0xcc,0x6b,0xfe,0x01,0x18,0x0b,0xfe,0x00,0x00]
1320 v_pk_maximum_f16 v5, ttmp15, src_scc
1321 // GFX12: [0x05,0x40,0x1e,0xcc,0x7b,0xfa,0x01,0x18]
1323 v_pk_maximum_f16 v5, m0, 0.5
1324 // GFX12: [0x05,0x40,0x1e,0xcc,0x7d,0xe0,0x01,0x18]
1326 v_pk_maximum_f16 v5, exec_lo, -1
1327 // GFX12: [0x05,0x40,0x1e,0xcc,0x7e,0x82,0x01,0x18]
1329 v_pk_maximum_f16 v5, exec_hi, null
1330 // GFX12: [0x05,0x40,0x1e,0xcc,0x7f,0xf8,0x00,0x18]
1332 v_pk_maximum_f16 v5, null, exec_lo
1333 // GFX12: [0x05,0x40,0x1e,0xcc,0x7c,0xfc,0x00,0x18]
1335 v_pk_maximum_f16 v5, -1, exec_hi op_sel:[1,1] op_sel_hi:[0,0] neg_lo:[1,0] neg_hi:[1,0]
1336 // GFX12: [0x05,0x59,0x1e,0xcc,0xc1,0xfe,0x00,0x20]
1338 v_pk_maximum_f16 v5, 0.5, m0 op_sel:[0,0] op_sel_hi:[1,1] neg_lo:[0,1] neg_hi:[0,1]
1339 // GFX12: [0x05,0x42,0x1e,0xcc,0xf0,0xfa,0x00,0x58]
1341 v_pk_maximum_f16 v5, src_scc, vcc_lo op_sel:[1,0] op_sel_hi:[0,1] neg_lo:[0,0] neg_hi:[0,0]
1342 // GFX12: [0x05,0x48,0x1e,0xcc,0xfd,0xd4,0x00,0x10]
1344 v_pk_maximum_f16 v255, 0xfe0b, vcc_hi op_sel:[0,1] op_sel_hi:[1,0] neg_lo:[1,1] neg_hi:[1,1] clamp
1345 // GFX12: [0xff,0xd3,0x1e,0xcc,0xff,0xd6,0x00,0x68,0x0b,0xfe,0x00,0x00]
// v_dot4_f32_fp8_bf8: every expected encoding below carries 0x24 in its third byte.
// Unlike the encoding-only checks used for the v_pk_* cases, each check here
// also matches the printed instruction text ahead of the encoding.
// Cases: all-VGPR sources, neg_lo:[0,0,1], neg_hi:[0,0,1], s0 in each source
// position, 1.0 in each source position, and integer 1 as the third source.
1347 v_dot4_f32_fp8_bf8 v0, v1, v2, v3
1348 // GFX12: v_dot4_f32_fp8_bf8 v0, v1, v2, v3 ; encoding: [0x00,0x40,0x24,0xcc,0x01,0x05,0x0e,0x1c]
1350 v_dot4_f32_fp8_bf8 v0, v1, v2, v3 neg_lo:[0,0,1]
1351 // GFX12: v_dot4_f32_fp8_bf8 v0, v1, v2, v3 neg_lo:[0,0,1] ; encoding: [0x00,0x40,0x24,0xcc,0x01,0x05,0x0e,0x9c]
1353 v_dot4_f32_fp8_bf8 v0, v1, v2, v3 neg_hi:[0,0,1]
1354 // GFX12: v_dot4_f32_fp8_bf8 v0, v1, v2, v3 neg_hi:[0,0,1] ; encoding: [0x00,0x44,0x24,0xcc,0x01,0x05,0x0e,0x1c]
1356 v_dot4_f32_fp8_bf8 v0, s0, v2, v3
1357 // GFX12: v_dot4_f32_fp8_bf8 v0, s0, v2, v3 ; encoding: [0x00,0x40,0x24,0xcc,0x00,0x04,0x0e,0x1c]
1359 v_dot4_f32_fp8_bf8 v0, v1, s0, v3
1360 // GFX12: v_dot4_f32_fp8_bf8 v0, v1, s0, v3 ; encoding: [0x00,0x40,0x24,0xcc,0x01,0x01,0x0c,0x1c]
1362 v_dot4_f32_fp8_bf8 v0, v1, v2, s0
1363 // GFX12: v_dot4_f32_fp8_bf8 v0, v1, v2, s0 ; encoding: [0x00,0x40,0x24,0xcc,0x01,0x05,0x02,0x18]
1365 v_dot4_f32_fp8_bf8 v0, 1.0, v2, v3
1366 // GFX12: v_dot4_f32_fp8_bf8 v0, 1.0, v2, v3 ; encoding: [0x00,0x40,0x24,0xcc,0xf2,0x04,0x0e,0x1c]
1368 v_dot4_f32_fp8_bf8 v0, v1, 1.0, v3
1369 // GFX12: v_dot4_f32_fp8_bf8 v0, v1, 1.0, v3 ; encoding: [0x00,0x40,0x24,0xcc,0x01,0xe5,0x0d,0x1c]
1371 v_dot4_f32_fp8_bf8 v0, v1, v2, 1.0
1372 // GFX12: v_dot4_f32_fp8_bf8 v0, v1, v2, 1.0 ; encoding: [0x00,0x40,0x24,0xcc,0x01,0x05,0xca,0x1b]
1374 v_dot4_f32_fp8_bf8 v0, v1, v2, 1
1375 // GFX12: v_dot4_f32_fp8_bf8 v0, v1, v2, 1 ; encoding: [0x00,0x40,0x24,0xcc,0x01,0x05,0x06,0x1a]
// v_dot4_f32_bf8_fp8: every expected encoding below carries 0x25 in its third byte.
// Each check matches the printed instruction text as well as the encoding.
// Cases: all-VGPR sources, neg_lo:[0,0,1], neg_hi:[0,0,1], s0 in each source
// position, 1.0 in each source position, and integer 1 as the third source.
1377 v_dot4_f32_bf8_fp8 v0, v1, v2, v3
1378 // GFX12: v_dot4_f32_bf8_fp8 v0, v1, v2, v3 ; encoding: [0x00,0x40,0x25,0xcc,0x01,0x05,0x0e,0x1c]
1380 v_dot4_f32_bf8_fp8 v0, v1, v2, v3 neg_lo:[0,0,1]
1381 // GFX12: v_dot4_f32_bf8_fp8 v0, v1, v2, v3 neg_lo:[0,0,1] ; encoding: [0x00,0x40,0x25,0xcc,0x01,0x05,0x0e,0x9c]
1383 v_dot4_f32_bf8_fp8 v0, v1, v2, v3 neg_hi:[0,0,1]
1384 // GFX12: v_dot4_f32_bf8_fp8 v0, v1, v2, v3 neg_hi:[0,0,1] ; encoding: [0x00,0x44,0x25,0xcc,0x01,0x05,0x0e,0x1c]
1386 v_dot4_f32_bf8_fp8 v0, s0, v2, v3
1387 // GFX12: v_dot4_f32_bf8_fp8 v0, s0, v2, v3 ; encoding: [0x00,0x40,0x25,0xcc,0x00,0x04,0x0e,0x1c]
1389 v_dot4_f32_bf8_fp8 v0, v1, s0, v3
1390 // GFX12: v_dot4_f32_bf8_fp8 v0, v1, s0, v3 ; encoding: [0x00,0x40,0x25,0xcc,0x01,0x01,0x0c,0x1c]
1392 v_dot4_f32_bf8_fp8 v0, v1, v2, s0
1393 // GFX12: v_dot4_f32_bf8_fp8 v0, v1, v2, s0 ; encoding: [0x00,0x40,0x25,0xcc,0x01,0x05,0x02,0x18]
1395 v_dot4_f32_bf8_fp8 v0, 1.0, v2, v3
1396 // GFX12: v_dot4_f32_bf8_fp8 v0, 1.0, v2, v3 ; encoding: [0x00,0x40,0x25,0xcc,0xf2,0x04,0x0e,0x1c]
1398 v_dot4_f32_bf8_fp8 v0, v1, 1.0, v3
1399 // GFX12: v_dot4_f32_bf8_fp8 v0, v1, 1.0, v3 ; encoding: [0x00,0x40,0x25,0xcc,0x01,0xe5,0x0d,0x1c]
1401 v_dot4_f32_bf8_fp8 v0, v1, v2, 1.0
1402 // GFX12: v_dot4_f32_bf8_fp8 v0, v1, v2, 1.0 ; encoding: [0x00,0x40,0x25,0xcc,0x01,0x05,0xca,0x1b]
1404 v_dot4_f32_bf8_fp8 v0, v1, v2, 1
1405 // GFX12: v_dot4_f32_bf8_fp8 v0, v1, v2, 1 ; encoding: [0x00,0x40,0x25,0xcc,0x01,0x05,0x06,0x1a]
// v_dot4_f32_fp8_fp8: every expected encoding below carries 0x26 in its third byte.
// Each check matches the printed instruction text as well as the encoding.
// Cases: all-VGPR sources, neg_lo:[0,0,1], neg_hi:[0,0,1], s0 in each source
// position, 1.0 in each source position, and integer 1 as the third source.
1407 v_dot4_f32_fp8_fp8 v0, v1, v2, v3
1408 // GFX12: v_dot4_f32_fp8_fp8 v0, v1, v2, v3 ; encoding: [0x00,0x40,0x26,0xcc,0x01,0x05,0x0e,0x1c]
1410 v_dot4_f32_fp8_fp8 v0, v1, v2, v3 neg_lo:[0,0,1]
1411 // GFX12: v_dot4_f32_fp8_fp8 v0, v1, v2, v3 neg_lo:[0,0,1] ; encoding: [0x00,0x40,0x26,0xcc,0x01,0x05,0x0e,0x9c]
1413 v_dot4_f32_fp8_fp8 v0, v1, v2, v3 neg_hi:[0,0,1]
1414 // GFX12: v_dot4_f32_fp8_fp8 v0, v1, v2, v3 neg_hi:[0,0,1] ; encoding: [0x00,0x44,0x26,0xcc,0x01,0x05,0x0e,0x1c]
1416 v_dot4_f32_fp8_fp8 v0, s0, v2, v3
1417 // GFX12: v_dot4_f32_fp8_fp8 v0, s0, v2, v3 ; encoding: [0x00,0x40,0x26,0xcc,0x00,0x04,0x0e,0x1c]
1419 v_dot4_f32_fp8_fp8 v0, v1, s0, v3
1420 // GFX12: v_dot4_f32_fp8_fp8 v0, v1, s0, v3 ; encoding: [0x00,0x40,0x26,0xcc,0x01,0x01,0x0c,0x1c]
1422 v_dot4_f32_fp8_fp8 v0, v1, v2, s0
1423 // GFX12: v_dot4_f32_fp8_fp8 v0, v1, v2, s0 ; encoding: [0x00,0x40,0x26,0xcc,0x01,0x05,0x02,0x18]
1425 v_dot4_f32_fp8_fp8 v0, 1.0, v2, v3
1426 // GFX12: v_dot4_f32_fp8_fp8 v0, 1.0, v2, v3 ; encoding: [0x00,0x40,0x26,0xcc,0xf2,0x04,0x0e,0x1c]
1428 v_dot4_f32_fp8_fp8 v0, v1, 1.0, v3
1429 // GFX12: v_dot4_f32_fp8_fp8 v0, v1, 1.0, v3 ; encoding: [0x00,0x40,0x26,0xcc,0x01,0xe5,0x0d,0x1c]
1431 v_dot4_f32_fp8_fp8 v0, v1, v2, 1.0
1432 // GFX12: v_dot4_f32_fp8_fp8 v0, v1, v2, 1.0 ; encoding: [0x00,0x40,0x26,0xcc,0x01,0x05,0xca,0x1b]
1434 v_dot4_f32_fp8_fp8 v0, v1, v2, 1
1435 // GFX12: v_dot4_f32_fp8_fp8 v0, v1, v2, 1 ; encoding: [0x00,0x40,0x26,0xcc,0x01,0x05,0x06,0x1a]
// v_dot4_f32_bf8_bf8: every expected encoding below carries 0x27 in its third byte.
// Each check matches the printed instruction text as well as the encoding, so
// the check text must spell the full mnemonic, including the leading "v".
// Cases: all-VGPR sources, neg_lo:[0,0,1], neg_hi:[0,0,1], s0 in each source
// position, 1.0 in each source position, and integer 1 as the third source.
1437 v_dot4_f32_bf8_bf8 v0, v1, v2, v3
1438 // GFX12: v_dot4_f32_bf8_bf8 v0, v1, v2, v3 ; encoding: [0x00,0x40,0x27,0xcc,0x01,0x05,0x0e,0x1c]
1440 v_dot4_f32_bf8_bf8 v0, v1, v2, v3 neg_lo:[0,0,1]
1441 // GFX12: v_dot4_f32_bf8_bf8 v0, v1, v2, v3 neg_lo:[0,0,1] ; encoding: [0x00,0x40,0x27,0xcc,0x01,0x05,0x0e,0x9c]
1443 v_dot4_f32_bf8_bf8 v0, v1, v2, v3 neg_hi:[0,0,1]
1444 // GFX12: v_dot4_f32_bf8_bf8 v0, v1, v2, v3 neg_hi:[0,0,1] ; encoding: [0x00,0x44,0x27,0xcc,0x01,0x05,0x0e,0x1c]
1446 v_dot4_f32_bf8_bf8 v0, s0, v2, v3
1447 // GFX12: v_dot4_f32_bf8_bf8 v0, s0, v2, v3 ; encoding: [0x00,0x40,0x27,0xcc,0x00,0x04,0x0e,0x1c]
1449 v_dot4_f32_bf8_bf8 v0, v1, s0, v3
1450 // GFX12: v_dot4_f32_bf8_bf8 v0, v1, s0, v3 ; encoding: [0x00,0x40,0x27,0xcc,0x01,0x01,0x0c,0x1c]
1452 v_dot4_f32_bf8_bf8 v0, v1, v2, s0
1453 // GFX12: v_dot4_f32_bf8_bf8 v0, v1, v2, s0 ; encoding: [0x00,0x40,0x27,0xcc,0x01,0x05,0x02,0x18]
1455 v_dot4_f32_bf8_bf8 v0, 1.0, v2, v3
1456 // GFX12: v_dot4_f32_bf8_bf8 v0, 1.0, v2, v3 ; encoding: [0x00,0x40,0x27,0xcc,0xf2,0x04,0x0e,0x1c]
1458 v_dot4_f32_bf8_bf8 v0, v1, 1.0, v3
1459 // GFX12: v_dot4_f32_bf8_bf8 v0, v1, 1.0, v3 ; encoding: [0x00,0x40,0x27,0xcc,0x01,0xe5,0x0d,0x1c]
1461 v_dot4_f32_bf8_bf8 v0, v1, v2, 1.0
1462 // GFX12: v_dot4_f32_bf8_bf8 v0, v1, v2, 1.0 ; encoding: [0x00,0x40,0x27,0xcc,0x01,0x05,0xca,0x1b]
1464 v_dot4_f32_bf8_bf8 v0, v1, v2, 1
1465 // GFX12: v_dot4_f32_bf8_bf8 v0, v1, v2, 1 ; encoding: [0x00,0x40,0x27,0xcc,0x01,0x05,0x06,0x1a]