// Test driver: assemble this file with llvm-mc for gfx1200 (wavefrontsize32
// enabled, real-true16 disabled), print each instruction's encoding, and let
// FileCheck compare the output with the GFX12-prefixed check lines below.
// RUN: llvm-mc -triple=amdgcn -mcpu=gfx1200 -mattr=+wavefrontsize32,-real-true16 -show-encoding %s | FileCheck --check-prefix=GFX12 %s
// v_bfrev_b32_e64_dpp: one case per DPP control (quad_perm, row_mirror,
// row_half_mirror, row_shl/row_shr/row_ror at 1 and 15, row_share, row_xmask),
// followed by explicit row_mask/bank_mask/bound_ctrl/fi combinations and a
// final case using v255 for both operands.
// Every expected encoding in this group has 0xb8,0xd5 as its third and fourth
// bytes (NOTE(review): presumably the opcode field - confirm against the ISA).
v_bfrev_b32_e64_dpp v5, v1 quad_perm:[3,2,1,0]
// GFX12: [0x05,0x00,0xb8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]

v_bfrev_b32_e64_dpp v5, v1 quad_perm:[0,1,2,3]
// GFX12: [0x05,0x00,0xb8,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]

v_bfrev_b32_e64_dpp v5, v1 row_mirror
// GFX12: [0x05,0x00,0xb8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]

v_bfrev_b32_e64_dpp v5, v1 row_half_mirror
// GFX12: [0x05,0x00,0xb8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]

v_bfrev_b32_e64_dpp v5, v1 row_shl:1
// GFX12: [0x05,0x00,0xb8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]

v_bfrev_b32_e64_dpp v5, v1 row_shl:15
// GFX12: [0x05,0x00,0xb8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]

v_bfrev_b32_e64_dpp v5, v1 row_shr:1
// GFX12: [0x05,0x00,0xb8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]

v_bfrev_b32_e64_dpp v5, v1 row_shr:15
// GFX12: [0x05,0x00,0xb8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]

v_bfrev_b32_e64_dpp v5, v1 row_ror:1
// GFX12: [0x05,0x00,0xb8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]

v_bfrev_b32_e64_dpp v5, v1 row_ror:15
// GFX12: [0x05,0x00,0xb8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]

v_bfrev_b32_e64_dpp v5, v1 row_share:0 row_mask:0xf bank_mask:0xf
// GFX12: [0x05,0x00,0xb8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]

v_bfrev_b32_e64_dpp v5, v1 row_share:15 row_mask:0x0 bank_mask:0x1
// GFX12: [0x05,0x00,0xb8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]

v_bfrev_b32_e64_dpp v5, v1 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
// GFX12: [0x05,0x00,0xb8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]

v_bfrev_b32_e64_dpp v255, v255 row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
// GFX12: [0xff,0x00,0xb8,0xd5,0xfa,0x00,0x00,0x00,0xff,0x6f,0x05,0x30]
// v_ceil_f16_e64_dpp: one case per DPP control, then three cases that add
// output modifiers (mul:2, mul:4, div:2). The final case also applies clamp
// and a negated absolute-value source on v255.
// The modifier cases change the eighth expected byte (0x08, 0x10, 0x38) and,
// for the final case, the second byte (0x81).
v_ceil_f16_e64_dpp v5, v1 quad_perm:[3,2,1,0]
// GFX12: [0x05,0x00,0xdc,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]

v_ceil_f16_e64_dpp v5, v1 quad_perm:[0,1,2,3]
// GFX12: [0x05,0x00,0xdc,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]

v_ceil_f16_e64_dpp v5, v1 row_mirror
// GFX12: [0x05,0x00,0xdc,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]

v_ceil_f16_e64_dpp v5, v1 row_half_mirror
// GFX12: [0x05,0x00,0xdc,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]

v_ceil_f16_e64_dpp v5, v1 row_shl:1
// GFX12: [0x05,0x00,0xdc,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]

v_ceil_f16_e64_dpp v5, v1 row_shl:15
// GFX12: [0x05,0x00,0xdc,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]

v_ceil_f16_e64_dpp v5, v1 row_shr:1
// GFX12: [0x05,0x00,0xdc,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]

v_ceil_f16_e64_dpp v5, v1 row_shr:15
// GFX12: [0x05,0x00,0xdc,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]

v_ceil_f16_e64_dpp v5, v1 row_ror:1
// GFX12: [0x05,0x00,0xdc,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]

v_ceil_f16_e64_dpp v5, v1 row_ror:15
// GFX12: [0x05,0x00,0xdc,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]

v_ceil_f16_e64_dpp v5, v1 row_share:0 row_mask:0xf bank_mask:0xf
// GFX12: [0x05,0x00,0xdc,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]

v_ceil_f16_e64_dpp v5, v1 mul:2 row_share:15 row_mask:0x0 bank_mask:0x1
// GFX12: [0x05,0x00,0xdc,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]

v_ceil_f16_e64_dpp v5, v1 mul:4 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
// GFX12: [0x05,0x00,0xdc,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]

v_ceil_f16_e64_dpp v255, -|v255| clamp div:2 row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
// GFX12: [0xff,0x81,0xdc,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_ceil_f32_e64_dpp: same case matrix as the other floating-point groups in
// this file - every DPP control, then mul:2 / mul:4 / div:2 output modifiers,
// with clamp and -|v255| on the final case.
// All expected encodings here carry 0xa2,0xd5 as the third and fourth bytes.
v_ceil_f32_e64_dpp v5, v1 quad_perm:[3,2,1,0]
// GFX12: [0x05,0x00,0xa2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]

v_ceil_f32_e64_dpp v5, v1 quad_perm:[0,1,2,3]
// GFX12: [0x05,0x00,0xa2,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]

v_ceil_f32_e64_dpp v5, v1 row_mirror
// GFX12: [0x05,0x00,0xa2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]

v_ceil_f32_e64_dpp v5, v1 row_half_mirror
// GFX12: [0x05,0x00,0xa2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]

v_ceil_f32_e64_dpp v5, v1 row_shl:1
// GFX12: [0x05,0x00,0xa2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]

v_ceil_f32_e64_dpp v5, v1 row_shl:15
// GFX12: [0x05,0x00,0xa2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]

v_ceil_f32_e64_dpp v5, v1 row_shr:1
// GFX12: [0x05,0x00,0xa2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]

v_ceil_f32_e64_dpp v5, v1 row_shr:15
// GFX12: [0x05,0x00,0xa2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]

v_ceil_f32_e64_dpp v5, v1 row_ror:1
// GFX12: [0x05,0x00,0xa2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]

v_ceil_f32_e64_dpp v5, v1 row_ror:15
// GFX12: [0x05,0x00,0xa2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]

v_ceil_f32_e64_dpp v5, v1 row_share:0 row_mask:0xf bank_mask:0xf
// GFX12: [0x05,0x00,0xa2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]

v_ceil_f32_e64_dpp v5, v1 mul:2 row_share:15 row_mask:0x0 bank_mask:0x1
// GFX12: [0x05,0x00,0xa2,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]

v_ceil_f32_e64_dpp v5, v1 mul:4 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
// GFX12: [0x05,0x00,0xa2,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]

v_ceil_f32_e64_dpp v255, -|v255| clamp div:2 row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
// GFX12: [0xff,0x81,0xa2,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_cls_i32_e64_dpp: integer operation, so no output or source modifiers are
// exercised - only the DPP controls and the row_mask/bank_mask/bound_ctrl/fi
// combinations, ending with v255 for both operands.
// All expected encodings here carry 0xbb,0xd5 as the third and fourth bytes.
v_cls_i32_e64_dpp v5, v1 quad_perm:[3,2,1,0]
// GFX12: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]

v_cls_i32_e64_dpp v5, v1 quad_perm:[0,1,2,3]
// GFX12: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]

v_cls_i32_e64_dpp v5, v1 row_mirror
// GFX12: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]

v_cls_i32_e64_dpp v5, v1 row_half_mirror
// GFX12: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]

v_cls_i32_e64_dpp v5, v1 row_shl:1
// GFX12: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]

v_cls_i32_e64_dpp v5, v1 row_shl:15
// GFX12: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]

v_cls_i32_e64_dpp v5, v1 row_shr:1
// GFX12: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]

v_cls_i32_e64_dpp v5, v1 row_shr:15
// GFX12: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]

v_cls_i32_e64_dpp v5, v1 row_ror:1
// GFX12: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]

v_cls_i32_e64_dpp v5, v1 row_ror:15
// GFX12: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]

v_cls_i32_e64_dpp v5, v1 row_share:0 row_mask:0xf bank_mask:0xf
// GFX12: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]

v_cls_i32_e64_dpp v5, v1 row_share:15 row_mask:0x0 bank_mask:0x1
// GFX12: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]

v_cls_i32_e64_dpp v5, v1 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
// GFX12: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]

v_cls_i32_e64_dpp v255, v255 row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
// GFX12: [0xff,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0xff,0x6f,0x05,0x30]
// v_clz_i32_u32_e64_dpp: DPP-control coverage only (no modifiers), ending with
// the row_mask/bank_mask/bound_ctrl/fi combinations and the v255 operands.
// All expected encodings here carry 0xb9,0xd5 as the third and fourth bytes.
v_clz_i32_u32_e64_dpp v5, v1 quad_perm:[3,2,1,0]
// GFX12: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]

v_clz_i32_u32_e64_dpp v5, v1 quad_perm:[0,1,2,3]
// GFX12: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]

v_clz_i32_u32_e64_dpp v5, v1 row_mirror
// GFX12: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]

v_clz_i32_u32_e64_dpp v5, v1 row_half_mirror
// GFX12: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]

v_clz_i32_u32_e64_dpp v5, v1 row_shl:1
// GFX12: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]

v_clz_i32_u32_e64_dpp v5, v1 row_shl:15
// GFX12: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]

v_clz_i32_u32_e64_dpp v5, v1 row_shr:1
// GFX12: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]

v_clz_i32_u32_e64_dpp v5, v1 row_shr:15
// GFX12: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]

v_clz_i32_u32_e64_dpp v5, v1 row_ror:1
// GFX12: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]

v_clz_i32_u32_e64_dpp v5, v1 row_ror:15
// GFX12: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]

v_clz_i32_u32_e64_dpp v5, v1 row_share:0 row_mask:0xf bank_mask:0xf
// GFX12: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]

v_clz_i32_u32_e64_dpp v5, v1 row_share:15 row_mask:0x0 bank_mask:0x1
// GFX12: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]

v_clz_i32_u32_e64_dpp v5, v1 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
// GFX12: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]

v_clz_i32_u32_e64_dpp v255, v255 row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
// GFX12: [0xff,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0xff,0x6f,0x05,0x30]
// v_cos_f16_e64_dpp: every DPP control, then mul:2 / mul:4 / div:2 output
// modifiers; the final case also uses clamp and -|v255|.
// All expected encodings here carry 0xe1,0xd5 as the third and fourth bytes.
v_cos_f16_e64_dpp v5, v1 quad_perm:[3,2,1,0]
// GFX12: [0x05,0x00,0xe1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]

v_cos_f16_e64_dpp v5, v1 quad_perm:[0,1,2,3]
// GFX12: [0x05,0x00,0xe1,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]

v_cos_f16_e64_dpp v5, v1 row_mirror
// GFX12: [0x05,0x00,0xe1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]

v_cos_f16_e64_dpp v5, v1 row_half_mirror
// GFX12: [0x05,0x00,0xe1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]

v_cos_f16_e64_dpp v5, v1 row_shl:1
// GFX12: [0x05,0x00,0xe1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]

v_cos_f16_e64_dpp v5, v1 row_shl:15
// GFX12: [0x05,0x00,0xe1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]

v_cos_f16_e64_dpp v5, v1 row_shr:1
// GFX12: [0x05,0x00,0xe1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]

v_cos_f16_e64_dpp v5, v1 row_shr:15
// GFX12: [0x05,0x00,0xe1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]

v_cos_f16_e64_dpp v5, v1 row_ror:1
// GFX12: [0x05,0x00,0xe1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]

v_cos_f16_e64_dpp v5, v1 row_ror:15
// GFX12: [0x05,0x00,0xe1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]

v_cos_f16_e64_dpp v5, v1 row_share:0 row_mask:0xf bank_mask:0xf
// GFX12: [0x05,0x00,0xe1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]

v_cos_f16_e64_dpp v5, v1 mul:2 row_share:15 row_mask:0x0 bank_mask:0x1
// GFX12: [0x05,0x00,0xe1,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]

v_cos_f16_e64_dpp v5, v1 mul:4 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
// GFX12: [0x05,0x00,0xe1,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]

v_cos_f16_e64_dpp v255, -|v255| clamp div:2 row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
// GFX12: [0xff,0x81,0xe1,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_cos_f32_e64_dpp: every DPP control, then mul:2 / mul:4 / div:2 output
// modifiers; the final case also uses clamp and -|v255|.
// All expected encodings here carry 0xb6,0xd5 as the third and fourth bytes.
v_cos_f32_e64_dpp v5, v1 quad_perm:[3,2,1,0]
// GFX12: [0x05,0x00,0xb6,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]

v_cos_f32_e64_dpp v5, v1 quad_perm:[0,1,2,3]
// GFX12: [0x05,0x00,0xb6,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]

v_cos_f32_e64_dpp v5, v1 row_mirror
// GFX12: [0x05,0x00,0xb6,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]

v_cos_f32_e64_dpp v5, v1 row_half_mirror
// GFX12: [0x05,0x00,0xb6,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]

v_cos_f32_e64_dpp v5, v1 row_shl:1
// GFX12: [0x05,0x00,0xb6,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]

v_cos_f32_e64_dpp v5, v1 row_shl:15
// GFX12: [0x05,0x00,0xb6,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]

v_cos_f32_e64_dpp v5, v1 row_shr:1
// GFX12: [0x05,0x00,0xb6,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]

v_cos_f32_e64_dpp v5, v1 row_shr:15
// GFX12: [0x05,0x00,0xb6,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]

v_cos_f32_e64_dpp v5, v1 row_ror:1
// GFX12: [0x05,0x00,0xb6,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]

v_cos_f32_e64_dpp v5, v1 row_ror:15
// GFX12: [0x05,0x00,0xb6,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]

v_cos_f32_e64_dpp v5, v1 row_share:0 row_mask:0xf bank_mask:0xf
// GFX12: [0x05,0x00,0xb6,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]

v_cos_f32_e64_dpp v5, v1 mul:2 row_share:15 row_mask:0x0 bank_mask:0x1
// GFX12: [0x05,0x00,0xb6,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]

v_cos_f32_e64_dpp v5, v1 mul:4 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
// GFX12: [0x05,0x00,0xb6,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]

v_cos_f32_e64_dpp v255, -|v255| clamp div:2 row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
// GFX12: [0xff,0x81,0xb6,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_ctz_i32_b32_e64_dpp: DPP-control coverage only (no modifiers), ending with
// the row_mask/bank_mask/bound_ctrl/fi combinations and the v255 operands.
// All expected encodings here carry 0xba,0xd5 as the third and fourth bytes.
v_ctz_i32_b32_e64_dpp v5, v1 quad_perm:[3,2,1,0]
// GFX12: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]

v_ctz_i32_b32_e64_dpp v5, v1 quad_perm:[0,1,2,3]
// GFX12: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]

v_ctz_i32_b32_e64_dpp v5, v1 row_mirror
// GFX12: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]

v_ctz_i32_b32_e64_dpp v5, v1 row_half_mirror
// GFX12: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]

v_ctz_i32_b32_e64_dpp v5, v1 row_shl:1
// GFX12: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]

v_ctz_i32_b32_e64_dpp v5, v1 row_shl:15
// GFX12: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]

v_ctz_i32_b32_e64_dpp v5, v1 row_shr:1
// GFX12: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]

v_ctz_i32_b32_e64_dpp v5, v1 row_shr:15
// GFX12: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]

v_ctz_i32_b32_e64_dpp v5, v1 row_ror:1
// GFX12: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]

v_ctz_i32_b32_e64_dpp v5, v1 row_ror:15
// GFX12: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]

v_ctz_i32_b32_e64_dpp v5, v1 row_share:0 row_mask:0xf bank_mask:0xf
// GFX12: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]

v_ctz_i32_b32_e64_dpp v5, v1 row_share:15 row_mask:0x0 bank_mask:0x1
// GFX12: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]

v_ctz_i32_b32_e64_dpp v5, v1 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
// GFX12: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]

v_ctz_i32_b32_e64_dpp v255, v255 row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
// GFX12: [0xff,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0xff,0x6f,0x05,0x30]
// V_CVT_F32_FP8 / V_CVT_F32_BF8 in explicit _e64_dpp form, written with
// upper-case mnemonics and non-trivial quad_perm patterns. The check lines
// match only the "encoding: [...]" text, not the printed instruction.
// FP8 cases expect 0xec and BF8 cases expect 0xed as the third byte.
V_CVT_F32_FP8_e64_dpp v5, v1 quad_perm:[3,1,2,0] row_mask:0x2 bank_mask:0xd
// GFX12: encoding: [0x05,0x00,0xec,0xd5,0xfa,0x00,0x00,0x00,0x01,0x27,0x00,0x2d]

V_CVT_F32_FP8_e64_dpp v1, v3 quad_perm:[2,1,0,3] row_mask:0x5 bank_mask:0xe
// GFX12: encoding: [0x01,0x00,0xec,0xd5,0xfa,0x00,0x00,0x00,0x03,0xc6,0x00,0x5e]

V_CVT_F32_BF8_e64_dpp v5, v1 quad_perm:[0,3,2,1] row_mask:0x2 bank_mask:0xd
// GFX12: encoding: [0x05,0x00,0xed,0xd5,0xfa,0x00,0x00,0x00,0x01,0x6c,0x00,0x2d]

V_CVT_F32_BF8_e64_dpp v1, v3 quad_perm:[0,1,3,2] row_mask:0x5 bank_mask:0xe
// GFX12: encoding: [0x01,0x00,0xed,0xd5,0xfa,0x00,0x00,0x00,0x03,0xb4,0x00,0x5e]
// v_cvt_f16_f32_e64_dpp: every DPP control, then mul:2 / mul:4 / div:2 output
// modifiers; the final case also uses clamp and -|v255|.
// All expected encodings here carry 0x8a,0xd5 as the third and fourth bytes.
v_cvt_f16_f32_e64_dpp v5, v1 quad_perm:[3,2,1,0]
// GFX12: [0x05,0x00,0x8a,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]

v_cvt_f16_f32_e64_dpp v5, v1 quad_perm:[0,1,2,3]
// GFX12: [0x05,0x00,0x8a,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]

v_cvt_f16_f32_e64_dpp v5, v1 row_mirror
// GFX12: [0x05,0x00,0x8a,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]

v_cvt_f16_f32_e64_dpp v5, v1 row_half_mirror
// GFX12: [0x05,0x00,0x8a,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]

v_cvt_f16_f32_e64_dpp v5, v1 row_shl:1
// GFX12: [0x05,0x00,0x8a,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]

v_cvt_f16_f32_e64_dpp v5, v1 row_shl:15
// GFX12: [0x05,0x00,0x8a,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]

v_cvt_f16_f32_e64_dpp v5, v1 row_shr:1
// GFX12: [0x05,0x00,0x8a,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]

v_cvt_f16_f32_e64_dpp v5, v1 row_shr:15
// GFX12: [0x05,0x00,0x8a,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]

v_cvt_f16_f32_e64_dpp v5, v1 row_ror:1
// GFX12: [0x05,0x00,0x8a,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]

v_cvt_f16_f32_e64_dpp v5, v1 row_ror:15
// GFX12: [0x05,0x00,0x8a,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]

v_cvt_f16_f32_e64_dpp v5, v1 row_share:0 row_mask:0xf bank_mask:0xf
// GFX12: [0x05,0x00,0x8a,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]

v_cvt_f16_f32_e64_dpp v5, v1 mul:2 row_share:15 row_mask:0x0 bank_mask:0x1
// GFX12: [0x05,0x00,0x8a,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]

v_cvt_f16_f32_e64_dpp v5, v1 mul:4 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
// GFX12: [0x05,0x00,0x8a,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]

v_cvt_f16_f32_e64_dpp v255, -|v255| clamp div:2 row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
// GFX12: [0xff,0x81,0x8a,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_cvt_f16_i16_e64_dpp: every DPP control, then mul:2 / mul:4 / div:2 output
// modifiers. The source is an integer, so the final case uses a plain v255
// with clamp; its expected second byte is 0x80 and its eighth byte is 0x18.
// All expected encodings here carry 0xd1,0xd5 as the third and fourth bytes.
v_cvt_f16_i16_e64_dpp v5, v1 quad_perm:[3,2,1,0]
// GFX12: [0x05,0x00,0xd1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]

v_cvt_f16_i16_e64_dpp v5, v1 quad_perm:[0,1,2,3]
// GFX12: [0x05,0x00,0xd1,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]

v_cvt_f16_i16_e64_dpp v5, v1 row_mirror
// GFX12: [0x05,0x00,0xd1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]

v_cvt_f16_i16_e64_dpp v5, v1 row_half_mirror
// GFX12: [0x05,0x00,0xd1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]

v_cvt_f16_i16_e64_dpp v5, v1 row_shl:1
// GFX12: [0x05,0x00,0xd1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]

v_cvt_f16_i16_e64_dpp v5, v1 row_shl:15
// GFX12: [0x05,0x00,0xd1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]

v_cvt_f16_i16_e64_dpp v5, v1 row_shr:1
// GFX12: [0x05,0x00,0xd1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]

v_cvt_f16_i16_e64_dpp v5, v1 row_shr:15
// GFX12: [0x05,0x00,0xd1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]

v_cvt_f16_i16_e64_dpp v5, v1 row_ror:1
// GFX12: [0x05,0x00,0xd1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]

v_cvt_f16_i16_e64_dpp v5, v1 row_ror:15
// GFX12: [0x05,0x00,0xd1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]

v_cvt_f16_i16_e64_dpp v5, v1 row_share:0 row_mask:0xf bank_mask:0xf
// GFX12: [0x05,0x00,0xd1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]

v_cvt_f16_i16_e64_dpp v5, v1 mul:2 row_share:15 row_mask:0x0 bank_mask:0x1
// GFX12: [0x05,0x00,0xd1,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]

v_cvt_f16_i16_e64_dpp v5, v1 mul:4 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
// GFX12: [0x05,0x00,0xd1,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]

v_cvt_f16_i16_e64_dpp v255, v255 clamp div:2 row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
// GFX12: [0xff,0x80,0xd1,0xd5,0xfa,0x00,0x00,0x18,0xff,0x6f,0x05,0x30]
// v_cvt_f16_u16_e64_dpp: every DPP control, then mul:2 / mul:4 / div:2 output
// modifiers. The source is an integer, so the final case uses a plain v255
// with clamp; its expected second byte is 0x80 and its eighth byte is 0x18.
// All expected encodings here carry 0xd0,0xd5 as the third and fourth bytes.
v_cvt_f16_u16_e64_dpp v5, v1 quad_perm:[3,2,1,0]
// GFX12: [0x05,0x00,0xd0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]

v_cvt_f16_u16_e64_dpp v5, v1 quad_perm:[0,1,2,3]
// GFX12: [0x05,0x00,0xd0,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]

v_cvt_f16_u16_e64_dpp v5, v1 row_mirror
// GFX12: [0x05,0x00,0xd0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]

v_cvt_f16_u16_e64_dpp v5, v1 row_half_mirror
// GFX12: [0x05,0x00,0xd0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]

v_cvt_f16_u16_e64_dpp v5, v1 row_shl:1
// GFX12: [0x05,0x00,0xd0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]

v_cvt_f16_u16_e64_dpp v5, v1 row_shl:15
// GFX12: [0x05,0x00,0xd0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]

v_cvt_f16_u16_e64_dpp v5, v1 row_shr:1
// GFX12: [0x05,0x00,0xd0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]

v_cvt_f16_u16_e64_dpp v5, v1 row_shr:15
// GFX12: [0x05,0x00,0xd0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]

v_cvt_f16_u16_e64_dpp v5, v1 row_ror:1
// GFX12: [0x05,0x00,0xd0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]

v_cvt_f16_u16_e64_dpp v5, v1 row_ror:15
// GFX12: [0x05,0x00,0xd0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]

v_cvt_f16_u16_e64_dpp v5, v1 row_share:0 row_mask:0xf bank_mask:0xf
// GFX12: [0x05,0x00,0xd0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]

v_cvt_f16_u16_e64_dpp v5, v1 mul:2 row_share:15 row_mask:0x0 bank_mask:0x1
// GFX12: [0x05,0x00,0xd0,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]

v_cvt_f16_u16_e64_dpp v5, v1 mul:4 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
// GFX12: [0x05,0x00,0xd0,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]

v_cvt_f16_u16_e64_dpp v255, v255 clamp div:2 row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
// GFX12: [0xff,0x80,0xd0,0xd5,0xfa,0x00,0x00,0x18,0xff,0x6f,0x05,0x30]
// v_cvt_f32_f16_e64_dpp: every DPP control, then mul:2 / mul:4 / div:2 output
// modifiers; the final case also uses clamp and -|v255|.
// All expected encodings here carry 0x8b,0xd5 as the third and fourth bytes.
v_cvt_f32_f16_e64_dpp v5, v1 quad_perm:[3,2,1,0]
// GFX12: [0x05,0x00,0x8b,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]

v_cvt_f32_f16_e64_dpp v5, v1 quad_perm:[0,1,2,3]
// GFX12: [0x05,0x00,0x8b,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]

v_cvt_f32_f16_e64_dpp v5, v1 row_mirror
// GFX12: [0x05,0x00,0x8b,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]

v_cvt_f32_f16_e64_dpp v5, v1 row_half_mirror
// GFX12: [0x05,0x00,0x8b,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]

v_cvt_f32_f16_e64_dpp v5, v1 row_shl:1
// GFX12: [0x05,0x00,0x8b,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]

v_cvt_f32_f16_e64_dpp v5, v1 row_shl:15
// GFX12: [0x05,0x00,0x8b,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]

v_cvt_f32_f16_e64_dpp v5, v1 row_shr:1
// GFX12: [0x05,0x00,0x8b,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]

v_cvt_f32_f16_e64_dpp v5, v1 row_shr:15
// GFX12: [0x05,0x00,0x8b,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]

v_cvt_f32_f16_e64_dpp v5, v1 row_ror:1
// GFX12: [0x05,0x00,0x8b,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]

v_cvt_f32_f16_e64_dpp v5, v1 row_ror:15
// GFX12: [0x05,0x00,0x8b,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]

v_cvt_f32_f16_e64_dpp v5, v1 row_share:0 row_mask:0xf bank_mask:0xf
// GFX12: [0x05,0x00,0x8b,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]

v_cvt_f32_f16_e64_dpp v5, v1 mul:2 row_share:15 row_mask:0x0 bank_mask:0x1
// GFX12: [0x05,0x00,0x8b,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]

v_cvt_f32_f16_e64_dpp v5, v1 mul:4 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
// GFX12: [0x05,0x00,0x8b,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]

v_cvt_f32_f16_e64_dpp v255, -|v255| clamp div:2 row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
// GFX12: [0xff,0x81,0x8b,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_cvt_f32_fp8 / v_cvt_f32_bf8 written without an encoding suffix. These
// check lines also match the printed instruction, which shows the form the
// assembler selected:
//   - no byte_sel:  the 8-byte _dpp form is expected;
//   - any byte_sel: the 12-byte _e64_dpp form is expected, and byte_sel:0 is
//     not echoed back in the printed instruction.
// Expected second byte per selector: byte_sel:1 -> 0x10, byte_sel:2 -> 0x08,
// byte_sel:3 -> 0x18. NOTE(review): the 1 <-> 2 swap looks intentional (same
// in both the fp8 and bf8 cases) - confirm against the encoder.
v_cvt_f32_fp8 v1, v2 quad_perm:[0,1,2,3]
// GFX12: v_cvt_f32_fp8_dpp v1, v2 quad_perm:[0,1,2,3] row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xd8,0x02,0x7e,0x02,0xe4,0x00,0xff]

v_cvt_f32_fp8 v1, v2 byte_sel:0 quad_perm:[0,1,2,3]
// GFX12: v_cvt_f32_fp8_e64_dpp v1, v2 quad_perm:[0,1,2,3] row_mask:0xf bank_mask:0xf ; encoding: [0x01,0x00,0xec,0xd5,0xfa,0x00,0x00,0x00,0x02,0xe4,0x00,0xff]

v_cvt_f32_fp8 v1, v2 byte_sel:1 quad_perm:[0,1,2,3]
// GFX12: v_cvt_f32_fp8_e64_dpp v1, v2 byte_sel:1 quad_perm:[0,1,2,3] row_mask:0xf bank_mask:0xf ; encoding: [0x01,0x10,0xec,0xd5,0xfa,0x00,0x00,0x00,0x02,0xe4,0x00,0xff]

v_cvt_f32_fp8 v1, v2 byte_sel:2 quad_perm:[0,1,2,3]
// GFX12: v_cvt_f32_fp8_e64_dpp v1, v2 byte_sel:2 quad_perm:[0,1,2,3] row_mask:0xf bank_mask:0xf ; encoding: [0x01,0x08,0xec,0xd5,0xfa,0x00,0x00,0x00,0x02,0xe4,0x00,0xff]

v_cvt_f32_fp8 v1, v2 byte_sel:3 quad_perm:[0,1,2,3]
// GFX12: v_cvt_f32_fp8_e64_dpp v1, v2 byte_sel:3 quad_perm:[0,1,2,3] row_mask:0xf bank_mask:0xf ; encoding: [0x01,0x18,0xec,0xd5,0xfa,0x00,0x00,0x00,0x02,0xe4,0x00,0xff]

v_cvt_f32_bf8 v1, v2 quad_perm:[0,1,2,3]
// GFX12: v_cvt_f32_bf8_dpp v1, v2 quad_perm:[0,1,2,3] row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xda,0x02,0x7e,0x02,0xe4,0x00,0xff]

v_cvt_f32_bf8 v1, v2 byte_sel:0 quad_perm:[0,1,2,3]
// GFX12: v_cvt_f32_bf8_e64_dpp v1, v2 quad_perm:[0,1,2,3] row_mask:0xf bank_mask:0xf ; encoding: [0x01,0x00,0xed,0xd5,0xfa,0x00,0x00,0x00,0x02,0xe4,0x00,0xff]

v_cvt_f32_bf8 v1, v2 byte_sel:1 quad_perm:[0,1,2,3]
// GFX12: v_cvt_f32_bf8_e64_dpp v1, v2 byte_sel:1 quad_perm:[0,1,2,3] row_mask:0xf bank_mask:0xf ; encoding: [0x01,0x10,0xed,0xd5,0xfa,0x00,0x00,0x00,0x02,0xe4,0x00,0xff]

v_cvt_f32_bf8 v1, v2 byte_sel:2 quad_perm:[0,1,2,3]
// GFX12: v_cvt_f32_bf8_e64_dpp v1, v2 byte_sel:2 quad_perm:[0,1,2,3] row_mask:0xf bank_mask:0xf ; encoding: [0x01,0x08,0xed,0xd5,0xfa,0x00,0x00,0x00,0x02,0xe4,0x00,0xff]

v_cvt_f32_bf8 v1, v2 byte_sel:3 quad_perm:[0,1,2,3]
// GFX12: v_cvt_f32_bf8_e64_dpp v1, v2 byte_sel:3 quad_perm:[0,1,2,3] row_mask:0xf bank_mask:0xf ; encoding: [0x01,0x18,0xed,0xd5,0xfa,0x00,0x00,0x00,0x02,0xe4,0x00,0xff]
// v_cvt_f32_i32_e64_dpp: every DPP control, then mul:2 / mul:4 / div:2 output
// modifiers. The source is an integer, so the final case uses a plain v255
// with clamp; its expected second byte is 0x80 and its eighth byte is 0x18.
// All expected encodings here carry 0x85,0xd5 as the third and fourth bytes.
v_cvt_f32_i32_e64_dpp v5, v1 quad_perm:[3,2,1,0]
// GFX12: [0x05,0x00,0x85,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]

v_cvt_f32_i32_e64_dpp v5, v1 quad_perm:[0,1,2,3]
// GFX12: [0x05,0x00,0x85,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]

v_cvt_f32_i32_e64_dpp v5, v1 row_mirror
// GFX12: [0x05,0x00,0x85,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]

v_cvt_f32_i32_e64_dpp v5, v1 row_half_mirror
// GFX12: [0x05,0x00,0x85,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]

v_cvt_f32_i32_e64_dpp v5, v1 row_shl:1
// GFX12: [0x05,0x00,0x85,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]

v_cvt_f32_i32_e64_dpp v5, v1 row_shl:15
// GFX12: [0x05,0x00,0x85,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]

v_cvt_f32_i32_e64_dpp v5, v1 row_shr:1
// GFX12: [0x05,0x00,0x85,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]

v_cvt_f32_i32_e64_dpp v5, v1 row_shr:15
// GFX12: [0x05,0x00,0x85,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]

v_cvt_f32_i32_e64_dpp v5, v1 row_ror:1
// GFX12: [0x05,0x00,0x85,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]

v_cvt_f32_i32_e64_dpp v5, v1 row_ror:15
// GFX12: [0x05,0x00,0x85,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]

v_cvt_f32_i32_e64_dpp v5, v1 row_share:0 row_mask:0xf bank_mask:0xf
// GFX12: [0x05,0x00,0x85,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]

v_cvt_f32_i32_e64_dpp v5, v1 mul:2 row_share:15 row_mask:0x0 bank_mask:0x1
// GFX12: [0x05,0x00,0x85,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]

v_cvt_f32_i32_e64_dpp v5, v1 mul:4 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
// GFX12: [0x05,0x00,0x85,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]

v_cvt_f32_i32_e64_dpp v255, v255 clamp div:2 row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
// GFX12: [0xff,0x80,0x85,0xd5,0xfa,0x00,0x00,0x18,0xff,0x6f,0x05,0x30]
// v_cvt_f32_u32_e64_dpp: every DPP control, then mul:2 / mul:4 / div:2 output
// modifiers. The source is an integer, so the final case uses a plain v255
// with clamp; its expected second byte is 0x80 and its eighth byte is 0x18.
// All expected encodings here carry 0x86,0xd5 as the third and fourth bytes.
v_cvt_f32_u32_e64_dpp v5, v1 quad_perm:[3,2,1,0]
// GFX12: [0x05,0x00,0x86,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]

v_cvt_f32_u32_e64_dpp v5, v1 quad_perm:[0,1,2,3]
// GFX12: [0x05,0x00,0x86,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]

v_cvt_f32_u32_e64_dpp v5, v1 row_mirror
// GFX12: [0x05,0x00,0x86,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]

v_cvt_f32_u32_e64_dpp v5, v1 row_half_mirror
// GFX12: [0x05,0x00,0x86,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]

v_cvt_f32_u32_e64_dpp v5, v1 row_shl:1
// GFX12: [0x05,0x00,0x86,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]

v_cvt_f32_u32_e64_dpp v5, v1 row_shl:15
// GFX12: [0x05,0x00,0x86,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]

v_cvt_f32_u32_e64_dpp v5, v1 row_shr:1
// GFX12: [0x05,0x00,0x86,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]

v_cvt_f32_u32_e64_dpp v5, v1 row_shr:15
// GFX12: [0x05,0x00,0x86,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]

v_cvt_f32_u32_e64_dpp v5, v1 row_ror:1
// GFX12: [0x05,0x00,0x86,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]

v_cvt_f32_u32_e64_dpp v5, v1 row_ror:15
// GFX12: [0x05,0x00,0x86,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]

v_cvt_f32_u32_e64_dpp v5, v1 row_share:0 row_mask:0xf bank_mask:0xf
// GFX12: [0x05,0x00,0x86,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]

v_cvt_f32_u32_e64_dpp v5, v1 mul:2 row_share:15 row_mask:0x0 bank_mask:0x1
// GFX12: [0x05,0x00,0x86,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]

v_cvt_f32_u32_e64_dpp v5, v1 mul:4 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
// GFX12: [0x05,0x00,0x86,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]

v_cvt_f32_u32_e64_dpp v255, v255 clamp div:2 row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
// GFX12: [0xff,0x80,0x86,0xd5,0xfa,0x00,0x00,0x18,0xff,0x6f,0x05,0x30]
// v_cvt_f32_ubyte0_e64_dpp: every DPP control, then mul:2 / mul:4 / div:2
// output modifiers. The final case uses a plain v255 source with clamp; its
// expected second byte is 0x80 and its eighth byte is 0x18.
// All expected encodings here carry 0x91,0xd5 as the third and fourth bytes.
v_cvt_f32_ubyte0_e64_dpp v5, v1 quad_perm:[3,2,1,0]
// GFX12: [0x05,0x00,0x91,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]

v_cvt_f32_ubyte0_e64_dpp v5, v1 quad_perm:[0,1,2,3]
// GFX12: [0x05,0x00,0x91,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]

v_cvt_f32_ubyte0_e64_dpp v5, v1 row_mirror
// GFX12: [0x05,0x00,0x91,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]

v_cvt_f32_ubyte0_e64_dpp v5, v1 row_half_mirror
// GFX12: [0x05,0x00,0x91,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]

v_cvt_f32_ubyte0_e64_dpp v5, v1 row_shl:1
// GFX12: [0x05,0x00,0x91,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]

v_cvt_f32_ubyte0_e64_dpp v5, v1 row_shl:15
// GFX12: [0x05,0x00,0x91,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]

v_cvt_f32_ubyte0_e64_dpp v5, v1 row_shr:1
// GFX12: [0x05,0x00,0x91,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]

v_cvt_f32_ubyte0_e64_dpp v5, v1 row_shr:15
// GFX12: [0x05,0x00,0x91,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]

v_cvt_f32_ubyte0_e64_dpp v5, v1 row_ror:1
// GFX12: [0x05,0x00,0x91,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]

v_cvt_f32_ubyte0_e64_dpp v5, v1 row_ror:15
// GFX12: [0x05,0x00,0x91,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]

v_cvt_f32_ubyte0_e64_dpp v5, v1 row_share:0 row_mask:0xf bank_mask:0xf
// GFX12: [0x05,0x00,0x91,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]

v_cvt_f32_ubyte0_e64_dpp v5, v1 mul:2 row_share:15 row_mask:0x0 bank_mask:0x1
// GFX12: [0x05,0x00,0x91,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]

v_cvt_f32_ubyte0_e64_dpp v5, v1 mul:4 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
// GFX12: [0x05,0x00,0x91,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]

v_cvt_f32_ubyte0_e64_dpp v255, v255 clamp div:2 row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
// GFX12: [0xff,0x80,0x91,0xd5,0xfa,0x00,0x00,0x18,0xff,0x6f,0x05,0x30]
// v_cvt_f32_ubyte1_e64_dpp: every DPP control, then mul:2 / mul:4 / div:2
// output modifiers. The final case uses a plain v255 source with clamp; its
// expected second byte is 0x80 and its eighth byte is 0x18.
// All expected encodings here carry 0x92,0xd5 as the third and fourth bytes.
v_cvt_f32_ubyte1_e64_dpp v5, v1 quad_perm:[3,2,1,0]
// GFX12: [0x05,0x00,0x92,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]

v_cvt_f32_ubyte1_e64_dpp v5, v1 quad_perm:[0,1,2,3]
// GFX12: [0x05,0x00,0x92,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]

v_cvt_f32_ubyte1_e64_dpp v5, v1 row_mirror
// GFX12: [0x05,0x00,0x92,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]

v_cvt_f32_ubyte1_e64_dpp v5, v1 row_half_mirror
// GFX12: [0x05,0x00,0x92,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]

v_cvt_f32_ubyte1_e64_dpp v5, v1 row_shl:1
// GFX12: [0x05,0x00,0x92,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]

v_cvt_f32_ubyte1_e64_dpp v5, v1 row_shl:15
// GFX12: [0x05,0x00,0x92,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]

v_cvt_f32_ubyte1_e64_dpp v5, v1 row_shr:1
// GFX12: [0x05,0x00,0x92,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]

v_cvt_f32_ubyte1_e64_dpp v5, v1 row_shr:15
// GFX12: [0x05,0x00,0x92,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]

v_cvt_f32_ubyte1_e64_dpp v5, v1 row_ror:1
// GFX12: [0x05,0x00,0x92,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]

v_cvt_f32_ubyte1_e64_dpp v5, v1 row_ror:15
// GFX12: [0x05,0x00,0x92,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]

v_cvt_f32_ubyte1_e64_dpp v5, v1 row_share:0 row_mask:0xf bank_mask:0xf
// GFX12: [0x05,0x00,0x92,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]

v_cvt_f32_ubyte1_e64_dpp v5, v1 mul:2 row_share:15 row_mask:0x0 bank_mask:0x1
// GFX12: [0x05,0x00,0x92,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]

v_cvt_f32_ubyte1_e64_dpp v5, v1 mul:4 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
// GFX12: [0x05,0x00,0x92,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]

v_cvt_f32_ubyte1_e64_dpp v255, v255 clamp div:2 row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
// GFX12: [0xff,0x80,0x92,0xd5,0xfa,0x00,0x00,0x18,0xff,0x6f,0x05,0x30]
717 v_cvt_f32_ubyte2_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
718 // GFX12
: [0x05,0x00,0x93,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
720 v_cvt_f32_ubyte2_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
721 // GFX12
: [0x05,0x00,0x93,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
723 v_cvt_f32_ubyte2_e64_dpp v5
, v1 row_mirror
724 // GFX12
: [0x05,0x00,0x93,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
726 v_cvt_f32_ubyte2_e64_dpp v5
, v1 row_half_mirror
727 // GFX12
: [0x05,0x00,0x93,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
729 v_cvt_f32_ubyte2_e64_dpp v5
, v1 row_shl
:1
730 // GFX12
: [0x05,0x00,0x93,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
732 v_cvt_f32_ubyte2_e64_dpp v5
, v1 row_shl
:15
733 // GFX12
: [0x05,0x00,0x93,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
735 v_cvt_f32_ubyte2_e64_dpp v5
, v1 row_shr
:1
736 // GFX12
: [0x05,0x00,0x93,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
738 v_cvt_f32_ubyte2_e64_dpp v5
, v1 row_shr
:15
739 // GFX12
: [0x05,0x00,0x93,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
741 v_cvt_f32_ubyte2_e64_dpp v5
, v1 row_ror
:1
742 // GFX12
: [0x05,0x00,0x93,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
744 v_cvt_f32_ubyte2_e64_dpp v5
, v1 row_ror
:15
745 // GFX12
: [0x05,0x00,0x93,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
747 v_cvt_f32_ubyte2_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
748 // GFX12
: [0x05,0x00,0x93,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
750 v_cvt_f32_ubyte2_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
751 // GFX12
: [0x05,0x00,0x93,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
753 v_cvt_f32_ubyte2_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
754 // GFX12
: [0x05,0x00,0x93,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
756 v_cvt_f32_ubyte2_e64_dpp v255
, v255 clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
757 // GFX12
: [0xff,0x80,0x93,0xd5,0xfa,0x00,0x00,0x18,0xff,0x6f,0x05,0x30]
759 v_cvt_f32_ubyte3_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
760 // GFX12
: [0x05,0x00,0x94,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
762 v_cvt_f32_ubyte3_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
763 // GFX12
: [0x05,0x00,0x94,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
765 v_cvt_f32_ubyte3_e64_dpp v5
, v1 row_mirror
766 // GFX12
: [0x05,0x00,0x94,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
768 v_cvt_f32_ubyte3_e64_dpp v5
, v1 row_half_mirror
769 // GFX12
: [0x05,0x00,0x94,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
771 v_cvt_f32_ubyte3_e64_dpp v5
, v1 row_shl
:1
772 // GFX12
: [0x05,0x00,0x94,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
774 v_cvt_f32_ubyte3_e64_dpp v5
, v1 row_shl
:15
775 // GFX12
: [0x05,0x00,0x94,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
777 v_cvt_f32_ubyte3_e64_dpp v5
, v1 row_shr
:1
778 // GFX12
: [0x05,0x00,0x94,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
780 v_cvt_f32_ubyte3_e64_dpp v5
, v1 row_shr
:15
781 // GFX12
: [0x05,0x00,0x94,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
783 v_cvt_f32_ubyte3_e64_dpp v5
, v1 row_ror
:1
784 // GFX12
: [0x05,0x00,0x94,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
786 v_cvt_f32_ubyte3_e64_dpp v5
, v1 row_ror
:15
787 // GFX12
: [0x05,0x00,0x94,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
789 v_cvt_f32_ubyte3_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
790 // GFX12
: [0x05,0x00,0x94,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
792 v_cvt_f32_ubyte3_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
793 // GFX12
: [0x05,0x00,0x94,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
795 v_cvt_f32_ubyte3_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
796 // GFX12
: [0x05,0x00,0x94,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
798 v_cvt_f32_ubyte3_e64_dpp v255
, v255 clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
799 // GFX12
: [0xff,0x80,0x94,0xd5,0xfa,0x00,0x00,0x18,0xff,0x6f,0x05,0x30]
801 v_cvt_floor_i32_f32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
802 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
804 v_cvt_floor_i32_f32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
805 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
807 v_cvt_floor_i32_f32_e64_dpp v5
, v1 row_mirror
808 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
810 v_cvt_floor_i32_f32_e64_dpp v5
, v1 row_half_mirror
811 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
813 v_cvt_floor_i32_f32_e64_dpp v5
, v1 row_shl
:1
814 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
816 v_cvt_floor_i32_f32_e64_dpp v5
, v1 row_shl
:15
817 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
819 v_cvt_floor_i32_f32_e64_dpp v5
, v1 row_shr
:1
820 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
822 v_cvt_floor_i32_f32_e64_dpp v5
, v1 row_shr
:15
823 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
825 v_cvt_floor_i32_f32_e64_dpp v5
, v1 row_ror
:1
826 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
828 v_cvt_floor_i32_f32_e64_dpp v5
, v1 row_ror
:15
829 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
831 v_cvt_floor_i32_f32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
832 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
834 v_cvt_floor_i32_f32_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
835 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
837 v_cvt_floor_i32_f32_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
838 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
840 v_cvt_floor_i32_f32_e64_dpp v255
, -|v255| row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
841 // GFX12
: [0xff,0x01,0x8d,0xd5,0xfa,0x00,0x00,0x20,0xff,0x6f,0x05,0x30]
843 v_cvt_flr_i32_f32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
844 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
846 v_cvt_flr_i32_f32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
847 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
849 v_cvt_flr_i32_f32_e64_dpp v5
, v1 row_mirror
850 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
852 v_cvt_flr_i32_f32_e64_dpp v5
, v1 row_half_mirror
853 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
855 v_cvt_flr_i32_f32_e64_dpp v5
, v1 row_shl
:1
856 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
858 v_cvt_flr_i32_f32_e64_dpp v5
, v1 row_shl
:15
859 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
861 v_cvt_flr_i32_f32_e64_dpp v5
, v1 row_shr
:1
862 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
864 v_cvt_flr_i32_f32_e64_dpp v5
, v1 row_shr
:15
865 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
867 v_cvt_flr_i32_f32_e64_dpp v5
, v1 row_ror
:1
868 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
870 v_cvt_flr_i32_f32_e64_dpp v5
, v1 row_ror
:15
871 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
873 v_cvt_flr_i32_f32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
874 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
876 v_cvt_flr_i32_f32_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
877 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
879 v_cvt_flr_i32_f32_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
880 // GFX12
: [0x05,0x00,0x8d,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
882 v_cvt_flr_i32_f32_e64_dpp v255
, -|v255| row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
883 // GFX12
: [0xff,0x01,0x8d,0xd5,0xfa,0x00,0x00,0x20,0xff,0x6f,0x05,0x30]
885 v_cvt_i16_f16_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
886 // GFX12
: [0x05,0x00,0xd3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
888 v_cvt_i16_f16_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
889 // GFX12
: [0x05,0x00,0xd3,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
891 v_cvt_i16_f16_e64_dpp v5
, v1 row_mirror
892 // GFX12
: [0x05,0x00,0xd3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
894 v_cvt_i16_f16_e64_dpp v5
, v1 row_half_mirror
895 // GFX12
: [0x05,0x00,0xd3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
897 v_cvt_i16_f16_e64_dpp v5
, v1 row_shl
:1
898 // GFX12
: [0x05,0x00,0xd3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
900 v_cvt_i16_f16_e64_dpp v5
, v1 row_shl
:15
901 // GFX12
: [0x05,0x00,0xd3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
903 v_cvt_i16_f16_e64_dpp v5
, v1 row_shr
:1
904 // GFX12
: [0x05,0x00,0xd3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
906 v_cvt_i16_f16_e64_dpp v5
, v1 row_shr
:15
907 // GFX12
: [0x05,0x00,0xd3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
909 v_cvt_i16_f16_e64_dpp v5
, v1 row_ror
:1
910 // GFX12
: [0x05,0x00,0xd3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
912 v_cvt_i16_f16_e64_dpp v5
, v1 row_ror
:15
913 // GFX12
: [0x05,0x00,0xd3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
915 v_cvt_i16_f16_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
916 // GFX12
: [0x05,0x00,0xd3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
918 v_cvt_i16_f16_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
919 // GFX12
: [0x05,0x00,0xd3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
921 v_cvt_i16_f16_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
922 // GFX12
: [0x05,0x00,0xd3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
924 v_cvt_i16_f16_e64_dpp v255
, -|v255| clamp row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
925 // GFX12
: [0xff,0x81,0xd3,0xd5,0xfa,0x00,0x00,0x20,0xff,0x6f,0x05,0x30]
927 v_cvt_i32_f32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
928 // GFX12
: [0x05,0x00,0x88,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
930 v_cvt_i32_f32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
931 // GFX12
: [0x05,0x00,0x88,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
933 v_cvt_i32_f32_e64_dpp v5
, v1 row_mirror
934 // GFX12
: [0x05,0x00,0x88,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
936 v_cvt_i32_f32_e64_dpp v5
, v1 row_half_mirror
937 // GFX12
: [0x05,0x00,0x88,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
939 v_cvt_i32_f32_e64_dpp v5
, v1 row_shl
:1
940 // GFX12
: [0x05,0x00,0x88,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
942 v_cvt_i32_f32_e64_dpp v5
, v1 row_shl
:15
943 // GFX12
: [0x05,0x00,0x88,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
945 v_cvt_i32_f32_e64_dpp v5
, v1 row_shr
:1
946 // GFX12
: [0x05,0x00,0x88,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
948 v_cvt_i32_f32_e64_dpp v5
, v1 row_shr
:15
949 // GFX12
: [0x05,0x00,0x88,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
951 v_cvt_i32_f32_e64_dpp v5
, v1 row_ror
:1
952 // GFX12
: [0x05,0x00,0x88,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
954 v_cvt_i32_f32_e64_dpp v5
, v1 row_ror
:15
955 // GFX12
: [0x05,0x00,0x88,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
957 v_cvt_i32_f32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
958 // GFX12
: [0x05,0x00,0x88,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
960 v_cvt_i32_f32_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
961 // GFX12
: [0x05,0x00,0x88,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
963 v_cvt_i32_f32_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
964 // GFX12
: [0x05,0x00,0x88,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
966 v_cvt_i32_f32_e64_dpp v255
, -|v255| clamp row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
967 // GFX12
: [0xff,0x81,0x88,0xd5,0xfa,0x00,0x00,0x20,0xff,0x6f,0x05,0x30]
969 v_cvt_i32_i16_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
970 // GFX12
: [0x05,0x00,0xea,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
972 v_cvt_i32_i16_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
973 // GFX12
: [0x05,0x00,0xea,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
975 v_cvt_i32_i16_e64_dpp v5
, v1 row_mirror
976 // GFX12
: [0x05,0x00,0xea,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
978 v_cvt_i32_i16_e64_dpp v5
, v1 row_half_mirror
979 // GFX12
: [0x05,0x00,0xea,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
981 v_cvt_i32_i16_e64_dpp v5
, v1 row_shl
:1
982 // GFX12
: [0x05,0x00,0xea,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
984 v_cvt_i32_i16_e64_dpp v5
, v1 row_shl
:15
985 // GFX12
: [0x05,0x00,0xea,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
987 v_cvt_i32_i16_e64_dpp v5
, v1 row_shr
:1
988 // GFX12
: [0x05,0x00,0xea,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
990 v_cvt_i32_i16_e64_dpp v5
, v1 row_shr
:15
991 // GFX12
: [0x05,0x00,0xea,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
993 v_cvt_i32_i16_e64_dpp v5
, v1 row_ror
:1
994 // GFX12
: [0x05,0x00,0xea,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
996 v_cvt_i32_i16_e64_dpp v5
, v1 row_ror
:15
997 // GFX12
: [0x05,0x00,0xea,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
999 v_cvt_i32_i16_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1000 // GFX12
: [0x05,0x00,0xea,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
1002 v_cvt_i32_i16_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1003 // GFX12
: [0x05,0x00,0xea,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
1005 v_cvt_i32_i16_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1006 // GFX12
: [0x05,0x00,0xea,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
1008 v_cvt_i32_i16_e64_dpp v255
, v255 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1009 // GFX12
: [0xff,0x00,0xea,0xd5,0xfa,0x00,0x00,0x00,0xff,0x6f,0x05,0x30]
1011 v_cvt_nearest_i32_f32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1012 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1014 v_cvt_nearest_i32_f32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1015 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1017 v_cvt_nearest_i32_f32_e64_dpp v5
, v1 row_mirror
1018 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1020 v_cvt_nearest_i32_f32_e64_dpp v5
, v1 row_half_mirror
1021 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1023 v_cvt_nearest_i32_f32_e64_dpp v5
, v1 row_shl
:1
1024 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1026 v_cvt_nearest_i32_f32_e64_dpp v5
, v1 row_shl
:15
1027 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1029 v_cvt_nearest_i32_f32_e64_dpp v5
, v1 row_shr
:1
1030 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1032 v_cvt_nearest_i32_f32_e64_dpp v5
, v1 row_shr
:15
1033 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1035 v_cvt_nearest_i32_f32_e64_dpp v5
, v1 row_ror
:1
1036 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1038 v_cvt_nearest_i32_f32_e64_dpp v5
, v1 row_ror
:15
1039 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1041 v_cvt_nearest_i32_f32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1042 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
1044 v_cvt_nearest_i32_f32_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1045 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
1047 v_cvt_nearest_i32_f32_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1048 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
1050 v_cvt_nearest_i32_f32_e64_dpp v255
, -|v255| row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1051 // GFX12
: [0xff,0x01,0x8c,0xd5,0xfa,0x00,0x00,0x20,0xff,0x6f,0x05,0x30]
1053 v_cvt_norm_i16_f16_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1054 // GFX12
: [0x05,0x00,0xe3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1056 v_cvt_norm_i16_f16_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1057 // GFX12
: [0x05,0x00,0xe3,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1059 v_cvt_norm_i16_f16_e64_dpp v5
, v1 row_mirror
1060 // GFX12
: [0x05,0x00,0xe3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1062 v_cvt_norm_i16_f16_e64_dpp v5
, v1 row_half_mirror
1063 // GFX12
: [0x05,0x00,0xe3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1065 v_cvt_norm_i16_f16_e64_dpp v5
, v1 row_shl
:1
1066 // GFX12
: [0x05,0x00,0xe3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1068 v_cvt_norm_i16_f16_e64_dpp v5
, v1 row_shl
:15
1069 // GFX12
: [0x05,0x00,0xe3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1071 v_cvt_norm_i16_f16_e64_dpp v5
, v1 row_shr
:1
1072 // GFX12
: [0x05,0x00,0xe3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1074 v_cvt_norm_i16_f16_e64_dpp v5
, v1 row_shr
:15
1075 // GFX12
: [0x05,0x00,0xe3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1077 v_cvt_norm_i16_f16_e64_dpp v5
, v1 row_ror
:1
1078 // GFX12
: [0x05,0x00,0xe3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1080 v_cvt_norm_i16_f16_e64_dpp v5
, v1 row_ror
:15
1081 // GFX12
: [0x05,0x00,0xe3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1083 v_cvt_norm_i16_f16_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1084 // GFX12
: [0x05,0x00,0xe3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
1086 v_cvt_norm_i16_f16_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1087 // GFX12
: [0x05,0x00,0xe3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
1089 v_cvt_norm_i16_f16_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1090 // GFX12
: [0x05,0x00,0xe3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
1092 v_cvt_norm_i16_f16_e64_dpp v255
, -|v255| row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1093 // GFX12
: [0xff,0x01,0xe3,0xd5,0xfa,0x00,0x00,0x20,0xff,0x6f,0x05,0x30]
1095 v_cvt_norm_u16_f16_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1096 // GFX12
: [0x05,0x00,0xe4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1098 v_cvt_norm_u16_f16_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1099 // GFX12
: [0x05,0x00,0xe4,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1101 v_cvt_norm_u16_f16_e64_dpp v5
, v1 row_mirror
1102 // GFX12
: [0x05,0x00,0xe4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1104 v_cvt_norm_u16_f16_e64_dpp v5
, v1 row_half_mirror
1105 // GFX12
: [0x05,0x00,0xe4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1107 v_cvt_norm_u16_f16_e64_dpp v5
, v1 row_shl
:1
1108 // GFX12
: [0x05,0x00,0xe4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1110 v_cvt_norm_u16_f16_e64_dpp v5
, v1 row_shl
:15
1111 // GFX12
: [0x05,0x00,0xe4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1113 v_cvt_norm_u16_f16_e64_dpp v5
, v1 row_shr
:1
1114 // GFX12
: [0x05,0x00,0xe4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1116 v_cvt_norm_u16_f16_e64_dpp v5
, v1 row_shr
:15
1117 // GFX12
: [0x05,0x00,0xe4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1119 v_cvt_norm_u16_f16_e64_dpp v5
, v1 row_ror
:1
1120 // GFX12
: [0x05,0x00,0xe4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1122 v_cvt_norm_u16_f16_e64_dpp v5
, v1 row_ror
:15
1123 // GFX12
: [0x05,0x00,0xe4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1125 v_cvt_norm_u16_f16_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1126 // GFX12
: [0x05,0x00,0xe4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
1128 v_cvt_norm_u16_f16_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1129 // GFX12
: [0x05,0x00,0xe4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
1131 v_cvt_norm_u16_f16_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1132 // GFX12
: [0x05,0x00,0xe4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
1134 v_cvt_norm_u16_f16_e64_dpp v255
, -|v255| row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1135 // GFX12
: [0xff,0x01,0xe4,0xd5,0xfa,0x00,0x00,0x20,0xff,0x6f,0x05,0x30]
1137 v_cvt_off_f32_i4_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1138 // GFX12
: [0x05,0x00,0x8e,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1140 v_cvt_off_f32_i4_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1141 // GFX12
: [0x05,0x00,0x8e,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1143 v_cvt_off_f32_i4_e64_dpp v5
, v1 row_mirror
1144 // GFX12
: [0x05,0x00,0x8e,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1146 v_cvt_off_f32_i4_e64_dpp v5
, v1 row_half_mirror
1147 // GFX12
: [0x05,0x00,0x8e,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1149 v_cvt_off_f32_i4_e64_dpp v5
, v1 row_shl
:1
1150 // GFX12
: [0x05,0x00,0x8e,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1152 v_cvt_off_f32_i4_e64_dpp v5
, v1 row_shl
:15
1153 // GFX12
: [0x05,0x00,0x8e,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1155 v_cvt_off_f32_i4_e64_dpp v5
, v1 row_shr
:1
1156 // GFX12
: [0x05,0x00,0x8e,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1158 v_cvt_off_f32_i4_e64_dpp v5
, v1 row_shr
:15
1159 // GFX12
: [0x05,0x00,0x8e,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1161 v_cvt_off_f32_i4_e64_dpp v5
, v1 row_ror
:1
1162 // GFX12
: [0x05,0x00,0x8e,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1164 v_cvt_off_f32_i4_e64_dpp v5
, v1 row_ror
:15
1165 // GFX12
: [0x05,0x00,0x8e,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1167 v_cvt_off_f32_i4_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1168 // GFX12
: [0x05,0x00,0x8e,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
1170 v_cvt_off_f32_i4_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1171 // GFX12
: [0x05,0x00,0x8e,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
1173 v_cvt_off_f32_i4_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1174 // GFX12
: [0x05,0x00,0x8e,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
1176 v_cvt_off_f32_i4_e64_dpp v255
, v255 clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1177 // GFX12
: [0xff,0x80,0x8e,0xd5,0xfa,0x00,0x00,0x18,0xff,0x6f,0x05,0x30]
1179 v_cvt_rpi_i32_f32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1180 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1182 v_cvt_rpi_i32_f32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1183 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1185 v_cvt_rpi_i32_f32_e64_dpp v5
, v1 row_mirror
1186 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1188 v_cvt_rpi_i32_f32_e64_dpp v5
, v1 row_half_mirror
1189 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1191 v_cvt_rpi_i32_f32_e64_dpp v5
, v1 row_shl
:1
1192 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1194 v_cvt_rpi_i32_f32_e64_dpp v5
, v1 row_shl
:15
1195 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1197 v_cvt_rpi_i32_f32_e64_dpp v5
, v1 row_shr
:1
1198 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1200 v_cvt_rpi_i32_f32_e64_dpp v5
, v1 row_shr
:15
1201 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1203 v_cvt_rpi_i32_f32_e64_dpp v5
, v1 row_ror
:1
1204 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1206 v_cvt_rpi_i32_f32_e64_dpp v5
, v1 row_ror
:15
1207 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1209 v_cvt_rpi_i32_f32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1210 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
1212 v_cvt_rpi_i32_f32_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1213 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
1215 v_cvt_rpi_i32_f32_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1216 // GFX12
: [0x05,0x00,0x8c,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
1218 v_cvt_rpi_i32_f32_e64_dpp v255
, -|v255| row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1219 // GFX12
: [0xff,0x01,0x8c,0xd5,0xfa,0x00,0x00,0x20,0xff,0x6f,0x05,0x30]
1221 v_cvt_u16_f16_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1222 // GFX12
: [0x05,0x00,0xd2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1224 v_cvt_u16_f16_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1225 // GFX12
: [0x05,0x00,0xd2,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1227 v_cvt_u16_f16_e64_dpp v5
, v1 row_mirror
1228 // GFX12
: [0x05,0x00,0xd2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1230 v_cvt_u16_f16_e64_dpp v5
, v1 row_half_mirror
1231 // GFX12
: [0x05,0x00,0xd2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1233 v_cvt_u16_f16_e64_dpp v5
, v1 row_shl
:1
1234 // GFX12
: [0x05,0x00,0xd2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1236 v_cvt_u16_f16_e64_dpp v5
, v1 row_shl
:15
1237 // GFX12
: [0x05,0x00,0xd2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1239 v_cvt_u16_f16_e64_dpp v5
, v1 row_shr
:1
1240 // GFX12
: [0x05,0x00,0xd2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1242 v_cvt_u16_f16_e64_dpp v5
, v1 row_shr
:15
1243 // GFX12
: [0x05,0x00,0xd2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1245 v_cvt_u16_f16_e64_dpp v5
, v1 row_ror
:1
1246 // GFX12
: [0x05,0x00,0xd2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1248 v_cvt_u16_f16_e64_dpp v5
, v1 row_ror
:15
1249 // GFX12
: [0x05,0x00,0xd2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1251 v_cvt_u16_f16_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1252 // GFX12
: [0x05,0x00,0xd2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
1254 v_cvt_u16_f16_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1255 // GFX12
: [0x05,0x00,0xd2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
1257 v_cvt_u16_f16_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1258 // GFX12
: [0x05,0x00,0xd2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
1260 v_cvt_u16_f16_e64_dpp v255
, -|v255| clamp row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1261 // GFX12
: [0xff,0x81,0xd2,0xd5,0xfa,0x00,0x00,0x20,0xff,0x6f,0x05,0x30]
1263 v_cvt_u32_f32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1264 // GFX12
: [0x05,0x00,0x87,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1266 v_cvt_u32_f32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1267 // GFX12
: [0x05,0x00,0x87,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1269 v_cvt_u32_f32_e64_dpp v5
, v1 row_mirror
1270 // GFX12
: [0x05,0x00,0x87,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1272 v_cvt_u32_f32_e64_dpp v5
, v1 row_half_mirror
1273 // GFX12
: [0x05,0x00,0x87,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1275 v_cvt_u32_f32_e64_dpp v5
, v1 row_shl
:1
1276 // GFX12
: [0x05,0x00,0x87,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1278 v_cvt_u32_f32_e64_dpp v5
, v1 row_shl
:15
1279 // GFX12
: [0x05,0x00,0x87,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1281 v_cvt_u32_f32_e64_dpp v5
, v1 row_shr
:1
1282 // GFX12
: [0x05,0x00,0x87,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1284 v_cvt_u32_f32_e64_dpp v5
, v1 row_shr
:15
1285 // GFX12
: [0x05,0x00,0x87,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1287 v_cvt_u32_f32_e64_dpp v5
, v1 row_ror
:1
1288 // GFX12
: [0x05,0x00,0x87,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1290 v_cvt_u32_f32_e64_dpp v5
, v1 row_ror
:15
1291 // GFX12
: [0x05,0x00,0x87,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1293 v_cvt_u32_f32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1294 // GFX12
: [0x05,0x00,0x87,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
1296 v_cvt_u32_f32_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1297 // GFX12
: [0x05,0x00,0x87,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
1299 v_cvt_u32_f32_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1300 // GFX12
: [0x05,0x00,0x87,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
1302 v_cvt_u32_f32_e64_dpp v255
, -|v255| clamp row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1303 // GFX12
: [0xff,0x81,0x87,0xd5,0xfa,0x00,0x00,0x20,0xff,0x6f,0x05,0x30]
1305 v_cvt_u32_u16_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1306 // GFX12
: [0x05,0x00,0xeb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1308 v_cvt_u32_u16_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1309 // GFX12
: [0x05,0x00,0xeb,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1311 v_cvt_u32_u16_e64_dpp v5
, v1 row_mirror
1312 // GFX12
: [0x05,0x00,0xeb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1314 v_cvt_u32_u16_e64_dpp v5
, v1 row_half_mirror
1315 // GFX12
: [0x05,0x00,0xeb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1317 v_cvt_u32_u16_e64_dpp v5
, v1 row_shl
:1
1318 // GFX12
: [0x05,0x00,0xeb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1320 v_cvt_u32_u16_e64_dpp v5
, v1 row_shl
:15
1321 // GFX12
: [0x05,0x00,0xeb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1323 v_cvt_u32_u16_e64_dpp v5
, v1 row_shr
:1
1324 // GFX12
: [0x05,0x00,0xeb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1326 v_cvt_u32_u16_e64_dpp v5
, v1 row_shr
:15
1327 // GFX12
: [0x05,0x00,0xeb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1329 v_cvt_u32_u16_e64_dpp v5
, v1 row_ror
:1
1330 // GFX12
: [0x05,0x00,0xeb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1332 v_cvt_u32_u16_e64_dpp v5
, v1 row_ror
:15
1333 // GFX12
: [0x05,0x00,0xeb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1335 v_cvt_u32_u16_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1336 // GFX12
: [0x05,0x00,0xeb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
1338 v_cvt_u32_u16_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1339 // GFX12
: [0x05,0x00,0xeb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
1341 v_cvt_u32_u16_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1342 // GFX12
: [0x05,0x00,0xeb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
1344 v_cvt_u32_u16_e64_dpp v255
, v255 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1345 // GFX12
: [0xff,0x00,0xeb,0xd5,0xfa,0x00,0x00,0x00,0xff,0x6f,0x05,0x30]
// v_exp_f16_e64_dpp v5, v1 under each DPP control in turn (quad_perm,
// row_mirror, row_half_mirror, row_shl, row_shr, row_ror, row_share,
// row_xmask). Across the unmodified cases only the last three expected bytes
// change; byte[2] is 0xd8 in every expected encoding of this group.
1347 v_exp_f16_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1348 // GFX12
: [0x05,0x00,0xd8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1350 v_exp_f16_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1351 // GFX12
: [0x05,0x00,0xd8,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1353 v_exp_f16_e64_dpp v5
, v1 row_mirror
1354 // GFX12
: [0x05,0x00,0xd8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1356 v_exp_f16_e64_dpp v5
, v1 row_half_mirror
1357 // GFX12
: [0x05,0x00,0xd8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1359 v_exp_f16_e64_dpp v5
, v1 row_shl
:1
1360 // GFX12
: [0x05,0x00,0xd8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1362 v_exp_f16_e64_dpp v5
, v1 row_shl
:15
1363 // GFX12
: [0x05,0x00,0xd8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1365 v_exp_f16_e64_dpp v5
, v1 row_shr
:1
1366 // GFX12
: [0x05,0x00,0xd8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1368 v_exp_f16_e64_dpp v5
, v1 row_shr
:15
1369 // GFX12
: [0x05,0x00,0xd8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1371 v_exp_f16_e64_dpp v5
, v1 row_ror
:1
1372 // GFX12
: [0x05,0x00,0xd8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1374 v_exp_f16_e64_dpp v5
, v1 row_ror
:15
1375 // GFX12
: [0x05,0x00,0xd8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1377 v_exp_f16_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1378 // GFX12
: [0x05,0x00,0xd8,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// Output modifiers: mul:2 and mul:4 set byte[7] to 0x08 and 0x10; the
// explicit row_mask/bank_mask values land in the final byte.
1380 v_exp_f16_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1381 // GFX12
: [0x05,0x00,0xd8,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
1383 v_exp_f16_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1384 // GFX12
: [0x05,0x00,0xd8,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
// v255 operands with -|v255|, clamp and div:2: byte[0] and byte[8] are 0xff,
// byte[1] is 0x81 and byte[7] is 0x38.
1386 v_exp_f16_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1387 // GFX12
: [0xff,0x81,0xd8,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_exp_f32_e64_dpp v5, v1 under each DPP control in turn (quad_perm,
// row_mirror, row_half_mirror, row_shl, row_shr, row_ror, row_share,
// row_xmask). Across the unmodified cases only the last three expected bytes
// change; byte[2] is 0xa5 in every expected encoding of this group.
1389 v_exp_f32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1390 // GFX12
: [0x05,0x00,0xa5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1392 v_exp_f32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1393 // GFX12
: [0x05,0x00,0xa5,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1395 v_exp_f32_e64_dpp v5
, v1 row_mirror
1396 // GFX12
: [0x05,0x00,0xa5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1398 v_exp_f32_e64_dpp v5
, v1 row_half_mirror
1399 // GFX12
: [0x05,0x00,0xa5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1401 v_exp_f32_e64_dpp v5
, v1 row_shl
:1
1402 // GFX12
: [0x05,0x00,0xa5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1404 v_exp_f32_e64_dpp v5
, v1 row_shl
:15
1405 // GFX12
: [0x05,0x00,0xa5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1407 v_exp_f32_e64_dpp v5
, v1 row_shr
:1
1408 // GFX12
: [0x05,0x00,0xa5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1410 v_exp_f32_e64_dpp v5
, v1 row_shr
:15
1411 // GFX12
: [0x05,0x00,0xa5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1413 v_exp_f32_e64_dpp v5
, v1 row_ror
:1
1414 // GFX12
: [0x05,0x00,0xa5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1416 v_exp_f32_e64_dpp v5
, v1 row_ror
:15
1417 // GFX12
: [0x05,0x00,0xa5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1419 v_exp_f32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1420 // GFX12
: [0x05,0x00,0xa5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// Output modifiers: mul:2 and mul:4 set byte[7] to 0x08 and 0x10; the
// explicit row_mask/bank_mask values land in the final byte.
1422 v_exp_f32_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1423 // GFX12
: [0x05,0x00,0xa5,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
1425 v_exp_f32_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1426 // GFX12
: [0x05,0x00,0xa5,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
// v255 operands with -|v255|, clamp and div:2: byte[0] and byte[8] are 0xff,
// byte[1] is 0x81 and byte[7] is 0x38.
1428 v_exp_f32_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1429 // GFX12
: [0xff,0x81,0xa5,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_ffbh_i32_e64_dpp v5, v1 under each DPP control in turn (quad_perm,
// row_mirror, row_half_mirror, row_shl, row_shr, row_ror, row_share,
// row_xmask). No source or output modifiers are exercised in this group;
// byte[2] is 0xbb in every expected encoding and only the last three bytes
// change between the v5, v1 cases.
1431 v_ffbh_i32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1432 // GFX12
: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1434 v_ffbh_i32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1435 // GFX12
: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1437 v_ffbh_i32_e64_dpp v5
, v1 row_mirror
1438 // GFX12
: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1440 v_ffbh_i32_e64_dpp v5
, v1 row_half_mirror
1441 // GFX12
: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1443 v_ffbh_i32_e64_dpp v5
, v1 row_shl
:1
1444 // GFX12
: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1446 v_ffbh_i32_e64_dpp v5
, v1 row_shl
:15
1447 // GFX12
: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1449 v_ffbh_i32_e64_dpp v5
, v1 row_shr
:1
1450 // GFX12
: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1452 v_ffbh_i32_e64_dpp v5
, v1 row_shr
:15
1453 // GFX12
: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1455 v_ffbh_i32_e64_dpp v5
, v1 row_ror
:1
1456 // GFX12
: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1458 v_ffbh_i32_e64_dpp v5
, v1 row_ror
:15
1459 // GFX12
: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1461 v_ffbh_i32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1462 // GFX12
: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// Explicit row_mask/bank_mask values land in the final byte.
1464 v_ffbh_i32_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1465 // GFX12
: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
1467 v_ffbh_i32_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1468 // GFX12
: [0x05,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
// v255 for both operands: byte[0] and byte[8] are 0xff.
1470 v_ffbh_i32_e64_dpp v255
, v255 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1471 // GFX12
: [0xff,0x00,0xbb,0xd5,0xfa,0x00,0x00,0x00,0xff,0x6f,0x05,0x30]
// v_ffbh_u32_e64_dpp v5, v1 under each DPP control in turn (quad_perm,
// row_mirror, row_half_mirror, row_shl, row_shr, row_ror, row_share,
// row_xmask). No source or output modifiers are exercised in this group;
// byte[2] is 0xb9 in every expected encoding and only the last three bytes
// change between the v5, v1 cases.
1473 v_ffbh_u32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1474 // GFX12
: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1476 v_ffbh_u32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1477 // GFX12
: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1479 v_ffbh_u32_e64_dpp v5
, v1 row_mirror
1480 // GFX12
: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1482 v_ffbh_u32_e64_dpp v5
, v1 row_half_mirror
1483 // GFX12
: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1485 v_ffbh_u32_e64_dpp v5
, v1 row_shl
:1
1486 // GFX12
: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1488 v_ffbh_u32_e64_dpp v5
, v1 row_shl
:15
1489 // GFX12
: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1491 v_ffbh_u32_e64_dpp v5
, v1 row_shr
:1
1492 // GFX12
: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1494 v_ffbh_u32_e64_dpp v5
, v1 row_shr
:15
1495 // GFX12
: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1497 v_ffbh_u32_e64_dpp v5
, v1 row_ror
:1
1498 // GFX12
: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1500 v_ffbh_u32_e64_dpp v5
, v1 row_ror
:15
1501 // GFX12
: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1503 v_ffbh_u32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1504 // GFX12
: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// Explicit row_mask/bank_mask values land in the final byte.
1506 v_ffbh_u32_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1507 // GFX12
: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
1509 v_ffbh_u32_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1510 // GFX12
: [0x05,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
// v255 for both operands: byte[0] and byte[8] are 0xff.
1512 v_ffbh_u32_e64_dpp v255
, v255 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1513 // GFX12
: [0xff,0x00,0xb9,0xd5,0xfa,0x00,0x00,0x00,0xff,0x6f,0x05,0x30]
// v_ffbl_b32_e64_dpp v5, v1 under each DPP control in turn (quad_perm,
// row_mirror, row_half_mirror, row_shl, row_shr, row_ror, row_share,
// row_xmask). No source or output modifiers are exercised in this group;
// byte[2] is 0xba in every expected encoding and only the last three bytes
// change between the v5, v1 cases.
1515 v_ffbl_b32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1516 // GFX12
: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1518 v_ffbl_b32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1519 // GFX12
: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1521 v_ffbl_b32_e64_dpp v5
, v1 row_mirror
1522 // GFX12
: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1524 v_ffbl_b32_e64_dpp v5
, v1 row_half_mirror
1525 // GFX12
: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1527 v_ffbl_b32_e64_dpp v5
, v1 row_shl
:1
1528 // GFX12
: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1530 v_ffbl_b32_e64_dpp v5
, v1 row_shl
:15
1531 // GFX12
: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1533 v_ffbl_b32_e64_dpp v5
, v1 row_shr
:1
1534 // GFX12
: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1536 v_ffbl_b32_e64_dpp v5
, v1 row_shr
:15
1537 // GFX12
: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1539 v_ffbl_b32_e64_dpp v5
, v1 row_ror
:1
1540 // GFX12
: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1542 v_ffbl_b32_e64_dpp v5
, v1 row_ror
:15
1543 // GFX12
: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1545 v_ffbl_b32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1546 // GFX12
: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// Explicit row_mask/bank_mask values land in the final byte.
1548 v_ffbl_b32_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1549 // GFX12
: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
1551 v_ffbl_b32_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1552 // GFX12
: [0x05,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
// v255 for both operands: byte[0] and byte[8] are 0xff.
1554 v_ffbl_b32_e64_dpp v255
, v255 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1555 // GFX12
: [0xff,0x00,0xba,0xd5,0xfa,0x00,0x00,0x00,0xff,0x6f,0x05,0x30]
// v_floor_f16_e64_dpp v5, v1 under each DPP control in turn (quad_perm,
// row_mirror, row_half_mirror, row_shl, row_shr, row_ror, row_share,
// row_xmask). Across the unmodified cases only the last three expected bytes
// change; byte[2] is 0xdb in every expected encoding of this group.
1557 v_floor_f16_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1558 // GFX12
: [0x05,0x00,0xdb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1560 v_floor_f16_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1561 // GFX12
: [0x05,0x00,0xdb,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1563 v_floor_f16_e64_dpp v5
, v1 row_mirror
1564 // GFX12
: [0x05,0x00,0xdb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1566 v_floor_f16_e64_dpp v5
, v1 row_half_mirror
1567 // GFX12
: [0x05,0x00,0xdb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1569 v_floor_f16_e64_dpp v5
, v1 row_shl
:1
1570 // GFX12
: [0x05,0x00,0xdb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1572 v_floor_f16_e64_dpp v5
, v1 row_shl
:15
1573 // GFX12
: [0x05,0x00,0xdb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1575 v_floor_f16_e64_dpp v5
, v1 row_shr
:1
1576 // GFX12
: [0x05,0x00,0xdb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1578 v_floor_f16_e64_dpp v5
, v1 row_shr
:15
1579 // GFX12
: [0x05,0x00,0xdb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1581 v_floor_f16_e64_dpp v5
, v1 row_ror
:1
1582 // GFX12
: [0x05,0x00,0xdb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1584 v_floor_f16_e64_dpp v5
, v1 row_ror
:15
1585 // GFX12
: [0x05,0x00,0xdb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1587 v_floor_f16_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1588 // GFX12
: [0x05,0x00,0xdb,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// Output modifiers: mul:2 and mul:4 set byte[7] to 0x08 and 0x10; the
// explicit row_mask/bank_mask values land in the final byte.
1590 v_floor_f16_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1591 // GFX12
: [0x05,0x00,0xdb,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
1593 v_floor_f16_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1594 // GFX12
: [0x05,0x00,0xdb,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
// v255 operands with -|v255|, clamp and div:2: byte[0] and byte[8] are 0xff,
// byte[1] is 0x81 and byte[7] is 0x38.
1596 v_floor_f16_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1597 // GFX12
: [0xff,0x81,0xdb,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_floor_f32_e64_dpp v5, v1 under each DPP control in turn (quad_perm,
// row_mirror, row_half_mirror, row_shl, row_shr, row_ror, row_share,
// row_xmask). Across the unmodified cases only the last three expected bytes
// change; byte[2] is 0xa4 in every expected encoding of this group.
1599 v_floor_f32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1600 // GFX12
: [0x05,0x00,0xa4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1602 v_floor_f32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1603 // GFX12
: [0x05,0x00,0xa4,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1605 v_floor_f32_e64_dpp v5
, v1 row_mirror
1606 // GFX12
: [0x05,0x00,0xa4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1608 v_floor_f32_e64_dpp v5
, v1 row_half_mirror
1609 // GFX12
: [0x05,0x00,0xa4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1611 v_floor_f32_e64_dpp v5
, v1 row_shl
:1
1612 // GFX12
: [0x05,0x00,0xa4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1614 v_floor_f32_e64_dpp v5
, v1 row_shl
:15
1615 // GFX12
: [0x05,0x00,0xa4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1617 v_floor_f32_e64_dpp v5
, v1 row_shr
:1
1618 // GFX12
: [0x05,0x00,0xa4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1620 v_floor_f32_e64_dpp v5
, v1 row_shr
:15
1621 // GFX12
: [0x05,0x00,0xa4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1623 v_floor_f32_e64_dpp v5
, v1 row_ror
:1
1624 // GFX12
: [0x05,0x00,0xa4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1626 v_floor_f32_e64_dpp v5
, v1 row_ror
:15
1627 // GFX12
: [0x05,0x00,0xa4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1629 v_floor_f32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1630 // GFX12
: [0x05,0x00,0xa4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// Output modifiers: mul:2 and mul:4 set byte[7] to 0x08 and 0x10; the
// explicit row_mask/bank_mask values land in the final byte.
1632 v_floor_f32_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1633 // GFX12
: [0x05,0x00,0xa4,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
1635 v_floor_f32_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1636 // GFX12
: [0x05,0x00,0xa4,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
// v255 operands with -|v255|, clamp and div:2: byte[0] and byte[8] are 0xff,
// byte[1] is 0x81 and byte[7] is 0x38.
1638 v_floor_f32_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1639 // GFX12
: [0xff,0x81,0xa4,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_fract_f16_e64_dpp v5, v1 under each DPP control in turn (quad_perm,
// row_mirror, row_half_mirror, row_shl, row_shr, row_ror, row_share,
// row_xmask). Across the unmodified cases only the last three expected bytes
// change; byte[2] is 0xdf in every expected encoding of this group.
1641 v_fract_f16_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1642 // GFX12
: [0x05,0x00,0xdf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1644 v_fract_f16_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1645 // GFX12
: [0x05,0x00,0xdf,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1647 v_fract_f16_e64_dpp v5
, v1 row_mirror
1648 // GFX12
: [0x05,0x00,0xdf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1650 v_fract_f16_e64_dpp v5
, v1 row_half_mirror
1651 // GFX12
: [0x05,0x00,0xdf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1653 v_fract_f16_e64_dpp v5
, v1 row_shl
:1
1654 // GFX12
: [0x05,0x00,0xdf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1656 v_fract_f16_e64_dpp v5
, v1 row_shl
:15
1657 // GFX12
: [0x05,0x00,0xdf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1659 v_fract_f16_e64_dpp v5
, v1 row_shr
:1
1660 // GFX12
: [0x05,0x00,0xdf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1662 v_fract_f16_e64_dpp v5
, v1 row_shr
:15
1663 // GFX12
: [0x05,0x00,0xdf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1665 v_fract_f16_e64_dpp v5
, v1 row_ror
:1
1666 // GFX12
: [0x05,0x00,0xdf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1668 v_fract_f16_e64_dpp v5
, v1 row_ror
:15
1669 // GFX12
: [0x05,0x00,0xdf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1671 v_fract_f16_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1672 // GFX12
: [0x05,0x00,0xdf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// Output modifiers: mul:2 and mul:4 set byte[7] to 0x08 and 0x10; the
// explicit row_mask/bank_mask values land in the final byte.
1674 v_fract_f16_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1675 // GFX12
: [0x05,0x00,0xdf,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
1677 v_fract_f16_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1678 // GFX12
: [0x05,0x00,0xdf,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
// v255 operands with -|v255|, clamp and div:2: byte[0] and byte[8] are 0xff,
// byte[1] is 0x81 and byte[7] is 0x38.
1680 v_fract_f16_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1681 // GFX12
: [0xff,0x81,0xdf,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_fract_f32_e64_dpp v5, v1 under each DPP control in turn (quad_perm,
// row_mirror, row_half_mirror, row_shl, row_shr, row_ror, row_share,
// row_xmask). Across the unmodified cases only the last three expected bytes
// change; byte[2] is 0xa0 in every expected encoding of this group.
1683 v_fract_f32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1684 // GFX12
: [0x05,0x00,0xa0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1686 v_fract_f32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1687 // GFX12
: [0x05,0x00,0xa0,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1689 v_fract_f32_e64_dpp v5
, v1 row_mirror
1690 // GFX12
: [0x05,0x00,0xa0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1692 v_fract_f32_e64_dpp v5
, v1 row_half_mirror
1693 // GFX12
: [0x05,0x00,0xa0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1695 v_fract_f32_e64_dpp v5
, v1 row_shl
:1
1696 // GFX12
: [0x05,0x00,0xa0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1698 v_fract_f32_e64_dpp v5
, v1 row_shl
:15
1699 // GFX12
: [0x05,0x00,0xa0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1701 v_fract_f32_e64_dpp v5
, v1 row_shr
:1
1702 // GFX12
: [0x05,0x00,0xa0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1704 v_fract_f32_e64_dpp v5
, v1 row_shr
:15
1705 // GFX12
: [0x05,0x00,0xa0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1707 v_fract_f32_e64_dpp v5
, v1 row_ror
:1
1708 // GFX12
: [0x05,0x00,0xa0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1710 v_fract_f32_e64_dpp v5
, v1 row_ror
:15
1711 // GFX12
: [0x05,0x00,0xa0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1713 v_fract_f32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1714 // GFX12
: [0x05,0x00,0xa0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// Output modifiers: mul:2 and mul:4 set byte[7] to 0x08 and 0x10; the
// explicit row_mask/bank_mask values land in the final byte.
1716 v_fract_f32_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1717 // GFX12
: [0x05,0x00,0xa0,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
1719 v_fract_f32_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1720 // GFX12
: [0x05,0x00,0xa0,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
// v255 operands with -|v255|, clamp and div:2: byte[0] and byte[8] are 0xff,
// byte[1] is 0x81 and byte[7] is 0x38.
1722 v_fract_f32_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1723 // GFX12
: [0xff,0x81,0xa0,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_frexp_exp_i16_f16_e64_dpp v5, v1 under each DPP control in turn
// (quad_perm, row_mirror, row_half_mirror, row_shl, row_shr, row_ror,
// row_share, row_xmask). No mul/div or clamp cases appear in this group;
// byte[2] is 0xda in every expected encoding and only the last three bytes
// change between the v5, v1 cases.
1725 v_frexp_exp_i16_f16_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1726 // GFX12
: [0x05,0x00,0xda,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1728 v_frexp_exp_i16_f16_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1729 // GFX12
: [0x05,0x00,0xda,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1731 v_frexp_exp_i16_f16_e64_dpp v5
, v1 row_mirror
1732 // GFX12
: [0x05,0x00,0xda,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1734 v_frexp_exp_i16_f16_e64_dpp v5
, v1 row_half_mirror
1735 // GFX12
: [0x05,0x00,0xda,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1737 v_frexp_exp_i16_f16_e64_dpp v5
, v1 row_shl
:1
1738 // GFX12
: [0x05,0x00,0xda,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1740 v_frexp_exp_i16_f16_e64_dpp v5
, v1 row_shl
:15
1741 // GFX12
: [0x05,0x00,0xda,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1743 v_frexp_exp_i16_f16_e64_dpp v5
, v1 row_shr
:1
1744 // GFX12
: [0x05,0x00,0xda,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1746 v_frexp_exp_i16_f16_e64_dpp v5
, v1 row_shr
:15
1747 // GFX12
: [0x05,0x00,0xda,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1749 v_frexp_exp_i16_f16_e64_dpp v5
, v1 row_ror
:1
1750 // GFX12
: [0x05,0x00,0xda,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1752 v_frexp_exp_i16_f16_e64_dpp v5
, v1 row_ror
:15
1753 // GFX12
: [0x05,0x00,0xda,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1755 v_frexp_exp_i16_f16_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1756 // GFX12
: [0x05,0x00,0xda,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// Explicit row_mask/bank_mask values land in the final byte.
1758 v_frexp_exp_i16_f16_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1759 // GFX12
: [0x05,0x00,0xda,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
1761 v_frexp_exp_i16_f16_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1762 // GFX12
: [0x05,0x00,0xda,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
// v255 operands with -|v255|: byte[0] and byte[8] are 0xff, byte[1] is 0x01
// and byte[7] is 0x20.
1764 v_frexp_exp_i16_f16_e64_dpp v255
, -|v255| row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1765 // GFX12
: [0xff,0x01,0xda,0xd5,0xfa,0x00,0x00,0x20,0xff,0x6f,0x05,0x30]
// v_frexp_exp_i32_f32_e64_dpp v5, v1 under each DPP control in turn
// (quad_perm, row_mirror, row_half_mirror, row_shl, row_shr, row_ror,
// row_share, row_xmask). No mul/div or clamp cases appear in this group;
// byte[2] is 0xbf in every expected encoding and only the last three bytes
// change between the v5, v1 cases.
1767 v_frexp_exp_i32_f32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1768 // GFX12
: [0x05,0x00,0xbf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1770 v_frexp_exp_i32_f32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1771 // GFX12
: [0x05,0x00,0xbf,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1773 v_frexp_exp_i32_f32_e64_dpp v5
, v1 row_mirror
1774 // GFX12
: [0x05,0x00,0xbf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1776 v_frexp_exp_i32_f32_e64_dpp v5
, v1 row_half_mirror
1777 // GFX12
: [0x05,0x00,0xbf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1779 v_frexp_exp_i32_f32_e64_dpp v5
, v1 row_shl
:1
1780 // GFX12
: [0x05,0x00,0xbf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1782 v_frexp_exp_i32_f32_e64_dpp v5
, v1 row_shl
:15
1783 // GFX12
: [0x05,0x00,0xbf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1785 v_frexp_exp_i32_f32_e64_dpp v5
, v1 row_shr
:1
1786 // GFX12
: [0x05,0x00,0xbf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1788 v_frexp_exp_i32_f32_e64_dpp v5
, v1 row_shr
:15
1789 // GFX12
: [0x05,0x00,0xbf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1791 v_frexp_exp_i32_f32_e64_dpp v5
, v1 row_ror
:1
1792 // GFX12
: [0x05,0x00,0xbf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1794 v_frexp_exp_i32_f32_e64_dpp v5
, v1 row_ror
:15
1795 // GFX12
: [0x05,0x00,0xbf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1797 v_frexp_exp_i32_f32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1798 // GFX12
: [0x05,0x00,0xbf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// Explicit row_mask/bank_mask values land in the final byte.
1800 v_frexp_exp_i32_f32_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1801 // GFX12
: [0x05,0x00,0xbf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
1803 v_frexp_exp_i32_f32_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1804 // GFX12
: [0x05,0x00,0xbf,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
// v255 operands with -|v255|: byte[0] and byte[8] are 0xff, byte[1] is 0x01
// and byte[7] is 0x20.
1806 v_frexp_exp_i32_f32_e64_dpp v255
, -|v255| row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1807 // GFX12
: [0xff,0x01,0xbf,0xd5,0xfa,0x00,0x00,0x20,0xff,0x6f,0x05,0x30]
// v_frexp_mant_f16_e64_dpp v5, v1 under each DPP control in turn (quad_perm,
// row_mirror, row_half_mirror, row_shl, row_shr, row_ror, row_share,
// row_xmask). Across the unmodified cases only the last three expected bytes
// change; byte[2] is 0xd9 in every expected encoding of this group.
1809 v_frexp_mant_f16_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1810 // GFX12
: [0x05,0x00,0xd9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1812 v_frexp_mant_f16_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1813 // GFX12
: [0x05,0x00,0xd9,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1815 v_frexp_mant_f16_e64_dpp v5
, v1 row_mirror
1816 // GFX12
: [0x05,0x00,0xd9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1818 v_frexp_mant_f16_e64_dpp v5
, v1 row_half_mirror
1819 // GFX12
: [0x05,0x00,0xd9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1821 v_frexp_mant_f16_e64_dpp v5
, v1 row_shl
:1
1822 // GFX12
: [0x05,0x00,0xd9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1824 v_frexp_mant_f16_e64_dpp v5
, v1 row_shl
:15
1825 // GFX12
: [0x05,0x00,0xd9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1827 v_frexp_mant_f16_e64_dpp v5
, v1 row_shr
:1
1828 // GFX12
: [0x05,0x00,0xd9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1830 v_frexp_mant_f16_e64_dpp v5
, v1 row_shr
:15
1831 // GFX12
: [0x05,0x00,0xd9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1833 v_frexp_mant_f16_e64_dpp v5
, v1 row_ror
:1
1834 // GFX12
: [0x05,0x00,0xd9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1836 v_frexp_mant_f16_e64_dpp v5
, v1 row_ror
:15
1837 // GFX12
: [0x05,0x00,0xd9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1839 v_frexp_mant_f16_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1840 // GFX12
: [0x05,0x00,0xd9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// Output modifiers: mul:2 and mul:4 set byte[7] to 0x08 and 0x10; the
// explicit row_mask/bank_mask values land in the final byte.
1842 v_frexp_mant_f16_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1843 // GFX12
: [0x05,0x00,0xd9,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
1845 v_frexp_mant_f16_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1846 // GFX12
: [0x05,0x00,0xd9,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
// v255 operands with -|v255|, clamp and div:2: byte[0] and byte[8] are 0xff,
// byte[1] is 0x81 and byte[7] is 0x38.
1848 v_frexp_mant_f16_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1849 // GFX12
: [0xff,0x81,0xd9,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_frexp_mant_f32_e64_dpp v5, v1 under each DPP control in turn (quad_perm,
// row_mirror, row_half_mirror, row_shl, row_shr, row_ror, row_share,
// row_xmask). Across the unmodified cases only the last three expected bytes
// change; byte[2] is 0xc0 in every expected encoding of this group.
1851 v_frexp_mant_f32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1852 // GFX12
: [0x05,0x00,0xc0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1854 v_frexp_mant_f32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1855 // GFX12
: [0x05,0x00,0xc0,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1857 v_frexp_mant_f32_e64_dpp v5
, v1 row_mirror
1858 // GFX12
: [0x05,0x00,0xc0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1860 v_frexp_mant_f32_e64_dpp v5
, v1 row_half_mirror
1861 // GFX12
: [0x05,0x00,0xc0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1863 v_frexp_mant_f32_e64_dpp v5
, v1 row_shl
:1
1864 // GFX12
: [0x05,0x00,0xc0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1866 v_frexp_mant_f32_e64_dpp v5
, v1 row_shl
:15
1867 // GFX12
: [0x05,0x00,0xc0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1869 v_frexp_mant_f32_e64_dpp v5
, v1 row_shr
:1
1870 // GFX12
: [0x05,0x00,0xc0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1872 v_frexp_mant_f32_e64_dpp v5
, v1 row_shr
:15
1873 // GFX12
: [0x05,0x00,0xc0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1875 v_frexp_mant_f32_e64_dpp v5
, v1 row_ror
:1
1876 // GFX12
: [0x05,0x00,0xc0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1878 v_frexp_mant_f32_e64_dpp v5
, v1 row_ror
:15
1879 // GFX12
: [0x05,0x00,0xc0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1881 v_frexp_mant_f32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1882 // GFX12
: [0x05,0x00,0xc0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// Output modifiers: mul:2 and mul:4 set byte[7] to 0x08 and 0x10; the
// explicit row_mask/bank_mask values land in the final byte.
1884 v_frexp_mant_f32_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1885 // GFX12
: [0x05,0x00,0xc0,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
1887 v_frexp_mant_f32_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1888 // GFX12
: [0x05,0x00,0xc0,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
// v255 operands with -|v255|, clamp and div:2: byte[0] and byte[8] are 0xff,
// byte[1] is 0x81 and byte[7] is 0x38.
1890 v_frexp_mant_f32_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1891 // GFX12
: [0xff,0x81,0xc0,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_log_f16_e64_dpp v5, v1 under each DPP control in turn (quad_perm,
// row_mirror, row_half_mirror, row_shl, row_shr, row_ror, row_share,
// row_xmask). Across the unmodified cases only the last three expected bytes
// change; byte[2] is 0xd7 in every expected encoding of this group.
1893 v_log_f16_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1894 // GFX12
: [0x05,0x00,0xd7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1896 v_log_f16_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1897 // GFX12
: [0x05,0x00,0xd7,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1899 v_log_f16_e64_dpp v5
, v1 row_mirror
1900 // GFX12
: [0x05,0x00,0xd7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1902 v_log_f16_e64_dpp v5
, v1 row_half_mirror
1903 // GFX12
: [0x05,0x00,0xd7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1905 v_log_f16_e64_dpp v5
, v1 row_shl
:1
1906 // GFX12
: [0x05,0x00,0xd7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1908 v_log_f16_e64_dpp v5
, v1 row_shl
:15
1909 // GFX12
: [0x05,0x00,0xd7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1911 v_log_f16_e64_dpp v5
, v1 row_shr
:1
1912 // GFX12
: [0x05,0x00,0xd7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1914 v_log_f16_e64_dpp v5
, v1 row_shr
:15
1915 // GFX12
: [0x05,0x00,0xd7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1917 v_log_f16_e64_dpp v5
, v1 row_ror
:1
1918 // GFX12
: [0x05,0x00,0xd7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1920 v_log_f16_e64_dpp v5
, v1 row_ror
:15
1921 // GFX12
: [0x05,0x00,0xd7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1923 v_log_f16_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1924 // GFX12
: [0x05,0x00,0xd7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// Output modifiers: mul:2 and mul:4 set byte[7] to 0x08 and 0x10; the
// explicit row_mask/bank_mask values land in the final byte.
1926 v_log_f16_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1927 // GFX12
: [0x05,0x00,0xd7,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
1929 v_log_f16_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1930 // GFX12
: [0x05,0x00,0xd7,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
// v255 operands with -|v255|, clamp and div:2: byte[0] and byte[8] are 0xff,
// byte[1] is 0x81 and byte[7] is 0x38.
1932 v_log_f16_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1933 // GFX12
: [0xff,0x81,0xd7,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_log_f32_e64_dpp v5, v1 under each DPP control in turn (quad_perm,
// row_mirror, row_half_mirror, row_shl, row_shr, row_ror, row_share,
// row_xmask). Across the unmodified cases only the last three expected bytes
// change; byte[2] is 0xa7 in every expected encoding of this group.
1935 v_log_f32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1936 // GFX12
: [0x05,0x00,0xa7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1938 v_log_f32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1939 // GFX12
: [0x05,0x00,0xa7,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1941 v_log_f32_e64_dpp v5
, v1 row_mirror
1942 // GFX12
: [0x05,0x00,0xa7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1944 v_log_f32_e64_dpp v5
, v1 row_half_mirror
1945 // GFX12
: [0x05,0x00,0xa7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1947 v_log_f32_e64_dpp v5
, v1 row_shl
:1
1948 // GFX12
: [0x05,0x00,0xa7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1950 v_log_f32_e64_dpp v5
, v1 row_shl
:15
1951 // GFX12
: [0x05,0x00,0xa7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1953 v_log_f32_e64_dpp v5
, v1 row_shr
:1
1954 // GFX12
: [0x05,0x00,0xa7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1956 v_log_f32_e64_dpp v5
, v1 row_shr
:15
1957 // GFX12
: [0x05,0x00,0xa7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
1959 v_log_f32_e64_dpp v5
, v1 row_ror
:1
1960 // GFX12
: [0x05,0x00,0xa7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
1962 v_log_f32_e64_dpp v5
, v1 row_ror
:15
1963 // GFX12
: [0x05,0x00,0xa7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
1965 v_log_f32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
1966 // GFX12
: [0x05,0x00,0xa7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// Output modifiers: mul:2 and mul:4 set byte[7] to 0x08 and 0x10; the
// explicit row_mask/bank_mask values land in the final byte.
1968 v_log_f32_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
1969 // GFX12
: [0x05,0x00,0xa7,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
1971 v_log_f32_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
1972 // GFX12
: [0x05,0x00,0xa7,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
// v255 operands with -|v255|, clamp and div:2: byte[0] and byte[8] are 0xff,
// byte[1] is 0x81 and byte[7] is 0x38.
1974 v_log_f32_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
1975 // GFX12
: [0xff,0x81,0xa7,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_mov_b32_e64_dpp v5, v1 under each DPP control in turn (quad_perm,
// row_mirror, row_half_mirror, row_shl, row_shr, row_ror, row_share,
// row_xmask). No source or output modifiers are exercised in this group;
// byte[2] is 0x81 in every expected encoding and only the last three bytes
// change between the v5, v1 cases.
1977 v_mov_b32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
1978 // GFX12
: [0x05,0x00,0x81,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
1980 v_mov_b32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
1981 // GFX12
: [0x05,0x00,0x81,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
1983 v_mov_b32_e64_dpp v5
, v1 row_mirror
1984 // GFX12
: [0x05,0x00,0x81,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
1986 v_mov_b32_e64_dpp v5
, v1 row_half_mirror
1987 // GFX12
: [0x05,0x00,0x81,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
1989 v_mov_b32_e64_dpp v5
, v1 row_shl
:1
1990 // GFX12
: [0x05,0x00,0x81,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
1992 v_mov_b32_e64_dpp v5
, v1 row_shl
:15
1993 // GFX12
: [0x05,0x00,0x81,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
1995 v_mov_b32_e64_dpp v5
, v1 row_shr
:1
1996 // GFX12
: [0x05,0x00,0x81,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
1998 v_mov_b32_e64_dpp v5
, v1 row_shr
:15
1999 // GFX12
: [0x05,0x00,0x81,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
2001 v_mov_b32_e64_dpp v5
, v1 row_ror
:1
2002 // GFX12
: [0x05,0x00,0x81,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
2004 v_mov_b32_e64_dpp v5
, v1 row_ror
:15
2005 // GFX12
: [0x05,0x00,0x81,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
2007 v_mov_b32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
2008 // GFX12
: [0x05,0x00,0x81,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// Explicit row_mask/bank_mask values land in the final byte.
2010 v_mov_b32_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
2011 // GFX12
: [0x05,0x00,0x81,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
2013 v_mov_b32_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
2014 // GFX12
: [0x05,0x00,0x81,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
// v255 for both operands: byte[0] and byte[8] are 0xff.
2016 v_mov_b32_e64_dpp v255
, v255 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
2017 // GFX12
: [0xff,0x00,0x81,0xd5,0xfa,0x00,0x00,0x00,0xff,0x6f,0x05,0x30]
// v_movrels_b32_e64_dpp v5, v1 under each DPP control in turn (quad_perm,
// row_mirror, row_half_mirror, row_shl, row_shr, row_ror, row_share,
// row_xmask). No source or output modifiers are exercised in this group;
// byte[2] is 0xc3 in every expected encoding and only the last three bytes
// change between the v5, v1 cases.
2019 v_movrels_b32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
2020 // GFX12
: [0x05,0x00,0xc3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
2022 v_movrels_b32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
2023 // GFX12
: [0x05,0x00,0xc3,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
2025 v_movrels_b32_e64_dpp v5
, v1 row_mirror
2026 // GFX12
: [0x05,0x00,0xc3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
2028 v_movrels_b32_e64_dpp v5
, v1 row_half_mirror
2029 // GFX12
: [0x05,0x00,0xc3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
2031 v_movrels_b32_e64_dpp v5
, v1 row_shl
:1
2032 // GFX12
: [0x05,0x00,0xc3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
2034 v_movrels_b32_e64_dpp v5
, v1 row_shl
:15
2035 // GFX12
: [0x05,0x00,0xc3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
2037 v_movrels_b32_e64_dpp v5
, v1 row_shr
:1
2038 // GFX12
: [0x05,0x00,0xc3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
2040 v_movrels_b32_e64_dpp v5
, v1 row_shr
:15
2041 // GFX12
: [0x05,0x00,0xc3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
2043 v_movrels_b32_e64_dpp v5
, v1 row_ror
:1
2044 // GFX12
: [0x05,0x00,0xc3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
2046 v_movrels_b32_e64_dpp v5
, v1 row_ror
:15
2047 // GFX12
: [0x05,0x00,0xc3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
2049 v_movrels_b32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
2050 // GFX12
: [0x05,0x00,0xc3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// Explicit row_mask/bank_mask values land in the final byte.
2052 v_movrels_b32_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
2053 // GFX12
: [0x05,0x00,0xc3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
2055 v_movrels_b32_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
2056 // GFX12
: [0x05,0x00,0xc3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
// v255 for both operands: byte[0] and byte[8] are 0xff.
2058 v_movrels_b32_e64_dpp v255
, v255 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
2059 // GFX12
: [0xff,0x00,0xc3,0xd5,0xfa,0x00,0x00,0x00,0xff,0x6f,0x05,0x30]
// v_not_b16_e64_dpp: assembly cases paired with the encoding bytes that
// llvm-mc is expected to print. The third byte is 0xe9 throughout this group.
// The first ten cases vary only the DPP control (quad_perm, row_mirror,
// row_half_mirror, row_shl/row_shr/row_ror) and the last byte stays 0xff.
2061 v_not_b16_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
2062 // GFX12
: [0x05,0x00,0xe9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
2064 v_not_b16_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
2065 // GFX12
: [0x05,0x00,0xe9,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
2067 v_not_b16_e64_dpp v5
, v1 row_mirror
2068 // GFX12
: [0x05,0x00,0xe9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
2070 v_not_b16_e64_dpp v5
, v1 row_half_mirror
2071 // GFX12
: [0x05,0x00,0xe9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
2073 v_not_b16_e64_dpp v5
, v1 row_shl
:1
2074 // GFX12
: [0x05,0x00,0xe9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
2076 v_not_b16_e64_dpp v5
, v1 row_shl
:15
2077 // GFX12
: [0x05,0x00,0xe9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
2079 v_not_b16_e64_dpp v5
, v1 row_shr
:1
2080 // GFX12
: [0x05,0x00,0xe9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
2082 v_not_b16_e64_dpp v5
, v1 row_shr
:15
2083 // GFX12
: [0x05,0x00,0xe9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
2085 v_not_b16_e64_dpp v5
, v1 row_ror
:1
2086 // GFX12
: [0x05,0x00,0xe9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
2088 v_not_b16_e64_dpp v5
, v1 row_ror
:15
2089 // GFX12
: [0x05,0x00,0xe9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
// From here on row_mask/bank_mask are spelled out, then bound_ctrl and fi are
// added; those operands are reflected in the final two encoding bytes.
2091 v_not_b16_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
2092 // GFX12
: [0x05,0x00,0xe9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
2094 v_not_b16_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
2095 // GFX12
: [0x05,0x00,0xe9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
2097 v_not_b16_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
2098 // GFX12
: [0x05,0x00,0xe9,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
2100 v_not_b16_e64_dpp v255
, v255 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
2101 // GFX12
: [0xff,0x00,0xe9,0xd5,0xfa,0x00,0x00,0x00,0xff,0x6f,0x05,0x30]
// v_not_b32_e64_dpp: assembly cases paired with the encoding bytes that
// llvm-mc is expected to print. The third byte is 0xb7 throughout this group.
// The first ten cases vary only the DPP control (quad_perm, row_mirror,
// row_half_mirror, row_shl/row_shr/row_ror) and the last byte stays 0xff.
2103 v_not_b32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
2104 // GFX12
: [0x05,0x00,0xb7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
2106 v_not_b32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
2107 // GFX12
: [0x05,0x00,0xb7,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
2109 v_not_b32_e64_dpp v5
, v1 row_mirror
2110 // GFX12
: [0x05,0x00,0xb7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
2112 v_not_b32_e64_dpp v5
, v1 row_half_mirror
2113 // GFX12
: [0x05,0x00,0xb7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
2115 v_not_b32_e64_dpp v5
, v1 row_shl
:1
2116 // GFX12
: [0x05,0x00,0xb7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
2118 v_not_b32_e64_dpp v5
, v1 row_shl
:15
2119 // GFX12
: [0x05,0x00,0xb7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
2121 v_not_b32_e64_dpp v5
, v1 row_shr
:1
2122 // GFX12
: [0x05,0x00,0xb7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
2124 v_not_b32_e64_dpp v5
, v1 row_shr
:15
2125 // GFX12
: [0x05,0x00,0xb7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
2127 v_not_b32_e64_dpp v5
, v1 row_ror
:1
2128 // GFX12
: [0x05,0x00,0xb7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
2130 v_not_b32_e64_dpp v5
, v1 row_ror
:15
2131 // GFX12
: [0x05,0x00,0xb7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
// From here on row_mask/bank_mask are spelled out, then bound_ctrl and fi are
// added; those operands are reflected in the final two encoding bytes.
2133 v_not_b32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
2134 // GFX12
: [0x05,0x00,0xb7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
2136 v_not_b32_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
2137 // GFX12
: [0x05,0x00,0xb7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
2139 v_not_b32_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
2140 // GFX12
: [0x05,0x00,0xb7,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
2142 v_not_b32_e64_dpp v255
, v255 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
2143 // GFX12
: [0xff,0x00,0xb7,0xd5,0xfa,0x00,0x00,0x00,0xff,0x6f,0x05,0x30]
// v_rcp_f16_e64_dpp: assembly cases paired with the encoding bytes that
// llvm-mc is expected to print. The third byte is 0xd4 throughout this group.
// The first ten cases vary only the DPP control (quad_perm, row_mirror,
// row_half_mirror, row_shl/row_shr/row_ror) and the last byte stays 0xff.
2145 v_rcp_f16_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
2146 // GFX12
: [0x05,0x00,0xd4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
2148 v_rcp_f16_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
2149 // GFX12
: [0x05,0x00,0xd4,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
2151 v_rcp_f16_e64_dpp v5
, v1 row_mirror
2152 // GFX12
: [0x05,0x00,0xd4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
2154 v_rcp_f16_e64_dpp v5
, v1 row_half_mirror
2155 // GFX12
: [0x05,0x00,0xd4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
2157 v_rcp_f16_e64_dpp v5
, v1 row_shl
:1
2158 // GFX12
: [0x05,0x00,0xd4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
2160 v_rcp_f16_e64_dpp v5
, v1 row_shl
:15
2161 // GFX12
: [0x05,0x00,0xd4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
2163 v_rcp_f16_e64_dpp v5
, v1 row_shr
:1
2164 // GFX12
: [0x05,0x00,0xd4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
2166 v_rcp_f16_e64_dpp v5
, v1 row_shr
:15
2167 // GFX12
: [0x05,0x00,0xd4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
2169 v_rcp_f16_e64_dpp v5
, v1 row_ror
:1
2170 // GFX12
: [0x05,0x00,0xd4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
2172 v_rcp_f16_e64_dpp v5
, v1 row_ror
:15
2173 // GFX12
: [0x05,0x00,0xd4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
// From here on row_mask/bank_mask are spelled out, then bound_ctrl and fi are
// added; those operands are reflected in the final two encoding bytes.
2175 v_rcp_f16_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
2176 // GFX12
: [0x05,0x00,0xd4,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// The last three cases also carry output modifiers: mul:2 and mul:4 give 0x08
// and 0x10 in the eighth byte, and the v255 case with -|v255|, clamp and div:2
// gives 0x81 in the second byte and 0x38 in the eighth.
2178 v_rcp_f16_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
2179 // GFX12
: [0x05,0x00,0xd4,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
2181 v_rcp_f16_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
2182 // GFX12
: [0x05,0x00,0xd4,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
2184 v_rcp_f16_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
2185 // GFX12
: [0xff,0x81,0xd4,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_rcp_f32_e64_dpp: assembly cases paired with the encoding bytes that
// llvm-mc is expected to print. The third byte is 0xaa throughout this group.
// The first ten cases vary only the DPP control (quad_perm, row_mirror,
// row_half_mirror, row_shl/row_shr/row_ror) and the last byte stays 0xff.
2187 v_rcp_f32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
2188 // GFX12
: [0x05,0x00,0xaa,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
2190 v_rcp_f32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
2191 // GFX12
: [0x05,0x00,0xaa,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
2193 v_rcp_f32_e64_dpp v5
, v1 row_mirror
2194 // GFX12
: [0x05,0x00,0xaa,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
2196 v_rcp_f32_e64_dpp v5
, v1 row_half_mirror
2197 // GFX12
: [0x05,0x00,0xaa,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
2199 v_rcp_f32_e64_dpp v5
, v1 row_shl
:1
2200 // GFX12
: [0x05,0x00,0xaa,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
2202 v_rcp_f32_e64_dpp v5
, v1 row_shl
:15
2203 // GFX12
: [0x05,0x00,0xaa,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
2205 v_rcp_f32_e64_dpp v5
, v1 row_shr
:1
2206 // GFX12
: [0x05,0x00,0xaa,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
2208 v_rcp_f32_e64_dpp v5
, v1 row_shr
:15
2209 // GFX12
: [0x05,0x00,0xaa,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
2211 v_rcp_f32_e64_dpp v5
, v1 row_ror
:1
2212 // GFX12
: [0x05,0x00,0xaa,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
2214 v_rcp_f32_e64_dpp v5
, v1 row_ror
:15
2215 // GFX12
: [0x05,0x00,0xaa,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
// From here on row_mask/bank_mask are spelled out, then bound_ctrl and fi are
// added; those operands are reflected in the final two encoding bytes.
2217 v_rcp_f32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
2218 // GFX12
: [0x05,0x00,0xaa,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// The last three cases also carry output modifiers: mul:2 and mul:4 give 0x08
// and 0x10 in the eighth byte, and the v255 case with -|v255|, clamp and div:2
// gives 0x81 in the second byte and 0x38 in the eighth.
2220 v_rcp_f32_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
2221 // GFX12
: [0x05,0x00,0xaa,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
2223 v_rcp_f32_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
2224 // GFX12
: [0x05,0x00,0xaa,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
2226 v_rcp_f32_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
2227 // GFX12
: [0xff,0x81,0xaa,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_rcp_iflag_f32_e64_dpp: assembly cases paired with the encoding bytes that
// llvm-mc is expected to print. The third byte is 0xab throughout this group.
// The first ten cases vary only the DPP control (quad_perm, row_mirror,
// row_half_mirror, row_shl/row_shr/row_ror) and the last byte stays 0xff.
2229 v_rcp_iflag_f32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
2230 // GFX12
: [0x05,0x00,0xab,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
2232 v_rcp_iflag_f32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
2233 // GFX12
: [0x05,0x00,0xab,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
2235 v_rcp_iflag_f32_e64_dpp v5
, v1 row_mirror
2236 // GFX12
: [0x05,0x00,0xab,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
2238 v_rcp_iflag_f32_e64_dpp v5
, v1 row_half_mirror
2239 // GFX12
: [0x05,0x00,0xab,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
2241 v_rcp_iflag_f32_e64_dpp v5
, v1 row_shl
:1
2242 // GFX12
: [0x05,0x00,0xab,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
2244 v_rcp_iflag_f32_e64_dpp v5
, v1 row_shl
:15
2245 // GFX12
: [0x05,0x00,0xab,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
2247 v_rcp_iflag_f32_e64_dpp v5
, v1 row_shr
:1
2248 // GFX12
: [0x05,0x00,0xab,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
2250 v_rcp_iflag_f32_e64_dpp v5
, v1 row_shr
:15
2251 // GFX12
: [0x05,0x00,0xab,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
2253 v_rcp_iflag_f32_e64_dpp v5
, v1 row_ror
:1
2254 // GFX12
: [0x05,0x00,0xab,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
2256 v_rcp_iflag_f32_e64_dpp v5
, v1 row_ror
:15
2257 // GFX12
: [0x05,0x00,0xab,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
// From here on row_mask/bank_mask are spelled out, then bound_ctrl and fi are
// added; those operands are reflected in the final two encoding bytes.
2259 v_rcp_iflag_f32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
2260 // GFX12
: [0x05,0x00,0xab,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// The last three cases also carry output modifiers: mul:2 and mul:4 give 0x08
// and 0x10 in the eighth byte, and the v255 case with -|v255|, clamp and div:2
// gives 0x81 in the second byte and 0x38 in the eighth.
2262 v_rcp_iflag_f32_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
2263 // GFX12
: [0x05,0x00,0xab,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
2265 v_rcp_iflag_f32_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
2266 // GFX12
: [0x05,0x00,0xab,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
2268 v_rcp_iflag_f32_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
2269 // GFX12
: [0xff,0x81,0xab,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_rndne_f16_e64_dpp: assembly cases paired with the encoding bytes that
// llvm-mc is expected to print. The third byte is 0xde throughout this group.
// The first ten cases vary only the DPP control (quad_perm, row_mirror,
// row_half_mirror, row_shl/row_shr/row_ror) and the last byte stays 0xff.
2271 v_rndne_f16_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
2272 // GFX12
: [0x05,0x00,0xde,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
2274 v_rndne_f16_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
2275 // GFX12
: [0x05,0x00,0xde,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
2277 v_rndne_f16_e64_dpp v5
, v1 row_mirror
2278 // GFX12
: [0x05,0x00,0xde,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
2280 v_rndne_f16_e64_dpp v5
, v1 row_half_mirror
2281 // GFX12
: [0x05,0x00,0xde,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
2283 v_rndne_f16_e64_dpp v5
, v1 row_shl
:1
2284 // GFX12
: [0x05,0x00,0xde,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
2286 v_rndne_f16_e64_dpp v5
, v1 row_shl
:15
2287 // GFX12
: [0x05,0x00,0xde,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
2289 v_rndne_f16_e64_dpp v5
, v1 row_shr
:1
2290 // GFX12
: [0x05,0x00,0xde,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
2292 v_rndne_f16_e64_dpp v5
, v1 row_shr
:15
2293 // GFX12
: [0x05,0x00,0xde,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
2295 v_rndne_f16_e64_dpp v5
, v1 row_ror
:1
2296 // GFX12
: [0x05,0x00,0xde,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
2298 v_rndne_f16_e64_dpp v5
, v1 row_ror
:15
2299 // GFX12
: [0x05,0x00,0xde,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
// From here on row_mask/bank_mask are spelled out, then bound_ctrl and fi are
// added; those operands are reflected in the final two encoding bytes.
2301 v_rndne_f16_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
2302 // GFX12
: [0x05,0x00,0xde,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// The last three cases also carry output modifiers: mul:2 and mul:4 give 0x08
// and 0x10 in the eighth byte, and the v255 case with -|v255|, clamp and div:2
// gives 0x81 in the second byte and 0x38 in the eighth.
2304 v_rndne_f16_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
2305 // GFX12
: [0x05,0x00,0xde,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
2307 v_rndne_f16_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
2308 // GFX12
: [0x05,0x00,0xde,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
2310 v_rndne_f16_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
2311 // GFX12
: [0xff,0x81,0xde,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_rndne_f32_e64_dpp: assembly cases paired with the encoding bytes that
// llvm-mc is expected to print. The third byte is 0xa3 throughout this group.
// The first ten cases vary only the DPP control (quad_perm, row_mirror,
// row_half_mirror, row_shl/row_shr/row_ror) and the last byte stays 0xff.
2313 v_rndne_f32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
2314 // GFX12
: [0x05,0x00,0xa3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
2316 v_rndne_f32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
2317 // GFX12
: [0x05,0x00,0xa3,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
2319 v_rndne_f32_e64_dpp v5
, v1 row_mirror
2320 // GFX12
: [0x05,0x00,0xa3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
2322 v_rndne_f32_e64_dpp v5
, v1 row_half_mirror
2323 // GFX12
: [0x05,0x00,0xa3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
2325 v_rndne_f32_e64_dpp v5
, v1 row_shl
:1
2326 // GFX12
: [0x05,0x00,0xa3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
2328 v_rndne_f32_e64_dpp v5
, v1 row_shl
:15
2329 // GFX12
: [0x05,0x00,0xa3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
2331 v_rndne_f32_e64_dpp v5
, v1 row_shr
:1
2332 // GFX12
: [0x05,0x00,0xa3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
2334 v_rndne_f32_e64_dpp v5
, v1 row_shr
:15
2335 // GFX12
: [0x05,0x00,0xa3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
2337 v_rndne_f32_e64_dpp v5
, v1 row_ror
:1
2338 // GFX12
: [0x05,0x00,0xa3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
2340 v_rndne_f32_e64_dpp v5
, v1 row_ror
:15
2341 // GFX12
: [0x05,0x00,0xa3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
// From here on row_mask/bank_mask are spelled out, then bound_ctrl and fi are
// added; those operands are reflected in the final two encoding bytes.
2343 v_rndne_f32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
2344 // GFX12
: [0x05,0x00,0xa3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// The last three cases also carry output modifiers: mul:2 and mul:4 give 0x08
// and 0x10 in the eighth byte, and the v255 case with -|v255|, clamp and div:2
// gives 0x81 in the second byte and 0x38 in the eighth.
2346 v_rndne_f32_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
2347 // GFX12
: [0x05,0x00,0xa3,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
2349 v_rndne_f32_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
2350 // GFX12
: [0x05,0x00,0xa3,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
2352 v_rndne_f32_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
2353 // GFX12
: [0xff,0x81,0xa3,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_rsq_f16_e64_dpp: assembly cases paired with the encoding bytes that
// llvm-mc is expected to print. The third byte is 0xd6 throughout this group.
// The first ten cases vary only the DPP control (quad_perm, row_mirror,
// row_half_mirror, row_shl/row_shr/row_ror) and the last byte stays 0xff.
2355 v_rsq_f16_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
2356 // GFX12
: [0x05,0x00,0xd6,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
2358 v_rsq_f16_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
2359 // GFX12
: [0x05,0x00,0xd6,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
2361 v_rsq_f16_e64_dpp v5
, v1 row_mirror
2362 // GFX12
: [0x05,0x00,0xd6,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
2364 v_rsq_f16_e64_dpp v5
, v1 row_half_mirror
2365 // GFX12
: [0x05,0x00,0xd6,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
2367 v_rsq_f16_e64_dpp v5
, v1 row_shl
:1
2368 // GFX12
: [0x05,0x00,0xd6,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
2370 v_rsq_f16_e64_dpp v5
, v1 row_shl
:15
2371 // GFX12
: [0x05,0x00,0xd6,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
2373 v_rsq_f16_e64_dpp v5
, v1 row_shr
:1
2374 // GFX12
: [0x05,0x00,0xd6,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
2376 v_rsq_f16_e64_dpp v5
, v1 row_shr
:15
2377 // GFX12
: [0x05,0x00,0xd6,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
2379 v_rsq_f16_e64_dpp v5
, v1 row_ror
:1
2380 // GFX12
: [0x05,0x00,0xd6,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
2382 v_rsq_f16_e64_dpp v5
, v1 row_ror
:15
2383 // GFX12
: [0x05,0x00,0xd6,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
// From here on row_mask/bank_mask are spelled out, then bound_ctrl and fi are
// added; those operands are reflected in the final two encoding bytes.
2385 v_rsq_f16_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
2386 // GFX12
: [0x05,0x00,0xd6,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// The last three cases also carry output modifiers: mul:2 and mul:4 give 0x08
// and 0x10 in the eighth byte, and the v255 case with -|v255|, clamp and div:2
// gives 0x81 in the second byte and 0x38 in the eighth.
2388 v_rsq_f16_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
2389 // GFX12
: [0x05,0x00,0xd6,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
2391 v_rsq_f16_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
2392 // GFX12
: [0x05,0x00,0xd6,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
2394 v_rsq_f16_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
2395 // GFX12
: [0xff,0x81,0xd6,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_rsq_f32_e64_dpp: assembly cases paired with the encoding bytes that
// llvm-mc is expected to print. The third byte is 0xae throughout this group.
// The first ten cases vary only the DPP control (quad_perm, row_mirror,
// row_half_mirror, row_shl/row_shr/row_ror) and the last byte stays 0xff.
2397 v_rsq_f32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
2398 // GFX12
: [0x05,0x00,0xae,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
2400 v_rsq_f32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
2401 // GFX12
: [0x05,0x00,0xae,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
2403 v_rsq_f32_e64_dpp v5
, v1 row_mirror
2404 // GFX12
: [0x05,0x00,0xae,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
2406 v_rsq_f32_e64_dpp v5
, v1 row_half_mirror
2407 // GFX12
: [0x05,0x00,0xae,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
2409 v_rsq_f32_e64_dpp v5
, v1 row_shl
:1
2410 // GFX12
: [0x05,0x00,0xae,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
2412 v_rsq_f32_e64_dpp v5
, v1 row_shl
:15
2413 // GFX12
: [0x05,0x00,0xae,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
2415 v_rsq_f32_e64_dpp v5
, v1 row_shr
:1
2416 // GFX12
: [0x05,0x00,0xae,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
2418 v_rsq_f32_e64_dpp v5
, v1 row_shr
:15
2419 // GFX12
: [0x05,0x00,0xae,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
2421 v_rsq_f32_e64_dpp v5
, v1 row_ror
:1
2422 // GFX12
: [0x05,0x00,0xae,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
2424 v_rsq_f32_e64_dpp v5
, v1 row_ror
:15
2425 // GFX12
: [0x05,0x00,0xae,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
// From here on row_mask/bank_mask are spelled out, then bound_ctrl and fi are
// added; those operands are reflected in the final two encoding bytes.
2427 v_rsq_f32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
2428 // GFX12
: [0x05,0x00,0xae,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// The last three cases also carry output modifiers: mul:2 and mul:4 give 0x08
// and 0x10 in the eighth byte, and the v255 case with -|v255|, clamp and div:2
// gives 0x81 in the second byte and 0x38 in the eighth.
2430 v_rsq_f32_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
2431 // GFX12
: [0x05,0x00,0xae,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
2433 v_rsq_f32_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
2434 // GFX12
: [0x05,0x00,0xae,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
2436 v_rsq_f32_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
2437 // GFX12
: [0xff,0x81,0xae,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_sat_pk_u8_i16_e64_dpp: assembly cases paired with the encoding bytes that
// llvm-mc is expected to print. The third byte is 0xe2 throughout this group.
// The first ten cases vary only the DPP control (quad_perm, row_mirror,
// row_half_mirror, row_shl/row_shr/row_ror) and the last byte stays 0xff.
2439 v_sat_pk_u8_i16_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
2440 // GFX12
: [0x05,0x00,0xe2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
2442 v_sat_pk_u8_i16_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
2443 // GFX12
: [0x05,0x00,0xe2,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
2445 v_sat_pk_u8_i16_e64_dpp v5
, v1 row_mirror
2446 // GFX12
: [0x05,0x00,0xe2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
2448 v_sat_pk_u8_i16_e64_dpp v5
, v1 row_half_mirror
2449 // GFX12
: [0x05,0x00,0xe2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
2451 v_sat_pk_u8_i16_e64_dpp v5
, v1 row_shl
:1
2452 // GFX12
: [0x05,0x00,0xe2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
2454 v_sat_pk_u8_i16_e64_dpp v5
, v1 row_shl
:15
2455 // GFX12
: [0x05,0x00,0xe2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
2457 v_sat_pk_u8_i16_e64_dpp v5
, v1 row_shr
:1
2458 // GFX12
: [0x05,0x00,0xe2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
2460 v_sat_pk_u8_i16_e64_dpp v5
, v1 row_shr
:15
2461 // GFX12
: [0x05,0x00,0xe2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
2463 v_sat_pk_u8_i16_e64_dpp v5
, v1 row_ror
:1
2464 // GFX12
: [0x05,0x00,0xe2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
2466 v_sat_pk_u8_i16_e64_dpp v5
, v1 row_ror
:15
2467 // GFX12
: [0x05,0x00,0xe2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
// From here on row_mask/bank_mask are spelled out, then bound_ctrl and fi are
// added; those operands are reflected in the final two encoding bytes.
2469 v_sat_pk_u8_i16_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
2470 // GFX12
: [0x05,0x00,0xe2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
2472 v_sat_pk_u8_i16_e64_dpp v5
, v1 row_share
:15 row_mask
:0x0 bank_mask
:0x1
2473 // GFX12
: [0x05,0x00,0xe2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x5f,0x01,0x01]
2475 v_sat_pk_u8_i16_e64_dpp v5
, v1 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
2476 // GFX12
: [0x05,0x00,0xe2,0xd5,0xfa,0x00,0x00,0x00,0x01,0x60,0x09,0x13]
2478 v_sat_pk_u8_i16_e64_dpp v255
, v255 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
2479 // GFX12
: [0xff,0x00,0xe2,0xd5,0xfa,0x00,0x00,0x00,0xff,0x6f,0x05,0x30]
// v_sin_f16_e64_dpp: assembly cases paired with the encoding bytes that
// llvm-mc is expected to print. The third byte is 0xe0 throughout this group.
// The first ten cases vary only the DPP control (quad_perm, row_mirror,
// row_half_mirror, row_shl/row_shr/row_ror) and the last byte stays 0xff.
2481 v_sin_f16_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
2482 // GFX12
: [0x05,0x00,0xe0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
2484 v_sin_f16_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
2485 // GFX12
: [0x05,0x00,0xe0,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
2487 v_sin_f16_e64_dpp v5
, v1 row_mirror
2488 // GFX12
: [0x05,0x00,0xe0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
2490 v_sin_f16_e64_dpp v5
, v1 row_half_mirror
2491 // GFX12
: [0x05,0x00,0xe0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
2493 v_sin_f16_e64_dpp v5
, v1 row_shl
:1
2494 // GFX12
: [0x05,0x00,0xe0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
2496 v_sin_f16_e64_dpp v5
, v1 row_shl
:15
2497 // GFX12
: [0x05,0x00,0xe0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
2499 v_sin_f16_e64_dpp v5
, v1 row_shr
:1
2500 // GFX12
: [0x05,0x00,0xe0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
2502 v_sin_f16_e64_dpp v5
, v1 row_shr
:15
2503 // GFX12
: [0x05,0x00,0xe0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
2505 v_sin_f16_e64_dpp v5
, v1 row_ror
:1
2506 // GFX12
: [0x05,0x00,0xe0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
2508 v_sin_f16_e64_dpp v5
, v1 row_ror
:15
2509 // GFX12
: [0x05,0x00,0xe0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
// From here on row_mask/bank_mask are spelled out, then bound_ctrl and fi are
// added; those operands are reflected in the final two encoding bytes.
2511 v_sin_f16_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
2512 // GFX12
: [0x05,0x00,0xe0,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// The last three cases also carry output modifiers: mul:2 and mul:4 give 0x08
// and 0x10 in the eighth byte, and the v255 case with -|v255|, clamp and div:2
// gives 0x81 in the second byte and 0x38 in the eighth.
2514 v_sin_f16_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
2515 // GFX12
: [0x05,0x00,0xe0,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
2517 v_sin_f16_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
2518 // GFX12
: [0x05,0x00,0xe0,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
2520 v_sin_f16_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
2521 // GFX12
: [0xff,0x81,0xe0,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_sin_f32_e64_dpp: assembly cases paired with the encoding bytes that
// llvm-mc is expected to print. The third byte is 0xb5 throughout this group.
// The first ten cases vary only the DPP control (quad_perm, row_mirror,
// row_half_mirror, row_shl/row_shr/row_ror) and the last byte stays 0xff.
2523 v_sin_f32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
2524 // GFX12
: [0x05,0x00,0xb5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
2526 v_sin_f32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
2527 // GFX12
: [0x05,0x00,0xb5,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
2529 v_sin_f32_e64_dpp v5
, v1 row_mirror
2530 // GFX12
: [0x05,0x00,0xb5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
2532 v_sin_f32_e64_dpp v5
, v1 row_half_mirror
2533 // GFX12
: [0x05,0x00,0xb5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
2535 v_sin_f32_e64_dpp v5
, v1 row_shl
:1
2536 // GFX12
: [0x05,0x00,0xb5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
2538 v_sin_f32_e64_dpp v5
, v1 row_shl
:15
2539 // GFX12
: [0x05,0x00,0xb5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
2541 v_sin_f32_e64_dpp v5
, v1 row_shr
:1
2542 // GFX12
: [0x05,0x00,0xb5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
2544 v_sin_f32_e64_dpp v5
, v1 row_shr
:15
2545 // GFX12
: [0x05,0x00,0xb5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
2547 v_sin_f32_e64_dpp v5
, v1 row_ror
:1
2548 // GFX12
: [0x05,0x00,0xb5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
2550 v_sin_f32_e64_dpp v5
, v1 row_ror
:15
2551 // GFX12
: [0x05,0x00,0xb5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
// From here on row_mask/bank_mask are spelled out, then bound_ctrl and fi are
// added; those operands are reflected in the final two encoding bytes.
2553 v_sin_f32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
2554 // GFX12
: [0x05,0x00,0xb5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// The last three cases also carry output modifiers: mul:2 and mul:4 give 0x08
// and 0x10 in the eighth byte, and the v255 case with -|v255|, clamp and div:2
// gives 0x81 in the second byte and 0x38 in the eighth.
2556 v_sin_f32_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
2557 // GFX12
: [0x05,0x00,0xb5,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
2559 v_sin_f32_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
2560 // GFX12
: [0x05,0x00,0xb5,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
2562 v_sin_f32_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
2563 // GFX12
: [0xff,0x81,0xb5,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_sqrt_f16_e64_dpp: assembly cases paired with the encoding bytes that
// llvm-mc is expected to print. The third byte is 0xd5 throughout this group.
// The first ten cases vary only the DPP control (quad_perm, row_mirror,
// row_half_mirror, row_shl/row_shr/row_ror) and the last byte stays 0xff.
2565 v_sqrt_f16_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
2566 // GFX12
: [0x05,0x00,0xd5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
2568 v_sqrt_f16_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
2569 // GFX12
: [0x05,0x00,0xd5,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
2571 v_sqrt_f16_e64_dpp v5
, v1 row_mirror
2572 // GFX12
: [0x05,0x00,0xd5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
2574 v_sqrt_f16_e64_dpp v5
, v1 row_half_mirror
2575 // GFX12
: [0x05,0x00,0xd5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
2577 v_sqrt_f16_e64_dpp v5
, v1 row_shl
:1
2578 // GFX12
: [0x05,0x00,0xd5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
2580 v_sqrt_f16_e64_dpp v5
, v1 row_shl
:15
2581 // GFX12
: [0x05,0x00,0xd5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
2583 v_sqrt_f16_e64_dpp v5
, v1 row_shr
:1
2584 // GFX12
: [0x05,0x00,0xd5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
2586 v_sqrt_f16_e64_dpp v5
, v1 row_shr
:15
2587 // GFX12
: [0x05,0x00,0xd5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
2589 v_sqrt_f16_e64_dpp v5
, v1 row_ror
:1
2590 // GFX12
: [0x05,0x00,0xd5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
2592 v_sqrt_f16_e64_dpp v5
, v1 row_ror
:15
2593 // GFX12
: [0x05,0x00,0xd5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
// From here on row_mask/bank_mask are spelled out, then bound_ctrl and fi are
// added; those operands are reflected in the final two encoding bytes.
2595 v_sqrt_f16_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
2596 // GFX12
: [0x05,0x00,0xd5,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// The last three cases also carry output modifiers: mul:2 and mul:4 give 0x08
// and 0x10 in the eighth byte, and the v255 case with -|v255|, clamp and div:2
// gives 0x81 in the second byte and 0x38 in the eighth.
2598 v_sqrt_f16_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
2599 // GFX12
: [0x05,0x00,0xd5,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
2601 v_sqrt_f16_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
2602 // GFX12
: [0x05,0x00,0xd5,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
2604 v_sqrt_f16_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
2605 // GFX12
: [0xff,0x81,0xd5,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_sqrt_f32_e64_dpp: assembly cases paired with the encoding bytes that
// llvm-mc is expected to print. The third byte is 0xb3 throughout this group.
// The first ten cases vary only the DPP control (quad_perm, row_mirror,
// row_half_mirror, row_shl/row_shr/row_ror) and the last byte stays 0xff.
2607 v_sqrt_f32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
2608 // GFX12
: [0x05,0x00,0xb3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
2610 v_sqrt_f32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
2611 // GFX12
: [0x05,0x00,0xb3,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
2613 v_sqrt_f32_e64_dpp v5
, v1 row_mirror
2614 // GFX12
: [0x05,0x00,0xb3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
2616 v_sqrt_f32_e64_dpp v5
, v1 row_half_mirror
2617 // GFX12
: [0x05,0x00,0xb3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
2619 v_sqrt_f32_e64_dpp v5
, v1 row_shl
:1
2620 // GFX12
: [0x05,0x00,0xb3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
2622 v_sqrt_f32_e64_dpp v5
, v1 row_shl
:15
2623 // GFX12
: [0x05,0x00,0xb3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
2625 v_sqrt_f32_e64_dpp v5
, v1 row_shr
:1
2626 // GFX12
: [0x05,0x00,0xb3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
2628 v_sqrt_f32_e64_dpp v5
, v1 row_shr
:15
2629 // GFX12
: [0x05,0x00,0xb3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
2631 v_sqrt_f32_e64_dpp v5
, v1 row_ror
:1
2632 // GFX12
: [0x05,0x00,0xb3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
2634 v_sqrt_f32_e64_dpp v5
, v1 row_ror
:15
2635 // GFX12
: [0x05,0x00,0xb3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
// From here on row_mask/bank_mask are spelled out, then bound_ctrl and fi are
// added; those operands are reflected in the final two encoding bytes.
2637 v_sqrt_f32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
2638 // GFX12
: [0x05,0x00,0xb3,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// The last three cases also carry output modifiers: mul:2 and mul:4 give 0x08
// and 0x10 in the eighth byte, and the v255 case with -|v255|, clamp and div:2
// gives 0x81 in the second byte and 0x38 in the eighth.
2640 v_sqrt_f32_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
2641 // GFX12
: [0x05,0x00,0xb3,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
2643 v_sqrt_f32_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
2644 // GFX12
: [0x05,0x00,0xb3,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
2646 v_sqrt_f32_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
2647 // GFX12
: [0xff,0x81,0xb3,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_trunc_f16_e64_dpp: assembly cases paired with the encoding bytes that
// llvm-mc is expected to print. The third byte is 0xdd throughout this group.
// The first ten cases vary only the DPP control (quad_perm, row_mirror,
// row_half_mirror, row_shl/row_shr/row_ror) and the last byte stays 0xff.
2649 v_trunc_f16_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
2650 // GFX12
: [0x05,0x00,0xdd,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
2652 v_trunc_f16_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
2653 // GFX12
: [0x05,0x00,0xdd,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
2655 v_trunc_f16_e64_dpp v5
, v1 row_mirror
2656 // GFX12
: [0x05,0x00,0xdd,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
2658 v_trunc_f16_e64_dpp v5
, v1 row_half_mirror
2659 // GFX12
: [0x05,0x00,0xdd,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
2661 v_trunc_f16_e64_dpp v5
, v1 row_shl
:1
2662 // GFX12
: [0x05,0x00,0xdd,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
2664 v_trunc_f16_e64_dpp v5
, v1 row_shl
:15
2665 // GFX12
: [0x05,0x00,0xdd,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
2667 v_trunc_f16_e64_dpp v5
, v1 row_shr
:1
2668 // GFX12
: [0x05,0x00,0xdd,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
2670 v_trunc_f16_e64_dpp v5
, v1 row_shr
:15
2671 // GFX12
: [0x05,0x00,0xdd,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
2673 v_trunc_f16_e64_dpp v5
, v1 row_ror
:1
2674 // GFX12
: [0x05,0x00,0xdd,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
2676 v_trunc_f16_e64_dpp v5
, v1 row_ror
:15
2677 // GFX12
: [0x05,0x00,0xdd,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
// From here on row_mask/bank_mask are spelled out, then bound_ctrl and fi are
// added; those operands are reflected in the final two encoding bytes.
2679 v_trunc_f16_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
2680 // GFX12
: [0x05,0x00,0xdd,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// The last three cases also carry output modifiers: mul:2 and mul:4 give 0x08
// and 0x10 in the eighth byte, and the v255 case with -|v255|, clamp and div:2
// gives 0x81 in the second byte and 0x38 in the eighth.
2682 v_trunc_f16_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
2683 // GFX12
: [0x05,0x00,0xdd,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
2685 v_trunc_f16_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
2686 // GFX12
: [0x05,0x00,0xdd,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
2688 v_trunc_f16_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
2689 // GFX12
: [0xff,0x81,0xdd,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]
// v_trunc_f32_e64_dpp: assembly cases paired with the encoding bytes that
// llvm-mc is expected to print. The third byte is 0xa1 throughout this group.
// The first ten cases vary only the DPP control (quad_perm, row_mirror,
// row_half_mirror, row_shl/row_shr/row_ror) and the last byte stays 0xff.
2691 v_trunc_f32_e64_dpp v5
, v1 quad_perm
:[3,2,1,0]
2692 // GFX12
: [0x05,0x00,0xa1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1b,0x00,0xff]
2694 v_trunc_f32_e64_dpp v5
, v1 quad_perm
:[0,1,2,3]
2695 // GFX12
: [0x05,0x00,0xa1,0xd5,0xfa,0x00,0x00,0x00,0x01,0xe4,0x00,0xff]
2697 v_trunc_f32_e64_dpp v5
, v1 row_mirror
2698 // GFX12
: [0x05,0x00,0xa1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x40,0x01,0xff]
2700 v_trunc_f32_e64_dpp v5
, v1 row_half_mirror
2701 // GFX12
: [0x05,0x00,0xa1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x41,0x01,0xff]
2703 v_trunc_f32_e64_dpp v5
, v1 row_shl
:1
2704 // GFX12
: [0x05,0x00,0xa1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x01,0x01,0xff]
2706 v_trunc_f32_e64_dpp v5
, v1 row_shl
:15
2707 // GFX12
: [0x05,0x00,0xa1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x0f,0x01,0xff]
2709 v_trunc_f32_e64_dpp v5
, v1 row_shr
:1
2710 // GFX12
: [0x05,0x00,0xa1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x11,0x01,0xff]
2712 v_trunc_f32_e64_dpp v5
, v1 row_shr
:15
2713 // GFX12
: [0x05,0x00,0xa1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x1f,0x01,0xff]
2715 v_trunc_f32_e64_dpp v5
, v1 row_ror
:1
2716 // GFX12
: [0x05,0x00,0xa1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x21,0x01,0xff]
2718 v_trunc_f32_e64_dpp v5
, v1 row_ror
:15
2719 // GFX12
: [0x05,0x00,0xa1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x2f,0x01,0xff]
// From here on row_mask/bank_mask are spelled out, then bound_ctrl and fi are
// added; those operands are reflected in the final two encoding bytes.
2721 v_trunc_f32_e64_dpp v5
, v1 row_share
:0 row_mask
:0xf bank_mask
:0xf
2722 // GFX12
: [0x05,0x00,0xa1,0xd5,0xfa,0x00,0x00,0x00,0x01,0x50,0x01,0xff]
// The last three cases also carry output modifiers: mul:2 and mul:4 give 0x08
// and 0x10 in the eighth byte, and the v255 case with -|v255|, clamp and div:2
// gives 0x81 in the second byte and 0x38 in the eighth.
2724 v_trunc_f32_e64_dpp v5
, v1
mul:2 row_share
:15 row_mask
:0x0 bank_mask
:0x1
2725 // GFX12
: [0x05,0x00,0xa1,0xd5,0xfa,0x00,0x00,0x08,0x01,0x5f,0x01,0x01]
2727 v_trunc_f32_e64_dpp v5
, v1
mul:4 row_xmask
:0 row_mask
:0x1 bank_mask
:0x3 bound_ctrl
:1 fi
:0
2728 // GFX12
: [0x05,0x00,0xa1,0xd5,0xfa,0x00,0x00,0x10,0x01,0x60,0x09,0x13]
2730 v_trunc_f32_e64_dpp v255
, -|v255| clamp
div:2 row_xmask
:15 row_mask
:0x3 bank_mask
:0x0 bound_ctrl
:0 fi
:1
2731 // GFX12
: [0xff,0x81,0xa1,0xd5,0xfa,0x00,0x00,0x38,0xff,0x6f,0x05,0x30]