Run DCE after a LoopFlatten test to reduce spurious output [nfc]
[llvm-project.git] / llvm / test / MC / AMDGPU / gfx10_asm_flat.s
blob7340e48db3e84b6b6bef05a9c6916d688ed14223
// The same input is assembled twice: once with wavefrontsize32 enabled and
// wavefrontsize64 disabled, and once the other way round. Both invocations are
// verified against one shared check prefix, so every expected encoding in this
// file has to hold in both modes.
1 // RUN: llvm-mc -triple=amdgcn -mcpu=gfx1010 -mattr=+wavefrontsize32,-wavefrontsize64 -show-encoding %s | FileCheck --check-prefix=GFX10 %s
2 // RUN: llvm-mc -triple=amdgcn -mcpu=gfx1010 -mattr=-wavefrontsize32,+wavefrontsize64 -show-encoding %s | FileCheck --check-prefix=GFX10 %s
4 //===----------------------------------------------------------------------===//
5 // ENC_FLAT.
6 //===----------------------------------------------------------------------===//
// flat_load_* cases: register operands start at v5 and use the pair v[1:2],
// with no modifiers. Across these cases only the third expected byte changes;
// the other seven bytes are identical in every check.
// Note that dwordx3 expects 0x3c while dwordx4 expects 0x38, so the third-byte
// values are not monotonic in access width.
8 flat_load_ubyte v5, v[1:2]
9 // GFX10: encoding: [0x00,0x00,0x20,0xdc,0x01,0x00,0x7d,0x05]
11 flat_load_sbyte v5, v[1:2]
12 // GFX10: encoding: [0x00,0x00,0x24,0xdc,0x01,0x00,0x7d,0x05]
14 flat_load_ushort v5, v[1:2]
15 // GFX10: encoding: [0x00,0x00,0x28,0xdc,0x01,0x00,0x7d,0x05]
17 flat_load_sshort v5, v[1:2]
18 // GFX10: encoding: [0x00,0x00,0x2c,0xdc,0x01,0x00,0x7d,0x05]
20 flat_load_dword v5, v[1:2]
21 // GFX10: encoding: [0x00,0x00,0x30,0xdc,0x01,0x00,0x7d,0x05]
23 flat_load_dwordx2 v[5:6], v[1:2]
24 // GFX10: encoding: [0x00,0x00,0x34,0xdc,0x01,0x00,0x7d,0x05]
26 flat_load_dwordx3 v[5:7], v[1:2]
27 // GFX10: encoding: [0x00,0x00,0x3c,0xdc,0x01,0x00,0x7d,0x05]
29 flat_load_dwordx4 v[5:8], v[1:2]
30 // GFX10: encoding: [0x00,0x00,0x38,0xdc,0x01,0x00,0x7d,0x05]
// flat_store_* cases: the pair v[1:2] comes first, followed by a register
// operand starting at v2. Only the third expected byte differs between cases.
// As with the loads, dwordx3 (0x7c) and dwordx4 (0x78) are not in ascending
// order.
32 flat_store_byte v[1:2], v2
33 // GFX10: encoding: [0x00,0x00,0x60,0xdc,0x01,0x02,0x7d,0x00]
35 flat_store_short v[1:2], v2
36 // GFX10: encoding: [0x00,0x00,0x68,0xdc,0x01,0x02,0x7d,0x00]
38 flat_store_dword v[1:2], v2
39 // GFX10: encoding: [0x00,0x00,0x70,0xdc,0x01,0x02,0x7d,0x00]
41 flat_store_dwordx2 v[1:2], v[2:3]
42 // GFX10: encoding: [0x00,0x00,0x74,0xdc,0x01,0x02,0x7d,0x00]
44 flat_store_dwordx3 v[1:2], v[2:4]
45 // GFX10: encoding: [0x00,0x00,0x7c,0xdc,0x01,0x02,0x7d,0x00]
47 flat_store_dwordx4 v[1:2], v[2:5]
48 // GFX10: encoding: [0x00,0x00,0x78,0xdc,0x01,0x02,0x7d,0x00]
// flat_atomic_* cases without modifiers. The first group expects 0xdc in the
// fourth byte; the _x2 group that follows expects 0xdd there. Each _x2 variant
// takes a register operand twice as wide as its non-_x2 counterpart
// (v2 -> v[2:3], and v[2:3] -> v[2:5] for cmpswap).
// Within each group only the third expected byte varies.
50 flat_atomic_swap v[1:2], v2
51 // GFX10: encoding: [0x00,0x00,0xc0,0xdc,0x01,0x02,0x7d,0x00]
53 flat_atomic_cmpswap v[1:2], v[2:3]
54 // GFX10: encoding: [0x00,0x00,0xc4,0xdc,0x01,0x02,0x7d,0x00]
56 flat_atomic_add v[1:2], v2
57 // GFX10: encoding: [0x00,0x00,0xc8,0xdc,0x01,0x02,0x7d,0x00]
59 flat_atomic_sub v[1:2], v2
60 // GFX10: encoding: [0x00,0x00,0xcc,0xdc,0x01,0x02,0x7d,0x00]
62 flat_atomic_smin v[1:2], v2
63 // GFX10: encoding: [0x00,0x00,0xd4,0xdc,0x01,0x02,0x7d,0x00]
65 flat_atomic_umin v[1:2], v2
66 // GFX10: encoding: [0x00,0x00,0xd8,0xdc,0x01,0x02,0x7d,0x00]
68 flat_atomic_smax v[1:2], v2
69 // GFX10: encoding: [0x00,0x00,0xdc,0xdc,0x01,0x02,0x7d,0x00]
71 flat_atomic_umax v[1:2], v2
72 // GFX10: encoding: [0x00,0x00,0xe0,0xdc,0x01,0x02,0x7d,0x00]
74 flat_atomic_and v[1:2], v2
75 // GFX10: encoding: [0x00,0x00,0xe4,0xdc,0x01,0x02,0x7d,0x00]
77 flat_atomic_or v[1:2], v2
78 // GFX10: encoding: [0x00,0x00,0xe8,0xdc,0x01,0x02,0x7d,0x00]
80 flat_atomic_xor v[1:2], v2
81 // GFX10: encoding: [0x00,0x00,0xec,0xdc,0x01,0x02,0x7d,0x00]
83 flat_atomic_inc v[1:2], v2
84 // GFX10: encoding: [0x00,0x00,0xf0,0xdc,0x01,0x02,0x7d,0x00]
86 flat_atomic_dec v[1:2], v2
87 // GFX10: encoding: [0x00,0x00,0xf4,0xdc,0x01,0x02,0x7d,0x00]
89 flat_atomic_swap_x2 v[1:2], v[2:3]
90 // GFX10: encoding: [0x00,0x00,0x40,0xdd,0x01,0x02,0x7d,0x00]
92 flat_atomic_cmpswap_x2 v[1:2], v[2:5]
93 // GFX10: encoding: [0x00,0x00,0x44,0xdd,0x01,0x02,0x7d,0x00]
95 flat_atomic_add_x2 v[1:2], v[2:3]
96 // GFX10: encoding: [0x00,0x00,0x48,0xdd,0x01,0x02,0x7d,0x00]
98 flat_atomic_sub_x2 v[1:2], v[2:3]
99 // GFX10: encoding: [0x00,0x00,0x4c,0xdd,0x01,0x02,0x7d,0x00]
101 flat_atomic_smin_x2 v[1:2], v[2:3]
102 // GFX10: encoding: [0x00,0x00,0x54,0xdd,0x01,0x02,0x7d,0x00]
104 flat_atomic_umin_x2 v[1:2], v[2:3]
105 // GFX10: encoding: [0x00,0x00,0x58,0xdd,0x01,0x02,0x7d,0x00]
107 flat_atomic_smax_x2 v[1:2], v[2:3]
108 // GFX10: encoding: [0x00,0x00,0x5c,0xdd,0x01,0x02,0x7d,0x00]
110 flat_atomic_umax_x2 v[1:2], v[2:3]
111 // GFX10: encoding: [0x00,0x00,0x60,0xdd,0x01,0x02,0x7d,0x00]
113 flat_atomic_and_x2 v[1:2], v[2:3]
114 // GFX10: encoding: [0x00,0x00,0x64,0xdd,0x01,0x02,0x7d,0x00]
116 flat_atomic_or_x2 v[1:2], v[2:3]
117 // GFX10: encoding: [0x00,0x00,0x68,0xdd,0x01,0x02,0x7d,0x00]
119 flat_atomic_xor_x2 v[1:2], v[2:3]
120 // GFX10: encoding: [0x00,0x00,0x6c,0xdd,0x01,0x02,0x7d,0x00]
122 flat_atomic_inc_x2 v[1:2], v[2:3]
123 // GFX10: encoding: [0x00,0x00,0x70,0xdd,0x01,0x02,0x7d,0x00]
125 flat_atomic_dec_x2 v[1:2], v[2:3]
126 // GFX10: encoding: [0x00,0x00,0x74,0xdd,0x01,0x02,0x7d,0x00]
128 //===----------------------------------------------------------------------===//
129 // ENC_FLAT: dlc support for atomics.
130 //===----------------------------------------------------------------------===//
// Each case is a flat atomic with a trailing dlc modifier, listed
// alphabetically. Where the same instruction also appears without dlc earlier
// in this file, the expected bytes differ only in the second byte (0x10 here
// versus 0x00 there). The fcmpswap, fmax and fmin cases (and their _x2 forms)
// have no modifier-free flat counterpart in the part of the file shown here.
// The checks in this section match only the bracketed byte list; they do not
// include the "encoding" label used by the checks in the section above.
132 flat_atomic_add v[1:2], v2 dlc
133 // GFX10: [0x00,0x10,0xc8,0xdc,0x01,0x02,0x7d,0x00]
135 flat_atomic_add_x2 v[1:2], v[2:3] dlc
136 // GFX10: [0x00,0x10,0x48,0xdd,0x01,0x02,0x7d,0x00]
138 flat_atomic_and v[1:2], v2 dlc
139 // GFX10: [0x00,0x10,0xe4,0xdc,0x01,0x02,0x7d,0x00]
141 flat_atomic_and_x2 v[1:2], v[2:3] dlc
142 // GFX10: [0x00,0x10,0x64,0xdd,0x01,0x02,0x7d,0x00]
144 flat_atomic_cmpswap v[1:2], v[2:3] dlc
145 // GFX10: [0x00,0x10,0xc4,0xdc,0x01,0x02,0x7d,0x00]
147 flat_atomic_cmpswap_x2 v[1:2], v[2:5] dlc
148 // GFX10: [0x00,0x10,0x44,0xdd,0x01,0x02,0x7d,0x00]
150 flat_atomic_dec v[1:2], v2 dlc
151 // GFX10: [0x00,0x10,0xf4,0xdc,0x01,0x02,0x7d,0x00]
153 flat_atomic_dec_x2 v[1:2], v[2:3] dlc
154 // GFX10: [0x00,0x10,0x74,0xdd,0x01,0x02,0x7d,0x00]
156 flat_atomic_fcmpswap v[1:2], v[2:3] dlc
157 // GFX10: [0x00,0x10,0xf8,0xdc,0x01,0x02,0x7d,0x00]
159 flat_atomic_fcmpswap_x2 v[1:2], v[2:5] dlc
160 // GFX10: [0x00,0x10,0x78,0xdd,0x01,0x02,0x7d,0x00]
162 flat_atomic_fmax v[1:2], v2 dlc
163 // GFX10: [0x00,0x10,0x00,0xdd,0x01,0x02,0x7d,0x00]
165 flat_atomic_fmax_x2 v[1:2], v[2:3] dlc
166 // GFX10: [0x00,0x10,0x80,0xdd,0x01,0x02,0x7d,0x00]
168 flat_atomic_fmin v[1:2], v2 dlc
169 // GFX10: [0x00,0x10,0xfc,0xdc,0x01,0x02,0x7d,0x00]
171 flat_atomic_fmin_x2 v[1:2], v[2:3] dlc
172 // GFX10: [0x00,0x10,0x7c,0xdd,0x01,0x02,0x7d,0x00]
174 flat_atomic_inc v[1:2], v2 dlc
175 // GFX10: [0x00,0x10,0xf0,0xdc,0x01,0x02,0x7d,0x00]
177 flat_atomic_inc_x2 v[1:2], v[2:3] dlc
178 // GFX10: [0x00,0x10,0x70,0xdd,0x01,0x02,0x7d,0x00]
180 flat_atomic_or v[1:2], v2 dlc
181 // GFX10: [0x00,0x10,0xe8,0xdc,0x01,0x02,0x7d,0x00]
183 flat_atomic_or_x2 v[1:2], v[2:3] dlc
184 // GFX10: [0x00,0x10,0x68,0xdd,0x01,0x02,0x7d,0x00]
186 flat_atomic_smax v[1:2], v2 dlc
187 // GFX10: [0x00,0x10,0xdc,0xdc,0x01,0x02,0x7d,0x00]
189 flat_atomic_smax_x2 v[1:2], v[2:3] dlc
190 // GFX10: [0x00,0x10,0x5c,0xdd,0x01,0x02,0x7d,0x00]
192 flat_atomic_smin v[1:2], v2 dlc
193 // GFX10: [0x00,0x10,0xd4,0xdc,0x01,0x02,0x7d,0x00]
195 flat_atomic_smin_x2 v[1:2], v[2:3] dlc
196 // GFX10: [0x00,0x10,0x54,0xdd,0x01,0x02,0x7d,0x00]
198 flat_atomic_sub v[1:2], v2 dlc
199 // GFX10: [0x00,0x10,0xcc,0xdc,0x01,0x02,0x7d,0x00]
201 flat_atomic_sub_x2 v[1:2], v[2:3] dlc
202 // GFX10: [0x00,0x10,0x4c,0xdd,0x01,0x02,0x7d,0x00]
204 flat_atomic_swap v[1:2], v2 dlc
205 // GFX10: [0x00,0x10,0xc0,0xdc,0x01,0x02,0x7d,0x00]
207 flat_atomic_swap_x2 v[1:2], v[2:3] dlc
208 // GFX10: [0x00,0x10,0x40,0xdd,0x01,0x02,0x7d,0x00]
210 flat_atomic_umax v[1:2], v2 dlc
211 // GFX10: [0x00,0x10,0xe0,0xdc,0x01,0x02,0x7d,0x00]
213 flat_atomic_umax_x2 v[1:2], v[2:3] dlc
214 // GFX10: [0x00,0x10,0x60,0xdd,0x01,0x02,0x7d,0x00]
216 flat_atomic_umin v[1:2], v2 dlc
217 // GFX10: [0x00,0x10,0xd8,0xdc,0x01,0x02,0x7d,0x00]
219 flat_atomic_umin_x2 v[1:2], v[2:3] dlc
220 // GFX10: [0x00,0x10,0x58,0xdd,0x01,0x02,0x7d,0x00]
222 flat_atomic_xor v[1:2], v2 dlc
223 // GFX10: [0x00,0x10,0xec,0xdc,0x01,0x02,0x7d,0x00]
225 flat_atomic_xor_x2 v[1:2], v[2:3] dlc
226 // GFX10: [0x00,0x10,0x6c,0xdd,0x01,0x02,0x7d,0x00]
228 //===----------------------------------------------------------------------===//
229 // ENC_FLAT_GLOBAL: fcmpswap.
230 //===----------------------------------------------------------------------===//
// The same six variations are applied to global_atomic_fcmpswap and then to
// its _x2 form (third/fourth expected bytes 0xf8,0xdc versus 0x78,0xdd):
//   - offsets -1, 2047 and -2048, whose expected first two bytes are
//     0xff,0x8f / 0xff,0x87 / 0x00,0x88 respectively;
//   - with offset:-1 held fixed, glc adds a leading register operand
//     (v5 or v[5:6]) and the expected third byte goes up by one while the last
//     byte becomes 0x05;
//   - slc raises the expected third byte by two;
//   - dlc changes the expected second byte from 0x8f to 0x9f.
232 global_atomic_fcmpswap v[1:2], v[2:3], off offset:-1
233 // GFX10: [0xff,0x8f,0xf8,0xdc,0x01,0x02,0x7d,0x00]
235 global_atomic_fcmpswap v5, v[1:2], v[2:3], off offset:-1 glc
236 // GFX10: [0xff,0x8f,0xf9,0xdc,0x01,0x02,0x7d,0x05]
238 global_atomic_fcmpswap v[1:2], v[2:3], off offset:2047
239 // GFX10: [0xff,0x87,0xf8,0xdc,0x01,0x02,0x7d,0x00]
241 global_atomic_fcmpswap v[1:2], v[2:3], off offset:-2048
242 // GFX10: [0x00,0x88,0xf8,0xdc,0x01,0x02,0x7d,0x00]
244 global_atomic_fcmpswap v[1:2], v[2:3], off offset:-1 slc
245 // GFX10: [0xff,0x8f,0xfa,0xdc,0x01,0x02,0x7d,0x00]
247 global_atomic_fcmpswap v[1:2], v[2:3], off offset:-1 dlc
248 // GFX10: [0xff,0x9f,0xf8,0xdc,0x01,0x02,0x7d,0x00]
250 global_atomic_fcmpswap_x2 v[1:2], v[2:5], off offset:-1
251 // GFX10: [0xff,0x8f,0x78,0xdd,0x01,0x02,0x7d,0x00]
253 global_atomic_fcmpswap_x2 v[5:6], v[1:2], v[2:5], off offset:-1 glc
254 // GFX10: [0xff,0x8f,0x79,0xdd,0x01,0x02,0x7d,0x05]
256 global_atomic_fcmpswap_x2 v[1:2], v[2:5], off offset:2047
257 // GFX10: [0xff,0x87,0x78,0xdd,0x01,0x02,0x7d,0x00]
259 global_atomic_fcmpswap_x2 v[1:2], v[2:5], off offset:-2048
260 // GFX10: [0x00,0x88,0x78,0xdd,0x01,0x02,0x7d,0x00]
262 global_atomic_fcmpswap_x2 v[1:2], v[2:5], off offset:-1 slc
263 // GFX10: [0xff,0x8f,0x7a,0xdd,0x01,0x02,0x7d,0x00]
265 global_atomic_fcmpswap_x2 v[1:2], v[2:5], off offset:-1 dlc
266 // GFX10: [0xff,0x9f,0x78,0xdd,0x01,0x02,0x7d,0x00]
268 //===----------------------------------------------------------------------===//
269 // ENC_FLAT_GLOBAL: dlc support for atomics.
270 //===----------------------------------------------------------------------===//
// global_atomic_* cases using "off" and a trailing dlc modifier, with no
// explicit offset. Every check expects 0x90 in the second byte; the remaining
// seven bytes equal those expected for the flat_atomic_* dlc case of the same
// operation earlier in this file (where the second byte is 0x10).
// fcmpswap is not repeated here; its dlc form is covered in the section above.
272 global_atomic_add v[1:2], v2, off dlc
273 // GFX10: [0x00,0x90,0xc8,0xdc,0x01,0x02,0x7d,0x00]
275 global_atomic_add_x2 v[1:2], v[2:3], off dlc
276 // GFX10: [0x00,0x90,0x48,0xdd,0x01,0x02,0x7d,0x00]
278 global_atomic_and v[1:2], v2, off dlc
279 // GFX10: [0x00,0x90,0xe4,0xdc,0x01,0x02,0x7d,0x00]
281 global_atomic_and_x2 v[1:2], v[2:3], off dlc
282 // GFX10: [0x00,0x90,0x64,0xdd,0x01,0x02,0x7d,0x00]
284 global_atomic_cmpswap v[1:2], v[2:3], off dlc
285 // GFX10: [0x00,0x90,0xc4,0xdc,0x01,0x02,0x7d,0x00]
287 global_atomic_cmpswap_x2 v[1:2], v[2:5], off dlc
288 // GFX10: [0x00,0x90,0x44,0xdd,0x01,0x02,0x7d,0x00]
290 global_atomic_dec v[1:2], v2, off dlc
291 // GFX10: [0x00,0x90,0xf4,0xdc,0x01,0x02,0x7d,0x00]
293 global_atomic_dec_x2 v[1:2], v[2:3], off dlc
294 // GFX10: [0x00,0x90,0x74,0xdd,0x01,0x02,0x7d,0x00]
296 global_atomic_fmax v[1:2], v2, off dlc
297 // GFX10: [0x00,0x90,0x00,0xdd,0x01,0x02,0x7d,0x00]
299 global_atomic_fmax_x2 v[1:2], v[2:3], off dlc
300 // GFX10: [0x00,0x90,0x80,0xdd,0x01,0x02,0x7d,0x00]
302 global_atomic_fmin v[1:2], v2, off dlc
303 // GFX10: [0x00,0x90,0xfc,0xdc,0x01,0x02,0x7d,0x00]
305 global_atomic_fmin_x2 v[1:2], v[2:3], off dlc
306 // GFX10: [0x00,0x90,0x7c,0xdd,0x01,0x02,0x7d,0x00]
308 global_atomic_inc v[1:2], v2, off dlc
309 // GFX10: [0x00,0x90,0xf0,0xdc,0x01,0x02,0x7d,0x00]
311 global_atomic_inc_x2 v[1:2], v[2:3], off dlc
312 // GFX10: [0x00,0x90,0x70,0xdd,0x01,0x02,0x7d,0x00]
314 global_atomic_or v[1:2], v2, off dlc
315 // GFX10: [0x00,0x90,0xe8,0xdc,0x01,0x02,0x7d,0x00]
317 global_atomic_or_x2 v[1:2], v[2:3], off dlc
318 // GFX10: [0x00,0x90,0x68,0xdd,0x01,0x02,0x7d,0x00]
320 global_atomic_smax v[1:2], v2, off dlc
321 // GFX10: [0x00,0x90,0xdc,0xdc,0x01,0x02,0x7d,0x00]
323 global_atomic_smax_x2 v[1:2], v[2:3], off dlc
324 // GFX10: [0x00,0x90,0x5c,0xdd,0x01,0x02,0x7d,0x00]
326 global_atomic_smin v[1:2], v2, off dlc
327 // GFX10: [0x00,0x90,0xd4,0xdc,0x01,0x02,0x7d,0x00]
329 global_atomic_smin_x2 v[1:2], v[2:3], off dlc
330 // GFX10: [0x00,0x90,0x54,0xdd,0x01,0x02,0x7d,0x00]
332 global_atomic_sub v[1:2], v2, off dlc
333 // GFX10: [0x00,0x90,0xcc,0xdc,0x01,0x02,0x7d,0x00]
335 global_atomic_sub_x2 v[1:2], v[2:3], off dlc
336 // GFX10: [0x00,0x90,0x4c,0xdd,0x01,0x02,0x7d,0x00]
338 global_atomic_swap v[1:2], v2, off dlc
339 // GFX10: [0x00,0x90,0xc0,0xdc,0x01,0x02,0x7d,0x00]
341 global_atomic_swap_x2 v[1:2], v[2:3], off dlc
342 // GFX10: [0x00,0x90,0x40,0xdd,0x01,0x02,0x7d,0x00]
344 global_atomic_umax v[1:2], v2, off dlc
345 // GFX10: [0x00,0x90,0xe0,0xdc,0x01,0x02,0x7d,0x00]
347 global_atomic_umax_x2 v[1:2], v[2:3], off dlc
348 // GFX10: [0x00,0x90,0x60,0xdd,0x01,0x02,0x7d,0x00]
350 global_atomic_umin v[1:2], v2, off dlc
351 // GFX10: [0x00,0x90,0xd8,0xdc,0x01,0x02,0x7d,0x00]
353 global_atomic_umin_x2 v[1:2], v[2:3], off dlc
354 // GFX10: [0x00,0x90,0x58,0xdd,0x01,0x02,0x7d,0x00]
356 global_atomic_xor v[1:2], v2, off dlc
357 // GFX10: [0x00,0x90,0xec,0xdc,0x01,0x02,0x7d,0x00]
359 global_atomic_xor_x2 v[1:2], v[2:3], off dlc
360 // GFX10: [0x00,0x90,0x6c,0xdd,0x01,0x02,0x7d,0x00]
// global_load_* cases with offset:1024 and the lds modifier. No section banner
// precedes this group in the file, although it is unrelated to the dlc atomics
// above. Every check expects 0x00,0xa4 in the first two bytes.
// Two operand forms are exercised:
//   - "v2, s[4:5]": expected seventh byte 0x04;
//   - "v[2:3], off": expected seventh byte 0x7d.
// NOTE(review): the first two cases (global_load_dword v2, s[4:5]) are
// identical, instruction and expected bytes alike. This looks like an
// accidental duplicate; confirm whether a different variant was intended.
362 global_load_dword v2, s[4:5] offset:1024 lds
363 // GFX10: [0x00,0xa4,0x30,0xdc,0x02,0x00,0x04,0x00]
365 global_load_dword v2, s[4:5] offset:1024 lds
366 // GFX10: [0x00,0xa4,0x30,0xdc,0x02,0x00,0x04,0x00]
368 global_load_ubyte v2, s[4:5] offset:1024 lds
369 // GFX10: [0x00,0xa4,0x20,0xdc,0x02,0x00,0x04,0x00]
371 global_load_sbyte v2, s[4:5] offset:1024 lds
372 // GFX10: [0x00,0xa4,0x24,0xdc,0x02,0x00,0x04,0x00]
374 global_load_ushort v2, s[4:5] offset:1024 lds
375 // GFX10: [0x00,0xa4,0x28,0xdc,0x02,0x00,0x04,0x00]
377 global_load_sshort v2, s[4:5] offset:1024 lds
378 // GFX10: [0x00,0xa4,0x2c,0xdc,0x02,0x00,0x04,0x00]
380 global_load_dword v[2:3], off offset:1024 lds
381 // GFX10: [0x00,0xa4,0x30,0xdc,0x02,0x00,0x7d,0x00]
383 global_load_ubyte v[2:3], off offset:1024 lds
384 // GFX10: [0x00,0xa4,0x20,0xdc,0x02,0x00,0x7d,0x00]
386 global_load_sbyte v[2:3], off offset:1024 lds
387 // GFX10: [0x00,0xa4,0x24,0xdc,0x02,0x00,0x7d,0x00]
389 global_load_ushort v[2:3], off offset:1024 lds
390 // GFX10: [0x00,0xa4,0x28,0xdc,0x02,0x00,0x7d,0x00]
392 global_load_sshort v[2:3], off offset:1024 lds
393 // GFX10: [0x00,0xa4,0x2c,0xdc,0x02,0x00,0x7d,0x00]
// scratch_load_* cases with offset:1024 and the lds modifier. Every check
// expects 0x00,0x64 in the first two bytes, and the third byte matches the one
// expected for the flat/global load of the same width earlier in this file.
// Two operand forms are exercised:
//   - "v2, off": expected fifth byte 0x02, seventh byte 0x7d;
//   - "off, s4": expected fifth byte 0x00, seventh byte 0x04.
395 scratch_load_dword v2, off offset:1024 lds
396 // GFX10: [0x00,0x64,0x30,0xdc,0x02,0x00,0x7d,0x00]
398 scratch_load_ubyte v2, off offset:1024 lds
399 // GFX10: [0x00,0x64,0x20,0xdc,0x02,0x00,0x7d,0x00]
401 scratch_load_sbyte v2, off offset:1024 lds
402 // GFX10: [0x00,0x64,0x24,0xdc,0x02,0x00,0x7d,0x00]
404 scratch_load_ushort v2, off offset:1024 lds
405 // GFX10: [0x00,0x64,0x28,0xdc,0x02,0x00,0x7d,0x00]
407 scratch_load_sshort v2, off offset:1024 lds
408 // GFX10: [0x00,0x64,0x2c,0xdc,0x02,0x00,0x7d,0x00]
410 scratch_load_dword off, s4 offset:1024 lds
411 // GFX10: [0x00,0x64,0x30,0xdc,0x00,0x00,0x04,0x00]
413 scratch_load_ubyte off, s4 offset:1024 lds
414 // GFX10: [0x00,0x64,0x20,0xdc,0x00,0x00,0x04,0x00]
416 scratch_load_sbyte off, s4 offset:1024 lds
417 // GFX10: [0x00,0x64,0x24,0xdc,0x00,0x00,0x04,0x00]
419 scratch_load_ushort off, s4 offset:1024 lds
420 // GFX10: [0x00,0x64,0x28,0xdc,0x00,0x00,0x04,0x00]
422 scratch_load_sshort off, s4 offset:1024 lds
423 // GFX10: [0x00,0x64,0x2c,0xdc,0x00,0x00,0x04,0x00]
425 //===----------------------------------------------------------------------===//
426 // Also see flat-gfx10.s, flat-global.s, flat-scratch-instructions.s.
427 //===----------------------------------------------------------------------===//