1 // WebAssemblyInstrAtomics.td-WebAssembly Atomic codegen support-*- tablegen -*-
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
10 /// WebAssembly Atomic operand code-gen constructs.
12 //===----------------------------------------------------------------------===//
14 let UseNamedOperandTable = 1 in
15 multiclass ATOMIC_I<dag oops_r, dag iops_r, dag oops_s, dag iops_s,
16 list<dag> pattern_r, string asmstr_r = "",
17 string asmstr_s = "", bits<32> atomic_op = -1> {
18 defm "" : I<oops_r, iops_r, oops_s, iops_s, pattern_r, asmstr_r, asmstr_s,
19 !or(0xfe00, !and(0xff, atomic_op))>,
20 Requires<[HasAtomics]>;
23 multiclass ATOMIC_NRI<dag oops, dag iops, list<dag> pattern, string asmstr = "",
24 bits<32> atomic_op = -1> {
25 defm "" : NRI<oops, iops, pattern, asmstr,
26 !or(0xfe00, !and(0xff, atomic_op))>,
27 Requires<[HasAtomics]>;
30 //===----------------------------------------------------------------------===//
31 // Atomic wait / notify
32 //===----------------------------------------------------------------------===//
34 let hasSideEffects = 1 in {
36 ATOMIC_I<(outs I32:$dst),
37 (ins P2Align:$p2align, offset32_op:$off, I32:$addr, I32:$count),
38 (outs), (ins P2Align:$p2align, offset32_op:$off), [],
39 "atomic.notify \t$dst, ${off}(${addr})${p2align}, $count",
40 "atomic.notify \t${off}${p2align}", 0x00>;
42 defm ATOMIC_WAIT_I32 :
43 ATOMIC_I<(outs I32:$dst),
44 (ins P2Align:$p2align, offset32_op:$off, I32:$addr, I32:$exp,
46 (outs), (ins P2Align:$p2align, offset32_op:$off), [],
47 "i32.atomic.wait \t$dst, ${off}(${addr})${p2align}, $exp, $timeout",
48 "i32.atomic.wait \t${off}${p2align}", 0x01>;
49 defm ATOMIC_WAIT_I64 :
50 ATOMIC_I<(outs I32:$dst),
51 (ins P2Align:$p2align, offset32_op:$off, I32:$addr, I64:$exp,
53 (outs), (ins P2Align:$p2align, offset32_op:$off), [],
54 "i64.atomic.wait \t$dst, ${off}(${addr})${p2align}, $exp, $timeout",
55 "i64.atomic.wait \t${off}${p2align}", 0x02>;
57 } // hasSideEffects = 1
59 let Predicates = [HasAtomics] in {
60 // Select notifys with no constant offset.
61 def NotifyPatNoOffset :
62 Pat<(i32 (int_wasm_atomic_notify I32:$addr, I32:$count)),
63 (ATOMIC_NOTIFY 0, 0, I32:$addr, I32:$count)>;
65 // Select notifys with a constant offset.
67 // Pattern with address + immediate offset
68 class NotifyPatImmOff<PatFrag operand> :
69 Pat<(i32 (int_wasm_atomic_notify (operand I32:$addr, imm:$off), I32:$count)),
70 (ATOMIC_NOTIFY 0, imm:$off, I32:$addr, I32:$count)>;
71 def : NotifyPatImmOff<regPlusImm>;
72 def : NotifyPatImmOff<or_is_add>;
74 def NotifyPatGlobalAddr :
75 Pat<(i32 (int_wasm_atomic_notify (regPlusGA I32:$addr,
76 (WebAssemblywrapper tglobaladdr:$off)),
78 (ATOMIC_NOTIFY 0, tglobaladdr:$off, I32:$addr, I32:$count)>;
80 // Select notifys with just a constant offset.
81 def NotifyPatOffsetOnly :
82 Pat<(i32 (int_wasm_atomic_notify imm:$off, I32:$count)),
83 (ATOMIC_NOTIFY 0, imm:$off, (CONST_I32 0), I32:$count)>;
85 def NotifyPatGlobalAddrOffOnly :
86 Pat<(i32 (int_wasm_atomic_notify (WebAssemblywrapper tglobaladdr:$off),
88 (ATOMIC_NOTIFY 0, tglobaladdr:$off, (CONST_I32 0), I32:$count)>;
90 // Select waits with no constant offset.
91 class WaitPatNoOffset<ValueType ty, Intrinsic kind, NI inst> :
92 Pat<(i32 (kind I32:$addr, ty:$exp, I64:$timeout)),
93 (inst 0, 0, I32:$addr, ty:$exp, I64:$timeout)>;
94 def : WaitPatNoOffset<i32, int_wasm_atomic_wait_i32, ATOMIC_WAIT_I32>;
95 def : WaitPatNoOffset<i64, int_wasm_atomic_wait_i64, ATOMIC_WAIT_I64>;
97 // Select waits with a constant offset.
99 // Pattern with address + immediate offset
100 class WaitPatImmOff<ValueType ty, Intrinsic kind, PatFrag operand, NI inst> :
101 Pat<(i32 (kind (operand I32:$addr, imm:$off), ty:$exp, I64:$timeout)),
102 (inst 0, imm:$off, I32:$addr, ty:$exp, I64:$timeout)>;
103 def : WaitPatImmOff<i32, int_wasm_atomic_wait_i32, regPlusImm, ATOMIC_WAIT_I32>;
104 def : WaitPatImmOff<i32, int_wasm_atomic_wait_i32, or_is_add, ATOMIC_WAIT_I32>;
105 def : WaitPatImmOff<i64, int_wasm_atomic_wait_i64, regPlusImm, ATOMIC_WAIT_I64>;
106 def : WaitPatImmOff<i64, int_wasm_atomic_wait_i64, or_is_add, ATOMIC_WAIT_I64>;
108 class WaitPatGlobalAddr<ValueType ty, Intrinsic kind, NI inst> :
109 Pat<(i32 (kind (regPlusGA I32:$addr, (WebAssemblywrapper tglobaladdr:$off)),
110 ty:$exp, I64:$timeout)),
111 (inst 0, tglobaladdr:$off, I32:$addr, ty:$exp, I64:$timeout)>;
112 def : WaitPatGlobalAddr<i32, int_wasm_atomic_wait_i32, ATOMIC_WAIT_I32>;
113 def : WaitPatGlobalAddr<i64, int_wasm_atomic_wait_i64, ATOMIC_WAIT_I64>;
115 // Select wait_i32, ATOMIC_WAIT_I32s with just a constant offset.
116 class WaitPatOffsetOnly<ValueType ty, Intrinsic kind, NI inst> :
117 Pat<(i32 (kind imm:$off, ty:$exp, I64:$timeout)),
118 (inst 0, imm:$off, (CONST_I32 0), ty:$exp, I64:$timeout)>;
119 def : WaitPatOffsetOnly<i32, int_wasm_atomic_wait_i32, ATOMIC_WAIT_I32>;
120 def : WaitPatOffsetOnly<i64, int_wasm_atomic_wait_i64, ATOMIC_WAIT_I64>;
122 class WaitPatGlobalAddrOffOnly<ValueType ty, Intrinsic kind, NI inst> :
123 Pat<(i32 (kind (WebAssemblywrapper tglobaladdr:$off), ty:$exp, I64:$timeout)),
124 (inst 0, tglobaladdr:$off, (CONST_I32 0), ty:$exp, I64:$timeout)>;
125 def : WaitPatGlobalAddrOffOnly<i32, int_wasm_atomic_wait_i32, ATOMIC_WAIT_I32>;
126 def : WaitPatGlobalAddrOffOnly<i64, int_wasm_atomic_wait_i64, ATOMIC_WAIT_I64>;
127 } // Predicates = [HasAtomics]
129 //===----------------------------------------------------------------------===//
131 //===----------------------------------------------------------------------===//
133 multiclass AtomicLoad<WebAssemblyRegClass rc, string name, int atomic_op> {
134 defm "" : WebAssemblyLoad<rc, name, !or(0xfe00, !and(0xff, atomic_op))>,
135 Requires<[HasAtomics]>;
138 defm ATOMIC_LOAD_I32 : AtomicLoad<I32, "i32.atomic.load", 0x10>;
139 defm ATOMIC_LOAD_I64 : AtomicLoad<I64, "i64.atomic.load", 0x11>;
141 // Select loads with no constant offset.
142 let Predicates = [HasAtomics] in {
143 def : LoadPatNoOffset<i32, atomic_load_32, ATOMIC_LOAD_I32>;
144 def : LoadPatNoOffset<i64, atomic_load_64, ATOMIC_LOAD_I64>;
146 // Select loads with a constant offset.
148 // Pattern with address + immediate offset
149 def : LoadPatImmOff<i32, atomic_load_32, regPlusImm, ATOMIC_LOAD_I32>;
150 def : LoadPatImmOff<i64, atomic_load_64, regPlusImm, ATOMIC_LOAD_I64>;
151 def : LoadPatImmOff<i32, atomic_load_32, or_is_add, ATOMIC_LOAD_I32>;
152 def : LoadPatImmOff<i64, atomic_load_64, or_is_add, ATOMIC_LOAD_I64>;
154 def : LoadPatGlobalAddr<i32, atomic_load_32, ATOMIC_LOAD_I32>;
155 def : LoadPatGlobalAddr<i64, atomic_load_64, ATOMIC_LOAD_I64>;
157 // Select loads with just a constant offset.
158 def : LoadPatOffsetOnly<i32, atomic_load_32, ATOMIC_LOAD_I32>;
159 def : LoadPatOffsetOnly<i64, atomic_load_64, ATOMIC_LOAD_I64>;
161 def : LoadPatGlobalAddrOffOnly<i32, atomic_load_32, ATOMIC_LOAD_I32>;
162 def : LoadPatGlobalAddrOffOnly<i64, atomic_load_64, ATOMIC_LOAD_I64>;
164 } // Predicates = [HasAtomics]
166 // Extending loads. Note that there are only zero-extending atomic loads, no
167 // sign-extending loads.
168 defm ATOMIC_LOAD8_U_I32 : AtomicLoad<I32, "i32.atomic.load8_u", 0x12>;
169 defm ATOMIC_LOAD16_U_I32 : AtomicLoad<I32, "i32.atomic.load16_u", 0x13>;
170 defm ATOMIC_LOAD8_U_I64 : AtomicLoad<I64, "i64.atomic.load8_u", 0x14>;
171 defm ATOMIC_LOAD16_U_I64 : AtomicLoad<I64, "i64.atomic.load16_u", 0x15>;
172 defm ATOMIC_LOAD32_U_I64 : AtomicLoad<I64, "i64.atomic.load32_u", 0x16>;
174 // Fragments for extending loads. These are different from regular loads because
175 // the SDNodes are derived from AtomicSDNode rather than LoadSDNode and
176 // therefore don't have the extension type field. So instead of matching that,
177 // we match the patterns that the type legalizer expands them to.
179 // We directly match zext patterns and select the zext atomic loads.
180 // i32 (zext (i8 (atomic_load_8))) gets legalized to
181 // i32 (and (i32 (atomic_load_8)), 255)
182 // These can be selected to a single zero-extending atomic load instruction.
183 def zext_aload_8_32 :
184 PatFrag<(ops node:$addr), (and (i32 (atomic_load_8 node:$addr)), 255)>;
185 def zext_aload_16_32 :
186 PatFrag<(ops node:$addr), (and (i32 (atomic_load_16 node:$addr)), 65535)>;
187 // Unlike regular loads, extension to i64 is handled differently than i32.
188 // i64 (zext (i8 (atomic_load_8))) gets legalized to
189 // i64 (and (i64 (anyext (i32 (atomic_load_8)))), 255)
190 def zext_aload_8_64 :
191 PatFrag<(ops node:$addr),
192 (and (i64 (anyext (i32 (atomic_load_8 node:$addr)))), 255)>;
193 def zext_aload_16_64 :
194 PatFrag<(ops node:$addr),
195 (and (i64 (anyext (i32 (atomic_load_16 node:$addr)))), 65535)>;
196 def zext_aload_32_64 :
197 PatFrag<(ops node:$addr),
198 (zext (i32 (atomic_load node:$addr)))>;
200 // We don't have single sext atomic load instructions. So for sext loads, we
201 // match bare subword loads (for 32-bit results) and anyext loads (for 64-bit
202 // results) and select a zext load; the next instruction will be sext_inreg
203 // which is selected by itself.
204 def sext_aload_8_64 :
205 PatFrag<(ops node:$addr), (anyext (i32 (atomic_load_8 node:$addr)))>;
206 def sext_aload_16_64 :
207 PatFrag<(ops node:$addr), (anyext (i32 (atomic_load_16 node:$addr)))>;
209 let Predicates = [HasAtomics] in {
210 // Select zero-extending loads with no constant offset.
211 def : LoadPatNoOffset<i32, zext_aload_8_32, ATOMIC_LOAD8_U_I32>;
212 def : LoadPatNoOffset<i32, zext_aload_16_32, ATOMIC_LOAD16_U_I32>;
213 def : LoadPatNoOffset<i64, zext_aload_8_64, ATOMIC_LOAD8_U_I64>;
214 def : LoadPatNoOffset<i64, zext_aload_16_64, ATOMIC_LOAD16_U_I64>;
215 def : LoadPatNoOffset<i64, zext_aload_32_64, ATOMIC_LOAD32_U_I64>;
217 // Select sign-extending loads with no constant offset
218 def : LoadPatNoOffset<i32, atomic_load_8, ATOMIC_LOAD8_U_I32>;
219 def : LoadPatNoOffset<i32, atomic_load_16, ATOMIC_LOAD16_U_I32>;
220 def : LoadPatNoOffset<i64, sext_aload_8_64, ATOMIC_LOAD8_U_I64>;
221 def : LoadPatNoOffset<i64, sext_aload_16_64, ATOMIC_LOAD16_U_I64>;
222 // 32->64 sext load gets selected as i32.atomic.load, i64.extend_i32_s
224 // Zero-extending loads with constant offset
225 def : LoadPatImmOff<i32, zext_aload_8_32, regPlusImm, ATOMIC_LOAD8_U_I32>;
226 def : LoadPatImmOff<i32, zext_aload_16_32, regPlusImm, ATOMIC_LOAD16_U_I32>;
227 def : LoadPatImmOff<i32, zext_aload_8_32, or_is_add, ATOMIC_LOAD8_U_I32>;
228 def : LoadPatImmOff<i32, zext_aload_16_32, or_is_add, ATOMIC_LOAD16_U_I32>;
229 def : LoadPatImmOff<i64, zext_aload_8_64, regPlusImm, ATOMIC_LOAD8_U_I64>;
230 def : LoadPatImmOff<i64, zext_aload_16_64, regPlusImm, ATOMIC_LOAD16_U_I64>;
231 def : LoadPatImmOff<i64, zext_aload_32_64, regPlusImm, ATOMIC_LOAD32_U_I64>;
232 def : LoadPatImmOff<i64, zext_aload_8_64, or_is_add, ATOMIC_LOAD8_U_I64>;
233 def : LoadPatImmOff<i64, zext_aload_16_64, or_is_add, ATOMIC_LOAD16_U_I64>;
234 def : LoadPatImmOff<i64, zext_aload_32_64, or_is_add, ATOMIC_LOAD32_U_I64>;
236 // Sign-extending loads with constant offset
237 def : LoadPatImmOff<i32, atomic_load_8, regPlusImm, ATOMIC_LOAD8_U_I32>;
238 def : LoadPatImmOff<i32, atomic_load_16, regPlusImm, ATOMIC_LOAD16_U_I32>;
239 def : LoadPatImmOff<i32, atomic_load_8, or_is_add, ATOMIC_LOAD8_U_I32>;
240 def : LoadPatImmOff<i32, atomic_load_16, or_is_add, ATOMIC_LOAD16_U_I32>;
241 def : LoadPatImmOff<i64, sext_aload_8_64, regPlusImm, ATOMIC_LOAD8_U_I64>;
242 def : LoadPatImmOff<i64, sext_aload_16_64, regPlusImm, ATOMIC_LOAD16_U_I64>;
243 def : LoadPatImmOff<i64, sext_aload_8_64, or_is_add, ATOMIC_LOAD8_U_I64>;
244 def : LoadPatImmOff<i64, sext_aload_16_64, or_is_add, ATOMIC_LOAD16_U_I64>;
245 // No 32->64 patterns, just use i32.atomic.load and i64.extend_s/i64
247 def : LoadPatGlobalAddr<i32, zext_aload_8_32, ATOMIC_LOAD8_U_I32>;
248 def : LoadPatGlobalAddr<i32, zext_aload_16_32, ATOMIC_LOAD16_U_I32>;
249 def : LoadPatGlobalAddr<i64, zext_aload_8_64, ATOMIC_LOAD8_U_I64>;
250 def : LoadPatGlobalAddr<i64, zext_aload_16_64, ATOMIC_LOAD16_U_I64>;
251 def : LoadPatGlobalAddr<i64, zext_aload_32_64, ATOMIC_LOAD32_U_I64>;
252 def : LoadPatGlobalAddr<i32, atomic_load_8, ATOMIC_LOAD8_U_I32>;
253 def : LoadPatGlobalAddr<i32, atomic_load_16, ATOMIC_LOAD16_U_I32>;
254 def : LoadPatGlobalAddr<i64, sext_aload_8_64, ATOMIC_LOAD8_U_I64>;
255 def : LoadPatGlobalAddr<i64, sext_aload_16_64, ATOMIC_LOAD16_U_I64>;
257 // Extending loads with just a constant offset
258 def : LoadPatOffsetOnly<i32, zext_aload_8_32, ATOMIC_LOAD8_U_I32>;
259 def : LoadPatOffsetOnly<i32, zext_aload_16_32, ATOMIC_LOAD16_U_I32>;
260 def : LoadPatOffsetOnly<i64, zext_aload_8_64, ATOMIC_LOAD8_U_I64>;
261 def : LoadPatOffsetOnly<i64, zext_aload_16_64, ATOMIC_LOAD16_U_I64>;
262 def : LoadPatOffsetOnly<i64, zext_aload_32_64, ATOMIC_LOAD32_U_I64>;
263 def : LoadPatOffsetOnly<i32, atomic_load_8, ATOMIC_LOAD8_U_I32>;
264 def : LoadPatOffsetOnly<i32, atomic_load_16, ATOMIC_LOAD16_U_I32>;
265 def : LoadPatOffsetOnly<i64, sext_aload_8_64, ATOMIC_LOAD8_U_I64>;
266 def : LoadPatOffsetOnly<i64, sext_aload_16_64, ATOMIC_LOAD16_U_I64>;
268 def : LoadPatGlobalAddrOffOnly<i32, zext_aload_8_32, ATOMIC_LOAD8_U_I32>;
269 def : LoadPatGlobalAddrOffOnly<i32, zext_aload_16_32, ATOMIC_LOAD16_U_I32>;
270 def : LoadPatGlobalAddrOffOnly<i64, zext_aload_8_64, ATOMIC_LOAD8_U_I64>;
271 def : LoadPatGlobalAddrOffOnly<i64, zext_aload_16_64, ATOMIC_LOAD16_U_I64>;
272 def : LoadPatGlobalAddrOffOnly<i64, zext_aload_32_64, ATOMIC_LOAD32_U_I64>;
273 def : LoadPatGlobalAddrOffOnly<i32, atomic_load_8, ATOMIC_LOAD8_U_I32>;
274 def : LoadPatGlobalAddrOffOnly<i32, atomic_load_16, ATOMIC_LOAD16_U_I32>;
275 def : LoadPatGlobalAddrOffOnly<i64, sext_aload_8_64, ATOMIC_LOAD8_U_I64>;
276 def : LoadPatGlobalAddrOffOnly<i64, sext_aload_16_64, ATOMIC_LOAD16_U_I64>;
278 } // Predicates = [HasAtomics]
280 //===----------------------------------------------------------------------===//
282 //===----------------------------------------------------------------------===//
284 multiclass AtomicStore<WebAssemblyRegClass rc, string name, int atomic_op> {
285 defm "" : WebAssemblyStore<rc, name, !or(0xfe00, !and(0xff, atomic_op))>,
286 Requires<[HasAtomics]>;
289 defm ATOMIC_STORE_I32 : AtomicStore<I32, "i32.atomic.store", 0x17>;
290 defm ATOMIC_STORE_I64 : AtomicStore<I64, "i64.atomic.store", 0x18>;
292 // We need an 'atomic' version of store patterns because store and atomic_store
293 // nodes have different operand orders:
294 // store: (store $val, $ptr)
295 // atomic_store: (store $ptr, $val)
297 let Predicates = [HasAtomics] in {
299 // Select stores with no constant offset.
300 class AStorePatNoOffset<ValueType ty, PatFrag kind, NI inst> :
301 Pat<(kind I32:$addr, ty:$val), (inst 0, 0, I32:$addr, ty:$val)>;
302 def : AStorePatNoOffset<i32, atomic_store_32, ATOMIC_STORE_I32>;
303 def : AStorePatNoOffset<i64, atomic_store_64, ATOMIC_STORE_I64>;
305 // Select stores with a constant offset.
307 // Pattern with address + immediate offset
308 class AStorePatImmOff<ValueType ty, PatFrag kind, PatFrag operand, NI inst> :
309 Pat<(kind (operand I32:$addr, imm:$off), ty:$val),
310 (inst 0, imm:$off, I32:$addr, ty:$val)>;
311 def : AStorePatImmOff<i32, atomic_store_32, regPlusImm, ATOMIC_STORE_I32>;
312 def : AStorePatImmOff<i64, atomic_store_64, regPlusImm, ATOMIC_STORE_I64>;
313 def : AStorePatImmOff<i32, atomic_store_32, or_is_add, ATOMIC_STORE_I32>;
314 def : AStorePatImmOff<i64, atomic_store_64, or_is_add, ATOMIC_STORE_I64>;
316 class AStorePatGlobalAddr<ValueType ty, PatFrag kind, NI inst> :
317 Pat<(kind (regPlusGA I32:$addr, (WebAssemblywrapper tglobaladdr:$off)),
319 (inst 0, tglobaladdr:$off, I32:$addr, ty:$val)>;
320 def : AStorePatGlobalAddr<i32, atomic_store_32, ATOMIC_STORE_I32>;
321 def : AStorePatGlobalAddr<i64, atomic_store_64, ATOMIC_STORE_I64>;
323 // Select stores with just a constant offset.
324 class AStorePatOffsetOnly<ValueType ty, PatFrag kind, NI inst> :
325 Pat<(kind imm:$off, ty:$val), (inst 0, imm:$off, (CONST_I32 0), ty:$val)>;
326 def : AStorePatOffsetOnly<i32, atomic_store_32, ATOMIC_STORE_I32>;
327 def : AStorePatOffsetOnly<i64, atomic_store_64, ATOMIC_STORE_I64>;
329 class AStorePatGlobalAddrOffOnly<ValueType ty, PatFrag kind, NI inst> :
330 Pat<(kind (WebAssemblywrapper tglobaladdr:$off), ty:$val),
331 (inst 0, tglobaladdr:$off, (CONST_I32 0), ty:$val)>;
332 def : AStorePatGlobalAddrOffOnly<i32, atomic_store_32, ATOMIC_STORE_I32>;
333 def : AStorePatGlobalAddrOffOnly<i64, atomic_store_64, ATOMIC_STORE_I64>;
335 } // Predicates = [HasAtomics]
337 // Truncating stores.
338 defm ATOMIC_STORE8_I32 : AtomicStore<I32, "i32.atomic.store8", 0x19>;
339 defm ATOMIC_STORE16_I32 : AtomicStore<I32, "i32.atomic.store16", 0x1a>;
340 defm ATOMIC_STORE8_I64 : AtomicStore<I64, "i64.atomic.store8", 0x1b>;
341 defm ATOMIC_STORE16_I64 : AtomicStore<I64, "i64.atomic.store16", 0x1c>;
342 defm ATOMIC_STORE32_I64 : AtomicStore<I64, "i64.atomic.store32", 0x1d>;
344 // Fragments for truncating stores.
346 // We don't have single truncating atomic store instructions. For 32-bit
347 // instructions, we just need to match bare atomic stores. On the other hand,
348 // truncating stores from i64 values are once truncated to i32 first.
349 class trunc_astore_64<PatFrag kind> :
350 PatFrag<(ops node:$addr, node:$val),
351 (kind node:$addr, (i32 (trunc (i64 node:$val))))>;
352 def trunc_astore_8_64 : trunc_astore_64<atomic_store_8>;
353 def trunc_astore_16_64 : trunc_astore_64<atomic_store_16>;
354 def trunc_astore_32_64 : trunc_astore_64<atomic_store_32>;
356 let Predicates = [HasAtomics] in {
358 // Truncating stores with no constant offset
359 def : AStorePatNoOffset<i32, atomic_store_8, ATOMIC_STORE8_I32>;
360 def : AStorePatNoOffset<i32, atomic_store_16, ATOMIC_STORE16_I32>;
361 def : AStorePatNoOffset<i64, trunc_astore_8_64, ATOMIC_STORE8_I64>;
362 def : AStorePatNoOffset<i64, trunc_astore_16_64, ATOMIC_STORE16_I64>;
363 def : AStorePatNoOffset<i64, trunc_astore_32_64, ATOMIC_STORE32_I64>;
365 // Truncating stores with a constant offset
366 def : AStorePatImmOff<i32, atomic_store_8, regPlusImm, ATOMIC_STORE8_I32>;
367 def : AStorePatImmOff<i32, atomic_store_16, regPlusImm, ATOMIC_STORE16_I32>;
368 def : AStorePatImmOff<i64, trunc_astore_8_64, regPlusImm, ATOMIC_STORE8_I64>;
369 def : AStorePatImmOff<i64, trunc_astore_16_64, regPlusImm, ATOMIC_STORE16_I64>;
370 def : AStorePatImmOff<i64, trunc_astore_32_64, regPlusImm, ATOMIC_STORE32_I64>;
371 def : AStorePatImmOff<i32, atomic_store_8, or_is_add, ATOMIC_STORE8_I32>;
372 def : AStorePatImmOff<i32, atomic_store_16, or_is_add, ATOMIC_STORE16_I32>;
373 def : AStorePatImmOff<i64, trunc_astore_8_64, or_is_add, ATOMIC_STORE8_I64>;
374 def : AStorePatImmOff<i64, trunc_astore_16_64, or_is_add, ATOMIC_STORE16_I64>;
375 def : AStorePatImmOff<i64, trunc_astore_32_64, or_is_add, ATOMIC_STORE32_I64>;
377 def : AStorePatGlobalAddr<i32, atomic_store_8, ATOMIC_STORE8_I32>;
378 def : AStorePatGlobalAddr<i32, atomic_store_16, ATOMIC_STORE16_I32>;
379 def : AStorePatGlobalAddr<i64, trunc_astore_8_64, ATOMIC_STORE8_I64>;
380 def : AStorePatGlobalAddr<i64, trunc_astore_16_64, ATOMIC_STORE16_I64>;
381 def : AStorePatGlobalAddr<i64, trunc_astore_32_64, ATOMIC_STORE32_I64>;
383 // Truncating stores with just a constant offset
384 def : AStorePatOffsetOnly<i32, atomic_store_8, ATOMIC_STORE8_I32>;
385 def : AStorePatOffsetOnly<i32, atomic_store_16, ATOMIC_STORE16_I32>;
386 def : AStorePatOffsetOnly<i64, trunc_astore_8_64, ATOMIC_STORE8_I64>;
387 def : AStorePatOffsetOnly<i64, trunc_astore_16_64, ATOMIC_STORE16_I64>;
388 def : AStorePatOffsetOnly<i64, trunc_astore_32_64, ATOMIC_STORE32_I64>;
390 def : AStorePatGlobalAddrOffOnly<i32, atomic_store_8, ATOMIC_STORE8_I32>;
391 def : AStorePatGlobalAddrOffOnly<i32, atomic_store_16, ATOMIC_STORE16_I32>;
392 def : AStorePatGlobalAddrOffOnly<i64, trunc_astore_8_64, ATOMIC_STORE8_I64>;
393 def : AStorePatGlobalAddrOffOnly<i64, trunc_astore_16_64, ATOMIC_STORE16_I64>;
394 def : AStorePatGlobalAddrOffOnly<i64, trunc_astore_32_64, ATOMIC_STORE32_I64>;
396 } // Predicates = [HasAtomics]
398 //===----------------------------------------------------------------------===//
399 // Atomic binary read-modify-writes
400 //===----------------------------------------------------------------------===//
402 multiclass WebAssemblyBinRMW<WebAssemblyRegClass rc, string name,
405 ATOMIC_I<(outs rc:$dst),
406 (ins P2Align:$p2align, offset32_op:$off, I32:$addr, rc:$val),
407 (outs), (ins P2Align:$p2align, offset32_op:$off), [],
408 !strconcat(name, "\t$dst, ${off}(${addr})${p2align}, $val"),
409 !strconcat(name, "\t${off}${p2align}"), atomic_op>;
412 defm ATOMIC_RMW_ADD_I32 : WebAssemblyBinRMW<I32, "i32.atomic.rmw.add", 0x1e>;
413 defm ATOMIC_RMW_ADD_I64 : WebAssemblyBinRMW<I64, "i64.atomic.rmw.add", 0x1f>;
414 defm ATOMIC_RMW8_U_ADD_I32 :
415 WebAssemblyBinRMW<I32, "i32.atomic.rmw8.add_u", 0x20>;
416 defm ATOMIC_RMW16_U_ADD_I32 :
417 WebAssemblyBinRMW<I32, "i32.atomic.rmw16.add_u", 0x21>;
418 defm ATOMIC_RMW8_U_ADD_I64 :
419 WebAssemblyBinRMW<I64, "i64.atomic.rmw8.add_u", 0x22>;
420 defm ATOMIC_RMW16_U_ADD_I64 :
421 WebAssemblyBinRMW<I64, "i64.atomic.rmw16.add_u", 0x23>;
422 defm ATOMIC_RMW32_U_ADD_I64 :
423 WebAssemblyBinRMW<I64, "i64.atomic.rmw32.add_u", 0x24>;
425 defm ATOMIC_RMW_SUB_I32 : WebAssemblyBinRMW<I32, "i32.atomic.rmw.sub", 0x25>;
426 defm ATOMIC_RMW_SUB_I64 : WebAssemblyBinRMW<I64, "i64.atomic.rmw.sub", 0x26>;
427 defm ATOMIC_RMW8_U_SUB_I32 :
428 WebAssemblyBinRMW<I32, "i32.atomic.rmw8.sub_u", 0x27>;
429 defm ATOMIC_RMW16_U_SUB_I32 :
430 WebAssemblyBinRMW<I32, "i32.atomic.rmw16.sub_u", 0x28>;
431 defm ATOMIC_RMW8_U_SUB_I64 :
432 WebAssemblyBinRMW<I64, "i64.atomic.rmw8.sub_u", 0x29>;
433 defm ATOMIC_RMW16_U_SUB_I64 :
434 WebAssemblyBinRMW<I64, "i64.atomic.rmw16.sub_u", 0x2a>;
435 defm ATOMIC_RMW32_U_SUB_I64 :
436 WebAssemblyBinRMW<I64, "i64.atomic.rmw32.sub_u", 0x2b>;
438 defm ATOMIC_RMW_AND_I32 : WebAssemblyBinRMW<I32, "i32.atomic.rmw.and", 0x2c>;
439 defm ATOMIC_RMW_AND_I64 : WebAssemblyBinRMW<I64, "i64.atomic.rmw.and", 0x2d>;
440 defm ATOMIC_RMW8_U_AND_I32 :
441 WebAssemblyBinRMW<I32, "i32.atomic.rmw8.and_u", 0x2e>;
442 defm ATOMIC_RMW16_U_AND_I32 :
443 WebAssemblyBinRMW<I32, "i32.atomic.rmw16.and_u", 0x2f>;
444 defm ATOMIC_RMW8_U_AND_I64 :
445 WebAssemblyBinRMW<I64, "i64.atomic.rmw8.and_u", 0x30>;
446 defm ATOMIC_RMW16_U_AND_I64 :
447 WebAssemblyBinRMW<I64, "i64.atomic.rmw16.and_u", 0x31>;
448 defm ATOMIC_RMW32_U_AND_I64 :
449 WebAssemblyBinRMW<I64, "i64.atomic.rmw32.and_u", 0x32>;
451 defm ATOMIC_RMW_OR_I32 : WebAssemblyBinRMW<I32, "i32.atomic.rmw.or", 0x33>;
452 defm ATOMIC_RMW_OR_I64 : WebAssemblyBinRMW<I64, "i64.atomic.rmw.or", 0x34>;
453 defm ATOMIC_RMW8_U_OR_I32 :
454 WebAssemblyBinRMW<I32, "i32.atomic.rmw8.or_u", 0x35>;
455 defm ATOMIC_RMW16_U_OR_I32 :
456 WebAssemblyBinRMW<I32, "i32.atomic.rmw16.or_u", 0x36>;
457 defm ATOMIC_RMW8_U_OR_I64 :
458 WebAssemblyBinRMW<I64, "i64.atomic.rmw8.or_u", 0x37>;
459 defm ATOMIC_RMW16_U_OR_I64 :
460 WebAssemblyBinRMW<I64, "i64.atomic.rmw16.or_u", 0x38>;
461 defm ATOMIC_RMW32_U_OR_I64 :
462 WebAssemblyBinRMW<I64, "i64.atomic.rmw32.or_u", 0x39>;
464 defm ATOMIC_RMW_XOR_I32 : WebAssemblyBinRMW<I32, "i32.atomic.rmw.xor", 0x3a>;
465 defm ATOMIC_RMW_XOR_I64 : WebAssemblyBinRMW<I64, "i64.atomic.rmw.xor", 0x3b>;
466 defm ATOMIC_RMW8_U_XOR_I32 :
467 WebAssemblyBinRMW<I32, "i32.atomic.rmw8.xor_u", 0x3c>;
468 defm ATOMIC_RMW16_U_XOR_I32 :
469 WebAssemblyBinRMW<I32, "i32.atomic.rmw16.xor_u", 0x3d>;
470 defm ATOMIC_RMW8_U_XOR_I64 :
471 WebAssemblyBinRMW<I64, "i64.atomic.rmw8.xor_u", 0x3e>;
472 defm ATOMIC_RMW16_U_XOR_I64 :
473 WebAssemblyBinRMW<I64, "i64.atomic.rmw16.xor_u", 0x3f>;
474 defm ATOMIC_RMW32_U_XOR_I64 :
475 WebAssemblyBinRMW<I64, "i64.atomic.rmw32.xor_u", 0x40>;
477 defm ATOMIC_RMW_XCHG_I32 :
478 WebAssemblyBinRMW<I32, "i32.atomic.rmw.xchg", 0x41>;
479 defm ATOMIC_RMW_XCHG_I64 :
480 WebAssemblyBinRMW<I64, "i64.atomic.rmw.xchg", 0x42>;
481 defm ATOMIC_RMW8_U_XCHG_I32 :
482 WebAssemblyBinRMW<I32, "i32.atomic.rmw8.xchg_u", 0x43>;
483 defm ATOMIC_RMW16_U_XCHG_I32 :
484 WebAssemblyBinRMW<I32, "i32.atomic.rmw16.xchg_u", 0x44>;
485 defm ATOMIC_RMW8_U_XCHG_I64 :
486 WebAssemblyBinRMW<I64, "i64.atomic.rmw8.xchg_u", 0x45>;
487 defm ATOMIC_RMW16_U_XCHG_I64 :
488 WebAssemblyBinRMW<I64, "i64.atomic.rmw16.xchg_u", 0x46>;
489 defm ATOMIC_RMW32_U_XCHG_I64 :
490 WebAssemblyBinRMW<I64, "i64.atomic.rmw32.xchg_u", 0x47>;
492 // Select binary RMWs with no constant offset.
493 class BinRMWPatNoOffset<ValueType ty, PatFrag kind, NI inst> :
494 Pat<(ty (kind I32:$addr, ty:$val)), (inst 0, 0, I32:$addr, ty:$val)>;
496 // Select binary RMWs with a constant offset.
498 // Pattern with address + immediate offset
499 class BinRMWPatImmOff<ValueType ty, PatFrag kind, PatFrag operand, NI inst> :
500 Pat<(ty (kind (operand I32:$addr, imm:$off), ty:$val)),
501 (inst 0, imm:$off, I32:$addr, ty:$val)>;
503 class BinRMWPatGlobalAddr<ValueType ty, PatFrag kind, NI inst> :
504 Pat<(ty (kind (regPlusGA I32:$addr, (WebAssemblywrapper tglobaladdr:$off)),
506 (inst 0, tglobaladdr:$off, I32:$addr, ty:$val)>;
508 // Select binary RMWs with just a constant offset.
509 class BinRMWPatOffsetOnly<ValueType ty, PatFrag kind, NI inst> :
510 Pat<(ty (kind imm:$off, ty:$val)),
511 (inst 0, imm:$off, (CONST_I32 0), ty:$val)>;
513 class BinRMWPatGlobalAddrOffOnly<ValueType ty, PatFrag kind, NI inst> :
514 Pat<(ty (kind (WebAssemblywrapper tglobaladdr:$off), ty:$val)),
515 (inst 0, tglobaladdr:$off, (CONST_I32 0), ty:$val)>;
517 // Patterns for various addressing modes.
518 multiclass BinRMWPattern<PatFrag rmw_32, PatFrag rmw_64, NI inst_32,
520 def : BinRMWPatNoOffset<i32, rmw_32, inst_32>;
521 def : BinRMWPatNoOffset<i64, rmw_64, inst_64>;
523 def : BinRMWPatImmOff<i32, rmw_32, regPlusImm, inst_32>;
524 def : BinRMWPatImmOff<i64, rmw_64, regPlusImm, inst_64>;
525 def : BinRMWPatImmOff<i32, rmw_32, or_is_add, inst_32>;
526 def : BinRMWPatImmOff<i64, rmw_64, or_is_add, inst_64>;
528 def : BinRMWPatGlobalAddr<i32, rmw_32, inst_32>;
529 def : BinRMWPatGlobalAddr<i64, rmw_64, inst_64>;
531 def : BinRMWPatOffsetOnly<i32, rmw_32, inst_32>;
532 def : BinRMWPatOffsetOnly<i64, rmw_64, inst_64>;
534 def : BinRMWPatGlobalAddrOffOnly<i32, rmw_32, inst_32>;
535 def : BinRMWPatGlobalAddrOffOnly<i64, rmw_64, inst_64>;
538 let Predicates = [HasAtomics] in {
539 defm : BinRMWPattern<atomic_load_add_32, atomic_load_add_64, ATOMIC_RMW_ADD_I32,
541 defm : BinRMWPattern<atomic_load_sub_32, atomic_load_sub_64, ATOMIC_RMW_SUB_I32,
543 defm : BinRMWPattern<atomic_load_and_32, atomic_load_and_64, ATOMIC_RMW_AND_I32,
545 defm : BinRMWPattern<atomic_load_or_32, atomic_load_or_64, ATOMIC_RMW_OR_I32,
547 defm : BinRMWPattern<atomic_load_xor_32, atomic_load_xor_64, ATOMIC_RMW_XOR_I32,
549 defm : BinRMWPattern<atomic_swap_32, atomic_swap_64, ATOMIC_RMW_XCHG_I32,
550 ATOMIC_RMW_XCHG_I64>;
551 } // Predicates = [HasAtomics]
553 // Truncating & zero-extending binary RMW patterns.
554 // These are combined patterns of truncating store patterns and zero-extending
555 // load patterns above.
556 class zext_bin_rmw_8_32<PatFrag kind> :
557 PatFrag<(ops node:$addr, node:$val),
558 (and (i32 (kind node:$addr, node:$val)), 255)>;
559 class zext_bin_rmw_16_32<PatFrag kind> :
560 PatFrag<(ops node:$addr, node:$val),
561 (and (i32 (kind node:$addr, node:$val)), 65535)>;
562 class zext_bin_rmw_8_64<PatFrag kind> :
563 PatFrag<(ops node:$addr, node:$val),
564 (and (i64 (anyext (i32 (kind node:$addr,
565 (i32 (trunc (i64 node:$val))))))), 255)>;
566 class zext_bin_rmw_16_64<PatFrag kind> :
567 PatFrag<(ops node:$addr, node:$val),
568 (and (i64 (anyext (i32 (kind node:$addr,
569 (i32 (trunc (i64 node:$val))))))), 65535)>;
570 class zext_bin_rmw_32_64<PatFrag kind> :
571 PatFrag<(ops node:$addr, node:$val),
572 (zext (i32 (kind node:$addr, (i32 (trunc (i64 node:$val))))))>;
574 // Truncating & sign-extending binary RMW patterns.
575 // These are combined patterns of truncating store patterns and sign-extending
576 // load patterns above. We match subword RMWs (for 32-bit) and anyext RMWs (for
577 // 64-bit) and select a zext RMW; the next instruction will be sext_inreg which
578 // is selected by itself.
579 class sext_bin_rmw_8_32<PatFrag kind> :
580 PatFrag<(ops node:$addr, node:$val), (kind node:$addr, node:$val)>;
581 class sext_bin_rmw_16_32<PatFrag kind> : sext_bin_rmw_8_32<kind>;
582 class sext_bin_rmw_8_64<PatFrag kind> :
583 PatFrag<(ops node:$addr, node:$val),
584 (anyext (i32 (kind node:$addr, (i32 (trunc (i64 node:$val))))))>;
585 class sext_bin_rmw_16_64<PatFrag kind> : sext_bin_rmw_8_64<kind>;
586 // 32->64 sext RMW gets selected as i32.atomic.rmw.***, i64.extend_i32_s
588 // Patterns for various addressing modes for truncating-extending binary RMWs.
589 multiclass BinRMWTruncExtPattern<
590 PatFrag rmw_8, PatFrag rmw_16, PatFrag rmw_32, PatFrag rmw_64,
591 NI inst8_32, NI inst16_32, NI inst8_64, NI inst16_64, NI inst32_64> {
592 // Truncating-extending binary RMWs with no constant offset
593 def : BinRMWPatNoOffset<i32, zext_bin_rmw_8_32<rmw_8>, inst8_32>;
594 def : BinRMWPatNoOffset<i32, zext_bin_rmw_16_32<rmw_16>, inst16_32>;
595 def : BinRMWPatNoOffset<i64, zext_bin_rmw_8_64<rmw_8>, inst8_64>;
596 def : BinRMWPatNoOffset<i64, zext_bin_rmw_16_64<rmw_16>, inst16_64>;
597 def : BinRMWPatNoOffset<i64, zext_bin_rmw_32_64<rmw_32>, inst32_64>;
599 def : BinRMWPatNoOffset<i32, sext_bin_rmw_8_32<rmw_8>, inst8_32>;
600 def : BinRMWPatNoOffset<i32, sext_bin_rmw_16_32<rmw_16>, inst16_32>;
601 def : BinRMWPatNoOffset<i64, sext_bin_rmw_8_64<rmw_8>, inst8_64>;
602 def : BinRMWPatNoOffset<i64, sext_bin_rmw_16_64<rmw_16>, inst16_64>;
604 // Truncating-extending binary RMWs with a constant offset
605 def : BinRMWPatImmOff<i32, zext_bin_rmw_8_32<rmw_8>, regPlusImm, inst8_32>;
606 def : BinRMWPatImmOff<i32, zext_bin_rmw_16_32<rmw_16>, regPlusImm, inst16_32>;
607 def : BinRMWPatImmOff<i64, zext_bin_rmw_8_64<rmw_8>, regPlusImm, inst8_64>;
608 def : BinRMWPatImmOff<i64, zext_bin_rmw_16_64<rmw_16>, regPlusImm, inst16_64>;
609 def : BinRMWPatImmOff<i64, zext_bin_rmw_32_64<rmw_32>, regPlusImm, inst32_64>;
610 def : BinRMWPatImmOff<i32, zext_bin_rmw_8_32<rmw_8>, or_is_add, inst8_32>;
611 def : BinRMWPatImmOff<i32, zext_bin_rmw_16_32<rmw_16>, or_is_add, inst16_32>;
612 def : BinRMWPatImmOff<i64, zext_bin_rmw_8_64<rmw_8>, or_is_add, inst8_64>;
613 def : BinRMWPatImmOff<i64, zext_bin_rmw_16_64<rmw_16>, or_is_add, inst16_64>;
614 def : BinRMWPatImmOff<i64, zext_bin_rmw_32_64<rmw_32>, or_is_add, inst32_64>;
616 def : BinRMWPatImmOff<i32, sext_bin_rmw_8_32<rmw_8>, regPlusImm, inst8_32>;
617 def : BinRMWPatImmOff<i32, sext_bin_rmw_16_32<rmw_16>, regPlusImm, inst16_32>;
618 def : BinRMWPatImmOff<i64, sext_bin_rmw_8_64<rmw_8>, regPlusImm, inst8_64>;
619 def : BinRMWPatImmOff<i64, sext_bin_rmw_16_64<rmw_16>, regPlusImm, inst16_64>;
620 def : BinRMWPatImmOff<i32, sext_bin_rmw_8_32<rmw_8>, or_is_add, inst8_32>;
621 def : BinRMWPatImmOff<i32, sext_bin_rmw_16_32<rmw_16>, or_is_add, inst16_32>;
622 def : BinRMWPatImmOff<i64, sext_bin_rmw_8_64<rmw_8>, or_is_add, inst8_64>;
623 def : BinRMWPatImmOff<i64, sext_bin_rmw_16_64<rmw_16>, or_is_add, inst16_64>;
625 def : BinRMWPatGlobalAddr<i32, zext_bin_rmw_8_32<rmw_8>, inst8_32>;
626 def : BinRMWPatGlobalAddr<i32, zext_bin_rmw_16_32<rmw_16>, inst16_32>;
627 def : BinRMWPatGlobalAddr<i64, zext_bin_rmw_8_64<rmw_8>, inst8_64>;
628 def : BinRMWPatGlobalAddr<i64, zext_bin_rmw_16_64<rmw_16>, inst16_64>;
629 def : BinRMWPatGlobalAddr<i64, zext_bin_rmw_32_64<rmw_32>, inst32_64>;
631 def : BinRMWPatGlobalAddr<i32, sext_bin_rmw_8_32<rmw_8>, inst8_32>;
632 def : BinRMWPatGlobalAddr<i32, sext_bin_rmw_16_32<rmw_16>, inst16_32>;
633 def : BinRMWPatGlobalAddr<i64, sext_bin_rmw_8_64<rmw_8>, inst8_64>;
634 def : BinRMWPatGlobalAddr<i64, sext_bin_rmw_16_64<rmw_16>, inst16_64>;
636 // Truncating-extending binary RMWs with just a constant offset
637 def : BinRMWPatOffsetOnly<i32, zext_bin_rmw_8_32<rmw_8>, inst8_32>;
638 def : BinRMWPatOffsetOnly<i32, zext_bin_rmw_16_32<rmw_16>, inst16_32>;
639 def : BinRMWPatOffsetOnly<i64, zext_bin_rmw_8_64<rmw_8>, inst8_64>;
640 def : BinRMWPatOffsetOnly<i64, zext_bin_rmw_16_64<rmw_16>, inst16_64>;
641 def : BinRMWPatOffsetOnly<i64, zext_bin_rmw_32_64<rmw_32>, inst32_64>;
643 def : BinRMWPatOffsetOnly<i32, sext_bin_rmw_8_32<rmw_8>, inst8_32>;
644 def : BinRMWPatOffsetOnly<i32, sext_bin_rmw_16_32<rmw_16>, inst16_32>;
645 def : BinRMWPatOffsetOnly<i64, sext_bin_rmw_8_64<rmw_8>, inst8_64>;
646 def : BinRMWPatOffsetOnly<i64, sext_bin_rmw_16_64<rmw_16>, inst16_64>;
648 def : BinRMWPatGlobalAddrOffOnly<i32, zext_bin_rmw_8_32<rmw_8>, inst8_32>;
649 def : BinRMWPatGlobalAddrOffOnly<i32, zext_bin_rmw_16_32<rmw_16>, inst16_32>;
650 def : BinRMWPatGlobalAddrOffOnly<i64, zext_bin_rmw_8_64<rmw_8>, inst8_64>;
651 def : BinRMWPatGlobalAddrOffOnly<i64, zext_bin_rmw_16_64<rmw_16>, inst16_64>;
652 def : BinRMWPatGlobalAddrOffOnly<i64, zext_bin_rmw_32_64<rmw_32>, inst32_64>;
654 def : BinRMWPatGlobalAddrOffOnly<i32, sext_bin_rmw_8_32<rmw_8>, inst8_32>;
655 def : BinRMWPatGlobalAddrOffOnly<i32, sext_bin_rmw_16_32<rmw_16>, inst16_32>;
656 def : BinRMWPatGlobalAddrOffOnly<i64, sext_bin_rmw_8_64<rmw_8>, inst8_64>;
657 def : BinRMWPatGlobalAddrOffOnly<i64, sext_bin_rmw_16_64<rmw_16>, inst16_64>;
660 let Predicates = [HasAtomics] in {
661 defm : BinRMWTruncExtPattern<
662 atomic_load_add_8, atomic_load_add_16, atomic_load_add_32, atomic_load_add_64,
663 ATOMIC_RMW8_U_ADD_I32, ATOMIC_RMW16_U_ADD_I32,
664 ATOMIC_RMW8_U_ADD_I64, ATOMIC_RMW16_U_ADD_I64, ATOMIC_RMW32_U_ADD_I64>;
665 defm : BinRMWTruncExtPattern<
666 atomic_load_sub_8, atomic_load_sub_16, atomic_load_sub_32, atomic_load_sub_64,
667 ATOMIC_RMW8_U_SUB_I32, ATOMIC_RMW16_U_SUB_I32,
668 ATOMIC_RMW8_U_SUB_I64, ATOMIC_RMW16_U_SUB_I64, ATOMIC_RMW32_U_SUB_I64>;
669 defm : BinRMWTruncExtPattern<
670 atomic_load_and_8, atomic_load_and_16, atomic_load_and_32, atomic_load_and_64,
671 ATOMIC_RMW8_U_AND_I32, ATOMIC_RMW16_U_AND_I32,
672 ATOMIC_RMW8_U_AND_I64, ATOMIC_RMW16_U_AND_I64, ATOMIC_RMW32_U_AND_I64>;
673 defm : BinRMWTruncExtPattern<
674 atomic_load_or_8, atomic_load_or_16, atomic_load_or_32, atomic_load_or_64,
675 ATOMIC_RMW8_U_OR_I32, ATOMIC_RMW16_U_OR_I32,
676 ATOMIC_RMW8_U_OR_I64, ATOMIC_RMW16_U_OR_I64, ATOMIC_RMW32_U_OR_I64>;
677 defm : BinRMWTruncExtPattern<
678 atomic_load_xor_8, atomic_load_xor_16, atomic_load_xor_32, atomic_load_xor_64,
679 ATOMIC_RMW8_U_XOR_I32, ATOMIC_RMW16_U_XOR_I32,
680 ATOMIC_RMW8_U_XOR_I64, ATOMIC_RMW16_U_XOR_I64, ATOMIC_RMW32_U_XOR_I64>;
681 defm : BinRMWTruncExtPattern<
682 atomic_swap_8, atomic_swap_16, atomic_swap_32, atomic_swap_64,
683 ATOMIC_RMW8_U_XCHG_I32, ATOMIC_RMW16_U_XCHG_I32,
684 ATOMIC_RMW8_U_XCHG_I64, ATOMIC_RMW16_U_XCHG_I64, ATOMIC_RMW32_U_XCHG_I64>;
685 } // Predicates = [HasAtomics]
687 //===----------------------------------------------------------------------===//
688 // Atomic ternary read-modify-writes
689 //===----------------------------------------------------------------------===//
691 // TODO LLVM IR's cmpxchg instruction returns a pair of {loaded value, success
692 // flag}. When we use the success flag or both values, we can't make use of i64
693 // truncate/extend versions of instructions for now, which is suboptimal.
694 // Consider adding a pass after instruction selection that optimizes this case
695 // if it is frequent.
697 multiclass WebAssemblyTerRMW<WebAssemblyRegClass rc, string name,
700 ATOMIC_I<(outs rc:$dst),
701 (ins P2Align:$p2align, offset32_op:$off, I32:$addr, rc:$exp,
703 (outs), (ins P2Align:$p2align, offset32_op:$off), [],
704 !strconcat(name, "\t$dst, ${off}(${addr})${p2align}, $exp, $new_"),
705 !strconcat(name, "\t${off}${p2align}"), atomic_op>;
708 defm ATOMIC_RMW_CMPXCHG_I32 :
709 WebAssemblyTerRMW<I32, "i32.atomic.rmw.cmpxchg", 0x48>;
710 defm ATOMIC_RMW_CMPXCHG_I64 :
711 WebAssemblyTerRMW<I64, "i64.atomic.rmw.cmpxchg", 0x49>;
712 defm ATOMIC_RMW8_U_CMPXCHG_I32 :
713 WebAssemblyTerRMW<I32, "i32.atomic.rmw8.cmpxchg_u", 0x4a>;
714 defm ATOMIC_RMW16_U_CMPXCHG_I32 :
715 WebAssemblyTerRMW<I32, "i32.atomic.rmw16.cmpxchg_u", 0x4b>;
716 defm ATOMIC_RMW8_U_CMPXCHG_I64 :
717 WebAssemblyTerRMW<I64, "i64.atomic.rmw8.cmpxchg_u", 0x4c>;
718 defm ATOMIC_RMW16_U_CMPXCHG_I64 :
719 WebAssemblyTerRMW<I64, "i64.atomic.rmw16.cmpxchg_u", 0x4d>;
720 defm ATOMIC_RMW32_U_CMPXCHG_I64 :
721 WebAssemblyTerRMW<I64, "i64.atomic.rmw32.cmpxchg_u", 0x4e>;
723 // Select ternary RMWs with no constant offset.
724 class TerRMWPatNoOffset<ValueType ty, PatFrag kind, NI inst> :
725 Pat<(ty (kind I32:$addr, ty:$exp, ty:$new)),
726 (inst 0, 0, I32:$addr, ty:$exp, ty:$new)>;
728 // Select ternary RMWs with a constant offset.
730 // Pattern with address + immediate offset
731 class TerRMWPatImmOff<ValueType ty, PatFrag kind, PatFrag operand, NI inst> :
732 Pat<(ty (kind (operand I32:$addr, imm:$off), ty:$exp, ty:$new)),
733 (inst 0, imm:$off, I32:$addr, ty:$exp, ty:$new)>;
735 class TerRMWPatGlobalAddr<ValueType ty, PatFrag kind, NI inst> :
736 Pat<(ty (kind (regPlusGA I32:$addr, (WebAssemblywrapper tglobaladdr:$off)),
738 (inst 0, tglobaladdr:$off, I32:$addr, ty:$exp, ty:$new)>;
740 // Select ternary RMWs with just a constant offset.
741 class TerRMWPatOffsetOnly<ValueType ty, PatFrag kind, NI inst> :
742 Pat<(ty (kind imm:$off, ty:$exp, ty:$new)),
743 (inst 0, imm:$off, (CONST_I32 0), ty:$exp, ty:$new)>;
745 class TerRMWPatGlobalAddrOffOnly<ValueType ty, PatFrag kind, NI inst> :
746 Pat<(ty (kind (WebAssemblywrapper tglobaladdr:$off), ty:$exp, ty:$new)),
747 (inst 0, tglobaladdr:$off, (CONST_I32 0), ty:$exp, ty:$new)>;
749 // Patterns for various addressing modes.
750 multiclass TerRMWPattern<PatFrag rmw_32, PatFrag rmw_64, NI inst_32,
752 def : TerRMWPatNoOffset<i32, rmw_32, inst_32>;
753 def : TerRMWPatNoOffset<i64, rmw_64, inst_64>;
755 def : TerRMWPatImmOff<i32, rmw_32, regPlusImm, inst_32>;
756 def : TerRMWPatImmOff<i64, rmw_64, regPlusImm, inst_64>;
757 def : TerRMWPatImmOff<i32, rmw_32, or_is_add, inst_32>;
758 def : TerRMWPatImmOff<i64, rmw_64, or_is_add, inst_64>;
760 def : TerRMWPatGlobalAddr<i32, rmw_32, inst_32>;
761 def : TerRMWPatGlobalAddr<i64, rmw_64, inst_64>;
763 def : TerRMWPatOffsetOnly<i32, rmw_32, inst_32>;
764 def : TerRMWPatOffsetOnly<i64, rmw_64, inst_64>;
766 def : TerRMWPatGlobalAddrOffOnly<i32, rmw_32, inst_32>;
767 def : TerRMWPatGlobalAddrOffOnly<i64, rmw_64, inst_64>;
770 let Predicates = [HasAtomics] in
771 defm : TerRMWPattern<atomic_cmp_swap_32, atomic_cmp_swap_64,
772 ATOMIC_RMW_CMPXCHG_I32, ATOMIC_RMW_CMPXCHG_I64>;
774 // Truncating & zero-extending ternary RMW patterns.
775 // DAG legalization & optimization before instruction selection may introduce
776 // additional nodes such as anyext or assertzext depending on operand types.
777 class zext_ter_rmw_8_32<PatFrag kind> :
778 PatFrag<(ops node:$addr, node:$exp, node:$new),
779 (and (i32 (kind node:$addr, node:$exp, node:$new)), 255)>;
780 class zext_ter_rmw_16_32<PatFrag kind> :
781 PatFrag<(ops node:$addr, node:$exp, node:$new),
782 (and (i32 (kind node:$addr, node:$exp, node:$new)), 65535)>;
783 class zext_ter_rmw_8_64<PatFrag kind> :
784 PatFrag<(ops node:$addr, node:$exp, node:$new),
785 (zext (i32 (assertzext (i32 (kind node:$addr,
786 (i32 (trunc (i64 node:$exp))),
787 (i32 (trunc (i64 node:$new))))))))>;
788 class zext_ter_rmw_16_64<PatFrag kind> : zext_ter_rmw_8_64<kind>;
789 class zext_ter_rmw_32_64<PatFrag kind> :
790 PatFrag<(ops node:$addr, node:$exp, node:$new),
791 (zext (i32 (kind node:$addr,
792 (i32 (trunc (i64 node:$exp))),
793 (i32 (trunc (i64 node:$new))))))>;
795 // Truncating & sign-extending ternary RMW patterns.
796 // We match subword RMWs (for 32-bit) and anyext RMWs (for 64-bit) and select a
797 // zext RMW; the next instruction will be sext_inreg which is selected by
799 class sext_ter_rmw_8_32<PatFrag kind> :
800 PatFrag<(ops node:$addr, node:$exp, node:$new),
801 (kind node:$addr, node:$exp, node:$new)>;
802 class sext_ter_rmw_16_32<PatFrag kind> : sext_ter_rmw_8_32<kind>;
803 class sext_ter_rmw_8_64<PatFrag kind> :
804 PatFrag<(ops node:$addr, node:$exp, node:$new),
805 (anyext (i32 (assertzext (i32
807 (i32 (trunc (i64 node:$exp))),
808 (i32 (trunc (i64 node:$new))))))))>;
809 class sext_ter_rmw_16_64<PatFrag kind> : sext_ter_rmw_8_64<kind>;
810 // 32->64 sext RMW gets selected as i32.atomic.rmw.***, i64.extend_i32_s
812 // Patterns for various addressing modes for truncating-extending ternary RMWs.
813 multiclass TerRMWTruncExtPattern<
814 PatFrag rmw_8, PatFrag rmw_16, PatFrag rmw_32, PatFrag rmw_64,
815 NI inst8_32, NI inst16_32, NI inst8_64, NI inst16_64, NI inst32_64> {
816 // Truncating-extending ternary RMWs with no constant offset
817 def : TerRMWPatNoOffset<i32, zext_ter_rmw_8_32<rmw_8>, inst8_32>;
818 def : TerRMWPatNoOffset<i32, zext_ter_rmw_16_32<rmw_16>, inst16_32>;
819 def : TerRMWPatNoOffset<i64, zext_ter_rmw_8_64<rmw_8>, inst8_64>;
820 def : TerRMWPatNoOffset<i64, zext_ter_rmw_16_64<rmw_16>, inst16_64>;
821 def : TerRMWPatNoOffset<i64, zext_ter_rmw_32_64<rmw_32>, inst32_64>;
823 def : TerRMWPatNoOffset<i32, sext_ter_rmw_8_32<rmw_8>, inst8_32>;
824 def : TerRMWPatNoOffset<i32, sext_ter_rmw_16_32<rmw_16>, inst16_32>;
825 def : TerRMWPatNoOffset<i64, sext_ter_rmw_8_64<rmw_8>, inst8_64>;
826 def : TerRMWPatNoOffset<i64, sext_ter_rmw_16_64<rmw_16>, inst16_64>;
828 // Truncating-extending ternary RMWs with a constant offset
829 def : TerRMWPatImmOff<i32, zext_ter_rmw_8_32<rmw_8>, regPlusImm, inst8_32>;
830 def : TerRMWPatImmOff<i32, zext_ter_rmw_16_32<rmw_16>, regPlusImm, inst16_32>;
831 def : TerRMWPatImmOff<i64, zext_ter_rmw_8_64<rmw_8>, regPlusImm, inst8_64>;
832 def : TerRMWPatImmOff<i64, zext_ter_rmw_16_64<rmw_16>, regPlusImm, inst16_64>;
833 def : TerRMWPatImmOff<i64, zext_ter_rmw_32_64<rmw_32>, regPlusImm, inst32_64>;
834 def : TerRMWPatImmOff<i32, zext_ter_rmw_8_32<rmw_8>, or_is_add, inst8_32>;
835 def : TerRMWPatImmOff<i32, zext_ter_rmw_16_32<rmw_16>, or_is_add, inst16_32>;
836 def : TerRMWPatImmOff<i64, zext_ter_rmw_8_64<rmw_8>, or_is_add, inst8_64>;
837 def : TerRMWPatImmOff<i64, zext_ter_rmw_16_64<rmw_16>, or_is_add, inst16_64>;
838 def : TerRMWPatImmOff<i64, zext_ter_rmw_32_64<rmw_32>, or_is_add, inst32_64>;
840 def : TerRMWPatImmOff<i32, sext_ter_rmw_8_32<rmw_8>, regPlusImm, inst8_32>;
841 def : TerRMWPatImmOff<i32, sext_ter_rmw_16_32<rmw_16>, regPlusImm, inst16_32>;
842 def : TerRMWPatImmOff<i64, sext_ter_rmw_8_64<rmw_8>, regPlusImm, inst8_64>;
843 def : TerRMWPatImmOff<i64, sext_ter_rmw_16_64<rmw_16>, regPlusImm, inst16_64>;
844 def : TerRMWPatImmOff<i32, sext_ter_rmw_8_32<rmw_8>, or_is_add, inst8_32>;
845 def : TerRMWPatImmOff<i32, sext_ter_rmw_16_32<rmw_16>, or_is_add, inst16_32>;
846 def : TerRMWPatImmOff<i64, sext_ter_rmw_8_64<rmw_8>, or_is_add, inst8_64>;
847 def : TerRMWPatImmOff<i64, sext_ter_rmw_16_64<rmw_16>, or_is_add, inst16_64>;
849 def : TerRMWPatGlobalAddr<i32, zext_ter_rmw_8_32<rmw_8>, inst8_32>;
850 def : TerRMWPatGlobalAddr<i32, zext_ter_rmw_16_32<rmw_16>, inst16_32>;
851 def : TerRMWPatGlobalAddr<i64, zext_ter_rmw_8_64<rmw_8>, inst8_64>;
852 def : TerRMWPatGlobalAddr<i64, zext_ter_rmw_16_64<rmw_16>, inst16_64>;
853 def : TerRMWPatGlobalAddr<i64, zext_ter_rmw_32_64<rmw_32>, inst32_64>;
855 def : TerRMWPatGlobalAddr<i32, sext_ter_rmw_8_32<rmw_8>, inst8_32>;
856 def : TerRMWPatGlobalAddr<i32, sext_ter_rmw_16_32<rmw_16>, inst16_32>;
857 def : TerRMWPatGlobalAddr<i64, sext_ter_rmw_8_64<rmw_8>, inst8_64>;
858 def : TerRMWPatGlobalAddr<i64, sext_ter_rmw_16_64<rmw_16>, inst16_64>;
860 // Truncating-extending ternary RMWs with just a constant offset
861 def : TerRMWPatOffsetOnly<i32, zext_ter_rmw_8_32<rmw_8>, inst8_32>;
862 def : TerRMWPatOffsetOnly<i32, zext_ter_rmw_16_32<rmw_16>, inst16_32>;
863 def : TerRMWPatOffsetOnly<i64, zext_ter_rmw_8_64<rmw_8>, inst8_64>;
864 def : TerRMWPatOffsetOnly<i64, zext_ter_rmw_16_64<rmw_16>, inst16_64>;
865 def : TerRMWPatOffsetOnly<i64, zext_ter_rmw_32_64<rmw_32>, inst32_64>;
867 def : TerRMWPatOffsetOnly<i32, sext_ter_rmw_8_32<rmw_8>, inst8_32>;
868 def : TerRMWPatOffsetOnly<i32, sext_ter_rmw_16_32<rmw_16>, inst16_32>;
869 def : TerRMWPatOffsetOnly<i64, sext_ter_rmw_8_64<rmw_8>, inst8_64>;
870 def : TerRMWPatOffsetOnly<i64, sext_ter_rmw_16_64<rmw_16>, inst16_64>;
872 def : TerRMWPatGlobalAddrOffOnly<i32, zext_ter_rmw_8_32<rmw_8>, inst8_32>;
873 def : TerRMWPatGlobalAddrOffOnly<i32, zext_ter_rmw_16_32<rmw_16>, inst16_32>;
874 def : TerRMWPatGlobalAddrOffOnly<i64, zext_ter_rmw_8_64<rmw_8>, inst8_64>;
875 def : TerRMWPatGlobalAddrOffOnly<i64, zext_ter_rmw_16_64<rmw_16>, inst16_64>;
876 def : TerRMWPatGlobalAddrOffOnly<i64, zext_ter_rmw_32_64<rmw_32>, inst32_64>;
878 def : TerRMWPatGlobalAddrOffOnly<i32, sext_ter_rmw_8_32<rmw_8>, inst8_32>;
879 def : TerRMWPatGlobalAddrOffOnly<i32, sext_ter_rmw_16_32<rmw_16>, inst16_32>;
880 def : TerRMWPatGlobalAddrOffOnly<i64, sext_ter_rmw_8_64<rmw_8>, inst8_64>;
881 def : TerRMWPatGlobalAddrOffOnly<i64, sext_ter_rmw_16_64<rmw_16>, inst16_64>;
884 let Predicates = [HasAtomics] in
885 defm : TerRMWTruncExtPattern<
886 atomic_cmp_swap_8, atomic_cmp_swap_16, atomic_cmp_swap_32, atomic_cmp_swap_64,
887 ATOMIC_RMW8_U_CMPXCHG_I32, ATOMIC_RMW16_U_CMPXCHG_I32,
888 ATOMIC_RMW8_U_CMPXCHG_I64, ATOMIC_RMW16_U_CMPXCHG_I64,
889 ATOMIC_RMW32_U_CMPXCHG_I64>;
891 //===----------------------------------------------------------------------===//
893 //===----------------------------------------------------------------------===//
895 // A compiler fence instruction that prevents reordering of instructions.
896 let Defs = [ARGUMENTS] in {
897 let isPseudo = 1, hasSideEffects = 1 in
898 defm COMPILER_FENCE : ATOMIC_NRI<(outs), (ins), [], "compiler_fence">;
899 } // Defs = [ARGUMENTS]