blob: f0cb0c284bf2be986b5d8ad369676b752a16ce8b [file] [log] [blame]
Dan Gohman10e730a2015-06-29 23:51:55 +00001// WebAssemblyInstrAtomics.td-WebAssembly Atomic codegen support-*- tablegen -*-
2//
Chandler Carruth2946cd72019-01-19 08:50:56 +00003// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
Dan Gohman10e730a2015-06-29 23:51:55 +00006//
7//===----------------------------------------------------------------------===//
JF Bastien5ca0bac2015-07-10 18:23:10 +00008///
9/// \file
Adrian Prantl5f8f34e42018-05-01 15:54:18 +000010/// WebAssembly Atomic operand code-gen constructs.
JF Bastien5ca0bac2015-07-10 18:23:10 +000011///
Dan Gohman10e730a2015-06-29 23:51:55 +000012//===----------------------------------------------------------------------===//
13
Thomas Lively972d7d52019-03-09 04:31:37 +000014let UseNamedOperandTable = 1 in
Heejin Ahn20ea1822019-02-20 01:29:34 +000015multiclass ATOMIC_I<dag oops_r, dag iops_r, dag oops_s, dag iops_s,
16 list<dag> pattern_r, string asmstr_r = "",
17 string asmstr_s = "", bits<32> atomic_op = -1> {
18 defm "" : I<oops_r, iops_r, oops_s, iops_s, pattern_r, asmstr_r, asmstr_s,
19 !or(0xfe00, !and(0xff, atomic_op))>,
20 Requires<[HasAtomics]>;
21}
22
23multiclass ATOMIC_NRI<dag oops, dag iops, list<dag> pattern, string asmstr = "",
24 bits<32> atomic_op = -1> {
25 defm "" : NRI<oops, iops, pattern, asmstr,
26 !or(0xfe00, !and(0xff, atomic_op))>,
27 Requires<[HasAtomics]>;
28}
29
30//===----------------------------------------------------------------------===//
31// Atomic wait / notify
32//===----------------------------------------------------------------------===//
33
34let hasSideEffects = 1 in {
35defm ATOMIC_NOTIFY :
36 ATOMIC_I<(outs I32:$dst),
37 (ins P2Align:$p2align, offset32_op:$off, I32:$addr, I32:$count),
38 (outs), (ins P2Align:$p2align, offset32_op:$off), [],
39 "atomic.notify \t$dst, ${off}(${addr})${p2align}, $count",
40 "atomic.notify \t${off}${p2align}", 0x00>;
41let mayLoad = 1 in {
42defm ATOMIC_WAIT_I32 :
43 ATOMIC_I<(outs I32:$dst),
44 (ins P2Align:$p2align, offset32_op:$off, I32:$addr, I32:$exp,
45 I64:$timeout),
46 (outs), (ins P2Align:$p2align, offset32_op:$off), [],
47 "i32.atomic.wait \t$dst, ${off}(${addr})${p2align}, $exp, $timeout",
48 "i32.atomic.wait \t${off}${p2align}", 0x01>;
49defm ATOMIC_WAIT_I64 :
50 ATOMIC_I<(outs I32:$dst),
51 (ins P2Align:$p2align, offset32_op:$off, I32:$addr, I64:$exp,
52 I64:$timeout),
53 (outs), (ins P2Align:$p2align, offset32_op:$off), [],
54 "i64.atomic.wait \t$dst, ${off}(${addr})${p2align}, $exp, $timeout",
55 "i64.atomic.wait \t${off}${p2align}", 0x02>;
56} // mayLoad = 1
57} // hasSideEffects = 1
58
59let Predicates = [HasAtomics] in {
60// Select notifys with no constant offset.
61def NotifyPatNoOffset :
62 Pat<(i32 (int_wasm_atomic_notify I32:$addr, I32:$count)),
63 (ATOMIC_NOTIFY 0, 0, I32:$addr, I32:$count)>;
64
65// Select notifys with a constant offset.
66
67// Pattern with address + immediate offset
68class NotifyPatImmOff<PatFrag operand> :
69 Pat<(i32 (int_wasm_atomic_notify (operand I32:$addr, imm:$off), I32:$count)),
70 (ATOMIC_NOTIFY 0, imm:$off, I32:$addr, I32:$count)>;
71def : NotifyPatImmOff<regPlusImm>;
72def : NotifyPatImmOff<or_is_add>;
73
74def NotifyPatGlobalAddr :
75 Pat<(i32 (int_wasm_atomic_notify (regPlusGA I32:$addr,
76 (WebAssemblywrapper tglobaladdr:$off)),
77 I32:$count)),
78 (ATOMIC_NOTIFY 0, tglobaladdr:$off, I32:$addr, I32:$count)>;
79
80def NotifyPatExternalSym :
81 Pat<(i32 (int_wasm_atomic_notify (add I32:$addr,
82 (WebAssemblywrapper texternalsym:$off)),
83 I32:$count)),
84 (ATOMIC_NOTIFY 0, texternalsym:$off, I32:$addr, I32:$count)>;
85
86// Select notifys with just a constant offset.
87def NotifyPatOffsetOnly :
88 Pat<(i32 (int_wasm_atomic_notify imm:$off, I32:$count)),
89 (ATOMIC_NOTIFY 0, imm:$off, (CONST_I32 0), I32:$count)>;
90
91def NotifyPatGlobalAddrOffOnly :
92 Pat<(i32 (int_wasm_atomic_notify (WebAssemblywrapper tglobaladdr:$off),
93 I32:$count)),
94 (ATOMIC_NOTIFY 0, tglobaladdr:$off, (CONST_I32 0), I32:$count)>;
95
96def NotifyPatExternSymOffOnly :
97 Pat<(i32 (int_wasm_atomic_notify (WebAssemblywrapper texternalsym:$off),
98 I32:$count)),
99 (ATOMIC_NOTIFY 0, texternalsym:$off, (CONST_I32 0), I32:$count)>;
100
101// Select waits with no constant offset.
102class WaitPatNoOffset<ValueType ty, Intrinsic kind, NI inst> :
103 Pat<(i32 (kind I32:$addr, ty:$exp, I64:$timeout)),
104 (inst 0, 0, I32:$addr, ty:$exp, I64:$timeout)>;
105def : WaitPatNoOffset<i32, int_wasm_atomic_wait_i32, ATOMIC_WAIT_I32>;
106def : WaitPatNoOffset<i64, int_wasm_atomic_wait_i64, ATOMIC_WAIT_I64>;
107
108// Select waits with a constant offset.
109
110// Pattern with address + immediate offset
111class WaitPatImmOff<ValueType ty, Intrinsic kind, PatFrag operand, NI inst> :
112 Pat<(i32 (kind (operand I32:$addr, imm:$off), ty:$exp, I64:$timeout)),
113 (inst 0, imm:$off, I32:$addr, ty:$exp, I64:$timeout)>;
114def : WaitPatImmOff<i32, int_wasm_atomic_wait_i32, regPlusImm, ATOMIC_WAIT_I32>;
115def : WaitPatImmOff<i32, int_wasm_atomic_wait_i32, or_is_add, ATOMIC_WAIT_I32>;
116def : WaitPatImmOff<i64, int_wasm_atomic_wait_i64, regPlusImm, ATOMIC_WAIT_I64>;
117def : WaitPatImmOff<i64, int_wasm_atomic_wait_i64, or_is_add, ATOMIC_WAIT_I64>;
118
119class WaitPatGlobalAddr<ValueType ty, Intrinsic kind, NI inst> :
120 Pat<(i32 (kind (regPlusGA I32:$addr, (WebAssemblywrapper tglobaladdr:$off)),
121 ty:$exp, I64:$timeout)),
122 (inst 0, tglobaladdr:$off, I32:$addr, ty:$exp, I64:$timeout)>;
123def : WaitPatGlobalAddr<i32, int_wasm_atomic_wait_i32, ATOMIC_WAIT_I32>;
124def : WaitPatGlobalAddr<i64, int_wasm_atomic_wait_i64, ATOMIC_WAIT_I64>;
125
126class WaitPatExternalSym<ValueType ty, Intrinsic kind, NI inst> :
127 Pat<(i32 (kind (add I32:$addr, (WebAssemblywrapper texternalsym:$off)),
128 ty:$exp, I64:$timeout)),
129 (inst 0, texternalsym:$off, I32:$addr, ty:$exp, I64:$timeout)>;
130def : WaitPatExternalSym<i32, int_wasm_atomic_wait_i32, ATOMIC_WAIT_I32>;
131def : WaitPatExternalSym<i64, int_wasm_atomic_wait_i64, ATOMIC_WAIT_I64>;
132
133// Select wait_i32, ATOMIC_WAIT_I32s with just a constant offset.
134class WaitPatOffsetOnly<ValueType ty, Intrinsic kind, NI inst> :
135 Pat<(i32 (kind imm:$off, ty:$exp, I64:$timeout)),
136 (inst 0, imm:$off, (CONST_I32 0), ty:$exp, I64:$timeout)>;
137def : WaitPatOffsetOnly<i32, int_wasm_atomic_wait_i32, ATOMIC_WAIT_I32>;
138def : WaitPatOffsetOnly<i64, int_wasm_atomic_wait_i64, ATOMIC_WAIT_I64>;
139
140class WaitPatGlobalAddrOffOnly<ValueType ty, Intrinsic kind, NI inst> :
141 Pat<(i32 (kind (WebAssemblywrapper tglobaladdr:$off), ty:$exp, I64:$timeout)),
142 (inst 0, tglobaladdr:$off, (CONST_I32 0), ty:$exp, I64:$timeout)>;
143def : WaitPatGlobalAddrOffOnly<i32, int_wasm_atomic_wait_i32, ATOMIC_WAIT_I32>;
144def : WaitPatGlobalAddrOffOnly<i64, int_wasm_atomic_wait_i64, ATOMIC_WAIT_I64>;
145
146class WaitPatExternSymOffOnly<ValueType ty, Intrinsic kind, NI inst> :
147 Pat<(i32 (kind (WebAssemblywrapper texternalsym:$off), ty:$exp,
148 I64:$timeout)),
149 (inst 0, texternalsym:$off, (CONST_I32 0), ty:$exp, I64:$timeout)>;
150def : WaitPatExternSymOffOnly<i32, int_wasm_atomic_wait_i32, ATOMIC_WAIT_I32>;
151def : WaitPatExternSymOffOnly<i64, int_wasm_atomic_wait_i64, ATOMIC_WAIT_I64>;
152} // Predicates = [HasAtomics]
153
Dan Gohman10e730a2015-06-29 23:51:55 +0000154//===----------------------------------------------------------------------===//
155// Atomic loads
156//===----------------------------------------------------------------------===//
157
Heejin Ahn20ea1822019-02-20 01:29:34 +0000158multiclass AtomicLoad<WebAssemblyRegClass rc, string name, int atomic_op> {
159 defm "" : WebAssemblyLoad<rc, name, !or(0xfe00, !and(0xff, atomic_op))>,
Thomas Lively914f0f22018-08-23 00:36:43 +0000160 Requires<[HasAtomics]>;
161}
162
Heejin Ahn20ea1822019-02-20 01:29:34 +0000163defm ATOMIC_LOAD_I32 : AtomicLoad<I32, "i32.atomic.load", 0x10>;
164defm ATOMIC_LOAD_I64 : AtomicLoad<I64, "i64.atomic.load", 0x11>;
Derek Schuff18ba1922017-08-30 18:07:45 +0000165
166// Select loads with no constant offset.
167let Predicates = [HasAtomics] in {
Derek Schuff885dc592017-10-05 21:18:42 +0000168def : LoadPatNoOffset<i32, atomic_load_32, ATOMIC_LOAD_I32>;
169def : LoadPatNoOffset<i64, atomic_load_64, ATOMIC_LOAD_I64>;
Derek Schuff0f3bc0f2017-08-31 21:51:48 +0000170
Derek Schuff885dc592017-10-05 21:18:42 +0000171// Select loads with a constant offset.
172
173// Pattern with address + immediate offset
174def : LoadPatImmOff<i32, atomic_load_32, regPlusImm, ATOMIC_LOAD_I32>;
175def : LoadPatImmOff<i64, atomic_load_64, regPlusImm, ATOMIC_LOAD_I64>;
176def : LoadPatImmOff<i32, atomic_load_32, or_is_add, ATOMIC_LOAD_I32>;
177def : LoadPatImmOff<i64, atomic_load_64, or_is_add, ATOMIC_LOAD_I64>;
178
179def : LoadPatGlobalAddr<i32, atomic_load_32, ATOMIC_LOAD_I32>;
180def : LoadPatGlobalAddr<i64, atomic_load_64, ATOMIC_LOAD_I64>;
181
182def : LoadPatExternalSym<i32, atomic_load_32, ATOMIC_LOAD_I32>;
183def : LoadPatExternalSym<i64, atomic_load_64, ATOMIC_LOAD_I64>;
184
Derek Schuff885dc592017-10-05 21:18:42 +0000185// Select loads with just a constant offset.
186def : LoadPatOffsetOnly<i32, atomic_load_32, ATOMIC_LOAD_I32>;
187def : LoadPatOffsetOnly<i64, atomic_load_64, ATOMIC_LOAD_I64>;
188
189def : LoadPatGlobalAddrOffOnly<i32, atomic_load_32, ATOMIC_LOAD_I32>;
190def : LoadPatGlobalAddrOffOnly<i64, atomic_load_64, ATOMIC_LOAD_I64>;
191
192def : LoadPatExternSymOffOnly<i32, atomic_load_32, ATOMIC_LOAD_I32>;
193def : LoadPatExternSymOffOnly<i64, atomic_load_64, ATOMIC_LOAD_I64>;
194
195} // Predicates = [HasAtomics]
196
197// Extending loads. Note that there are only zero-extending atomic loads, no
198// sign-extending loads.
Heejin Ahn20ea1822019-02-20 01:29:34 +0000199defm ATOMIC_LOAD8_U_I32 : AtomicLoad<I32, "i32.atomic.load8_u", 0x12>;
200defm ATOMIC_LOAD16_U_I32 : AtomicLoad<I32, "i32.atomic.load16_u", 0x13>;
201defm ATOMIC_LOAD8_U_I64 : AtomicLoad<I64, "i64.atomic.load8_u", 0x14>;
202defm ATOMIC_LOAD16_U_I64 : AtomicLoad<I64, "i64.atomic.load16_u", 0x15>;
203defm ATOMIC_LOAD32_U_I64 : AtomicLoad<I64, "i64.atomic.load32_u", 0x16>;
Derek Schuff885dc592017-10-05 21:18:42 +0000204
Heejin Ahnd31bc982018-07-09 20:18:21 +0000205// Fragments for extending loads. These are different from regular loads because
Derek Schuff885dc592017-10-05 21:18:42 +0000206// the SDNodes are derived from AtomicSDNode rather than LoadSDNode and
207// therefore don't have the extension type field. So instead of matching that,
208// we match the patterns that the type legalizer expands them to.
209
210// We directly match zext patterns and select the zext atomic loads.
211// i32 (zext (i8 (atomic_load_8))) gets legalized to
212// i32 (and (i32 (atomic_load_8)), 255)
213// These can be selected to a single zero-extending atomic load instruction.
Heejin Ahnd31bc982018-07-09 20:18:21 +0000214def zext_aload_8_32 :
215 PatFrag<(ops node:$addr), (and (i32 (atomic_load_8 node:$addr)), 255)>;
216def zext_aload_16_32 :
217 PatFrag<(ops node:$addr), (and (i32 (atomic_load_16 node:$addr)), 65535)>;
Derek Schuff885dc592017-10-05 21:18:42 +0000218// Unlike regular loads, extension to i64 is handled differently than i32.
219// i64 (zext (i8 (atomic_load_8))) gets legalized to
220// i64 (and (i64 (anyext (i32 (atomic_load_8)))), 255)
221def zext_aload_8_64 :
222 PatFrag<(ops node:$addr),
223 (and (i64 (anyext (i32 (atomic_load_8 node:$addr)))), 255)>;
224def zext_aload_16_64 :
225 PatFrag<(ops node:$addr),
226 (and (i64 (anyext (i32 (atomic_load_16 node:$addr)))), 65535)>;
227def zext_aload_32_64 :
228 PatFrag<(ops node:$addr),
229 (zext (i32 (atomic_load node:$addr)))>;
230
231// We don't have single sext atomic load instructions. So for sext loads, we
232// match bare subword loads (for 32-bit results) and anyext loads (for 64-bit
233// results) and select a zext load; the next instruction will be sext_inreg
234// which is selected by itself.
Heejin Ahnd31bc982018-07-09 20:18:21 +0000235def sext_aload_8_64 :
Derek Schuff885dc592017-10-05 21:18:42 +0000236 PatFrag<(ops node:$addr), (anyext (i32 (atomic_load_8 node:$addr)))>;
Heejin Ahnd31bc982018-07-09 20:18:21 +0000237def sext_aload_16_64 :
Derek Schuff885dc592017-10-05 21:18:42 +0000238 PatFrag<(ops node:$addr), (anyext (i32 (atomic_load_16 node:$addr)))>;
239
240let Predicates = [HasAtomics] in {
241// Select zero-extending loads with no constant offset.
Heejin Ahnd31bc982018-07-09 20:18:21 +0000242def : LoadPatNoOffset<i32, zext_aload_8_32, ATOMIC_LOAD8_U_I32>;
243def : LoadPatNoOffset<i32, zext_aload_16_32, ATOMIC_LOAD16_U_I32>;
Derek Schuff885dc592017-10-05 21:18:42 +0000244def : LoadPatNoOffset<i64, zext_aload_8_64, ATOMIC_LOAD8_U_I64>;
245def : LoadPatNoOffset<i64, zext_aload_16_64, ATOMIC_LOAD16_U_I64>;
246def : LoadPatNoOffset<i64, zext_aload_32_64, ATOMIC_LOAD32_U_I64>;
247
248// Select sign-extending loads with no constant offset
249def : LoadPatNoOffset<i32, atomic_load_8, ATOMIC_LOAD8_U_I32>;
250def : LoadPatNoOffset<i32, atomic_load_16, ATOMIC_LOAD16_U_I32>;
Heejin Ahnd31bc982018-07-09 20:18:21 +0000251def : LoadPatNoOffset<i64, sext_aload_8_64, ATOMIC_LOAD8_U_I64>;
252def : LoadPatNoOffset<i64, sext_aload_16_64, ATOMIC_LOAD16_U_I64>;
Thomas Lively6a87dda2019-01-08 06:25:55 +0000253// 32->64 sext load gets selected as i32.atomic.load, i64.extend_i32_s
Derek Schuff885dc592017-10-05 21:18:42 +0000254
255// Zero-extending loads with constant offset
Heejin Ahnd31bc982018-07-09 20:18:21 +0000256def : LoadPatImmOff<i32, zext_aload_8_32, regPlusImm, ATOMIC_LOAD8_U_I32>;
257def : LoadPatImmOff<i32, zext_aload_16_32, regPlusImm, ATOMIC_LOAD16_U_I32>;
258def : LoadPatImmOff<i32, zext_aload_8_32, or_is_add, ATOMIC_LOAD8_U_I32>;
259def : LoadPatImmOff<i32, zext_aload_16_32, or_is_add, ATOMIC_LOAD16_U_I32>;
Derek Schuff885dc592017-10-05 21:18:42 +0000260def : LoadPatImmOff<i64, zext_aload_8_64, regPlusImm, ATOMIC_LOAD8_U_I64>;
261def : LoadPatImmOff<i64, zext_aload_16_64, regPlusImm, ATOMIC_LOAD16_U_I64>;
262def : LoadPatImmOff<i64, zext_aload_32_64, regPlusImm, ATOMIC_LOAD32_U_I64>;
263def : LoadPatImmOff<i64, zext_aload_8_64, or_is_add, ATOMIC_LOAD8_U_I64>;
264def : LoadPatImmOff<i64, zext_aload_16_64, or_is_add, ATOMIC_LOAD16_U_I64>;
265def : LoadPatImmOff<i64, zext_aload_32_64, or_is_add, ATOMIC_LOAD32_U_I64>;
266
267// Sign-extending loads with constant offset
268def : LoadPatImmOff<i32, atomic_load_8, regPlusImm, ATOMIC_LOAD8_U_I32>;
269def : LoadPatImmOff<i32, atomic_load_16, regPlusImm, ATOMIC_LOAD16_U_I32>;
270def : LoadPatImmOff<i32, atomic_load_8, or_is_add, ATOMIC_LOAD8_U_I32>;
271def : LoadPatImmOff<i32, atomic_load_16, or_is_add, ATOMIC_LOAD16_U_I32>;
Heejin Ahnd31bc982018-07-09 20:18:21 +0000272def : LoadPatImmOff<i64, sext_aload_8_64, regPlusImm, ATOMIC_LOAD8_U_I64>;
273def : LoadPatImmOff<i64, sext_aload_16_64, regPlusImm, ATOMIC_LOAD16_U_I64>;
274def : LoadPatImmOff<i64, sext_aload_8_64, or_is_add, ATOMIC_LOAD8_U_I64>;
275def : LoadPatImmOff<i64, sext_aload_16_64, or_is_add, ATOMIC_LOAD16_U_I64>;
Derek Schuff885dc592017-10-05 21:18:42 +0000276// No 32->64 patterns, just use i32.atomic.load and i64.extend_s/i64
277
Heejin Ahnd31bc982018-07-09 20:18:21 +0000278def : LoadPatGlobalAddr<i32, zext_aload_8_32, ATOMIC_LOAD8_U_I32>;
279def : LoadPatGlobalAddr<i32, zext_aload_16_32, ATOMIC_LOAD16_U_I32>;
Derek Schuff885dc592017-10-05 21:18:42 +0000280def : LoadPatGlobalAddr<i64, zext_aload_8_64, ATOMIC_LOAD8_U_I64>;
281def : LoadPatGlobalAddr<i64, zext_aload_16_64, ATOMIC_LOAD16_U_I64>;
282def : LoadPatGlobalAddr<i64, zext_aload_32_64, ATOMIC_LOAD32_U_I64>;
283def : LoadPatGlobalAddr<i32, atomic_load_8, ATOMIC_LOAD8_U_I32>;
284def : LoadPatGlobalAddr<i32, atomic_load_16, ATOMIC_LOAD16_U_I32>;
Heejin Ahnd31bc982018-07-09 20:18:21 +0000285def : LoadPatGlobalAddr<i64, sext_aload_8_64, ATOMIC_LOAD8_U_I64>;
286def : LoadPatGlobalAddr<i64, sext_aload_16_64, ATOMIC_LOAD16_U_I64>;
Derek Schuff885dc592017-10-05 21:18:42 +0000287
Heejin Ahnd31bc982018-07-09 20:18:21 +0000288def : LoadPatExternalSym<i32, zext_aload_8_32, ATOMIC_LOAD8_U_I32>;
289def : LoadPatExternalSym<i32, zext_aload_16_32, ATOMIC_LOAD16_U_I32>;
Derek Schuff885dc592017-10-05 21:18:42 +0000290def : LoadPatExternalSym<i64, zext_aload_8_64, ATOMIC_LOAD8_U_I64>;
291def : LoadPatExternalSym<i64, zext_aload_16_64, ATOMIC_LOAD16_U_I64>;
292def : LoadPatExternalSym<i64, zext_aload_32_64, ATOMIC_LOAD32_U_I64>;
293def : LoadPatExternalSym<i32, atomic_load_8, ATOMIC_LOAD8_U_I32>;
294def : LoadPatExternalSym<i32, atomic_load_16, ATOMIC_LOAD16_U_I32>;
Heejin Ahnd31bc982018-07-09 20:18:21 +0000295def : LoadPatExternalSym<i64, sext_aload_8_64, ATOMIC_LOAD8_U_I64>;
296def : LoadPatExternalSym<i64, sext_aload_16_64, ATOMIC_LOAD16_U_I64>;
Derek Schuff885dc592017-10-05 21:18:42 +0000297
298// Extending loads with just a constant offset
Heejin Ahnd31bc982018-07-09 20:18:21 +0000299def : LoadPatOffsetOnly<i32, zext_aload_8_32, ATOMIC_LOAD8_U_I32>;
300def : LoadPatOffsetOnly<i32, zext_aload_16_32, ATOMIC_LOAD16_U_I32>;
Derek Schuff885dc592017-10-05 21:18:42 +0000301def : LoadPatOffsetOnly<i64, zext_aload_8_64, ATOMIC_LOAD8_U_I64>;
302def : LoadPatOffsetOnly<i64, zext_aload_16_64, ATOMIC_LOAD16_U_I64>;
303def : LoadPatOffsetOnly<i64, zext_aload_32_64, ATOMIC_LOAD32_U_I64>;
304def : LoadPatOffsetOnly<i32, atomic_load_8, ATOMIC_LOAD8_U_I32>;
305def : LoadPatOffsetOnly<i32, atomic_load_16, ATOMIC_LOAD16_U_I32>;
Heejin Ahnd31bc982018-07-09 20:18:21 +0000306def : LoadPatOffsetOnly<i64, sext_aload_8_64, ATOMIC_LOAD8_U_I64>;
307def : LoadPatOffsetOnly<i64, sext_aload_16_64, ATOMIC_LOAD16_U_I64>;
Derek Schuff885dc592017-10-05 21:18:42 +0000308
Heejin Ahnd31bc982018-07-09 20:18:21 +0000309def : LoadPatGlobalAddrOffOnly<i32, zext_aload_8_32, ATOMIC_LOAD8_U_I32>;
310def : LoadPatGlobalAddrOffOnly<i32, zext_aload_16_32, ATOMIC_LOAD16_U_I32>;
Derek Schuff885dc592017-10-05 21:18:42 +0000311def : LoadPatGlobalAddrOffOnly<i64, zext_aload_8_64, ATOMIC_LOAD8_U_I64>;
312def : LoadPatGlobalAddrOffOnly<i64, zext_aload_16_64, ATOMIC_LOAD16_U_I64>;
313def : LoadPatGlobalAddrOffOnly<i64, zext_aload_32_64, ATOMIC_LOAD32_U_I64>;
314def : LoadPatGlobalAddrOffOnly<i32, atomic_load_8, ATOMIC_LOAD8_U_I32>;
315def : LoadPatGlobalAddrOffOnly<i32, atomic_load_16, ATOMIC_LOAD16_U_I32>;
Heejin Ahnd31bc982018-07-09 20:18:21 +0000316def : LoadPatGlobalAddrOffOnly<i64, sext_aload_8_64, ATOMIC_LOAD8_U_I64>;
317def : LoadPatGlobalAddrOffOnly<i64, sext_aload_16_64, ATOMIC_LOAD16_U_I64>;
Derek Schuff885dc592017-10-05 21:18:42 +0000318
Heejin Ahnd31bc982018-07-09 20:18:21 +0000319def : LoadPatExternSymOffOnly<i32, zext_aload_8_32, ATOMIC_LOAD8_U_I32>;
320def : LoadPatExternSymOffOnly<i32, zext_aload_16_32, ATOMIC_LOAD16_U_I32>;
Derek Schuff885dc592017-10-05 21:18:42 +0000321def : LoadPatExternSymOffOnly<i64, zext_aload_8_64, ATOMIC_LOAD8_U_I64>;
322def : LoadPatExternSymOffOnly<i64, zext_aload_16_64, ATOMIC_LOAD16_U_I64>;
323def : LoadPatExternSymOffOnly<i64, zext_aload_32_64, ATOMIC_LOAD32_U_I64>;
324def : LoadPatExternSymOffOnly<i32, atomic_load_8, ATOMIC_LOAD8_U_I32>;
325def : LoadPatExternSymOffOnly<i32, atomic_load_16, ATOMIC_LOAD16_U_I32>;
Heejin Ahnd31bc982018-07-09 20:18:21 +0000326def : LoadPatExternSymOffOnly<i64, sext_aload_8_64, ATOMIC_LOAD8_U_I64>;
327def : LoadPatExternSymOffOnly<i64, sext_aload_16_64, ATOMIC_LOAD16_U_I64>;
Derek Schuff885dc592017-10-05 21:18:42 +0000328
329} // Predicates = [HasAtomics]
Dan Gohman10e730a2015-06-29 23:51:55 +0000330
331//===----------------------------------------------------------------------===//
332// Atomic stores
333//===----------------------------------------------------------------------===//
334
Heejin Ahn20ea1822019-02-20 01:29:34 +0000335multiclass AtomicStore<WebAssemblyRegClass rc, string name, int atomic_op> {
336 defm "" : WebAssemblyStore<rc, name, !or(0xfe00, !and(0xff, atomic_op))>,
337 Requires<[HasAtomics]>;
338}
339
340defm ATOMIC_STORE_I32 : AtomicStore<I32, "i32.atomic.store", 0x17>;
341defm ATOMIC_STORE_I64 : AtomicStore<I64, "i64.atomic.store", 0x18>;
Heejin Ahn402b4902018-07-02 21:22:59 +0000342
343// We need an 'atomic' version of store patterns because store and atomic_store
344// nodes have different operand orders:
345// store: (store $val, $ptr)
346// atomic_store: (store $ptr, $val)
347
348let Predicates = [HasAtomics] in {
349
350// Select stores with no constant offset.
Heejin Ahnd31bc982018-07-09 20:18:21 +0000351class AStorePatNoOffset<ValueType ty, PatFrag kind, NI inst> :
352 Pat<(kind I32:$addr, ty:$val), (inst 0, 0, I32:$addr, ty:$val)>;
Heejin Ahn402b4902018-07-02 21:22:59 +0000353def : AStorePatNoOffset<i32, atomic_store_32, ATOMIC_STORE_I32>;
354def : AStorePatNoOffset<i64, atomic_store_64, ATOMIC_STORE_I64>;
355
356// Select stores with a constant offset.
357
358// Pattern with address + immediate offset
Heejin Ahnd31bc982018-07-09 20:18:21 +0000359class AStorePatImmOff<ValueType ty, PatFrag kind, PatFrag operand, NI inst> :
360 Pat<(kind (operand I32:$addr, imm:$off), ty:$val),
361 (inst 0, imm:$off, I32:$addr, ty:$val)>;
Heejin Ahn402b4902018-07-02 21:22:59 +0000362def : AStorePatImmOff<i32, atomic_store_32, regPlusImm, ATOMIC_STORE_I32>;
363def : AStorePatImmOff<i64, atomic_store_64, regPlusImm, ATOMIC_STORE_I64>;
364def : AStorePatImmOff<i32, atomic_store_32, or_is_add, ATOMIC_STORE_I32>;
365def : AStorePatImmOff<i64, atomic_store_64, or_is_add, ATOMIC_STORE_I64>;
366
Heejin Ahnd31bc982018-07-09 20:18:21 +0000367class AStorePatGlobalAddr<ValueType ty, PatFrag kind, NI inst> :
368 Pat<(kind (regPlusGA I32:$addr, (WebAssemblywrapper tglobaladdr:$off)),
369 ty:$val),
Heejin Ahn402b4902018-07-02 21:22:59 +0000370 (inst 0, tglobaladdr:$off, I32:$addr, ty:$val)>;
371def : AStorePatGlobalAddr<i32, atomic_store_32, ATOMIC_STORE_I32>;
372def : AStorePatGlobalAddr<i64, atomic_store_64, ATOMIC_STORE_I64>;
373
Heejin Ahnd31bc982018-07-09 20:18:21 +0000374class AStorePatExternalSym<ValueType ty, PatFrag kind, NI inst> :
375 Pat<(kind (add I32:$addr, (WebAssemblywrapper texternalsym:$off)), ty:$val),
Heejin Ahn402b4902018-07-02 21:22:59 +0000376 (inst 0, texternalsym:$off, I32:$addr, ty:$val)>;
377def : AStorePatExternalSym<i32, atomic_store_32, ATOMIC_STORE_I32>;
378def : AStorePatExternalSym<i64, atomic_store_64, ATOMIC_STORE_I64>;
379
380// Select stores with just a constant offset.
Heejin Ahnd31bc982018-07-09 20:18:21 +0000381class AStorePatOffsetOnly<ValueType ty, PatFrag kind, NI inst> :
382 Pat<(kind imm:$off, ty:$val), (inst 0, imm:$off, (CONST_I32 0), ty:$val)>;
Heejin Ahn402b4902018-07-02 21:22:59 +0000383def : AStorePatOffsetOnly<i32, atomic_store_32, ATOMIC_STORE_I32>;
384def : AStorePatOffsetOnly<i64, atomic_store_64, ATOMIC_STORE_I64>;
385
Heejin Ahnd31bc982018-07-09 20:18:21 +0000386class AStorePatGlobalAddrOffOnly<ValueType ty, PatFrag kind, NI inst> :
387 Pat<(kind (WebAssemblywrapper tglobaladdr:$off), ty:$val),
Heejin Ahn402b4902018-07-02 21:22:59 +0000388 (inst 0, tglobaladdr:$off, (CONST_I32 0), ty:$val)>;
389def : AStorePatGlobalAddrOffOnly<i32, atomic_store_32, ATOMIC_STORE_I32>;
390def : AStorePatGlobalAddrOffOnly<i64, atomic_store_64, ATOMIC_STORE_I64>;
391
Heejin Ahnd31bc982018-07-09 20:18:21 +0000392class AStorePatExternSymOffOnly<ValueType ty, PatFrag kind, NI inst> :
393 Pat<(kind (WebAssemblywrapper texternalsym:$off), ty:$val),
Heejin Ahn402b4902018-07-02 21:22:59 +0000394 (inst 0, texternalsym:$off, (CONST_I32 0), ty:$val)>;
395def : AStorePatExternSymOffOnly<i32, atomic_store_32, ATOMIC_STORE_I32>;
396def : AStorePatExternSymOffOnly<i64, atomic_store_64, ATOMIC_STORE_I64>;
397
398} // Predicates = [HasAtomics]
399
400// Truncating stores.
Heejin Ahn20ea1822019-02-20 01:29:34 +0000401defm ATOMIC_STORE8_I32 : AtomicStore<I32, "i32.atomic.store8", 0x19>;
402defm ATOMIC_STORE16_I32 : AtomicStore<I32, "i32.atomic.store16", 0x1a>;
403defm ATOMIC_STORE8_I64 : AtomicStore<I64, "i64.atomic.store8", 0x1b>;
404defm ATOMIC_STORE16_I64 : AtomicStore<I64, "i64.atomic.store16", 0x1c>;
405defm ATOMIC_STORE32_I64 : AtomicStore<I64, "i64.atomic.store32", 0x1d>;
Heejin Ahn402b4902018-07-02 21:22:59 +0000406
407// Fragments for truncating stores.
408
409// We don't have single truncating atomic store instructions. For 32-bit
410// instructions, we just need to match bare atomic stores. On the other hand,
411// truncating stores from i64 values are once truncated to i32 first.
Heejin Ahnd31bc982018-07-09 20:18:21 +0000412class trunc_astore_64<PatFrag kind> :
Heejin Ahn402b4902018-07-02 21:22:59 +0000413 PatFrag<(ops node:$addr, node:$val),
Heejin Ahnd31bc982018-07-09 20:18:21 +0000414 (kind node:$addr, (i32 (trunc (i64 node:$val))))>;
Heejin Ahn402b4902018-07-02 21:22:59 +0000415def trunc_astore_8_64 : trunc_astore_64<atomic_store_8>;
416def trunc_astore_16_64 : trunc_astore_64<atomic_store_16>;
417def trunc_astore_32_64 : trunc_astore_64<atomic_store_32>;
418
419let Predicates = [HasAtomics] in {
420
421// Truncating stores with no constant offset
422def : AStorePatNoOffset<i32, atomic_store_8, ATOMIC_STORE8_I32>;
423def : AStorePatNoOffset<i32, atomic_store_16, ATOMIC_STORE16_I32>;
424def : AStorePatNoOffset<i64, trunc_astore_8_64, ATOMIC_STORE8_I64>;
425def : AStorePatNoOffset<i64, trunc_astore_16_64, ATOMIC_STORE16_I64>;
426def : AStorePatNoOffset<i64, trunc_astore_32_64, ATOMIC_STORE32_I64>;
427
428// Truncating stores with a constant offset
429def : AStorePatImmOff<i32, atomic_store_8, regPlusImm, ATOMIC_STORE8_I32>;
430def : AStorePatImmOff<i32, atomic_store_16, regPlusImm, ATOMIC_STORE16_I32>;
431def : AStorePatImmOff<i64, trunc_astore_8_64, regPlusImm, ATOMIC_STORE8_I64>;
432def : AStorePatImmOff<i64, trunc_astore_16_64, regPlusImm, ATOMIC_STORE16_I64>;
433def : AStorePatImmOff<i64, trunc_astore_32_64, regPlusImm, ATOMIC_STORE32_I64>;
434def : AStorePatImmOff<i32, atomic_store_8, or_is_add, ATOMIC_STORE8_I32>;
435def : AStorePatImmOff<i32, atomic_store_16, or_is_add, ATOMIC_STORE16_I32>;
436def : AStorePatImmOff<i64, trunc_astore_8_64, or_is_add, ATOMIC_STORE8_I64>;
437def : AStorePatImmOff<i64, trunc_astore_16_64, or_is_add, ATOMIC_STORE16_I64>;
438def : AStorePatImmOff<i64, trunc_astore_32_64, or_is_add, ATOMIC_STORE32_I64>;
439
440def : AStorePatGlobalAddr<i32, atomic_store_8, ATOMIC_STORE8_I32>;
441def : AStorePatGlobalAddr<i32, atomic_store_16, ATOMIC_STORE16_I32>;
442def : AStorePatGlobalAddr<i64, trunc_astore_8_64, ATOMIC_STORE8_I64>;
443def : AStorePatGlobalAddr<i64, trunc_astore_16_64, ATOMIC_STORE16_I64>;
444def : AStorePatGlobalAddr<i64, trunc_astore_32_64, ATOMIC_STORE32_I64>;
445
446def : AStorePatExternalSym<i32, atomic_store_8, ATOMIC_STORE8_I32>;
447def : AStorePatExternalSym<i32, atomic_store_16, ATOMIC_STORE16_I32>;
448def : AStorePatExternalSym<i64, trunc_astore_8_64, ATOMIC_STORE8_I64>;
449def : AStorePatExternalSym<i64, trunc_astore_16_64, ATOMIC_STORE16_I64>;
450def : AStorePatExternalSym<i64, trunc_astore_32_64, ATOMIC_STORE32_I64>;
451
452// Truncating stores with just a constant offset
453def : AStorePatOffsetOnly<i32, atomic_store_8, ATOMIC_STORE8_I32>;
454def : AStorePatOffsetOnly<i32, atomic_store_16, ATOMIC_STORE16_I32>;
455def : AStorePatOffsetOnly<i64, trunc_astore_8_64, ATOMIC_STORE8_I64>;
456def : AStorePatOffsetOnly<i64, trunc_astore_16_64, ATOMIC_STORE16_I64>;
457def : AStorePatOffsetOnly<i64, trunc_astore_32_64, ATOMIC_STORE32_I64>;
458
459def : AStorePatGlobalAddrOffOnly<i32, atomic_store_8, ATOMIC_STORE8_I32>;
460def : AStorePatGlobalAddrOffOnly<i32, atomic_store_16, ATOMIC_STORE16_I32>;
461def : AStorePatGlobalAddrOffOnly<i64, trunc_astore_8_64, ATOMIC_STORE8_I64>;
462def : AStorePatGlobalAddrOffOnly<i64, trunc_astore_16_64, ATOMIC_STORE16_I64>;
463def : AStorePatGlobalAddrOffOnly<i64, trunc_astore_32_64, ATOMIC_STORE32_I64>;
464
465def : AStorePatExternSymOffOnly<i32, atomic_store_8, ATOMIC_STORE8_I32>;
466def : AStorePatExternSymOffOnly<i32, atomic_store_16, ATOMIC_STORE16_I32>;
467def : AStorePatExternSymOffOnly<i64, trunc_astore_8_64, ATOMIC_STORE8_I64>;
468def : AStorePatExternSymOffOnly<i64, trunc_astore_16_64, ATOMIC_STORE16_I64>;
469def : AStorePatExternSymOffOnly<i64, trunc_astore_32_64, ATOMIC_STORE32_I64>;
470
471} // Predicates = [HasAtomics]
Dan Gohman10e730a2015-06-29 23:51:55 +0000472
473//===----------------------------------------------------------------------===//
Heejin Ahnfed73822018-07-09 22:30:51 +0000474// Atomic binary read-modify-writes
Dan Gohman10e730a2015-06-29 23:51:55 +0000475//===----------------------------------------------------------------------===//
476
Heejin Ahn20ea1822019-02-20 01:29:34 +0000477multiclass WebAssemblyBinRMW<WebAssemblyRegClass rc, string name,
478 int atomic_op> {
479 defm "" :
480 ATOMIC_I<(outs rc:$dst),
481 (ins P2Align:$p2align, offset32_op:$off, I32:$addr, rc:$val),
482 (outs), (ins P2Align:$p2align, offset32_op:$off), [],
483 !strconcat(name, "\t$dst, ${off}(${addr})${p2align}, $val"),
484 !strconcat(name, "\t${off}${p2align}"), atomic_op>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000485}
Dan Gohman10e730a2015-06-29 23:51:55 +0000486
Heejin Ahn20ea1822019-02-20 01:29:34 +0000487defm ATOMIC_RMW_ADD_I32 : WebAssemblyBinRMW<I32, "i32.atomic.rmw.add", 0x1e>;
488defm ATOMIC_RMW_ADD_I64 : WebAssemblyBinRMW<I64, "i64.atomic.rmw.add", 0x1f>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000489defm ATOMIC_RMW8_U_ADD_I32 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000490 WebAssemblyBinRMW<I32, "i32.atomic.rmw8.add_u", 0x20>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000491defm ATOMIC_RMW16_U_ADD_I32 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000492 WebAssemblyBinRMW<I32, "i32.atomic.rmw16.add_u", 0x21>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000493defm ATOMIC_RMW8_U_ADD_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000494 WebAssemblyBinRMW<I64, "i64.atomic.rmw8.add_u", 0x22>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000495defm ATOMIC_RMW16_U_ADD_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000496 WebAssemblyBinRMW<I64, "i64.atomic.rmw16.add_u", 0x23>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000497defm ATOMIC_RMW32_U_ADD_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000498 WebAssemblyBinRMW<I64, "i64.atomic.rmw32.add_u", 0x24>;
Dan Gohman10e730a2015-06-29 23:51:55 +0000499
Heejin Ahn20ea1822019-02-20 01:29:34 +0000500defm ATOMIC_RMW_SUB_I32 : WebAssemblyBinRMW<I32, "i32.atomic.rmw.sub", 0x25>;
501defm ATOMIC_RMW_SUB_I64 : WebAssemblyBinRMW<I64, "i64.atomic.rmw.sub", 0x26>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000502defm ATOMIC_RMW8_U_SUB_I32 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000503 WebAssemblyBinRMW<I32, "i32.atomic.rmw8.sub_u", 0x27>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000504defm ATOMIC_RMW16_U_SUB_I32 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000505 WebAssemblyBinRMW<I32, "i32.atomic.rmw16.sub_u", 0x28>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000506defm ATOMIC_RMW8_U_SUB_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000507 WebAssemblyBinRMW<I64, "i64.atomic.rmw8.sub_u", 0x29>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000508defm ATOMIC_RMW16_U_SUB_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000509 WebAssemblyBinRMW<I64, "i64.atomic.rmw16.sub_u", 0x2a>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000510defm ATOMIC_RMW32_U_SUB_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000511 WebAssemblyBinRMW<I64, "i64.atomic.rmw32.sub_u", 0x2b>;
Dan Gohman10e730a2015-06-29 23:51:55 +0000512
Heejin Ahn20ea1822019-02-20 01:29:34 +0000513defm ATOMIC_RMW_AND_I32 : WebAssemblyBinRMW<I32, "i32.atomic.rmw.and", 0x2c>;
514defm ATOMIC_RMW_AND_I64 : WebAssemblyBinRMW<I64, "i64.atomic.rmw.and", 0x2d>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000515defm ATOMIC_RMW8_U_AND_I32 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000516 WebAssemblyBinRMW<I32, "i32.atomic.rmw8.and_u", 0x2e>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000517defm ATOMIC_RMW16_U_AND_I32 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000518 WebAssemblyBinRMW<I32, "i32.atomic.rmw16.and_u", 0x2f>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000519defm ATOMIC_RMW8_U_AND_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000520 WebAssemblyBinRMW<I64, "i64.atomic.rmw8.and_u", 0x30>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000521defm ATOMIC_RMW16_U_AND_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000522 WebAssemblyBinRMW<I64, "i64.atomic.rmw16.and_u", 0x31>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000523defm ATOMIC_RMW32_U_AND_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000524 WebAssemblyBinRMW<I64, "i64.atomic.rmw32.and_u", 0x32>;
Derek Schuff18ba1922017-08-30 18:07:45 +0000525
Heejin Ahn20ea1822019-02-20 01:29:34 +0000526defm ATOMIC_RMW_OR_I32 : WebAssemblyBinRMW<I32, "i32.atomic.rmw.or", 0x33>;
527defm ATOMIC_RMW_OR_I64 : WebAssemblyBinRMW<I64, "i64.atomic.rmw.or", 0x34>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000528defm ATOMIC_RMW8_U_OR_I32 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000529 WebAssemblyBinRMW<I32, "i32.atomic.rmw8.or_u", 0x35>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000530defm ATOMIC_RMW16_U_OR_I32 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000531 WebAssemblyBinRMW<I32, "i32.atomic.rmw16.or_u", 0x36>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000532defm ATOMIC_RMW8_U_OR_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000533 WebAssemblyBinRMW<I64, "i64.atomic.rmw8.or_u", 0x37>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000534defm ATOMIC_RMW16_U_OR_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000535 WebAssemblyBinRMW<I64, "i64.atomic.rmw16.or_u", 0x38>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000536defm ATOMIC_RMW32_U_OR_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000537 WebAssemblyBinRMW<I64, "i64.atomic.rmw32.or_u", 0x39>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000538
Heejin Ahn20ea1822019-02-20 01:29:34 +0000539defm ATOMIC_RMW_XOR_I32 : WebAssemblyBinRMW<I32, "i32.atomic.rmw.xor", 0x3a>;
540defm ATOMIC_RMW_XOR_I64 : WebAssemblyBinRMW<I64, "i64.atomic.rmw.xor", 0x3b>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000541defm ATOMIC_RMW8_U_XOR_I32 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000542 WebAssemblyBinRMW<I32, "i32.atomic.rmw8.xor_u", 0x3c>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000543defm ATOMIC_RMW16_U_XOR_I32 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000544 WebAssemblyBinRMW<I32, "i32.atomic.rmw16.xor_u", 0x3d>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000545defm ATOMIC_RMW8_U_XOR_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000546 WebAssemblyBinRMW<I64, "i64.atomic.rmw8.xor_u", 0x3e>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000547defm ATOMIC_RMW16_U_XOR_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000548 WebAssemblyBinRMW<I64, "i64.atomic.rmw16.xor_u", 0x3f>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000549defm ATOMIC_RMW32_U_XOR_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000550 WebAssemblyBinRMW<I64, "i64.atomic.rmw32.xor_u", 0x40>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000551
552defm ATOMIC_RMW_XCHG_I32 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000553 WebAssemblyBinRMW<I32, "i32.atomic.rmw.xchg", 0x41>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000554defm ATOMIC_RMW_XCHG_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000555 WebAssemblyBinRMW<I64, "i64.atomic.rmw.xchg", 0x42>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000556defm ATOMIC_RMW8_U_XCHG_I32 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000557 WebAssemblyBinRMW<I32, "i32.atomic.rmw8.xchg_u", 0x43>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000558defm ATOMIC_RMW16_U_XCHG_I32 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000559 WebAssemblyBinRMW<I32, "i32.atomic.rmw16.xchg_u", 0x44>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000560defm ATOMIC_RMW8_U_XCHG_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000561 WebAssemblyBinRMW<I64, "i64.atomic.rmw8.xchg_u", 0x45>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000562defm ATOMIC_RMW16_U_XCHG_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000563 WebAssemblyBinRMW<I64, "i64.atomic.rmw16.xchg_u", 0x46>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000564defm ATOMIC_RMW32_U_XCHG_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000565 WebAssemblyBinRMW<I64, "i64.atomic.rmw32.xchg_u", 0x47>;
Heejin Ahnfed73822018-07-09 22:30:51 +0000566
567// Select binary RMWs with no constant offset.
568class BinRMWPatNoOffset<ValueType ty, PatFrag kind, NI inst> :
569 Pat<(ty (kind I32:$addr, ty:$val)), (inst 0, 0, I32:$addr, ty:$val)>;
570
571// Select binary RMWs with a constant offset.
572
573// Pattern with address + immediate offset
574class BinRMWPatImmOff<ValueType ty, PatFrag kind, PatFrag operand, NI inst> :
575 Pat<(ty (kind (operand I32:$addr, imm:$off), ty:$val)),
576 (inst 0, imm:$off, I32:$addr, ty:$val)>;
577
578class BinRMWPatGlobalAddr<ValueType ty, PatFrag kind, NI inst> :
579 Pat<(ty (kind (regPlusGA I32:$addr, (WebAssemblywrapper tglobaladdr:$off)),
580 ty:$val)),
581 (inst 0, tglobaladdr:$off, I32:$addr, ty:$val)>;
582
583class BinRMWPatExternalSym<ValueType ty, PatFrag kind, NI inst> :
584 Pat<(ty (kind (add I32:$addr, (WebAssemblywrapper texternalsym:$off)),
585 ty:$val)),
586 (inst 0, texternalsym:$off, I32:$addr, ty:$val)>;
587
588// Select binary RMWs with just a constant offset.
589class BinRMWPatOffsetOnly<ValueType ty, PatFrag kind, NI inst> :
590 Pat<(ty (kind imm:$off, ty:$val)),
591 (inst 0, imm:$off, (CONST_I32 0), ty:$val)>;
592
593class BinRMWPatGlobalAddrOffOnly<ValueType ty, PatFrag kind, NI inst> :
594 Pat<(ty (kind (WebAssemblywrapper tglobaladdr:$off), ty:$val)),
595 (inst 0, tglobaladdr:$off, (CONST_I32 0), ty:$val)>;
596
597class BinRMWPatExternSymOffOnly<ValueType ty, PatFrag kind, NI inst> :
598 Pat<(ty (kind (WebAssemblywrapper texternalsym:$off), ty:$val)),
599 (inst 0, texternalsym:$off, (CONST_I32 0), ty:$val)>;
600
601// Patterns for various addressing modes.
602multiclass BinRMWPattern<PatFrag rmw_32, PatFrag rmw_64, NI inst_32,
603 NI inst_64> {
604 def : BinRMWPatNoOffset<i32, rmw_32, inst_32>;
605 def : BinRMWPatNoOffset<i64, rmw_64, inst_64>;
606
607 def : BinRMWPatImmOff<i32, rmw_32, regPlusImm, inst_32>;
608 def : BinRMWPatImmOff<i64, rmw_64, regPlusImm, inst_64>;
609 def : BinRMWPatImmOff<i32, rmw_32, or_is_add, inst_32>;
610 def : BinRMWPatImmOff<i64, rmw_64, or_is_add, inst_64>;
611
612 def : BinRMWPatGlobalAddr<i32, rmw_32, inst_32>;
613 def : BinRMWPatGlobalAddr<i64, rmw_64, inst_64>;
614
615 def : BinRMWPatExternalSym<i32, rmw_32, inst_32>;
616 def : BinRMWPatExternalSym<i64, rmw_64, inst_64>;
617
618 def : BinRMWPatOffsetOnly<i32, rmw_32, inst_32>;
619 def : BinRMWPatOffsetOnly<i64, rmw_64, inst_64>;
620
621 def : BinRMWPatGlobalAddrOffOnly<i32, rmw_32, inst_32>;
622 def : BinRMWPatGlobalAddrOffOnly<i64, rmw_64, inst_64>;
623
624 def : BinRMWPatExternSymOffOnly<i32, rmw_32, inst_32>;
625 def : BinRMWPatExternSymOffOnly<i64, rmw_64, inst_64>;
626}
627
628let Predicates = [HasAtomics] in {
629defm : BinRMWPattern<atomic_load_add_32, atomic_load_add_64, ATOMIC_RMW_ADD_I32,
630 ATOMIC_RMW_ADD_I64>;
631defm : BinRMWPattern<atomic_load_sub_32, atomic_load_sub_64, ATOMIC_RMW_SUB_I32,
632 ATOMIC_RMW_SUB_I64>;
633defm : BinRMWPattern<atomic_load_and_32, atomic_load_and_64, ATOMIC_RMW_AND_I32,
634 ATOMIC_RMW_AND_I64>;
635defm : BinRMWPattern<atomic_load_or_32, atomic_load_or_64, ATOMIC_RMW_OR_I32,
636 ATOMIC_RMW_OR_I64>;
637defm : BinRMWPattern<atomic_load_xor_32, atomic_load_xor_64, ATOMIC_RMW_XOR_I32,
638 ATOMIC_RMW_XOR_I64>;
639defm : BinRMWPattern<atomic_swap_32, atomic_swap_64, ATOMIC_RMW_XCHG_I32,
640 ATOMIC_RMW_XCHG_I64>;
641} // Predicates = [HasAtomics]
642
643// Truncating & zero-extending binary RMW patterns.
644// These are combined patterns of truncating store patterns and zero-extending
645// load patterns above.
646class zext_bin_rmw_8_32<PatFrag kind> :
647 PatFrag<(ops node:$addr, node:$val),
648 (and (i32 (kind node:$addr, node:$val)), 255)>;
649class zext_bin_rmw_16_32<PatFrag kind> :
650 PatFrag<(ops node:$addr, node:$val),
651 (and (i32 (kind node:$addr, node:$val)), 65535)>;
652class zext_bin_rmw_8_64<PatFrag kind> :
653 PatFrag<(ops node:$addr, node:$val),
654 (and (i64 (anyext (i32 (kind node:$addr,
655 (i32 (trunc (i64 node:$val))))))), 255)>;
656class zext_bin_rmw_16_64<PatFrag kind> :
657 PatFrag<(ops node:$addr, node:$val),
658 (and (i64 (anyext (i32 (kind node:$addr,
659 (i32 (trunc (i64 node:$val))))))), 65535)>;
660class zext_bin_rmw_32_64<PatFrag kind> :
661 PatFrag<(ops node:$addr, node:$val),
662 (zext (i32 (kind node:$addr, (i32 (trunc (i64 node:$val))))))>;
663
664// Truncating & sign-extending binary RMW patterns.
665// These are combined patterns of truncating store patterns and sign-extending
666// load patterns above. We match subword RMWs (for 32-bit) and anyext RMWs (for
667// 64-bit) and select a zext RMW; the next instruction will be sext_inreg which
668// is selected by itself.
669class sext_bin_rmw_8_32<PatFrag kind> :
670 PatFrag<(ops node:$addr, node:$val), (kind node:$addr, node:$val)>;
671class sext_bin_rmw_16_32<PatFrag kind> : sext_bin_rmw_8_32<kind>;
672class sext_bin_rmw_8_64<PatFrag kind> :
673 PatFrag<(ops node:$addr, node:$val),
674 (anyext (i32 (kind node:$addr, (i32 (trunc (i64 node:$val))))))>;
675class sext_bin_rmw_16_64<PatFrag kind> : sext_bin_rmw_8_64<kind>;
Thomas Lively6a87dda2019-01-08 06:25:55 +0000676// 32->64 sext RMW gets selected as i32.atomic.rmw.***, i64.extend_i32_s
Heejin Ahnfed73822018-07-09 22:30:51 +0000677
678// Patterns for various addressing modes for truncating-extending binary RMWs.
679multiclass BinRMWTruncExtPattern<
680 PatFrag rmw_8, PatFrag rmw_16, PatFrag rmw_32, PatFrag rmw_64,
681 NI inst8_32, NI inst16_32, NI inst8_64, NI inst16_64, NI inst32_64> {
682 // Truncating-extending binary RMWs with no constant offset
683 def : BinRMWPatNoOffset<i32, zext_bin_rmw_8_32<rmw_8>, inst8_32>;
684 def : BinRMWPatNoOffset<i32, zext_bin_rmw_16_32<rmw_16>, inst16_32>;
685 def : BinRMWPatNoOffset<i64, zext_bin_rmw_8_64<rmw_8>, inst8_64>;
686 def : BinRMWPatNoOffset<i64, zext_bin_rmw_16_64<rmw_16>, inst16_64>;
687 def : BinRMWPatNoOffset<i64, zext_bin_rmw_32_64<rmw_32>, inst32_64>;
688
689 def : BinRMWPatNoOffset<i32, sext_bin_rmw_8_32<rmw_8>, inst8_32>;
690 def : BinRMWPatNoOffset<i32, sext_bin_rmw_16_32<rmw_16>, inst16_32>;
691 def : BinRMWPatNoOffset<i64, sext_bin_rmw_8_64<rmw_8>, inst8_64>;
692 def : BinRMWPatNoOffset<i64, sext_bin_rmw_16_64<rmw_16>, inst16_64>;
693
694 // Truncating-extending binary RMWs with a constant offset
695 def : BinRMWPatImmOff<i32, zext_bin_rmw_8_32<rmw_8>, regPlusImm, inst8_32>;
696 def : BinRMWPatImmOff<i32, zext_bin_rmw_16_32<rmw_16>, regPlusImm, inst16_32>;
697 def : BinRMWPatImmOff<i64, zext_bin_rmw_8_64<rmw_8>, regPlusImm, inst8_64>;
698 def : BinRMWPatImmOff<i64, zext_bin_rmw_16_64<rmw_16>, regPlusImm, inst16_64>;
699 def : BinRMWPatImmOff<i64, zext_bin_rmw_32_64<rmw_32>, regPlusImm, inst32_64>;
700 def : BinRMWPatImmOff<i32, zext_bin_rmw_8_32<rmw_8>, or_is_add, inst8_32>;
701 def : BinRMWPatImmOff<i32, zext_bin_rmw_16_32<rmw_16>, or_is_add, inst16_32>;
702 def : BinRMWPatImmOff<i64, zext_bin_rmw_8_64<rmw_8>, or_is_add, inst8_64>;
703 def : BinRMWPatImmOff<i64, zext_bin_rmw_16_64<rmw_16>, or_is_add, inst16_64>;
704 def : BinRMWPatImmOff<i64, zext_bin_rmw_32_64<rmw_32>, or_is_add, inst32_64>;
705
706 def : BinRMWPatImmOff<i32, sext_bin_rmw_8_32<rmw_8>, regPlusImm, inst8_32>;
707 def : BinRMWPatImmOff<i32, sext_bin_rmw_16_32<rmw_16>, regPlusImm, inst16_32>;
708 def : BinRMWPatImmOff<i64, sext_bin_rmw_8_64<rmw_8>, regPlusImm, inst8_64>;
709 def : BinRMWPatImmOff<i64, sext_bin_rmw_16_64<rmw_16>, regPlusImm, inst16_64>;
710 def : BinRMWPatImmOff<i32, sext_bin_rmw_8_32<rmw_8>, or_is_add, inst8_32>;
711 def : BinRMWPatImmOff<i32, sext_bin_rmw_16_32<rmw_16>, or_is_add, inst16_32>;
712 def : BinRMWPatImmOff<i64, sext_bin_rmw_8_64<rmw_8>, or_is_add, inst8_64>;
713 def : BinRMWPatImmOff<i64, sext_bin_rmw_16_64<rmw_16>, or_is_add, inst16_64>;
714
715 def : BinRMWPatGlobalAddr<i32, zext_bin_rmw_8_32<rmw_8>, inst8_32>;
716 def : BinRMWPatGlobalAddr<i32, zext_bin_rmw_16_32<rmw_16>, inst16_32>;
717 def : BinRMWPatGlobalAddr<i64, zext_bin_rmw_8_64<rmw_8>, inst8_64>;
718 def : BinRMWPatGlobalAddr<i64, zext_bin_rmw_16_64<rmw_16>, inst16_64>;
719 def : BinRMWPatGlobalAddr<i64, zext_bin_rmw_32_64<rmw_32>, inst32_64>;
720
721 def : BinRMWPatGlobalAddr<i32, sext_bin_rmw_8_32<rmw_8>, inst8_32>;
722 def : BinRMWPatGlobalAddr<i32, sext_bin_rmw_16_32<rmw_16>, inst16_32>;
723 def : BinRMWPatGlobalAddr<i64, sext_bin_rmw_8_64<rmw_8>, inst8_64>;
724 def : BinRMWPatGlobalAddr<i64, sext_bin_rmw_16_64<rmw_16>, inst16_64>;
725
726 def : BinRMWPatExternalSym<i32, zext_bin_rmw_8_32<rmw_8>, inst8_32>;
727 def : BinRMWPatExternalSym<i32, zext_bin_rmw_16_32<rmw_16>, inst16_32>;
728 def : BinRMWPatExternalSym<i64, zext_bin_rmw_8_64<rmw_8>, inst8_64>;
729 def : BinRMWPatExternalSym<i64, zext_bin_rmw_16_64<rmw_16>, inst16_64>;
730 def : BinRMWPatExternalSym<i64, zext_bin_rmw_32_64<rmw_32>, inst32_64>;
731
732 def : BinRMWPatExternalSym<i32, sext_bin_rmw_8_32<rmw_8>, inst8_32>;
733 def : BinRMWPatExternalSym<i32, sext_bin_rmw_16_32<rmw_16>, inst16_32>;
734 def : BinRMWPatExternalSym<i64, sext_bin_rmw_8_64<rmw_8>, inst8_64>;
735 def : BinRMWPatExternalSym<i64, sext_bin_rmw_16_64<rmw_16>, inst16_64>;
736
737 // Truncating-extending binary RMWs with just a constant offset
738 def : BinRMWPatOffsetOnly<i32, zext_bin_rmw_8_32<rmw_8>, inst8_32>;
739 def : BinRMWPatOffsetOnly<i32, zext_bin_rmw_16_32<rmw_16>, inst16_32>;
740 def : BinRMWPatOffsetOnly<i64, zext_bin_rmw_8_64<rmw_8>, inst8_64>;
741 def : BinRMWPatOffsetOnly<i64, zext_bin_rmw_16_64<rmw_16>, inst16_64>;
742 def : BinRMWPatOffsetOnly<i64, zext_bin_rmw_32_64<rmw_32>, inst32_64>;
743
744 def : BinRMWPatOffsetOnly<i32, sext_bin_rmw_8_32<rmw_8>, inst8_32>;
745 def : BinRMWPatOffsetOnly<i32, sext_bin_rmw_16_32<rmw_16>, inst16_32>;
746 def : BinRMWPatOffsetOnly<i64, sext_bin_rmw_8_64<rmw_8>, inst8_64>;
747 def : BinRMWPatOffsetOnly<i64, sext_bin_rmw_16_64<rmw_16>, inst16_64>;
748
749 def : BinRMWPatGlobalAddrOffOnly<i32, zext_bin_rmw_8_32<rmw_8>, inst8_32>;
750 def : BinRMWPatGlobalAddrOffOnly<i32, zext_bin_rmw_16_32<rmw_16>, inst16_32>;
751 def : BinRMWPatGlobalAddrOffOnly<i64, zext_bin_rmw_8_64<rmw_8>, inst8_64>;
752 def : BinRMWPatGlobalAddrOffOnly<i64, zext_bin_rmw_16_64<rmw_16>, inst16_64>;
753 def : BinRMWPatGlobalAddrOffOnly<i64, zext_bin_rmw_32_64<rmw_32>, inst32_64>;
754
755 def : BinRMWPatGlobalAddrOffOnly<i32, sext_bin_rmw_8_32<rmw_8>, inst8_32>;
756 def : BinRMWPatGlobalAddrOffOnly<i32, sext_bin_rmw_16_32<rmw_16>, inst16_32>;
757 def : BinRMWPatGlobalAddrOffOnly<i64, sext_bin_rmw_8_64<rmw_8>, inst8_64>;
758 def : BinRMWPatGlobalAddrOffOnly<i64, sext_bin_rmw_16_64<rmw_16>, inst16_64>;
759
760 def : BinRMWPatExternSymOffOnly<i32, zext_bin_rmw_8_32<rmw_8>, inst8_32>;
761 def : BinRMWPatExternSymOffOnly<i32, zext_bin_rmw_16_32<rmw_16>, inst16_32>;
762 def : BinRMWPatExternSymOffOnly<i64, zext_bin_rmw_8_64<rmw_8>, inst8_64>;
763 def : BinRMWPatExternSymOffOnly<i64, zext_bin_rmw_16_64<rmw_16>, inst16_64>;
764 def : BinRMWPatExternSymOffOnly<i64, zext_bin_rmw_32_64<rmw_32>, inst32_64>;
765
766 def : BinRMWPatExternSymOffOnly<i32, sext_bin_rmw_8_32<rmw_8>, inst8_32>;
767 def : BinRMWPatExternSymOffOnly<i32, sext_bin_rmw_16_32<rmw_16>, inst16_32>;
768 def : BinRMWPatExternSymOffOnly<i64, sext_bin_rmw_8_64<rmw_8>, inst8_64>;
769 def : BinRMWPatExternSymOffOnly<i64, sext_bin_rmw_16_64<rmw_16>, inst16_64>;
770}
771
772let Predicates = [HasAtomics] in {
773defm : BinRMWTruncExtPattern<
774 atomic_load_add_8, atomic_load_add_16, atomic_load_add_32, atomic_load_add_64,
775 ATOMIC_RMW8_U_ADD_I32, ATOMIC_RMW16_U_ADD_I32,
776 ATOMIC_RMW8_U_ADD_I64, ATOMIC_RMW16_U_ADD_I64, ATOMIC_RMW32_U_ADD_I64>;
777defm : BinRMWTruncExtPattern<
778 atomic_load_sub_8, atomic_load_sub_16, atomic_load_sub_32, atomic_load_sub_64,
779 ATOMIC_RMW8_U_SUB_I32, ATOMIC_RMW16_U_SUB_I32,
780 ATOMIC_RMW8_U_SUB_I64, ATOMIC_RMW16_U_SUB_I64, ATOMIC_RMW32_U_SUB_I64>;
781defm : BinRMWTruncExtPattern<
782 atomic_load_and_8, atomic_load_and_16, atomic_load_and_32, atomic_load_and_64,
783 ATOMIC_RMW8_U_AND_I32, ATOMIC_RMW16_U_AND_I32,
784 ATOMIC_RMW8_U_AND_I64, ATOMIC_RMW16_U_AND_I64, ATOMIC_RMW32_U_AND_I64>;
785defm : BinRMWTruncExtPattern<
786 atomic_load_or_8, atomic_load_or_16, atomic_load_or_32, atomic_load_or_64,
787 ATOMIC_RMW8_U_OR_I32, ATOMIC_RMW16_U_OR_I32,
788 ATOMIC_RMW8_U_OR_I64, ATOMIC_RMW16_U_OR_I64, ATOMIC_RMW32_U_OR_I64>;
789defm : BinRMWTruncExtPattern<
790 atomic_load_xor_8, atomic_load_xor_16, atomic_load_xor_32, atomic_load_xor_64,
791 ATOMIC_RMW8_U_XOR_I32, ATOMIC_RMW16_U_XOR_I32,
792 ATOMIC_RMW8_U_XOR_I64, ATOMIC_RMW16_U_XOR_I64, ATOMIC_RMW32_U_XOR_I64>;
793defm : BinRMWTruncExtPattern<
794 atomic_swap_8, atomic_swap_16, atomic_swap_32, atomic_swap_64,
795 ATOMIC_RMW8_U_XCHG_I32, ATOMIC_RMW16_U_XCHG_I32,
796 ATOMIC_RMW8_U_XCHG_I64, ATOMIC_RMW16_U_XCHG_I64, ATOMIC_RMW32_U_XCHG_I64>;
797} // Predicates = [HasAtomics]
Heejin Ahnb3724b72018-08-01 19:40:28 +0000798
799//===----------------------------------------------------------------------===//
800// Atomic ternary read-modify-writes
801//===----------------------------------------------------------------------===//
802
Heejin Ahne8653bb2018-08-07 00:22:22 +0000803// TODO LLVM IR's cmpxchg instruction returns a pair of {loaded value, success
804// flag}. When we use the success flag or both values, we can't make use of i64
805// truncate/extend versions of instructions for now, which is suboptimal.
806// Consider adding a pass after instruction selection that optimizes this case
807// if it is frequent.
Heejin Ahnb3724b72018-08-01 19:40:28 +0000808
Heejin Ahn20ea1822019-02-20 01:29:34 +0000809multiclass WebAssemblyTerRMW<WebAssemblyRegClass rc, string name,
810 int atomic_op> {
811 defm "" :
812 ATOMIC_I<(outs rc:$dst),
813 (ins P2Align:$p2align, offset32_op:$off, I32:$addr, rc:$exp,
Thomas Lively972d7d52019-03-09 04:31:37 +0000814 rc:$new_),
Heejin Ahn20ea1822019-02-20 01:29:34 +0000815 (outs), (ins P2Align:$p2align, offset32_op:$off), [],
Thomas Lively972d7d52019-03-09 04:31:37 +0000816 !strconcat(name, "\t$dst, ${off}(${addr})${p2align}, $exp, $new_"),
Heejin Ahn20ea1822019-02-20 01:29:34 +0000817 !strconcat(name, "\t${off}${p2align}"), atomic_op>;
Heejin Ahnb3724b72018-08-01 19:40:28 +0000818}
819
820defm ATOMIC_RMW_CMPXCHG_I32 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000821 WebAssemblyTerRMW<I32, "i32.atomic.rmw.cmpxchg", 0x48>;
Heejin Ahnb3724b72018-08-01 19:40:28 +0000822defm ATOMIC_RMW_CMPXCHG_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000823 WebAssemblyTerRMW<I64, "i64.atomic.rmw.cmpxchg", 0x49>;
Heejin Ahnb3724b72018-08-01 19:40:28 +0000824defm ATOMIC_RMW8_U_CMPXCHG_I32 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000825 WebAssemblyTerRMW<I32, "i32.atomic.rmw8.cmpxchg_u", 0x4a>;
Heejin Ahnb3724b72018-08-01 19:40:28 +0000826defm ATOMIC_RMW16_U_CMPXCHG_I32 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000827 WebAssemblyTerRMW<I32, "i32.atomic.rmw16.cmpxchg_u", 0x4b>;
Heejin Ahnb3724b72018-08-01 19:40:28 +0000828defm ATOMIC_RMW8_U_CMPXCHG_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000829 WebAssemblyTerRMW<I64, "i64.atomic.rmw8.cmpxchg_u", 0x4c>;
Heejin Ahnb3724b72018-08-01 19:40:28 +0000830defm ATOMIC_RMW16_U_CMPXCHG_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000831 WebAssemblyTerRMW<I64, "i64.atomic.rmw16.cmpxchg_u", 0x4d>;
Heejin Ahnb3724b72018-08-01 19:40:28 +0000832defm ATOMIC_RMW32_U_CMPXCHG_I64 :
Heejin Ahn20ea1822019-02-20 01:29:34 +0000833 WebAssemblyTerRMW<I64, "i64.atomic.rmw32.cmpxchg_u", 0x4e>;
Heejin Ahnb3724b72018-08-01 19:40:28 +0000834
835// Select ternary RMWs with no constant offset.
836class TerRMWPatNoOffset<ValueType ty, PatFrag kind, NI inst> :
837 Pat<(ty (kind I32:$addr, ty:$exp, ty:$new)),
838 (inst 0, 0, I32:$addr, ty:$exp, ty:$new)>;
839
840// Select ternary RMWs with a constant offset.
841
842// Pattern with address + immediate offset
843class TerRMWPatImmOff<ValueType ty, PatFrag kind, PatFrag operand, NI inst> :
844 Pat<(ty (kind (operand I32:$addr, imm:$off), ty:$exp, ty:$new)),
845 (inst 0, imm:$off, I32:$addr, ty:$exp, ty:$new)>;
846
847class TerRMWPatGlobalAddr<ValueType ty, PatFrag kind, NI inst> :
848 Pat<(ty (kind (regPlusGA I32:$addr, (WebAssemblywrapper tglobaladdr:$off)),
849 ty:$exp, ty:$new)),
850 (inst 0, tglobaladdr:$off, I32:$addr, ty:$exp, ty:$new)>;
851
852class TerRMWPatExternalSym<ValueType ty, PatFrag kind, NI inst> :
853 Pat<(ty (kind (add I32:$addr, (WebAssemblywrapper texternalsym:$off)),
854 ty:$exp, ty:$new)),
855 (inst 0, texternalsym:$off, I32:$addr, ty:$exp, ty:$new)>;
856
857// Select ternary RMWs with just a constant offset.
858class TerRMWPatOffsetOnly<ValueType ty, PatFrag kind, NI inst> :
859 Pat<(ty (kind imm:$off, ty:$exp, ty:$new)),
860 (inst 0, imm:$off, (CONST_I32 0), ty:$exp, ty:$new)>;
861
862class TerRMWPatGlobalAddrOffOnly<ValueType ty, PatFrag kind, NI inst> :
863 Pat<(ty (kind (WebAssemblywrapper tglobaladdr:$off), ty:$exp, ty:$new)),
864 (inst 0, tglobaladdr:$off, (CONST_I32 0), ty:$exp, ty:$new)>;
865
866class TerRMWPatExternSymOffOnly<ValueType ty, PatFrag kind, NI inst> :
867 Pat<(ty (kind (WebAssemblywrapper texternalsym:$off), ty:$exp, ty:$new)),
868 (inst 0, texternalsym:$off, (CONST_I32 0), ty:$exp, ty:$new)>;
869
870// Patterns for various addressing modes.
871multiclass TerRMWPattern<PatFrag rmw_32, PatFrag rmw_64, NI inst_32,
872 NI inst_64> {
873 def : TerRMWPatNoOffset<i32, rmw_32, inst_32>;
874 def : TerRMWPatNoOffset<i64, rmw_64, inst_64>;
875
876 def : TerRMWPatImmOff<i32, rmw_32, regPlusImm, inst_32>;
877 def : TerRMWPatImmOff<i64, rmw_64, regPlusImm, inst_64>;
878 def : TerRMWPatImmOff<i32, rmw_32, or_is_add, inst_32>;
879 def : TerRMWPatImmOff<i64, rmw_64, or_is_add, inst_64>;
880
881 def : TerRMWPatGlobalAddr<i32, rmw_32, inst_32>;
882 def : TerRMWPatGlobalAddr<i64, rmw_64, inst_64>;
883
884 def : TerRMWPatExternalSym<i32, rmw_32, inst_32>;
885 def : TerRMWPatExternalSym<i64, rmw_64, inst_64>;
886
887 def : TerRMWPatOffsetOnly<i32, rmw_32, inst_32>;
888 def : TerRMWPatOffsetOnly<i64, rmw_64, inst_64>;
889
890 def : TerRMWPatGlobalAddrOffOnly<i32, rmw_32, inst_32>;
891 def : TerRMWPatGlobalAddrOffOnly<i64, rmw_64, inst_64>;
892
893 def : TerRMWPatExternSymOffOnly<i32, rmw_32, inst_32>;
894 def : TerRMWPatExternSymOffOnly<i64, rmw_64, inst_64>;
895}
896
Heejin Ahn43675872019-02-06 00:17:03 +0000897let Predicates = [HasAtomics] in
Heejin Ahnb3724b72018-08-01 19:40:28 +0000898defm : TerRMWPattern<atomic_cmp_swap_32, atomic_cmp_swap_64,
899 ATOMIC_RMW_CMPXCHG_I32, ATOMIC_RMW_CMPXCHG_I64>;
Heejin Ahnb3724b72018-08-01 19:40:28 +0000900
901// Truncating & zero-extending ternary RMW patterns.
902// DAG legalization & optimization before instruction selection may introduce
903// additional nodes such as anyext or assertzext depending on operand types.
904class zext_ter_rmw_8_32<PatFrag kind> :
905 PatFrag<(ops node:$addr, node:$exp, node:$new),
906 (and (i32 (kind node:$addr, node:$exp, node:$new)), 255)>;
907class zext_ter_rmw_16_32<PatFrag kind> :
908 PatFrag<(ops node:$addr, node:$exp, node:$new),
909 (and (i32 (kind node:$addr, node:$exp, node:$new)), 65535)>;
910class zext_ter_rmw_8_64<PatFrag kind> :
911 PatFrag<(ops node:$addr, node:$exp, node:$new),
912 (zext (i32 (assertzext (i32 (kind node:$addr,
913 (i32 (trunc (i64 node:$exp))),
914 (i32 (trunc (i64 node:$new))))))))>;
915class zext_ter_rmw_16_64<PatFrag kind> : zext_ter_rmw_8_64<kind>;
916class zext_ter_rmw_32_64<PatFrag kind> :
917 PatFrag<(ops node:$addr, node:$exp, node:$new),
918 (zext (i32 (kind node:$addr,
919 (i32 (trunc (i64 node:$exp))),
920 (i32 (trunc (i64 node:$new))))))>;
921
922// Truncating & sign-extending ternary RMW patterns.
923// We match subword RMWs (for 32-bit) and anyext RMWs (for 64-bit) and select a
924// zext RMW; the next instruction will be sext_inreg which is selected by
925// itself.
926class sext_ter_rmw_8_32<PatFrag kind> :
927 PatFrag<(ops node:$addr, node:$exp, node:$new),
928 (kind node:$addr, node:$exp, node:$new)>;
929class sext_ter_rmw_16_32<PatFrag kind> : sext_ter_rmw_8_32<kind>;
930class sext_ter_rmw_8_64<PatFrag kind> :
931 PatFrag<(ops node:$addr, node:$exp, node:$new),
932 (anyext (i32 (assertzext (i32
933 (kind node:$addr,
934 (i32 (trunc (i64 node:$exp))),
935 (i32 (trunc (i64 node:$new))))))))>;
936class sext_ter_rmw_16_64<PatFrag kind> : sext_ter_rmw_8_64<kind>;
Thomas Lively6a87dda2019-01-08 06:25:55 +0000937// 32->64 sext RMW gets selected as i32.atomic.rmw.***, i64.extend_i32_s
Heejin Ahnb3724b72018-08-01 19:40:28 +0000938
939// Patterns for various addressing modes for truncating-extending ternary RMWs.
940multiclass TerRMWTruncExtPattern<
941 PatFrag rmw_8, PatFrag rmw_16, PatFrag rmw_32, PatFrag rmw_64,
942 NI inst8_32, NI inst16_32, NI inst8_64, NI inst16_64, NI inst32_64> {
943 // Truncating-extending ternary RMWs with no constant offset
944 def : TerRMWPatNoOffset<i32, zext_ter_rmw_8_32<rmw_8>, inst8_32>;
945 def : TerRMWPatNoOffset<i32, zext_ter_rmw_16_32<rmw_16>, inst16_32>;
946 def : TerRMWPatNoOffset<i64, zext_ter_rmw_8_64<rmw_8>, inst8_64>;
947 def : TerRMWPatNoOffset<i64, zext_ter_rmw_16_64<rmw_16>, inst16_64>;
948 def : TerRMWPatNoOffset<i64, zext_ter_rmw_32_64<rmw_32>, inst32_64>;
949
950 def : TerRMWPatNoOffset<i32, sext_ter_rmw_8_32<rmw_8>, inst8_32>;
951 def : TerRMWPatNoOffset<i32, sext_ter_rmw_16_32<rmw_16>, inst16_32>;
952 def : TerRMWPatNoOffset<i64, sext_ter_rmw_8_64<rmw_8>, inst8_64>;
953 def : TerRMWPatNoOffset<i64, sext_ter_rmw_16_64<rmw_16>, inst16_64>;
954
955 // Truncating-extending ternary RMWs with a constant offset
956 def : TerRMWPatImmOff<i32, zext_ter_rmw_8_32<rmw_8>, regPlusImm, inst8_32>;
957 def : TerRMWPatImmOff<i32, zext_ter_rmw_16_32<rmw_16>, regPlusImm, inst16_32>;
958 def : TerRMWPatImmOff<i64, zext_ter_rmw_8_64<rmw_8>, regPlusImm, inst8_64>;
959 def : TerRMWPatImmOff<i64, zext_ter_rmw_16_64<rmw_16>, regPlusImm, inst16_64>;
960 def : TerRMWPatImmOff<i64, zext_ter_rmw_32_64<rmw_32>, regPlusImm, inst32_64>;
961 def : TerRMWPatImmOff<i32, zext_ter_rmw_8_32<rmw_8>, or_is_add, inst8_32>;
962 def : TerRMWPatImmOff<i32, zext_ter_rmw_16_32<rmw_16>, or_is_add, inst16_32>;
963 def : TerRMWPatImmOff<i64, zext_ter_rmw_8_64<rmw_8>, or_is_add, inst8_64>;
964 def : TerRMWPatImmOff<i64, zext_ter_rmw_16_64<rmw_16>, or_is_add, inst16_64>;
965 def : TerRMWPatImmOff<i64, zext_ter_rmw_32_64<rmw_32>, or_is_add, inst32_64>;
966
967 def : TerRMWPatImmOff<i32, sext_ter_rmw_8_32<rmw_8>, regPlusImm, inst8_32>;
968 def : TerRMWPatImmOff<i32, sext_ter_rmw_16_32<rmw_16>, regPlusImm, inst16_32>;
969 def : TerRMWPatImmOff<i64, sext_ter_rmw_8_64<rmw_8>, regPlusImm, inst8_64>;
970 def : TerRMWPatImmOff<i64, sext_ter_rmw_16_64<rmw_16>, regPlusImm, inst16_64>;
971 def : TerRMWPatImmOff<i32, sext_ter_rmw_8_32<rmw_8>, or_is_add, inst8_32>;
972 def : TerRMWPatImmOff<i32, sext_ter_rmw_16_32<rmw_16>, or_is_add, inst16_32>;
973 def : TerRMWPatImmOff<i64, sext_ter_rmw_8_64<rmw_8>, or_is_add, inst8_64>;
974 def : TerRMWPatImmOff<i64, sext_ter_rmw_16_64<rmw_16>, or_is_add, inst16_64>;
975
976 def : TerRMWPatGlobalAddr<i32, zext_ter_rmw_8_32<rmw_8>, inst8_32>;
977 def : TerRMWPatGlobalAddr<i32, zext_ter_rmw_16_32<rmw_16>, inst16_32>;
978 def : TerRMWPatGlobalAddr<i64, zext_ter_rmw_8_64<rmw_8>, inst8_64>;
979 def : TerRMWPatGlobalAddr<i64, zext_ter_rmw_16_64<rmw_16>, inst16_64>;
980 def : TerRMWPatGlobalAddr<i64, zext_ter_rmw_32_64<rmw_32>, inst32_64>;
981
982 def : TerRMWPatGlobalAddr<i32, sext_ter_rmw_8_32<rmw_8>, inst8_32>;
983 def : TerRMWPatGlobalAddr<i32, sext_ter_rmw_16_32<rmw_16>, inst16_32>;
984 def : TerRMWPatGlobalAddr<i64, sext_ter_rmw_8_64<rmw_8>, inst8_64>;
985 def : TerRMWPatGlobalAddr<i64, sext_ter_rmw_16_64<rmw_16>, inst16_64>;
986
987 def : TerRMWPatExternalSym<i32, zext_ter_rmw_8_32<rmw_8>, inst8_32>;
988 def : TerRMWPatExternalSym<i32, zext_ter_rmw_16_32<rmw_16>, inst16_32>;
989 def : TerRMWPatExternalSym<i64, zext_ter_rmw_8_64<rmw_8>, inst8_64>;
990 def : TerRMWPatExternalSym<i64, zext_ter_rmw_16_64<rmw_16>, inst16_64>;
991 def : TerRMWPatExternalSym<i64, zext_ter_rmw_32_64<rmw_32>, inst32_64>;
992
993 def : TerRMWPatExternalSym<i32, sext_ter_rmw_8_32<rmw_8>, inst8_32>;
994 def : TerRMWPatExternalSym<i32, sext_ter_rmw_16_32<rmw_16>, inst16_32>;
995 def : TerRMWPatExternalSym<i64, sext_ter_rmw_8_64<rmw_8>, inst8_64>;
996 def : TerRMWPatExternalSym<i64, sext_ter_rmw_16_64<rmw_16>, inst16_64>;
997
998 // Truncating-extending ternary RMWs with just a constant offset
999 def : TerRMWPatOffsetOnly<i32, zext_ter_rmw_8_32<rmw_8>, inst8_32>;
1000 def : TerRMWPatOffsetOnly<i32, zext_ter_rmw_16_32<rmw_16>, inst16_32>;
1001 def : TerRMWPatOffsetOnly<i64, zext_ter_rmw_8_64<rmw_8>, inst8_64>;
1002 def : TerRMWPatOffsetOnly<i64, zext_ter_rmw_16_64<rmw_16>, inst16_64>;
1003 def : TerRMWPatOffsetOnly<i64, zext_ter_rmw_32_64<rmw_32>, inst32_64>;
1004
1005 def : TerRMWPatOffsetOnly<i32, sext_ter_rmw_8_32<rmw_8>, inst8_32>;
1006 def : TerRMWPatOffsetOnly<i32, sext_ter_rmw_16_32<rmw_16>, inst16_32>;
1007 def : TerRMWPatOffsetOnly<i64, sext_ter_rmw_8_64<rmw_8>, inst8_64>;
1008 def : TerRMWPatOffsetOnly<i64, sext_ter_rmw_16_64<rmw_16>, inst16_64>;
1009
1010 def : TerRMWPatGlobalAddrOffOnly<i32, zext_ter_rmw_8_32<rmw_8>, inst8_32>;
1011 def : TerRMWPatGlobalAddrOffOnly<i32, zext_ter_rmw_16_32<rmw_16>, inst16_32>;
1012 def : TerRMWPatGlobalAddrOffOnly<i64, zext_ter_rmw_8_64<rmw_8>, inst8_64>;
1013 def : TerRMWPatGlobalAddrOffOnly<i64, zext_ter_rmw_16_64<rmw_16>, inst16_64>;
1014 def : TerRMWPatGlobalAddrOffOnly<i64, zext_ter_rmw_32_64<rmw_32>, inst32_64>;
1015
1016 def : TerRMWPatGlobalAddrOffOnly<i32, sext_ter_rmw_8_32<rmw_8>, inst8_32>;
1017 def : TerRMWPatGlobalAddrOffOnly<i32, sext_ter_rmw_16_32<rmw_16>, inst16_32>;
1018 def : TerRMWPatGlobalAddrOffOnly<i64, sext_ter_rmw_8_64<rmw_8>, inst8_64>;
1019 def : TerRMWPatGlobalAddrOffOnly<i64, sext_ter_rmw_16_64<rmw_16>, inst16_64>;
1020
1021 def : TerRMWPatExternSymOffOnly<i32, zext_ter_rmw_8_32<rmw_8>, inst8_32>;
1022 def : TerRMWPatExternSymOffOnly<i32, zext_ter_rmw_16_32<rmw_16>, inst16_32>;
1023 def : TerRMWPatExternSymOffOnly<i64, zext_ter_rmw_8_64<rmw_8>, inst8_64>;
1024 def : TerRMWPatExternSymOffOnly<i64, zext_ter_rmw_16_64<rmw_16>, inst16_64>;
1025 def : TerRMWPatExternSymOffOnly<i64, zext_ter_rmw_32_64<rmw_32>, inst32_64>;
1026
1027 def : TerRMWPatExternSymOffOnly<i32, sext_ter_rmw_8_32<rmw_8>, inst8_32>;
1028 def : TerRMWPatExternSymOffOnly<i32, sext_ter_rmw_16_32<rmw_16>, inst16_32>;
1029 def : TerRMWPatExternSymOffOnly<i64, sext_ter_rmw_8_64<rmw_8>, inst8_64>;
1030 def : TerRMWPatExternSymOffOnly<i64, sext_ter_rmw_16_64<rmw_16>, inst16_64>;
1031}
1032
Heejin Ahn43675872019-02-06 00:17:03 +00001033let Predicates = [HasAtomics] in
Heejin Ahnb3724b72018-08-01 19:40:28 +00001034defm : TerRMWTruncExtPattern<
1035 atomic_cmp_swap_8, atomic_cmp_swap_16, atomic_cmp_swap_32, atomic_cmp_swap_64,
1036 ATOMIC_RMW8_U_CMPXCHG_I32, ATOMIC_RMW16_U_CMPXCHG_I32,
1037 ATOMIC_RMW8_U_CMPXCHG_I64, ATOMIC_RMW16_U_CMPXCHG_I64,
1038 ATOMIC_RMW32_U_CMPXCHG_I64>;