AArch64/ARM64: remove AArch64 from tree prior to renaming ARM64.
[oota-llvm.git] / lib / Target / ARM64 / ARM64InstrAtomics.td
1 //===- ARM64InstrAtomics.td - ARM64 Atomic codegen support -*- tablegen -*-===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // ARM64 Atomic operand code-gen constructs.
11 //
12 //===----------------------------------------------------------------------===//
13
14 //===----------------------------------
15 // Atomic fences
16 //===----------------------------------
17 def : Pat<(atomic_fence (i64 4), (imm)), (DMB (i32 0x9))>;
18 def : Pat<(atomic_fence (imm), (imm)), (DMB (i32 0xb))>;
19
20 //===----------------------------------
21 // Atomic loads
22 //===----------------------------------
23
24 // When they're actually atomic, only one addressing mode (GPR64sp) is
25 // supported, but when they're relaxed and anything can be used, all the
26 // standard modes would be valid and may give efficiency gains.
27
28 // A atomic load operation that actually needs acquire semantics.
29 class acquiring_load<PatFrag base>
30   : PatFrag<(ops node:$ptr), (base node:$ptr), [{
31   AtomicOrdering Ordering = cast<AtomicSDNode>(N)->getOrdering();
32   assert(Ordering != AcquireRelease && "unexpected load ordering");
33   return Ordering == Acquire || Ordering == SequentiallyConsistent;
34 }]>;
35
36 // An atomic load operation that does not need either acquire or release
37 // semantics.
38 class relaxed_load<PatFrag base>
39   : PatFrag<(ops node:$ptr), (base node:$ptr), [{
40   AtomicOrdering Ordering = cast<AtomicSDNode>(N)->getOrdering();
41   return Ordering == Monotonic || Ordering == Unordered;
42 }]>;
43
44 // 8-bit loads
45 def : Pat<(acquiring_load<atomic_load_8>  GPR64sp:$ptr), (LDARB GPR64sp:$ptr)>;
46 def : Pat<(relaxed_load<atomic_load_8> (ro_Windexed8 GPR64sp:$Rn, GPR32:$Rm,
47                                                      ro_Wextend8:$offset)),
48           (LDRBBroW GPR64sp:$Rn, GPR32:$Rm, ro_Wextend8:$offset)>;
49 def : Pat<(relaxed_load<atomic_load_8> (ro_Xindexed8 GPR64sp:$Rn, GPR64:$Rm,
50                                                      ro_Xextend8:$offset)),
51           (LDRBBroX GPR64sp:$Rn, GPR64:$Rm, ro_Xextend8:$offset)>;
52 def : Pat<(relaxed_load<atomic_load_8> (am_indexed8 GPR64sp:$Rn,
53                                                     uimm12s1:$offset)),
54           (LDRBBui GPR64sp:$Rn, uimm12s1:$offset)>;
55 def : Pat<(relaxed_load<atomic_load_8>
56                (am_unscaled8 GPR64sp:$Rn, simm9:$offset)),
57           (LDURBBi GPR64sp:$Rn, simm9:$offset)>;
58
59 // 16-bit loads
60 def : Pat<(acquiring_load<atomic_load_16> GPR64sp:$ptr), (LDARH GPR64sp:$ptr)>;
61 def : Pat<(relaxed_load<atomic_load_16> (ro_Windexed16 GPR64sp:$Rn, GPR32:$Rm,
62                                                        ro_Wextend16:$extend)),
63           (LDRHHroW GPR64sp:$Rn, GPR32:$Rm, ro_Wextend16:$extend)>;
64 def : Pat<(relaxed_load<atomic_load_16> (ro_Xindexed16 GPR64sp:$Rn, GPR64:$Rm,
65                                                        ro_Xextend16:$extend)),
66           (LDRHHroX GPR64sp:$Rn, GPR64:$Rm, ro_Xextend16:$extend)>;
67 def : Pat<(relaxed_load<atomic_load_16> (am_indexed16 GPR64sp:$Rn,
68                                                       uimm12s2:$offset)),
69           (LDRHHui GPR64sp:$Rn, uimm12s2:$offset)>;
70 def : Pat<(relaxed_load<atomic_load_16>
71                (am_unscaled16 GPR64sp:$Rn, simm9:$offset)),
72           (LDURHHi GPR64sp:$Rn, simm9:$offset)>;
73
74 // 32-bit loads
75 def : Pat<(acquiring_load<atomic_load_32> GPR64sp:$ptr), (LDARW GPR64sp:$ptr)>;
76 def : Pat<(relaxed_load<atomic_load_32> (ro_Windexed32 GPR64sp:$Rn, GPR32:$Rm,
77                                                        ro_Wextend32:$extend)),
78           (LDRWroW GPR64sp:$Rn, GPR32:$Rm, ro_Wextend32:$extend)>;
79 def : Pat<(relaxed_load<atomic_load_32> (ro_Xindexed32 GPR64sp:$Rn, GPR64:$Rm,
80                                                        ro_Xextend32:$extend)),
81           (LDRWroX GPR64sp:$Rn, GPR64:$Rm, ro_Xextend32:$extend)>;
82 def : Pat<(relaxed_load<atomic_load_32> (am_indexed32 GPR64sp:$Rn,
83                                                       uimm12s4:$offset)),
84           (LDRWui GPR64sp:$Rn, uimm12s4:$offset)>;
85 def : Pat<(relaxed_load<atomic_load_32>
86                (am_unscaled32 GPR64sp:$Rn, simm9:$offset)),
87           (LDURWi GPR64sp:$Rn, simm9:$offset)>;
88
89 // 64-bit loads
90 def : Pat<(acquiring_load<atomic_load_64> GPR64sp:$ptr), (LDARX GPR64sp:$ptr)>;
91 def : Pat<(relaxed_load<atomic_load_64> (ro_Windexed64 GPR64sp:$Rn, GPR32:$Rm,
92                                                        ro_Wextend64:$extend)),
93           (LDRXroW GPR64sp:$Rn, GPR32:$Rm, ro_Wextend64:$extend)>;
94 def : Pat<(relaxed_load<atomic_load_64> (ro_Xindexed64 GPR64sp:$Rn, GPR64:$Rm,
95                                                        ro_Xextend64:$extend)),
96           (LDRXroX GPR64sp:$Rn, GPR64:$Rm, ro_Xextend64:$extend)>;
97 def : Pat<(relaxed_load<atomic_load_64> (am_indexed64 GPR64sp:$Rn,
98                                                       uimm12s8:$offset)),
99           (LDRXui GPR64sp:$Rn, uimm12s8:$offset)>;
100 def : Pat<(relaxed_load<atomic_load_64>
101                (am_unscaled64 GPR64sp:$Rn, simm9:$offset)),
102           (LDURXi GPR64sp:$Rn, simm9:$offset)>;
103
104 //===----------------------------------
105 // Atomic stores
106 //===----------------------------------
107
108 // When they're actually atomic, only one addressing mode (GPR64sp) is
109 // supported, but when they're relaxed and anything can be used, all the
110 // standard modes would be valid and may give efficiency gains.
111
112 // A store operation that actually needs release semantics.
113 class releasing_store<PatFrag base>
114   : PatFrag<(ops node:$ptr, node:$val), (base node:$ptr, node:$val), [{
115   AtomicOrdering Ordering = cast<AtomicSDNode>(N)->getOrdering();
116   assert(Ordering != AcquireRelease && "unexpected store ordering");
117   return Ordering == Release || Ordering == SequentiallyConsistent;
118 }]>;
119
120 // An atomic store operation that doesn't actually need to be atomic on ARM64.
121 class relaxed_store<PatFrag base>
122   : PatFrag<(ops node:$ptr, node:$val), (base node:$ptr, node:$val), [{
123   AtomicOrdering Ordering = cast<AtomicSDNode>(N)->getOrdering();
124   return Ordering == Monotonic || Ordering == Unordered;
125 }]>;
126
127 // 8-bit stores
128 def : Pat<(releasing_store<atomic_store_8> GPR64sp:$ptr, GPR32:$val),
129           (STLRB GPR32:$val, GPR64sp:$ptr)>;
130 def : Pat<(relaxed_store<atomic_store_8>
131                (ro_Windexed8 GPR64sp:$Rn, GPR32:$Rm, ro_Wextend8:$extend),
132                GPR32:$val),
133           (STRBBroW GPR32:$val, GPR64sp:$Rn, GPR32:$Rm, ro_Wextend8:$extend)>;
134 def : Pat<(relaxed_store<atomic_store_8>
135                (ro_Xindexed8 GPR64sp:$Rn, GPR64:$Rm, ro_Xextend8:$extend),
136                GPR32:$val),
137           (STRBBroX GPR32:$val, GPR64sp:$Rn, GPR64:$Rm, ro_Xextend8:$extend)>;
138 def : Pat<(relaxed_store<atomic_store_8>
139                (am_indexed8 GPR64sp:$Rn, uimm12s1:$offset), GPR32:$val),
140           (STRBBui GPR32:$val, GPR64sp:$Rn, uimm12s1:$offset)>;
141 def : Pat<(relaxed_store<atomic_store_8>
142                (am_unscaled8 GPR64sp:$Rn, simm9:$offset), GPR32:$val),
143           (STURBBi GPR32:$val, GPR64sp:$Rn, simm9:$offset)>;
144
145 // 16-bit stores
146 def : Pat<(releasing_store<atomic_store_16> GPR64sp:$ptr, GPR32:$val),
147           (STLRH GPR32:$val, GPR64sp:$ptr)>;
148 def : Pat<(relaxed_store<atomic_store_16> (ro_Windexed16 GPR64sp:$Rn, GPR32:$Rm,
149                                                          ro_Wextend16:$extend),
150                                           GPR32:$val),
151           (STRHHroW GPR32:$val, GPR64sp:$Rn, GPR32:$Rm, ro_Wextend16:$extend)>;
152 def : Pat<(relaxed_store<atomic_store_16> (ro_Xindexed16 GPR64sp:$Rn, GPR64:$Rm,
153                                                          ro_Xextend16:$extend),
154                                           GPR32:$val),
155           (STRHHroX GPR32:$val, GPR64sp:$Rn, GPR64:$Rm, ro_Xextend16:$extend)>;
156 def : Pat<(relaxed_store<atomic_store_16>
157               (am_indexed16 GPR64sp:$Rn, uimm12s2:$offset), GPR32:$val),
158           (STRHHui GPR32:$val, GPR64sp:$Rn, uimm12s2:$offset)>;
159 def : Pat<(relaxed_store<atomic_store_16>
160                (am_unscaled16 GPR64sp:$Rn, simm9:$offset), GPR32:$val),
161           (STURHHi GPR32:$val, GPR64sp:$Rn, simm9:$offset)>;
162
163 // 32-bit stores
164 def : Pat<(releasing_store<atomic_store_32> GPR64sp:$ptr, GPR32:$val),
165           (STLRW GPR32:$val, GPR64sp:$ptr)>;
166 def : Pat<(relaxed_store<atomic_store_32> (ro_Windexed32 GPR64sp:$Rn, GPR32:$Rm,
167                                                          ro_Wextend32:$extend),
168                                           GPR32:$val),
169           (STRWroW GPR32:$val, GPR64sp:$Rn, GPR32:$Rm, ro_Wextend32:$extend)>;
170 def : Pat<(relaxed_store<atomic_store_32> (ro_Xindexed32 GPR64sp:$Rn, GPR64:$Rm,
171                                                          ro_Xextend32:$extend),
172                                           GPR32:$val),
173           (STRWroX GPR32:$val, GPR64sp:$Rn, GPR64:$Rm, ro_Xextend32:$extend)>;
174 def : Pat<(relaxed_store<atomic_store_32>
175               (am_indexed32 GPR64sp:$Rn, uimm12s4:$offset), GPR32:$val),
176           (STRWui GPR32:$val, GPR64sp:$Rn, uimm12s4:$offset)>;
177 def : Pat<(relaxed_store<atomic_store_32>
178                (am_unscaled32 GPR64sp:$Rn, simm9:$offset), GPR32:$val),
179           (STURWi GPR32:$val, GPR64sp:$Rn, simm9:$offset)>;
180
181 // 64-bit stores
182 def : Pat<(releasing_store<atomic_store_64> GPR64sp:$ptr, GPR64:$val),
183           (STLRX GPR64:$val, GPR64sp:$ptr)>;
184 def : Pat<(relaxed_store<atomic_store_64> (ro_Windexed64 GPR64sp:$Rn, GPR32:$Rm,
185                                                          ro_Wextend16:$extend),
186                                           GPR64:$val),
187           (STRXroW GPR64:$val, GPR64sp:$Rn, GPR32:$Rm, ro_Wextend64:$extend)>;
188 def : Pat<(relaxed_store<atomic_store_64> (ro_Xindexed64 GPR64sp:$Rn, GPR64:$Rm,
189                                                          ro_Xextend16:$extend),
190                                           GPR64:$val),
191           (STRXroX GPR64:$val, GPR64sp:$Rn, GPR64:$Rm, ro_Xextend64:$extend)>;
192 def : Pat<(relaxed_store<atomic_store_64>
193               (am_indexed64 GPR64sp:$Rn, uimm12s8:$offset), GPR64:$val),
194           (STRXui GPR64:$val, GPR64sp:$Rn, uimm12s8:$offset)>;
195 def : Pat<(relaxed_store<atomic_store_64>
196                (am_unscaled64 GPR64sp:$Rn, simm9:$offset), GPR64:$val),
197           (STURXi GPR64:$val, GPR64sp:$Rn, simm9:$offset)>;
198
199 //===----------------------------------
200 // Low-level exclusive operations
201 //===----------------------------------
202
203 // Load-exclusives.
204
205 def ldxr_1 : PatFrag<(ops node:$ptr), (int_arm64_ldxr node:$ptr), [{
206   return cast<MemIntrinsicSDNode>(N)->getMemoryVT() == MVT::i8;
207 }]>;
208
209 def ldxr_2 : PatFrag<(ops node:$ptr), (int_arm64_ldxr node:$ptr), [{
210   return cast<MemIntrinsicSDNode>(N)->getMemoryVT() == MVT::i16;
211 }]>;
212
213 def ldxr_4 : PatFrag<(ops node:$ptr), (int_arm64_ldxr node:$ptr), [{
214   return cast<MemIntrinsicSDNode>(N)->getMemoryVT() == MVT::i32;
215 }]>;
216
217 def ldxr_8 : PatFrag<(ops node:$ptr), (int_arm64_ldxr node:$ptr), [{
218   return cast<MemIntrinsicSDNode>(N)->getMemoryVT() == MVT::i64;
219 }]>;
220
221 def : Pat<(ldxr_1 GPR64sp:$addr),
222           (SUBREG_TO_REG (i64 0), (LDXRB GPR64sp:$addr), sub_32)>;
223 def : Pat<(ldxr_2 GPR64sp:$addr),
224           (SUBREG_TO_REG (i64 0), (LDXRH GPR64sp:$addr), sub_32)>;
225 def : Pat<(ldxr_4 GPR64sp:$addr),
226           (SUBREG_TO_REG (i64 0), (LDXRW GPR64sp:$addr), sub_32)>;
227 def : Pat<(ldxr_8 GPR64sp:$addr), (LDXRX GPR64sp:$addr)>;
228
229 def : Pat<(and (ldxr_1 GPR64sp:$addr), 0xff),
230           (SUBREG_TO_REG (i64 0), (LDXRB GPR64sp:$addr), sub_32)>;
231 def : Pat<(and (ldxr_2 GPR64sp:$addr), 0xffff),
232           (SUBREG_TO_REG (i64 0), (LDXRH GPR64sp:$addr), sub_32)>;
233 def : Pat<(and (ldxr_4 GPR64sp:$addr), 0xffffffff),
234           (SUBREG_TO_REG (i64 0), (LDXRW GPR64sp:$addr), sub_32)>;
235
236 // Load-exclusives.
237
238 def ldaxr_1 : PatFrag<(ops node:$ptr), (int_arm64_ldaxr node:$ptr), [{
239   return cast<MemIntrinsicSDNode>(N)->getMemoryVT() == MVT::i8;
240 }]>;
241
242 def ldaxr_2 : PatFrag<(ops node:$ptr), (int_arm64_ldaxr node:$ptr), [{
243   return cast<MemIntrinsicSDNode>(N)->getMemoryVT() == MVT::i16;
244 }]>;
245
246 def ldaxr_4 : PatFrag<(ops node:$ptr), (int_arm64_ldaxr node:$ptr), [{
247   return cast<MemIntrinsicSDNode>(N)->getMemoryVT() == MVT::i32;
248 }]>;
249
250 def ldaxr_8 : PatFrag<(ops node:$ptr), (int_arm64_ldaxr node:$ptr), [{
251   return cast<MemIntrinsicSDNode>(N)->getMemoryVT() == MVT::i64;
252 }]>;
253
254 def : Pat<(ldaxr_1 GPR64sp:$addr),
255           (SUBREG_TO_REG (i64 0), (LDAXRB GPR64sp:$addr), sub_32)>;
256 def : Pat<(ldaxr_2 GPR64sp:$addr),
257           (SUBREG_TO_REG (i64 0), (LDAXRH GPR64sp:$addr), sub_32)>;
258 def : Pat<(ldaxr_4 GPR64sp:$addr),
259           (SUBREG_TO_REG (i64 0), (LDAXRW GPR64sp:$addr), sub_32)>;
260 def : Pat<(ldaxr_8 GPR64sp:$addr), (LDAXRX GPR64sp:$addr)>;
261
262 def : Pat<(and (ldaxr_1 GPR64sp:$addr), 0xff),
263           (SUBREG_TO_REG (i64 0), (LDAXRB GPR64sp:$addr), sub_32)>;
264 def : Pat<(and (ldaxr_2 GPR64sp:$addr), 0xffff),
265           (SUBREG_TO_REG (i64 0), (LDAXRH GPR64sp:$addr), sub_32)>;
266 def : Pat<(and (ldaxr_4 GPR64sp:$addr), 0xffffffff),
267           (SUBREG_TO_REG (i64 0), (LDAXRW GPR64sp:$addr), sub_32)>;
268
269 // Store-exclusives.
270
271 def stxr_1 : PatFrag<(ops node:$val, node:$ptr),
272                      (int_arm64_stxr node:$val, node:$ptr), [{
273   return cast<MemIntrinsicSDNode>(N)->getMemoryVT() == MVT::i8;
274 }]>;
275
276 def stxr_2 : PatFrag<(ops node:$val, node:$ptr),
277                      (int_arm64_stxr node:$val, node:$ptr), [{
278   return cast<MemIntrinsicSDNode>(N)->getMemoryVT() == MVT::i16;
279 }]>;
280
281 def stxr_4 : PatFrag<(ops node:$val, node:$ptr),
282                      (int_arm64_stxr node:$val, node:$ptr), [{
283   return cast<MemIntrinsicSDNode>(N)->getMemoryVT() == MVT::i32;
284 }]>;
285
286 def stxr_8 : PatFrag<(ops node:$val, node:$ptr),
287                      (int_arm64_stxr node:$val, node:$ptr), [{
288   return cast<MemIntrinsicSDNode>(N)->getMemoryVT() == MVT::i64;
289 }]>;
290
291
292 def : Pat<(stxr_1 GPR64:$val, GPR64sp:$addr),
293           (STXRB (EXTRACT_SUBREG GPR64:$val, sub_32), GPR64sp:$addr)>;
294 def : Pat<(stxr_2 GPR64:$val, GPR64sp:$addr),
295           (STXRH (EXTRACT_SUBREG GPR64:$val, sub_32), GPR64sp:$addr)>;
296 def : Pat<(stxr_4 GPR64:$val, GPR64sp:$addr),
297           (STXRW (EXTRACT_SUBREG GPR64:$val, sub_32), GPR64sp:$addr)>;
298 def : Pat<(stxr_8 GPR64:$val, GPR64sp:$addr),
299           (STXRX GPR64:$val, GPR64sp:$addr)>;
300
301 def : Pat<(stxr_1 (zext (and GPR32:$val, 0xff)), GPR64sp:$addr),
302           (STXRB GPR32:$val, GPR64sp:$addr)>;
303 def : Pat<(stxr_2 (zext (and GPR32:$val, 0xffff)), GPR64sp:$addr),
304           (STXRH GPR32:$val, GPR64sp:$addr)>;
305 def : Pat<(stxr_4 (zext GPR32:$val), GPR64sp:$addr),
306           (STXRW GPR32:$val, GPR64sp:$addr)>;
307
308 def : Pat<(stxr_1 (and GPR64:$val, 0xff), GPR64sp:$addr),
309           (STXRB (EXTRACT_SUBREG GPR64:$val, sub_32), GPR64sp:$addr)>;
310 def : Pat<(stxr_2 (and GPR64:$val, 0xffff), GPR64sp:$addr),
311           (STXRH (EXTRACT_SUBREG GPR64:$val, sub_32), GPR64sp:$addr)>;
312 def : Pat<(stxr_4 (and GPR64:$val, 0xffffffff), GPR64sp:$addr),
313           (STXRW (EXTRACT_SUBREG GPR64:$val, sub_32), GPR64sp:$addr)>;
314
315 // Store-release-exclusives.
316
317 def stlxr_1 : PatFrag<(ops node:$val, node:$ptr),
318                      (int_arm64_stlxr node:$val, node:$ptr), [{
319   return cast<MemIntrinsicSDNode>(N)->getMemoryVT() == MVT::i8;
320 }]>;
321
322 def stlxr_2 : PatFrag<(ops node:$val, node:$ptr),
323                      (int_arm64_stlxr node:$val, node:$ptr), [{
324   return cast<MemIntrinsicSDNode>(N)->getMemoryVT() == MVT::i16;
325 }]>;
326
327 def stlxr_4 : PatFrag<(ops node:$val, node:$ptr),
328                      (int_arm64_stlxr node:$val, node:$ptr), [{
329   return cast<MemIntrinsicSDNode>(N)->getMemoryVT() == MVT::i32;
330 }]>;
331
332 def stlxr_8 : PatFrag<(ops node:$val, node:$ptr),
333                      (int_arm64_stlxr node:$val, node:$ptr), [{
334   return cast<MemIntrinsicSDNode>(N)->getMemoryVT() == MVT::i64;
335 }]>;
336
337
338 def : Pat<(stlxr_1 GPR64:$val, GPR64sp:$addr),
339           (STLXRB (EXTRACT_SUBREG GPR64:$val, sub_32), GPR64sp:$addr)>;
340 def : Pat<(stlxr_2 GPR64:$val, GPR64sp:$addr),
341           (STLXRH (EXTRACT_SUBREG GPR64:$val, sub_32), GPR64sp:$addr)>;
342 def : Pat<(stlxr_4 GPR64:$val, GPR64sp:$addr),
343           (STLXRW (EXTRACT_SUBREG GPR64:$val, sub_32), GPR64sp:$addr)>;
344 def : Pat<(stlxr_8 GPR64:$val, GPR64sp:$addr),
345           (STLXRX GPR64:$val, GPR64sp:$addr)>;
346
347 def : Pat<(stlxr_1 (zext (and GPR32:$val, 0xff)), GPR64sp:$addr),
348           (STLXRB GPR32:$val, GPR64sp:$addr)>;
349 def : Pat<(stlxr_2 (zext (and GPR32:$val, 0xffff)), GPR64sp:$addr),
350           (STLXRH GPR32:$val, GPR64sp:$addr)>;
351 def : Pat<(stlxr_4 (zext GPR32:$val), GPR64sp:$addr),
352           (STLXRW GPR32:$val, GPR64sp:$addr)>;
353
354 def : Pat<(stlxr_1 (and GPR64:$val, 0xff), GPR64sp:$addr),
355           (STLXRB (EXTRACT_SUBREG GPR64:$val, sub_32), GPR64sp:$addr)>;
356 def : Pat<(stlxr_2 (and GPR64:$val, 0xffff), GPR64sp:$addr),
357           (STLXRH (EXTRACT_SUBREG GPR64:$val, sub_32), GPR64sp:$addr)>;
358 def : Pat<(stlxr_4 (and GPR64:$val, 0xffffffff), GPR64sp:$addr),
359           (STLXRW (EXTRACT_SUBREG GPR64:$val, sub_32), GPR64sp:$addr)>;
360
361
362 // And clear exclusive.
363
364 def : Pat<(int_arm64_clrex), (CLREX 0xf)>;