[SampleProfileLoader] Fix integer overflow in generateMDProfMetadata (#90217)
[llvm-project.git] / llvm / lib / Target / AArch64 / AArch64SchedThunderX3T110.td
blob796bd4b8b5c9ae69e7b12781fba98583309b3887
1 //=- AArch64SchedThunderX3T110.td - Marvell ThunderX3 T110 ---*- tablegen -*-=//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file defines the scheduling model for Marvell ThunderX3T110
10 // family of processors.
12 //===----------------------------------------------------------------------===//
14 //===----------------------------------------------------------------------===//
15 // Pipeline Description.
17 def ThunderX3T110Model : SchedMachineModel {
18   let IssueWidth            =   4; // 4 micro-ops dispatched at a time.
19   let MicroOpBufferSize     =  70; // 70 entries in micro-op re-order buffer.
20   let LoadLatency           =   4; // Optimistic load latency.
21   let MispredictPenalty     =  12; // Extra cycles for mispredicted branch.
22   // Determined via a mix of micro-arch details and experimentation.
23   let LoopMicroOpBufferSize = 128; // FIXME: might be much bigger in TX3.
24   let PostRAScheduler       =   1; // Using PostRA sched.
25   let CompleteModel         =   1;
27   list<Predicate> UnsupportedFeatures = !listconcat(SVEUnsupported.F,
28                                                     PAUnsupported.F,
29                                                     SMEUnsupported.F,
30                                                     [HasMTE, HasCSSC]);
31   // FIXME: Remove when all errors have been fixed.
32   let FullInstRWOverlapCheck = 0;
35 let SchedModel = ThunderX3T110Model in {
37 // Issue ports.
39 // Port 0: ALU.
40 def THX3T110P0 : ProcResource<1>;
42 // Port 1: ALU.
43 def THX3T110P1 : ProcResource<1>;
45 // Port 2: ALU/Branch.
46 def THX3T110P2 : ProcResource<1>;
48 // Port 3: ALU/Branch.
49 def THX3T110P3 : ProcResource<1>;
51 // Port 4: Load/Store.
52 def THX3T110P4 : ProcResource<1>;
54 // Port 5: Load/store.
55 def THX3T110P5 : ProcResource<1>;
57 // Port 6: FP/Neon/SIMD/Crypto.
58 def THX3T110P6FP0 : ProcResource<1>;
60 // Port 7: FP/Neon/SIMD/Crypto.
61 def THX3T110P7FP1 : ProcResource<1>;
63 // Port 8: FP/Neon/SIMD/Crypto.
64 def THX3T110P8FP2 : ProcResource<1>;
66 // Port 9: FP/Neon/SIMD/Crypto.
67 def THX3T110P9FP3 : ProcResource<1>;
69 // Port 10: Store Data Unit.
70 def THX3T110SD0 : ProcResource<1>;
72 // Define groups for the functional units on each issue port.  Each group
73 // created will be used by a WriteRes.
75 // Integer divide/mulhi micro-ops only on port I1.
76 def THX3T110I1 : ProcResGroup<[THX3T110P1]>;
78 // Branch micro-ops on ports I2/I3.
79 def THX3T110I23 : ProcResGroup<[THX3T110P2, THX3T110P3]>;
81 // Branch micro-ops on ports I1/I2/I3.
82 def THX3T110I123 : ProcResGroup<[THX3T110P1, THX3T110P2, THX3T110P3]>;
84 // Integer micro-ops on ports I0/I1/I2.
85 def THX3T110I012 : ProcResGroup<[THX3T110P0, THX3T110P1, THX3T110P2]>;
87 // Integer micro-ops on ports I0/I1/I2/I3.
88 def THX3T110I0123 : ProcResGroup<[THX3T110P0, THX3T110P1,
89                                   THX3T110P2, THX3T110P3]>;
91 // FP micro-ops on ports FP0/FP1/FP2/FP3.
92 def THX3T110FP0123 : ProcResGroup<[THX3T110P6FP0, THX3T110P7FP1,
93                                    THX3T110P8FP2, THX3T110P9FP3]>;
95 // FP micro-ops on ports FP2/FP3.
96 def THX3T110FP23 : ProcResGroup<[THX3T110P8FP2, THX3T110P9FP3]>;
98 // ASIMD micro-ops on ports FP0/FP1/FP2/FP3.
99 def THX3T110SIMD : ProcResGroup<[THX3T110P6FP0, THX3T110P7FP1,
100                                  THX3T110P8FP2, THX3T110P9FP3]>;
102 // Store data micro-ops only on port 10.
103 def THX3T110SD : ProcResGroup<[THX3T110SD0]>;
105 // Load/store micro-ops on ports P4/P5.
106 def THX3T110LS : ProcResGroup<[THX3T110P4, THX3T110P5]>;
108 // 70 entry unified scheduler.
109 def THX3T110ANY: ProcResGroup<[THX3T110P0, THX3T110P1, THX3T110P2,
110                                THX3T110P3, THX3T110P4, THX3T110P5,
111                                THX3T110P6FP0, THX3T110P7FP1,
112                                THX3T110P8FP2, THX3T110P9FP3]> {
113   let BufferSize = 70;
116 // Define commonly used write types for InstRW specializations.
117 // All definitions follow the format: THX3T110Write_<NumCycles>Cyc_<Resources>.
119 // 3 cycles on I1.
120 def THX3T110Write_3Cyc_I1 : SchedWriteRes<[THX3T110I1]> {
121   let Latency = 3;
122   let NumMicroOps = 2;
125 // 4 cycles on I1.
126 def THX3T110Write_4Cyc_I1 : SchedWriteRes<[THX3T110I1]> {
127   let Latency = 4;
128   let NumMicroOps = 2;
131 // 5 cycles on I1.
132 def THX3T110Write_5Cyc_I1 : SchedWriteRes<[THX3T110I1]> {
133   let Latency = 5;
134   let NumMicroOps = 2;
137 // 7 cycles on I1.
138 def THX3T110Write_7Cyc_I1 : SchedWriteRes<[THX3T110I1]> {
139   let Latency = 7;
140   let NumMicroOps = 3;
143 // 23 cycles on I1.
144 def THX3T110Write_23Cyc_I1 : SchedWriteRes<[THX3T110I1]> {
145   let Latency = 23;
146   let ReleaseAtCycles = [13, 23];
147   let NumMicroOps = 4;
150 // 39 cycles on I1.
151 def THX3T110Write_39Cyc_I1 : SchedWriteRes<[THX3T110I1]> {
152   let Latency = 39;
153   let ReleaseAtCycles = [13, 39];
154   let NumMicroOps = 4;
157 // 1 cycle on I2/I3
158 def THX3T110Write_1Cyc_I23 : SchedWriteRes<[THX3T110I23]> {
159   let Latency = 1;
160   let NumMicroOps = 2;
163 // 8 cycles on I2/I3
164 def THX3T110Write_8Cyc_I23 : SchedWriteRes<[THX3T110I23]> {
165   let Latency = 8;
166   let NumMicroOps = 3;
169 // 1 cycle on I1/I2/I3
170 def THX3T110Write_1Cyc_I123 : SchedWriteRes<[THX3T110I123]> {
171   let Latency = 1;
172   let NumMicroOps = 2;
175 // 8 cycles on I1/I2/I3
176 def THX3T110Write_8Cyc_I123 : SchedWriteRes<[THX3T110I123]> {
177   let Latency = 8;
178   let NumMicroOps = 3;
181 // 1 cycle on I0/I1/I2/I3.
182 def THX3T110Write_1Cyc_I0123 : SchedWriteRes<[THX3T110I0123]> {
183   let Latency = 1;
184   let NumMicroOps = 2;
187 // 2 cycles on I0/I1/I2/I3.
188 def THX3T110Write_2Cyc_I0123 : SchedWriteRes<[THX3T110I0123]> {
189   let Latency = 2;
190   let NumMicroOps = 2;
193 // 3 cycles on I0/I1/I2/I3.
194 def THX3T110Write_3Cyc_I0123 : SchedWriteRes<[THX3T110I0123]> {
195   let Latency = 3;
196   let NumMicroOps = 2;
199 // 4 cycles on I0/I1/I2/I3.
200 def THX3T110Write_4Cyc_I0123 : SchedWriteRes<[THX3T110I0123]> {
201   let Latency = 4;
202   let NumMicroOps = 3;
205 // 5 cycles on I0/I1/I2/I3.
206 def THX3T110Write_5Cyc_I0123 : SchedWriteRes<[THX3T110I0123]> {
207   let Latency = 5;
208   let NumMicroOps = 3;
211 // 6 cycles on I0/I1/I2/I3.
212 def THX3T110Write_6Cyc_I0123 : SchedWriteRes<[THX3T110I0123]> {
213   let Latency = 6;
214   let NumMicroOps = 3;
217 // 8 cycles on I0/I1/I2/I3.
218 def THX3T110Write_8Cyc_I0123 : SchedWriteRes<[THX3T110I0123]> {
219   let Latency = 8;
220   let NumMicroOps = 4;
223 // 13 cycles on I0/I1/I2/I3.
224 def THX3T110Write_13Cyc_I0123 : SchedWriteRes<[THX3T110I0123]> {
225   let Latency = 13;
226   let NumMicroOps = 3;
229 // 23 cycles on I0/I1/I2/I3.
230 def THX3T110Write_23Cyc_I0123 : SchedWriteRes<[THX3T110I0123]> {
231   let Latency = 23;
232   let NumMicroOps = 3;
235 // 39 cycles on I0/I1/I2/I3.
236 def THX3T110Write_39Cyc_I0123 : SchedWriteRes<[THX3T110I0123]> {
237   let Latency = 39;
238   let NumMicroOps = 3;
241 // 4 cycles on F2/F3.
242 def THX3T110Write_4Cyc_F23 : SchedWriteRes<[THX3T110FP23]> {
243   let Latency = 4;
244   let NumMicroOps = 2;
247 // 5 cycles on F0/F1/F2/F3.
248 def THX3T110Write_5Cyc_F01 : SchedWriteRes<[THX3T110FP0123]> {
249   let Latency = 5;
250   let NumMicroOps = 2;
253 // 6 cycles on F0/F1/F2/F3.
254 def THX3T110Write_6Cyc_F01 : SchedWriteRes<[THX3T110FP0123]> {
255   let Latency = 6;
256   let NumMicroOps = 3;
259 // 7 cycles on F0/F1/F2/F3.
260 def THX3T110Write_7Cyc_F01 : SchedWriteRes<[THX3T110FP0123]> {
261   let Latency = 7;
262   let NumMicroOps = 3;
265 // 8 cycles on F0/F1/F2/F3.
266 def THX3T110Write_8Cyc_F01 : SchedWriteRes<[THX3T110FP0123]> {
267   let Latency = 8;
268   let NumMicroOps = 3;
271 // 10 cycles on F0/F1/F2/F3.
272 def THX3T110Write_10Cyc_F01 : SchedWriteRes<[THX3T110FP0123]> {
273   let Latency = 10;
274   let NumMicroOps = 3;
277 // 16 cycles on F0/F1/F2/F3.
278 def THX3T110Write_16Cyc_F01 : SchedWriteRes<[THX3T110FP0123]> {
279   let Latency = 16;
280   let NumMicroOps = 3;
281   let ReleaseAtCycles = [8];
284 // 23 cycles on F0/F1/F2/F3.
285 def THX3T110Write_23Cyc_F01 : SchedWriteRes<[THX3T110FP0123]> {
286   let Latency = 23;
287   let NumMicroOps = 3;
288   let ReleaseAtCycles = [11];
291 // 1 cycle on LS0/LS1.
292 def THX3T110Write_1Cyc_LS01 : SchedWriteRes<[THX3T110LS]> {
293   let Latency = 1;
294   let NumMicroOps = 1;
297 // 2 cycles on LS0/LS1.
298 def THX3T110Write_2Cyc_LS01 : SchedWriteRes<[THX3T110LS]> {
299   let Latency = 2;
300   let NumMicroOps = 2;
303 // 4 cycles on LS0/LS1.
304 def THX3T110Write_4Cyc_LS01 : SchedWriteRes<[THX3T110LS]> {
305   let Latency = 4;
306   let NumMicroOps = 2;
307   let ReleaseAtCycles = [2];
310 // 5 cycles on LS0/LS1.
311 def THX3T110Write_5Cyc_LS01 : SchedWriteRes<[THX3T110LS]> {
312   let Latency = 5;
313   let NumMicroOps = 3;
316 // 6 cycles on LS0/LS1.
317 def THX3T110Write_6Cyc_LS01 : SchedWriteRes<[THX3T110LS]> {
318   let Latency = 6;
319   let NumMicroOps = 3;
322 // 4 + 5 cycles on LS0/LS1.
323 // First resource is available after 4 cycles.
324 // Second resource is available after 5 cycles.
325 // Load vector pair, immed offset, Q-form [LDP/LDNP].
326 def THX3T110Write_4_5Cyc_LS01 : SchedWriteRes<[THX3T110LS]> {
327   let Latency = 4;
328   let NumMicroOps = 2;
329   let ReleaseAtCycles = [4, 5];
332 // 4 + 8 cycles on LS0/LS1.
333 // First resource is available after 4 cycles.
334 // Second resource is available after 8 cycles.
335 // Load vector pair, immed offset, S/D-form [LDP/LDNP].
336 def THX3T110Write_4_8Cyc_LS01 : SchedWriteRes<[THX3T110LS]> {
337   let Latency = 4;
338   let NumMicroOps = 2;
339   let ReleaseAtCycles = [4, 8];
342 // 11 cycles on LS0/LS1 and I1.
343 def THX3T110Write_11Cyc_LS01_I1 :
344   SchedWriteRes<[THX3T110LS, THX3T110I1]> {
345   let Latency = 11;
346   let NumMicroOps = 4;
349 // 1 cycles on LS0/LS1 and I0/I1/I2/I3.
350 def THX3T110Write_1Cyc_LS01_I0123 :
351   SchedWriteRes<[THX3T110LS, THX3T110I0123]> {
352   let Latency = 1;
353   let NumMicroOps = 2;
356 // 1 cycles on LS0/LS1 and 2 of I0/I1/I2/I3.
357 def THX3T110Write_1Cyc_LS01_I0123_I0123 :
358   SchedWriteRes<[THX3T110LS, THX3T110I0123, THX3T110I0123]> {
359   let Latency = 1;
360   let NumMicroOps = 3;
363 // 4 cycles on LS0/LS1 and I0/I1/I2/I3.
364 def THX3T110Write_4Cyc_LS01_I0123 :
365   SchedWriteRes<[THX3T110LS, THX3T110I0123]> {
366   let Latency = 4;
367   let NumMicroOps = 3;
370 // 4 cycles on LS0/LS1 and 2 of I0/I1/I2/I3.
371 def THX3T110Write_4Cyc_LS01_I0123_I0123 :
372   SchedWriteRes<[THX3T110LS, THX3T110I0123, THX3T110I0123]> {
373   let Latency = 4;
374   let NumMicroOps = 3;
377 // 5 cycles on LS0/LS1 and I0/I1/I2/I3.
378 def THX3T110Write_5Cyc_LS01_I0123 :
379   SchedWriteRes<[THX3T110LS, THX3T110I0123]> {
380   let Latency = 5;
381   let NumMicroOps = 3;
384 // 5 cycles on LS0/LS1 and 2 of I0/I1/I2/I3.
385 def THX3T110Write_5Cyc_LS01_I0123_I0123 :
386   SchedWriteRes<[THX3T110LS, THX3T110I0123, THX3T110I0123]> {
387   let Latency = 5;
388   let NumMicroOps = 3;
391 // 6 cycles on LS0/LS1 and I0/I1/I2/I3.
392 def THX3T110Write_6Cyc_LS01_I012 :
393   SchedWriteRes<[THX3T110LS, THX3T110I0123]> {
394   let Latency = 6;
395   let NumMicroOps = 4;
398 // 6 cycles on LS0/LS1 and 2 of I0/I1/I2/I3.
399 def THX3T110Write_6Cyc_LS01_I0123_I0123 :
400   SchedWriteRes<[THX3T110LS, THX3T110I0123, THX3T110I0123]> {
401   let Latency = 6;
402   let NumMicroOps = 3;
405 // 1 cycle on LS0/LS1 and SD.
406 def THX3T110Write_1Cyc_LS01_SD :
407   SchedWriteRes<[THX3T110LS, THX3T110SD]> {
408   let Latency = 1;
409   let NumMicroOps = 2;
412 // 2 cycles on LS0/LS1 and SD.
413 def THX3T110Write_2Cyc_LS01_SD :
414   SchedWriteRes<[THX3T110LS, THX3T110SD]> {
415   let Latency = 2;
416   let NumMicroOps = 2;
419 // 4 cycles on LS0/LS1 and SD.
420 def THX3T110Write_4Cyc_LS01_SD :
421   SchedWriteRes<[THX3T110LS, THX3T110SD]> {
422   let Latency = 4;
423   let NumMicroOps = 3;
426 // 5 cycles on LS0/LS1 and SD.
427 def THX3T110Write_5Cyc_LS01_SD :
428   SchedWriteRes<[THX3T110LS, THX3T110SD]> {
429   let Latency = 5;
430   let NumMicroOps = 4;
433 // 6 cycles on LS0/LS1 and SD.
434 def THX3T110Write_6Cyc_LS01_SD :
435   SchedWriteRes<[THX3T110LS, THX3T110SD]> {
436   let Latency = 6;
437   let NumMicroOps = 5;
440 // 1 cycle on LS0/LS1, SD and I0/I1/I2/I3.
441 def THX3T110Write_1Cyc_LS01_SD_I0123 :
442   SchedWriteRes<[THX3T110LS, THX3T110SD, THX3T110I0123]> {
443   let Latency = 1;
444   let NumMicroOps = 2;
447 // 2 cycles on LS0/LS1, SD and I0/I1/I2/I3.
448 def THX3T110Write_2Cyc_LS01_SD_I0123 :
449   SchedWriteRes<[THX3T110LS, THX3T110SD, THX3T110I0123]> {
450   let Latency = 2;
451   let NumMicroOps = 2;
454 // 4 cycles on LS0/LS1, SD and I0/I1/I2/I3.
455 def THX3T110Write_4Cyc_LS01_SD_I0123 :
456   SchedWriteRes<[THX3T110LS, THX3T110SD, THX3T110I0123]> {
457   let Latency = 4;
458   let NumMicroOps = 3;
461 // 5 cycles on LS0/LS1, SD and I0/I1/I2/I3.
462 def THX3T110Write_5Cyc_LS01_SD_I0123 :
463   SchedWriteRes<[THX3T110LS, THX3T110SD, THX3T110I0123]> {
464   let Latency = 5;
465   let NumMicroOps = 4;
468 // 6 cycles on LS0/LS1, SD and I0/I1/I2/I3.
469 def THX3T110Write_6Cyc_LS01_SD_I0123 :
470   SchedWriteRes<[THX3T110LS, THX3T110SD, THX3T110I0123]> {
471   let Latency = 6;
472   let NumMicroOps = 5;
475 // 1 cycles on LS0/LS1 and F0/F1/F2/F3.
476 def THX3T110Write_1Cyc_LS01_F0123 :
477   SchedWriteRes<[THX3T110LS, THX3T110FP0123]> {
478   let Latency = 1;
479   let NumMicroOps = 2;
482 // 5 cycles on LS0/LS1 and F0/F1/F2/F3.
483 def THX3T110Write_5Cyc_LS01_F0123 :
484   SchedWriteRes<[THX3T110LS, THX3T110FP0123]> {
485   let Latency = 5;
486   let NumMicroOps = 3;
489 // 6 cycles on LS0/LS1 and F0/F1/F2/F3.
490 def THX3T110Write_6Cyc_LS01_F0123 :
491   SchedWriteRes<[THX3T110LS, THX3T110FP0123]> {
492   let Latency = 6;
493   let NumMicroOps = 3;
496 // 7 cycles on LS0/LS1 and F0/F1/F2/F3.
497 def THX3T110Write_7Cyc_LS01_F0123 :
498   SchedWriteRes<[THX3T110LS, THX3T110FP0123]> {
499   let Latency = 7;
500   let NumMicroOps = 3;
503 // 8 cycles on LS0/LS1 and F0/F1/F2/F3.
504 def THX3T110Write_8Cyc_LS01_F0123 :
505   SchedWriteRes<[THX3T110LS, THX3T110FP0123]> {
506   let Latency = 8;
507   let NumMicroOps = 3;
510 // 8 cycles on LS0/LS1 and I0/I1/I2/I3.
511 def THX3T110Write_8Cyc_LS01_I0123 :
512   SchedWriteRes<[THX3T110LS, THX3T110I0123]> {
513   let Latency = 8;
514   let NumMicroOps = 3;
517 // 12 cycles on LS0/LS1 and I0/I1/I2/I3.
518 def THX3T110Write_12Cyc_LS01_I0123 :
519   SchedWriteRes<[THX3T110LS, THX3T110I0123]> {
520   let Latency = 12;
521   let NumMicroOps = 4;
524 // 16 cycles on LS0/LS1 and I0/I1/I2/I3.
525 def THX3T110Write_16Cyc_LS01_I0123 :
526   SchedWriteRes<[THX3T110LS, THX3T110I0123]> {
527   let Latency = 16;
528   let NumMicroOps = 5;
531 // 24 cycles on LS0/LS1 and I0/I1/I2/I3.
532 def THX3T110Write_24Cyc_LS01_I0123 :
533   SchedWriteRes<[THX3T110LS, THX3T110I0123]> {
534   let Latency = 24;
535   let NumMicroOps = 10;
538 // 32 cycles on LS0/LS1 and I0/I1/I2/I3.
539 def THX3T110Write_32Cyc_LS01_I0123 :
540   SchedWriteRes<[THX3T110LS, THX3T110I0123]> {
541   let Latency = 32;
542   let NumMicroOps = 14;
545 // 3 cycles on F0/F1/F2/F3.
546 def THX3T110Write_3Cyc_F0123 : SchedWriteRes<[THX3T110FP0123]> {
547   let Latency = 3;
548   let NumMicroOps = 2;
551 // 4 cycles on F0/F1/F2/F3.
552 def THX3T110Write_4Cyc_F0123 : SchedWriteRes<[THX3T110FP0123]> {
553   let Latency = 4;
554   let NumMicroOps = 2;
557 // 5 cycles on F0/F1/F2/F3.
558 def THX3T110Write_5Cyc_F0123 : SchedWriteRes<[THX3T110FP0123]> {
559   let Latency = 5;
560   let NumMicroOps = 2;
563 // 10 cycles on F0/F1/F2/F3.
564 def THX3T110Write_10Cyc_F0123 : SchedWriteRes<[THX3T110FP0123]> {
565   let Latency = 10;
566   let NumMicroOps = 4;
569 // 15 cycles on F0/F1/F2/F3.
570 def THX3T110Write_15Cyc_F0123 : SchedWriteRes<[THX3T110FP0123]> {
571   let Latency = 15;
572   let NumMicroOps = 7;
575 // 16 cycles on F0/F1/F2/F3.
576 def THX3T110Write_16Cyc_F0123 : SchedWriteRes<[THX3T110FP0123]> {
577   let Latency = 16;
578   let NumMicroOps = 3;
581 // 18 cycles on F0/F1/F2/F3.
582 def THX3T110Write_18Cyc_F0123 : SchedWriteRes<[THX3T110FP0123]> {
583   let Latency = 18;
584   let NumMicroOps = 3;
587 // 19 cycles on F0/F1/F2/F3.
588 def THX3T110Write_19Cyc_F0123 : SchedWriteRes<[THX3T110FP0123]> {
589   let Latency = 19;
590   let NumMicroOps = 4;
593 // 20 cycles on F0/F1/F2/F3.
594 def THX3T110Write_20Cyc_F0123 : SchedWriteRes<[THX3T110FP0123]> {
595   let Latency = 20;
596   let NumMicroOps = 4;
599 // 23 cycles on F0/F1/F2/F3.
600 def THX3T110Write_23Cyc_F0123 : SchedWriteRes<[THX3T110FP0123]> {
601   let Latency = 23;
602   let NumMicroOps = 4;
605 // 3 cycles on F2/F3 and 4 cycles on F0/F1/F2/F3.
606 def THX3T110Write_3_4Cyc_F23_F0123 :
607   SchedWriteRes<[THX3T110FP23, THX3T110FP0123]> {
608   let Latency = 3;
609   let NumMicroOps = 2;
610   let ReleaseAtCycles = [3, 4];
614 // Define commonly used read types.
616 // No forwarding is provided for these types.
617 def : ReadAdvance<ReadI,       0>;
618 def : ReadAdvance<ReadISReg,   0>;
619 def : ReadAdvance<ReadIEReg,   0>;
620 def : ReadAdvance<ReadIM,      0>;
621 def : ReadAdvance<ReadIMA,     0>;
622 def : ReadAdvance<ReadID,      0>;
623 def : ReadAdvance<ReadExtrHi,  0>;
624 def : ReadAdvance<ReadAdrBase, 0>;
625 def : ReadAdvance<ReadVLD,     0>;
626 def : ReadAdvance<ReadST,      0>;
628 //===----------------------------------------------------------------------===//
629 // 3. Instruction Tables.
631 //---
632 // 3.1 Branch Instructions
633 //---
635 // Branch, immed
636 // Branch and link, immed
637 // Compare and branch
638 def : WriteRes<WriteBr,      [THX3T110I23]> {
639   let Latency = 1;
640   let NumMicroOps = 2;
643 // Branch, register
644 // Branch and link, register != LR
645 // Branch and link, register = LR
646 def : WriteRes<WriteBrReg,   [THX3T110I23]> {
647   let Latency = 1;
648   let NumMicroOps = 2;
651 def : WriteRes<WriteSys,     []> { let Latency = 1; }
652 def : WriteRes<WriteBarrier, []> { let Latency = 1; }
653 def : WriteRes<WriteHint,    []> { let Latency = 1; }
655 def : WriteRes<WriteAtomic,  []> {
656   let Latency = 4;
657   let NumMicroOps = 2;
660 //---
661 // Branch
662 //---
663 def : InstRW<[THX3T110Write_1Cyc_I23], (instrs B, BL, BR, BLR)>;
664 def : InstRW<[THX3T110Write_1Cyc_I23], (instrs Bcc)>;
665 def : InstRW<[THX3T110Write_1Cyc_I23], (instrs RET)>;
666 def : InstRW<[THX3T110Write_1Cyc_I23],
667             (instrs CBZW, CBZX, CBNZW, CBNZX, TBZW, TBZX, TBNZW, TBNZX)>;
669 //---
670 // 3.2 Arithmetic and Logical Instructions
671 // 3.3 Move and Shift Instructions
672 //---
675 // ALU, basic
676 // Conditional compare
677 // Conditional select
678 // Address generation
679 def : WriteRes<WriteI,       [THX3T110I0123]> {
680   let Latency = 1;
681   let ReleaseAtCycles = [1];
682   let NumMicroOps = 2;
685 def : InstRW<[WriteI],
686             (instregex "ADD?(W|X)r(i|r|s|x)",   "ADDS?(W|X)r(i|r|s|x)(64)?",
687                        "AND?(W|X)r(i|r|s|x)",   "ANDS?(W|X)r(i|r|s|x)",
688                        "ADC(W|X)r",
689                        "BIC?(W|X)r(i|r|s|x)",   "BICS?(W|X)r(i|r|s|x)",
690                        "EON?(W|X)r(i|r|s|x)",   "ORN?(W|X)r(i|r|s|x)",
691                        "ORR?(W|X)r(i|r|s|x)",   "SUB?(W|X)r(i|r|s|x)",
692                        "SUBS?(W|X)r(i|r|s|x)",  "SBC(W|X)r",
693                        "SBCS(W|X)r",            "CCMN(W|X)(i|r)",
694                        "CCMP(W|X)(i|r)",        "CSEL(W|X)r",
695                        "CSINC(W|X)r",           "CSINV(W|X)r",
696                        "CSNEG(W|X)r")>;
698 def : InstRW<[WriteI], (instrs COPY)>;
700 // ALU, extend and/or shift
701 def : WriteRes<WriteISReg,   [THX3T110I0123]> {
702   let Latency = 2;
703   let ReleaseAtCycles = [2];
704   let NumMicroOps = 2;
707 def : InstRW<[WriteISReg],
708             (instregex "ADD?(W|X)r(i|r|s|x)",   "ADDS?(W|X)r(i|r|s|x)(64)?",
709                        "AND?(W|X)r(i|r|s|x)",   "ANDS?(W|X)r(i|r|s|x)",
710                        "ADC(W|X)r",
711                        "BIC?(W|X)r(i|r|s|x)",   "BICS?(W|X)r(i|r|s|x)",
712                        "EON?(W|X)r(i|r|s|x)",   "ORN?(W|X)r(i|r|s|x)",
713                        "ORR?(W|X)r(i|r|s|x)",   "SUB?(W|X)r(i|r|s|x)",
714                        "SUBS?(W|X)r(i|r|s|x)",  "SBC(W|X)r",
715                        "SBCS(W|X)r",            "CCMN(W|X)(i|r)",
716                        "CCMP(W|X)(i|r)",        "CSEL(W|X)r",
717                        "CSINC(W|X)r",           "CSINV(W|X)r",
718                        "CSNEG(W|X)r")>;
720 def : WriteRes<WriteIEReg,   [THX3T110I0123]> {
721   let Latency = 1;
722   let ReleaseAtCycles = [1];
723   let NumMicroOps = 2;
726 def : InstRW<[WriteIEReg],
727             (instregex "ADD?(W|X)r(i|r|s|x)",   "ADDS?(W|X)r(i|r|s|x)(64)?",
728                        "AND?(W|X)r(i|r|s|x)",   "ANDS?(W|X)r(i|r|s|x)",
729                        "ADC(W|X)r",
730                        "BIC?(W|X)r(i|r|s|x)",   "BICS?(W|X)r(i|r|s|x)",
731                        "EON?(W|X)r(i|r|s|x)",   "ORN?(W|X)r(i|r|s|x)",
732                        "ORR?(W|X)r(i|r|s|x)",   "SUB?(W|X)r(i|r|s|x)",
733                        "SUBS?(W|X)r(i|r|s|x)",  "SBC(W|X)r",
734                        "SBCS(W|X)r",            "CCMN(W|X)(i|r)",
735                        "CCMP(W|X)(i|r)",        "CSEL(W|X)r",
736                        "CSINC(W|X)r",           "CSINV(W|X)r",
737                        "CSNEG(W|X)r")>;
739 // Move immed
740 def : WriteRes<WriteImm,     [THX3T110I0123]> {
741   let Latency = 1;
742   let NumMicroOps = 2;
745 def : InstRW<[THX3T110Write_1Cyc_I0123],
746             (instrs MOVKWi, MOVKXi, MOVNWi, MOVNXi, MOVZWi, MOVZXi)>;
748 def : InstRW<[THX3T110Write_1Cyc_I0123],
749             (instrs ASRVWr, ASRVXr, LSLVWr, LSLVXr, RORVWr, RORVXr)>;
751 // Variable shift
752 def : WriteRes<WriteIS,      [THX3T110I0123]> {
753   let Latency = 1;
754   let NumMicroOps = 2;
757 //---
758 // 3.4 Divide and Multiply Instructions
759 //---
761 // Divide, W-form
762 // Latency range of 13-23/13-39.
763 def : WriteRes<WriteID32,    [THX3T110I1]> {
764   let Latency = 39;
765   let ReleaseAtCycles = [39];
766   let NumMicroOps = 4;
769 // Divide, X-form
770 def : WriteRes<WriteID64,    [THX3T110I1]> {
771   let Latency = 23;
772   let ReleaseAtCycles = [23];
773   let NumMicroOps = 4;
776 // Multiply accumulate, W-form
777 def : WriteRes<WriteIM32,    [THX3T110I0123]> {
778   let Latency = 5;
779   let NumMicroOps = 3;
782 // Multiply accumulate, X-form
783 def : WriteRes<WriteIM64,    [THX3T110I0123]> {
784   let Latency = 5;
785   let NumMicroOps = 3;
788 //def : InstRW<[WriteIM32, ReadIM, ReadIM, ReadIMA, THX3T110Write_5Cyc_I012],
789 //             (instrs MADDWrrr, MSUBWrrr)>;
790 def : InstRW<[WriteIM32], (instrs MADDWrrr, MSUBWrrr)>;
791 def : InstRW<[WriteIM32], (instrs MADDXrrr, MSUBXrrr)>;
792 def : InstRW<[THX3T110Write_5Cyc_I0123],
793             (instregex "(S|U)(MADDL|MSUBL)rrr")>;
795 def : InstRW<[WriteID32], (instrs SDIVWr, UDIVWr)>;
796 def : InstRW<[WriteID64], (instrs SDIVXr, UDIVXr)>;
798 // Bitfield extract, two reg
799 def : WriteRes<WriteExtr,    [THX3T110I0123]> {
800   let Latency = 1;
801   let NumMicroOps = 2;
804 // Multiply high
805 def : InstRW<[THX3T110Write_4Cyc_I1], (instrs SMULHrr, UMULHrr)>;
807 // Miscellaneous Data-Processing Instructions
808 // Bitfield extract
809 def : InstRW<[THX3T110Write_1Cyc_I0123], (instrs EXTRWrri, EXTRXrri)>;
811 // Bitifield move - basic
812 def : InstRW<[THX3T110Write_1Cyc_I0123],
813             (instrs SBFMWri, SBFMXri, UBFMWri, UBFMXri)>;
815 // Bitfield move, insert
816 def : InstRW<[THX3T110Write_1Cyc_I0123], (instregex "^BFM")>;
817 def : InstRW<[THX3T110Write_1Cyc_I0123], (instregex "(S|U)?BFM.*")>;
819 // Count leading
820 def : InstRW<[THX3T110Write_3_4Cyc_F23_F0123],
821             (instregex "^CLS(W|X)r$", "^CLZ(W|X)r$")>;
823 // Reverse bits
824 def : InstRW<[THX3T110Write_3_4Cyc_F23_F0123], (instrs RBITWr, RBITXr)>;
826 // Cryptography Extensions
827 def : InstRW<[THX3T110Write_4Cyc_F0123], (instregex "^AES[DE]")>;
828 def : InstRW<[THX3T110Write_4Cyc_F0123], (instregex "^AESI?MC")>;
829 def : InstRW<[THX3T110Write_4Cyc_F0123], (instregex "^PMULL")>;
830 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^SHA1SU0")>;
831 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^SHA1(H|SU1)")>;
832 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^SHA1[CMP]")>;
833 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^SHA256SU0")>;
834 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^SHA256(H|H2|SU1)")>;
836 // CRC Instructions
837 // def : InstRW<[THX3T110Write_4Cyc_I1], (instregex "^CRC32", "^CRC32C")>;
838 def : InstRW<[THX3T110Write_4Cyc_I1],
839             (instrs CRC32Brr, CRC32Hrr, CRC32Wrr, CRC32Xrr)>;
841 def : InstRW<[THX3T110Write_4Cyc_I1],
842             (instrs CRC32CBrr, CRC32CHrr, CRC32CWrr, CRC32CXrr)>;
844 // Reverse bits/bytes
845 // NOTE: Handled by WriteI.
847 //---
848 // 3.6 Load Instructions
849 // 3.10 FP Load Instructions
850 //---
852 // Load register, literal
853 // Load register, unscaled immed
854 // Load register, immed unprivileged
855 // Load register, unsigned immed
856 def : WriteRes<WriteLD,      [THX3T110LS]> {
857   let Latency = 4;
858   let NumMicroOps = 4;
861 // Load register, immed post-index
862 // NOTE: Handled by WriteLD, WriteI.
863 // Load register, immed pre-index
864 // NOTE: Handled by WriteLD, WriteAdr.
865 def : WriteRes<WriteAdr,     [THX3T110I0123]> {
866   let Latency = 1;
867   let NumMicroOps = 2;
870 // Load pair, immed offset, normal
871 // Load pair, immed offset, signed words, base != SP
872 // Load pair, immed offset signed words, base = SP
873 // LDP only breaks into *one* LS micro-op.  Thus
874 // the resources are handled by WriteLD.
875 def : WriteRes<WriteLDHi,    []> {
876   let Latency = 4;
877   let NumMicroOps = 4;
880 // Load register offset, basic
881 // Load register, register offset, scale by 4/8
882 // Load register, register offset, scale by 2
883 // Load register offset, extend
884 // Load register, register offset, extend, scale by 4/8
885 // Load register, register offset, extend, scale by 2
886 def THX3T110WriteLDIdx : SchedWriteVariant<[
887   SchedVar<ScaledIdxPred, [THX3T110Write_4Cyc_LS01_I0123_I0123]>,
888   SchedVar<NoSchedPred,   [THX3T110Write_4Cyc_LS01_I0123]>]>;
889 def : SchedAlias<WriteLDIdx, THX3T110WriteLDIdx>;
891 def THX3T110ReadAdrBase : SchedReadVariant<[
892   SchedVar<ScaledIdxPred, [ReadDefault]>,
893   SchedVar<NoSchedPred,   [ReadDefault]>]>;
894 def : SchedAlias<ReadAdrBase, THX3T110ReadAdrBase>;
896 // Load pair, immed pre-index, normal
897 // Load pair, immed pre-index, signed words
898 // Load pair, immed post-index, normal
899 // Load pair, immed post-index, signed words
900 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDNPDi)>;
901 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDNPQi)>;
902 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDNPSi)>;
903 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDNPWi)>;
904 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDNPXi)>;
906 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDPDi)>;
907 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDPQi)>;
908 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDPSi)>;
909 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDPSWi)>;
910 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDPWi)>;
911 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, WriteLDHi], (instrs LDPXi)>;
913 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDRBui)>;
914 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDRDui)>;
915 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDRHui)>;
916 def : InstRW<[THX3T110Write_5Cyc_LS01], (instrs LDRQui)>;
917 def : InstRW<[THX3T110Write_5Cyc_LS01], (instrs LDRSui)>;
919 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDRDl)>;
920 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDRQl)>;
921 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDRWl)>;
922 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDRXl)>;
924 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDTRBi)>;
925 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDTRHi)>;
926 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDTRWi)>;
927 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDTRXi)>;
929 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDTRSBWi)>;
930 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDTRSBXi)>;
931 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDTRSHWi)>;
932 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDTRSHXi)>;
933 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDTRSWi)>;
935 def : InstRW<[THX3T110Write_5Cyc_LS01_I0123, WriteLDHi, WriteAdr],
936             (instrs LDPDpre)>;
937 def : InstRW<[THX3T110Write_5Cyc_LS01_I0123, WriteLDHi, WriteAdr],
938             (instrs LDPQpre)>;
939 def : InstRW<[THX3T110Write_5Cyc_LS01_I0123, WriteLDHi, WriteAdr],
940             (instrs LDPSpre)>;
941 def : InstRW<[THX3T110Write_5Cyc_LS01_I0123, WriteLDHi, WriteAdr],
942             (instrs LDPWpre)>;
943 def : InstRW<[THX3T110Write_5Cyc_LS01_I0123, WriteLDHi, WriteAdr],
944             (instrs LDPWpre)>;
946 def : InstRW<[THX3T110Write_4Cyc_LS01, WriteAdr],
947             (instrs LDRBpre, LDRDpre, LDRHpre, LDRQpre,
948                     LDRSpre, LDRWpre, LDRXpre,
949                     LDRSBWpre, LDRSBXpre, LDRSBWpost, LDRSBXpost,
950                     LDRSHWpre, LDRSHXpre, LDRSHWpost, LDRSHXpost,
951                     LDRBBpre, LDRBBpost, LDRHHpre, LDRHHpost)>;
953 def : InstRW<[THX3T110Write_5Cyc_LS01_I0123, WriteLDHi, WriteAdr],
954             (instrs LDPDpost, LDPQpost, LDPSpost, LDPWpost, LDPXpost)>;
956 def : InstRW<[THX3T110Write_5Cyc_LS01_I0123, WriteI],
957             (instrs LDRBpost, LDRDpost, LDRHpost,
958                     LDRQpost, LDRSpost, LDRWpost, LDRXpost)>;
960 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123_I0123, WriteLDHi, WriteAdr],
961             (instrs LDPDpre, LDPQpre, LDPSpre, LDPWpre, LDPXpre)>;
963 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123_I0123, WriteAdr],
964             (instrs LDRBpre, LDRDpre, LDRHpre, LDRQpre,
965                     LDRSpre, LDRWpre, LDRXpre)>;
967 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123_I0123, WriteLDHi, WriteAdr],
968             (instrs LDPDpost, LDPQpost, LDPSpost, LDPWpost, LDPXpost)>;
970 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123_I0123, WriteI],
971             (instrs LDRBpost, LDRDpost, LDRHpost, LDRQpost,
972                     LDRSpost, LDRWpost, LDRXpost)>;
974 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRBroW)>;
975 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRDroW)>;
976 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRHroW)>;
977 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRHHroW)>;
978 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRQroW)>;
979 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRSroW)>;
980 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRSHWroW)>;
981 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRSHXroW)>;
982 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRWroW)>;
983 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRXroW)>;
985 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRBroX)>;
986 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRDroX)>;
987 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRHHroX)>;
988 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRHroX)>;
989 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRQroX)>;
990 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRSroX)>;
991 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRSHWroX)>;
992 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRSHXroX)>;
993 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRWroX)>;
994 def : InstRW<[THX3T110Write_4Cyc_LS01_I0123, ReadAdrBase], (instrs LDRXroX)>;
996 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURBi)>;
997 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURBBi)>;
998 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURDi)>;
999 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURHi)>;
1000 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURHHi)>;
1001 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURQi)>;
1002 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURSi)>;
1003 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURXi)>;
1004 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURSBWi)>;
1005 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURSBXi)>;
1006 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURSHWi)>;
1007 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURSHXi)>;
1008 def : InstRW<[THX3T110Write_4Cyc_LS01], (instrs LDURSWi)>;
1010 // Load exclusive
1011 def : InstRW<[THX3T110Write_4Cyc_LS01], (instregex "^LDAR(B|H|W|X)$")>;
1012 def : InstRW<[THX3T110Write_4Cyc_LS01], (instregex "^LDAXR(B|H|W|X)$")>;
1013 def : InstRW<[THX3T110Write_4Cyc_LS01], (instregex "^LDXR(B|H|W|X)$")>;
1014 def : InstRW<[THX3T110Write_4Cyc_LS01], (instregex "^LDAXP(W|X)$")>;
1015 def : InstRW<[THX3T110Write_4Cyc_LS01], (instregex "^LDXP(W|X)$")>;
1017 //---
1018 // Prefetch
1019 //---
1020 def : InstRW<[THX3T110Write_6Cyc_LS01_I012], (instrs PRFMl)>;
1021 def : InstRW<[THX3T110Write_6Cyc_LS01_I012], (instrs PRFUMi)>;
1022 def : InstRW<[THX3T110Write_6Cyc_LS01_I012], (instrs PRFMui)>;
1023 def : InstRW<[THX3T110Write_6Cyc_LS01_I012], (instrs PRFMroW)>;
1024 def : InstRW<[THX3T110Write_6Cyc_LS01_I012], (instrs PRFMroX)>;
1026 //--
1027 // 3.7 Store Instructions
1028 // 3.11 FP Store Instructions
1029 //--
1031 // Store register, unscaled immed
1032 // Store register, immed unprivileged
1033 // Store register, unsigned immed
1034 def : WriteRes<WriteST,      [THX3T110LS, THX3T110SD]> {
1035   let Latency = 1;
1036   let NumMicroOps = 2;
1039 // Store register, immed post-index
1040 // NOTE: Handled by WriteAdr, WriteST, ReadAdrBase
1042 // Store register, immed pre-index
1043 // NOTE: Handled by WriteAdr, WriteST
1045 // Store register, register offset, basic
1046 // Store register, register offset, scaled by 4/8
1047 // Store register, register offset, scaled by 2
1048 // Store register, register offset, extend
1049 // Store register, register offset, extend, scale by 4/8
1050 // Store register, register offset, extend, scale by 1
1051 def : WriteRes<WriteSTIdx, [THX3T110LS, THX3T110SD, THX3T110I0123]> {
1052   let Latency = 1;
1053   let NumMicroOps = 2;
1056 // Store pair, immed offset, W-form
1057 // Store pair, immed offset, X-form
1058 def : WriteRes<WriteSTP,     [THX3T110LS, THX3T110SD]> {
1059   let Latency = 1;
1060   let NumMicroOps = 2;
1063 // Store pair, immed post-index, W-form
1064 // Store pair, immed post-index, X-form
1065 // Store pair, immed pre-index, W-form
1066 // Store pair, immed pre-index, X-form
1067 // NOTE: Handled by WriteAdr, WriteSTP.
1068 def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STURBi)>;
1069 def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STURBBi)>;
1070 def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STURDi)>;
1071 def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STURHi)>;
1072 def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STURHHi)>;
1073 def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STURQi)>;
1074 def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STURSi)>;
1075 def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STURWi)>;
1076 def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STURXi)>;
1078 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_SD], (instrs STTRBi)>;
1079 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_SD], (instrs STTRHi)>;
1080 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_SD], (instrs STTRWi)>;
1081 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_SD], (instrs STTRXi)>;
1083 def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STNPDi)>;
1084 def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STNPQi)>;
1085 def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STNPXi)>;
1086 def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STNPWi)>;
1088 def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STPDi)>;
1089 def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STPQi)>;
1090 def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STPXi)>;
1091 def : InstRW<[THX3T110Write_1Cyc_LS01_SD], (instrs STPWi)>;
1093 def : InstRW<[THX3T110Write_1Cyc_LS01_I0123], (instrs STRBui)>;
1094 def : InstRW<[THX3T110Write_1Cyc_LS01_I0123], (instrs STRDui)>;
1095 def : InstRW<[THX3T110Write_1Cyc_LS01_I0123], (instrs STRHui)>;
1096 def : InstRW<[THX3T110Write_1Cyc_LS01_I0123], (instrs STRQui)>;
1097 def : InstRW<[THX3T110Write_1Cyc_LS01_I0123], (instrs STRXui)>;
1098 def : InstRW<[THX3T110Write_1Cyc_LS01_I0123], (instrs STRWui)>;
1100 def : InstRW<[WriteSTP, THX3T110Write_1Cyc_LS01_SD], (instrs STRBui)>;
1101 def : InstRW<[WriteSTP, THX3T110Write_1Cyc_LS01_SD], (instrs STRDui)>;
1102 def : InstRW<[WriteSTP, THX3T110Write_1Cyc_LS01_SD], (instrs STRHui)>;
1103 def : InstRW<[WriteSTP, THX3T110Write_1Cyc_LS01_SD], (instrs STRQui)>;
1104 def : InstRW<[WriteSTP, THX3T110Write_1Cyc_LS01_SD], (instrs STRXui)>;
1105 def : InstRW<[WriteSTP, THX3T110Write_1Cyc_LS01_SD], (instrs STRWui)>;
1107 def : InstRW<[WriteSTIdx, THX3T110Write_1Cyc_LS01_SD_I0123], (instrs STRBui)>;
1108 def : InstRW<[WriteSTIdx, THX3T110Write_1Cyc_LS01_SD_I0123], (instrs STRDui)>;
1109 def : InstRW<[WriteSTIdx, THX3T110Write_1Cyc_LS01_SD_I0123], (instrs STRHui)>;
1110 def : InstRW<[WriteSTIdx, THX3T110Write_1Cyc_LS01_SD_I0123], (instrs STRQui)>;
1111 def : InstRW<[WriteSTIdx, THX3T110Write_1Cyc_LS01_SD_I0123], (instrs STRXui)>;
1112 def : InstRW<[WriteSTIdx, THX3T110Write_1Cyc_LS01_SD_I0123], (instrs STRWui)>;
1114 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123],
1115             (instrs STPDpre, STPDpost)>;
1116 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1117             (instrs STPDpre, STPDpost)>;
1118 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123],
1119             (instrs STPQpre, STPQpost)>;
1120 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1121             (instrs STPQpre, STPQpost)>;
1122 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123],
1123             (instrs STPSpre, STPSpost)>;
1124 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1125             (instrs STPSpre, STPSpost)>;
1126 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123],
1127             (instrs STPWpre, STPWpost)>;
1128 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1129             (instrs STPWpre, STPWpost)>;
1130 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123],
1131             (instrs STPXpre, STPXpost)>;
1132 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1133             (instrs STPXpre, STPXpost)>;
1134 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123],
1135             (instrs STRBpre, STRBpost)>;
1136 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1137             (instrs STRBpre, STRBpost)>;
1138 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123],
1139             (instrs STRBBpre, STRBBpost)>;
1140 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1141             (instrs STRBBpre, STRBBpost)>;
1142 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123],
1143             (instrs STRDpre, STRDpost)>;
1144 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1145             (instrs STRDpre, STRDpost)>;
1146 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123],
1147             (instrs STRHpre, STRHpost)>;
1148 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1149             (instrs STRHpre, STRHpost)>;
1150 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123],
1151             (instrs STRHHpre, STRHHpost)>;
1152 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1153             (instrs STRHHpre, STRHHpost)>;
1154 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123],
1155             (instrs STRQpre, STRQpost)>;
1156 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1157             (instrs STRQpre, STRQpost)>;
1158 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123],
1159             (instrs STRSpre, STRSpost)>;
1160 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1161             (instrs STRSpre, STRSpost)>;
1162 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123],
1163             (instrs STRWpre, STRWpost)>;
1164 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1165             (instrs STRWpre, STRWpost)>;
1166 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123],
1167             (instrs STRXpre, STRXpost)>;
1168 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1169             (instrs STRXpre, STRXpost)>;
1170 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1171             (instrs STRBroW, STRBroX)>;
1172 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1173             (instrs STRBBroW, STRBBroX)>;
1174 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1175             (instrs STRDroW, STRDroX)>;
1176 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1177             (instrs STRHroW, STRHroX)>;
1178 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1179             (instrs STRHHroW, STRHHroX)>;
1180 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1181             (instrs STRQroW, STRQroX)>;
1182 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1183             (instrs STRSroW, STRSroX)>;
1184 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1185             (instrs STRWroW, STRWroX)>;
1186 def : InstRW<[WriteAdr, THX3T110Write_1Cyc_LS01_I0123, ReadAdrBase],
1187             (instrs STRXroW, STRXroX)>;
1189 // Store exclusive
1190 def : InstRW<[THX3T110Write_4Cyc_LS01_SD], (instrs STNPWi, STNPXi)>;
1191 def : InstRW<[THX3T110Write_4Cyc_LS01_SD], (instregex "^STLR(B|H|W|X)$")>;
1192 def : InstRW<[THX3T110Write_4Cyc_LS01_SD], (instregex "^STXP(W|X)$")>;
1193 def : InstRW<[THX3T110Write_4Cyc_LS01_SD], (instregex "^STXR(B|H|W|X)$")>;
1194 def : InstRW<[THX3T110Write_4Cyc_LS01_SD], (instregex "^STLXP(W|X)$")>;
1195 def : InstRW<[THX3T110Write_4Cyc_LS01_SD], (instregex "^STLXR(B|H|W|X)$")>;
1197 //---
1198 // 3.8 FP Data Processing Instructions
1199 //---
1201 // FP absolute value
1202 // FP min/max
1203 // FP negate
1204 def : WriteRes<WriteF,       [THX3T110FP0123]> {
1205   let Latency = 5;
1206   let NumMicroOps = 2;
1209 // FP arithmetic
1210 def : InstRW<[THX3T110Write_6Cyc_F01], (instregex "^FADD", "^FSUB")>;
1212 // FP compare
1213 def : WriteRes<WriteFCmp,    [THX3T110FP0123]> {
1214   let Latency = 5;
1215   let NumMicroOps = 2;
1218 // FP Mul, Div, Sqrt
1219 def : WriteRes<WriteFDiv, [THX3T110FP0123]> {
1220   let Latency = 22;
1221   let ReleaseAtCycles = [19];
1224 def THX3T110XWriteFDiv : SchedWriteRes<[THX3T110FP0123]> {
1225   let Latency = 16;
1226   let ReleaseAtCycles = [8];
1227   let NumMicroOps = 4;
1230 def THX3T110XWriteFDivSP : SchedWriteRes<[THX3T110FP0123]> {
1231   let Latency = 16;
1232   let ReleaseAtCycles = [8];
1233   let NumMicroOps = 4;
1236 def THX3T110XWriteFDivDP : SchedWriteRes<[THX3T110FP0123]> {
1237   let Latency = 23;
1238   let ReleaseAtCycles = [12];
1239   let NumMicroOps = 4;
1242 def THX3T110XWriteFSqrtSP : SchedWriteRes<[THX3T110FP0123]> {
1243   let Latency = 16;
1244   let ReleaseAtCycles = [8];
1245   let NumMicroOps = 4;
1248 def THX3T110XWriteFSqrtDP : SchedWriteRes<[THX3T110FP0123]> {
1249   let Latency = 23;
1250   let ReleaseAtCycles = [12];
1251   let NumMicroOps = 4;
1254 // FP divide, S-form
1255 // FP square root, S-form
1256 def : InstRW<[THX3T110XWriteFDivSP], (instrs FDIVSrr)>;
1257 def : InstRW<[THX3T110XWriteFSqrtSP], (instrs FSQRTSr)>;
1258 def : InstRW<[THX3T110XWriteFDivSP], (instregex "^FDIVv.*32$")>;
1259 def : InstRW<[THX3T110XWriteFSqrtSP], (instregex "^.*SQRT.*32$")>;
1260 def : InstRW<[THX3T110Write_16Cyc_F01], (instregex "^FDIVSrr", "^FSQRTSr")>;
1262 // FP divide, D-form
1263 // FP square root, D-form
1264 def : InstRW<[THX3T110XWriteFDivDP], (instrs FDIVDrr)>;
1265 def : InstRW<[THX3T110XWriteFSqrtDP], (instrs FSQRTDr)>;
1266 def : InstRW<[THX3T110XWriteFDivDP], (instregex "^FDIVv.*64$")>;
1267 def : InstRW<[THX3T110XWriteFSqrtDP], (instregex "^.*SQRT.*64$")>;
1268 def : InstRW<[THX3T110Write_23Cyc_F01], (instregex "^FDIVDrr", "^FSQRTDr")>;
1270 // FP multiply
1271 // FP multiply accumulate
1272 def : WriteRes<WriteFMul, [THX3T110FP0123]> {
1273   let Latency = 6;
1274   let ReleaseAtCycles = [2];
1275   let NumMicroOps = 3;
1278 def THX3T110XWriteFMul : SchedWriteRes<[THX3T110FP0123]> {
1279   let Latency = 6;
1280   let ReleaseAtCycles = [2];
1281   let NumMicroOps = 3;
1284 def THX3T110XWriteFMulAcc : SchedWriteRes<[THX3T110FP0123]> {
1285   let Latency = 6;
1286   let ReleaseAtCycles = [2];
1287   let NumMicroOps = 3;
1290 def : InstRW<[THX3T110XWriteFMul], (instregex "^FMUL", "^FNMUL")>;
1291 def : InstRW<[THX3T110XWriteFMulAcc],
1292             (instregex "^FMADD", "^FMSUB", "^FNMADD", "^FNMSUB")>;
1294 // FP round to integral
1295 def : InstRW<[THX3T110Write_7Cyc_F01],
1296             (instregex "^FRINT(A|I|M|N|P|X|Z)(Sr|Dr)")>;
1298 // FP select
1299 def : InstRW<[THX3T110Write_3_4Cyc_F23_F0123], (instregex "^FCSEL")>;
1301 //---
1302 // 3.9 FP Miscellaneous Instructions
1303 //---
1305 // FP convert, from vec to vec reg
1306 // FP convert, from gen to vec reg
1307 // FP convert, from vec to gen reg
1308 def : WriteRes<WriteFCvt, [THX3T110FP0123]> {
1309   let Latency = 7;
1310   let NumMicroOps = 3;
1313 // FP move, immed
1314 // FP move, register
1315 def : WriteRes<WriteFImm, [THX3T110FP0123]> {
1316   let Latency = 4;
1317   let NumMicroOps = 2;
1320 // FP transfer, from gen to vec reg
1321 // FP transfer, from vec to gen reg
1322 def : WriteRes<WriteFCopy, [THX3T110FP0123]> {
1323   let Latency = 4;
1324   let NumMicroOps = 2;
1327 def : InstRW<[THX3T110Write_5Cyc_F01], (instrs FMOVXDHighr, FMOVDXHighr)>;
1329 //---
1330 // 3.12 ASIMD Integer Instructions
1331 //---
1333 // ASIMD absolute diff, D-form
1334 // ASIMD absolute diff, Q-form
1335 // ASIMD absolute diff accum, D-form
1336 // ASIMD absolute diff accum, Q-form
1337 // ASIMD absolute diff accum long
1338 // ASIMD absolute diff long
1339 // ASIMD arith, basic
1340 // ASIMD arith, complex
1341 // ASIMD compare
1342 // ASIMD logical (AND, BIC, EOR)
1343 // ASIMD max/min, basic
1344 // ASIMD max/min, reduce, 4H/4S
1345 // ASIMD max/min, reduce, 8B/8H
1346 // ASIMD max/min, reduce, 16B
1347 // ASIMD multiply, D-form
1348 // ASIMD multiply, Q-form
1349 // ASIMD multiply accumulate long
1350 // ASIMD multiply accumulate saturating long
1351 // ASIMD multiply long
1352 // ASIMD pairwise add and accumulate
1353 // ASIMD shift accumulate
1354 // ASIMD shift by immed, basic
1355 // ASIMD shift by immed and insert, basic, D-form
1356 // ASIMD shift by immed and insert, basic, Q-form
1357 // ASIMD shift by immed, complex
1358 // ASIMD shift by register, basic, D-form
1359 // ASIMD shift by register, basic, Q-form
1360 // ASIMD shift by register, complex, D-form
1361 // ASIMD shift by register, complex, Q-form
1362 def : WriteRes<WriteVd, [THX3T110FP0123]> {
1363   let Latency = 5;
1364   let NumMicroOps = 4;
1365   let ReleaseAtCycles = [4];
1367 def : WriteRes<WriteVq, [THX3T110FP0123]> {
1368   let Latency = 5;
1369   let NumMicroOps = 4;
1370   let ReleaseAtCycles = [4];
1373 // ASIMD arith, reduce, 4H/4S
1374 // ASIMD arith, reduce, 8B/8H
1375 // ASIMD arith, reduce, 16B
1377 // ASIMD logical (MVN (alias for NOT), ORN, ORR)
1378 def : InstRW<[THX3T110Write_5Cyc_F0123],
1379             (instregex "^ANDv", "^BICv", "^EORv", "^ORRv", "^ORNv", "^NOTv")>;
1381 // ASIMD arith, reduce
1382 def : InstRW<[THX3T110Write_5Cyc_F0123],
1383             (instregex "^ADDVv", "^SADDLVv", "^UADDLVv")>;
1385 // ASIMD polynomial (8x8) multiply long
1386 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^(S|U|SQD)MULL")>;
1387 def : InstRW<[THX3T110Write_5Cyc_F0123],
1388             (instregex "(S|U|SQD)(MLAL|MLSL|MULL)v.*")>;
1389 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^PMULL(v8i8|v16i8)")>;
1390 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^PMULL(v1i64|v2i64)")>;
1392 // ASIMD absolute diff accum, D-form
1393 def : InstRW<[THX3T110Write_5Cyc_F0123],
1394             (instregex "^[SU]ABA(v8i8|v4i16|v2i32)$")>;
1395 // ASIMD absolute diff accum, Q-form
1396 def : InstRW<[THX3T110Write_5Cyc_F0123],
1397             (instregex "^[SU]ABA(v16i8|v8i16|v4i32)$")>;
1398 // ASIMD absolute diff accum long
1399 def : InstRW<[THX3T110Write_5Cyc_F0123],
1400             (instregex "^[SU]ABAL")>;
1401 // ASIMD arith, reduce, 4H/4S
1402 def : InstRW<[THX3T110Write_5Cyc_F0123],
1403             (instregex "^[SU]?ADDL?V(v8i8|v4i16|v2i32)v$")>;
1404 // ASIMD arith, reduce, 8B
1405 def : InstRW<[THX3T110Write_5Cyc_F0123],
1406             (instregex "^[SU]?ADDL?V(v8i16|v4i32)v$")>;
1407 // ASIMD arith, reduce, 16B/16H
1408 def : InstRW<[THX3T110Write_10Cyc_F0123],
1409             (instregex "^[SU]?ADDL?Vv16i8v$")>;
1410 // ASIMD max/min, reduce, 4H/4S
1411 def : InstRW<[THX3T110Write_5Cyc_F0123],
1412             (instregex "^[SU](MIN|MAX)V(v4i16|v4i32)v$")>;
1413 // ASIMD max/min, reduce, 8B/8H
1414 def : InstRW<[THX3T110Write_5Cyc_F0123],
1415             (instregex "^[SU](MIN|MAX)V(v8i8|v8i16)v$")>;
1416 // ASIMD max/min, reduce, 16B/16H
1417 def : InstRW<[THX3T110Write_5Cyc_F0123],
1418             (instregex "^[SU](MIN|MAX)Vv16i8v$")>;
1419 // ASIMD multiply, D-form
1420 def : InstRW<[THX3T110Write_5Cyc_F0123],
1421             (instregex "^(P?MUL|SQR?DMULH)" #
1422                        "(v8i8|v4i16|v2i32|v1i8|v1i16|v1i32|v1i64)" #
1423                        "(_indexed)?$")>;
1424 // ASIMD multiply, Q-form
1425 def : InstRW<[THX3T110Write_5Cyc_F0123],
1426             (instregex "^(P?MUL|SQR?DMULH)(v16i8|v8i16|v4i32)(_indexed)?$")>;
1427 // ASIMD multiply accumulate, D-form
1428 def : InstRW<[THX3T110Write_5Cyc_F0123],
1429             (instregex "^ML[AS](v8i8|v4i16|v2i32)(_indexed)?$")>;
1430 // ASIMD multiply accumulate, Q-form
1431 def : InstRW<[THX3T110Write_5Cyc_F0123],
1432             (instregex "^ML[AS](v16i8|v8i16|v4i32)(_indexed)?$")>;
1433 // ASIMD shift accumulate
1434 def : InstRW<[THX3T110Write_5Cyc_F0123],
1435             (instregex "SRSRAv","SSRAv","URSRAv","USRAv")>;
1437 // ASIMD shift by immed, basic
1438 def : InstRW<[THX3T110Write_5Cyc_F0123],
1439             (instregex "RSHRNv","SHRNv", "SQRSHRNv","SQRSHRUNv",
1440                        "SQSHRNv","SQSHRUNv", "UQRSHRNv",
1441                        "UQSHRNv","SQXTNv","SQXTUNv","UQXTNv")>;
1442 // ASIMD shift by immed, complex
1443 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^[SU]?(Q|R){1,2}SHR")>;
1444 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^SQSHLU")>;
1445 // ASIMD shift by register, basic, Q-form
1446 def : InstRW<[THX3T110Write_5Cyc_F01],
1447             (instregex "^[SU]SHL(v16i8|v8i16|v4i32|v2i64)")>;
1448 // ASIMD shift by register, complex, D-form
1449 def : InstRW<[THX3T110Write_5Cyc_F0123],
1450             (instregex "^[SU][QR]{1,2}SHL" #
1451                        "(v1i8|v1i16|v1i32|v1i64|v8i8|v4i16|v2i32|b|d|h|s)")>;
1452 // ASIMD shift by register, complex, Q-form
1453 def : InstRW<[THX3T110Write_5Cyc_F0123],
1454             (instregex "^[SU][QR]{1,2}SHL(v16i8|v8i16|v4i32|v2i64)")>;
1456 // ASIMD Arithmetic
1457 def : InstRW<[THX3T110Write_5Cyc_F0123],
1458             (instregex "(ADD|SUB)(v8i8|v4i16|v2i32|v1i64)")>;
1459 def : InstRW<[THX3T110Write_5Cyc_F0123],
1460             (instregex "(ADD|SUB)(v16i8|v8i16|v4i32|v2i64)")>;
1461 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "(ADD|SUB)HNv.*")>;
1462 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "(RADD|RSUB)HNv.*")>;
1463 def : InstRW<[THX3T110Write_5Cyc_F0123],
1464             (instregex "^SQADD", "^SQNEG", "^SQSUB", "^SRHADD",
1465                        "^SUQADD", "^UQADD", "^UQSUB", "^URHADD", "^USQADD")>;
1466 def : InstRW<[THX3T110Write_5Cyc_F0123],
1467             (instregex "ADDP(v16i8|v8i16|v4i32|v2i64)")>;
1468 def : InstRW<[THX3T110Write_5Cyc_F0123],
1469             (instregex "((AND|ORN|EOR|EON)S?(Xr[rsi]|v16i8|v8i16|v4i32)|" #
1470                        "(ORR|BIC)S?(Xr[rs]|v16i8|v8i16|v4i32))")>;
1471 def : InstRW<[THX3T110Write_5Cyc_F0123],
1472             (instregex "(CLS|CLZ|CNT)(v4i32|v8i16|v16i8)")>;
1473 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^SADALP","^UADALP")>;
1474 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^SADDLPv","^UADDLPv")>;
1475 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^SADDLV","^UADDLV")>;
1476 def : InstRW<[THX3T110Write_5Cyc_F0123],
1477              (instregex "^ADDVv","^SMAXVv","^UMAXVv","^SMINVv","^UMINVv")>;
1478 def : InstRW<[THX3T110Write_5Cyc_F0123],
1479              (instregex "^SABAv","^UABAv","^SABALv","^UABALv")>;
1480 def : InstRW<[THX3T110Write_5Cyc_F0123],
1481             (instregex "^SQADDv","^SQSUBv","^UQADDv","^UQSUBv")>;
1482 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^SUQADDv","^USQADDv")>;
1483 def : InstRW<[THX3T110Write_5Cyc_F0123],
1484             (instregex "^ADDHNv","^RADDHNv", "^RSUBHNv",
1485                        "^SQABS", "^SQADD", "^SQNEG", "^SQSUB",
1486                        "^SRHADD", "^SUBHNv", "^SUQADD",
1487                        "^UQADD", "^UQSUB", "^URHADD", "^USQADD")>;
1488 def : InstRW<[THX3T110Write_5Cyc_F0123],
1489             (instregex "^CMEQv","^CMGEv","^CMGTv",
1490                        "^CMLEv","^CMLTv", "^CMHIv","^CMHSv")>;
1491 def : InstRW<[THX3T110Write_5Cyc_F0123],
1492             (instregex "^SMAXv","^SMINv","^UMAXv","^UMINv",
1493                        "^SMAXPv","^SMINPv","^UMAXPv","^UMINPv")>;
1494 def : InstRW<[THX3T110Write_5Cyc_F0123],
1495             (instregex "^SABDv","^UABDv", "^SABDLv","^UABDLv")>;
1497 //---
1498 // 3.13 ASIMD Floating-point Instructions
1499 //---
1501 // ASIMD FP absolute value
1502 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^FABSv")>;
1504 // ASIMD FP arith, normal, D-form
1505 // ASIMD FP arith, normal, Q-form
1506 def : InstRW<[THX3T110Write_3_4Cyc_F23_F0123],
1507             (instregex "^FABDv", "^FADDv", "^FSUBv")>;
1509 // ASIMD FP arith,pairwise, D-form
1510 // ASIMD FP arith, pairwise, Q-form
1511 def : InstRW<[THX3T110Write_3_4Cyc_F23_F0123], (instregex "^FADDPv")>;
1513 // ASIMD FP compare, D-form
1514 // ASIMD FP compare, Q-form
1515 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^FACGEv", "^FACGTv")>;
1516 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^FCMEQv", "^FCMGEv",
1517                                                  "^FCMGTv", "^FCMLEv",
1518                                                  "^FCMLTv")>;
1520 // ASIMD FP round, D-form
1521 def : InstRW<[THX3T110Write_5Cyc_F0123],
1522             (instregex "^FRINT[AIMNPXZ](v2f32)")>;
1523 // ASIMD FP round, Q-form
1524 def : InstRW<[THX3T110Write_5Cyc_F0123],
1525             (instregex "^FRINT[AIMNPXZ](v4f32|v2f64)")>;
1527 // ASIMD FP convert, long
1528 // ASIMD FP convert, narrow
1529 // ASIMD FP convert, other, D-form
1530 // ASIMD FP convert, other, Q-form
1531 // NOTE: Handled by WriteV.
1533 // ASIMD FP convert, long and narrow
1534 def : InstRW<[THX3T110Write_5Cyc_F01], (instregex "^FCVT(L|N|XN)v")>;
1535 // ASIMD FP convert, other, D-form
1536 def : InstRW<[THX3T110Write_5Cyc_F01],
1537       (instregex "^[FVSU]CVT([AMNPZ][SU])?(_Int)?(v2f32|v1i32|v2i32|v1i64)")>;
1538 // ASIMD FP convert, other, Q-form
1539 def : InstRW<[THX3T110Write_5Cyc_F01],
1540       (instregex "^[FVSU]CVT([AMNPZ][SU])?(_Int)?(v4f32|v2f64|v4i32|v2i64)")>;
1542 // ASIMD FP divide, D-form, F32
1543 def : InstRW<[THX3T110Write_16Cyc_F0123], (instrs FDIVv2f32)>;
1544 def : InstRW<[THX3T110Write_16Cyc_F0123], (instregex "FDIVv2f32")>;
1546 // ASIMD FP divide, Q-form, F32
1547 def : InstRW<[THX3T110Write_16Cyc_F0123], (instrs FDIVv4f32)>;
1548 def : InstRW<[THX3T110Write_16Cyc_F0123], (instregex "FDIVv4f32")>;
1550 // ASIMD FP divide, Q-form, F64
1551 def : InstRW<[THX3T110Write_23Cyc_F0123], (instrs FDIVv2f64)>;
1552 def : InstRW<[THX3T110Write_23Cyc_F0123], (instregex "FDIVv2f64")>;
1554 // ASIMD FP max/min, normal, D-form
1555 // ASIMD FP max/min, normal, Q-form
1556 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^FMAXv", "^FMAXNMv",
1557                                                 "^FMINv", "^FMINNMv")>;
1559 // ASIMD FP max/min, pairwise, D-form
1560 // ASIMD FP max/min, pairwise, Q-form
1561 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^FMAXPv", "^FMAXNMPv",
1562                                                 "^FMINPv", "^FMINNMPv")>;
1564 // ASIMD FP max/min, reduce
1565 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^FMAXVv", "^FMAXNMVv",
1566                                                 "^FMINVv", "^FMINNMVv")>;
1568 // ASIMD FP multiply, D-form, FZ
1569 // ASIMD FP multiply, D-form, no FZ
1570 // ASIMD FP multiply, Q-form, FZ
1571 // ASIMD FP multiply, Q-form, no FZ
1572 def : InstRW<[THX3T110Write_5Cyc_F0123],
1573             (instregex "^FMULv", "^FMULXv")>;
1574 def : InstRW<[THX3T110Write_5Cyc_F0123],
1575             (instregex "^FMULX?(v2f32|v1i32|v2i32|v1i64|32|64)")>;
1576 def : InstRW<[THX3T110Write_5Cyc_F0123],
1577             (instregex "^FMULX?(v4f32|v2f64|v4i32|v2i64)")>;
1579 // ASIMD FP multiply accumulate, Dform, FZ
1580 // ASIMD FP multiply accumulate, Dform, no FZ
1581 // ASIMD FP multiply accumulate, Qform, FZ
1582 // ASIMD FP multiply accumulate, Qform, no FZ
1583 def : InstRW<[THX3T110Write_5Cyc_F0123],
1584             (instregex "^FMLAv", "^FMLSv")>;
1585 def : InstRW<[THX3T110Write_5Cyc_F0123],
1586             (instregex "^FML[AS](v2f32|v1i32|v2i32|v1i64)")>;
1587 def : InstRW<[THX3T110Write_5Cyc_F0123],
1588             (instregex "^FML[AS](v4f32|v2f64|v4i32|v2i64)")>;
1590 // ASIMD FP negate
1591 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^FNEGv")>;
1593 //--
1594 // 3.14 ASIMD Miscellaneous Instructions
1595 //--
1597 // ASIMD bit reverse
1598 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^RBITv")>;
1600 // ASIMD bitwise insert, D-form
1601 // ASIMD bitwise insert, Q-form
1602 def : InstRW<[THX3T110Write_3_4Cyc_F23_F0123],
1603             (instregex "^BIFv", "^BITv", "^BSLv")>;
1605 // ASIMD count, D-form
1606 // ASIMD count, Q-form
1607 def : InstRW<[THX3T110Write_3_4Cyc_F23_F0123],
1608             (instregex "^CLSv", "^CLZv", "^CNTv")>;
1610 // ASIMD duplicate, gen reg
1611 // ASIMD duplicate, element
1612 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^DUPv")>;
1613 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^DUP(i8|i16|i32|i64)$")>;
1614 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^DUPv.+gpr")>;
1616 // ASIMD extract
1617 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^EXTv")>;
1619 // ASIMD extract narrow
1620 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^XTNv")>;
1622 // ASIMD extract narrow, saturating
1623 def : InstRW<[THX3T110Write_5Cyc_F0123],
1624             (instregex "^SQXTNv", "^SQXTUNv", "^UQXTNv")>;
1626 // ASIMD insert, element to element
1627 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^INSv")>;
1629 // ASIMD transfer, element to gen reg
1630 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^[SU]MOVv")>;
1632 // ASIMD move, integer immed
1633 def : InstRW<[THX3T110Write_3_4Cyc_F23_F0123], (instregex "^MOVIv")>;
1635 // ASIMD move, FP immed
1636 def : InstRW<[THX3T110Write_3_4Cyc_F23_F0123], (instregex "^FMOVv")>;
1638 // ASIMD transpose
1639 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^TRN1", "^TRN2")>;
1641 // ASIMD unzip/zip
1642 def : InstRW<[THX3T110Write_5Cyc_F0123],
1643             (instregex "^UZP1", "^UZP2", "^ZIP1", "^ZIP2")>;
1645 // ASIMD reciprocal estimate, D-form
1646 // ASIMD reciprocal estimate, Q-form
1647 def : InstRW<[THX3T110Write_5Cyc_F0123],
1648             (instregex "^FRECPEv", "^FRECPXv", "^URECPEv",
1649                        "^FRSQRTEv", "^URSQRTEv")>;
1651 // ASIMD reciprocal step, D-form, FZ
1652 // ASIMD reciprocal step, D-form, no FZ
1653 // ASIMD reciprocal step, Q-form, FZ
1654 // ASIMD reciprocal step, Q-form, no FZ
1655 def : InstRW<[THX3T110Write_5Cyc_F0123],
1656               (instregex "^FRECPSv", "^FRSQRTSv")>;
1658 // ASIMD reverse
1659 def : InstRW<[THX3T110Write_5Cyc_F0123],
1660             (instregex "^REV16v", "^REV32v", "^REV64v")>;
1662 // ASIMD table lookup, D-form
1663 // ASIMD table lookup, Q-form
1664 def : InstRW<[THX3T110Write_5Cyc_F0123],
1665             (instrs TBLv8i8One, TBLv16i8One, TBXv8i8One, TBXv16i8One)>;
1666 def : InstRW<[THX3T110Write_10Cyc_F0123],
1667             (instrs TBLv8i8Two, TBLv16i8Two, TBXv8i8Two, TBXv16i8Two)>;
1668 def : InstRW<[THX3T110Write_15Cyc_F0123],
1669             (instrs TBLv8i8Three, TBLv16i8Three, TBXv8i8Three, TBXv16i8Three)>;
1670 def : InstRW<[THX3T110Write_20Cyc_F0123],
1671             (instrs TBLv8i8Four, TBLv16i8Four, TBXv8i8Four, TBXv16i8Four)>;
1673 // ASIMD transfer, element to word or word
1674 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^[SU]MOVv")>;
1676 // ASIMD transfer, element to gen reg
1677 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "(S|U)MOVv.*")>;
1679 // ASIMD transfer gen reg to element
1680 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^INSv")>;
1682 // ASIMD transpose
1683 def : InstRW<[THX3T110Write_5Cyc_F0123],
1684               (instregex "^TRN1v", "^TRN2v", "^UZP1v", "^UZP2v")>;
1686 // ASIMD unzip/zip
1687 def : InstRW<[THX3T110Write_5Cyc_F0123], (instregex "^ZIP1v", "^ZIP2v")>;
1689 //--
1690 // 3.15 ASIMD Load Instructions
1691 //--
1693 // ASIMD load, 1 element, multiple, 1 reg, D-form
1694 // ASIMD load, 1 element, multiple, 1 reg, Q-form
1695 def : InstRW<[THX3T110Write_4Cyc_LS01],
1696             (instregex "^LD1Onev(8b|4h|2s|1d|16b|8h|4s|2d)$")>;
1697 def : InstRW<[THX3T110Write_4Cyc_LS01, WriteAdr],
1698             (instregex "^LD1Onev(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>;
1700 // ASIMD load, 1 element, multiple, 2 reg, D-form
1701 // ASIMD load, 1 element, multiple, 2 reg, Q-form
1702 def : InstRW<[THX3T110Write_4Cyc_LS01],
1703             (instregex "^LD1Twov(8b|4h|2s|1d|16b|8h|4s|2d)$")>;
1704 def : InstRW<[THX3T110Write_4Cyc_LS01, WriteAdr],
1705             (instregex "^LD1Twov(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>;
1707 // ASIMD load, 1 element, multiple, 3 reg, D-form
1708 // ASIMD load, 1 element, multiple, 3 reg, Q-form
1709 def : InstRW<[THX3T110Write_5Cyc_LS01],
1710             (instregex "^LD1Threev(8b|4h|2s|1d|16b|8h|4s|2d)$")>;
1711 def : InstRW<[THX3T110Write_5Cyc_LS01, WriteAdr],
1712             (instregex "^LD1Threev(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>;
1714 // ASIMD load, 1 element, multiple, 4 reg, D-form
1715 // ASIMD load, 1 element, multiple, 4 reg, Q-form
1716 def : InstRW<[THX3T110Write_6Cyc_LS01],
1717             (instregex "^LD1Fourv(8b|4h|2s|1d|16b|8h|4s|2d)$")>;
1718 def : InstRW<[THX3T110Write_6Cyc_LS01, WriteAdr],
1719             (instregex "^LD1Fourv(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>;
1721 // ASIMD load, 1 element, one lane, B/H/S
1722 // ASIMD load, 1 element, one lane, D
1723 def : InstRW<[THX3T110Write_5Cyc_LS01_F0123],
1724             (instregex "^LD1i(8|16|32|64)$")>;
1725 def : InstRW<[THX3T110Write_5Cyc_LS01_F0123, WriteAdr],
1726             (instregex "^LD1i(8|16|32|64)_POST$")>;
1728 // ASIMD load, 1 element, all lanes, D-form, B/H/S
1729 // ASIMD load, 1 element, all lanes, D-form, D
1730 // ASIMD load, 1 element, all lanes, Q-form
1731 def : InstRW<[THX3T110Write_5Cyc_LS01_F0123],
1732             (instregex "^LD1Rv(8b|4h|2s|1d|16b|8h|4s|2d)$")>;
1733 def : InstRW<[THX3T110Write_5Cyc_LS01_F0123, WriteAdr],
1734             (instregex "^LD1Rv(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>;
1736 // ASIMD load, 2 element, multiple, D-form, B/H/S
1737 // ASIMD load, 2 element, multiple, Q-form, D
1738 def : InstRW<[THX3T110Write_5Cyc_LS01_F0123],
1739             (instregex "^LD2Twov(8b|4h|2s|16b|8h|4s|2d)$")>;
1740 def : InstRW<[THX3T110Write_5Cyc_LS01_F0123, WriteAdr],
1741             (instregex "^LD2Twov(8b|4h|2s|16b|8h|4s|2d)_POST$")>;
1743 // ASIMD load, 2 element, one lane, B/H
1744 // ASIMD load, 2 element, one lane, S
1745 // ASIMD load, 2 element, one lane, D
1746 def : InstRW<[THX3T110Write_5Cyc_LS01_F0123],
1747             (instregex "^LD2i(8|16|32|64)$")>;
1748 def : InstRW<[THX3T110Write_5Cyc_LS01_F0123, WriteAdr],
1749             (instregex "^LD2i(8|16|32|64)_POST$")>;
1751 // ASIMD load, 2 element, all lanes, D-form, B/H/S
1752 // ASIMD load, 2 element, all lanes, D-form, D
1753 // ASIMD load, 2 element, all lanes, Q-form
1754 def : InstRW<[THX3T110Write_5Cyc_LS01_F0123],
1755             (instregex "^LD2Rv(8b|4h|2s|1d|16b|8h|4s|2d)$")>;
1756 def : InstRW<[THX3T110Write_5Cyc_LS01_F0123, WriteAdr],
1757             (instregex "^LD2Rv(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>;
1759 // ASIMD load, 3 element, multiple, D-form, B/H/S
1760 // ASIMD load, 3 element, multiple, Q-form, B/H/S
1761 // ASIMD load, 3 element, multiple, Q-form, D
1762 def : InstRW<[THX3T110Write_8Cyc_LS01_F0123],
1763             (instregex "^LD3Threev(8b|4h|2s|16b|8h|4s|2d)$")>;
1764 def : InstRW<[THX3T110Write_8Cyc_LS01_F0123, WriteAdr],
1765             (instregex "^LD3Threev(8b|4h|2s|16b|8h|4s|2d)_POST$")>;
1767 // ASIMD load, 3 element, one lone, B/H
1768 // ASIMD load, 3 element, one lane, S
1769 // ASIMD load, 3 element, one lane, D
1770 def : InstRW<[THX3T110Write_7Cyc_LS01_F0123],
1771             (instregex "^LD3i(8|16|32|64)$")>;
1772 def : InstRW<[THX3T110Write_7Cyc_LS01_F0123, WriteAdr],
1773             (instregex "^LD3i(8|16|32|64)_POST$")>;
1775 // ASIMD load, 3 element, all lanes, D-form, B/H/S
1776 // ASIMD load, 3 element, all lanes, D-form, D
1777 // ASIMD load, 3 element, all lanes, Q-form, B/H/S
1778 // ASIMD load, 3 element, all lanes, Q-form, D
1779 def : InstRW<[THX3T110Write_7Cyc_LS01_F0123],
1780             (instregex "^LD3Rv(8b|4h|2s|1d|16b|8h|4s|2d)$")>;
1781 def : InstRW<[THX3T110Write_7Cyc_LS01_F0123, WriteAdr],
1782             (instregex "^LD3Rv(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>;
1784 // ASIMD load, 4 element, multiple, D-form, B/H/S
1785 // ASIMD load, 4 element, multiple, Q-form, B/H/S
1786 // ASIMD load, 4 element, multiple, Q-form, D
1787 def : InstRW<[THX3T110Write_8Cyc_LS01_F0123],
1788             (instregex "^LD4Fourv(8b|4h|2s|16b|8h|4s|2d)$")>;
1789 def : InstRW<[THX3T110Write_8Cyc_LS01_F0123, WriteAdr],
1790             (instregex "^LD4Fourv(8b|4h|2s|16b|8h|4s|2d)_POST$")>;
1792 // ASIMD load, 4 element, one lane, B/H
1793 // ASIMD load, 4 element, one lane, S
1794 // ASIMD load, 4 element, one lane, D
1795 def : InstRW<[THX3T110Write_6Cyc_LS01_F0123],
1796             (instregex "^LD4i(8|16|32|64)$")>;
1797 def : InstRW<[THX3T110Write_6Cyc_LS01_F0123, WriteAdr],
1798             (instregex "^LD4i(8|16|32|64)_POST$")>;
1800 // ASIMD load, 4 element, all lanes, D-form, B/H/S
1801 // ASIMD load, 4 element, all lanes, D-form, D
1802 // ASIMD load, 4 element, all lanes, Q-form, B/H/S
1803 // ASIMD load, 4 element, all lanes, Q-form, D
1804 def : InstRW<[THX3T110Write_6Cyc_LS01_F0123],
1805             (instregex "^LD4Rv(8b|4h|2s|1d|16b|8h|4s|2d)$")>;
1806 def : InstRW<[THX3T110Write_6Cyc_LS01_F0123, WriteAdr],
1807             (instregex "^LD4Rv(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>;
1809 //--
1810 // 3.16 ASIMD Store Instructions
1811 //--
1813 // ASIMD store, 1 element, multiple, 1 reg, D-form
1814 // ASIMD store, 1 element, multiple, 1 reg, Q-form
1815 def : InstRW<[THX3T110Write_1Cyc_LS01],
1816             (instregex "^ST1Onev(8b|4h|2s|1d|16b|8h|4s|2d)$")>;
1817 def : InstRW<[THX3T110Write_1Cyc_LS01, WriteAdr],
1818             (instregex "^ST1Onev(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>;
1820 // ASIMD store, 1 element, multiple, 2 reg, D-form
1821 // ASIMD store, 1 element, multiple, 2 reg, Q-form
1822 def : InstRW<[THX3T110Write_1Cyc_LS01],
1823             (instregex "^ST1Twov(8b|4h|2s|1d|16b|8h|4s|2d)$")>;
1824 def : InstRW<[THX3T110Write_1Cyc_LS01, WriteAdr],
1825             (instregex "^ST1Twov(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>;
1827 // ASIMD store, 1 element, multiple, 3 reg, D-form
1828 // ASIMD store, 1 element, multiple, 3 reg, Q-form
1829 def : InstRW<[THX3T110Write_1Cyc_LS01],
1830             (instregex "^ST1Threev(8b|4h|2s|1d|16b|8h|4s|2d)$")>;
1831 def : InstRW<[THX3T110Write_1Cyc_LS01, WriteAdr],
1832             (instregex "^ST1Threev(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>;
1834 // ASIMD store, 1 element, multiple, 4 reg, D-form
1835 // ASIMD store, 1 element, multiple, 4 reg, Q-form
1836 def : InstRW<[THX3T110Write_1Cyc_LS01],
1837             (instregex "^ST1Fourv(8b|4h|2s|1d|16b|8h|4s|2d)$")>;
1838 def : InstRW<[THX3T110Write_1Cyc_LS01, WriteAdr],
1839             (instregex "^ST1Fourv(8b|4h|2s|1d|16b|8h|4s|2d)_POST$")>;
1841 // ASIMD store, 1 element, one lane, B/H/S
1842 // ASIMD store, 1 element, one lane, D
1843 def : InstRW<[THX3T110Write_1Cyc_LS01_F0123],
1844             (instregex "^ST1i(8|16|32|64)$")>;
1845 def : InstRW<[THX3T110Write_1Cyc_LS01_F0123, WriteAdr],
1846             (instregex "^ST1i(8|16|32|64)_POST$")>;
1848 // ASIMD store, 2 element, multiple, D-form, B/H/S
1849 // ASIMD store, 2 element, multiple, Q-form, B/H/S
1850 // ASIMD store, 2 element, multiple, Q-form, D
1851 def : InstRW<[THX3T110Write_1Cyc_LS01_F0123],
1852             (instregex "^ST2Twov(8b|4h|2s|16b|8h|4s|2d)$")>;
1853 def : InstRW<[THX3T110Write_1Cyc_LS01_F0123, WriteAdr],
1854             (instregex "^ST2Twov(8b|4h|2s|16b|8h|4s|2d)_POST$")>;
1856 // ASIMD store, 2 element, one lane, B/H/S
1857 // ASIMD store, 2 element, one lane, D
1858 def : InstRW<[THX3T110Write_1Cyc_LS01_F0123],
1859             (instregex "^ST2i(8|16|32|64)$")>;
1860 def : InstRW<[THX3T110Write_1Cyc_LS01_F0123, WriteAdr],
1861             (instregex "^ST2i(8|16|32|64)_POST$")>;
1863 // ASIMD store, 3 element, multiple, D-form, B/H/S
1864 // ASIMD store, 3 element, multiple, Q-form, B/H/S
1865 // ASIMD store, 3 element, multiple, Q-form, D
1866 def : InstRW<[THX3T110Write_1Cyc_LS01_F0123],
1867             (instregex "^ST3Threev(8b|4h|2s|16b|8h|4s|2d)$")>;
1868 def : InstRW<[THX3T110Write_1Cyc_LS01_F0123, WriteAdr],
1869             (instregex "^ST3Threev(8b|4h|2s|16b|8h|4s|2d)_POST$")>;
1871 // ASIMD store, 3 element, one lane, B/H
1872 // ASIMD store, 3 element, one lane, S
1873 // ASIMD store, 3 element, one lane, D
1874 def : InstRW<[THX3T110Write_1Cyc_LS01_F0123],
1875             (instregex "^ST3i(8|16|32|64)$")>;
1876 def : InstRW<[THX3T110Write_1Cyc_LS01_F0123, WriteAdr],
1877             (instregex "^ST3i(8|16|32|64)_POST$")>;
1879 // ASIMD store, 4 element, multiple, D-form, B/H/S
1880 // ASIMD store, 4 element, multiple, Q-form, B/H/S
1881 // ASIMD store, 4 element, multiple, Q-form, D
1882 def : InstRW<[THX3T110Write_1Cyc_LS01_F0123],
1883             (instregex "^ST4Fourv(8b|4h|2s|16b|8h|4s|2d)$")>;
1884 def : InstRW<[THX3T110Write_1Cyc_LS01_F0123, WriteAdr],
1885             (instregex "^ST4Fourv(8b|4h|2s|16b|8h|4s|2d)_POST$")>;
1887 // ASIMD store, 4 element, one lane, B/H
1888 // ASIMD store, 4 element, one lane, S
1889 // ASIMD store, 4 element, one lane, D
1890 def : InstRW<[THX3T110Write_1Cyc_LS01_F0123],
1891             (instregex "^ST4i(8|16|32|64)$")>;
1892 def : InstRW<[THX3T110Write_1Cyc_LS01_F0123, WriteAdr],
1893             (instregex "^ST4i(8|16|32|64)_POST$")>;
1895 // V8.1a Atomics (LSE)
1896 def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic],
1897             (instrs CASB, CASH, CASW, CASX)>;
1899 def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic],
1900             (instrs CASAB, CASAH, CASAW, CASAX)>;
1902 def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic],
1903             (instrs CASLB, CASLH, CASLW, CASLX)>;
1905 def : InstRW<[THX3T110Write_8Cyc_I0123, WriteAtomic],
1906             (instrs CASALB, CASALH, CASALW, CASALX)>;
1908 def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic],
1909             (instrs LDLARB, LDLARH, LDLARW, LDLARX)>;
1911 def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic],
1912             (instrs LDADDB, LDADDH, LDADDW, LDADDX)>;
1914 def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic],
1915             (instrs LDADDAB, LDADDAH, LDADDAW, LDADDAX)>;
1917 def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic],
1918             (instrs LDADDLB, LDADDLH, LDADDLW, LDADDLX)>;
1920 def : InstRW<[THX3T110Write_8Cyc_I0123, WriteAtomic],
1921             (instrs LDADDALB, LDADDALH, LDADDALW, LDADDALX)>;
1923 def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic],
1924             (instrs LDCLRB, LDCLRH, LDCLRW, LDCLRX)>;
1926 def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic],
1927             (instrs LDCLRAB, LDCLRAH, LDCLRAW, LDCLRAX)>;
1929 def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic],
1930             (instrs LDCLRLB, LDCLRLH, LDCLRLW, LDCLRLX)>;
1932 def : InstRW<[THX3T110Write_8Cyc_I0123, WriteAtomic],
1933             (instrs LDCLRALB, LDCLRALH, LDCLRALW, LDCLRALX)>;
1935 def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic],
1936             (instrs LDEORB, LDEORH, LDEORW, LDEORX)>;
1938 def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic],
1939             (instrs LDEORAB, LDEORAH, LDEORAW, LDEORAX)>;
1941 def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic],
1942             (instrs LDEORLB, LDEORLH, LDEORLW, LDEORLX)>;
1944 def : InstRW<[THX3T110Write_8Cyc_I0123, WriteAtomic],
1945             (instrs LDEORALB, LDEORALH, LDEORALW, LDEORALX)>;
1947 def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic],
1948             (instrs LDSETB, LDSETH, LDSETW, LDSETX)>;
1950 def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic],
1951             (instrs LDSETAB, LDSETAH, LDSETAW, LDSETAX)>;
1953 def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic],
1954             (instrs LDSETLB, LDSETLH, LDSETLW, LDSETLX)>;
1956 def : InstRW<[THX3T110Write_8Cyc_I0123, WriteAtomic],
1957             (instrs LDSETALB, LDSETALH, LDSETALW, LDSETALX)>;
1959 def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic],
1960             (instrs LDSMAXB, LDSMAXH, LDSMAXW, LDSMAXX,
1961              LDSMAXAB, LDSMAXAH, LDSMAXAW, LDSMAXAX,
1962              LDSMAXLB, LDSMAXLH, LDSMAXLW, LDSMAXLX,
1963              LDSMAXALB, LDSMAXALH, LDSMAXALW, LDSMAXALX)>;
1965 def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic],
1966             (instrs LDSMINB, LDSMINH, LDSMINW, LDSMINX,
1967              LDSMINAB, LDSMINAH, LDSMINAW, LDSMINAX,
1968              LDSMINLB, LDSMINLH, LDSMINLW, LDSMINLX,
1969              LDSMINALB, LDSMINALH, LDSMINALW, LDSMINALX)>;
1971 def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic],
1972             (instrs LDUMAXB, LDUMAXH, LDUMAXW, LDUMAXX,
1973              LDUMAXAB, LDUMAXAH, LDUMAXAW, LDUMAXAX,
1974              LDUMAXLB, LDUMAXLH, LDUMAXLW, LDUMAXLX,
1975              LDUMAXALB, LDUMAXALH, LDUMAXALW, LDUMAXALX)>;
1977 def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic],
1978             (instrs LDUMINB, LDUMINH, LDUMINW, LDUMINX,
1979              LDUMINAB, LDUMINAH, LDUMINAW, LDUMINAX,
1980              LDUMINLB, LDUMINLH, LDUMINLW, LDUMINLX,
1981              LDUMINALB, LDUMINALH, LDUMINALW, LDUMINALX)>;
1983 def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic],
1984             (instrs SWPB, SWPH, SWPW, SWPX)>;
1986 def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic],
1987             (instrs SWPAB, SWPAH, SWPAW, SWPAX)>;
1989 def : InstRW<[THX3T110Write_6Cyc_I0123, WriteAtomic],
1990             (instrs SWPLB, SWPLH, SWPLW, SWPLX)>;
1992 def : InstRW<[THX3T110Write_8Cyc_I0123, WriteAtomic],
1993             (instrs SWPALB, SWPALH, SWPALW, SWPALX)>;
1995 def : InstRW<[THX3T110Write_4Cyc_I0123, WriteAtomic],
1996             (instrs STLLRB, STLLRH, STLLRW, STLLRX)>;
1998 // V8.3a PAC
1999 def : InstRW<[THX3T110Write_11Cyc_LS01_I1], (instregex "^LDRAA", "^LDRAB")>;
2000 def : InstRW<[THX3T110Write_8Cyc_I123],
2001             (instrs BLRAA, BLRAAZ, BLRAB, BLRABZ,
2002                     BRAA, BRAAZ, BRAB, BRABZ)>;
2003 def : InstRW<[THX3T110Write_8Cyc_I123], (instrs RETAA, RETAB)>;
2005 } // SchedModel = ThunderX3T110Model