1 //=- AArch64SchedA57.td - ARM Cortex-A57 Scheduling Defs -----*- tablegen -*-=//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 // This file defines the machine model for ARM Cortex-A57 to support
10 // instruction scheduling and other instruction cost heuristics.
12 //===----------------------------------------------------------------------===//
14 //===----------------------------------------------------------------------===//
15 // The Cortex-A57 is a traditional superscalar microprocessor with a
16 // conservative 3-wide in-order stage for decode and dispatch. Combined with the
17 // much wider out-of-order issue stage, this produced a need to carefully
18 // schedule micro-ops so that all three decoded each cycle are successfully
19 // issued as the reservation station(s) simply don't stay occupied for long.
20 // Therefore, IssueWidth is set to the narrower of the two at three, while still
21 // modeling the machine as out-of-order.
23 def CortexA57Model : SchedMachineModel {
24 let IssueWidth = 3; // 3-way decode and dispatch
25 let MicroOpBufferSize = 128; // 128 micro-op re-order buffer
26 let LoadLatency = 4; // Optimistic load latency
27 let MispredictPenalty = 14; // Fetch + Decode/Rename/Dispatch + Branch
29 // Enable partial & runtime unrolling. The magic number is chosen based on
30 // experiments and benchmarking data.
31 let LoopMicroOpBufferSize = 16;
32 let CompleteModel = 1;
34 list<Predicate> UnsupportedFeatures = !listconcat(SVEUnsupported.F,
40 //===----------------------------------------------------------------------===//
41 // Define each kind of processor resource and number available on Cortex-A57.
42 // Cortex A-57 has 8 pipelines that each has its own 8-entry queue where
43 // micro-ops wait for their operands and then issue out-of-order.
45 def A57UnitB : ProcResource<1>; // Type B micro-ops
46 def A57UnitI : ProcResource<2>; // Type I micro-ops
47 def A57UnitM : ProcResource<1>; // Type M micro-ops
48 def A57UnitL : ProcResource<1>; // Type L micro-ops
49 def A57UnitS : ProcResource<1>; // Type S micro-ops
50 def A57UnitX : ProcResource<1>; // Type X micro-ops
51 def A57UnitW : ProcResource<1>; // Type W micro-ops
52 let SchedModel = CortexA57Model in {
53 def A57UnitV : ProcResGroup<[A57UnitX, A57UnitW]>; // Type V micro-ops
56 let SchedModel = CortexA57Model in {
58 //===----------------------------------------------------------------------===//
59 // Define customized scheduler read/write types specific to the Cortex-A57.
61 include "AArch64SchedA57WriteRes.td"
63 //===----------------------------------------------------------------------===//
64 // Map the target-defined scheduler read/write resources and latency for
65 // Cortex-A57. The Cortex-A57 types are directly associated with resources, so
66 // defining the aliases precludes the need for mapping them using WriteRes. The
67 // aliases are sufficient for creating a coarse, working model. As the model
68 // evolves, InstRWs will be used to override some of these SchedAliases.
70 // WARNING: Using SchedAliases is convenient and works well for latency and
71 // resource lookup for instructions. However, this creates an entry in
72 // AArch64WriteLatencyTable with a WriteResourceID of 0, breaking
73 // any SchedReadAdvance since the lookup will fail.
75 def : SchedAlias<WriteImm, A57Write_1cyc_1I>;
76 def : SchedAlias<WriteI, A57Write_1cyc_1I>;
77 def : SchedAlias<WriteISReg, A57Write_2cyc_1M>;
78 def : SchedAlias<WriteIEReg, A57Write_2cyc_1M>;
79 def : SchedAlias<WriteExtr, A57Write_1cyc_1I>;
80 def : SchedAlias<WriteIS, A57Write_1cyc_1I>;
81 def : SchedAlias<WriteID32, A57Write_19cyc_1M>;
82 def : SchedAlias<WriteID64, A57Write_35cyc_1M>;
83 def : WriteRes<WriteIM32, [A57UnitM]> { let Latency = 3; }
84 def : WriteRes<WriteIM64, [A57UnitM]> { let Latency = 5; }
85 def : SchedAlias<WriteBr, A57Write_1cyc_1B>;
86 def : SchedAlias<WriteBrReg, A57Write_1cyc_1B>;
87 def : SchedAlias<WriteLD, A57Write_4cyc_1L>;
88 def : SchedAlias<WriteST, A57Write_1cyc_1S>;
89 def : SchedAlias<WriteSTP, A57Write_1cyc_1S>;
90 def : SchedAlias<WriteAdr, A57Write_1cyc_1I>;
91 def : SchedAlias<WriteLDIdx, A57Write_4cyc_1I_1L>;
92 def : SchedAlias<WriteSTIdx, A57Write_1cyc_1I_1S>;
93 def : SchedAlias<WriteF, A57Write_3cyc_1V>;
94 def : SchedAlias<WriteFCmp, A57Write_3cyc_1V>;
95 def : SchedAlias<WriteFCvt, A57Write_5cyc_1V>;
96 def : SchedAlias<WriteFCopy, A57Write_5cyc_1L>;
97 def : SchedAlias<WriteFImm, A57Write_3cyc_1V>;
98 def : WriteRes<WriteFMul, [A57UnitV]> { let Latency = 5;}
99 def : SchedAlias<WriteFDiv, A57Write_17cyc_1W>;
100 def : SchedAlias<WriteVd, A57Write_3cyc_1V>;
101 def : SchedAlias<WriteVq, A57Write_3cyc_1V>;
102 def : SchedAlias<WriteVLD, A57Write_5cyc_1L>;
103 def : SchedAlias<WriteVST, A57Write_1cyc_1S>;
105 def : WriteRes<WriteAtomic, []> { let Unsupported = 1; }
107 def : WriteRes<WriteSys, []> { let Latency = 1; }
108 def : WriteRes<WriteBarrier, []> { let Latency = 1; }
109 def : WriteRes<WriteHint, []> { let Latency = 1; }
111 def : WriteRes<WriteLDHi, []> { let Latency = 4; }
113 // Forwarding logic is only modeled for multiply and accumulate
114 def : ReadAdvance<ReadI, 0>;
115 def : ReadAdvance<ReadISReg, 0>;
116 def : ReadAdvance<ReadIEReg, 0>;
117 def : ReadAdvance<ReadIM, 0>;
118 def : ReadAdvance<ReadIMA, 2, [WriteIM32, WriteIM64]>;
119 def : ReadAdvance<ReadID, 0>;
120 def : ReadAdvance<ReadExtrHi, 0>;
121 def : ReadAdvance<ReadST, 0>;
122 def : ReadAdvance<ReadAdrBase, 0>;
123 def : ReadAdvance<ReadVLD, 0>;
126 //===----------------------------------------------------------------------===//
127 // Specialize the coarse model by associating instruction groups with the
128 // subtarget-defined types. As the modeled is refined, this will override most
129 // of the above ShchedAlias mappings.
132 // -----------------------------------------------------------------------------
134 def : InstRW<[WriteI], (instrs COPY)>;
137 // Branch Instructions
138 // -----------------------------------------------------------------------------
140 def : InstRW<[A57Write_1cyc_1B_1I], (instrs BL)>;
141 def : InstRW<[A57Write_2cyc_1B_1I], (instrs BLR)>;
144 // Shifted Register with Shift == 0
145 // ----------------------------------------------------------------------------
147 def A57WriteISReg : SchedWriteVariant<[
148 SchedVar<RegShiftedPred, [WriteISReg]>,
149 SchedVar<NoSchedPred, [WriteI]>]>;
150 def : InstRW<[A57WriteISReg], (instregex ".*rs$")>;
153 // Divide and Multiply Instructions
154 // -----------------------------------------------------------------------------
157 def : InstRW<[A57Write_6cyc_1M], (instrs SMULHrr, UMULHrr)>;
160 // Miscellaneous Data-Processing Instructions
161 // -----------------------------------------------------------------------------
163 def : InstRW<[A57Write_1cyc_1I], (instrs EXTRWrri)>;
164 def : InstRW<[A57Write_3cyc_1I_1M], (instrs EXTRXrri)>;
165 def : InstRW<[A57Write_2cyc_1M], (instregex "BFM")>;
168 // Cryptography Extensions
169 // -----------------------------------------------------------------------------
171 def A57ReadAES : SchedReadAdvance<3, [A57Write_3cyc_1W]>;
172 def : InstRW<[A57Write_3cyc_1W], (instregex "^AES[DE]")>;
173 def : InstRW<[A57Write_3cyc_1W, A57ReadAES], (instregex "^AESI?MC")>;
174 def : InstRW<[A57Write_6cyc_2V], (instregex "^SHA1SU0")>;
175 def : InstRW<[A57Write_3cyc_1W], (instregex "^SHA1(H|SU1)")>;
176 def : InstRW<[A57Write_6cyc_2W], (instregex "^SHA1[CMP]")>;
177 def : InstRW<[A57Write_3cyc_1W], (instregex "^SHA256SU0")>;
178 def : InstRW<[A57Write_6cyc_2W], (instregex "^SHA256(H|H2|SU1)")>;
179 def : InstRW<[A57Write_3cyc_1W], (instregex "^CRC32")>;
183 // -----------------------------------------------------------------------------
185 def : InstRW<[A57Write_8cyc_1L_1V], (instregex "LD1i(8|16|32)$")>;
186 def : InstRW<[WriteAdr, A57Write_8cyc_1L_1V], (instregex "LD1i(8|16|32)_POST$")>;
187 def : InstRW<[A57Write_5cyc_1L], (instregex "LD1i(64)$")>;
188 def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instregex "LD1i(64)_POST$")>;
190 def : InstRW<[A57Write_8cyc_1L_1V], (instregex "LD1Rv(8b|4h|2s)$")>;
191 def : InstRW<[WriteAdr, A57Write_8cyc_1L_1V], (instregex "LD1Rv(8b|4h|2s)_POST$")>;
192 def : InstRW<[A57Write_5cyc_1L], (instregex "LD1Rv(1d)$")>;
193 def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instregex "LD1Rv(1d)_POST$")>;
194 def : InstRW<[A57Write_8cyc_1L_1V], (instregex "LD1Rv(16b|8h|4s|2d)$")>;
195 def : InstRW<[WriteAdr, A57Write_8cyc_1L_1V], (instregex "LD1Rv(16b|8h|4s|2d)_POST$")>;
197 def : InstRW<[A57Write_5cyc_1L], (instregex "LD1Onev(8b|4h|2s|1d)$")>;
198 def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instregex "LD1Onev(8b|4h|2s|1d)_POST$")>;
199 def : InstRW<[A57Write_5cyc_1L], (instregex "LD1Onev(16b|8h|4s|2d)$")>;
200 def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instregex "LD1Onev(16b|8h|4s|2d)_POST$")>;
201 def : InstRW<[A57Write_5cyc_1L], (instregex "LD1Twov(8b|4h|2s|1d)$")>;
202 def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instregex "LD1Twov(8b|4h|2s|1d)_POST$")>;
203 def : InstRW<[A57Write_6cyc_2L], (instregex "LD1Twov(16b|8h|4s|2d)$")>;
204 def : InstRW<[WriteAdr, A57Write_6cyc_2L], (instregex "LD1Twov(16b|8h|4s|2d)_POST$")>;
205 def : InstRW<[A57Write_6cyc_2L], (instregex "LD1Threev(8b|4h|2s|1d)$")>;
206 def : InstRW<[WriteAdr, A57Write_6cyc_2L], (instregex "LD1Threev(8b|4h|2s|1d)_POST$")>;
207 def : InstRW<[A57Write_7cyc_3L], (instregex "LD1Threev(16b|8h|4s|2d)$")>;
208 def : InstRW<[WriteAdr, A57Write_7cyc_3L], (instregex "LD1Threev(16b|8h|4s|2d)_POST$")>;
209 def : InstRW<[A57Write_6cyc_2L], (instregex "LD1Fourv(8b|4h|2s|1d)$")>;
210 def : InstRW<[WriteAdr, A57Write_6cyc_2L], (instregex "LD1Fourv(8b|4h|2s|1d)_POST$")>;
211 def : InstRW<[A57Write_8cyc_4L], (instregex "LD1Fourv(16b|8h|4s|2d)$")>;
212 def : InstRW<[WriteAdr, A57Write_8cyc_4L], (instregex "LD1Fourv(16b|8h|4s|2d)_POST$")>;
214 def : InstRW<[A57Write_8cyc_1L_2V], (instregex "LD2i(8|16)$")>;
215 def : InstRW<[WriteAdr, A57Write_8cyc_1L_2V], (instregex "LD2i(8|16)_POST$")>;
216 def : InstRW<[A57Write_6cyc_2L], (instregex "LD2i(32)$")>;
217 def : InstRW<[WriteAdr, A57Write_6cyc_2L], (instregex "LD2i(32)_POST$")>;
218 def : InstRW<[A57Write_8cyc_1L_1V], (instregex "LD2i(64)$")>;
219 def : InstRW<[WriteAdr, A57Write_8cyc_1L_1V], (instregex "LD2i(64)_POST$")>;
221 def : InstRW<[A57Write_8cyc_1L_1V], (instregex "LD2Rv(8b|4h|2s)$")>;
222 def : InstRW<[WriteAdr, A57Write_8cyc_1L_1V], (instregex "LD2Rv(8b|4h|2s)_POST$")>;
223 def : InstRW<[A57Write_5cyc_1L], (instregex "LD2Rv(1d)$")>;
224 def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instregex "LD2Rv(1d)_POST$")>;
225 def : InstRW<[A57Write_8cyc_1L_2V], (instregex "LD2Rv(16b|8h|4s|2d)$")>;
226 def : InstRW<[WriteAdr, A57Write_8cyc_1L_2V], (instregex "LD2Rv(16b|8h|4s|2d)_POST$")>;
228 def : InstRW<[A57Write_8cyc_1L_1V], (instregex "LD2Twov(8b|4h|2s)$")>;
229 def : InstRW<[WriteAdr, A57Write_8cyc_1L_1V], (instregex "LD2Twov(8b|4h|2s)_POST$")>;
230 def : InstRW<[A57Write_9cyc_2L_2V], (instregex "LD2Twov(16b|8h|4s)$")>;
231 def : InstRW<[WriteAdr, A57Write_9cyc_2L_2V], (instregex "LD2Twov(16b|8h|4s)_POST$")>;
232 def : InstRW<[A57Write_6cyc_2L], (instregex "LD2Twov(2d)$")>;
233 def : InstRW<[WriteAdr, A57Write_6cyc_2L], (instregex "LD2Twov(2d)_POST$")>;
235 def : InstRW<[A57Write_9cyc_1L_3V], (instregex "LD3i(8|16)$")>;
236 def : InstRW<[WriteAdr, A57Write_9cyc_1L_3V], (instregex "LD3i(8|16)_POST$")>;
237 def : InstRW<[A57Write_8cyc_1L_2V], (instregex "LD3i(32)$")>;
238 def : InstRW<[WriteAdr, A57Write_8cyc_1L_2V], (instregex "LD3i(32)_POST$")>;
239 def : InstRW<[A57Write_6cyc_2L], (instregex "LD3i(64)$")>;
240 def : InstRW<[WriteAdr, A57Write_6cyc_2L], (instregex "LD3i(64)_POST$")>;
242 def : InstRW<[A57Write_8cyc_1L_2V], (instregex "LD3Rv(8b|4h|2s)$")>;
243 def : InstRW<[WriteAdr, A57Write_8cyc_1L_2V], (instregex "LD3Rv(8b|4h|2s)_POST$")>;
244 def : InstRW<[A57Write_6cyc_2L], (instregex "LD3Rv(1d)$")>;
245 def : InstRW<[WriteAdr, A57Write_6cyc_2L], (instregex "LD3Rv(1d)_POST$")>;
246 def : InstRW<[A57Write_9cyc_1L_3V], (instregex "LD3Rv(16b|8h|4s)$")>;
247 def : InstRW<[WriteAdr, A57Write_9cyc_1L_3V], (instregex "LD3Rv(16b|8h|4s)_POST$")>;
248 def : InstRW<[A57Write_9cyc_2L_3V], (instregex "LD3Rv(2d)$")>;
249 def : InstRW<[WriteAdr, A57Write_9cyc_2L_3V], (instregex "LD3Rv(2d)_POST$")>;
251 def : InstRW<[A57Write_9cyc_2L_2V], (instregex "LD3Threev(8b|4h|2s)$")>;
252 def : InstRW<[WriteAdr, A57Write_9cyc_2L_2V], (instregex "LD3Threev(8b|4h|2s)_POST$")>;
253 def : InstRW<[A57Write_10cyc_3L_4V], (instregex "LD3Threev(16b|8h|4s)$")>;
254 def : InstRW<[WriteAdr, A57Write_10cyc_3L_4V], (instregex "LD3Threev(16b|8h|4s)_POST$")>;
255 def : InstRW<[A57Write_8cyc_4L], (instregex "LD3Threev(2d)$")>;
256 def : InstRW<[WriteAdr, A57Write_8cyc_4L], (instregex "LD3Threev(2d)_POST$")>;
258 def : InstRW<[A57Write_9cyc_2L_3V], (instregex "LD4i(8|16)$")>;
259 def : InstRW<[WriteAdr, A57Write_9cyc_2L_3V], (instregex "LD4i(8|16)_POST$")>;
260 def : InstRW<[A57Write_8cyc_1L_2V], (instregex "LD4i(32)$")>;
261 def : InstRW<[WriteAdr, A57Write_8cyc_1L_2V], (instregex "LD4i(32)_POST$")>;
262 def : InstRW<[A57Write_9cyc_2L_3V], (instregex "LD4i(64)$")>;
263 def : InstRW<[WriteAdr, A57Write_9cyc_2L_3V], (instregex "LD4i(64)_POST$")>;
265 def : InstRW<[A57Write_8cyc_1L_2V], (instregex "LD4Rv(8b|4h|2s)$")>;
266 def : InstRW<[WriteAdr, A57Write_8cyc_1L_2V], (instregex "LD4Rv(8b|4h|2s)_POST$")>;
267 def : InstRW<[A57Write_6cyc_2L], (instregex "LD4Rv(1d)$")>;
268 def : InstRW<[WriteAdr, A57Write_6cyc_2L], (instregex "LD4Rv(1d)_POST$")>;
269 def : InstRW<[A57Write_9cyc_2L_3V], (instregex "LD4Rv(16b|8h|4s)$")>;
270 def : InstRW<[WriteAdr, A57Write_9cyc_2L_3V], (instregex "LD4Rv(16b|8h|4s)_POST$")>;
271 def : InstRW<[A57Write_9cyc_2L_4V], (instregex "LD4Rv(2d)$")>;
272 def : InstRW<[WriteAdr, A57Write_9cyc_2L_4V], (instregex "LD4Rv(2d)_POST$")>;
274 def : InstRW<[A57Write_9cyc_2L_2V], (instregex "LD4Fourv(8b|4h|2s)$")>;
275 def : InstRW<[WriteAdr, A57Write_9cyc_2L_2V], (instregex "LD4Fourv(8b|4h|2s)_POST$")>;
276 def : InstRW<[A57Write_11cyc_4L_4V], (instregex "LD4Fourv(16b|8h|4s)$")>;
277 def : InstRW<[WriteAdr, A57Write_11cyc_4L_4V], (instregex "LD4Fourv(16b|8h|4s)_POST$")>;
278 def : InstRW<[A57Write_8cyc_4L], (instregex "LD4Fourv(2d)$")>;
279 def : InstRW<[WriteAdr, A57Write_8cyc_4L], (instregex "LD4Fourv(2d)_POST$")>;
282 // -----------------------------------------------------------------------------
284 def : InstRW<[A57Write_1cyc_1S], (instregex "ST1i(8|16|32)$")>;
285 def : InstRW<[WriteAdr, A57Write_1cyc_1S], (instregex "ST1i(8|16|32)_POST$")>;
286 def : InstRW<[A57Write_3cyc_1S_1V], (instregex "ST1i(64)$")>;
287 def : InstRW<[WriteAdr, A57Write_3cyc_1S_1V], (instregex "ST1i(64)_POST$")>;
289 def : InstRW<[A57Write_1cyc_1S], (instregex "ST1Onev(8b|4h|2s|1d)$")>;
290 def : InstRW<[WriteAdr, A57Write_1cyc_1S], (instregex "ST1Onev(8b|4h|2s|1d)_POST$")>;
291 def : InstRW<[A57Write_2cyc_2S], (instregex "ST1Onev(16b|8h|4s|2d)$")>;
292 def : InstRW<[WriteAdr, A57Write_2cyc_2S], (instregex "ST1Onev(16b|8h|4s|2d)_POST$")>;
293 def : InstRW<[A57Write_2cyc_2S], (instregex "ST1Twov(8b|4h|2s|1d)$")>;
294 def : InstRW<[WriteAdr, A57Write_2cyc_2S], (instregex "ST1Twov(8b|4h|2s|1d)_POST$")>;
295 def : InstRW<[A57Write_4cyc_4S], (instregex "ST1Twov(16b|8h|4s|2d)$")>;
296 def : InstRW<[WriteAdr, A57Write_4cyc_4S], (instregex "ST1Twov(16b|8h|4s|2d)_POST$")>;
297 def : InstRW<[A57Write_3cyc_3S], (instregex "ST1Threev(8b|4h|2s|1d)$")>;
298 def : InstRW<[WriteAdr, A57Write_3cyc_3S], (instregex "ST1Threev(8b|4h|2s|1d)_POST$")>;
299 def : InstRW<[A57Write_6cyc_6S], (instregex "ST1Threev(16b|8h|4s|2d)$")>;
300 def : InstRW<[WriteAdr, A57Write_6cyc_6S], (instregex "ST1Threev(16b|8h|4s|2d)_POST$")>;
301 def : InstRW<[A57Write_4cyc_4S], (instregex "ST1Fourv(8b|4h|2s|1d)$")>;
302 def : InstRW<[WriteAdr, A57Write_4cyc_4S], (instregex "ST1Fourv(8b|4h|2s|1d)_POST$")>;
303 def : InstRW<[A57Write_8cyc_8S], (instregex "ST1Fourv(16b|8h|4s|2d)$")>;
304 def : InstRW<[WriteAdr, A57Write_8cyc_8S], (instregex "ST1Fourv(16b|8h|4s|2d)_POST$")>;
306 def : InstRW<[A57Write_3cyc_1S_1V], (instregex "ST2i(8|16|32)$")>;
307 def : InstRW<[WriteAdr, A57Write_3cyc_1S_1V], (instregex "ST2i(8|16|32)_POST$")>;
308 def : InstRW<[A57Write_2cyc_2S], (instregex "ST2i(64)$")>;
309 def : InstRW<[WriteAdr, A57Write_2cyc_2S], (instregex "ST2i(64)_POST$")>;
311 def : InstRW<[A57Write_3cyc_2S_1V], (instregex "ST2Twov(8b|4h|2s)$")>;
312 def : InstRW<[WriteAdr, A57Write_3cyc_2S_1V], (instregex "ST2Twov(8b|4h|2s)_POST$")>;
313 def : InstRW<[A57Write_4cyc_4S_2V], (instregex "ST2Twov(16b|8h|4s)$")>;
314 def : InstRW<[WriteAdr, A57Write_4cyc_4S_2V], (instregex "ST2Twov(16b|8h|4s)_POST$")>;
315 def : InstRW<[A57Write_4cyc_4S], (instregex "ST2Twov(2d)$")>;
316 def : InstRW<[WriteAdr, A57Write_4cyc_4S], (instregex "ST2Twov(2d)_POST$")>;
318 def : InstRW<[A57Write_3cyc_1S_1V], (instregex "ST3i(8|16)$")>;
319 def : InstRW<[WriteAdr, A57Write_3cyc_1S_1V], (instregex "ST3i(8|16)_POST$")>;
320 def : InstRW<[A57Write_3cyc_3S], (instregex "ST3i(32)$")>;
321 def : InstRW<[WriteAdr, A57Write_3cyc_3S], (instregex "ST3i(32)_POST$")>;
322 def : InstRW<[A57Write_3cyc_2S_1V], (instregex "ST3i(64)$")>;
323 def : InstRW<[WriteAdr, A57Write_3cyc_2S_1V], (instregex "ST3i(64)_POST$")>;
325 def : InstRW<[A57Write_3cyc_3S_2V], (instregex "ST3Threev(8b|4h|2s)$")>;
326 def : InstRW<[WriteAdr, A57Write_3cyc_3S_2V], (instregex "ST3Threev(8b|4h|2s)_POST$")>;
327 def : InstRW<[A57Write_6cyc_6S_4V], (instregex "ST3Threev(16b|8h|4s)$")>;
328 def : InstRW<[WriteAdr, A57Write_6cyc_6S_4V], (instregex "ST3Threev(16b|8h|4s)_POST$")>;
329 def : InstRW<[A57Write_6cyc_6S], (instregex "ST3Threev(2d)$")>;
330 def : InstRW<[WriteAdr, A57Write_6cyc_6S], (instregex "ST3Threev(2d)_POST$")>;
332 def : InstRW<[A57Write_3cyc_1S_1V], (instregex "ST4i(8|16)$")>;
333 def : InstRW<[WriteAdr, A57Write_3cyc_1S_1V], (instregex "ST4i(8|16)_POST$")>;
334 def : InstRW<[A57Write_4cyc_4S], (instregex "ST4i(32)$")>;
335 def : InstRW<[WriteAdr, A57Write_4cyc_4S], (instregex "ST4i(32)_POST$")>;
336 def : InstRW<[A57Write_3cyc_2S_1V], (instregex "ST4i(64)$")>;
337 def : InstRW<[WriteAdr, A57Write_3cyc_2S_1V], (instregex "ST4i(64)_POST$")>;
339 def : InstRW<[A57Write_4cyc_4S_2V], (instregex "ST4Fourv(8b|4h|2s)$")>;
340 def : InstRW<[WriteAdr, A57Write_4cyc_4S_2V], (instregex "ST4Fourv(8b|4h|2s)_POST$")>;
341 def : InstRW<[A57Write_8cyc_8S_4V], (instregex "ST4Fourv(16b|8h|4s)$")>;
342 def : InstRW<[WriteAdr, A57Write_8cyc_8S_4V], (instregex "ST4Fourv(16b|8h|4s)_POST$")>;
343 def : InstRW<[A57Write_8cyc_8S], (instregex "ST4Fourv(2d)$")>;
344 def : InstRW<[WriteAdr, A57Write_8cyc_8S], (instregex "ST4Fourv(2d)_POST$")>;
347 // -----------------------------------------------------------------------------
349 // Reference for forms in this group
350 // D form - v8i8, v4i16, v2i32
351 // Q form - v16i8, v8i16, v4i32
352 // D form - v1i8, v1i16, v1i32, v1i64
353 // Q form - v16i8, v8i16, v4i32, v2i64
354 // D form - v8i8_v8i16, v4i16_v4i32, v2i32_v2i64
355 // Q form - v16i8_v8i16, v8i16_v4i32, v4i32_v2i64
357 // Cortex A57 Software Optimization Guide Sec 3.14
358 // Advance for absolute diff accum, pairwise add and accumulate, shift accumulate
359 def A57ReadIVA3 : SchedReadAdvance<3, [A57Write_4cyc_1X_NonMul_Forward, A57Write_5cyc_2X_NonMul_Forward]>;
361 // ASIMD absolute diff accum, D-form
362 def : InstRW<[A57Write_4cyc_1X_NonMul_Forward, A57ReadIVA3], (instregex "^[SU]ABA(v8i8|v4i16|v2i32)$")>;
363 // ASIMD absolute diff accum, Q-form
364 def : InstRW<[A57Write_5cyc_2X_NonMul_Forward, A57ReadIVA3], (instregex "^[SU]ABA(v16i8|v8i16|v4i32)$")>;
365 // ASIMD absolute diff accum long
366 def : InstRW<[A57Write_4cyc_1X_NonMul_Forward, A57ReadIVA3], (instregex "^[SU]ABAL")>;
368 // ASIMD arith, reduce, 4H/4S
369 def : InstRW<[A57Write_4cyc_1X], (instregex "^[SU]?ADDL?V(v8i8|v4i16|v2i32)v$")>;
370 // ASIMD arith, reduce, 8B/8H
371 def : InstRW<[A57Write_7cyc_1V_1X], (instregex "^[SU]?ADDL?V(v8i16|v4i32)v$")>;
372 // ASIMD arith, reduce, 16B
373 def : InstRW<[A57Write_8cyc_2X], (instregex "^[SU]?ADDL?Vv16i8v$")>;
375 // ASIMD max/min, reduce, 4H/4S
376 def : InstRW<[A57Write_4cyc_1X], (instregex "^[SU](MIN|MAX)V(v4i16|v4i32)v$")>;
377 // ASIMD max/min, reduce, 8B/8H
378 def : InstRW<[A57Write_7cyc_1V_1X], (instregex "^[SU](MIN|MAX)V(v8i8|v8i16)v$")>;
379 // ASIMD max/min, reduce, 16B
380 def : InstRW<[A57Write_8cyc_2X], (instregex "^[SU](MIN|MAX)Vv16i8v$")>;
382 // ASIMD multiply, D-form
384 def : InstRW<[A57Write_5cyc_1W_Mul_Forward], (instregex "^MUL(v8i8|v4i16|v2i32|v1i8|v1i16|v1i32|v1i64)(_indexed)?$")>;
385 // PMUL, SQDMULH, SQRDMULH
386 def : InstRW<[A57Write_5cyc_1W], (instregex "^(PMUL|SQR?DMULH)(v8i8|v4i16|v2i32|v1i8|v1i16|v1i32|v1i64)(_indexed)?$")>;
388 // ASIMD multiply, Q-form
390 def : InstRW<[A57Write_6cyc_2W_Mul_Forward], (instregex "^MUL(v16i8|v8i16|v4i32)(_indexed)?$")>;
391 // PMUL, SQDMULH, SQRDMULH
392 def : InstRW<[A57Write_6cyc_2W], (instregex "^(PMUL|SQR?DMULH)(v16i8|v8i16|v4i32)(_indexed)?$")>;
394 // Cortex A57 Software Optimization Guide Sec 3.14
395 def A57ReadIVMA4 : SchedReadAdvance<4 , [A57Write_5cyc_1W_Mul_Forward, A57Write_6cyc_2W_Mul_Forward]>;
396 def A57ReadIVMA3 : SchedReadAdvance<3 , [A57Write_5cyc_1W_Mul_Forward, A57Write_6cyc_2W_Mul_Forward]>;
398 // ASIMD multiply accumulate, D-form
399 def : InstRW<[A57Write_5cyc_1W_Mul_Forward, A57ReadIVMA4], (instregex "^ML[AS](v8i8|v4i16|v2i32)(_indexed)?$")>;
400 // ASIMD multiply accumulate, Q-form
401 def : InstRW<[A57Write_6cyc_2W_Mul_Forward, A57ReadIVMA4], (instregex "^ML[AS](v16i8|v8i16|v4i32)(_indexed)?$")>;
403 // ASIMD multiply accumulate long
404 // ASIMD multiply accumulate saturating long
405 def : InstRW<[A57Write_5cyc_1W_Mul_Forward, A57ReadIVMA4], (instregex "^(S|U)ML[AS]L")>;
406 def : InstRW<[A57Write_5cyc_1W_Mul_Forward, A57ReadIVMA3], (instregex "^SQDML[AS]L")>;
408 // ASIMD multiply long
409 def : InstRW<[A57Write_5cyc_1W_Mul_Forward], (instregex "^(S|U)MULL")>;
410 def : InstRW<[A57Write_5cyc_1W], (instregex "^SQDMULL")>;
411 def : InstRW<[A57Write_5cyc_1W], (instregex "^PMULL(v8i8|v16i8)")>;
412 def : InstRW<[A57Write_3cyc_1W], (instregex "^PMULL(v1i64|v2i64)")>;
414 // ASIMD pairwise add and accumulate
415 // ASIMD shift accumulate
416 def : InstRW<[A57Write_4cyc_1X_NonMul_Forward, A57ReadIVA3], (instregex "^[SU]ADALP")>;
417 def : InstRW<[A57Write_4cyc_1X_NonMul_Forward, A57ReadIVA3], (instregex "^(S|SR|U|UR)SRA")>;
419 // ASIMD shift by immed, complex
420 def : InstRW<[A57Write_4cyc_1X], (instregex "^[SU]?(Q|R){1,2}SHR")>;
421 def : InstRW<[A57Write_4cyc_1X], (instregex "^SQSHLU")>;
424 // ASIMD shift by register, basic, Q-form
425 def : InstRW<[A57Write_4cyc_2X], (instregex "^[SU]SHL(v16i8|v8i16|v4i32|v2i64)")>;
427 // ASIMD shift by register, complex, D-form
428 def : InstRW<[A57Write_4cyc_1X], (instregex "^[SU][QR]{1,2}SHL(v1i8|v1i16|v1i32|v1i64|v8i8|v4i16|v2i32|b|d|h|s)")>;
430 // ASIMD shift by register, complex, Q-form
431 def : InstRW<[A57Write_5cyc_2X], (instregex "^[SU][QR]{1,2}SHL(v16i8|v8i16|v4i32|v2i64)")>;
434 // Vector - Floating Point
435 // -----------------------------------------------------------------------------
437 // Reference for forms in this group
439 // Q form - v4f32, v2f64
441 // D form - v1i32, v1i64
443 // Q form - v4i32, v2i64
445 // ASIMD FP arith, normal, D-form
446 def : InstRW<[A57Write_5cyc_1V], (instregex "^(FABD|FADD|FSUB)(v2f32|32|64|v2i32p)")>;
447 // ASIMD FP arith, normal, Q-form
448 def : InstRW<[A57Write_5cyc_2V], (instregex "^(FABD|FADD|FSUB)(v4f32|v2f64|v2i64p)")>;
450 // ASIMD FP arith, pairwise, D-form
451 def : InstRW<[A57Write_5cyc_1V], (instregex "^FADDP(v2f32|32|64|v2i32)")>;
452 // ASIMD FP arith, pairwise, Q-form
453 def : InstRW<[A57Write_9cyc_3V], (instregex "^FADDP(v4f32|v2f64|v2i64)")>;
455 // ASIMD FP compare, D-form
456 def : InstRW<[A57Write_5cyc_1V], (instregex "^(FACGE|FACGT|FCMEQ|FCMGE|FCMGT|FCMLE|FCMLT)(v2f32|32|64|v1i32|v2i32|v1i64)")>;
457 // ASIMD FP compare, Q-form
458 def : InstRW<[A57Write_5cyc_2V], (instregex "^(FACGE|FACGT|FCMEQ|FCMGE|FCMGT|FCMLE|FCMLT)(v4f32|v2f64|v4i32|v2i64)")>;
460 // ASIMD FP convert, long and narrow
461 def : InstRW<[A57Write_8cyc_3V], (instregex "^FCVT(L|N|XN)v")>;
462 // ASIMD FP convert, other, D-form
463 def : InstRW<[A57Write_5cyc_1V], (instregex "^[FSU]CVT([AMNPZ][SU])?(_Int)?(v2f32|v1i32|v2i32|v1i64)")>;
464 // ASIMD FP convert, other, Q-form
465 def : InstRW<[A57Write_5cyc_2V], (instregex "^[FSU]CVT([AMNPZ][SU])?(_Int)?(v4f32|v2f64|v4i32|v2i64)")>;
467 // ASIMD FP divide, D-form, F32
468 def : InstRW<[A57Write_17cyc_1W], (instregex "FDIVv2f32")>;
469 // ASIMD FP divide, Q-form, F32
470 def : InstRW<[A57Write_34cyc_2W], (instregex "FDIVv4f32")>;
471 // ASIMD FP divide, Q-form, F64
472 def : InstRW<[A57Write_64cyc_2W], (instregex "FDIVv2f64")>;
474 // Note: These were simply duplicated from ASIMD FDIV because of missing documentation
475 // ASIMD FP square root, D-form, F32
476 def : InstRW<[A57Write_17cyc_1W], (instregex "FSQRTv2f32")>;
477 // ASIMD FP square root, Q-form, F32
478 def : InstRW<[A57Write_34cyc_2W], (instregex "FSQRTv4f32")>;
479 // ASIMD FP square root, Q-form, F64
480 def : InstRW<[A57Write_64cyc_2W], (instregex "FSQRTv2f64")>;
482 // ASIMD FP max/min, normal, D-form
483 def : InstRW<[A57Write_5cyc_1V], (instregex "^(FMAX|FMIN)(NM)?(v2f32)")>;
484 // ASIMD FP max/min, normal, Q-form
485 def : InstRW<[A57Write_5cyc_2V], (instregex "^(FMAX|FMIN)(NM)?(v4f32|v2f64)")>;
486 // ASIMD FP max/min, pairwise, D-form
487 def : InstRW<[A57Write_5cyc_1V], (instregex "^(FMAX|FMIN)(NM)?P(v2f32|v2i32)")>;
488 // ASIMD FP max/min, pairwise, Q-form
489 def : InstRW<[A57Write_9cyc_3V], (instregex "^(FMAX|FMIN)(NM)?P(v4f32|v2f64|v2i64)")>;
490 // ASIMD FP max/min, reduce
491 def : InstRW<[A57Write_10cyc_3V], (instregex "^(FMAX|FMIN)(NM)?Vv")>;
493 // ASIMD FP multiply, D-form, FZ
494 def : InstRW<[A57Write_5cyc_1V_FP_Forward], (instregex "^FMULX?(v2f32|v1i32|v2i32|v1i64|32|64)")>;
495 // ASIMD FP multiply, Q-form, FZ
496 def : InstRW<[A57Write_5cyc_2V_FP_Forward], (instregex "^FMULX?(v4f32|v2f64|v4i32|v2i64)")>;
498 // ASIMD FP multiply accumulate, D-form, FZ
499 // ASIMD FP multiply accumulate, Q-form, FZ
500 def A57WriteFPVMAD : SchedWriteRes<[A57UnitV]> { let Latency = 9; }
501 def A57WriteFPVMAQ : SchedWriteRes<[A57UnitV, A57UnitV]> { let Latency = 10; }
503 // Cortex A57 Software Optimization Guide Sec 3.15
504 // Advances from FP mul and mul-accum to mul-accum
505 def A57ReadFPVMA5 : SchedReadAdvance<5, [A57WriteFPVMAD, A57WriteFPVMAQ, A57Write_5cyc_1V_FP_Forward, A57Write_5cyc_2V_FP_Forward]>;
506 def A57ReadFPVMA6 : SchedReadAdvance<6, [A57WriteFPVMAD, A57WriteFPVMAQ, A57Write_5cyc_1V_FP_Forward, A57Write_5cyc_2V_FP_Forward]>;
508 def : InstRW<[A57WriteFPVMAD, A57ReadFPVMA5], (instregex "^FML[AS](v2f32|v1i32|v2i32|v1i64)")>;
509 def : InstRW<[A57WriteFPVMAQ, A57ReadFPVMA6], (instregex "^FML[AS](v4f32|v2f64|v4i32|v2i64)")>;
511 // ASIMD FP round, D-form
512 def : InstRW<[A57Write_5cyc_1V], (instregex "^FRINT[AIMNPXZ](v2f32)")>;
513 // ASIMD FP round, Q-form
514 def : InstRW<[A57Write_5cyc_2V], (instregex "^FRINT[AIMNPXZ](v4f32|v2f64)")>;
517 // Vector - Miscellaneous
518 // -----------------------------------------------------------------------------
520 // Reference for forms in this group
521 // D form - v8i8, v4i16, v2i32
522 // Q form - v16i8, v8i16, v4i32
523 // D form - v1i8, v1i16, v1i32, v1i64
524 // Q form - v16i8, v8i16, v4i32, v2i64
526 // ASIMD bitwise insert, Q-form
527 def : InstRW<[A57Write_3cyc_2V], (instregex "^(BIF|BIT|BSL|BSP)v16i8")>;
529 // ASIMD duplicate, gen reg, D-form and Q-form
530 def : InstRW<[A57Write_8cyc_1L_1V], (instregex "^DUP(i8|i16|i32|i64)$")>;
531 def : InstRW<[A57Write_8cyc_1L_1V], (instregex "^DUPv.+gpr")>;
533 // ASIMD move, saturating
534 def : InstRW<[A57Write_4cyc_1X], (instregex "^[SU]QXTU?N")>;
536 // ASIMD reciprocal estimate, D-form
537 def : InstRW<[A57Write_5cyc_1V], (instregex "^[FU](RECP|RSQRT)(E|X)(v2f32|v1i32|v2i32|v1i64)")>;
538 // ASIMD reciprocal estimate, Q-form
539 def : InstRW<[A57Write_5cyc_2V], (instregex "^[FU](RECP|RSQRT)(E|X)(v2f64|v4f32|v4i32)")>;
541 // ASIMD reciprocal step, D-form, FZ
542 def : InstRW<[A57Write_9cyc_1V], (instregex "^F(RECP|RSQRT)S(v2f32|v1i32|v2i32|v1i64|32|64)")>;
543 // ASIMD reciprocal step, Q-form, FZ
544 def : InstRW<[A57Write_9cyc_2V], (instregex "^F(RECP|RSQRT)S(v2f64|v4f32|v4i32)")>;
546 // ASIMD table lookup, D-form
547 def : InstRW<[A57Write_3cyc_1V], (instregex "^TB[LX]v8i8One")>;
548 def : InstRW<[A57Write_6cyc_2V], (instregex "^TB[LX]v8i8Two")>;
549 def : InstRW<[A57Write_9cyc_3V], (instregex "^TB[LX]v8i8Three")>;
550 def : InstRW<[A57Write_12cyc_4V], (instregex "^TB[LX]v8i8Four")>;
551 // ASIMD table lookup, Q-form
552 def : InstRW<[A57Write_6cyc_3V], (instregex "^TB[LX]v16i8One")>;
553 def : InstRW<[A57Write_9cyc_5V], (instregex "^TB[LX]v16i8Two")>;
554 def : InstRW<[A57Write_12cyc_7V], (instregex "^TB[LX]v16i8Three")>;
555 def : InstRW<[A57Write_15cyc_9V], (instregex "^TB[LX]v16i8Four")>;
557 // ASIMD transfer, element to gen reg
558 def : InstRW<[A57Write_6cyc_1I_1L], (instregex "^[SU]MOVv")>;
560 // ASIMD transfer, gen reg to element
561 def : InstRW<[A57Write_8cyc_1L_1V], (instregex "^INSv")>;
563 // ASIMD unzip/zip, Q-form
564 def : InstRW<[A57Write_6cyc_3V], (instregex "^(UZP|ZIP)(1|2)(v16i8|v8i16|v4i32|v2i64)")>;
568 // -----------------------------------------------------------------------------
570 def : InstRW<[A57Write_5cyc_1V], (instregex "^F(ADD|SUB)[DS]rr")>;
572 // Cortex A57 Software Optimization Guide Sec 3.10
573 def A57WriteFPMA : SchedWriteRes<[A57UnitV]> { let Latency = 9; }
574 def A57ReadFPMA5 : SchedReadAdvance<5, [A57WriteFPMA, WriteFMul]>;
575 def A57ReadFPM : SchedReadAdvance<0>;
576 def : InstRW<[A57WriteFPMA, A57ReadFPM, A57ReadFPM, A57ReadFPMA5], (instregex "^FN?M(ADD|SUB)[DS]rrr")>;
578 def : InstRW<[A57Write_10cyc_1L_1V], (instregex "^[FSU]CVT[AMNPZ][SU](_Int)?[SU]?[XW]?[DS]?[rds]i?")>;
579 def : InstRW<[A57Write_10cyc_1L_1V], (instregex "^[SU]CVTF")>;
581 def : InstRW<[A57Write_32cyc_1W], (instrs FDIVDrr)>;
582 def : InstRW<[A57Write_17cyc_1W], (instrs FDIVSrr)>;
584 def : InstRW<[A57Write_5cyc_1V], (instregex "^F(MAX|MIN).+rr")>;
586 def : InstRW<[A57Write_5cyc_1V], (instregex "^FRINT.+r")>;
588 def : InstRW<[A57Write_32cyc_1W], (instrs FSQRTDr)>;
589 def : InstRW<[A57Write_17cyc_1W], (instrs FSQRTSr)>;
591 def : InstRW<[A57Write_5cyc_1L, WriteLDHi], (instrs LDNPDi)>;
592 def : InstRW<[A57Write_6cyc_2L, WriteLDHi], (instrs LDNPQi)>;
593 def : InstRW<[A57Write_5cyc_1L, WriteLDHi], (instrs LDNPSi)>;
594 def : InstRW<[A57Write_5cyc_1L, WriteLDHi], (instrs LDPDi)>;
595 def : InstRW<[WriteAdr, A57Write_5cyc_1L, WriteLDHi], (instrs LDPDpost)>;
596 def : InstRW<[WriteAdr, A57Write_5cyc_1L, WriteLDHi], (instrs LDPDpre)>;
597 def : InstRW<[A57Write_6cyc_2L, WriteLDHi], (instrs LDPQi)>;
598 def : InstRW<[WriteAdr, A57Write_6cyc_2L, WriteLDHi], (instrs LDPQpost)>;
599 def : InstRW<[WriteAdr, A57Write_6cyc_2L, WriteLDHi], (instrs LDPQpre)>;
600 def : InstRW<[A57Write_5cyc_1I_2L, WriteLDHi], (instrs LDPSWi)>;
601 def : InstRW<[WriteAdr, A57Write_5cyc_1I_2L, WriteLDHi], (instrs LDPSWpost)>;
602 def : InstRW<[WriteAdr, A57Write_5cyc_1I_2L, WriteLDHi], (instrs LDPSWpre)>;
603 def : InstRW<[A57Write_5cyc_1L, WriteLDHi], (instrs LDPSi)>;
604 def : InstRW<[WriteAdr, A57Write_5cyc_1L, WriteLDHi], (instrs LDPSpost)>;
605 def : InstRW<[WriteAdr, A57Write_5cyc_1L, WriteLDHi], (instrs LDPSpre)>;
606 def : InstRW<[A57Write_5cyc_1L, WriteI], (instrs LDRBpost)>;
607 def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instrs LDRBpre)>;
608 def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRBroW)>;
609 def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRBroX)>;
610 def : InstRW<[A57Write_5cyc_1L], (instrs LDRBui)>;
611 def : InstRW<[A57Write_5cyc_1L], (instrs LDRDl)>;
612 def : InstRW<[A57Write_5cyc_1L, WriteI], (instrs LDRDpost)>;
613 def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instrs LDRDpre)>;
614 def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRDroW)>;
615 def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRDroX)>;
616 def : InstRW<[A57Write_5cyc_1L], (instrs LDRDui)>;
617 def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRHHroW)>;
618 def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRHHroX)>;
619 def : InstRW<[A57Write_5cyc_1L, WriteI], (instrs LDRHpost)>;
620 def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instrs LDRHpre)>;
621 def : InstRW<[A57Write_6cyc_1I_1L, ReadAdrBase], (instrs LDRHroW)>;
622 def : InstRW<[A57Write_6cyc_1I_1L, ReadAdrBase], (instrs LDRHroX)>;
623 def : InstRW<[A57Write_5cyc_1L], (instrs LDRHui)>;
624 def : InstRW<[A57Write_5cyc_1L], (instrs LDRQl)>;
625 def : InstRW<[A57Write_5cyc_1L, WriteI], (instrs LDRQpost)>;
626 def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instrs LDRQpre)>;
627 def : InstRW<[A57Write_6cyc_1I_1L, ReadAdrBase], (instrs LDRQroW)>;
628 def : InstRW<[A57Write_6cyc_1I_1L, ReadAdrBase], (instrs LDRQroX)>;
629 def : InstRW<[A57Write_5cyc_1L], (instrs LDRQui)>;
630 def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRSHWroW)>;
631 def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRSHWroX)>;
632 def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRSHXroW)>;
633 def : InstRW<[A57Write_5cyc_1I_1L, ReadAdrBase], (instrs LDRSHXroX)>;
634 def : InstRW<[A57Write_5cyc_1L], (instrs LDRSl)>;
635 def : InstRW<[A57Write_5cyc_1L, WriteI], (instrs LDRSpost)>;
636 def : InstRW<[WriteAdr, A57Write_5cyc_1L], (instrs LDRSpre)>;
637 def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRSroW)>;
638 def : InstRW<[A57Write_5cyc_1L, ReadAdrBase], (instrs LDRSroX)>;
639 def : InstRW<[A57Write_5cyc_1L], (instrs LDRSui)>;
640 def : InstRW<[A57Write_5cyc_1L], (instrs LDURBi)>;
641 def : InstRW<[A57Write_5cyc_1L], (instrs LDURDi)>;
642 def : InstRW<[A57Write_5cyc_1L], (instrs LDURHi)>;
643 def : InstRW<[A57Write_5cyc_1L], (instrs LDURQi)>;
644 def : InstRW<[A57Write_5cyc_1L], (instrs LDURSi)>;
646 def : InstRW<[A57Write_2cyc_2S], (instrs STNPDi)>;
647 def : InstRW<[A57Write_4cyc_1I_4S], (instrs STNPQi)>;
648 def : InstRW<[A57Write_2cyc_2S], (instrs STNPXi)>;
649 def : InstRW<[A57Write_2cyc_2S], (instrs STPDi)>;
650 def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S], (instrs STPDpost)>;
651 def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S], (instrs STPDpre)>;
652 def : InstRW<[A57Write_4cyc_1I_4S], (instrs STPQi)>;
653 def : InstRW<[WriteAdr, A57Write_4cyc_1I_4S], (instrs STPQpost)>;
654 def : InstRW<[WriteAdr, A57Write_4cyc_2I_4S], (instrs STPQpre)>;
655 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STPSpost)>;
656 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STPSpre)>;
657 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STPWpost)>;
658 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STPWpre)>;
659 def : InstRW<[A57Write_2cyc_2S], (instrs STPXi)>;
660 def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S], (instrs STPXpost)>;
661 def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S], (instrs STPXpre)>;
662 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRBBpost)>;
663 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRBBpre)>;
664 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRBpost)>;
665 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STRBpre)>;
666 def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRBroW)>;
667 def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRBroX)>;
668 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRDpost)>;
669 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STRDpre)>;
670 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRHHpost)>;
671 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRHHpre)>;
672 def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRHHroW)>;
673 def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRHHroX)>;
674 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRHpost)>;
675 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STRHpre)>;
676 def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRHroW)>;
677 def : InstRW<[A57Write_3cyc_1I_1S, ReadAdrBase], (instrs STRHroX)>;
678 def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S, ReadAdrBase], (instrs STRQpost)>;
679 def : InstRW<[WriteAdr, A57Write_2cyc_1I_2S], (instrs STRQpre)>;
680 def : InstRW<[A57Write_2cyc_1I_2S, ReadAdrBase], (instrs STRQroW)>;
681 def : InstRW<[A57Write_2cyc_1I_2S, ReadAdrBase], (instrs STRQroX)>;
682 def : InstRW<[A57Write_2cyc_1I_2S], (instrs STRQui)>;
683 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRSpost)>;
684 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S], (instrs STRSpre)>;
685 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRWpost)>;
686 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRWpre)>;
687 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRXpost)>;
688 def : InstRW<[WriteAdr, A57Write_1cyc_1I_1S, ReadAdrBase], (instrs STRXpre)>;
689 def : InstRW<[A57Write_2cyc_2S], (instrs STURQi)>;
691 } // SchedModel = CortexA57Model